{ "best_metric": 0.9143955354015062, "best_model_checkpoint": "./models/bart-base-spelling-nl-3m-3-2nd/checkpoint-390000", "epoch": 1.999991171063792, "global_step": 396422, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 0.00029999243230698596, "loss": 0.7347, "step": 10 }, { "epoch": 0.0, "learning_rate": 0.00029998486461397194, "loss": 0.2215, "step": 20 }, { "epoch": 0.0, "learning_rate": 0.0002999772969209579, "loss": 0.1811, "step": 30 }, { "epoch": 0.0, "learning_rate": 0.00029996972922794395, "loss": 0.1745, "step": 40 }, { "epoch": 0.0, "learning_rate": 0.00029996216153492994, "loss": 0.1605, "step": 50 }, { "epoch": 0.0, "learning_rate": 0.0002999545938419159, "loss": 0.1534, "step": 60 }, { "epoch": 0.0, "learning_rate": 0.0002999470261489019, "loss": 0.1525, "step": 70 }, { "epoch": 0.0, "learning_rate": 0.0002999394584558879, "loss": 0.1273, "step": 80 }, { "epoch": 0.0, "learning_rate": 0.00029993189076287386, "loss": 0.144, "step": 90 }, { "epoch": 0.0, "learning_rate": 0.0002999243230698599, "loss": 0.172, "step": 100 }, { "epoch": 0.0, "learning_rate": 0.0002999167553768459, "loss": 0.1288, "step": 110 }, { "epoch": 0.0, "learning_rate": 0.00029990918768383186, "loss": 0.1398, "step": 120 }, { "epoch": 0.0, "learning_rate": 0.00029990161999081784, "loss": 0.164, "step": 130 }, { "epoch": 0.0, "learning_rate": 0.0002998940522978038, "loss": 0.1436, "step": 140 }, { "epoch": 0.0, "learning_rate": 0.0002998864846047898, "loss": 0.1263, "step": 150 }, { "epoch": 0.0, "learning_rate": 0.00029987891691177584, "loss": 0.1235, "step": 160 }, { "epoch": 0.0, "learning_rate": 0.0002998713492187618, "loss": 0.1192, "step": 170 }, { "epoch": 0.0, "learning_rate": 0.0002998637815257478, "loss": 0.1067, "step": 180 }, { "epoch": 0.0, "learning_rate": 0.0002998562138327338, "loss": 0.1085, "step": 190 }, { "epoch": 0.0, "learning_rate": 0.00029984864613971977, "loss": 0.1203, "step": 200 }, { "epoch": 0.0, "learning_rate": 0.00029984107844670575, "loss": 0.1025, "step": 210 }, { "epoch": 0.0, "learning_rate": 0.00029983351075369173, "loss": 0.1044, "step": 220 }, { "epoch": 0.0, "learning_rate": 0.00029982594306067776, "loss": 0.0965, "step": 230 }, { "epoch": 0.0, "learning_rate": 0.00029981837536766375, "loss": 0.1083, "step": 240 }, { "epoch": 0.0, "learning_rate": 0.0002998108076746497, "loss": 0.106, "step": 250 }, { "epoch": 0.0, "learning_rate": 0.0002998032399816357, "loss": 0.1017, "step": 260 }, { "epoch": 0.0, "learning_rate": 0.0002997956722886217, "loss": 0.1216, "step": 270 }, { "epoch": 0.0, "learning_rate": 0.00029978810459560767, "loss": 0.1059, "step": 280 }, { "epoch": 0.0, "learning_rate": 0.0002997805369025937, "loss": 0.0953, "step": 290 }, { "epoch": 0.0, "learning_rate": 0.0002997729692095797, "loss": 0.0948, "step": 300 }, { "epoch": 0.0, "learning_rate": 0.00029976540151656567, "loss": 0.1041, "step": 310 }, { "epoch": 0.0, "learning_rate": 0.00029975783382355165, "loss": 0.0998, "step": 320 }, { "epoch": 0.0, "learning_rate": 0.00029975026613053763, "loss": 0.0976, "step": 330 }, { "epoch": 0.0, "learning_rate": 0.0002997426984375236, "loss": 0.1064, "step": 340 }, { "epoch": 0.0, "learning_rate": 0.0002997351307445096, "loss": 0.1054, "step": 350 }, { "epoch": 0.0, "learning_rate": 0.00029972756305149563, "loss": 0.084, "step": 360 }, { "epoch": 0.0, "learning_rate": 0.0002997199953584816, "loss": 0.0937, "step": 370 }, { "epoch": 0.0, "learning_rate": 0.0002997124276654676, "loss": 0.1096, "step": 380 }, { "epoch": 0.0, "learning_rate": 0.0002997048599724536, "loss": 0.1014, "step": 390 }, { "epoch": 0.0, "learning_rate": 0.00029969729227943956, "loss": 0.0946, "step": 400 }, { "epoch": 0.0, "learning_rate": 0.00029968972458642554, "loss": 0.0951, "step": 410 }, { "epoch": 0.0, "learning_rate": 0.0002996821568934116, "loss": 0.0892, "step": 420 }, { "epoch": 0.0, "learning_rate": 0.00029967458920039756, "loss": 0.0945, "step": 430 }, { "epoch": 0.0, "learning_rate": 0.00029966702150738354, "loss": 0.0932, "step": 440 }, { "epoch": 0.0, "learning_rate": 0.0002996594538143695, "loss": 0.0833, "step": 450 }, { "epoch": 0.0, "learning_rate": 0.0002996518861213555, "loss": 0.0837, "step": 460 }, { "epoch": 0.0, "learning_rate": 0.0002996443184283415, "loss": 0.085, "step": 470 }, { "epoch": 0.0, "learning_rate": 0.0002996367507353275, "loss": 0.086, "step": 480 }, { "epoch": 0.0, "learning_rate": 0.0002996291830423135, "loss": 0.079, "step": 490 }, { "epoch": 0.0, "learning_rate": 0.0002996216153492995, "loss": 0.0793, "step": 500 }, { "epoch": 0.0, "learning_rate": 0.00029961404765628546, "loss": 0.0857, "step": 510 }, { "epoch": 0.0, "learning_rate": 0.00029960647996327144, "loss": 0.0824, "step": 520 }, { "epoch": 0.0, "learning_rate": 0.0002995989122702574, "loss": 0.0853, "step": 530 }, { "epoch": 0.0, "learning_rate": 0.0002995913445772434, "loss": 0.0837, "step": 540 }, { "epoch": 0.0, "learning_rate": 0.00029958377688422944, "loss": 0.0743, "step": 550 }, { "epoch": 0.0, "learning_rate": 0.0002995762091912154, "loss": 0.0792, "step": 560 }, { "epoch": 0.0, "learning_rate": 0.0002995686414982014, "loss": 0.0767, "step": 570 }, { "epoch": 0.0, "learning_rate": 0.0002995610738051874, "loss": 0.0813, "step": 580 }, { "epoch": 0.0, "learning_rate": 0.00029955350611217337, "loss": 0.0869, "step": 590 }, { "epoch": 0.0, "learning_rate": 0.00029954593841915935, "loss": 0.0795, "step": 600 }, { "epoch": 0.0, "learning_rate": 0.0002995383707261454, "loss": 0.0784, "step": 610 }, { "epoch": 0.0, "learning_rate": 0.00029953080303313137, "loss": 0.0813, "step": 620 }, { "epoch": 0.0, "learning_rate": 0.0002995232353401173, "loss": 0.0906, "step": 630 }, { "epoch": 0.0, "learning_rate": 0.0002995156676471033, "loss": 0.0762, "step": 640 }, { "epoch": 0.0, "learning_rate": 0.0002995080999540893, "loss": 0.0874, "step": 650 }, { "epoch": 0.0, "learning_rate": 0.0002995005322610753, "loss": 0.0744, "step": 660 }, { "epoch": 0.0, "learning_rate": 0.00029949296456806127, "loss": 0.0719, "step": 670 }, { "epoch": 0.0, "learning_rate": 0.00029948539687504725, "loss": 0.0757, "step": 680 }, { "epoch": 0.0, "learning_rate": 0.00029947782918203324, "loss": 0.0752, "step": 690 }, { "epoch": 0.0, "learning_rate": 0.0002994702614890192, "loss": 0.0854, "step": 700 }, { "epoch": 0.0, "learning_rate": 0.00029946269379600525, "loss": 0.0878, "step": 710 }, { "epoch": 0.0, "learning_rate": 0.00029945512610299123, "loss": 0.0747, "step": 720 }, { "epoch": 0.0, "learning_rate": 0.0002994475584099772, "loss": 0.0783, "step": 730 }, { "epoch": 0.0, "learning_rate": 0.0002994399907169632, "loss": 0.0841, "step": 740 }, { "epoch": 0.0, "learning_rate": 0.0002994324230239492, "loss": 0.0798, "step": 750 }, { "epoch": 0.0, "learning_rate": 0.00029942485533093516, "loss": 0.0835, "step": 760 }, { "epoch": 0.0, "learning_rate": 0.00029941728763792114, "loss": 0.0709, "step": 770 }, { "epoch": 0.0, "learning_rate": 0.0002994097199449072, "loss": 0.0715, "step": 780 }, { "epoch": 0.0, "learning_rate": 0.00029940215225189316, "loss": 0.0859, "step": 790 }, { "epoch": 0.0, "learning_rate": 0.00029939458455887914, "loss": 0.0811, "step": 800 }, { "epoch": 0.0, "learning_rate": 0.0002993870168658651, "loss": 0.0768, "step": 810 }, { "epoch": 0.0, "learning_rate": 0.0002993794491728511, "loss": 0.0736, "step": 820 }, { "epoch": 0.0, "learning_rate": 0.0002993718814798371, "loss": 0.0673, "step": 830 }, { "epoch": 0.0, "learning_rate": 0.0002993643137868231, "loss": 0.0703, "step": 840 }, { "epoch": 0.0, "learning_rate": 0.0002993567460938091, "loss": 0.0774, "step": 850 }, { "epoch": 0.0, "learning_rate": 0.0002993491784007951, "loss": 0.0795, "step": 860 }, { "epoch": 0.0, "learning_rate": 0.00029934161070778106, "loss": 0.0833, "step": 870 }, { "epoch": 0.0, "learning_rate": 0.00029933404301476705, "loss": 0.077, "step": 880 }, { "epoch": 0.0, "learning_rate": 0.000299326475321753, "loss": 0.0724, "step": 890 }, { "epoch": 0.0, "learning_rate": 0.000299318907628739, "loss": 0.0766, "step": 900 }, { "epoch": 0.0, "learning_rate": 0.00029931133993572504, "loss": 0.0849, "step": 910 }, { "epoch": 0.0, "learning_rate": 0.000299303772242711, "loss": 0.0761, "step": 920 }, { "epoch": 0.0, "learning_rate": 0.000299296204549697, "loss": 0.0725, "step": 930 }, { "epoch": 0.0, "learning_rate": 0.000299288636856683, "loss": 0.0778, "step": 940 }, { "epoch": 0.0, "learning_rate": 0.00029928106916366897, "loss": 0.0758, "step": 950 }, { "epoch": 0.0, "learning_rate": 0.00029927350147065495, "loss": 0.0794, "step": 960 }, { "epoch": 0.0, "learning_rate": 0.000299265933777641, "loss": 0.0707, "step": 970 }, { "epoch": 0.0, "learning_rate": 0.00029925836608462697, "loss": 0.0737, "step": 980 }, { "epoch": 0.0, "learning_rate": 0.00029925079839161295, "loss": 0.0756, "step": 990 }, { "epoch": 0.01, "learning_rate": 0.00029924323069859893, "loss": 0.0794, "step": 1000 }, { "epoch": 0.01, "eval_cer": 0.914636193640606, "eval_loss": 0.057572510093450546, "eval_runtime": 117.4563, "eval_samples_per_second": 17.028, "eval_steps_per_second": 4.257, "step": 1000 }, { "epoch": 0.01, "learning_rate": 0.0002992356630055849, "loss": 0.0786, "step": 1010 }, { "epoch": 0.01, "learning_rate": 0.0002992280953125709, "loss": 0.0757, "step": 1020 }, { "epoch": 0.01, "learning_rate": 0.00029922052761955693, "loss": 0.079, "step": 1030 }, { "epoch": 0.01, "learning_rate": 0.0002992129599265429, "loss": 0.0718, "step": 1040 }, { "epoch": 0.01, "learning_rate": 0.0002992053922335289, "loss": 0.083, "step": 1050 }, { "epoch": 0.01, "learning_rate": 0.0002991978245405149, "loss": 0.0785, "step": 1060 }, { "epoch": 0.01, "learning_rate": 0.00029919025684750086, "loss": 0.0776, "step": 1070 }, { "epoch": 0.01, "learning_rate": 0.00029918268915448684, "loss": 0.0747, "step": 1080 }, { "epoch": 0.01, "learning_rate": 0.0002991751214614728, "loss": 0.082, "step": 1090 }, { "epoch": 0.01, "learning_rate": 0.00029916755376845885, "loss": 0.073, "step": 1100 }, { "epoch": 0.01, "learning_rate": 0.00029915998607544484, "loss": 0.0719, "step": 1110 }, { "epoch": 0.01, "learning_rate": 0.0002991524183824308, "loss": 0.0861, "step": 1120 }, { "epoch": 0.01, "learning_rate": 0.0002991448506894168, "loss": 0.0647, "step": 1130 }, { "epoch": 0.01, "learning_rate": 0.0002991372829964028, "loss": 0.0666, "step": 1140 }, { "epoch": 0.01, "learning_rate": 0.00029912971530338876, "loss": 0.0736, "step": 1150 }, { "epoch": 0.01, "learning_rate": 0.0002991221476103748, "loss": 0.0638, "step": 1160 }, { "epoch": 0.01, "learning_rate": 0.0002991145799173608, "loss": 0.0711, "step": 1170 }, { "epoch": 0.01, "learning_rate": 0.00029910701222434676, "loss": 0.0683, "step": 1180 }, { "epoch": 0.01, "learning_rate": 0.00029909944453133274, "loss": 0.0695, "step": 1190 }, { "epoch": 0.01, "learning_rate": 0.0002990918768383187, "loss": 0.0733, "step": 1200 }, { "epoch": 0.01, "learning_rate": 0.0002990843091453047, "loss": 0.0736, "step": 1210 }, { "epoch": 0.01, "learning_rate": 0.00029907674145229074, "loss": 0.0725, "step": 1220 }, { "epoch": 0.01, "learning_rate": 0.0002990691737592767, "loss": 0.0629, "step": 1230 }, { "epoch": 0.01, "learning_rate": 0.0002990616060662627, "loss": 0.061, "step": 1240 }, { "epoch": 0.01, "learning_rate": 0.0002990540383732487, "loss": 0.059, "step": 1250 }, { "epoch": 0.01, "learning_rate": 0.00029904647068023467, "loss": 0.0654, "step": 1260 }, { "epoch": 0.01, "learning_rate": 0.00029903890298722065, "loss": 0.0563, "step": 1270 }, { "epoch": 0.01, "learning_rate": 0.00029903133529420663, "loss": 0.0666, "step": 1280 }, { "epoch": 0.01, "learning_rate": 0.00029902376760119266, "loss": 0.0655, "step": 1290 }, { "epoch": 0.01, "learning_rate": 0.00029901619990817865, "loss": 0.0569, "step": 1300 }, { "epoch": 0.01, "learning_rate": 0.0002990086322151646, "loss": 0.0673, "step": 1310 }, { "epoch": 0.01, "learning_rate": 0.0002990010645221506, "loss": 0.0653, "step": 1320 }, { "epoch": 0.01, "learning_rate": 0.0002989934968291366, "loss": 0.0668, "step": 1330 }, { "epoch": 0.01, "learning_rate": 0.00029898592913612257, "loss": 0.0727, "step": 1340 }, { "epoch": 0.01, "learning_rate": 0.0002989783614431086, "loss": 0.0714, "step": 1350 }, { "epoch": 0.01, "learning_rate": 0.0002989707937500946, "loss": 0.0657, "step": 1360 }, { "epoch": 0.01, "learning_rate": 0.00029896322605708057, "loss": 0.0631, "step": 1370 }, { "epoch": 0.01, "learning_rate": 0.00029895565836406655, "loss": 0.0658, "step": 1380 }, { "epoch": 0.01, "learning_rate": 0.00029894809067105253, "loss": 0.0652, "step": 1390 }, { "epoch": 0.01, "learning_rate": 0.0002989405229780385, "loss": 0.0743, "step": 1400 }, { "epoch": 0.01, "learning_rate": 0.0002989329552850245, "loss": 0.0639, "step": 1410 }, { "epoch": 0.01, "learning_rate": 0.00029892538759201053, "loss": 0.0642, "step": 1420 }, { "epoch": 0.01, "learning_rate": 0.0002989178198989965, "loss": 0.0706, "step": 1430 }, { "epoch": 0.01, "learning_rate": 0.0002989102522059825, "loss": 0.0656, "step": 1440 }, { "epoch": 0.01, "learning_rate": 0.0002989026845129685, "loss": 0.0714, "step": 1450 }, { "epoch": 0.01, "learning_rate": 0.00029889511681995446, "loss": 0.0703, "step": 1460 }, { "epoch": 0.01, "learning_rate": 0.00029888754912694044, "loss": 0.0675, "step": 1470 }, { "epoch": 0.01, "learning_rate": 0.0002988799814339265, "loss": 0.0703, "step": 1480 }, { "epoch": 0.01, "learning_rate": 0.00029887241374091246, "loss": 0.0671, "step": 1490 }, { "epoch": 0.01, "learning_rate": 0.00029886484604789844, "loss": 0.0668, "step": 1500 }, { "epoch": 0.01, "learning_rate": 0.0002988572783548844, "loss": 0.0688, "step": 1510 }, { "epoch": 0.01, "learning_rate": 0.0002988497106618704, "loss": 0.065, "step": 1520 }, { "epoch": 0.01, "learning_rate": 0.0002988421429688564, "loss": 0.0656, "step": 1530 }, { "epoch": 0.01, "learning_rate": 0.0002988345752758424, "loss": 0.0695, "step": 1540 }, { "epoch": 0.01, "learning_rate": 0.0002988270075828284, "loss": 0.0732, "step": 1550 }, { "epoch": 0.01, "learning_rate": 0.0002988194398898144, "loss": 0.0693, "step": 1560 }, { "epoch": 0.01, "learning_rate": 0.00029881187219680036, "loss": 0.0653, "step": 1570 }, { "epoch": 0.01, "learning_rate": 0.00029880430450378634, "loss": 0.0652, "step": 1580 }, { "epoch": 0.01, "learning_rate": 0.0002987967368107723, "loss": 0.0775, "step": 1590 }, { "epoch": 0.01, "learning_rate": 0.0002987891691177583, "loss": 0.069, "step": 1600 }, { "epoch": 0.01, "learning_rate": 0.00029878160142474434, "loss": 0.0666, "step": 1610 }, { "epoch": 0.01, "learning_rate": 0.0002987740337317303, "loss": 0.0642, "step": 1620 }, { "epoch": 0.01, "learning_rate": 0.0002987664660387163, "loss": 0.0659, "step": 1630 }, { "epoch": 0.01, "learning_rate": 0.0002987588983457023, "loss": 0.0657, "step": 1640 }, { "epoch": 0.01, "learning_rate": 0.00029875133065268827, "loss": 0.0655, "step": 1650 }, { "epoch": 0.01, "learning_rate": 0.00029874376295967425, "loss": 0.0605, "step": 1660 }, { "epoch": 0.01, "learning_rate": 0.0002987361952666603, "loss": 0.0676, "step": 1670 }, { "epoch": 0.01, "learning_rate": 0.00029872862757364627, "loss": 0.0536, "step": 1680 }, { "epoch": 0.01, "learning_rate": 0.00029872105988063225, "loss": 0.059, "step": 1690 }, { "epoch": 0.01, "learning_rate": 0.00029871349218761823, "loss": 0.059, "step": 1700 }, { "epoch": 0.01, "learning_rate": 0.0002987059244946042, "loss": 0.0586, "step": 1710 }, { "epoch": 0.01, "learning_rate": 0.0002986983568015902, "loss": 0.0583, "step": 1720 }, { "epoch": 0.01, "learning_rate": 0.0002986907891085762, "loss": 0.0589, "step": 1730 }, { "epoch": 0.01, "learning_rate": 0.0002986832214155622, "loss": 0.0582, "step": 1740 }, { "epoch": 0.01, "learning_rate": 0.0002986756537225482, "loss": 0.0708, "step": 1750 }, { "epoch": 0.01, "learning_rate": 0.00029866808602953417, "loss": 0.0637, "step": 1760 }, { "epoch": 0.01, "learning_rate": 0.00029866051833652015, "loss": 0.0645, "step": 1770 }, { "epoch": 0.01, "learning_rate": 0.00029865295064350613, "loss": 0.0582, "step": 1780 }, { "epoch": 0.01, "learning_rate": 0.0002986453829504921, "loss": 0.058, "step": 1790 }, { "epoch": 0.01, "learning_rate": 0.00029863781525747815, "loss": 0.0606, "step": 1800 }, { "epoch": 0.01, "learning_rate": 0.00029863024756446413, "loss": 0.0569, "step": 1810 }, { "epoch": 0.01, "learning_rate": 0.0002986226798714501, "loss": 0.0622, "step": 1820 }, { "epoch": 0.01, "learning_rate": 0.0002986151121784361, "loss": 0.0669, "step": 1830 }, { "epoch": 0.01, "learning_rate": 0.0002986075444854221, "loss": 0.0735, "step": 1840 }, { "epoch": 0.01, "learning_rate": 0.00029859997679240806, "loss": 0.0759, "step": 1850 }, { "epoch": 0.01, "learning_rate": 0.0002985924090993941, "loss": 0.0636, "step": 1860 }, { "epoch": 0.01, "learning_rate": 0.0002985848414063801, "loss": 0.0633, "step": 1870 }, { "epoch": 0.01, "learning_rate": 0.00029857727371336606, "loss": 0.064, "step": 1880 }, { "epoch": 0.01, "learning_rate": 0.000298569706020352, "loss": 0.0751, "step": 1890 }, { "epoch": 0.01, "learning_rate": 0.000298562138327338, "loss": 0.0611, "step": 1900 }, { "epoch": 0.01, "learning_rate": 0.000298554570634324, "loss": 0.0672, "step": 1910 }, { "epoch": 0.01, "learning_rate": 0.00029854700294131, "loss": 0.0659, "step": 1920 }, { "epoch": 0.01, "learning_rate": 0.00029853943524829596, "loss": 0.0645, "step": 1930 }, { "epoch": 0.01, "learning_rate": 0.00029853186755528195, "loss": 0.0679, "step": 1940 }, { "epoch": 0.01, "learning_rate": 0.0002985242998622679, "loss": 0.0619, "step": 1950 }, { "epoch": 0.01, "learning_rate": 0.00029851673216925396, "loss": 0.0564, "step": 1960 }, { "epoch": 0.01, "learning_rate": 0.00029850916447623994, "loss": 0.053, "step": 1970 }, { "epoch": 0.01, "learning_rate": 0.0002985015967832259, "loss": 0.0625, "step": 1980 }, { "epoch": 0.01, "learning_rate": 0.0002984940290902119, "loss": 0.063, "step": 1990 }, { "epoch": 0.01, "learning_rate": 0.0002984864613971979, "loss": 0.0629, "step": 2000 }, { "epoch": 0.01, "eval_cer": 0.9145119829365546, "eval_loss": 0.04564144089818001, "eval_runtime": 117.4132, "eval_samples_per_second": 17.034, "eval_steps_per_second": 4.258, "step": 2000 }, { "epoch": 0.01, "learning_rate": 0.00029847889370418387, "loss": 0.052, "step": 2010 }, { "epoch": 0.01, "learning_rate": 0.00029847132601116985, "loss": 0.0563, "step": 2020 }, { "epoch": 0.01, "learning_rate": 0.0002984637583181559, "loss": 0.0644, "step": 2030 }, { "epoch": 0.01, "learning_rate": 0.00029845619062514187, "loss": 0.0555, "step": 2040 }, { "epoch": 0.01, "learning_rate": 0.00029844862293212785, "loss": 0.0578, "step": 2050 }, { "epoch": 0.01, "learning_rate": 0.00029844105523911383, "loss": 0.0626, "step": 2060 }, { "epoch": 0.01, "learning_rate": 0.0002984334875460998, "loss": 0.0582, "step": 2070 }, { "epoch": 0.01, "learning_rate": 0.0002984259198530858, "loss": 0.0599, "step": 2080 }, { "epoch": 0.01, "learning_rate": 0.00029841835216007183, "loss": 0.0776, "step": 2090 }, { "epoch": 0.01, "learning_rate": 0.0002984107844670578, "loss": 0.0647, "step": 2100 }, { "epoch": 0.01, "learning_rate": 0.0002984032167740438, "loss": 0.0603, "step": 2110 }, { "epoch": 0.01, "learning_rate": 0.0002983956490810298, "loss": 0.0652, "step": 2120 }, { "epoch": 0.01, "learning_rate": 0.00029838808138801576, "loss": 0.0623, "step": 2130 }, { "epoch": 0.01, "learning_rate": 0.00029838051369500174, "loss": 0.0579, "step": 2140 }, { "epoch": 0.01, "learning_rate": 0.0002983729460019877, "loss": 0.0577, "step": 2150 }, { "epoch": 0.01, "learning_rate": 0.00029836537830897375, "loss": 0.0613, "step": 2160 }, { "epoch": 0.01, "learning_rate": 0.00029835781061595974, "loss": 0.0641, "step": 2170 }, { "epoch": 0.01, "learning_rate": 0.0002983502429229457, "loss": 0.0597, "step": 2180 }, { "epoch": 0.01, "learning_rate": 0.0002983426752299317, "loss": 0.0632, "step": 2190 }, { "epoch": 0.01, "learning_rate": 0.0002983351075369177, "loss": 0.0626, "step": 2200 }, { "epoch": 0.01, "learning_rate": 0.00029832753984390366, "loss": 0.0596, "step": 2210 }, { "epoch": 0.01, "learning_rate": 0.0002983199721508897, "loss": 0.0594, "step": 2220 }, { "epoch": 0.01, "learning_rate": 0.0002983124044578757, "loss": 0.0628, "step": 2230 }, { "epoch": 0.01, "learning_rate": 0.00029830483676486166, "loss": 0.0622, "step": 2240 }, { "epoch": 0.01, "learning_rate": 0.00029829726907184764, "loss": 0.07, "step": 2250 }, { "epoch": 0.01, "learning_rate": 0.0002982897013788336, "loss": 0.0618, "step": 2260 }, { "epoch": 0.01, "learning_rate": 0.0002982821336858196, "loss": 0.0629, "step": 2270 }, { "epoch": 0.01, "learning_rate": 0.00029827456599280564, "loss": 0.0638, "step": 2280 }, { "epoch": 0.01, "learning_rate": 0.0002982669982997916, "loss": 0.0545, "step": 2290 }, { "epoch": 0.01, "learning_rate": 0.0002982594306067776, "loss": 0.0578, "step": 2300 }, { "epoch": 0.01, "learning_rate": 0.0002982518629137636, "loss": 0.0553, "step": 2310 }, { "epoch": 0.01, "learning_rate": 0.00029824429522074957, "loss": 0.0535, "step": 2320 }, { "epoch": 0.01, "learning_rate": 0.00029823672752773555, "loss": 0.0537, "step": 2330 }, { "epoch": 0.01, "learning_rate": 0.00029822915983472153, "loss": 0.05, "step": 2340 }, { "epoch": 0.01, "learning_rate": 0.00029822159214170756, "loss": 0.0571, "step": 2350 }, { "epoch": 0.01, "learning_rate": 0.00029821402444869355, "loss": 0.0539, "step": 2360 }, { "epoch": 0.01, "learning_rate": 0.00029820645675567953, "loss": 0.0569, "step": 2370 }, { "epoch": 0.01, "learning_rate": 0.0002981988890626655, "loss": 0.0556, "step": 2380 }, { "epoch": 0.01, "learning_rate": 0.0002981913213696515, "loss": 0.0565, "step": 2390 }, { "epoch": 0.01, "learning_rate": 0.00029818375367663747, "loss": 0.0538, "step": 2400 }, { "epoch": 0.01, "learning_rate": 0.0002981761859836235, "loss": 0.0501, "step": 2410 }, { "epoch": 0.01, "learning_rate": 0.0002981686182906095, "loss": 0.0545, "step": 2420 }, { "epoch": 0.01, "learning_rate": 0.00029816105059759547, "loss": 0.0578, "step": 2430 }, { "epoch": 0.01, "learning_rate": 0.00029815348290458145, "loss": 0.052, "step": 2440 }, { "epoch": 0.01, "learning_rate": 0.00029814591521156743, "loss": 0.0606, "step": 2450 }, { "epoch": 0.01, "learning_rate": 0.0002981383475185534, "loss": 0.0619, "step": 2460 }, { "epoch": 0.01, "learning_rate": 0.00029813077982553945, "loss": 0.0514, "step": 2470 }, { "epoch": 0.01, "learning_rate": 0.00029812321213252543, "loss": 0.0585, "step": 2480 }, { "epoch": 0.01, "learning_rate": 0.0002981156444395114, "loss": 0.0566, "step": 2490 }, { "epoch": 0.01, "learning_rate": 0.0002981080767464974, "loss": 0.05, "step": 2500 }, { "epoch": 0.01, "learning_rate": 0.0002981005090534834, "loss": 0.0573, "step": 2510 }, { "epoch": 0.01, "learning_rate": 0.00029809294136046936, "loss": 0.0556, "step": 2520 }, { "epoch": 0.01, "learning_rate": 0.00029808537366745534, "loss": 0.0588, "step": 2530 }, { "epoch": 0.01, "learning_rate": 0.0002980778059744414, "loss": 0.0521, "step": 2540 }, { "epoch": 0.01, "learning_rate": 0.00029807023828142736, "loss": 0.0625, "step": 2550 }, { "epoch": 0.01, "learning_rate": 0.00029806267058841334, "loss": 0.077, "step": 2560 }, { "epoch": 0.01, "learning_rate": 0.0002980551028953993, "loss": 0.0558, "step": 2570 }, { "epoch": 0.01, "learning_rate": 0.0002980475352023853, "loss": 0.0603, "step": 2580 }, { "epoch": 0.01, "learning_rate": 0.0002980399675093713, "loss": 0.0523, "step": 2590 }, { "epoch": 0.01, "learning_rate": 0.0002980323998163573, "loss": 0.0529, "step": 2600 }, { "epoch": 0.01, "learning_rate": 0.0002980248321233433, "loss": 0.0549, "step": 2610 }, { "epoch": 0.01, "learning_rate": 0.0002980172644303293, "loss": 0.0527, "step": 2620 }, { "epoch": 0.01, "learning_rate": 0.00029800969673731526, "loss": 0.0494, "step": 2630 }, { "epoch": 0.01, "learning_rate": 0.00029800212904430124, "loss": 0.0557, "step": 2640 }, { "epoch": 0.01, "learning_rate": 0.0002979945613512872, "loss": 0.056, "step": 2650 }, { "epoch": 0.01, "learning_rate": 0.0002979869936582732, "loss": 0.0545, "step": 2660 }, { "epoch": 0.01, "learning_rate": 0.00029797942596525924, "loss": 0.0517, "step": 2670 }, { "epoch": 0.01, "learning_rate": 0.0002979718582722452, "loss": 0.052, "step": 2680 }, { "epoch": 0.01, "learning_rate": 0.0002979642905792312, "loss": 0.0551, "step": 2690 }, { "epoch": 0.01, "learning_rate": 0.0002979567228862172, "loss": 0.0493, "step": 2700 }, { "epoch": 0.01, "learning_rate": 0.00029794915519320317, "loss": 0.0518, "step": 2710 }, { "epoch": 0.01, "learning_rate": 0.00029794158750018915, "loss": 0.0528, "step": 2720 }, { "epoch": 0.01, "learning_rate": 0.0002979340198071752, "loss": 0.0472, "step": 2730 }, { "epoch": 0.01, "learning_rate": 0.00029792645211416117, "loss": 0.0541, "step": 2740 }, { "epoch": 0.01, "learning_rate": 0.00029791888442114715, "loss": 0.0504, "step": 2750 }, { "epoch": 0.01, "learning_rate": 0.00029791131672813313, "loss": 0.0628, "step": 2760 }, { "epoch": 0.01, "learning_rate": 0.0002979037490351191, "loss": 0.0572, "step": 2770 }, { "epoch": 0.01, "learning_rate": 0.0002978961813421051, "loss": 0.0541, "step": 2780 }, { "epoch": 0.01, "learning_rate": 0.00029788861364909113, "loss": 0.0556, "step": 2790 }, { "epoch": 0.01, "learning_rate": 0.0002978810459560771, "loss": 0.0557, "step": 2800 }, { "epoch": 0.01, "learning_rate": 0.0002978734782630631, "loss": 0.0725, "step": 2810 }, { "epoch": 0.01, "learning_rate": 0.00029786591057004907, "loss": 0.0681, "step": 2820 }, { "epoch": 0.01, "learning_rate": 0.00029785834287703505, "loss": 0.0572, "step": 2830 }, { "epoch": 0.01, "learning_rate": 0.00029785077518402103, "loss": 0.0536, "step": 2840 }, { "epoch": 0.01, "learning_rate": 0.000297843207491007, "loss": 0.0545, "step": 2850 }, { "epoch": 0.01, "learning_rate": 0.00029783563979799305, "loss": 0.0573, "step": 2860 }, { "epoch": 0.01, "learning_rate": 0.00029782807210497903, "loss": 0.0519, "step": 2870 }, { "epoch": 0.01, "learning_rate": 0.000297820504411965, "loss": 0.0539, "step": 2880 }, { "epoch": 0.01, "learning_rate": 0.000297812936718951, "loss": 0.0611, "step": 2890 }, { "epoch": 0.01, "learning_rate": 0.000297805369025937, "loss": 0.0533, "step": 2900 }, { "epoch": 0.01, "learning_rate": 0.00029779780133292296, "loss": 0.0537, "step": 2910 }, { "epoch": 0.01, "learning_rate": 0.000297790233639909, "loss": 0.0529, "step": 2920 }, { "epoch": 0.01, "learning_rate": 0.000297782665946895, "loss": 0.0539, "step": 2930 }, { "epoch": 0.01, "learning_rate": 0.00029777509825388096, "loss": 0.0511, "step": 2940 }, { "epoch": 0.01, "learning_rate": 0.00029776753056086694, "loss": 0.0568, "step": 2950 }, { "epoch": 0.01, "learning_rate": 0.0002977599628678529, "loss": 0.0534, "step": 2960 }, { "epoch": 0.01, "learning_rate": 0.0002977523951748389, "loss": 0.0514, "step": 2970 }, { "epoch": 0.02, "learning_rate": 0.00029774482748182494, "loss": 0.059, "step": 2980 }, { "epoch": 0.02, "learning_rate": 0.0002977372597888109, "loss": 0.06, "step": 2990 }, { "epoch": 0.02, "learning_rate": 0.0002977296920957969, "loss": 0.071, "step": 3000 }, { "epoch": 0.02, "eval_cer": 0.9145605027428246, "eval_loss": 0.04296322166919708, "eval_runtime": 117.3539, "eval_samples_per_second": 17.042, "eval_steps_per_second": 4.261, "step": 3000 }, { "epoch": 0.02, "learning_rate": 0.0002977221244027829, "loss": 0.0634, "step": 3010 }, { "epoch": 0.02, "learning_rate": 0.00029771455670976886, "loss": 0.055, "step": 3020 }, { "epoch": 0.02, "learning_rate": 0.00029770698901675484, "loss": 0.0572, "step": 3030 }, { "epoch": 0.02, "learning_rate": 0.0002976994213237408, "loss": 0.0522, "step": 3040 }, { "epoch": 0.02, "learning_rate": 0.00029769185363072686, "loss": 0.0582, "step": 3050 }, { "epoch": 0.02, "learning_rate": 0.00029768428593771284, "loss": 0.0513, "step": 3060 }, { "epoch": 0.02, "learning_rate": 0.0002976767182446988, "loss": 0.0565, "step": 3070 }, { "epoch": 0.02, "learning_rate": 0.0002976691505516848, "loss": 0.0509, "step": 3080 }, { "epoch": 0.02, "learning_rate": 0.0002976615828586708, "loss": 0.0587, "step": 3090 }, { "epoch": 0.02, "learning_rate": 0.00029765401516565677, "loss": 0.0504, "step": 3100 }, { "epoch": 0.02, "learning_rate": 0.0002976464474726428, "loss": 0.053, "step": 3110 }, { "epoch": 0.02, "learning_rate": 0.0002976388797796288, "loss": 0.0575, "step": 3120 }, { "epoch": 0.02, "learning_rate": 0.00029763131208661477, "loss": 0.069, "step": 3130 }, { "epoch": 0.02, "learning_rate": 0.00029762374439360075, "loss": 0.0556, "step": 3140 }, { "epoch": 0.02, "learning_rate": 0.00029761617670058673, "loss": 0.0563, "step": 3150 }, { "epoch": 0.02, "learning_rate": 0.0002976086090075727, "loss": 0.0533, "step": 3160 }, { "epoch": 0.02, "learning_rate": 0.0002976010413145587, "loss": 0.0604, "step": 3170 }, { "epoch": 0.02, "learning_rate": 0.0002975934736215447, "loss": 0.0548, "step": 3180 }, { "epoch": 0.02, "learning_rate": 0.00029758590592853066, "loss": 0.0575, "step": 3190 }, { "epoch": 0.02, "learning_rate": 0.00029757833823551664, "loss": 0.0544, "step": 3200 }, { "epoch": 0.02, "learning_rate": 0.0002975707705425026, "loss": 0.0557, "step": 3210 }, { "epoch": 0.02, "learning_rate": 0.00029756320284948865, "loss": 0.0545, "step": 3220 }, { "epoch": 0.02, "learning_rate": 0.00029755563515647464, "loss": 0.0549, "step": 3230 }, { "epoch": 0.02, "learning_rate": 0.0002975480674634606, "loss": 0.0504, "step": 3240 }, { "epoch": 0.02, "learning_rate": 0.0002975404997704466, "loss": 0.0501, "step": 3250 }, { "epoch": 0.02, "learning_rate": 0.0002975329320774326, "loss": 0.0545, "step": 3260 }, { "epoch": 0.02, "learning_rate": 0.00029752536438441856, "loss": 0.0453, "step": 3270 }, { "epoch": 0.02, "learning_rate": 0.0002975177966914046, "loss": 0.0476, "step": 3280 }, { "epoch": 0.02, "learning_rate": 0.0002975102289983906, "loss": 0.0596, "step": 3290 }, { "epoch": 0.02, "learning_rate": 0.00029750266130537656, "loss": 0.06, "step": 3300 }, { "epoch": 0.02, "learning_rate": 0.00029749509361236254, "loss": 0.0556, "step": 3310 }, { "epoch": 0.02, "learning_rate": 0.0002974875259193485, "loss": 0.0532, "step": 3320 }, { "epoch": 0.02, "learning_rate": 0.0002974799582263345, "loss": 0.0508, "step": 3330 }, { "epoch": 0.02, "learning_rate": 0.00029747239053332054, "loss": 0.0553, "step": 3340 }, { "epoch": 0.02, "learning_rate": 0.0002974648228403065, "loss": 0.0571, "step": 3350 }, { "epoch": 0.02, "learning_rate": 0.0002974572551472925, "loss": 0.0518, "step": 3360 }, { "epoch": 0.02, "learning_rate": 0.0002974496874542785, "loss": 0.0596, "step": 3370 }, { "epoch": 0.02, "learning_rate": 0.00029744211976126447, "loss": 0.0473, "step": 3380 }, { "epoch": 0.02, "learning_rate": 0.00029743455206825045, "loss": 0.0541, "step": 3390 }, { "epoch": 0.02, "learning_rate": 0.00029742698437523643, "loss": 0.0475, "step": 3400 }, { "epoch": 0.02, "learning_rate": 0.00029741941668222246, "loss": 0.0535, "step": 3410 }, { "epoch": 0.02, "learning_rate": 0.00029741184898920845, "loss": 0.0912, "step": 3420 }, { "epoch": 0.02, "learning_rate": 0.00029740428129619443, "loss": 0.0654, "step": 3430 }, { "epoch": 0.02, "learning_rate": 0.0002973967136031804, "loss": 0.1074, "step": 3440 }, { "epoch": 0.02, "learning_rate": 0.0002973891459101664, "loss": 0.0576, "step": 3450 }, { "epoch": 0.02, "learning_rate": 0.00029738157821715237, "loss": 0.0517, "step": 3460 }, { "epoch": 0.02, "learning_rate": 0.0002973740105241384, "loss": 0.0604, "step": 3470 }, { "epoch": 0.02, "learning_rate": 0.0002973664428311244, "loss": 0.0488, "step": 3480 }, { "epoch": 0.02, "learning_rate": 0.00029735887513811037, "loss": 0.0484, "step": 3490 }, { "epoch": 0.02, "learning_rate": 0.00029735130744509635, "loss": 0.0547, "step": 3500 }, { "epoch": 0.02, "learning_rate": 0.00029734373975208233, "loss": 0.0545, "step": 3510 }, { "epoch": 0.02, "learning_rate": 0.0002973361720590683, "loss": 0.0482, "step": 3520 }, { "epoch": 0.02, "learning_rate": 0.00029732860436605435, "loss": 0.0554, "step": 3530 }, { "epoch": 0.02, "learning_rate": 0.00029732103667304033, "loss": 0.0561, "step": 3540 }, { "epoch": 0.02, "learning_rate": 0.0002973134689800263, "loss": 0.0556, "step": 3550 }, { "epoch": 0.02, "learning_rate": 0.0002973059012870123, "loss": 0.0797, "step": 3560 }, { "epoch": 0.02, "learning_rate": 0.0002972983335939983, "loss": 0.0609, "step": 3570 }, { "epoch": 0.02, "learning_rate": 0.00029729076590098426, "loss": 0.1602, "step": 3580 }, { "epoch": 0.02, "learning_rate": 0.00029728319820797024, "loss": 0.0635, "step": 3590 }, { "epoch": 0.02, "learning_rate": 0.0002972756305149563, "loss": 0.0597, "step": 3600 }, { "epoch": 0.02, "learning_rate": 0.00029726806282194226, "loss": 0.0554, "step": 3610 }, { "epoch": 0.02, "learning_rate": 0.00029726049512892824, "loss": 0.0558, "step": 3620 }, { "epoch": 0.02, "learning_rate": 0.0002972529274359142, "loss": 0.0559, "step": 3630 }, { "epoch": 0.02, "learning_rate": 0.0002972453597429002, "loss": 0.0551, "step": 3640 }, { "epoch": 0.02, "learning_rate": 0.0002972377920498862, "loss": 0.0566, "step": 3650 }, { "epoch": 0.02, "learning_rate": 0.0002972302243568722, "loss": 0.0545, "step": 3660 }, { "epoch": 0.02, "learning_rate": 0.0002972226566638582, "loss": 0.0498, "step": 3670 }, { "epoch": 0.02, "learning_rate": 0.0002972150889708442, "loss": 0.052, "step": 3680 }, { "epoch": 0.02, "learning_rate": 0.00029720752127783016, "loss": 0.0546, "step": 3690 }, { "epoch": 0.02, "learning_rate": 0.00029719995358481614, "loss": 0.0547, "step": 3700 }, { "epoch": 0.02, "learning_rate": 0.0002971923858918021, "loss": 0.0474, "step": 3710 }, { "epoch": 0.02, "learning_rate": 0.0002971848181987881, "loss": 0.0519, "step": 3720 }, { "epoch": 0.02, "learning_rate": 0.00029717725050577414, "loss": 0.0477, "step": 3730 }, { "epoch": 0.02, "learning_rate": 0.0002971696828127601, "loss": 0.0469, "step": 3740 }, { "epoch": 0.02, "learning_rate": 0.0002971621151197461, "loss": 0.0513, "step": 3750 }, { "epoch": 0.02, "learning_rate": 0.0002971545474267321, "loss": 0.0462, "step": 3760 }, { "epoch": 0.02, "learning_rate": 0.00029714697973371807, "loss": 0.0553, "step": 3770 }, { "epoch": 0.02, "learning_rate": 0.00029713941204070405, "loss": 0.0615, "step": 3780 }, { "epoch": 0.02, "learning_rate": 0.0002971318443476901, "loss": 0.0498, "step": 3790 }, { "epoch": 0.02, "learning_rate": 0.00029712427665467607, "loss": 0.0577, "step": 3800 }, { "epoch": 0.02, "learning_rate": 0.00029711670896166205, "loss": 0.0521, "step": 3810 }, { "epoch": 0.02, "learning_rate": 0.00029710914126864803, "loss": 0.0528, "step": 3820 }, { "epoch": 0.02, "learning_rate": 0.000297101573575634, "loss": 0.0476, "step": 3830 }, { "epoch": 0.02, "learning_rate": 0.00029709400588262, "loss": 0.0474, "step": 3840 }, { "epoch": 0.02, "learning_rate": 0.00029708643818960603, "loss": 0.0548, "step": 3850 }, { "epoch": 0.02, "learning_rate": 0.000297078870496592, "loss": 0.0538, "step": 3860 }, { "epoch": 0.02, "learning_rate": 0.000297071302803578, "loss": 0.0453, "step": 3870 }, { "epoch": 0.02, "learning_rate": 0.00029706373511056397, "loss": 0.052, "step": 3880 }, { "epoch": 0.02, "learning_rate": 0.00029705616741754995, "loss": 0.0486, "step": 3890 }, { "epoch": 0.02, "learning_rate": 0.00029704859972453593, "loss": 0.0462, "step": 3900 }, { "epoch": 0.02, "learning_rate": 0.0002970410320315219, "loss": 0.0425, "step": 3910 }, { "epoch": 0.02, "learning_rate": 0.00029703346433850795, "loss": 0.0561, "step": 3920 }, { "epoch": 0.02, "learning_rate": 0.00029702589664549393, "loss": 0.0472, "step": 3930 }, { "epoch": 0.02, "learning_rate": 0.0002970183289524799, "loss": 0.0526, "step": 3940 }, { "epoch": 0.02, "learning_rate": 0.0002970107612594659, "loss": 0.047, "step": 3950 }, { "epoch": 0.02, "learning_rate": 0.0002970031935664519, "loss": 0.051, "step": 3960 }, { "epoch": 0.02, "learning_rate": 0.00029699562587343786, "loss": 0.0456, "step": 3970 }, { "epoch": 0.02, "learning_rate": 0.0002969880581804239, "loss": 0.0425, "step": 3980 }, { "epoch": 0.02, "learning_rate": 0.0002969804904874099, "loss": 0.0543, "step": 3990 }, { "epoch": 0.02, "learning_rate": 0.00029697292279439586, "loss": 0.0542, "step": 4000 }, { "epoch": 0.02, "eval_cer": 0.9145430356125674, "eval_loss": 0.038954902440309525, "eval_runtime": 117.4435, "eval_samples_per_second": 17.029, "eval_steps_per_second": 4.257, "step": 4000 }, { "epoch": 0.02, "learning_rate": 0.00029696535510138184, "loss": 0.0502, "step": 4010 }, { "epoch": 0.02, "learning_rate": 0.0002969577874083678, "loss": 0.0453, "step": 4020 }, { "epoch": 0.02, "learning_rate": 0.0002969502197153538, "loss": 0.0519, "step": 4030 }, { "epoch": 0.02, "learning_rate": 0.00029694265202233984, "loss": 0.0464, "step": 4040 }, { "epoch": 0.02, "learning_rate": 0.0002969350843293258, "loss": 0.0494, "step": 4050 }, { "epoch": 0.02, "learning_rate": 0.0002969275166363118, "loss": 0.0455, "step": 4060 }, { "epoch": 0.02, "learning_rate": 0.0002969199489432978, "loss": 0.0543, "step": 4070 }, { "epoch": 0.02, "learning_rate": 0.00029691238125028376, "loss": 0.0464, "step": 4080 }, { "epoch": 0.02, "learning_rate": 0.00029690481355726974, "loss": 0.0518, "step": 4090 }, { "epoch": 0.02, "learning_rate": 0.0002968972458642557, "loss": 0.0526, "step": 4100 }, { "epoch": 0.02, "learning_rate": 0.00029688967817124176, "loss": 0.0541, "step": 4110 }, { "epoch": 0.02, "learning_rate": 0.00029688211047822774, "loss": 0.0511, "step": 4120 }, { "epoch": 0.02, "learning_rate": 0.0002968745427852137, "loss": 0.0495, "step": 4130 }, { "epoch": 0.02, "learning_rate": 0.0002968669750921997, "loss": 0.0424, "step": 4140 }, { "epoch": 0.02, "learning_rate": 0.0002968594073991857, "loss": 0.0516, "step": 4150 }, { "epoch": 0.02, "learning_rate": 0.00029685183970617167, "loss": 0.0454, "step": 4160 }, { "epoch": 0.02, "learning_rate": 0.0002968442720131577, "loss": 0.0522, "step": 4170 }, { "epoch": 0.02, "learning_rate": 0.0002968367043201437, "loss": 0.0516, "step": 4180 }, { "epoch": 0.02, "learning_rate": 0.00029682913662712967, "loss": 0.0462, "step": 4190 }, { "epoch": 0.02, "learning_rate": 0.00029682156893411565, "loss": 0.0546, "step": 4200 }, { "epoch": 0.02, "learning_rate": 0.00029681400124110163, "loss": 0.0444, "step": 4210 }, { "epoch": 0.02, "learning_rate": 0.0002968064335480876, "loss": 0.0504, "step": 4220 }, { "epoch": 0.02, "learning_rate": 0.0002967988658550736, "loss": 0.0566, "step": 4230 }, { "epoch": 0.02, "learning_rate": 0.00029679129816205963, "loss": 0.0473, "step": 4240 }, { "epoch": 0.02, "learning_rate": 0.0002967837304690456, "loss": 0.048, "step": 4250 }, { "epoch": 0.02, "learning_rate": 0.0002967761627760316, "loss": 0.049, "step": 4260 }, { "epoch": 0.02, "learning_rate": 0.0002967685950830176, "loss": 0.0518, "step": 4270 }, { "epoch": 0.02, "learning_rate": 0.00029676102739000355, "loss": 0.0496, "step": 4280 }, { "epoch": 0.02, "learning_rate": 0.00029675345969698954, "loss": 0.0528, "step": 4290 }, { "epoch": 0.02, "learning_rate": 0.00029674589200397557, "loss": 0.0442, "step": 4300 }, { "epoch": 0.02, "learning_rate": 0.00029673832431096155, "loss": 0.0463, "step": 4310 }, { "epoch": 0.02, "learning_rate": 0.00029673075661794753, "loss": 0.0494, "step": 4320 }, { "epoch": 0.02, "learning_rate": 0.0002967231889249335, "loss": 0.0448, "step": 4330 }, { "epoch": 0.02, "learning_rate": 0.0002967156212319195, "loss": 0.0654, "step": 4340 }, { "epoch": 0.02, "learning_rate": 0.0002967080535389055, "loss": 0.0627, "step": 4350 }, { "epoch": 0.02, "learning_rate": 0.0002967004858458915, "loss": 0.0456, "step": 4360 }, { "epoch": 0.02, "learning_rate": 0.0002966929181528775, "loss": 0.0504, "step": 4370 }, { "epoch": 0.02, "learning_rate": 0.0002966853504598635, "loss": 0.046, "step": 4380 }, { "epoch": 0.02, "learning_rate": 0.00029667778276684946, "loss": 0.046, "step": 4390 }, { "epoch": 0.02, "learning_rate": 0.00029667021507383544, "loss": 0.0498, "step": 4400 }, { "epoch": 0.02, "learning_rate": 0.0002966626473808214, "loss": 0.0465, "step": 4410 }, { "epoch": 0.02, "learning_rate": 0.0002966550796878074, "loss": 0.0443, "step": 4420 }, { "epoch": 0.02, "learning_rate": 0.0002966475119947934, "loss": 0.0482, "step": 4430 }, { "epoch": 0.02, "learning_rate": 0.00029663994430177937, "loss": 0.0453, "step": 4440 }, { "epoch": 0.02, "learning_rate": 0.00029663237660876535, "loss": 0.0473, "step": 4450 }, { "epoch": 0.02, "learning_rate": 0.00029662480891575133, "loss": 0.0463, "step": 4460 }, { "epoch": 0.02, "learning_rate": 0.00029661724122273736, "loss": 0.0426, "step": 4470 }, { "epoch": 0.02, "learning_rate": 0.00029660967352972335, "loss": 0.045, "step": 4480 }, { "epoch": 0.02, "learning_rate": 0.00029660210583670933, "loss": 0.0493, "step": 4490 }, { "epoch": 0.02, "learning_rate": 0.0002965945381436953, "loss": 0.0462, "step": 4500 }, { "epoch": 0.02, "learning_rate": 0.0002965869704506813, "loss": 0.047, "step": 4510 }, { "epoch": 0.02, "learning_rate": 0.00029657940275766727, "loss": 0.048, "step": 4520 }, { "epoch": 0.02, "learning_rate": 0.0002965718350646533, "loss": 0.0553, "step": 4530 }, { "epoch": 0.02, "learning_rate": 0.0002965642673716393, "loss": 0.0486, "step": 4540 }, { "epoch": 0.02, "learning_rate": 0.00029655669967862527, "loss": 0.0472, "step": 4550 }, { "epoch": 0.02, "learning_rate": 0.00029654913198561125, "loss": 0.0441, "step": 4560 }, { "epoch": 0.02, "learning_rate": 0.00029654156429259723, "loss": 0.0496, "step": 4570 }, { "epoch": 0.02, "learning_rate": 0.0002965339965995832, "loss": 0.0417, "step": 4580 }, { "epoch": 0.02, "learning_rate": 0.00029652642890656925, "loss": 0.0459, "step": 4590 }, { "epoch": 0.02, "learning_rate": 0.00029651886121355523, "loss": 0.0412, "step": 4600 }, { "epoch": 0.02, "learning_rate": 0.0002965112935205412, "loss": 0.0461, "step": 4610 }, { "epoch": 0.02, "learning_rate": 0.0002965037258275272, "loss": 0.0502, "step": 4620 }, { "epoch": 0.02, "learning_rate": 0.0002964961581345132, "loss": 0.0614, "step": 4630 }, { "epoch": 0.02, "learning_rate": 0.00029648859044149916, "loss": 0.0506, "step": 4640 }, { "epoch": 0.02, "learning_rate": 0.00029648102274848514, "loss": 0.0487, "step": 4650 }, { "epoch": 0.02, "learning_rate": 0.0002964734550554712, "loss": 0.0505, "step": 4660 }, { "epoch": 0.02, "learning_rate": 0.00029646588736245716, "loss": 0.0527, "step": 4670 }, { "epoch": 0.02, "learning_rate": 0.00029645831966944314, "loss": 0.0573, "step": 4680 }, { "epoch": 0.02, "learning_rate": 0.0002964507519764291, "loss": 0.0635, "step": 4690 }, { "epoch": 0.02, "learning_rate": 0.0002964431842834151, "loss": 0.0447, "step": 4700 }, { "epoch": 0.02, "learning_rate": 0.0002964356165904011, "loss": 0.0517, "step": 4710 }, { "epoch": 0.02, "learning_rate": 0.0002964280488973871, "loss": 0.0665, "step": 4720 }, { "epoch": 0.02, "learning_rate": 0.0002964204812043731, "loss": 0.0506, "step": 4730 }, { "epoch": 0.02, "learning_rate": 0.0002964129135113591, "loss": 0.0562, "step": 4740 }, { "epoch": 0.02, "learning_rate": 0.00029640534581834506, "loss": 0.052, "step": 4750 }, { "epoch": 0.02, "learning_rate": 0.00029639777812533104, "loss": 0.0505, "step": 4760 }, { "epoch": 0.02, "learning_rate": 0.000296390210432317, "loss": 0.0509, "step": 4770 }, { "epoch": 0.02, "learning_rate": 0.000296382642739303, "loss": 0.046, "step": 4780 }, { "epoch": 0.02, "learning_rate": 0.00029637507504628904, "loss": 0.0936, "step": 4790 }, { "epoch": 0.02, "learning_rate": 0.000296367507353275, "loss": 0.0593, "step": 4800 }, { "epoch": 0.02, "learning_rate": 0.000296359939660261, "loss": 0.0514, "step": 4810 }, { "epoch": 0.02, "learning_rate": 0.000296352371967247, "loss": 0.0491, "step": 4820 }, { "epoch": 0.02, "learning_rate": 0.00029634480427423297, "loss": 0.0521, "step": 4830 }, { "epoch": 0.02, "learning_rate": 0.00029633723658121895, "loss": 0.0521, "step": 4840 }, { "epoch": 0.02, "learning_rate": 0.000296329668888205, "loss": 0.0527, "step": 4850 }, { "epoch": 0.02, "learning_rate": 0.00029632210119519097, "loss": 0.0649, "step": 4860 }, { "epoch": 0.02, "learning_rate": 0.00029631453350217695, "loss": 0.0527, "step": 4870 }, { "epoch": 0.02, "learning_rate": 0.00029630696580916293, "loss": 0.0539, "step": 4880 }, { "epoch": 0.02, "learning_rate": 0.0002962993981161489, "loss": 0.0478, "step": 4890 }, { "epoch": 0.02, "learning_rate": 0.0002962918304231349, "loss": 0.0465, "step": 4900 }, { "epoch": 0.02, "learning_rate": 0.00029628426273012093, "loss": 0.0743, "step": 4910 }, { "epoch": 0.02, "learning_rate": 0.0002962766950371069, "loss": 0.073, "step": 4920 }, { "epoch": 0.02, "learning_rate": 0.0002962691273440929, "loss": 0.0692, "step": 4930 }, { "epoch": 0.02, "learning_rate": 0.00029626155965107887, "loss": 0.044, "step": 4940 }, { "epoch": 0.02, "learning_rate": 0.00029625399195806485, "loss": 0.0441, "step": 4950 }, { "epoch": 0.03, "learning_rate": 0.00029624642426505083, "loss": 0.0501, "step": 4960 }, { "epoch": 0.03, "learning_rate": 0.0002962388565720368, "loss": 0.0458, "step": 4970 }, { "epoch": 0.03, "learning_rate": 0.00029623128887902285, "loss": 0.0422, "step": 4980 }, { "epoch": 0.03, "learning_rate": 0.00029622372118600883, "loss": 0.0495, "step": 4990 }, { "epoch": 0.03, "learning_rate": 0.0002962161534929948, "loss": 0.0464, "step": 5000 }, { "epoch": 0.03, "eval_cer": 0.9145071309559275, "eval_loss": 0.03470829501748085, "eval_runtime": 117.4598, "eval_samples_per_second": 17.027, "eval_steps_per_second": 4.257, "step": 5000 }, { "epoch": 0.03, "learning_rate": 0.0002962085857999808, "loss": 0.0427, "step": 5010 }, { "epoch": 0.03, "learning_rate": 0.0002962010181069668, "loss": 0.0465, "step": 5020 }, { "epoch": 0.03, "learning_rate": 0.00029619345041395276, "loss": 0.0453, "step": 5030 }, { "epoch": 0.03, "learning_rate": 0.0002961858827209388, "loss": 0.0415, "step": 5040 }, { "epoch": 0.03, "learning_rate": 0.0002961783150279248, "loss": 0.0476, "step": 5050 }, { "epoch": 0.03, "learning_rate": 0.00029617074733491076, "loss": 0.0447, "step": 5060 }, { "epoch": 0.03, "learning_rate": 0.00029616317964189674, "loss": 0.0512, "step": 5070 }, { "epoch": 0.03, "learning_rate": 0.0002961556119488827, "loss": 0.0486, "step": 5080 }, { "epoch": 0.03, "learning_rate": 0.0002961480442558687, "loss": 0.0486, "step": 5090 }, { "epoch": 0.03, "learning_rate": 0.00029614047656285474, "loss": 0.0493, "step": 5100 }, { "epoch": 0.03, "learning_rate": 0.0002961329088698407, "loss": 0.0504, "step": 5110 }, { "epoch": 0.03, "learning_rate": 0.0002961253411768267, "loss": 0.0528, "step": 5120 }, { "epoch": 0.03, "learning_rate": 0.0002961177734838127, "loss": 0.046, "step": 5130 }, { "epoch": 0.03, "learning_rate": 0.00029611020579079866, "loss": 0.0519, "step": 5140 }, { "epoch": 0.03, "learning_rate": 0.00029610263809778465, "loss": 0.0498, "step": 5150 }, { "epoch": 0.03, "learning_rate": 0.0002960950704047706, "loss": 0.0432, "step": 5160 }, { "epoch": 0.03, "learning_rate": 0.00029608750271175666, "loss": 0.0501, "step": 5170 }, { "epoch": 0.03, "learning_rate": 0.00029607993501874264, "loss": 0.0449, "step": 5180 }, { "epoch": 0.03, "learning_rate": 0.0002960723673257286, "loss": 0.0499, "step": 5190 }, { "epoch": 0.03, "learning_rate": 0.0002960647996327146, "loss": 0.0484, "step": 5200 }, { "epoch": 0.03, "learning_rate": 0.0002960572319397006, "loss": 0.0483, "step": 5210 }, { "epoch": 0.03, "learning_rate": 0.00029604966424668657, "loss": 0.0518, "step": 5220 }, { "epoch": 0.03, "learning_rate": 0.0002960420965536726, "loss": 0.0527, "step": 5230 }, { "epoch": 0.03, "learning_rate": 0.0002960345288606586, "loss": 0.0436, "step": 5240 }, { "epoch": 0.03, "learning_rate": 0.00029602696116764457, "loss": 0.0591, "step": 5250 }, { "epoch": 0.03, "learning_rate": 0.00029601939347463055, "loss": 0.0473, "step": 5260 }, { "epoch": 0.03, "learning_rate": 0.00029601182578161653, "loss": 0.0429, "step": 5270 }, { "epoch": 0.03, "learning_rate": 0.0002960042580886025, "loss": 0.0483, "step": 5280 }, { "epoch": 0.03, "learning_rate": 0.0002959966903955885, "loss": 0.0446, "step": 5290 }, { "epoch": 0.03, "learning_rate": 0.00029598912270257453, "loss": 0.0484, "step": 5300 }, { "epoch": 0.03, "learning_rate": 0.0002959815550095605, "loss": 0.0453, "step": 5310 }, { "epoch": 0.03, "learning_rate": 0.0002959739873165465, "loss": 0.0419, "step": 5320 }, { "epoch": 0.03, "learning_rate": 0.0002959664196235325, "loss": 0.0449, "step": 5330 }, { "epoch": 0.03, "learning_rate": 0.00029595885193051846, "loss": 0.0401, "step": 5340 }, { "epoch": 0.03, "learning_rate": 0.00029595128423750444, "loss": 0.0498, "step": 5350 }, { "epoch": 0.03, "learning_rate": 0.00029594371654449047, "loss": 0.0448, "step": 5360 }, { "epoch": 0.03, "learning_rate": 0.00029593614885147645, "loss": 0.0476, "step": 5370 }, { "epoch": 0.03, "learning_rate": 0.00029592858115846244, "loss": 0.0491, "step": 5380 }, { "epoch": 0.03, "learning_rate": 0.0002959210134654484, "loss": 0.0471, "step": 5390 }, { "epoch": 0.03, "learning_rate": 0.0002959134457724344, "loss": 0.0448, "step": 5400 }, { "epoch": 0.03, "learning_rate": 0.0002959058780794204, "loss": 0.0648, "step": 5410 }, { "epoch": 0.03, "learning_rate": 0.0002958983103864064, "loss": 0.0482, "step": 5420 }, { "epoch": 0.03, "learning_rate": 0.0002958907426933924, "loss": 0.0484, "step": 5430 }, { "epoch": 0.03, "learning_rate": 0.0002958831750003784, "loss": 0.0545, "step": 5440 }, { "epoch": 0.03, "learning_rate": 0.00029587560730736436, "loss": 0.0501, "step": 5450 }, { "epoch": 0.03, "learning_rate": 0.00029586803961435034, "loss": 0.0431, "step": 5460 }, { "epoch": 0.03, "learning_rate": 0.0002958604719213363, "loss": 0.0424, "step": 5470 }, { "epoch": 0.03, "learning_rate": 0.0002958529042283223, "loss": 0.0434, "step": 5480 }, { "epoch": 0.03, "learning_rate": 0.00029584533653530834, "loss": 0.0432, "step": 5490 }, { "epoch": 0.03, "learning_rate": 0.0002958377688422943, "loss": 0.0436, "step": 5500 }, { "epoch": 0.03, "learning_rate": 0.0002958302011492803, "loss": 0.0486, "step": 5510 }, { "epoch": 0.03, "learning_rate": 0.0002958226334562663, "loss": 0.0478, "step": 5520 }, { "epoch": 0.03, "learning_rate": 0.00029581506576325227, "loss": 0.0438, "step": 5530 }, { "epoch": 0.03, "learning_rate": 0.00029580749807023825, "loss": 0.0386, "step": 5540 }, { "epoch": 0.03, "learning_rate": 0.0002957999303772243, "loss": 0.0411, "step": 5550 }, { "epoch": 0.03, "learning_rate": 0.00029579236268421026, "loss": 0.0462, "step": 5560 }, { "epoch": 0.03, "learning_rate": 0.00029578479499119625, "loss": 0.0436, "step": 5570 }, { "epoch": 0.03, "learning_rate": 0.0002957772272981822, "loss": 0.0457, "step": 5580 }, { "epoch": 0.03, "learning_rate": 0.0002957696596051682, "loss": 0.0425, "step": 5590 }, { "epoch": 0.03, "learning_rate": 0.0002957620919121542, "loss": 0.0486, "step": 5600 }, { "epoch": 0.03, "learning_rate": 0.0002957545242191402, "loss": 0.0496, "step": 5610 }, { "epoch": 0.03, "learning_rate": 0.0002957469565261262, "loss": 0.0534, "step": 5620 }, { "epoch": 0.03, "learning_rate": 0.0002957393888331122, "loss": 0.0385, "step": 5630 }, { "epoch": 0.03, "learning_rate": 0.00029573182114009817, "loss": 0.0467, "step": 5640 }, { "epoch": 0.03, "learning_rate": 0.00029572425344708415, "loss": 0.0478, "step": 5650 }, { "epoch": 0.03, "learning_rate": 0.00029571668575407013, "loss": 0.0406, "step": 5660 }, { "epoch": 0.03, "learning_rate": 0.0002957091180610561, "loss": 0.0493, "step": 5670 }, { "epoch": 0.03, "learning_rate": 0.0002957015503680421, "loss": 0.0448, "step": 5680 }, { "epoch": 0.03, "learning_rate": 0.0002956939826750281, "loss": 0.0465, "step": 5690 }, { "epoch": 0.03, "learning_rate": 0.00029568641498201406, "loss": 0.0485, "step": 5700 }, { "epoch": 0.03, "learning_rate": 0.00029567884728900004, "loss": 0.044, "step": 5710 }, { "epoch": 0.03, "learning_rate": 0.0002956712795959861, "loss": 0.0454, "step": 5720 }, { "epoch": 0.03, "learning_rate": 0.00029566371190297206, "loss": 0.0488, "step": 5730 }, { "epoch": 0.03, "learning_rate": 0.00029565614420995804, "loss": 0.042, "step": 5740 }, { "epoch": 0.03, "learning_rate": 0.000295648576516944, "loss": 0.046, "step": 5750 }, { "epoch": 0.03, "learning_rate": 0.00029564100882393, "loss": 0.0447, "step": 5760 }, { "epoch": 0.03, "learning_rate": 0.000295633441130916, "loss": 0.043, "step": 5770 }, { "epoch": 0.03, "learning_rate": 0.000295625873437902, "loss": 0.0484, "step": 5780 }, { "epoch": 0.03, "learning_rate": 0.000295618305744888, "loss": 0.0468, "step": 5790 }, { "epoch": 0.03, "learning_rate": 0.000295610738051874, "loss": 0.0498, "step": 5800 }, { "epoch": 0.03, "learning_rate": 0.00029560317035885996, "loss": 0.0474, "step": 5810 }, { "epoch": 0.03, "learning_rate": 0.00029559560266584594, "loss": 0.045, "step": 5820 }, { "epoch": 0.03, "learning_rate": 0.0002955880349728319, "loss": 0.0471, "step": 5830 }, { "epoch": 0.03, "learning_rate": 0.00029558046727981796, "loss": 0.0414, "step": 5840 }, { "epoch": 0.03, "learning_rate": 0.00029557289958680394, "loss": 0.0423, "step": 5850 }, { "epoch": 0.03, "learning_rate": 0.0002955653318937899, "loss": 0.0437, "step": 5860 }, { "epoch": 0.03, "learning_rate": 0.0002955577642007759, "loss": 0.0409, "step": 5870 }, { "epoch": 0.03, "learning_rate": 0.0002955501965077619, "loss": 0.0462, "step": 5880 }, { "epoch": 0.03, "learning_rate": 0.00029554262881474787, "loss": 0.0426, "step": 5890 }, { "epoch": 0.03, "learning_rate": 0.00029553506112173385, "loss": 0.0413, "step": 5900 }, { "epoch": 0.03, "learning_rate": 0.0002955274934287199, "loss": 0.0397, "step": 5910 }, { "epoch": 0.03, "learning_rate": 0.00029551992573570587, "loss": 0.0427, "step": 5920 }, { "epoch": 0.03, "learning_rate": 0.00029551235804269185, "loss": 0.0414, "step": 5930 }, { "epoch": 0.03, "learning_rate": 0.00029550479034967783, "loss": 0.0402, "step": 5940 }, { "epoch": 0.03, "learning_rate": 0.0002954972226566638, "loss": 0.0468, "step": 5950 }, { "epoch": 0.03, "learning_rate": 0.0002954896549636498, "loss": 0.0353, "step": 5960 }, { "epoch": 0.03, "learning_rate": 0.00029548208727063583, "loss": 0.0466, "step": 5970 }, { "epoch": 0.03, "learning_rate": 0.0002954745195776218, "loss": 0.0469, "step": 5980 }, { "epoch": 0.03, "learning_rate": 0.0002954669518846078, "loss": 0.0437, "step": 5990 }, { "epoch": 0.03, "learning_rate": 0.00029545938419159377, "loss": 0.0402, "step": 6000 }, { "epoch": 0.03, "eval_cer": 0.9144964565985481, "eval_loss": 0.03346065431833267, "eval_runtime": 117.4862, "eval_samples_per_second": 17.023, "eval_steps_per_second": 4.256, "step": 6000 }, { "epoch": 0.03, "learning_rate": 0.00029545181649857975, "loss": 0.0513, "step": 6010 }, { "epoch": 0.03, "learning_rate": 0.00029544424880556574, "loss": 0.0432, "step": 6020 }, { "epoch": 0.03, "learning_rate": 0.0002954366811125517, "loss": 0.0466, "step": 6030 }, { "epoch": 0.03, "learning_rate": 0.00029542911341953775, "loss": 0.0424, "step": 6040 }, { "epoch": 0.03, "learning_rate": 0.00029542154572652373, "loss": 0.0389, "step": 6050 }, { "epoch": 0.03, "learning_rate": 0.0002954139780335097, "loss": 0.0377, "step": 6060 }, { "epoch": 0.03, "learning_rate": 0.0002954064103404957, "loss": 0.0425, "step": 6070 }, { "epoch": 0.03, "learning_rate": 0.0002953988426474817, "loss": 0.0406, "step": 6080 }, { "epoch": 0.03, "learning_rate": 0.00029539127495446766, "loss": 0.0465, "step": 6090 }, { "epoch": 0.03, "learning_rate": 0.0002953837072614537, "loss": 0.0463, "step": 6100 }, { "epoch": 0.03, "learning_rate": 0.0002953761395684397, "loss": 0.0954, "step": 6110 }, { "epoch": 0.03, "learning_rate": 0.00029536857187542566, "loss": 0.068, "step": 6120 }, { "epoch": 0.03, "learning_rate": 0.00029536100418241164, "loss": 0.0656, "step": 6130 }, { "epoch": 0.03, "learning_rate": 0.0002953534364893976, "loss": 0.066, "step": 6140 }, { "epoch": 0.03, "learning_rate": 0.0002953458687963836, "loss": 0.0541, "step": 6150 }, { "epoch": 0.03, "learning_rate": 0.00029533830110336964, "loss": 0.0574, "step": 6160 }, { "epoch": 0.03, "learning_rate": 0.0002953307334103556, "loss": 0.0532, "step": 6170 }, { "epoch": 0.03, "learning_rate": 0.0002953231657173416, "loss": 0.0622, "step": 6180 }, { "epoch": 0.03, "learning_rate": 0.0002953155980243276, "loss": 0.0538, "step": 6190 }, { "epoch": 0.03, "learning_rate": 0.00029530803033131356, "loss": 0.0555, "step": 6200 }, { "epoch": 0.03, "learning_rate": 0.00029530046263829955, "loss": 0.0598, "step": 6210 }, { "epoch": 0.03, "learning_rate": 0.0002952928949452855, "loss": 0.046, "step": 6220 }, { "epoch": 0.03, "learning_rate": 0.00029528532725227156, "loss": 0.0497, "step": 6230 }, { "epoch": 0.03, "learning_rate": 0.00029527775955925754, "loss": 0.0507, "step": 6240 }, { "epoch": 0.03, "learning_rate": 0.0002952701918662435, "loss": 0.0494, "step": 6250 }, { "epoch": 0.03, "learning_rate": 0.0002952626241732295, "loss": 0.0491, "step": 6260 }, { "epoch": 0.03, "learning_rate": 0.0002952550564802155, "loss": 0.0548, "step": 6270 }, { "epoch": 0.03, "learning_rate": 0.00029524748878720147, "loss": 0.0527, "step": 6280 }, { "epoch": 0.03, "learning_rate": 0.0002952399210941875, "loss": 0.0517, "step": 6290 }, { "epoch": 0.03, "learning_rate": 0.0002952323534011735, "loss": 0.0451, "step": 6300 }, { "epoch": 0.03, "learning_rate": 0.00029522478570815947, "loss": 0.0527, "step": 6310 }, { "epoch": 0.03, "learning_rate": 0.00029521721801514545, "loss": 0.0539, "step": 6320 }, { "epoch": 0.03, "learning_rate": 0.00029520965032213143, "loss": 0.0477, "step": 6330 }, { "epoch": 0.03, "learning_rate": 0.0002952020826291174, "loss": 0.0627, "step": 6340 }, { "epoch": 0.03, "learning_rate": 0.00029519451493610345, "loss": 0.0474, "step": 6350 }, { "epoch": 0.03, "learning_rate": 0.00029518694724308943, "loss": 0.0467, "step": 6360 }, { "epoch": 0.03, "learning_rate": 0.0002951793795500754, "loss": 0.0516, "step": 6370 }, { "epoch": 0.03, "learning_rate": 0.0002951718118570614, "loss": 0.0443, "step": 6380 }, { "epoch": 0.03, "learning_rate": 0.0002951642441640474, "loss": 0.048, "step": 6390 }, { "epoch": 0.03, "learning_rate": 0.00029515667647103336, "loss": 0.0481, "step": 6400 }, { "epoch": 0.03, "learning_rate": 0.00029514910877801934, "loss": 0.0468, "step": 6410 }, { "epoch": 0.03, "learning_rate": 0.00029514154108500537, "loss": 0.0453, "step": 6420 }, { "epoch": 0.03, "learning_rate": 0.00029513397339199135, "loss": 0.0819, "step": 6430 }, { "epoch": 0.03, "learning_rate": 0.00029512640569897734, "loss": 0.0532, "step": 6440 }, { "epoch": 0.03, "learning_rate": 0.0002951188380059633, "loss": 0.0467, "step": 6450 }, { "epoch": 0.03, "learning_rate": 0.0002951112703129493, "loss": 0.048, "step": 6460 }, { "epoch": 0.03, "learning_rate": 0.0002951037026199353, "loss": 0.0522, "step": 6470 }, { "epoch": 0.03, "learning_rate": 0.0002950961349269213, "loss": 0.0526, "step": 6480 }, { "epoch": 0.03, "learning_rate": 0.0002950885672339073, "loss": 0.0431, "step": 6490 }, { "epoch": 0.03, "learning_rate": 0.0002950809995408933, "loss": 0.0413, "step": 6500 }, { "epoch": 0.03, "learning_rate": 0.00029507343184787926, "loss": 0.0447, "step": 6510 }, { "epoch": 0.03, "learning_rate": 0.00029506586415486524, "loss": 0.0429, "step": 6520 }, { "epoch": 0.03, "learning_rate": 0.0002950582964618512, "loss": 0.0491, "step": 6530 }, { "epoch": 0.03, "learning_rate": 0.0002950507287688372, "loss": 0.0441, "step": 6540 }, { "epoch": 0.03, "learning_rate": 0.00029504316107582324, "loss": 0.047, "step": 6550 }, { "epoch": 0.03, "learning_rate": 0.0002950355933828092, "loss": 0.0478, "step": 6560 }, { "epoch": 0.03, "learning_rate": 0.0002950280256897952, "loss": 0.0459, "step": 6570 }, { "epoch": 0.03, "learning_rate": 0.0002950204579967812, "loss": 0.0422, "step": 6580 }, { "epoch": 0.03, "learning_rate": 0.00029501289030376717, "loss": 0.044, "step": 6590 }, { "epoch": 0.03, "learning_rate": 0.00029500532261075315, "loss": 0.0382, "step": 6600 }, { "epoch": 0.03, "learning_rate": 0.0002949977549177392, "loss": 0.0437, "step": 6610 }, { "epoch": 0.03, "learning_rate": 0.00029499018722472516, "loss": 0.0372, "step": 6620 }, { "epoch": 0.03, "learning_rate": 0.00029498261953171115, "loss": 0.0367, "step": 6630 }, { "epoch": 0.03, "learning_rate": 0.0002949750518386971, "loss": 0.0394, "step": 6640 }, { "epoch": 0.03, "learning_rate": 0.0002949674841456831, "loss": 0.0373, "step": 6650 }, { "epoch": 0.03, "learning_rate": 0.0002949599164526691, "loss": 0.0447, "step": 6660 }, { "epoch": 0.03, "learning_rate": 0.0002949523487596551, "loss": 0.0398, "step": 6670 }, { "epoch": 0.03, "learning_rate": 0.0002949447810666411, "loss": 0.0366, "step": 6680 }, { "epoch": 0.03, "learning_rate": 0.0002949372133736271, "loss": 0.0432, "step": 6690 }, { "epoch": 0.03, "learning_rate": 0.00029492964568061307, "loss": 0.0436, "step": 6700 }, { "epoch": 0.03, "learning_rate": 0.00029492207798759905, "loss": 0.0411, "step": 6710 }, { "epoch": 0.03, "learning_rate": 0.00029491451029458503, "loss": 0.0417, "step": 6720 }, { "epoch": 0.03, "learning_rate": 0.000294906942601571, "loss": 0.0432, "step": 6730 }, { "epoch": 0.03, "learning_rate": 0.00029489937490855705, "loss": 0.0392, "step": 6740 }, { "epoch": 0.03, "learning_rate": 0.00029489180721554303, "loss": 0.0403, "step": 6750 }, { "epoch": 0.03, "learning_rate": 0.000294884239522529, "loss": 0.0409, "step": 6760 }, { "epoch": 0.03, "learning_rate": 0.000294876671829515, "loss": 0.0413, "step": 6770 }, { "epoch": 0.03, "learning_rate": 0.000294869104136501, "loss": 0.0445, "step": 6780 }, { "epoch": 0.03, "learning_rate": 0.00029486153644348696, "loss": 0.0415, "step": 6790 }, { "epoch": 0.03, "learning_rate": 0.000294853968750473, "loss": 0.0381, "step": 6800 }, { "epoch": 0.03, "learning_rate": 0.000294846401057459, "loss": 0.042, "step": 6810 }, { "epoch": 0.03, "learning_rate": 0.00029483883336444496, "loss": 0.0454, "step": 6820 }, { "epoch": 0.03, "learning_rate": 0.00029483126567143094, "loss": 0.0434, "step": 6830 }, { "epoch": 0.03, "learning_rate": 0.0002948236979784169, "loss": 0.0438, "step": 6840 }, { "epoch": 0.03, "learning_rate": 0.0002948161302854029, "loss": 0.0494, "step": 6850 }, { "epoch": 0.03, "learning_rate": 0.00029480856259238894, "loss": 0.0552, "step": 6860 }, { "epoch": 0.03, "learning_rate": 0.0002948009948993749, "loss": 0.0457, "step": 6870 }, { "epoch": 0.03, "learning_rate": 0.0002947934272063609, "loss": 0.0391, "step": 6880 }, { "epoch": 0.03, "learning_rate": 0.0002947858595133469, "loss": 0.0444, "step": 6890 }, { "epoch": 0.03, "learning_rate": 0.00029477829182033286, "loss": 0.0453, "step": 6900 }, { "epoch": 0.03, "learning_rate": 0.00029477072412731884, "loss": 0.045, "step": 6910 }, { "epoch": 0.03, "learning_rate": 0.0002947631564343048, "loss": 0.0388, "step": 6920 }, { "epoch": 0.03, "learning_rate": 0.0002947555887412908, "loss": 0.0405, "step": 6930 }, { "epoch": 0.04, "learning_rate": 0.0002947480210482768, "loss": 0.0415, "step": 6940 }, { "epoch": 0.04, "learning_rate": 0.00029474045335526277, "loss": 0.0424, "step": 6950 }, { "epoch": 0.04, "learning_rate": 0.00029473288566224875, "loss": 0.0373, "step": 6960 }, { "epoch": 0.04, "learning_rate": 0.0002947253179692348, "loss": 0.0375, "step": 6970 }, { "epoch": 0.04, "learning_rate": 0.00029471775027622077, "loss": 0.0396, "step": 6980 }, { "epoch": 0.04, "learning_rate": 0.00029471018258320675, "loss": 0.0405, "step": 6990 }, { "epoch": 0.04, "learning_rate": 0.00029470261489019273, "loss": 0.0927, "step": 7000 }, { "epoch": 0.04, "eval_cer": 0.9144498775845288, "eval_loss": 0.03059179149568081, "eval_runtime": 117.5676, "eval_samples_per_second": 17.011, "eval_steps_per_second": 4.253, "step": 7000 }, { "epoch": 0.04, "learning_rate": 0.0002946950471971787, "loss": 0.0505, "step": 7010 }, { "epoch": 0.04, "learning_rate": 0.0002946874795041647, "loss": 0.0615, "step": 7020 }, { "epoch": 0.04, "learning_rate": 0.00029467991181115073, "loss": 0.0509, "step": 7030 }, { "epoch": 0.04, "learning_rate": 0.0002946723441181367, "loss": 0.0462, "step": 7040 }, { "epoch": 0.04, "learning_rate": 0.0002946647764251227, "loss": 0.0421, "step": 7050 }, { "epoch": 0.04, "learning_rate": 0.00029465720873210867, "loss": 0.0414, "step": 7060 }, { "epoch": 0.04, "learning_rate": 0.00029464964103909465, "loss": 0.0405, "step": 7070 }, { "epoch": 0.04, "learning_rate": 0.00029464207334608064, "loss": 0.0436, "step": 7080 }, { "epoch": 0.04, "learning_rate": 0.0002946345056530666, "loss": 0.0425, "step": 7090 }, { "epoch": 0.04, "learning_rate": 0.00029462693796005265, "loss": 0.0442, "step": 7100 }, { "epoch": 0.04, "learning_rate": 0.00029461937026703863, "loss": 0.0411, "step": 7110 }, { "epoch": 0.04, "learning_rate": 0.0002946118025740246, "loss": 0.0409, "step": 7120 }, { "epoch": 0.04, "learning_rate": 0.0002946042348810106, "loss": 0.0415, "step": 7130 }, { "epoch": 0.04, "learning_rate": 0.0002945966671879966, "loss": 0.0379, "step": 7140 }, { "epoch": 0.04, "learning_rate": 0.00029458909949498256, "loss": 0.0438, "step": 7150 }, { "epoch": 0.04, "learning_rate": 0.0002945815318019686, "loss": 0.0488, "step": 7160 }, { "epoch": 0.04, "learning_rate": 0.0002945739641089546, "loss": 0.0399, "step": 7170 }, { "epoch": 0.04, "learning_rate": 0.00029456639641594056, "loss": 0.0477, "step": 7180 }, { "epoch": 0.04, "learning_rate": 0.00029455882872292654, "loss": 0.0425, "step": 7190 }, { "epoch": 0.04, "learning_rate": 0.0002945512610299125, "loss": 0.0436, "step": 7200 }, { "epoch": 0.04, "learning_rate": 0.0002945436933368985, "loss": 0.0417, "step": 7210 }, { "epoch": 0.04, "learning_rate": 0.00029453612564388454, "loss": 0.0403, "step": 7220 }, { "epoch": 0.04, "learning_rate": 0.0002945285579508705, "loss": 0.0378, "step": 7230 }, { "epoch": 0.04, "learning_rate": 0.0002945209902578565, "loss": 0.045, "step": 7240 }, { "epoch": 0.04, "learning_rate": 0.0002945134225648425, "loss": 0.0385, "step": 7250 }, { "epoch": 0.04, "learning_rate": 0.00029450585487182846, "loss": 0.0402, "step": 7260 }, { "epoch": 0.04, "learning_rate": 0.00029449828717881445, "loss": 0.0473, "step": 7270 }, { "epoch": 0.04, "learning_rate": 0.0002944907194858004, "loss": 0.0433, "step": 7280 }, { "epoch": 0.04, "learning_rate": 0.00029448315179278646, "loss": 0.0402, "step": 7290 }, { "epoch": 0.04, "learning_rate": 0.00029447558409977244, "loss": 0.04, "step": 7300 }, { "epoch": 0.04, "learning_rate": 0.0002944680164067584, "loss": 0.0422, "step": 7310 }, { "epoch": 0.04, "learning_rate": 0.0002944604487137444, "loss": 0.043, "step": 7320 }, { "epoch": 0.04, "learning_rate": 0.0002944528810207304, "loss": 0.0423, "step": 7330 }, { "epoch": 0.04, "learning_rate": 0.00029444531332771637, "loss": 0.0394, "step": 7340 }, { "epoch": 0.04, "learning_rate": 0.0002944377456347024, "loss": 0.0409, "step": 7350 }, { "epoch": 0.04, "learning_rate": 0.0002944301779416884, "loss": 0.038, "step": 7360 }, { "epoch": 0.04, "learning_rate": 0.00029442261024867437, "loss": 0.0363, "step": 7370 }, { "epoch": 0.04, "learning_rate": 0.00029441504255566035, "loss": 0.0443, "step": 7380 }, { "epoch": 0.04, "learning_rate": 0.00029440747486264633, "loss": 0.0407, "step": 7390 }, { "epoch": 0.04, "learning_rate": 0.0002943999071696323, "loss": 0.0506, "step": 7400 }, { "epoch": 0.04, "learning_rate": 0.00029439233947661835, "loss": 0.0434, "step": 7410 }, { "epoch": 0.04, "learning_rate": 0.00029438477178360433, "loss": 0.0501, "step": 7420 }, { "epoch": 0.04, "learning_rate": 0.0002943772040905903, "loss": 0.05, "step": 7430 }, { "epoch": 0.04, "learning_rate": 0.0002943696363975763, "loss": 0.0444, "step": 7440 }, { "epoch": 0.04, "learning_rate": 0.0002943620687045623, "loss": 0.0354, "step": 7450 }, { "epoch": 0.04, "learning_rate": 0.00029435450101154826, "loss": 0.0387, "step": 7460 }, { "epoch": 0.04, "learning_rate": 0.00029434693331853424, "loss": 0.0454, "step": 7470 }, { "epoch": 0.04, "learning_rate": 0.00029433936562552027, "loss": 0.0397, "step": 7480 }, { "epoch": 0.04, "learning_rate": 0.00029433179793250625, "loss": 0.0448, "step": 7490 }, { "epoch": 0.04, "learning_rate": 0.00029432423023949224, "loss": 0.0408, "step": 7500 }, { "epoch": 0.04, "learning_rate": 0.0002943166625464782, "loss": 0.046, "step": 7510 }, { "epoch": 0.04, "learning_rate": 0.0002943090948534642, "loss": 0.0449, "step": 7520 }, { "epoch": 0.04, "learning_rate": 0.0002943015271604502, "loss": 0.0428, "step": 7530 }, { "epoch": 0.04, "learning_rate": 0.0002942939594674362, "loss": 0.04, "step": 7540 }, { "epoch": 0.04, "learning_rate": 0.0002942863917744222, "loss": 0.0422, "step": 7550 }, { "epoch": 0.04, "learning_rate": 0.0002942788240814082, "loss": 0.0374, "step": 7560 }, { "epoch": 0.04, "learning_rate": 0.00029427125638839416, "loss": 0.0432, "step": 7570 }, { "epoch": 0.04, "learning_rate": 0.00029426368869538014, "loss": 0.0425, "step": 7580 }, { "epoch": 0.04, "learning_rate": 0.0002942561210023661, "loss": 0.0372, "step": 7590 }, { "epoch": 0.04, "learning_rate": 0.0002942485533093521, "loss": 0.0396, "step": 7600 }, { "epoch": 0.04, "learning_rate": 0.00029424098561633814, "loss": 0.0368, "step": 7610 }, { "epoch": 0.04, "learning_rate": 0.0002942334179233241, "loss": 0.0451, "step": 7620 }, { "epoch": 0.04, "learning_rate": 0.0002942258502303101, "loss": 0.0437, "step": 7630 }, { "epoch": 0.04, "learning_rate": 0.0002942182825372961, "loss": 0.0516, "step": 7640 }, { "epoch": 0.04, "learning_rate": 0.00029421071484428207, "loss": 0.0346, "step": 7650 }, { "epoch": 0.04, "learning_rate": 0.00029420314715126805, "loss": 0.0381, "step": 7660 }, { "epoch": 0.04, "learning_rate": 0.0002941955794582541, "loss": 0.0469, "step": 7670 }, { "epoch": 0.04, "learning_rate": 0.00029418801176524006, "loss": 0.0404, "step": 7680 }, { "epoch": 0.04, "learning_rate": 0.00029418044407222605, "loss": 0.0437, "step": 7690 }, { "epoch": 0.04, "learning_rate": 0.000294172876379212, "loss": 0.0414, "step": 7700 }, { "epoch": 0.04, "learning_rate": 0.000294165308686198, "loss": 0.0486, "step": 7710 }, { "epoch": 0.04, "learning_rate": 0.000294157740993184, "loss": 0.0429, "step": 7720 }, { "epoch": 0.04, "learning_rate": 0.00029415017330017, "loss": 0.0445, "step": 7730 }, { "epoch": 0.04, "learning_rate": 0.000294142605607156, "loss": 0.0423, "step": 7740 }, { "epoch": 0.04, "learning_rate": 0.000294135037914142, "loss": 0.0376, "step": 7750 }, { "epoch": 0.04, "learning_rate": 0.00029412747022112797, "loss": 0.0449, "step": 7760 }, { "epoch": 0.04, "learning_rate": 0.00029411990252811395, "loss": 0.0464, "step": 7770 }, { "epoch": 0.04, "learning_rate": 0.00029411233483509993, "loss": 0.0354, "step": 7780 }, { "epoch": 0.04, "learning_rate": 0.0002941047671420859, "loss": 0.0362, "step": 7790 }, { "epoch": 0.04, "learning_rate": 0.00029409719944907195, "loss": 0.0384, "step": 7800 }, { "epoch": 0.04, "learning_rate": 0.00029408963175605793, "loss": 0.036, "step": 7810 }, { "epoch": 0.04, "learning_rate": 0.0002940820640630439, "loss": 0.0413, "step": 7820 }, { "epoch": 0.04, "learning_rate": 0.0002940744963700299, "loss": 0.0345, "step": 7830 }, { "epoch": 0.04, "learning_rate": 0.0002940669286770159, "loss": 0.0379, "step": 7840 }, { "epoch": 0.04, "learning_rate": 0.00029405936098400186, "loss": 0.0438, "step": 7850 }, { "epoch": 0.04, "learning_rate": 0.0002940517932909879, "loss": 0.0433, "step": 7860 }, { "epoch": 0.04, "learning_rate": 0.0002940442255979739, "loss": 0.0404, "step": 7870 }, { "epoch": 0.04, "learning_rate": 0.00029403665790495986, "loss": 0.0398, "step": 7880 }, { "epoch": 0.04, "learning_rate": 0.00029402909021194584, "loss": 0.0438, "step": 7890 }, { "epoch": 0.04, "learning_rate": 0.0002940215225189318, "loss": 0.0405, "step": 7900 }, { "epoch": 0.04, "learning_rate": 0.0002940139548259178, "loss": 0.0459, "step": 7910 }, { "epoch": 0.04, "learning_rate": 0.00029400638713290384, "loss": 0.049, "step": 7920 }, { "epoch": 0.04, "learning_rate": 0.0002939988194398898, "loss": 0.0392, "step": 7930 }, { "epoch": 0.04, "learning_rate": 0.0002939912517468758, "loss": 0.0387, "step": 7940 }, { "epoch": 0.04, "learning_rate": 0.0002939836840538618, "loss": 0.0401, "step": 7950 }, { "epoch": 0.04, "learning_rate": 0.00029397611636084776, "loss": 0.0488, "step": 7960 }, { "epoch": 0.04, "learning_rate": 0.00029396854866783374, "loss": 0.0453, "step": 7970 }, { "epoch": 0.04, "learning_rate": 0.0002939609809748197, "loss": 0.0404, "step": 7980 }, { "epoch": 0.04, "learning_rate": 0.00029395341328180576, "loss": 0.0408, "step": 7990 }, { "epoch": 0.04, "learning_rate": 0.00029394584558879174, "loss": 0.0365, "step": 8000 }, { "epoch": 0.04, "eval_cer": 0.9145313908590625, "eval_loss": 0.03206906095147133, "eval_runtime": 117.4386, "eval_samples_per_second": 17.03, "eval_steps_per_second": 4.258, "step": 8000 }, { "epoch": 0.04, "learning_rate": 0.0002939382778957777, "loss": 0.0413, "step": 8010 }, { "epoch": 0.04, "learning_rate": 0.0002939307102027637, "loss": 0.0405, "step": 8020 }, { "epoch": 0.04, "learning_rate": 0.0002939231425097497, "loss": 0.0403, "step": 8030 }, { "epoch": 0.04, "learning_rate": 0.00029391557481673567, "loss": 0.0382, "step": 8040 }, { "epoch": 0.04, "learning_rate": 0.0002939080071237217, "loss": 0.0399, "step": 8050 }, { "epoch": 0.04, "learning_rate": 0.0002939004394307077, "loss": 0.0431, "step": 8060 }, { "epoch": 0.04, "learning_rate": 0.00029389287173769367, "loss": 0.0478, "step": 8070 }, { "epoch": 0.04, "learning_rate": 0.00029388530404467965, "loss": 0.0366, "step": 8080 }, { "epoch": 0.04, "learning_rate": 0.00029387773635166563, "loss": 0.037, "step": 8090 }, { "epoch": 0.04, "learning_rate": 0.0002938701686586516, "loss": 0.0357, "step": 8100 }, { "epoch": 0.04, "learning_rate": 0.0002938626009656376, "loss": 0.0408, "step": 8110 }, { "epoch": 0.04, "learning_rate": 0.0002938550332726236, "loss": 0.0392, "step": 8120 }, { "epoch": 0.04, "learning_rate": 0.0002938474655796096, "loss": 0.0465, "step": 8130 }, { "epoch": 0.04, "learning_rate": 0.0002938398978865956, "loss": 0.0369, "step": 8140 }, { "epoch": 0.04, "learning_rate": 0.00029383233019358157, "loss": 0.0439, "step": 8150 }, { "epoch": 0.04, "learning_rate": 0.00029382476250056755, "loss": 0.0455, "step": 8160 }, { "epoch": 0.04, "learning_rate": 0.00029381719480755353, "loss": 0.0379, "step": 8170 }, { "epoch": 0.04, "learning_rate": 0.0002938096271145395, "loss": 0.0352, "step": 8180 }, { "epoch": 0.04, "learning_rate": 0.0002938020594215255, "loss": 0.0366, "step": 8190 }, { "epoch": 0.04, "learning_rate": 0.0002937944917285115, "loss": 0.04, "step": 8200 }, { "epoch": 0.04, "learning_rate": 0.00029378692403549746, "loss": 0.0367, "step": 8210 }, { "epoch": 0.04, "learning_rate": 0.0002937793563424835, "loss": 0.0417, "step": 8220 }, { "epoch": 0.04, "learning_rate": 0.0002937717886494695, "loss": 0.0412, "step": 8230 }, { "epoch": 0.04, "learning_rate": 0.00029376422095645546, "loss": 0.0383, "step": 8240 }, { "epoch": 0.04, "learning_rate": 0.00029375665326344144, "loss": 0.0383, "step": 8250 }, { "epoch": 0.04, "learning_rate": 0.0002937490855704274, "loss": 0.0386, "step": 8260 }, { "epoch": 0.04, "learning_rate": 0.0002937415178774134, "loss": 0.041, "step": 8270 }, { "epoch": 0.04, "learning_rate": 0.00029373395018439944, "loss": 0.0444, "step": 8280 }, { "epoch": 0.04, "learning_rate": 0.0002937263824913854, "loss": 0.0399, "step": 8290 }, { "epoch": 0.04, "learning_rate": 0.0002937188147983714, "loss": 0.0458, "step": 8300 }, { "epoch": 0.04, "learning_rate": 0.0002937112471053574, "loss": 0.036, "step": 8310 }, { "epoch": 0.04, "learning_rate": 0.00029370367941234336, "loss": 0.0409, "step": 8320 }, { "epoch": 0.04, "learning_rate": 0.00029369611171932935, "loss": 0.0406, "step": 8330 }, { "epoch": 0.04, "learning_rate": 0.00029368854402631533, "loss": 0.0401, "step": 8340 }, { "epoch": 0.04, "learning_rate": 0.00029368097633330136, "loss": 0.0408, "step": 8350 }, { "epoch": 0.04, "learning_rate": 0.00029367340864028734, "loss": 0.035, "step": 8360 }, { "epoch": 0.04, "learning_rate": 0.0002936658409472733, "loss": 0.0411, "step": 8370 }, { "epoch": 0.04, "learning_rate": 0.0002936582732542593, "loss": 0.0472, "step": 8380 }, { "epoch": 0.04, "learning_rate": 0.0002936507055612453, "loss": 0.0372, "step": 8390 }, { "epoch": 0.04, "learning_rate": 0.00029364313786823127, "loss": 0.0366, "step": 8400 }, { "epoch": 0.04, "learning_rate": 0.0002936355701752173, "loss": 0.0368, "step": 8410 }, { "epoch": 0.04, "learning_rate": 0.0002936280024822033, "loss": 0.0372, "step": 8420 }, { "epoch": 0.04, "learning_rate": 0.00029362043478918927, "loss": 0.0373, "step": 8430 }, { "epoch": 0.04, "learning_rate": 0.00029361286709617525, "loss": 0.0376, "step": 8440 }, { "epoch": 0.04, "learning_rate": 0.00029360529940316123, "loss": 0.0405, "step": 8450 }, { "epoch": 0.04, "learning_rate": 0.0002935977317101472, "loss": 0.0445, "step": 8460 }, { "epoch": 0.04, "learning_rate": 0.00029359016401713325, "loss": 0.1198, "step": 8470 }, { "epoch": 0.04, "learning_rate": 0.00029358259632411923, "loss": 0.0436, "step": 8480 }, { "epoch": 0.04, "learning_rate": 0.0002935750286311052, "loss": 0.0414, "step": 8490 }, { "epoch": 0.04, "learning_rate": 0.0002935674609380912, "loss": 0.0396, "step": 8500 }, { "epoch": 0.04, "learning_rate": 0.0002935598932450772, "loss": 0.0366, "step": 8510 }, { "epoch": 0.04, "learning_rate": 0.00029355232555206316, "loss": 0.0383, "step": 8520 }, { "epoch": 0.04, "learning_rate": 0.00029354475785904914, "loss": 0.0715, "step": 8530 }, { "epoch": 0.04, "learning_rate": 0.0002935371901660352, "loss": 0.067, "step": 8540 }, { "epoch": 0.04, "learning_rate": 0.00029352962247302115, "loss": 0.0371, "step": 8550 }, { "epoch": 0.04, "learning_rate": 0.00029352205478000714, "loss": 0.0326, "step": 8560 }, { "epoch": 0.04, "learning_rate": 0.0002935144870869931, "loss": 0.0439, "step": 8570 }, { "epoch": 0.04, "learning_rate": 0.0002935069193939791, "loss": 0.0387, "step": 8580 }, { "epoch": 0.04, "learning_rate": 0.0002934993517009651, "loss": 0.0407, "step": 8590 }, { "epoch": 0.04, "learning_rate": 0.0002934917840079511, "loss": 0.0378, "step": 8600 }, { "epoch": 0.04, "learning_rate": 0.0002934842163149371, "loss": 0.0389, "step": 8610 }, { "epoch": 0.04, "learning_rate": 0.0002934766486219231, "loss": 0.0462, "step": 8620 }, { "epoch": 0.04, "learning_rate": 0.00029346908092890906, "loss": 0.0362, "step": 8630 }, { "epoch": 0.04, "learning_rate": 0.00029346151323589504, "loss": 0.0355, "step": 8640 }, { "epoch": 0.04, "learning_rate": 0.000293453945542881, "loss": 0.0501, "step": 8650 }, { "epoch": 0.04, "learning_rate": 0.000293446377849867, "loss": 0.0372, "step": 8660 }, { "epoch": 0.04, "learning_rate": 0.00029343881015685304, "loss": 0.047, "step": 8670 }, { "epoch": 0.04, "learning_rate": 0.000293431242463839, "loss": 0.0424, "step": 8680 }, { "epoch": 0.04, "learning_rate": 0.000293423674770825, "loss": 0.0412, "step": 8690 }, { "epoch": 0.04, "learning_rate": 0.000293416107077811, "loss": 0.0422, "step": 8700 }, { "epoch": 0.04, "learning_rate": 0.00029340853938479697, "loss": 0.0416, "step": 8710 }, { "epoch": 0.04, "learning_rate": 0.00029340097169178295, "loss": 0.0439, "step": 8720 }, { "epoch": 0.04, "learning_rate": 0.000293393403998769, "loss": 0.0432, "step": 8730 }, { "epoch": 0.04, "learning_rate": 0.00029338583630575496, "loss": 0.049, "step": 8740 }, { "epoch": 0.04, "learning_rate": 0.00029337826861274095, "loss": 0.0852, "step": 8750 }, { "epoch": 0.04, "learning_rate": 0.00029337070091972693, "loss": 0.0452, "step": 8760 }, { "epoch": 0.04, "learning_rate": 0.0002933631332267129, "loss": 0.0722, "step": 8770 }, { "epoch": 0.04, "learning_rate": 0.0002933555655336989, "loss": 0.0839, "step": 8780 }, { "epoch": 0.04, "learning_rate": 0.0002933479978406849, "loss": 0.0442, "step": 8790 }, { "epoch": 0.04, "learning_rate": 0.0002933404301476709, "loss": 0.044, "step": 8800 }, { "epoch": 0.04, "learning_rate": 0.0002933328624546569, "loss": 0.041, "step": 8810 }, { "epoch": 0.04, "learning_rate": 0.00029332529476164287, "loss": 0.0471, "step": 8820 }, { "epoch": 0.04, "learning_rate": 0.00029331772706862885, "loss": 0.037, "step": 8830 }, { "epoch": 0.04, "learning_rate": 0.00029331015937561483, "loss": 0.0418, "step": 8840 }, { "epoch": 0.04, "learning_rate": 0.0002933025916826008, "loss": 0.0411, "step": 8850 }, { "epoch": 0.04, "learning_rate": 0.00029329502398958685, "loss": 0.0448, "step": 8860 }, { "epoch": 0.04, "learning_rate": 0.00029328745629657283, "loss": 0.0363, "step": 8870 }, { "epoch": 0.04, "learning_rate": 0.0002932798886035588, "loss": 0.0438, "step": 8880 }, { "epoch": 0.04, "learning_rate": 0.0002932723209105448, "loss": 0.0372, "step": 8890 }, { "epoch": 0.04, "learning_rate": 0.0002932647532175308, "loss": 0.0423, "step": 8900 }, { "epoch": 0.04, "learning_rate": 0.00029325718552451676, "loss": 0.0412, "step": 8910 }, { "epoch": 0.05, "learning_rate": 0.0002932496178315028, "loss": 0.0338, "step": 8920 }, { "epoch": 0.05, "learning_rate": 0.0002932420501384888, "loss": 0.0347, "step": 8930 }, { "epoch": 0.05, "learning_rate": 0.00029323448244547476, "loss": 0.0444, "step": 8940 }, { "epoch": 0.05, "learning_rate": 0.00029322691475246074, "loss": 0.0343, "step": 8950 }, { "epoch": 0.05, "learning_rate": 0.0002932193470594467, "loss": 0.0437, "step": 8960 }, { "epoch": 0.05, "learning_rate": 0.0002932117793664327, "loss": 0.04, "step": 8970 }, { "epoch": 0.05, "learning_rate": 0.00029320421167341874, "loss": 0.0405, "step": 8980 }, { "epoch": 0.05, "learning_rate": 0.0002931966439804047, "loss": 0.0338, "step": 8990 }, { "epoch": 0.05, "learning_rate": 0.0002931890762873907, "loss": 0.043, "step": 9000 }, { "epoch": 0.05, "eval_cer": 0.9145352724435641, "eval_loss": 0.03075648657977581, "eval_runtime": 117.5474, "eval_samples_per_second": 17.014, "eval_steps_per_second": 4.254, "step": 9000 }, { "epoch": 0.05, "learning_rate": 0.0002931815085943767, "loss": 0.0435, "step": 9010 }, { "epoch": 0.05, "learning_rate": 0.00029317394090136266, "loss": 0.0368, "step": 9020 }, { "epoch": 0.05, "learning_rate": 0.00029316637320834864, "loss": 0.0428, "step": 9030 }, { "epoch": 0.05, "learning_rate": 0.0002931588055153346, "loss": 0.0391, "step": 9040 }, { "epoch": 0.05, "learning_rate": 0.00029315123782232066, "loss": 0.0364, "step": 9050 }, { "epoch": 0.05, "learning_rate": 0.00029314367012930664, "loss": 0.0351, "step": 9060 }, { "epoch": 0.05, "learning_rate": 0.0002931361024362926, "loss": 0.0363, "step": 9070 }, { "epoch": 0.05, "learning_rate": 0.0002931285347432786, "loss": 0.0389, "step": 9080 }, { "epoch": 0.05, "learning_rate": 0.0002931209670502646, "loss": 0.0447, "step": 9090 }, { "epoch": 0.05, "learning_rate": 0.00029311339935725057, "loss": 0.0385, "step": 9100 }, { "epoch": 0.05, "learning_rate": 0.0002931058316642366, "loss": 0.0429, "step": 9110 }, { "epoch": 0.05, "learning_rate": 0.0002930982639712226, "loss": 0.0399, "step": 9120 }, { "epoch": 0.05, "learning_rate": 0.00029309069627820857, "loss": 0.0383, "step": 9130 }, { "epoch": 0.05, "learning_rate": 0.00029308312858519455, "loss": 0.0303, "step": 9140 }, { "epoch": 0.05, "learning_rate": 0.00029307556089218053, "loss": 0.042, "step": 9150 }, { "epoch": 0.05, "learning_rate": 0.0002930679931991665, "loss": 0.0415, "step": 9160 }, { "epoch": 0.05, "learning_rate": 0.0002930604255061525, "loss": 0.038, "step": 9170 }, { "epoch": 0.05, "learning_rate": 0.00029305285781313853, "loss": 0.0375, "step": 9180 }, { "epoch": 0.05, "learning_rate": 0.0002930452901201245, "loss": 0.0364, "step": 9190 }, { "epoch": 0.05, "learning_rate": 0.0002930377224271105, "loss": 0.0377, "step": 9200 }, { "epoch": 0.05, "learning_rate": 0.00029303015473409647, "loss": 0.0382, "step": 9210 }, { "epoch": 0.05, "learning_rate": 0.00029302258704108245, "loss": 0.0425, "step": 9220 }, { "epoch": 0.05, "learning_rate": 0.00029301501934806843, "loss": 0.0377, "step": 9230 }, { "epoch": 0.05, "learning_rate": 0.00029300745165505447, "loss": 0.0442, "step": 9240 }, { "epoch": 0.05, "learning_rate": 0.00029299988396204045, "loss": 0.0396, "step": 9250 }, { "epoch": 0.05, "learning_rate": 0.00029299231626902643, "loss": 0.0383, "step": 9260 }, { "epoch": 0.05, "learning_rate": 0.0002929847485760124, "loss": 0.0436, "step": 9270 }, { "epoch": 0.05, "learning_rate": 0.0002929771808829984, "loss": 0.0385, "step": 9280 }, { "epoch": 0.05, "learning_rate": 0.0002929696131899844, "loss": 0.0407, "step": 9290 }, { "epoch": 0.05, "learning_rate": 0.0002929620454969704, "loss": 0.0399, "step": 9300 }, { "epoch": 0.05, "learning_rate": 0.0002929544778039564, "loss": 0.0396, "step": 9310 }, { "epoch": 0.05, "learning_rate": 0.0002929469101109424, "loss": 0.0334, "step": 9320 }, { "epoch": 0.05, "learning_rate": 0.00029293934241792836, "loss": 0.0379, "step": 9330 }, { "epoch": 0.05, "learning_rate": 0.00029293177472491434, "loss": 0.034, "step": 9340 }, { "epoch": 0.05, "learning_rate": 0.0002929242070319003, "loss": 0.0384, "step": 9350 }, { "epoch": 0.05, "learning_rate": 0.0002929166393388863, "loss": 0.0372, "step": 9360 }, { "epoch": 0.05, "learning_rate": 0.00029290907164587234, "loss": 0.0371, "step": 9370 }, { "epoch": 0.05, "learning_rate": 0.0002929015039528583, "loss": 0.0378, "step": 9380 }, { "epoch": 0.05, "learning_rate": 0.0002928939362598443, "loss": 0.0362, "step": 9390 }, { "epoch": 0.05, "learning_rate": 0.0002928863685668303, "loss": 0.0385, "step": 9400 }, { "epoch": 0.05, "learning_rate": 0.00029287880087381626, "loss": 0.0355, "step": 9410 }, { "epoch": 0.05, "learning_rate": 0.00029287123318080224, "loss": 0.0418, "step": 9420 }, { "epoch": 0.05, "learning_rate": 0.0002928636654877882, "loss": 0.0369, "step": 9430 }, { "epoch": 0.05, "learning_rate": 0.0002928560977947742, "loss": 0.0423, "step": 9440 }, { "epoch": 0.05, "learning_rate": 0.0002928485301017602, "loss": 0.0349, "step": 9450 }, { "epoch": 0.05, "learning_rate": 0.00029284096240874617, "loss": 0.0379, "step": 9460 }, { "epoch": 0.05, "learning_rate": 0.0002928333947157322, "loss": 0.0444, "step": 9470 }, { "epoch": 0.05, "learning_rate": 0.0002928258270227182, "loss": 0.0357, "step": 9480 }, { "epoch": 0.05, "learning_rate": 0.00029281825932970417, "loss": 0.0495, "step": 9490 }, { "epoch": 0.05, "learning_rate": 0.00029281069163669015, "loss": 0.0384, "step": 9500 }, { "epoch": 0.05, "learning_rate": 0.00029280312394367613, "loss": 0.0448, "step": 9510 }, { "epoch": 0.05, "learning_rate": 0.0002927955562506621, "loss": 0.0382, "step": 9520 }, { "epoch": 0.05, "learning_rate": 0.00029278798855764815, "loss": 0.0397, "step": 9530 }, { "epoch": 0.05, "learning_rate": 0.00029278042086463413, "loss": 0.0354, "step": 9540 }, { "epoch": 0.05, "learning_rate": 0.0002927728531716201, "loss": 0.042, "step": 9550 }, { "epoch": 0.05, "learning_rate": 0.0002927652854786061, "loss": 0.0458, "step": 9560 }, { "epoch": 0.05, "learning_rate": 0.0002927577177855921, "loss": 0.0349, "step": 9570 }, { "epoch": 0.05, "learning_rate": 0.00029275015009257806, "loss": 0.0386, "step": 9580 }, { "epoch": 0.05, "learning_rate": 0.00029274258239956404, "loss": 0.0407, "step": 9590 }, { "epoch": 0.05, "learning_rate": 0.0002927350147065501, "loss": 0.0397, "step": 9600 }, { "epoch": 0.05, "learning_rate": 0.00029272744701353605, "loss": 0.0394, "step": 9610 }, { "epoch": 0.05, "learning_rate": 0.00029271987932052204, "loss": 0.043, "step": 9620 }, { "epoch": 0.05, "learning_rate": 0.000292712311627508, "loss": 0.0395, "step": 9630 }, { "epoch": 0.05, "learning_rate": 0.000292704743934494, "loss": 0.0401, "step": 9640 }, { "epoch": 0.05, "learning_rate": 0.00029269717624148, "loss": 0.0418, "step": 9650 }, { "epoch": 0.05, "learning_rate": 0.000292689608548466, "loss": 0.0458, "step": 9660 }, { "epoch": 0.05, "learning_rate": 0.000292682040855452, "loss": 0.0492, "step": 9670 }, { "epoch": 0.05, "learning_rate": 0.000292674473162438, "loss": 0.0372, "step": 9680 }, { "epoch": 0.05, "learning_rate": 0.00029266690546942396, "loss": 0.0358, "step": 9690 }, { "epoch": 0.05, "learning_rate": 0.00029265933777640994, "loss": 0.0515, "step": 9700 }, { "epoch": 0.05, "learning_rate": 0.0002926517700833959, "loss": 0.0445, "step": 9710 }, { "epoch": 0.05, "learning_rate": 0.00029264420239038196, "loss": 0.0406, "step": 9720 }, { "epoch": 0.05, "learning_rate": 0.00029263663469736794, "loss": 0.0414, "step": 9730 }, { "epoch": 0.05, "learning_rate": 0.0002926290670043539, "loss": 0.0355, "step": 9740 }, { "epoch": 0.05, "learning_rate": 0.0002926214993113399, "loss": 0.0383, "step": 9750 }, { "epoch": 0.05, "learning_rate": 0.0002926139316183259, "loss": 0.0398, "step": 9760 }, { "epoch": 0.05, "learning_rate": 0.00029260636392531187, "loss": 0.0456, "step": 9770 }, { "epoch": 0.05, "learning_rate": 0.00029259879623229785, "loss": 0.0414, "step": 9780 }, { "epoch": 0.05, "learning_rate": 0.0002925912285392839, "loss": 0.0428, "step": 9790 }, { "epoch": 0.05, "learning_rate": 0.00029258366084626986, "loss": 0.038, "step": 9800 }, { "epoch": 0.05, "learning_rate": 0.00029257609315325585, "loss": 0.0365, "step": 9810 }, { "epoch": 0.05, "learning_rate": 0.00029256852546024183, "loss": 0.0341, "step": 9820 }, { "epoch": 0.05, "learning_rate": 0.0002925609577672278, "loss": 0.0397, "step": 9830 }, { "epoch": 0.05, "learning_rate": 0.0002925533900742138, "loss": 0.0363, "step": 9840 }, { "epoch": 0.05, "learning_rate": 0.0002925458223811998, "loss": 0.0411, "step": 9850 }, { "epoch": 0.05, "learning_rate": 0.0002925382546881858, "loss": 0.039, "step": 9860 }, { "epoch": 0.05, "learning_rate": 0.0002925306869951718, "loss": 0.0385, "step": 9870 }, { "epoch": 0.05, "learning_rate": 0.00029252311930215777, "loss": 0.0349, "step": 9880 }, { "epoch": 0.05, "learning_rate": 0.00029251555160914375, "loss": 0.0366, "step": 9890 }, { "epoch": 0.05, "learning_rate": 0.00029250798391612973, "loss": 0.0343, "step": 9900 }, { "epoch": 0.05, "learning_rate": 0.0002925004162231157, "loss": 0.0382, "step": 9910 }, { "epoch": 0.05, "learning_rate": 0.00029249284853010175, "loss": 0.036, "step": 9920 }, { "epoch": 0.05, "learning_rate": 0.00029248528083708773, "loss": 0.0409, "step": 9930 }, { "epoch": 0.05, "learning_rate": 0.0002924777131440737, "loss": 0.0425, "step": 9940 }, { "epoch": 0.05, "learning_rate": 0.0002924701454510597, "loss": 0.0364, "step": 9950 }, { "epoch": 0.05, "learning_rate": 0.0002924625777580457, "loss": 0.0376, "step": 9960 }, { "epoch": 0.05, "learning_rate": 0.00029245501006503166, "loss": 0.038, "step": 9970 }, { "epoch": 0.05, "learning_rate": 0.0002924474423720177, "loss": 0.0385, "step": 9980 }, { "epoch": 0.05, "learning_rate": 0.0002924398746790037, "loss": 0.0304, "step": 9990 }, { "epoch": 0.05, "learning_rate": 0.00029243230698598966, "loss": 0.0413, "step": 10000 }, { "epoch": 0.05, "eval_cer": 0.9145003381830497, "eval_loss": 0.02770831808447838, "eval_runtime": 117.615, "eval_samples_per_second": 17.005, "eval_steps_per_second": 4.251, "step": 10000 }, { "epoch": 0.05, "learning_rate": 0.00029242473929297564, "loss": 0.0328, "step": 10010 }, { "epoch": 0.05, "learning_rate": 0.0002924171715999616, "loss": 0.0358, "step": 10020 }, { "epoch": 0.05, "learning_rate": 0.0002924096039069476, "loss": 0.0386, "step": 10030 }, { "epoch": 0.05, "learning_rate": 0.00029240203621393364, "loss": 0.0341, "step": 10040 }, { "epoch": 0.05, "learning_rate": 0.0002923944685209196, "loss": 0.036, "step": 10050 }, { "epoch": 0.05, "learning_rate": 0.0002923869008279056, "loss": 0.046, "step": 10060 }, { "epoch": 0.05, "learning_rate": 0.0002923793331348916, "loss": 0.0378, "step": 10070 }, { "epoch": 0.05, "learning_rate": 0.00029237176544187756, "loss": 0.039, "step": 10080 }, { "epoch": 0.05, "learning_rate": 0.00029236419774886354, "loss": 0.0352, "step": 10090 }, { "epoch": 0.05, "learning_rate": 0.0002923566300558495, "loss": 0.0363, "step": 10100 }, { "epoch": 0.05, "learning_rate": 0.00029234906236283556, "loss": 0.039, "step": 10110 }, { "epoch": 0.05, "learning_rate": 0.00029234149466982154, "loss": 0.0353, "step": 10120 }, { "epoch": 0.05, "learning_rate": 0.0002923339269768075, "loss": 0.0336, "step": 10130 }, { "epoch": 0.05, "learning_rate": 0.0002923263592837935, "loss": 0.0427, "step": 10140 }, { "epoch": 0.05, "learning_rate": 0.0002923187915907795, "loss": 0.0359, "step": 10150 }, { "epoch": 0.05, "learning_rate": 0.00029231122389776547, "loss": 0.0366, "step": 10160 }, { "epoch": 0.05, "learning_rate": 0.0002923036562047515, "loss": 0.0341, "step": 10170 }, { "epoch": 0.05, "learning_rate": 0.0002922960885117375, "loss": 0.0412, "step": 10180 }, { "epoch": 0.05, "learning_rate": 0.00029228852081872347, "loss": 0.0317, "step": 10190 }, { "epoch": 0.05, "learning_rate": 0.00029228095312570945, "loss": 0.0363, "step": 10200 }, { "epoch": 0.05, "learning_rate": 0.00029227338543269543, "loss": 0.0357, "step": 10210 }, { "epoch": 0.05, "learning_rate": 0.0002922658177396814, "loss": 0.0333, "step": 10220 }, { "epoch": 0.05, "learning_rate": 0.00029225825004666745, "loss": 0.0419, "step": 10230 }, { "epoch": 0.05, "learning_rate": 0.00029225068235365343, "loss": 0.0327, "step": 10240 }, { "epoch": 0.05, "learning_rate": 0.0002922431146606394, "loss": 0.0337, "step": 10250 }, { "epoch": 0.05, "learning_rate": 0.0002922355469676254, "loss": 0.0386, "step": 10260 }, { "epoch": 0.05, "learning_rate": 0.00029222797927461137, "loss": 0.0347, "step": 10270 }, { "epoch": 0.05, "learning_rate": 0.00029222041158159735, "loss": 0.035, "step": 10280 }, { "epoch": 0.05, "learning_rate": 0.00029221284388858333, "loss": 0.0343, "step": 10290 }, { "epoch": 0.05, "learning_rate": 0.00029220527619556937, "loss": 0.0481, "step": 10300 }, { "epoch": 0.05, "learning_rate": 0.00029219770850255535, "loss": 0.0382, "step": 10310 }, { "epoch": 0.05, "learning_rate": 0.00029219014080954133, "loss": 0.0358, "step": 10320 }, { "epoch": 0.05, "learning_rate": 0.0002921825731165273, "loss": 0.0422, "step": 10330 }, { "epoch": 0.05, "learning_rate": 0.0002921750054235133, "loss": 0.0343, "step": 10340 }, { "epoch": 0.05, "learning_rate": 0.0002921674377304993, "loss": 0.046, "step": 10350 }, { "epoch": 0.05, "learning_rate": 0.0002921598700374853, "loss": 0.0407, "step": 10360 }, { "epoch": 0.05, "learning_rate": 0.0002921523023444713, "loss": 0.0364, "step": 10370 }, { "epoch": 0.05, "learning_rate": 0.0002921447346514573, "loss": 0.0349, "step": 10380 }, { "epoch": 0.05, "learning_rate": 0.00029213716695844326, "loss": 0.0338, "step": 10390 }, { "epoch": 0.05, "learning_rate": 0.00029212959926542924, "loss": 0.0333, "step": 10400 }, { "epoch": 0.05, "learning_rate": 0.0002921220315724152, "loss": 0.0347, "step": 10410 }, { "epoch": 0.05, "learning_rate": 0.0002921144638794012, "loss": 0.0357, "step": 10420 }, { "epoch": 0.05, "learning_rate": 0.00029210689618638724, "loss": 0.0351, "step": 10430 }, { "epoch": 0.05, "learning_rate": 0.0002920993284933732, "loss": 0.0356, "step": 10440 }, { "epoch": 0.05, "learning_rate": 0.0002920917608003592, "loss": 0.0394, "step": 10450 }, { "epoch": 0.05, "learning_rate": 0.0002920841931073452, "loss": 0.0376, "step": 10460 }, { "epoch": 0.05, "learning_rate": 0.00029207662541433116, "loss": 0.0374, "step": 10470 }, { "epoch": 0.05, "learning_rate": 0.00029206905772131714, "loss": 0.0333, "step": 10480 }, { "epoch": 0.05, "learning_rate": 0.0002920614900283032, "loss": 0.0313, "step": 10490 }, { "epoch": 0.05, "learning_rate": 0.00029205392233528916, "loss": 0.0328, "step": 10500 }, { "epoch": 0.05, "learning_rate": 0.00029204635464227514, "loss": 0.0339, "step": 10510 }, { "epoch": 0.05, "learning_rate": 0.0002920387869492611, "loss": 0.03, "step": 10520 }, { "epoch": 0.05, "learning_rate": 0.0002920312192562471, "loss": 0.0353, "step": 10530 }, { "epoch": 0.05, "learning_rate": 0.0002920236515632331, "loss": 0.035, "step": 10540 }, { "epoch": 0.05, "learning_rate": 0.0002920160838702191, "loss": 0.0311, "step": 10550 }, { "epoch": 0.05, "learning_rate": 0.0002920085161772051, "loss": 0.0359, "step": 10560 }, { "epoch": 0.05, "learning_rate": 0.0002920009484841911, "loss": 0.0373, "step": 10570 }, { "epoch": 0.05, "learning_rate": 0.00029199338079117707, "loss": 0.0408, "step": 10580 }, { "epoch": 0.05, "learning_rate": 0.00029198581309816305, "loss": 0.0406, "step": 10590 }, { "epoch": 0.05, "learning_rate": 0.00029197824540514903, "loss": 0.039, "step": 10600 }, { "epoch": 0.05, "learning_rate": 0.000291970677712135, "loss": 0.0318, "step": 10610 }, { "epoch": 0.05, "learning_rate": 0.00029196311001912105, "loss": 0.0357, "step": 10620 }, { "epoch": 0.05, "learning_rate": 0.00029195554232610703, "loss": 0.0354, "step": 10630 }, { "epoch": 0.05, "learning_rate": 0.000291947974633093, "loss": 0.0331, "step": 10640 }, { "epoch": 0.05, "learning_rate": 0.000291940406940079, "loss": 0.0322, "step": 10650 }, { "epoch": 0.05, "learning_rate": 0.000291932839247065, "loss": 0.0391, "step": 10660 }, { "epoch": 0.05, "learning_rate": 0.00029192527155405095, "loss": 0.0352, "step": 10670 }, { "epoch": 0.05, "learning_rate": 0.000291917703861037, "loss": 0.0335, "step": 10680 }, { "epoch": 0.05, "learning_rate": 0.0002919101361680229, "loss": 0.0336, "step": 10690 }, { "epoch": 0.05, "learning_rate": 0.0002919025684750089, "loss": 0.0392, "step": 10700 }, { "epoch": 0.05, "learning_rate": 0.0002918950007819949, "loss": 0.0347, "step": 10710 }, { "epoch": 0.05, "learning_rate": 0.0002918874330889809, "loss": 0.0386, "step": 10720 }, { "epoch": 0.05, "learning_rate": 0.0002918798653959669, "loss": 0.037, "step": 10730 }, { "epoch": 0.05, "learning_rate": 0.0002918722977029529, "loss": 0.042, "step": 10740 }, { "epoch": 0.05, "learning_rate": 0.00029186473000993886, "loss": 0.0359, "step": 10750 }, { "epoch": 0.05, "learning_rate": 0.00029185716231692484, "loss": 0.0392, "step": 10760 }, { "epoch": 0.05, "learning_rate": 0.0002918495946239108, "loss": 0.0366, "step": 10770 }, { "epoch": 0.05, "learning_rate": 0.00029184202693089686, "loss": 0.0351, "step": 10780 }, { "epoch": 0.05, "learning_rate": 0.00029183445923788284, "loss": 0.0386, "step": 10790 }, { "epoch": 0.05, "learning_rate": 0.0002918268915448688, "loss": 0.0321, "step": 10800 }, { "epoch": 0.05, "learning_rate": 0.0002918193238518548, "loss": 0.0346, "step": 10810 }, { "epoch": 0.05, "learning_rate": 0.0002918117561588408, "loss": 0.0375, "step": 10820 }, { "epoch": 0.05, "learning_rate": 0.00029180418846582677, "loss": 0.0344, "step": 10830 }, { "epoch": 0.05, "learning_rate": 0.00029179662077281275, "loss": 0.036, "step": 10840 }, { "epoch": 0.05, "learning_rate": 0.0002917890530797988, "loss": 0.0319, "step": 10850 }, { "epoch": 0.05, "learning_rate": 0.00029178148538678476, "loss": 0.0333, "step": 10860 }, { "epoch": 0.05, "learning_rate": 0.00029177391769377075, "loss": 0.0359, "step": 10870 }, { "epoch": 0.05, "learning_rate": 0.00029176635000075673, "loss": 0.0368, "step": 10880 }, { "epoch": 0.05, "learning_rate": 0.0002917587823077427, "loss": 0.0322, "step": 10890 }, { "epoch": 0.05, "learning_rate": 0.0002917512146147287, "loss": 0.0395, "step": 10900 }, { "epoch": 0.06, "learning_rate": 0.0002917436469217147, "loss": 0.0388, "step": 10910 }, { "epoch": 0.06, "learning_rate": 0.0002917360792287007, "loss": 0.0349, "step": 10920 }, { "epoch": 0.06, "learning_rate": 0.0002917285115356867, "loss": 0.0386, "step": 10930 }, { "epoch": 0.06, "learning_rate": 0.00029172094384267267, "loss": 0.0409, "step": 10940 }, { "epoch": 0.06, "learning_rate": 0.00029171337614965865, "loss": 0.0367, "step": 10950 }, { "epoch": 0.06, "learning_rate": 0.00029170580845664463, "loss": 0.0355, "step": 10960 }, { "epoch": 0.06, "learning_rate": 0.0002916982407636306, "loss": 0.0337, "step": 10970 }, { "epoch": 0.06, "learning_rate": 0.00029169067307061665, "loss": 0.0409, "step": 10980 }, { "epoch": 0.06, "learning_rate": 0.00029168310537760263, "loss": 0.0377, "step": 10990 }, { "epoch": 0.06, "learning_rate": 0.0002916755376845886, "loss": 0.0333, "step": 11000 }, { "epoch": 0.06, "eval_cer": 0.9145003381830497, "eval_loss": 0.027273865416646004, "eval_runtime": 117.4476, "eval_samples_per_second": 17.029, "eval_steps_per_second": 4.257, "step": 11000 }, { "epoch": 0.06, "learning_rate": 0.0002916679699915746, "loss": 0.032, "step": 11010 }, { "epoch": 0.06, "learning_rate": 0.0002916604022985606, "loss": 0.0327, "step": 11020 }, { "epoch": 0.06, "learning_rate": 0.00029165283460554656, "loss": 0.0479, "step": 11030 }, { "epoch": 0.06, "learning_rate": 0.0002916452669125326, "loss": 0.0659, "step": 11040 }, { "epoch": 0.06, "learning_rate": 0.0002916376992195186, "loss": 0.044, "step": 11050 }, { "epoch": 0.06, "learning_rate": 0.00029163013152650456, "loss": 0.0389, "step": 11060 }, { "epoch": 0.06, "learning_rate": 0.00029162256383349054, "loss": 0.0395, "step": 11070 }, { "epoch": 0.06, "learning_rate": 0.0002916149961404765, "loss": 0.0589, "step": 11080 }, { "epoch": 0.06, "learning_rate": 0.0002916074284474625, "loss": 0.0441, "step": 11090 }, { "epoch": 0.06, "learning_rate": 0.00029159986075444854, "loss": 0.0429, "step": 11100 }, { "epoch": 0.06, "learning_rate": 0.0002915922930614345, "loss": 0.0401, "step": 11110 }, { "epoch": 0.06, "learning_rate": 0.0002915847253684205, "loss": 0.0403, "step": 11120 }, { "epoch": 0.06, "learning_rate": 0.0002915771576754065, "loss": 0.0418, "step": 11130 }, { "epoch": 0.06, "learning_rate": 0.00029156958998239246, "loss": 0.0355, "step": 11140 }, { "epoch": 0.06, "learning_rate": 0.00029156202228937844, "loss": 0.0404, "step": 11150 }, { "epoch": 0.06, "learning_rate": 0.0002915544545963644, "loss": 0.0396, "step": 11160 }, { "epoch": 0.06, "learning_rate": 0.00029154688690335046, "loss": 0.0428, "step": 11170 }, { "epoch": 0.06, "learning_rate": 0.00029153931921033644, "loss": 0.0404, "step": 11180 }, { "epoch": 0.06, "learning_rate": 0.0002915317515173224, "loss": 0.0358, "step": 11190 }, { "epoch": 0.06, "learning_rate": 0.0002915241838243084, "loss": 0.0383, "step": 11200 }, { "epoch": 0.06, "learning_rate": 0.0002915166161312944, "loss": 0.0385, "step": 11210 }, { "epoch": 0.06, "learning_rate": 0.00029150904843828037, "loss": 0.0371, "step": 11220 }, { "epoch": 0.06, "learning_rate": 0.0002915014807452664, "loss": 0.0374, "step": 11230 }, { "epoch": 0.06, "learning_rate": 0.0002914939130522524, "loss": 0.0389, "step": 11240 }, { "epoch": 0.06, "learning_rate": 0.00029148634535923837, "loss": 0.0397, "step": 11250 }, { "epoch": 0.06, "learning_rate": 0.00029147877766622435, "loss": 0.0373, "step": 11260 }, { "epoch": 0.06, "learning_rate": 0.00029147120997321033, "loss": 0.0372, "step": 11270 }, { "epoch": 0.06, "learning_rate": 0.0002914636422801963, "loss": 0.0383, "step": 11280 }, { "epoch": 0.06, "learning_rate": 0.00029145607458718235, "loss": 0.036, "step": 11290 }, { "epoch": 0.06, "learning_rate": 0.00029144850689416833, "loss": 0.0377, "step": 11300 }, { "epoch": 0.06, "learning_rate": 0.0002914409392011543, "loss": 0.0394, "step": 11310 }, { "epoch": 0.06, "learning_rate": 0.0002914333715081403, "loss": 0.0408, "step": 11320 }, { "epoch": 0.06, "learning_rate": 0.00029142580381512627, "loss": 0.0381, "step": 11330 }, { "epoch": 0.06, "learning_rate": 0.00029141823612211225, "loss": 0.038, "step": 11340 }, { "epoch": 0.06, "learning_rate": 0.00029141066842909824, "loss": 0.0319, "step": 11350 }, { "epoch": 0.06, "learning_rate": 0.00029140310073608427, "loss": 0.0309, "step": 11360 }, { "epoch": 0.06, "learning_rate": 0.00029139553304307025, "loss": 0.036, "step": 11370 }, { "epoch": 0.06, "learning_rate": 0.00029138796535005623, "loss": 0.0346, "step": 11380 }, { "epoch": 0.06, "learning_rate": 0.0002913803976570422, "loss": 0.0753, "step": 11390 }, { "epoch": 0.06, "learning_rate": 0.0002913728299640282, "loss": 0.037, "step": 11400 }, { "epoch": 0.06, "learning_rate": 0.0002913652622710142, "loss": 0.0302, "step": 11410 }, { "epoch": 0.06, "learning_rate": 0.0002913576945780002, "loss": 0.0365, "step": 11420 }, { "epoch": 0.06, "learning_rate": 0.0002913501268849862, "loss": 0.0351, "step": 11430 }, { "epoch": 0.06, "learning_rate": 0.0002913425591919722, "loss": 0.0354, "step": 11440 }, { "epoch": 0.06, "learning_rate": 0.00029133499149895816, "loss": 0.0371, "step": 11450 }, { "epoch": 0.06, "learning_rate": 0.00029132742380594414, "loss": 0.0396, "step": 11460 }, { "epoch": 0.06, "learning_rate": 0.0002913198561129301, "loss": 0.0351, "step": 11470 }, { "epoch": 0.06, "learning_rate": 0.0002913122884199161, "loss": 0.0356, "step": 11480 }, { "epoch": 0.06, "learning_rate": 0.00029130472072690214, "loss": 0.0317, "step": 11490 }, { "epoch": 0.06, "learning_rate": 0.0002912971530338881, "loss": 0.0347, "step": 11500 }, { "epoch": 0.06, "learning_rate": 0.0002912895853408741, "loss": 0.0338, "step": 11510 }, { "epoch": 0.06, "learning_rate": 0.0002912820176478601, "loss": 0.0393, "step": 11520 }, { "epoch": 0.06, "learning_rate": 0.00029127444995484606, "loss": 0.0316, "step": 11530 }, { "epoch": 0.06, "learning_rate": 0.00029126688226183205, "loss": 0.04, "step": 11540 }, { "epoch": 0.06, "learning_rate": 0.0002912593145688181, "loss": 0.0313, "step": 11550 }, { "epoch": 0.06, "learning_rate": 0.00029125174687580406, "loss": 0.0319, "step": 11560 }, { "epoch": 0.06, "learning_rate": 0.00029124417918279004, "loss": 0.0326, "step": 11570 }, { "epoch": 0.06, "learning_rate": 0.000291236611489776, "loss": 0.038, "step": 11580 }, { "epoch": 0.06, "learning_rate": 0.000291229043796762, "loss": 0.0363, "step": 11590 }, { "epoch": 0.06, "learning_rate": 0.000291221476103748, "loss": 0.0331, "step": 11600 }, { "epoch": 0.06, "learning_rate": 0.000291213908410734, "loss": 0.033, "step": 11610 }, { "epoch": 0.06, "learning_rate": 0.00029120634071772, "loss": 0.0379, "step": 11620 }, { "epoch": 0.06, "learning_rate": 0.000291198773024706, "loss": 0.037, "step": 11630 }, { "epoch": 0.06, "learning_rate": 0.00029119120533169197, "loss": 0.038, "step": 11640 }, { "epoch": 0.06, "learning_rate": 0.00029118363763867795, "loss": 0.0337, "step": 11650 }, { "epoch": 0.06, "learning_rate": 0.00029117606994566393, "loss": 0.034, "step": 11660 }, { "epoch": 0.06, "learning_rate": 0.0002911685022526499, "loss": 0.0362, "step": 11670 }, { "epoch": 0.06, "learning_rate": 0.00029116093455963595, "loss": 0.0363, "step": 11680 }, { "epoch": 0.06, "learning_rate": 0.00029115336686662193, "loss": 0.0393, "step": 11690 }, { "epoch": 0.06, "learning_rate": 0.0002911457991736079, "loss": 0.0366, "step": 11700 }, { "epoch": 0.06, "learning_rate": 0.0002911382314805939, "loss": 0.0364, "step": 11710 }, { "epoch": 0.06, "learning_rate": 0.0002911306637875799, "loss": 0.0375, "step": 11720 }, { "epoch": 0.06, "learning_rate": 0.00029112309609456586, "loss": 0.0362, "step": 11730 }, { "epoch": 0.06, "learning_rate": 0.0002911155284015519, "loss": 0.0365, "step": 11740 }, { "epoch": 0.06, "learning_rate": 0.00029110796070853787, "loss": 0.0312, "step": 11750 }, { "epoch": 0.06, "learning_rate": 0.00029110039301552385, "loss": 0.0329, "step": 11760 }, { "epoch": 0.06, "learning_rate": 0.00029109282532250984, "loss": 0.0376, "step": 11770 }, { "epoch": 0.06, "learning_rate": 0.0002910852576294958, "loss": 0.0363, "step": 11780 }, { "epoch": 0.06, "learning_rate": 0.0002910776899364818, "loss": 0.0418, "step": 11790 }, { "epoch": 0.06, "learning_rate": 0.00029107012224346783, "loss": 0.0339, "step": 11800 }, { "epoch": 0.06, "learning_rate": 0.0002910625545504538, "loss": 0.0385, "step": 11810 }, { "epoch": 0.06, "learning_rate": 0.0002910549868574398, "loss": 0.0373, "step": 11820 }, { "epoch": 0.06, "learning_rate": 0.0002910474191644258, "loss": 0.0311, "step": 11830 }, { "epoch": 0.06, "learning_rate": 0.00029103985147141176, "loss": 0.0353, "step": 11840 }, { "epoch": 0.06, "learning_rate": 0.00029103228377839774, "loss": 0.0359, "step": 11850 }, { "epoch": 0.06, "learning_rate": 0.0002910247160853837, "loss": 0.0353, "step": 11860 }, { "epoch": 0.06, "learning_rate": 0.00029101714839236976, "loss": 0.0389, "step": 11870 }, { "epoch": 0.06, "learning_rate": 0.00029100958069935574, "loss": 0.0358, "step": 11880 }, { "epoch": 0.06, "learning_rate": 0.0002910020130063417, "loss": 0.0369, "step": 11890 }, { "epoch": 0.06, "learning_rate": 0.0002909944453133277, "loss": 0.0368, "step": 11900 }, { "epoch": 0.06, "learning_rate": 0.0002909868776203137, "loss": 0.0347, "step": 11910 }, { "epoch": 0.06, "learning_rate": 0.00029097930992729967, "loss": 0.0351, "step": 11920 }, { "epoch": 0.06, "learning_rate": 0.0002909717422342857, "loss": 0.0364, "step": 11930 }, { "epoch": 0.06, "learning_rate": 0.0002909641745412717, "loss": 0.0358, "step": 11940 }, { "epoch": 0.06, "learning_rate": 0.0002909566068482576, "loss": 0.0367, "step": 11950 }, { "epoch": 0.06, "learning_rate": 0.0002909490391552436, "loss": 0.0375, "step": 11960 }, { "epoch": 0.06, "learning_rate": 0.0002909414714622296, "loss": 0.0364, "step": 11970 }, { "epoch": 0.06, "learning_rate": 0.0002909339037692156, "loss": 0.0374, "step": 11980 }, { "epoch": 0.06, "learning_rate": 0.0002909263360762016, "loss": 0.0334, "step": 11990 }, { "epoch": 0.06, "learning_rate": 0.00029091876838318757, "loss": 0.0286, "step": 12000 }, { "epoch": 0.06, "eval_cer": 0.9145042197675514, "eval_loss": 0.026305437088012695, "eval_runtime": 117.4972, "eval_samples_per_second": 17.022, "eval_steps_per_second": 4.255, "step": 12000 }, { "epoch": 0.06, "learning_rate": 0.00029091120069017355, "loss": 0.0336, "step": 12010 }, { "epoch": 0.06, "learning_rate": 0.00029090363299715953, "loss": 0.0372, "step": 12020 }, { "epoch": 0.06, "learning_rate": 0.00029089606530414557, "loss": 0.0361, "step": 12030 }, { "epoch": 0.06, "learning_rate": 0.00029088849761113155, "loss": 0.0325, "step": 12040 }, { "epoch": 0.06, "learning_rate": 0.00029088092991811753, "loss": 0.0327, "step": 12050 }, { "epoch": 0.06, "learning_rate": 0.0002908733622251035, "loss": 0.0293, "step": 12060 }, { "epoch": 0.06, "learning_rate": 0.0002908657945320895, "loss": 0.033, "step": 12070 }, { "epoch": 0.06, "learning_rate": 0.0002908582268390755, "loss": 0.0414, "step": 12080 }, { "epoch": 0.06, "learning_rate": 0.00029085065914606146, "loss": 0.0345, "step": 12090 }, { "epoch": 0.06, "learning_rate": 0.0002908430914530475, "loss": 0.0344, "step": 12100 }, { "epoch": 0.06, "learning_rate": 0.0002908355237600335, "loss": 0.0329, "step": 12110 }, { "epoch": 0.06, "learning_rate": 0.00029082795606701946, "loss": 0.0307, "step": 12120 }, { "epoch": 0.06, "learning_rate": 0.00029082038837400544, "loss": 0.0321, "step": 12130 }, { "epoch": 0.06, "learning_rate": 0.0002908128206809914, "loss": 0.0359, "step": 12140 }, { "epoch": 0.06, "learning_rate": 0.0002908052529879774, "loss": 0.0324, "step": 12150 }, { "epoch": 0.06, "learning_rate": 0.00029079768529496344, "loss": 0.0349, "step": 12160 }, { "epoch": 0.06, "learning_rate": 0.0002907901176019494, "loss": 0.0323, "step": 12170 }, { "epoch": 0.06, "learning_rate": 0.0002907825499089354, "loss": 0.0378, "step": 12180 }, { "epoch": 0.06, "learning_rate": 0.0002907749822159214, "loss": 0.0332, "step": 12190 }, { "epoch": 0.06, "learning_rate": 0.00029076741452290736, "loss": 0.0339, "step": 12200 }, { "epoch": 0.06, "learning_rate": 0.00029075984682989334, "loss": 0.0361, "step": 12210 }, { "epoch": 0.06, "learning_rate": 0.0002907522791368793, "loss": 0.0336, "step": 12220 }, { "epoch": 0.06, "learning_rate": 0.00029074471144386536, "loss": 0.0313, "step": 12230 }, { "epoch": 0.06, "learning_rate": 0.00029073714375085134, "loss": 0.0326, "step": 12240 }, { "epoch": 0.06, "learning_rate": 0.0002907295760578373, "loss": 0.0321, "step": 12250 }, { "epoch": 0.06, "learning_rate": 0.0002907220083648233, "loss": 0.0311, "step": 12260 }, { "epoch": 0.06, "learning_rate": 0.0002907144406718093, "loss": 0.0396, "step": 12270 }, { "epoch": 0.06, "learning_rate": 0.00029070687297879527, "loss": 0.0312, "step": 12280 }, { "epoch": 0.06, "learning_rate": 0.0002906993052857813, "loss": 0.0345, "step": 12290 }, { "epoch": 0.06, "learning_rate": 0.0002906917375927673, "loss": 0.0336, "step": 12300 }, { "epoch": 0.06, "learning_rate": 0.00029068416989975327, "loss": 0.0433, "step": 12310 }, { "epoch": 0.06, "learning_rate": 0.00029067660220673925, "loss": 0.0356, "step": 12320 }, { "epoch": 0.06, "learning_rate": 0.00029066903451372523, "loss": 0.0329, "step": 12330 }, { "epoch": 0.06, "learning_rate": 0.0002906614668207112, "loss": 0.0341, "step": 12340 }, { "epoch": 0.06, "learning_rate": 0.00029065389912769725, "loss": 0.033, "step": 12350 }, { "epoch": 0.06, "learning_rate": 0.00029064633143468323, "loss": 0.0393, "step": 12360 }, { "epoch": 0.06, "learning_rate": 0.0002906387637416692, "loss": 0.0398, "step": 12370 }, { "epoch": 0.06, "learning_rate": 0.0002906311960486552, "loss": 0.0456, "step": 12380 }, { "epoch": 0.06, "learning_rate": 0.00029062362835564117, "loss": 0.0452, "step": 12390 }, { "epoch": 0.06, "learning_rate": 0.00029061606066262715, "loss": 0.0408, "step": 12400 }, { "epoch": 0.06, "learning_rate": 0.00029060849296961314, "loss": 0.0333, "step": 12410 }, { "epoch": 0.06, "learning_rate": 0.00029060092527659917, "loss": 0.0363, "step": 12420 }, { "epoch": 0.06, "learning_rate": 0.00029059335758358515, "loss": 0.036, "step": 12430 }, { "epoch": 0.06, "learning_rate": 0.00029058578989057113, "loss": 0.0361, "step": 12440 }, { "epoch": 0.06, "learning_rate": 0.0002905782221975571, "loss": 0.0384, "step": 12450 }, { "epoch": 0.06, "learning_rate": 0.0002905706545045431, "loss": 0.0354, "step": 12460 }, { "epoch": 0.06, "learning_rate": 0.0002905630868115291, "loss": 0.0404, "step": 12470 }, { "epoch": 0.06, "learning_rate": 0.0002905555191185151, "loss": 0.0301, "step": 12480 }, { "epoch": 0.06, "learning_rate": 0.0002905479514255011, "loss": 0.0325, "step": 12490 }, { "epoch": 0.06, "learning_rate": 0.0002905403837324871, "loss": 0.0303, "step": 12500 }, { "epoch": 0.06, "learning_rate": 0.00029053281603947306, "loss": 0.0342, "step": 12510 }, { "epoch": 0.06, "learning_rate": 0.00029052524834645904, "loss": 0.0303, "step": 12520 }, { "epoch": 0.06, "learning_rate": 0.000290517680653445, "loss": 0.0327, "step": 12530 }, { "epoch": 0.06, "learning_rate": 0.000290510112960431, "loss": 0.036, "step": 12540 }, { "epoch": 0.06, "learning_rate": 0.00029050254526741704, "loss": 0.0303, "step": 12550 }, { "epoch": 0.06, "learning_rate": 0.000290494977574403, "loss": 0.0349, "step": 12560 }, { "epoch": 0.06, "learning_rate": 0.000290487409881389, "loss": 0.0347, "step": 12570 }, { "epoch": 0.06, "learning_rate": 0.000290479842188375, "loss": 0.035, "step": 12580 }, { "epoch": 0.06, "learning_rate": 0.00029047227449536096, "loss": 0.0285, "step": 12590 }, { "epoch": 0.06, "learning_rate": 0.00029046470680234695, "loss": 0.032, "step": 12600 }, { "epoch": 0.06, "learning_rate": 0.000290457139109333, "loss": 0.0345, "step": 12610 }, { "epoch": 0.06, "learning_rate": 0.00029044957141631896, "loss": 0.0381, "step": 12620 }, { "epoch": 0.06, "learning_rate": 0.00029044200372330494, "loss": 0.04, "step": 12630 }, { "epoch": 0.06, "learning_rate": 0.0002904344360302909, "loss": 0.0362, "step": 12640 }, { "epoch": 0.06, "learning_rate": 0.0002904268683372769, "loss": 0.032, "step": 12650 }, { "epoch": 0.06, "learning_rate": 0.0002904193006442629, "loss": 0.0366, "step": 12660 }, { "epoch": 0.06, "learning_rate": 0.0002904117329512489, "loss": 0.0349, "step": 12670 }, { "epoch": 0.06, "learning_rate": 0.0002904041652582349, "loss": 0.0369, "step": 12680 }, { "epoch": 0.06, "learning_rate": 0.0002903965975652209, "loss": 0.0337, "step": 12690 }, { "epoch": 0.06, "learning_rate": 0.00029038902987220687, "loss": 0.0308, "step": 12700 }, { "epoch": 0.06, "learning_rate": 0.00029038146217919285, "loss": 0.0523, "step": 12710 }, { "epoch": 0.06, "learning_rate": 0.00029037389448617883, "loss": 0.0437, "step": 12720 }, { "epoch": 0.06, "learning_rate": 0.0002903663267931648, "loss": 0.0365, "step": 12730 }, { "epoch": 0.06, "learning_rate": 0.00029035875910015085, "loss": 0.0349, "step": 12740 }, { "epoch": 0.06, "learning_rate": 0.00029035119140713683, "loss": 0.0321, "step": 12750 }, { "epoch": 0.06, "learning_rate": 0.0002903436237141228, "loss": 0.0318, "step": 12760 }, { "epoch": 0.06, "learning_rate": 0.0002903360560211088, "loss": 0.0335, "step": 12770 }, { "epoch": 0.06, "learning_rate": 0.0002903284883280948, "loss": 0.0305, "step": 12780 }, { "epoch": 0.06, "learning_rate": 0.00029032092063508076, "loss": 0.0381, "step": 12790 }, { "epoch": 0.06, "learning_rate": 0.0002903133529420668, "loss": 0.0327, "step": 12800 }, { "epoch": 0.06, "learning_rate": 0.00029030578524905277, "loss": 0.0432, "step": 12810 }, { "epoch": 0.06, "learning_rate": 0.00029029821755603875, "loss": 0.0372, "step": 12820 }, { "epoch": 0.06, "learning_rate": 0.00029029064986302474, "loss": 0.0574, "step": 12830 }, { "epoch": 0.06, "learning_rate": 0.0002902830821700107, "loss": 0.045, "step": 12840 }, { "epoch": 0.06, "learning_rate": 0.0002902755144769967, "loss": 0.0303, "step": 12850 }, { "epoch": 0.06, "learning_rate": 0.00029026794678398273, "loss": 0.0365, "step": 12860 }, { "epoch": 0.06, "learning_rate": 0.0002902603790909687, "loss": 0.0443, "step": 12870 }, { "epoch": 0.06, "learning_rate": 0.0002902528113979547, "loss": 0.0384, "step": 12880 }, { "epoch": 0.07, "learning_rate": 0.0002902452437049407, "loss": 0.035, "step": 12890 }, { "epoch": 0.07, "learning_rate": 0.00029023767601192666, "loss": 0.0431, "step": 12900 }, { "epoch": 0.07, "learning_rate": 0.00029023010831891264, "loss": 0.0393, "step": 12910 }, { "epoch": 0.07, "learning_rate": 0.0002902225406258986, "loss": 0.0324, "step": 12920 }, { "epoch": 0.07, "learning_rate": 0.00029021497293288466, "loss": 0.0353, "step": 12930 }, { "epoch": 0.07, "learning_rate": 0.00029020740523987064, "loss": 0.0457, "step": 12940 }, { "epoch": 0.07, "learning_rate": 0.0002901998375468566, "loss": 0.0338, "step": 12950 }, { "epoch": 0.07, "learning_rate": 0.0002901922698538426, "loss": 0.0305, "step": 12960 }, { "epoch": 0.07, "learning_rate": 0.0002901847021608286, "loss": 0.0322, "step": 12970 }, { "epoch": 0.07, "learning_rate": 0.00029017713446781457, "loss": 0.0351, "step": 12980 }, { "epoch": 0.07, "learning_rate": 0.0002901695667748006, "loss": 0.0309, "step": 12990 }, { "epoch": 0.07, "learning_rate": 0.0002901619990817866, "loss": 0.0373, "step": 13000 }, { "epoch": 0.07, "eval_cer": 0.9145245980861848, "eval_loss": 0.026163555681705475, "eval_runtime": 116.7644, "eval_samples_per_second": 17.129, "eval_steps_per_second": 4.282, "step": 13000 }, { "epoch": 0.07, "learning_rate": 0.00029015443138877256, "loss": 0.0371, "step": 13010 }, { "epoch": 0.07, "learning_rate": 0.00029014686369575855, "loss": 0.0344, "step": 13020 }, { "epoch": 0.07, "learning_rate": 0.0002901392960027445, "loss": 0.0352, "step": 13030 }, { "epoch": 0.07, "learning_rate": 0.0002901317283097305, "loss": 0.0361, "step": 13040 }, { "epoch": 0.07, "learning_rate": 0.0002901241606167165, "loss": 0.0444, "step": 13050 }, { "epoch": 0.07, "learning_rate": 0.0002901165929237025, "loss": 0.0307, "step": 13060 }, { "epoch": 0.07, "learning_rate": 0.0002901090252306885, "loss": 0.034, "step": 13070 }, { "epoch": 0.07, "learning_rate": 0.0002901014575376745, "loss": 0.0451, "step": 13080 }, { "epoch": 0.07, "learning_rate": 0.00029009388984466047, "loss": 0.0379, "step": 13090 }, { "epoch": 0.07, "learning_rate": 0.00029008632215164645, "loss": 0.0347, "step": 13100 }, { "epoch": 0.07, "learning_rate": 0.00029007875445863243, "loss": 0.0288, "step": 13110 }, { "epoch": 0.07, "learning_rate": 0.00029007118676561847, "loss": 0.038, "step": 13120 }, { "epoch": 0.07, "learning_rate": 0.00029006361907260445, "loss": 0.032, "step": 13130 }, { "epoch": 0.07, "learning_rate": 0.00029005605137959043, "loss": 0.0372, "step": 13140 }, { "epoch": 0.07, "learning_rate": 0.0002900484836865764, "loss": 0.0325, "step": 13150 }, { "epoch": 0.07, "learning_rate": 0.0002900409159935624, "loss": 0.0342, "step": 13160 }, { "epoch": 0.07, "learning_rate": 0.0002900333483005484, "loss": 0.0377, "step": 13170 }, { "epoch": 0.07, "learning_rate": 0.0002900257806075344, "loss": 0.0408, "step": 13180 }, { "epoch": 0.07, "learning_rate": 0.0002900182129145204, "loss": 0.0353, "step": 13190 }, { "epoch": 0.07, "learning_rate": 0.0002900106452215063, "loss": 0.0307, "step": 13200 }, { "epoch": 0.07, "learning_rate": 0.0002900030775284923, "loss": 0.0331, "step": 13210 }, { "epoch": 0.07, "learning_rate": 0.00028999550983547834, "loss": 0.0322, "step": 13220 }, { "epoch": 0.07, "learning_rate": 0.0002899879421424643, "loss": 0.0342, "step": 13230 }, { "epoch": 0.07, "learning_rate": 0.0002899803744494503, "loss": 0.0312, "step": 13240 }, { "epoch": 0.07, "learning_rate": 0.0002899728067564363, "loss": 0.0645, "step": 13250 }, { "epoch": 0.07, "learning_rate": 0.00028996523906342226, "loss": 0.0352, "step": 13260 }, { "epoch": 0.07, "learning_rate": 0.00028995767137040824, "loss": 0.0671, "step": 13270 }, { "epoch": 0.07, "learning_rate": 0.0002899501036773942, "loss": 0.0338, "step": 13280 }, { "epoch": 0.07, "learning_rate": 0.00028994253598438026, "loss": 0.0341, "step": 13290 }, { "epoch": 0.07, "learning_rate": 0.00028993496829136624, "loss": 0.036, "step": 13300 }, { "epoch": 0.07, "learning_rate": 0.0002899274005983522, "loss": 0.0352, "step": 13310 }, { "epoch": 0.07, "learning_rate": 0.0002899198329053382, "loss": 0.0352, "step": 13320 }, { "epoch": 0.07, "learning_rate": 0.0002899122652123242, "loss": 0.0402, "step": 13330 }, { "epoch": 0.07, "learning_rate": 0.00028990469751931017, "loss": 0.0315, "step": 13340 }, { "epoch": 0.07, "learning_rate": 0.0002898971298262962, "loss": 0.0331, "step": 13350 }, { "epoch": 0.07, "learning_rate": 0.0002898895621332822, "loss": 0.0371, "step": 13360 }, { "epoch": 0.07, "learning_rate": 0.00028988199444026817, "loss": 0.0314, "step": 13370 }, { "epoch": 0.07, "learning_rate": 0.00028987442674725415, "loss": 0.0473, "step": 13380 }, { "epoch": 0.07, "learning_rate": 0.00028986685905424013, "loss": 0.0328, "step": 13390 }, { "epoch": 0.07, "learning_rate": 0.0002898592913612261, "loss": 0.0332, "step": 13400 }, { "epoch": 0.07, "learning_rate": 0.00028985172366821215, "loss": 0.0323, "step": 13410 }, { "epoch": 0.07, "learning_rate": 0.00028984415597519813, "loss": 0.0412, "step": 13420 }, { "epoch": 0.07, "learning_rate": 0.0002898365882821841, "loss": 0.037, "step": 13430 }, { "epoch": 0.07, "learning_rate": 0.0002898290205891701, "loss": 0.0363, "step": 13440 }, { "epoch": 0.07, "learning_rate": 0.00028982145289615607, "loss": 0.0358, "step": 13450 }, { "epoch": 0.07, "learning_rate": 0.00028981388520314205, "loss": 0.026, "step": 13460 }, { "epoch": 0.07, "learning_rate": 0.00028980631751012804, "loss": 0.04, "step": 13470 }, { "epoch": 0.07, "learning_rate": 0.00028979874981711407, "loss": 0.0377, "step": 13480 }, { "epoch": 0.07, "learning_rate": 0.00028979118212410005, "loss": 0.0385, "step": 13490 }, { "epoch": 0.07, "learning_rate": 0.00028978361443108603, "loss": 0.0294, "step": 13500 }, { "epoch": 0.07, "learning_rate": 0.000289776046738072, "loss": 0.0346, "step": 13510 }, { "epoch": 0.07, "learning_rate": 0.000289768479045058, "loss": 0.0333, "step": 13520 }, { "epoch": 0.07, "learning_rate": 0.000289760911352044, "loss": 0.0357, "step": 13530 }, { "epoch": 0.07, "learning_rate": 0.00028975334365903, "loss": 0.0348, "step": 13540 }, { "epoch": 0.07, "learning_rate": 0.000289745775966016, "loss": 0.0355, "step": 13550 }, { "epoch": 0.07, "learning_rate": 0.000289738208273002, "loss": 0.0329, "step": 13560 }, { "epoch": 0.07, "learning_rate": 0.00028973064057998796, "loss": 0.0385, "step": 13570 }, { "epoch": 0.07, "learning_rate": 0.00028972307288697394, "loss": 0.0433, "step": 13580 }, { "epoch": 0.07, "learning_rate": 0.0002897155051939599, "loss": 0.0325, "step": 13590 }, { "epoch": 0.07, "learning_rate": 0.00028970793750094596, "loss": 0.0367, "step": 13600 }, { "epoch": 0.07, "learning_rate": 0.00028970036980793194, "loss": 0.0551, "step": 13610 }, { "epoch": 0.07, "learning_rate": 0.0002896928021149179, "loss": 0.0347, "step": 13620 }, { "epoch": 0.07, "learning_rate": 0.0002896852344219039, "loss": 0.0574, "step": 13630 }, { "epoch": 0.07, "learning_rate": 0.0002896776667288899, "loss": 0.0331, "step": 13640 }, { "epoch": 0.07, "learning_rate": 0.00028967009903587586, "loss": 0.0646, "step": 13650 }, { "epoch": 0.07, "learning_rate": 0.00028966253134286185, "loss": 0.0507, "step": 13660 }, { "epoch": 0.07, "learning_rate": 0.0002896549636498479, "loss": 0.0312, "step": 13670 }, { "epoch": 0.07, "learning_rate": 0.00028964739595683386, "loss": 0.0364, "step": 13680 }, { "epoch": 0.07, "learning_rate": 0.00028963982826381984, "loss": 0.0587, "step": 13690 }, { "epoch": 0.07, "learning_rate": 0.0002896322605708058, "loss": 0.0328, "step": 13700 }, { "epoch": 0.07, "learning_rate": 0.0002896246928777918, "loss": 0.04, "step": 13710 }, { "epoch": 0.07, "learning_rate": 0.0002896171251847778, "loss": 0.0367, "step": 13720 }, { "epoch": 0.07, "learning_rate": 0.0002896095574917638, "loss": 0.0464, "step": 13730 }, { "epoch": 0.07, "learning_rate": 0.0002896019897987498, "loss": 0.0357, "step": 13740 }, { "epoch": 0.07, "learning_rate": 0.0002895944221057358, "loss": 0.0395, "step": 13750 }, { "epoch": 0.07, "learning_rate": 0.00028958685441272177, "loss": 0.0346, "step": 13760 }, { "epoch": 0.07, "learning_rate": 0.00028957928671970775, "loss": 0.0306, "step": 13770 }, { "epoch": 0.07, "learning_rate": 0.00028957171902669373, "loss": 0.0604, "step": 13780 }, { "epoch": 0.07, "learning_rate": 0.0002895641513336797, "loss": 0.0405, "step": 13790 }, { "epoch": 0.07, "learning_rate": 0.00028955658364066575, "loss": 0.0467, "step": 13800 }, { "epoch": 0.07, "learning_rate": 0.00028954901594765173, "loss": 0.0378, "step": 13810 }, { "epoch": 0.07, "learning_rate": 0.0002895414482546377, "loss": 0.0559, "step": 13820 }, { "epoch": 0.07, "learning_rate": 0.0002895338805616237, "loss": 0.0322, "step": 13830 }, { "epoch": 0.07, "learning_rate": 0.0002895263128686097, "loss": 0.0332, "step": 13840 }, { "epoch": 0.07, "learning_rate": 0.00028951874517559566, "loss": 0.0363, "step": 13850 }, { "epoch": 0.07, "learning_rate": 0.0002895111774825817, "loss": 0.0429, "step": 13860 }, { "epoch": 0.07, "learning_rate": 0.00028950360978956767, "loss": 0.0317, "step": 13870 }, { "epoch": 0.07, "learning_rate": 0.00028949604209655365, "loss": 0.0326, "step": 13880 }, { "epoch": 0.07, "learning_rate": 0.00028948847440353964, "loss": 0.0333, "step": 13890 }, { "epoch": 0.07, "learning_rate": 0.0002894809067105256, "loss": 0.0299, "step": 13900 }, { "epoch": 0.07, "learning_rate": 0.0002894733390175116, "loss": 0.0324, "step": 13910 }, { "epoch": 0.07, "learning_rate": 0.00028946577132449763, "loss": 0.0354, "step": 13920 }, { "epoch": 0.07, "learning_rate": 0.0002894582036314836, "loss": 0.0404, "step": 13930 }, { "epoch": 0.07, "learning_rate": 0.0002894506359384696, "loss": 0.0354, "step": 13940 }, { "epoch": 0.07, "learning_rate": 0.0002894430682454556, "loss": 0.0367, "step": 13950 }, { "epoch": 0.07, "learning_rate": 0.00028943550055244156, "loss": 0.031, "step": 13960 }, { "epoch": 0.07, "learning_rate": 0.00028942793285942754, "loss": 0.0277, "step": 13970 }, { "epoch": 0.07, "learning_rate": 0.0002894203651664135, "loss": 0.0345, "step": 13980 }, { "epoch": 0.07, "learning_rate": 0.00028941279747339956, "loss": 0.0318, "step": 13990 }, { "epoch": 0.07, "learning_rate": 0.00028940522978038554, "loss": 0.0418, "step": 14000 }, { "epoch": 0.07, "eval_cer": 0.9144731670915385, "eval_loss": 0.02422579564154148, "eval_runtime": 116.5786, "eval_samples_per_second": 17.156, "eval_steps_per_second": 4.289, "step": 14000 }, { "epoch": 0.07, "learning_rate": 0.0002893976620873715, "loss": 0.0302, "step": 14010 }, { "epoch": 0.07, "learning_rate": 0.0002893900943943575, "loss": 0.0365, "step": 14020 }, { "epoch": 0.07, "learning_rate": 0.0002893825267013435, "loss": 0.0346, "step": 14030 }, { "epoch": 0.07, "learning_rate": 0.00028937495900832947, "loss": 0.0365, "step": 14040 }, { "epoch": 0.07, "learning_rate": 0.0002893673913153155, "loss": 0.0297, "step": 14050 }, { "epoch": 0.07, "learning_rate": 0.0002893598236223015, "loss": 0.0367, "step": 14060 }, { "epoch": 0.07, "learning_rate": 0.00028935225592928746, "loss": 0.0343, "step": 14070 }, { "epoch": 0.07, "learning_rate": 0.00028934468823627345, "loss": 0.0285, "step": 14080 }, { "epoch": 0.07, "learning_rate": 0.00028933712054325943, "loss": 0.0311, "step": 14090 }, { "epoch": 0.07, "learning_rate": 0.0002893295528502454, "loss": 0.0287, "step": 14100 }, { "epoch": 0.07, "learning_rate": 0.00028932198515723144, "loss": 0.034, "step": 14110 }, { "epoch": 0.07, "learning_rate": 0.0002893144174642174, "loss": 0.0345, "step": 14120 }, { "epoch": 0.07, "learning_rate": 0.0002893068497712034, "loss": 0.0444, "step": 14130 }, { "epoch": 0.07, "learning_rate": 0.0002892992820781894, "loss": 0.0327, "step": 14140 }, { "epoch": 0.07, "learning_rate": 0.00028929171438517537, "loss": 0.0286, "step": 14150 }, { "epoch": 0.07, "learning_rate": 0.00028928414669216135, "loss": 0.0295, "step": 14160 }, { "epoch": 0.07, "learning_rate": 0.00028927657899914733, "loss": 0.0294, "step": 14170 }, { "epoch": 0.07, "learning_rate": 0.00028926901130613337, "loss": 0.0357, "step": 14180 }, { "epoch": 0.07, "learning_rate": 0.00028926144361311935, "loss": 0.035, "step": 14190 }, { "epoch": 0.07, "learning_rate": 0.00028925387592010533, "loss": 0.0372, "step": 14200 }, { "epoch": 0.07, "learning_rate": 0.0002892463082270913, "loss": 0.036, "step": 14210 }, { "epoch": 0.07, "learning_rate": 0.0002892387405340773, "loss": 0.0359, "step": 14220 }, { "epoch": 0.07, "learning_rate": 0.0002892311728410633, "loss": 0.0477, "step": 14230 }, { "epoch": 0.07, "learning_rate": 0.0002892236051480493, "loss": 0.0356, "step": 14240 }, { "epoch": 0.07, "learning_rate": 0.0002892160374550353, "loss": 0.0357, "step": 14250 }, { "epoch": 0.07, "learning_rate": 0.0002892084697620213, "loss": 0.0348, "step": 14260 }, { "epoch": 0.07, "learning_rate": 0.00028920090206900726, "loss": 0.0356, "step": 14270 }, { "epoch": 0.07, "learning_rate": 0.00028919333437599324, "loss": 0.0336, "step": 14280 }, { "epoch": 0.07, "learning_rate": 0.0002891857666829792, "loss": 0.053, "step": 14290 }, { "epoch": 0.07, "learning_rate": 0.0002891781989899652, "loss": 0.0315, "step": 14300 }, { "epoch": 0.07, "learning_rate": 0.00028917063129695124, "loss": 0.0358, "step": 14310 }, { "epoch": 0.07, "learning_rate": 0.0002891630636039372, "loss": 0.0324, "step": 14320 }, { "epoch": 0.07, "learning_rate": 0.0002891554959109232, "loss": 0.0473, "step": 14330 }, { "epoch": 0.07, "learning_rate": 0.0002891479282179092, "loss": 0.0392, "step": 14340 }, { "epoch": 0.07, "learning_rate": 0.00028914036052489516, "loss": 0.0394, "step": 14350 }, { "epoch": 0.07, "learning_rate": 0.00028913279283188114, "loss": 0.0356, "step": 14360 }, { "epoch": 0.07, "learning_rate": 0.0002891252251388672, "loss": 0.0348, "step": 14370 }, { "epoch": 0.07, "learning_rate": 0.00028911765744585316, "loss": 0.0415, "step": 14380 }, { "epoch": 0.07, "learning_rate": 0.00028911008975283914, "loss": 0.0364, "step": 14390 }, { "epoch": 0.07, "learning_rate": 0.0002891025220598251, "loss": 0.0495, "step": 14400 }, { "epoch": 0.07, "learning_rate": 0.0002890949543668111, "loss": 0.0333, "step": 14410 }, { "epoch": 0.07, "learning_rate": 0.0002890873866737971, "loss": 0.0472, "step": 14420 }, { "epoch": 0.07, "learning_rate": 0.0002890798189807831, "loss": 0.0325, "step": 14430 }, { "epoch": 0.07, "learning_rate": 0.0002890722512877691, "loss": 0.0442, "step": 14440 }, { "epoch": 0.07, "learning_rate": 0.0002890646835947551, "loss": 0.0373, "step": 14450 }, { "epoch": 0.07, "learning_rate": 0.000289057115901741, "loss": 0.0391, "step": 14460 }, { "epoch": 0.07, "learning_rate": 0.00028904954820872705, "loss": 0.0436, "step": 14470 }, { "epoch": 0.07, "learning_rate": 0.00028904198051571303, "loss": 0.037, "step": 14480 }, { "epoch": 0.07, "learning_rate": 0.000289034412822699, "loss": 0.0348, "step": 14490 }, { "epoch": 0.07, "learning_rate": 0.000289026845129685, "loss": 0.0468, "step": 14500 }, { "epoch": 0.07, "learning_rate": 0.000289019277436671, "loss": 0.0449, "step": 14510 }, { "epoch": 0.07, "learning_rate": 0.00028901170974365695, "loss": 0.035, "step": 14520 }, { "epoch": 0.07, "learning_rate": 0.00028900414205064294, "loss": 0.0357, "step": 14530 }, { "epoch": 0.07, "learning_rate": 0.00028899657435762897, "loss": 0.0312, "step": 14540 }, { "epoch": 0.07, "learning_rate": 0.00028898900666461495, "loss": 0.038, "step": 14550 }, { "epoch": 0.07, "learning_rate": 0.00028898143897160093, "loss": 0.0329, "step": 14560 }, { "epoch": 0.07, "learning_rate": 0.0002889738712785869, "loss": 0.0311, "step": 14570 }, { "epoch": 0.07, "learning_rate": 0.0002889663035855729, "loss": 0.0367, "step": 14580 }, { "epoch": 0.07, "learning_rate": 0.0002889587358925589, "loss": 0.0503, "step": 14590 }, { "epoch": 0.07, "learning_rate": 0.0002889511681995449, "loss": 0.0425, "step": 14600 }, { "epoch": 0.07, "learning_rate": 0.0002889436005065309, "loss": 0.0403, "step": 14610 }, { "epoch": 0.07, "learning_rate": 0.0002889360328135169, "loss": 0.0389, "step": 14620 }, { "epoch": 0.07, "learning_rate": 0.00028892846512050286, "loss": 0.0358, "step": 14630 }, { "epoch": 0.07, "learning_rate": 0.00028892089742748884, "loss": 0.0336, "step": 14640 }, { "epoch": 0.07, "learning_rate": 0.0002889133297344748, "loss": 0.0622, "step": 14650 }, { "epoch": 0.07, "learning_rate": 0.00028890576204146086, "loss": 0.0343, "step": 14660 }, { "epoch": 0.07, "learning_rate": 0.00028889819434844684, "loss": 0.0374, "step": 14670 }, { "epoch": 0.07, "learning_rate": 0.0002888906266554328, "loss": 0.0478, "step": 14680 }, { "epoch": 0.07, "learning_rate": 0.0002888830589624188, "loss": 0.0415, "step": 14690 }, { "epoch": 0.07, "learning_rate": 0.0002888754912694048, "loss": 0.0346, "step": 14700 }, { "epoch": 0.07, "learning_rate": 0.00028886792357639076, "loss": 0.0348, "step": 14710 }, { "epoch": 0.07, "learning_rate": 0.00028886035588337675, "loss": 0.0324, "step": 14720 }, { "epoch": 0.07, "learning_rate": 0.0002888527881903628, "loss": 0.0433, "step": 14730 }, { "epoch": 0.07, "learning_rate": 0.00028884522049734876, "loss": 0.03, "step": 14740 }, { "epoch": 0.07, "learning_rate": 0.00028883765280433474, "loss": 0.0347, "step": 14750 }, { "epoch": 0.07, "learning_rate": 0.0002888300851113207, "loss": 0.0369, "step": 14760 }, { "epoch": 0.07, "learning_rate": 0.0002888225174183067, "loss": 0.0439, "step": 14770 }, { "epoch": 0.07, "learning_rate": 0.0002888149497252927, "loss": 0.0368, "step": 14780 }, { "epoch": 0.07, "learning_rate": 0.0002888073820322787, "loss": 0.0311, "step": 14790 }, { "epoch": 0.07, "learning_rate": 0.0002887998143392647, "loss": 0.0356, "step": 14800 }, { "epoch": 0.07, "learning_rate": 0.0002887922466462507, "loss": 0.0304, "step": 14810 }, { "epoch": 0.07, "learning_rate": 0.00028878467895323667, "loss": 0.0304, "step": 14820 }, { "epoch": 0.07, "learning_rate": 0.00028877711126022265, "loss": 0.037, "step": 14830 }, { "epoch": 0.07, "learning_rate": 0.00028876954356720863, "loss": 0.0331, "step": 14840 }, { "epoch": 0.07, "learning_rate": 0.0002887619758741946, "loss": 0.0329, "step": 14850 }, { "epoch": 0.07, "learning_rate": 0.00028875440818118065, "loss": 0.0359, "step": 14860 }, { "epoch": 0.08, "learning_rate": 0.00028874684048816663, "loss": 0.0347, "step": 14870 }, { "epoch": 0.08, "learning_rate": 0.0002887392727951526, "loss": 0.0534, "step": 14880 }, { "epoch": 0.08, "learning_rate": 0.0002887317051021386, "loss": 0.0317, "step": 14890 }, { "epoch": 0.08, "learning_rate": 0.0002887241374091246, "loss": 0.0433, "step": 14900 }, { "epoch": 0.08, "learning_rate": 0.00028871656971611056, "loss": 0.0429, "step": 14910 }, { "epoch": 0.08, "learning_rate": 0.0002887090020230966, "loss": 0.0369, "step": 14920 }, { "epoch": 0.08, "learning_rate": 0.0002887014343300826, "loss": 0.0347, "step": 14930 }, { "epoch": 0.08, "learning_rate": 0.00028869386663706855, "loss": 0.0352, "step": 14940 }, { "epoch": 0.08, "learning_rate": 0.00028868629894405454, "loss": 0.0322, "step": 14950 }, { "epoch": 0.08, "learning_rate": 0.0002886787312510405, "loss": 0.0314, "step": 14960 }, { "epoch": 0.08, "learning_rate": 0.0002886711635580265, "loss": 0.0342, "step": 14970 }, { "epoch": 0.08, "learning_rate": 0.00028866359586501253, "loss": 0.0588, "step": 14980 }, { "epoch": 0.08, "learning_rate": 0.0002886560281719985, "loss": 0.0336, "step": 14990 }, { "epoch": 0.08, "learning_rate": 0.0002886484604789845, "loss": 0.0316, "step": 15000 }, { "epoch": 0.08, "eval_cer": 0.9145216868978086, "eval_loss": 0.025017283856868744, "eval_runtime": 116.429, "eval_samples_per_second": 17.178, "eval_steps_per_second": 4.294, "step": 15000 }, { "epoch": 0.08, "learning_rate": 0.0002886408927859705, "loss": 0.0325, "step": 15010 }, { "epoch": 0.08, "learning_rate": 0.00028863332509295646, "loss": 0.0274, "step": 15020 }, { "epoch": 0.08, "learning_rate": 0.00028862575739994244, "loss": 0.0345, "step": 15030 }, { "epoch": 0.08, "learning_rate": 0.0002886181897069284, "loss": 0.0322, "step": 15040 }, { "epoch": 0.08, "learning_rate": 0.00028861062201391446, "loss": 0.0358, "step": 15050 }, { "epoch": 0.08, "learning_rate": 0.00028860305432090044, "loss": 0.0312, "step": 15060 }, { "epoch": 0.08, "learning_rate": 0.0002885954866278864, "loss": 0.0317, "step": 15070 }, { "epoch": 0.08, "learning_rate": 0.0002885879189348724, "loss": 0.0374, "step": 15080 }, { "epoch": 0.08, "learning_rate": 0.0002885803512418584, "loss": 0.0311, "step": 15090 }, { "epoch": 0.08, "learning_rate": 0.00028857278354884437, "loss": 0.0347, "step": 15100 }, { "epoch": 0.08, "learning_rate": 0.0002885652158558304, "loss": 0.0314, "step": 15110 }, { "epoch": 0.08, "learning_rate": 0.0002885576481628164, "loss": 0.0334, "step": 15120 }, { "epoch": 0.08, "learning_rate": 0.00028855008046980236, "loss": 0.0437, "step": 15130 }, { "epoch": 0.08, "learning_rate": 0.00028854251277678835, "loss": 0.0346, "step": 15140 }, { "epoch": 0.08, "learning_rate": 0.00028853494508377433, "loss": 0.0357, "step": 15150 }, { "epoch": 0.08, "learning_rate": 0.0002885273773907603, "loss": 0.0331, "step": 15160 }, { "epoch": 0.08, "learning_rate": 0.00028851980969774634, "loss": 0.0358, "step": 15170 }, { "epoch": 0.08, "learning_rate": 0.0002885122420047323, "loss": 0.0401, "step": 15180 }, { "epoch": 0.08, "learning_rate": 0.0002885046743117183, "loss": 0.0337, "step": 15190 }, { "epoch": 0.08, "learning_rate": 0.0002884971066187043, "loss": 0.0365, "step": 15200 }, { "epoch": 0.08, "learning_rate": 0.00028848953892569027, "loss": 0.0399, "step": 15210 }, { "epoch": 0.08, "learning_rate": 0.00028848197123267625, "loss": 0.0353, "step": 15220 }, { "epoch": 0.08, "learning_rate": 0.00028847440353966223, "loss": 0.0325, "step": 15230 }, { "epoch": 0.08, "learning_rate": 0.00028846683584664827, "loss": 0.0345, "step": 15240 }, { "epoch": 0.08, "learning_rate": 0.00028845926815363425, "loss": 0.0326, "step": 15250 }, { "epoch": 0.08, "learning_rate": 0.00028845170046062023, "loss": 0.0296, "step": 15260 }, { "epoch": 0.08, "learning_rate": 0.0002884441327676062, "loss": 0.033, "step": 15270 }, { "epoch": 0.08, "learning_rate": 0.0002884365650745922, "loss": 0.0354, "step": 15280 }, { "epoch": 0.08, "learning_rate": 0.0002884289973815782, "loss": 0.0502, "step": 15290 }, { "epoch": 0.08, "learning_rate": 0.0002884214296885642, "loss": 0.0442, "step": 15300 }, { "epoch": 0.08, "learning_rate": 0.0002884138619955502, "loss": 0.0323, "step": 15310 }, { "epoch": 0.08, "learning_rate": 0.0002884062943025362, "loss": 0.0361, "step": 15320 }, { "epoch": 0.08, "learning_rate": 0.00028839872660952216, "loss": 0.0331, "step": 15330 }, { "epoch": 0.08, "learning_rate": 0.00028839115891650814, "loss": 0.0325, "step": 15340 }, { "epoch": 0.08, "learning_rate": 0.0002883835912234941, "loss": 0.032, "step": 15350 }, { "epoch": 0.08, "learning_rate": 0.0002883760235304801, "loss": 0.0329, "step": 15360 }, { "epoch": 0.08, "learning_rate": 0.00028836845583746614, "loss": 0.0304, "step": 15370 }, { "epoch": 0.08, "learning_rate": 0.0002883608881444521, "loss": 0.038, "step": 15380 }, { "epoch": 0.08, "learning_rate": 0.0002883533204514381, "loss": 0.0385, "step": 15390 }, { "epoch": 0.08, "learning_rate": 0.0002883457527584241, "loss": 0.0355, "step": 15400 }, { "epoch": 0.08, "learning_rate": 0.00028833818506541006, "loss": 0.0344, "step": 15410 }, { "epoch": 0.08, "learning_rate": 0.00028833061737239604, "loss": 0.0325, "step": 15420 }, { "epoch": 0.08, "learning_rate": 0.0002883230496793821, "loss": 0.0305, "step": 15430 }, { "epoch": 0.08, "learning_rate": 0.00028831548198636806, "loss": 0.0391, "step": 15440 }, { "epoch": 0.08, "learning_rate": 0.00028830791429335404, "loss": 0.0369, "step": 15450 }, { "epoch": 0.08, "learning_rate": 0.00028830034660034, "loss": 0.0324, "step": 15460 }, { "epoch": 0.08, "learning_rate": 0.000288292778907326, "loss": 0.0283, "step": 15470 }, { "epoch": 0.08, "learning_rate": 0.000288285211214312, "loss": 0.0287, "step": 15480 }, { "epoch": 0.08, "learning_rate": 0.000288277643521298, "loss": 0.0327, "step": 15490 }, { "epoch": 0.08, "learning_rate": 0.000288270075828284, "loss": 0.0333, "step": 15500 }, { "epoch": 0.08, "learning_rate": 0.00028826250813527, "loss": 0.0343, "step": 15510 }, { "epoch": 0.08, "learning_rate": 0.00028825494044225597, "loss": 0.0327, "step": 15520 }, { "epoch": 0.08, "learning_rate": 0.00028824737274924195, "loss": 0.0358, "step": 15530 }, { "epoch": 0.08, "learning_rate": 0.00028823980505622793, "loss": 0.0328, "step": 15540 }, { "epoch": 0.08, "learning_rate": 0.0002882322373632139, "loss": 0.0307, "step": 15550 }, { "epoch": 0.08, "learning_rate": 0.00028822466967019995, "loss": 0.032, "step": 15560 }, { "epoch": 0.08, "learning_rate": 0.00028821710197718593, "loss": 0.0351, "step": 15570 }, { "epoch": 0.08, "learning_rate": 0.0002882095342841719, "loss": 0.036, "step": 15580 }, { "epoch": 0.08, "learning_rate": 0.0002882019665911579, "loss": 0.0309, "step": 15590 }, { "epoch": 0.08, "learning_rate": 0.00028819439889814387, "loss": 0.0341, "step": 15600 }, { "epoch": 0.08, "learning_rate": 0.00028818683120512985, "loss": 0.0327, "step": 15610 }, { "epoch": 0.08, "learning_rate": 0.0002881792635121159, "loss": 0.0377, "step": 15620 }, { "epoch": 0.08, "learning_rate": 0.00028817169581910187, "loss": 0.0316, "step": 15630 }, { "epoch": 0.08, "learning_rate": 0.00028816412812608785, "loss": 0.0298, "step": 15640 }, { "epoch": 0.08, "learning_rate": 0.00028815656043307383, "loss": 0.0327, "step": 15650 }, { "epoch": 0.08, "learning_rate": 0.0002881489927400598, "loss": 0.0333, "step": 15660 }, { "epoch": 0.08, "learning_rate": 0.0002881414250470458, "loss": 0.0334, "step": 15670 }, { "epoch": 0.08, "learning_rate": 0.00028813385735403183, "loss": 0.0327, "step": 15680 }, { "epoch": 0.08, "learning_rate": 0.0002881262896610178, "loss": 0.0317, "step": 15690 }, { "epoch": 0.08, "learning_rate": 0.0002881187219680038, "loss": 0.0317, "step": 15700 }, { "epoch": 0.08, "learning_rate": 0.0002881111542749898, "loss": 0.0326, "step": 15710 }, { "epoch": 0.08, "learning_rate": 0.00028810358658197576, "loss": 0.0316, "step": 15720 }, { "epoch": 0.08, "learning_rate": 0.00028809601888896174, "loss": 0.0351, "step": 15730 }, { "epoch": 0.08, "learning_rate": 0.0002880884511959477, "loss": 0.0318, "step": 15740 }, { "epoch": 0.08, "learning_rate": 0.0002880808835029337, "loss": 0.0348, "step": 15750 }, { "epoch": 0.08, "learning_rate": 0.0002880733158099197, "loss": 0.0315, "step": 15760 }, { "epoch": 0.08, "learning_rate": 0.00028806574811690566, "loss": 0.0285, "step": 15770 }, { "epoch": 0.08, "learning_rate": 0.00028805818042389165, "loss": 0.0318, "step": 15780 }, { "epoch": 0.08, "learning_rate": 0.0002880506127308777, "loss": 0.0326, "step": 15790 }, { "epoch": 0.08, "learning_rate": 0.00028804304503786366, "loss": 0.0285, "step": 15800 }, { "epoch": 0.08, "learning_rate": 0.00028803547734484964, "loss": 0.034, "step": 15810 }, { "epoch": 0.08, "learning_rate": 0.0002880279096518356, "loss": 0.0324, "step": 15820 }, { "epoch": 0.08, "learning_rate": 0.0002880203419588216, "loss": 0.0292, "step": 15830 }, { "epoch": 0.08, "learning_rate": 0.0002880127742658076, "loss": 0.0298, "step": 15840 }, { "epoch": 0.08, "learning_rate": 0.0002880052065727936, "loss": 0.0283, "step": 15850 }, { "epoch": 0.08, "learning_rate": 0.0002879976388797796, "loss": 0.0338, "step": 15860 }, { "epoch": 0.08, "learning_rate": 0.0002879900711867656, "loss": 0.0364, "step": 15870 }, { "epoch": 0.08, "learning_rate": 0.00028798250349375157, "loss": 0.028, "step": 15880 }, { "epoch": 0.08, "learning_rate": 0.00028797493580073755, "loss": 0.0322, "step": 15890 }, { "epoch": 0.08, "learning_rate": 0.00028796736810772353, "loss": 0.0321, "step": 15900 }, { "epoch": 0.08, "learning_rate": 0.00028795980041470957, "loss": 0.0291, "step": 15910 }, { "epoch": 0.08, "learning_rate": 0.00028795223272169555, "loss": 0.032, "step": 15920 }, { "epoch": 0.08, "learning_rate": 0.00028794466502868153, "loss": 0.0289, "step": 15930 }, { "epoch": 0.08, "learning_rate": 0.0002879370973356675, "loss": 0.0352, "step": 15940 }, { "epoch": 0.08, "learning_rate": 0.0002879295296426535, "loss": 0.032, "step": 15950 }, { "epoch": 0.08, "learning_rate": 0.0002879219619496395, "loss": 0.0366, "step": 15960 }, { "epoch": 0.08, "learning_rate": 0.00028791439425662546, "loss": 0.0315, "step": 15970 }, { "epoch": 0.08, "learning_rate": 0.0002879068265636115, "loss": 0.0363, "step": 15980 }, { "epoch": 0.08, "learning_rate": 0.0002878992588705975, "loss": 0.0299, "step": 15990 }, { "epoch": 0.08, "learning_rate": 0.00028789169117758345, "loss": 0.0304, "step": 16000 }, { "epoch": 0.08, "eval_cer": 0.9144945158062973, "eval_loss": 0.02421427145600319, "eval_runtime": 116.6835, "eval_samples_per_second": 17.14, "eval_steps_per_second": 4.285, "step": 16000 }, { "epoch": 0.08, "learning_rate": 0.00028788412348456944, "loss": 0.0314, "step": 16010 }, { "epoch": 0.08, "learning_rate": 0.0002878765557915554, "loss": 0.0338, "step": 16020 }, { "epoch": 0.08, "learning_rate": 0.0002878689880985414, "loss": 0.0299, "step": 16030 }, { "epoch": 0.08, "learning_rate": 0.00028786142040552743, "loss": 0.0328, "step": 16040 }, { "epoch": 0.08, "learning_rate": 0.0002878538527125134, "loss": 0.0309, "step": 16050 }, { "epoch": 0.08, "learning_rate": 0.0002878462850194994, "loss": 0.0302, "step": 16060 }, { "epoch": 0.08, "learning_rate": 0.0002878387173264854, "loss": 0.0344, "step": 16070 }, { "epoch": 0.08, "learning_rate": 0.00028783114963347136, "loss": 0.0316, "step": 16080 }, { "epoch": 0.08, "learning_rate": 0.00028782358194045734, "loss": 0.034, "step": 16090 }, { "epoch": 0.08, "learning_rate": 0.0002878160142474433, "loss": 0.0352, "step": 16100 }, { "epoch": 0.08, "learning_rate": 0.00028780844655442936, "loss": 0.0281, "step": 16110 }, { "epoch": 0.08, "learning_rate": 0.00028780087886141534, "loss": 0.0263, "step": 16120 }, { "epoch": 0.08, "learning_rate": 0.0002877933111684013, "loss": 0.0265, "step": 16130 }, { "epoch": 0.08, "learning_rate": 0.0002877857434753873, "loss": 0.0284, "step": 16140 }, { "epoch": 0.08, "learning_rate": 0.0002877781757823733, "loss": 0.0324, "step": 16150 }, { "epoch": 0.08, "learning_rate": 0.00028777060808935927, "loss": 0.0283, "step": 16160 }, { "epoch": 0.08, "learning_rate": 0.0002877630403963453, "loss": 0.033, "step": 16170 }, { "epoch": 0.08, "learning_rate": 0.0002877554727033313, "loss": 0.0318, "step": 16180 }, { "epoch": 0.08, "learning_rate": 0.00028774790501031726, "loss": 0.0317, "step": 16190 }, { "epoch": 0.08, "learning_rate": 0.00028774033731730325, "loss": 0.0316, "step": 16200 }, { "epoch": 0.08, "learning_rate": 0.00028773276962428923, "loss": 0.0288, "step": 16210 }, { "epoch": 0.08, "learning_rate": 0.0002877252019312752, "loss": 0.0331, "step": 16220 }, { "epoch": 0.08, "learning_rate": 0.00028771763423826124, "loss": 0.03, "step": 16230 }, { "epoch": 0.08, "learning_rate": 0.0002877100665452472, "loss": 0.0282, "step": 16240 }, { "epoch": 0.08, "learning_rate": 0.0002877024988522332, "loss": 0.0327, "step": 16250 }, { "epoch": 0.08, "learning_rate": 0.0002876949311592192, "loss": 0.0297, "step": 16260 }, { "epoch": 0.08, "learning_rate": 0.00028768736346620517, "loss": 0.0416, "step": 16270 }, { "epoch": 0.08, "learning_rate": 0.00028767979577319115, "loss": 0.0328, "step": 16280 }, { "epoch": 0.08, "learning_rate": 0.00028767222808017713, "loss": 0.028, "step": 16290 }, { "epoch": 0.08, "learning_rate": 0.00028766466038716317, "loss": 0.0305, "step": 16300 }, { "epoch": 0.08, "learning_rate": 0.00028765709269414915, "loss": 0.0321, "step": 16310 }, { "epoch": 0.08, "learning_rate": 0.00028764952500113513, "loss": 0.0368, "step": 16320 }, { "epoch": 0.08, "learning_rate": 0.0002876419573081211, "loss": 0.0294, "step": 16330 }, { "epoch": 0.08, "learning_rate": 0.0002876343896151071, "loss": 0.028, "step": 16340 }, { "epoch": 0.08, "learning_rate": 0.0002876268219220931, "loss": 0.031, "step": 16350 }, { "epoch": 0.08, "learning_rate": 0.0002876192542290791, "loss": 0.0304, "step": 16360 }, { "epoch": 0.08, "learning_rate": 0.0002876116865360651, "loss": 0.0365, "step": 16370 }, { "epoch": 0.08, "learning_rate": 0.0002876041188430511, "loss": 0.0327, "step": 16380 }, { "epoch": 0.08, "learning_rate": 0.00028759655115003706, "loss": 0.0309, "step": 16390 }, { "epoch": 0.08, "learning_rate": 0.00028758898345702304, "loss": 0.0306, "step": 16400 }, { "epoch": 0.08, "learning_rate": 0.000287581415764009, "loss": 0.0296, "step": 16410 }, { "epoch": 0.08, "learning_rate": 0.000287573848070995, "loss": 0.032, "step": 16420 }, { "epoch": 0.08, "learning_rate": 0.00028756628037798104, "loss": 0.0331, "step": 16430 }, { "epoch": 0.08, "learning_rate": 0.000287558712684967, "loss": 0.0354, "step": 16440 }, { "epoch": 0.08, "learning_rate": 0.000287551144991953, "loss": 0.0395, "step": 16450 }, { "epoch": 0.08, "learning_rate": 0.000287543577298939, "loss": 0.0339, "step": 16460 }, { "epoch": 0.08, "learning_rate": 0.00028753600960592496, "loss": 0.0355, "step": 16470 }, { "epoch": 0.08, "learning_rate": 0.00028752844191291094, "loss": 0.0343, "step": 16480 }, { "epoch": 0.08, "learning_rate": 0.000287520874219897, "loss": 0.0391, "step": 16490 }, { "epoch": 0.08, "learning_rate": 0.00028751330652688296, "loss": 0.0339, "step": 16500 }, { "epoch": 0.08, "learning_rate": 0.00028750573883386894, "loss": 0.0301, "step": 16510 }, { "epoch": 0.08, "learning_rate": 0.0002874981711408549, "loss": 0.0293, "step": 16520 }, { "epoch": 0.08, "learning_rate": 0.0002874906034478409, "loss": 0.03, "step": 16530 }, { "epoch": 0.08, "learning_rate": 0.0002874830357548269, "loss": 0.0332, "step": 16540 }, { "epoch": 0.08, "learning_rate": 0.0002874754680618129, "loss": 0.033, "step": 16550 }, { "epoch": 0.08, "learning_rate": 0.0002874679003687989, "loss": 0.0313, "step": 16560 }, { "epoch": 0.08, "learning_rate": 0.0002874603326757849, "loss": 0.0316, "step": 16570 }, { "epoch": 0.08, "learning_rate": 0.00028745276498277087, "loss": 0.0291, "step": 16580 }, { "epoch": 0.08, "learning_rate": 0.00028744519728975685, "loss": 0.0332, "step": 16590 }, { "epoch": 0.08, "learning_rate": 0.00028743762959674283, "loss": 0.03, "step": 16600 }, { "epoch": 0.08, "learning_rate": 0.0002874300619037288, "loss": 0.0315, "step": 16610 }, { "epoch": 0.08, "learning_rate": 0.00028742249421071485, "loss": 0.0341, "step": 16620 }, { "epoch": 0.08, "learning_rate": 0.00028741492651770083, "loss": 0.0323, "step": 16630 }, { "epoch": 0.08, "learning_rate": 0.0002874073588246868, "loss": 0.0294, "step": 16640 }, { "epoch": 0.08, "learning_rate": 0.0002873997911316728, "loss": 0.0272, "step": 16650 }, { "epoch": 0.08, "learning_rate": 0.00028739222343865877, "loss": 0.0345, "step": 16660 }, { "epoch": 0.08, "learning_rate": 0.00028738465574564475, "loss": 0.0328, "step": 16670 }, { "epoch": 0.08, "learning_rate": 0.0002873770880526308, "loss": 0.0294, "step": 16680 }, { "epoch": 0.08, "learning_rate": 0.00028736952035961677, "loss": 0.0301, "step": 16690 }, { "epoch": 0.08, "learning_rate": 0.00028736195266660275, "loss": 0.0301, "step": 16700 }, { "epoch": 0.08, "learning_rate": 0.00028735438497358873, "loss": 0.0299, "step": 16710 }, { "epoch": 0.08, "learning_rate": 0.0002873468172805747, "loss": 0.0355, "step": 16720 }, { "epoch": 0.08, "learning_rate": 0.0002873392495875607, "loss": 0.0324, "step": 16730 }, { "epoch": 0.08, "learning_rate": 0.00028733168189454673, "loss": 0.0323, "step": 16740 }, { "epoch": 0.08, "learning_rate": 0.0002873241142015327, "loss": 0.0399, "step": 16750 }, { "epoch": 0.08, "learning_rate": 0.0002873165465085187, "loss": 0.034, "step": 16760 }, { "epoch": 0.08, "learning_rate": 0.0002873089788155047, "loss": 0.036, "step": 16770 }, { "epoch": 0.08, "learning_rate": 0.00028730141112249066, "loss": 0.0351, "step": 16780 }, { "epoch": 0.08, "learning_rate": 0.00028729384342947664, "loss": 0.033, "step": 16790 }, { "epoch": 0.08, "learning_rate": 0.0002872862757364626, "loss": 0.0324, "step": 16800 }, { "epoch": 0.08, "learning_rate": 0.00028727870804344866, "loss": 0.0323, "step": 16810 }, { "epoch": 0.08, "learning_rate": 0.00028727114035043464, "loss": 0.0301, "step": 16820 }, { "epoch": 0.08, "learning_rate": 0.0002872635726574206, "loss": 0.0378, "step": 16830 }, { "epoch": 0.08, "learning_rate": 0.0002872560049644066, "loss": 0.0318, "step": 16840 }, { "epoch": 0.09, "learning_rate": 0.0002872484372713926, "loss": 0.0299, "step": 16850 }, { "epoch": 0.09, "learning_rate": 0.00028724086957837856, "loss": 0.0302, "step": 16860 }, { "epoch": 0.09, "learning_rate": 0.0002872333018853646, "loss": 0.0349, "step": 16870 }, { "epoch": 0.09, "learning_rate": 0.0002872257341923506, "loss": 0.0315, "step": 16880 }, { "epoch": 0.09, "learning_rate": 0.00028721816649933656, "loss": 0.0354, "step": 16890 }, { "epoch": 0.09, "learning_rate": 0.00028721059880632254, "loss": 0.0333, "step": 16900 }, { "epoch": 0.09, "learning_rate": 0.0002872030311133085, "loss": 0.0322, "step": 16910 }, { "epoch": 0.09, "learning_rate": 0.0002871954634202945, "loss": 0.0345, "step": 16920 }, { "epoch": 0.09, "learning_rate": 0.0002871878957272805, "loss": 0.0307, "step": 16930 }, { "epoch": 0.09, "learning_rate": 0.0002871803280342665, "loss": 0.032, "step": 16940 }, { "epoch": 0.09, "learning_rate": 0.0002871727603412525, "loss": 0.0293, "step": 16950 }, { "epoch": 0.09, "learning_rate": 0.0002871651926482385, "loss": 0.0304, "step": 16960 }, { "epoch": 0.09, "learning_rate": 0.00028715762495522447, "loss": 0.0278, "step": 16970 }, { "epoch": 0.09, "learning_rate": 0.00028715005726221045, "loss": 0.0296, "step": 16980 }, { "epoch": 0.09, "learning_rate": 0.00028714248956919643, "loss": 0.0333, "step": 16990 }, { "epoch": 0.09, "learning_rate": 0.0002871349218761824, "loss": 0.0302, "step": 17000 }, { "epoch": 0.09, "eval_cer": 0.9145527395738214, "eval_loss": 0.023293539881706238, "eval_runtime": 117.3978, "eval_samples_per_second": 17.036, "eval_steps_per_second": 4.259, "step": 17000 }, { "epoch": 0.09, "learning_rate": 0.0002871273541831684, "loss": 0.0279, "step": 17010 }, { "epoch": 0.09, "learning_rate": 0.0002871197864901544, "loss": 0.0322, "step": 17020 }, { "epoch": 0.09, "learning_rate": 0.00028711221879714036, "loss": 0.0283, "step": 17030 }, { "epoch": 0.09, "learning_rate": 0.0002871046511041264, "loss": 0.0282, "step": 17040 }, { "epoch": 0.09, "learning_rate": 0.0002870970834111124, "loss": 0.0307, "step": 17050 }, { "epoch": 0.09, "learning_rate": 0.00028708951571809836, "loss": 0.0334, "step": 17060 }, { "epoch": 0.09, "learning_rate": 0.00028708194802508434, "loss": 0.0319, "step": 17070 }, { "epoch": 0.09, "learning_rate": 0.0002870743803320703, "loss": 0.0328, "step": 17080 }, { "epoch": 0.09, "learning_rate": 0.0002870668126390563, "loss": 0.027, "step": 17090 }, { "epoch": 0.09, "learning_rate": 0.00028705924494604234, "loss": 0.0343, "step": 17100 }, { "epoch": 0.09, "learning_rate": 0.0002870516772530283, "loss": 0.0314, "step": 17110 }, { "epoch": 0.09, "learning_rate": 0.0002870441095600143, "loss": 0.0286, "step": 17120 }, { "epoch": 0.09, "learning_rate": 0.0002870365418670003, "loss": 0.0317, "step": 17130 }, { "epoch": 0.09, "learning_rate": 0.00028702897417398626, "loss": 0.0329, "step": 17140 }, { "epoch": 0.09, "learning_rate": 0.00028702140648097224, "loss": 0.0308, "step": 17150 }, { "epoch": 0.09, "learning_rate": 0.0002870138387879582, "loss": 0.0304, "step": 17160 }, { "epoch": 0.09, "learning_rate": 0.00028700627109494426, "loss": 0.0315, "step": 17170 }, { "epoch": 0.09, "learning_rate": 0.00028699870340193024, "loss": 0.0325, "step": 17180 }, { "epoch": 0.09, "learning_rate": 0.0002869911357089162, "loss": 0.0328, "step": 17190 }, { "epoch": 0.09, "learning_rate": 0.0002869835680159022, "loss": 0.0369, "step": 17200 }, { "epoch": 0.09, "learning_rate": 0.0002869760003228882, "loss": 0.0303, "step": 17210 }, { "epoch": 0.09, "learning_rate": 0.00028696843262987417, "loss": 0.0252, "step": 17220 }, { "epoch": 0.09, "learning_rate": 0.0002869608649368602, "loss": 0.0312, "step": 17230 }, { "epoch": 0.09, "learning_rate": 0.0002869532972438462, "loss": 0.0317, "step": 17240 }, { "epoch": 0.09, "learning_rate": 0.00028694572955083217, "loss": 0.0286, "step": 17250 }, { "epoch": 0.09, "learning_rate": 0.00028693816185781815, "loss": 0.0246, "step": 17260 }, { "epoch": 0.09, "learning_rate": 0.00028693059416480413, "loss": 0.0347, "step": 17270 }, { "epoch": 0.09, "learning_rate": 0.0002869230264717901, "loss": 0.0277, "step": 17280 }, { "epoch": 0.09, "learning_rate": 0.00028691545877877615, "loss": 0.0274, "step": 17290 }, { "epoch": 0.09, "learning_rate": 0.0002869078910857621, "loss": 0.0322, "step": 17300 }, { "epoch": 0.09, "learning_rate": 0.0002869003233927481, "loss": 0.0295, "step": 17310 }, { "epoch": 0.09, "learning_rate": 0.0002868927556997341, "loss": 0.0297, "step": 17320 }, { "epoch": 0.09, "learning_rate": 0.00028688518800672007, "loss": 0.0277, "step": 17330 }, { "epoch": 0.09, "learning_rate": 0.00028687762031370605, "loss": 0.0328, "step": 17340 }, { "epoch": 0.09, "learning_rate": 0.00028687005262069203, "loss": 0.0314, "step": 17350 }, { "epoch": 0.09, "learning_rate": 0.00028686248492767807, "loss": 0.0325, "step": 17360 }, { "epoch": 0.09, "learning_rate": 0.00028685491723466405, "loss": 0.0294, "step": 17370 }, { "epoch": 0.09, "learning_rate": 0.00028684734954165003, "loss": 0.0308, "step": 17380 }, { "epoch": 0.09, "learning_rate": 0.000286839781848636, "loss": 0.0306, "step": 17390 }, { "epoch": 0.09, "learning_rate": 0.000286832214155622, "loss": 0.0317, "step": 17400 }, { "epoch": 0.09, "learning_rate": 0.000286824646462608, "loss": 0.0297, "step": 17410 }, { "epoch": 0.09, "learning_rate": 0.000286817078769594, "loss": 0.0334, "step": 17420 }, { "epoch": 0.09, "learning_rate": 0.00028680951107658, "loss": 0.0304, "step": 17430 }, { "epoch": 0.09, "learning_rate": 0.000286801943383566, "loss": 0.0283, "step": 17440 }, { "epoch": 0.09, "learning_rate": 0.00028679437569055196, "loss": 0.032, "step": 17450 }, { "epoch": 0.09, "learning_rate": 0.00028678680799753794, "loss": 0.0244, "step": 17460 }, { "epoch": 0.09, "learning_rate": 0.0002867792403045239, "loss": 0.0285, "step": 17470 }, { "epoch": 0.09, "learning_rate": 0.00028677167261150996, "loss": 0.0329, "step": 17480 }, { "epoch": 0.09, "learning_rate": 0.00028676410491849594, "loss": 0.034, "step": 17490 }, { "epoch": 0.09, "learning_rate": 0.0002867565372254819, "loss": 0.0267, "step": 17500 }, { "epoch": 0.09, "learning_rate": 0.0002867489695324679, "loss": 0.0285, "step": 17510 }, { "epoch": 0.09, "learning_rate": 0.0002867414018394539, "loss": 0.0289, "step": 17520 }, { "epoch": 0.09, "learning_rate": 0.00028673383414643986, "loss": 0.0278, "step": 17530 }, { "epoch": 0.09, "learning_rate": 0.00028672626645342584, "loss": 0.035, "step": 17540 }, { "epoch": 0.09, "learning_rate": 0.0002867186987604119, "loss": 0.0308, "step": 17550 }, { "epoch": 0.09, "learning_rate": 0.00028671113106739786, "loss": 0.0327, "step": 17560 }, { "epoch": 0.09, "learning_rate": 0.00028670356337438384, "loss": 0.0316, "step": 17570 }, { "epoch": 0.09, "learning_rate": 0.0002866959956813698, "loss": 0.0309, "step": 17580 }, { "epoch": 0.09, "learning_rate": 0.0002866884279883558, "loss": 0.0327, "step": 17590 }, { "epoch": 0.09, "learning_rate": 0.0002866808602953418, "loss": 0.0384, "step": 17600 }, { "epoch": 0.09, "learning_rate": 0.0002866732926023278, "loss": 0.0315, "step": 17610 }, { "epoch": 0.09, "learning_rate": 0.0002866657249093138, "loss": 0.0297, "step": 17620 }, { "epoch": 0.09, "learning_rate": 0.0002866581572162998, "loss": 0.0297, "step": 17630 }, { "epoch": 0.09, "learning_rate": 0.00028665058952328577, "loss": 0.0306, "step": 17640 }, { "epoch": 0.09, "learning_rate": 0.00028664302183027175, "loss": 0.0346, "step": 17650 }, { "epoch": 0.09, "learning_rate": 0.00028663545413725773, "loss": 0.0285, "step": 17660 }, { "epoch": 0.09, "learning_rate": 0.0002866278864442437, "loss": 0.0316, "step": 17670 }, { "epoch": 0.09, "learning_rate": 0.00028662031875122975, "loss": 0.0325, "step": 17680 }, { "epoch": 0.09, "learning_rate": 0.00028661275105821573, "loss": 0.0299, "step": 17690 }, { "epoch": 0.09, "learning_rate": 0.0002866051833652017, "loss": 0.0311, "step": 17700 }, { "epoch": 0.09, "learning_rate": 0.0002865976156721877, "loss": 0.0324, "step": 17710 }, { "epoch": 0.09, "learning_rate": 0.00028659004797917367, "loss": 0.0285, "step": 17720 }, { "epoch": 0.09, "learning_rate": 0.00028658248028615965, "loss": 0.0352, "step": 17730 }, { "epoch": 0.09, "learning_rate": 0.0002865749125931457, "loss": 0.0326, "step": 17740 }, { "epoch": 0.09, "learning_rate": 0.00028656734490013167, "loss": 0.0296, "step": 17750 }, { "epoch": 0.09, "learning_rate": 0.00028655977720711765, "loss": 0.0295, "step": 17760 }, { "epoch": 0.09, "learning_rate": 0.00028655220951410363, "loss": 0.0297, "step": 17770 }, { "epoch": 0.09, "learning_rate": 0.0002865446418210896, "loss": 0.0272, "step": 17780 }, { "epoch": 0.09, "learning_rate": 0.0002865370741280756, "loss": 0.0346, "step": 17790 }, { "epoch": 0.09, "learning_rate": 0.00028652950643506163, "loss": 0.0318, "step": 17800 }, { "epoch": 0.09, "learning_rate": 0.0002865219387420476, "loss": 0.0374, "step": 17810 }, { "epoch": 0.09, "learning_rate": 0.0002865143710490336, "loss": 0.0299, "step": 17820 }, { "epoch": 0.09, "learning_rate": 0.0002865068033560196, "loss": 0.0341, "step": 17830 }, { "epoch": 0.09, "learning_rate": 0.00028649923566300556, "loss": 0.0345, "step": 17840 }, { "epoch": 0.09, "learning_rate": 0.00028649166796999154, "loss": 0.0286, "step": 17850 }, { "epoch": 0.09, "learning_rate": 0.0002864841002769775, "loss": 0.0388, "step": 17860 }, { "epoch": 0.09, "learning_rate": 0.00028647653258396356, "loss": 0.0298, "step": 17870 }, { "epoch": 0.09, "learning_rate": 0.00028646896489094954, "loss": 0.0301, "step": 17880 }, { "epoch": 0.09, "learning_rate": 0.0002864613971979355, "loss": 0.0287, "step": 17890 }, { "epoch": 0.09, "learning_rate": 0.0002864538295049215, "loss": 0.0287, "step": 17900 }, { "epoch": 0.09, "learning_rate": 0.0002864462618119075, "loss": 0.0306, "step": 17910 }, { "epoch": 0.09, "learning_rate": 0.00028643869411889346, "loss": 0.035, "step": 17920 }, { "epoch": 0.09, "learning_rate": 0.0002864311264258795, "loss": 0.033, "step": 17930 }, { "epoch": 0.09, "learning_rate": 0.0002864235587328655, "loss": 0.0329, "step": 17940 }, { "epoch": 0.09, "learning_rate": 0.00028641599103985146, "loss": 0.0307, "step": 17950 }, { "epoch": 0.09, "learning_rate": 0.00028640842334683744, "loss": 0.0367, "step": 17960 }, { "epoch": 0.09, "learning_rate": 0.0002864008556538234, "loss": 0.0327, "step": 17970 }, { "epoch": 0.09, "learning_rate": 0.0002863932879608094, "loss": 0.032, "step": 17980 }, { "epoch": 0.09, "learning_rate": 0.00028638572026779544, "loss": 0.0309, "step": 17990 }, { "epoch": 0.09, "learning_rate": 0.0002863781525747814, "loss": 0.03, "step": 18000 }, { "epoch": 0.09, "eval_cer": 0.9144838414489178, "eval_loss": 0.022705839946866035, "eval_runtime": 117.5421, "eval_samples_per_second": 17.015, "eval_steps_per_second": 4.254, "step": 18000 }, { "epoch": 0.09, "learning_rate": 0.0002863705848817674, "loss": 0.0372, "step": 18010 }, { "epoch": 0.09, "learning_rate": 0.0002863630171887534, "loss": 0.0282, "step": 18020 }, { "epoch": 0.09, "learning_rate": 0.00028635544949573937, "loss": 0.0285, "step": 18030 }, { "epoch": 0.09, "learning_rate": 0.00028634788180272535, "loss": 0.0286, "step": 18040 }, { "epoch": 0.09, "learning_rate": 0.00028634031410971133, "loss": 0.0281, "step": 18050 }, { "epoch": 0.09, "learning_rate": 0.00028633274641669737, "loss": 0.0328, "step": 18060 }, { "epoch": 0.09, "learning_rate": 0.00028632517872368335, "loss": 0.0322, "step": 18070 }, { "epoch": 0.09, "learning_rate": 0.00028631761103066933, "loss": 0.0291, "step": 18080 }, { "epoch": 0.09, "learning_rate": 0.0002863100433376553, "loss": 0.0304, "step": 18090 }, { "epoch": 0.09, "learning_rate": 0.0002863024756446413, "loss": 0.0311, "step": 18100 }, { "epoch": 0.09, "learning_rate": 0.0002862949079516273, "loss": 0.0275, "step": 18110 }, { "epoch": 0.09, "learning_rate": 0.0002862873402586133, "loss": 0.0325, "step": 18120 }, { "epoch": 0.09, "learning_rate": 0.0002862797725655993, "loss": 0.0323, "step": 18130 }, { "epoch": 0.09, "learning_rate": 0.00028627220487258527, "loss": 0.0348, "step": 18140 }, { "epoch": 0.09, "learning_rate": 0.00028626463717957125, "loss": 0.0337, "step": 18150 }, { "epoch": 0.09, "learning_rate": 0.00028625706948655724, "loss": 0.0313, "step": 18160 }, { "epoch": 0.09, "learning_rate": 0.0002862495017935432, "loss": 0.039, "step": 18170 }, { "epoch": 0.09, "learning_rate": 0.0002862419341005292, "loss": 0.0294, "step": 18180 }, { "epoch": 0.09, "learning_rate": 0.00028623436640751523, "loss": 0.0348, "step": 18190 }, { "epoch": 0.09, "learning_rate": 0.0002862267987145012, "loss": 0.0318, "step": 18200 }, { "epoch": 0.09, "learning_rate": 0.0002862192310214872, "loss": 0.0327, "step": 18210 }, { "epoch": 0.09, "learning_rate": 0.0002862116633284732, "loss": 0.0282, "step": 18220 }, { "epoch": 0.09, "learning_rate": 0.00028620409563545916, "loss": 0.025, "step": 18230 }, { "epoch": 0.09, "learning_rate": 0.00028619652794244514, "loss": 0.0287, "step": 18240 }, { "epoch": 0.09, "learning_rate": 0.0002861889602494311, "loss": 0.0319, "step": 18250 }, { "epoch": 0.09, "learning_rate": 0.0002861813925564171, "loss": 0.0291, "step": 18260 }, { "epoch": 0.09, "learning_rate": 0.0002861738248634031, "loss": 0.0253, "step": 18270 }, { "epoch": 0.09, "learning_rate": 0.00028616625717038907, "loss": 0.0311, "step": 18280 }, { "epoch": 0.09, "learning_rate": 0.0002861586894773751, "loss": 0.0287, "step": 18290 }, { "epoch": 0.09, "learning_rate": 0.0002861511217843611, "loss": 0.0257, "step": 18300 }, { "epoch": 0.09, "learning_rate": 0.00028614355409134707, "loss": 0.0315, "step": 18310 }, { "epoch": 0.09, "learning_rate": 0.00028613598639833305, "loss": 0.0318, "step": 18320 }, { "epoch": 0.09, "learning_rate": 0.00028612841870531903, "loss": 0.0262, "step": 18330 }, { "epoch": 0.09, "learning_rate": 0.000286120851012305, "loss": 0.0273, "step": 18340 }, { "epoch": 0.09, "learning_rate": 0.00028611328331929105, "loss": 0.0336, "step": 18350 }, { "epoch": 0.09, "learning_rate": 0.000286105715626277, "loss": 0.0279, "step": 18360 }, { "epoch": 0.09, "learning_rate": 0.000286098147933263, "loss": 0.0287, "step": 18370 }, { "epoch": 0.09, "learning_rate": 0.000286090580240249, "loss": 0.036, "step": 18380 }, { "epoch": 0.09, "learning_rate": 0.00028608301254723497, "loss": 0.0276, "step": 18390 }, { "epoch": 0.09, "learning_rate": 0.00028607544485422095, "loss": 0.0329, "step": 18400 }, { "epoch": 0.09, "learning_rate": 0.00028606787716120693, "loss": 0.0358, "step": 18410 }, { "epoch": 0.09, "learning_rate": 0.00028606030946819297, "loss": 0.0325, "step": 18420 }, { "epoch": 0.09, "learning_rate": 0.00028605274177517895, "loss": 0.0329, "step": 18430 }, { "epoch": 0.09, "learning_rate": 0.00028604517408216493, "loss": 0.0289, "step": 18440 }, { "epoch": 0.09, "learning_rate": 0.0002860376063891509, "loss": 0.0284, "step": 18450 }, { "epoch": 0.09, "learning_rate": 0.0002860300386961369, "loss": 0.0318, "step": 18460 }, { "epoch": 0.09, "learning_rate": 0.0002860224710031229, "loss": 0.0249, "step": 18470 }, { "epoch": 0.09, "learning_rate": 0.0002860149033101089, "loss": 0.0263, "step": 18480 }, { "epoch": 0.09, "learning_rate": 0.0002860073356170949, "loss": 0.0298, "step": 18490 }, { "epoch": 0.09, "learning_rate": 0.0002859997679240809, "loss": 0.0277, "step": 18500 }, { "epoch": 0.09, "learning_rate": 0.00028599220023106686, "loss": 0.0284, "step": 18510 }, { "epoch": 0.09, "learning_rate": 0.00028598463253805284, "loss": 0.0301, "step": 18520 }, { "epoch": 0.09, "learning_rate": 0.0002859770648450388, "loss": 0.0301, "step": 18530 }, { "epoch": 0.09, "learning_rate": 0.00028596949715202486, "loss": 0.0339, "step": 18540 }, { "epoch": 0.09, "learning_rate": 0.00028596192945901084, "loss": 0.0324, "step": 18550 }, { "epoch": 0.09, "learning_rate": 0.0002859543617659968, "loss": 0.0304, "step": 18560 }, { "epoch": 0.09, "learning_rate": 0.0002859467940729828, "loss": 0.031, "step": 18570 }, { "epoch": 0.09, "learning_rate": 0.0002859392263799688, "loss": 0.0351, "step": 18580 }, { "epoch": 0.09, "learning_rate": 0.00028593165868695476, "loss": 0.0335, "step": 18590 }, { "epoch": 0.09, "learning_rate": 0.00028592409099394074, "loss": 0.0335, "step": 18600 }, { "epoch": 0.09, "learning_rate": 0.0002859165233009268, "loss": 0.0265, "step": 18610 }, { "epoch": 0.09, "learning_rate": 0.00028590895560791276, "loss": 0.0344, "step": 18620 }, { "epoch": 0.09, "learning_rate": 0.00028590138791489874, "loss": 0.0333, "step": 18630 }, { "epoch": 0.09, "learning_rate": 0.0002858938202218847, "loss": 0.0277, "step": 18640 }, { "epoch": 0.09, "learning_rate": 0.0002858862525288707, "loss": 0.0324, "step": 18650 }, { "epoch": 0.09, "learning_rate": 0.0002858786848358567, "loss": 0.0307, "step": 18660 }, { "epoch": 0.09, "learning_rate": 0.0002858711171428427, "loss": 0.0319, "step": 18670 }, { "epoch": 0.09, "learning_rate": 0.0002858635494498287, "loss": 0.0381, "step": 18680 }, { "epoch": 0.09, "learning_rate": 0.0002858559817568147, "loss": 0.0307, "step": 18690 }, { "epoch": 0.09, "learning_rate": 0.00028584841406380067, "loss": 0.0364, "step": 18700 }, { "epoch": 0.09, "learning_rate": 0.00028584084637078665, "loss": 0.034, "step": 18710 }, { "epoch": 0.09, "learning_rate": 0.00028583327867777263, "loss": 0.0288, "step": 18720 }, { "epoch": 0.09, "learning_rate": 0.0002858257109847586, "loss": 0.0339, "step": 18730 }, { "epoch": 0.09, "learning_rate": 0.00028581814329174465, "loss": 0.0319, "step": 18740 }, { "epoch": 0.09, "learning_rate": 0.00028581057559873063, "loss": 0.0273, "step": 18750 }, { "epoch": 0.09, "learning_rate": 0.0002858030079057166, "loss": 0.0301, "step": 18760 }, { "epoch": 0.09, "learning_rate": 0.0002857954402127026, "loss": 0.0277, "step": 18770 }, { "epoch": 0.09, "learning_rate": 0.00028578787251968857, "loss": 0.0278, "step": 18780 }, { "epoch": 0.09, "learning_rate": 0.00028578030482667455, "loss": 0.0277, "step": 18790 }, { "epoch": 0.09, "learning_rate": 0.0002857727371336606, "loss": 0.0293, "step": 18800 }, { "epoch": 0.09, "learning_rate": 0.00028576516944064657, "loss": 0.029, "step": 18810 }, { "epoch": 0.09, "learning_rate": 0.00028575760174763255, "loss": 0.0273, "step": 18820 }, { "epoch": 0.09, "learning_rate": 0.00028575003405461853, "loss": 0.0286, "step": 18830 }, { "epoch": 0.1, "learning_rate": 0.0002857424663616045, "loss": 0.0345, "step": 18840 }, { "epoch": 0.1, "learning_rate": 0.0002857348986685905, "loss": 0.0305, "step": 18850 }, { "epoch": 0.1, "learning_rate": 0.00028572733097557653, "loss": 0.0274, "step": 18860 }, { "epoch": 0.1, "learning_rate": 0.0002857197632825625, "loss": 0.0319, "step": 18870 }, { "epoch": 0.1, "learning_rate": 0.0002857121955895485, "loss": 0.0284, "step": 18880 }, { "epoch": 0.1, "learning_rate": 0.0002857046278965345, "loss": 0.0303, "step": 18890 }, { "epoch": 0.1, "learning_rate": 0.00028569706020352046, "loss": 0.0354, "step": 18900 }, { "epoch": 0.1, "learning_rate": 0.00028568949251050644, "loss": 0.0368, "step": 18910 }, { "epoch": 0.1, "learning_rate": 0.0002856819248174924, "loss": 0.0355, "step": 18920 }, { "epoch": 0.1, "learning_rate": 0.00028567435712447846, "loss": 0.0382, "step": 18930 }, { "epoch": 0.1, "learning_rate": 0.00028566678943146444, "loss": 0.0309, "step": 18940 }, { "epoch": 0.1, "learning_rate": 0.0002856592217384504, "loss": 0.0295, "step": 18950 }, { "epoch": 0.1, "learning_rate": 0.0002856516540454364, "loss": 0.0314, "step": 18960 }, { "epoch": 0.1, "learning_rate": 0.0002856440863524224, "loss": 0.033, "step": 18970 }, { "epoch": 0.1, "learning_rate": 0.00028563651865940836, "loss": 0.0307, "step": 18980 }, { "epoch": 0.1, "learning_rate": 0.0002856289509663944, "loss": 0.0315, "step": 18990 }, { "epoch": 0.1, "learning_rate": 0.0002856213832733804, "loss": 0.0316, "step": 19000 }, { "epoch": 0.1, "eval_cer": 0.9144974269946735, "eval_loss": 0.022285686805844307, "eval_runtime": 117.4593, "eval_samples_per_second": 17.027, "eval_steps_per_second": 4.257, "step": 19000 }, { "epoch": 0.1, "learning_rate": 0.00028561381558036636, "loss": 0.0299, "step": 19010 }, { "epoch": 0.1, "learning_rate": 0.00028560624788735234, "loss": 0.0285, "step": 19020 }, { "epoch": 0.1, "learning_rate": 0.0002855986801943383, "loss": 0.0294, "step": 19030 }, { "epoch": 0.1, "learning_rate": 0.0002855911125013243, "loss": 0.0314, "step": 19040 }, { "epoch": 0.1, "learning_rate": 0.00028558354480831034, "loss": 0.0298, "step": 19050 }, { "epoch": 0.1, "learning_rate": 0.0002855759771152963, "loss": 0.0323, "step": 19060 }, { "epoch": 0.1, "learning_rate": 0.0002855684094222823, "loss": 0.031, "step": 19070 }, { "epoch": 0.1, "learning_rate": 0.0002855608417292683, "loss": 0.0292, "step": 19080 }, { "epoch": 0.1, "learning_rate": 0.00028555327403625427, "loss": 0.0276, "step": 19090 }, { "epoch": 0.1, "learning_rate": 0.00028554570634324025, "loss": 0.0284, "step": 19100 }, { "epoch": 0.1, "learning_rate": 0.00028553813865022623, "loss": 0.0268, "step": 19110 }, { "epoch": 0.1, "learning_rate": 0.00028553057095721227, "loss": 0.0259, "step": 19120 }, { "epoch": 0.1, "learning_rate": 0.00028552300326419825, "loss": 0.0297, "step": 19130 }, { "epoch": 0.1, "learning_rate": 0.00028551543557118423, "loss": 0.0303, "step": 19140 }, { "epoch": 0.1, "learning_rate": 0.0002855078678781702, "loss": 0.0296, "step": 19150 }, { "epoch": 0.1, "learning_rate": 0.0002855003001851562, "loss": 0.028, "step": 19160 }, { "epoch": 0.1, "learning_rate": 0.0002854927324921422, "loss": 0.0298, "step": 19170 }, { "epoch": 0.1, "learning_rate": 0.0002854851647991282, "loss": 0.0316, "step": 19180 }, { "epoch": 0.1, "learning_rate": 0.0002854775971061142, "loss": 0.0261, "step": 19190 }, { "epoch": 0.1, "learning_rate": 0.00028547002941310017, "loss": 0.03, "step": 19200 }, { "epoch": 0.1, "learning_rate": 0.00028546246172008615, "loss": 0.035, "step": 19210 }, { "epoch": 0.1, "learning_rate": 0.00028545489402707214, "loss": 0.0365, "step": 19220 }, { "epoch": 0.1, "learning_rate": 0.0002854473263340581, "loss": 0.0318, "step": 19230 }, { "epoch": 0.1, "learning_rate": 0.0002854397586410441, "loss": 0.0317, "step": 19240 }, { "epoch": 0.1, "learning_rate": 0.00028543219094803013, "loss": 0.0303, "step": 19250 }, { "epoch": 0.1, "learning_rate": 0.0002854246232550161, "loss": 0.0304, "step": 19260 }, { "epoch": 0.1, "learning_rate": 0.0002854170555620021, "loss": 0.0328, "step": 19270 }, { "epoch": 0.1, "learning_rate": 0.0002854094878689881, "loss": 0.0278, "step": 19280 }, { "epoch": 0.1, "learning_rate": 0.00028540192017597406, "loss": 0.0338, "step": 19290 }, { "epoch": 0.1, "learning_rate": 0.00028539435248296004, "loss": 0.0286, "step": 19300 }, { "epoch": 0.1, "learning_rate": 0.0002853867847899461, "loss": 0.0311, "step": 19310 }, { "epoch": 0.1, "learning_rate": 0.00028537921709693206, "loss": 0.0334, "step": 19320 }, { "epoch": 0.1, "learning_rate": 0.00028537164940391804, "loss": 0.0312, "step": 19330 }, { "epoch": 0.1, "learning_rate": 0.000285364081710904, "loss": 0.03, "step": 19340 }, { "epoch": 0.1, "learning_rate": 0.00028535651401789, "loss": 0.0294, "step": 19350 }, { "epoch": 0.1, "learning_rate": 0.000285348946324876, "loss": 0.027, "step": 19360 }, { "epoch": 0.1, "learning_rate": 0.000285341378631862, "loss": 0.0306, "step": 19370 }, { "epoch": 0.1, "learning_rate": 0.000285333810938848, "loss": 0.0287, "step": 19380 }, { "epoch": 0.1, "learning_rate": 0.000285326243245834, "loss": 0.0291, "step": 19390 }, { "epoch": 0.1, "learning_rate": 0.00028531867555281996, "loss": 0.0293, "step": 19400 }, { "epoch": 0.1, "learning_rate": 0.00028531110785980595, "loss": 0.0271, "step": 19410 }, { "epoch": 0.1, "learning_rate": 0.0002853035401667919, "loss": 0.0244, "step": 19420 }, { "epoch": 0.1, "learning_rate": 0.0002852959724737779, "loss": 0.026, "step": 19430 }, { "epoch": 0.1, "learning_rate": 0.00028528840478076394, "loss": 0.0297, "step": 19440 }, { "epoch": 0.1, "learning_rate": 0.0002852808370877499, "loss": 0.0319, "step": 19450 }, { "epoch": 0.1, "learning_rate": 0.0002852732693947359, "loss": 0.0329, "step": 19460 }, { "epoch": 0.1, "learning_rate": 0.0002852657017017219, "loss": 0.027, "step": 19470 }, { "epoch": 0.1, "learning_rate": 0.00028525813400870787, "loss": 0.0247, "step": 19480 }, { "epoch": 0.1, "learning_rate": 0.00028525056631569385, "loss": 0.0297, "step": 19490 }, { "epoch": 0.1, "learning_rate": 0.00028524299862267983, "loss": 0.0291, "step": 19500 }, { "epoch": 0.1, "learning_rate": 0.0002852354309296658, "loss": 0.0279, "step": 19510 }, { "epoch": 0.1, "learning_rate": 0.0002852278632366518, "loss": 0.0299, "step": 19520 }, { "epoch": 0.1, "learning_rate": 0.0002852202955436378, "loss": 0.0304, "step": 19530 }, { "epoch": 0.1, "learning_rate": 0.0002852127278506238, "loss": 0.0317, "step": 19540 }, { "epoch": 0.1, "learning_rate": 0.0002852051601576098, "loss": 0.0305, "step": 19550 }, { "epoch": 0.1, "learning_rate": 0.0002851975924645958, "loss": 0.027, "step": 19560 }, { "epoch": 0.1, "learning_rate": 0.00028519002477158176, "loss": 0.0297, "step": 19570 }, { "epoch": 0.1, "learning_rate": 0.00028518245707856774, "loss": 0.028, "step": 19580 }, { "epoch": 0.1, "learning_rate": 0.0002851748893855537, "loss": 0.028, "step": 19590 }, { "epoch": 0.1, "learning_rate": 0.00028516732169253976, "loss": 0.032, "step": 19600 }, { "epoch": 0.1, "learning_rate": 0.00028515975399952574, "loss": 0.0251, "step": 19610 }, { "epoch": 0.1, "learning_rate": 0.0002851521863065117, "loss": 0.0283, "step": 19620 }, { "epoch": 0.1, "learning_rate": 0.0002851446186134977, "loss": 0.0369, "step": 19630 }, { "epoch": 0.1, "learning_rate": 0.0002851370509204837, "loss": 0.0311, "step": 19640 }, { "epoch": 0.1, "learning_rate": 0.00028512948322746966, "loss": 0.0303, "step": 19650 }, { "epoch": 0.1, "learning_rate": 0.00028512191553445564, "loss": 0.0286, "step": 19660 }, { "epoch": 0.1, "learning_rate": 0.0002851143478414417, "loss": 0.0365, "step": 19670 }, { "epoch": 0.1, "learning_rate": 0.00028510678014842766, "loss": 0.0292, "step": 19680 }, { "epoch": 0.1, "learning_rate": 0.00028509921245541364, "loss": 0.0282, "step": 19690 }, { "epoch": 0.1, "learning_rate": 0.0002850916447623996, "loss": 0.0279, "step": 19700 }, { "epoch": 0.1, "learning_rate": 0.0002850840770693856, "loss": 0.0292, "step": 19710 }, { "epoch": 0.1, "learning_rate": 0.0002850765093763716, "loss": 0.0304, "step": 19720 }, { "epoch": 0.1, "learning_rate": 0.0002850689416833576, "loss": 0.0246, "step": 19730 }, { "epoch": 0.1, "learning_rate": 0.0002850613739903436, "loss": 0.0289, "step": 19740 }, { "epoch": 0.1, "learning_rate": 0.0002850538062973296, "loss": 0.0257, "step": 19750 }, { "epoch": 0.1, "learning_rate": 0.00028504623860431557, "loss": 0.0324, "step": 19760 }, { "epoch": 0.1, "learning_rate": 0.00028503867091130155, "loss": 0.0291, "step": 19770 }, { "epoch": 0.1, "learning_rate": 0.00028503110321828753, "loss": 0.0306, "step": 19780 }, { "epoch": 0.1, "learning_rate": 0.00028502353552527357, "loss": 0.0287, "step": 19790 }, { "epoch": 0.1, "learning_rate": 0.00028501596783225955, "loss": 0.0239, "step": 19800 }, { "epoch": 0.1, "learning_rate": 0.00028500840013924553, "loss": 0.0271, "step": 19810 }, { "epoch": 0.1, "learning_rate": 0.0002850008324462315, "loss": 0.0309, "step": 19820 }, { "epoch": 0.1, "learning_rate": 0.0002849932647532175, "loss": 0.0273, "step": 19830 }, { "epoch": 0.1, "learning_rate": 0.0002849856970602035, "loss": 0.0309, "step": 19840 }, { "epoch": 0.1, "learning_rate": 0.00028497812936718945, "loss": 0.0265, "step": 19850 }, { "epoch": 0.1, "learning_rate": 0.0002849705616741755, "loss": 0.0284, "step": 19860 }, { "epoch": 0.1, "learning_rate": 0.00028496299398116147, "loss": 0.0309, "step": 19870 }, { "epoch": 0.1, "learning_rate": 0.00028495542628814745, "loss": 0.0278, "step": 19880 }, { "epoch": 0.1, "learning_rate": 0.00028494785859513343, "loss": 0.0259, "step": 19890 }, { "epoch": 0.1, "learning_rate": 0.0002849402909021194, "loss": 0.0321, "step": 19900 }, { "epoch": 0.1, "learning_rate": 0.0002849327232091054, "loss": 0.0266, "step": 19910 }, { "epoch": 0.1, "learning_rate": 0.00028492515551609143, "loss": 0.0298, "step": 19920 }, { "epoch": 0.1, "learning_rate": 0.0002849175878230774, "loss": 0.0257, "step": 19930 }, { "epoch": 0.1, "learning_rate": 0.0002849100201300634, "loss": 0.0303, "step": 19940 }, { "epoch": 0.1, "learning_rate": 0.0002849024524370494, "loss": 0.0253, "step": 19950 }, { "epoch": 0.1, "learning_rate": 0.00028489488474403536, "loss": 0.0291, "step": 19960 }, { "epoch": 0.1, "learning_rate": 0.00028488731705102134, "loss": 0.0324, "step": 19970 }, { "epoch": 0.1, "learning_rate": 0.0002848797493580073, "loss": 0.0314, "step": 19980 }, { "epoch": 0.1, "learning_rate": 0.00028487218166499336, "loss": 0.0295, "step": 19990 }, { "epoch": 0.1, "learning_rate": 0.00028486461397197934, "loss": 0.0302, "step": 20000 }, { "epoch": 0.1, "eval_cer": 0.9145546803660722, "eval_loss": 0.023069359362125397, "eval_runtime": 117.5456, "eval_samples_per_second": 17.015, "eval_steps_per_second": 4.254, "step": 20000 }, { "epoch": 0.1, "learning_rate": 0.0002848570462789653, "loss": 0.0283, "step": 20010 }, { "epoch": 0.1, "learning_rate": 0.0002848494785859513, "loss": 0.0321, "step": 20020 }, { "epoch": 0.1, "learning_rate": 0.0002848419108929373, "loss": 0.0329, "step": 20030 }, { "epoch": 0.1, "learning_rate": 0.00028483434319992326, "loss": 0.0282, "step": 20040 }, { "epoch": 0.1, "learning_rate": 0.0002848267755069093, "loss": 0.0307, "step": 20050 }, { "epoch": 0.1, "learning_rate": 0.0002848192078138953, "loss": 0.0305, "step": 20060 }, { "epoch": 0.1, "learning_rate": 0.00028481164012088126, "loss": 0.0291, "step": 20070 }, { "epoch": 0.1, "learning_rate": 0.00028480407242786724, "loss": 0.0331, "step": 20080 }, { "epoch": 0.1, "learning_rate": 0.0002847965047348532, "loss": 0.0245, "step": 20090 }, { "epoch": 0.1, "learning_rate": 0.0002847889370418392, "loss": 0.0304, "step": 20100 }, { "epoch": 0.1, "learning_rate": 0.00028478136934882524, "loss": 0.0276, "step": 20110 }, { "epoch": 0.1, "learning_rate": 0.0002847738016558112, "loss": 0.023, "step": 20120 }, { "epoch": 0.1, "learning_rate": 0.0002847662339627972, "loss": 0.0354, "step": 20130 }, { "epoch": 0.1, "learning_rate": 0.0002847586662697832, "loss": 0.0302, "step": 20140 }, { "epoch": 0.1, "learning_rate": 0.00028475109857676917, "loss": 0.0276, "step": 20150 }, { "epoch": 0.1, "learning_rate": 0.00028474353088375515, "loss": 0.0319, "step": 20160 }, { "epoch": 0.1, "learning_rate": 0.00028473596319074113, "loss": 0.0318, "step": 20170 }, { "epoch": 0.1, "learning_rate": 0.00028472839549772717, "loss": 0.0328, "step": 20180 }, { "epoch": 0.1, "learning_rate": 0.00028472082780471315, "loss": 0.0325, "step": 20190 }, { "epoch": 0.1, "learning_rate": 0.00028471326011169913, "loss": 0.0266, "step": 20200 }, { "epoch": 0.1, "learning_rate": 0.0002847056924186851, "loss": 0.0299, "step": 20210 }, { "epoch": 0.1, "learning_rate": 0.0002846981247256711, "loss": 0.032, "step": 20220 }, { "epoch": 0.1, "learning_rate": 0.0002846905570326571, "loss": 0.0276, "step": 20230 }, { "epoch": 0.1, "learning_rate": 0.0002846829893396431, "loss": 0.0329, "step": 20240 }, { "epoch": 0.1, "learning_rate": 0.0002846754216466291, "loss": 0.034, "step": 20250 }, { "epoch": 0.1, "learning_rate": 0.0002846678539536151, "loss": 0.0277, "step": 20260 }, { "epoch": 0.1, "learning_rate": 0.00028466028626060105, "loss": 0.0356, "step": 20270 }, { "epoch": 0.1, "learning_rate": 0.00028465271856758704, "loss": 0.0342, "step": 20280 }, { "epoch": 0.1, "learning_rate": 0.000284645150874573, "loss": 0.0367, "step": 20290 }, { "epoch": 0.1, "learning_rate": 0.000284637583181559, "loss": 0.0308, "step": 20300 }, { "epoch": 0.1, "learning_rate": 0.00028463001548854503, "loss": 0.0358, "step": 20310 }, { "epoch": 0.1, "learning_rate": 0.000284622447795531, "loss": 0.0264, "step": 20320 }, { "epoch": 0.1, "learning_rate": 0.000284614880102517, "loss": 0.0355, "step": 20330 }, { "epoch": 0.1, "learning_rate": 0.000284607312409503, "loss": 0.0305, "step": 20340 }, { "epoch": 0.1, "learning_rate": 0.00028459974471648896, "loss": 0.0311, "step": 20350 }, { "epoch": 0.1, "learning_rate": 0.00028459217702347494, "loss": 0.0282, "step": 20360 }, { "epoch": 0.1, "learning_rate": 0.000284584609330461, "loss": 0.0418, "step": 20370 }, { "epoch": 0.1, "learning_rate": 0.00028457704163744696, "loss": 0.0341, "step": 20380 }, { "epoch": 0.1, "learning_rate": 0.00028456947394443294, "loss": 0.0329, "step": 20390 }, { "epoch": 0.1, "learning_rate": 0.0002845619062514189, "loss": 0.0361, "step": 20400 }, { "epoch": 0.1, "learning_rate": 0.0002845543385584049, "loss": 0.0252, "step": 20410 }, { "epoch": 0.1, "learning_rate": 0.0002845467708653909, "loss": 0.0322, "step": 20420 }, { "epoch": 0.1, "learning_rate": 0.0002845392031723769, "loss": 0.0348, "step": 20430 }, { "epoch": 0.1, "learning_rate": 0.0002845316354793629, "loss": 0.0338, "step": 20440 }, { "epoch": 0.1, "learning_rate": 0.0002845240677863489, "loss": 0.0335, "step": 20450 }, { "epoch": 0.1, "learning_rate": 0.00028451650009333486, "loss": 0.0374, "step": 20460 }, { "epoch": 0.1, "learning_rate": 0.00028450893240032085, "loss": 0.0308, "step": 20470 }, { "epoch": 0.1, "learning_rate": 0.00028450136470730683, "loss": 0.0306, "step": 20480 }, { "epoch": 0.1, "learning_rate": 0.0002844937970142928, "loss": 0.0352, "step": 20490 }, { "epoch": 0.1, "learning_rate": 0.00028448622932127884, "loss": 0.0332, "step": 20500 }, { "epoch": 0.1, "learning_rate": 0.0002844786616282648, "loss": 0.0285, "step": 20510 }, { "epoch": 0.1, "learning_rate": 0.0002844710939352508, "loss": 0.0285, "step": 20520 }, { "epoch": 0.1, "learning_rate": 0.0002844635262422368, "loss": 0.0246, "step": 20530 }, { "epoch": 0.1, "learning_rate": 0.00028445595854922277, "loss": 0.0316, "step": 20540 }, { "epoch": 0.1, "learning_rate": 0.00028444839085620875, "loss": 0.0396, "step": 20550 }, { "epoch": 0.1, "learning_rate": 0.0002844408231631948, "loss": 0.0393, "step": 20560 }, { "epoch": 0.1, "learning_rate": 0.00028443325547018077, "loss": 0.0275, "step": 20570 }, { "epoch": 0.1, "learning_rate": 0.00028442568777716675, "loss": 0.0317, "step": 20580 }, { "epoch": 0.1, "learning_rate": 0.00028441812008415273, "loss": 0.0321, "step": 20590 }, { "epoch": 0.1, "learning_rate": 0.0002844105523911387, "loss": 0.0297, "step": 20600 }, { "epoch": 0.1, "learning_rate": 0.0002844029846981247, "loss": 0.0265, "step": 20610 }, { "epoch": 0.1, "learning_rate": 0.00028439541700511073, "loss": 0.0292, "step": 20620 }, { "epoch": 0.1, "learning_rate": 0.0002843878493120967, "loss": 0.031, "step": 20630 }, { "epoch": 0.1, "learning_rate": 0.0002843802816190827, "loss": 0.0291, "step": 20640 }, { "epoch": 0.1, "learning_rate": 0.0002843727139260687, "loss": 0.0292, "step": 20650 }, { "epoch": 0.1, "learning_rate": 0.00028436514623305466, "loss": 0.0298, "step": 20660 }, { "epoch": 0.1, "learning_rate": 0.00028435757854004064, "loss": 0.0309, "step": 20670 }, { "epoch": 0.1, "learning_rate": 0.0002843500108470266, "loss": 0.0288, "step": 20680 }, { "epoch": 0.1, "learning_rate": 0.00028434244315401265, "loss": 0.026, "step": 20690 }, { "epoch": 0.1, "learning_rate": 0.00028433487546099864, "loss": 0.0324, "step": 20700 }, { "epoch": 0.1, "learning_rate": 0.0002843273077679846, "loss": 0.027, "step": 20710 }, { "epoch": 0.1, "learning_rate": 0.0002843197400749706, "loss": 0.0312, "step": 20720 }, { "epoch": 0.1, "learning_rate": 0.0002843121723819566, "loss": 0.0291, "step": 20730 }, { "epoch": 0.1, "learning_rate": 0.00028430460468894256, "loss": 0.0281, "step": 20740 }, { "epoch": 0.1, "learning_rate": 0.00028429703699592854, "loss": 0.0328, "step": 20750 }, { "epoch": 0.1, "learning_rate": 0.0002842894693029145, "loss": 0.0289, "step": 20760 }, { "epoch": 0.1, "learning_rate": 0.0002842819016099005, "loss": 0.0331, "step": 20770 }, { "epoch": 0.1, "learning_rate": 0.0002842743339168865, "loss": 0.0302, "step": 20780 }, { "epoch": 0.1, "learning_rate": 0.0002842667662238725, "loss": 0.0316, "step": 20790 }, { "epoch": 0.1, "learning_rate": 0.0002842591985308585, "loss": 0.0358, "step": 20800 }, { "epoch": 0.1, "learning_rate": 0.0002842516308378445, "loss": 0.03, "step": 20810 }, { "epoch": 0.11, "learning_rate": 0.00028424406314483047, "loss": 0.0273, "step": 20820 }, { "epoch": 0.11, "learning_rate": 0.00028423649545181645, "loss": 0.0302, "step": 20830 }, { "epoch": 0.11, "learning_rate": 0.00028422892775880243, "loss": 0.0328, "step": 20840 }, { "epoch": 0.11, "learning_rate": 0.00028422136006578847, "loss": 0.0305, "step": 20850 }, { "epoch": 0.11, "learning_rate": 0.00028421379237277445, "loss": 0.0309, "step": 20860 }, { "epoch": 0.11, "learning_rate": 0.00028420622467976043, "loss": 0.0297, "step": 20870 }, { "epoch": 0.11, "learning_rate": 0.0002841986569867464, "loss": 0.0318, "step": 20880 }, { "epoch": 0.11, "learning_rate": 0.0002841910892937324, "loss": 0.0358, "step": 20890 }, { "epoch": 0.11, "learning_rate": 0.0002841835216007184, "loss": 0.0282, "step": 20900 }, { "epoch": 0.11, "learning_rate": 0.00028417595390770435, "loss": 0.0285, "step": 20910 }, { "epoch": 0.11, "learning_rate": 0.0002841683862146904, "loss": 0.0371, "step": 20920 }, { "epoch": 0.11, "learning_rate": 0.00028416081852167637, "loss": 0.0311, "step": 20930 }, { "epoch": 0.11, "learning_rate": 0.00028415325082866235, "loss": 0.0481, "step": 20940 }, { "epoch": 0.11, "learning_rate": 0.00028414568313564833, "loss": 0.0307, "step": 20950 }, { "epoch": 0.11, "learning_rate": 0.0002841381154426343, "loss": 0.031, "step": 20960 }, { "epoch": 0.11, "learning_rate": 0.0002841305477496203, "loss": 0.0286, "step": 20970 }, { "epoch": 0.11, "learning_rate": 0.00028412298005660633, "loss": 0.03, "step": 20980 }, { "epoch": 0.11, "learning_rate": 0.0002841154123635923, "loss": 0.0331, "step": 20990 }, { "epoch": 0.11, "learning_rate": 0.0002841078446705783, "loss": 0.0248, "step": 21000 }, { "epoch": 0.11, "eval_cer": 0.9145119829365546, "eval_loss": 0.021799687296152115, "eval_runtime": 117.5088, "eval_samples_per_second": 17.02, "eval_steps_per_second": 4.255, "step": 21000 }, { "epoch": 0.11, "learning_rate": 0.0002841002769775643, "loss": 0.0341, "step": 21010 }, { "epoch": 0.11, "learning_rate": 0.00028409270928455026, "loss": 0.0298, "step": 21020 }, { "epoch": 0.11, "learning_rate": 0.00028408514159153624, "loss": 0.0277, "step": 21030 }, { "epoch": 0.11, "learning_rate": 0.0002840775738985222, "loss": 0.0317, "step": 21040 }, { "epoch": 0.11, "learning_rate": 0.00028407000620550826, "loss": 0.0341, "step": 21050 }, { "epoch": 0.11, "learning_rate": 0.00028406243851249424, "loss": 0.0266, "step": 21060 }, { "epoch": 0.11, "learning_rate": 0.0002840548708194802, "loss": 0.0294, "step": 21070 }, { "epoch": 0.11, "learning_rate": 0.0002840473031264662, "loss": 0.0324, "step": 21080 }, { "epoch": 0.11, "learning_rate": 0.0002840397354334522, "loss": 0.0352, "step": 21090 }, { "epoch": 0.11, "learning_rate": 0.00028403216774043816, "loss": 0.0292, "step": 21100 }, { "epoch": 0.11, "learning_rate": 0.0002840246000474242, "loss": 0.0342, "step": 21110 }, { "epoch": 0.11, "learning_rate": 0.0002840170323544102, "loss": 0.0298, "step": 21120 }, { "epoch": 0.11, "learning_rate": 0.00028400946466139616, "loss": 0.0297, "step": 21130 }, { "epoch": 0.11, "learning_rate": 0.00028400189696838214, "loss": 0.0291, "step": 21140 }, { "epoch": 0.11, "learning_rate": 0.0002839943292753681, "loss": 0.0265, "step": 21150 }, { "epoch": 0.11, "learning_rate": 0.0002839867615823541, "loss": 0.0303, "step": 21160 }, { "epoch": 0.11, "learning_rate": 0.00028397919388934014, "loss": 0.0283, "step": 21170 }, { "epoch": 0.11, "learning_rate": 0.0002839716261963261, "loss": 0.0293, "step": 21180 }, { "epoch": 0.11, "learning_rate": 0.0002839640585033121, "loss": 0.0316, "step": 21190 }, { "epoch": 0.11, "learning_rate": 0.0002839564908102981, "loss": 0.0332, "step": 21200 }, { "epoch": 0.11, "learning_rate": 0.00028394892311728407, "loss": 0.0376, "step": 21210 }, { "epoch": 0.11, "learning_rate": 0.00028394135542427005, "loss": 0.0328, "step": 21220 }, { "epoch": 0.11, "learning_rate": 0.00028393378773125603, "loss": 0.0347, "step": 21230 }, { "epoch": 0.11, "learning_rate": 0.00028392622003824207, "loss": 0.0322, "step": 21240 }, { "epoch": 0.11, "learning_rate": 0.00028391865234522805, "loss": 0.0329, "step": 21250 }, { "epoch": 0.11, "learning_rate": 0.00028391108465221403, "loss": 0.0309, "step": 21260 }, { "epoch": 0.11, "learning_rate": 0.0002839035169592, "loss": 0.0357, "step": 21270 }, { "epoch": 0.11, "learning_rate": 0.000283895949266186, "loss": 0.0267, "step": 21280 }, { "epoch": 0.11, "learning_rate": 0.000283888381573172, "loss": 0.0262, "step": 21290 }, { "epoch": 0.11, "learning_rate": 0.000283880813880158, "loss": 0.0326, "step": 21300 }, { "epoch": 0.11, "learning_rate": 0.000283873246187144, "loss": 0.0297, "step": 21310 }, { "epoch": 0.11, "learning_rate": 0.00028386567849413, "loss": 0.0262, "step": 21320 }, { "epoch": 0.11, "learning_rate": 0.00028385811080111595, "loss": 0.0247, "step": 21330 }, { "epoch": 0.11, "learning_rate": 0.00028385054310810194, "loss": 0.0314, "step": 21340 }, { "epoch": 0.11, "learning_rate": 0.0002838429754150879, "loss": 0.0338, "step": 21350 }, { "epoch": 0.11, "learning_rate": 0.00028383540772207395, "loss": 0.028, "step": 21360 }, { "epoch": 0.11, "learning_rate": 0.00028382784002905993, "loss": 0.0307, "step": 21370 }, { "epoch": 0.11, "learning_rate": 0.0002838202723360459, "loss": 0.0314, "step": 21380 }, { "epoch": 0.11, "learning_rate": 0.0002838127046430319, "loss": 0.0284, "step": 21390 }, { "epoch": 0.11, "learning_rate": 0.0002838051369500179, "loss": 0.0304, "step": 21400 }, { "epoch": 0.11, "learning_rate": 0.00028379756925700386, "loss": 0.0336, "step": 21410 }, { "epoch": 0.11, "learning_rate": 0.00028379000156398984, "loss": 0.0312, "step": 21420 }, { "epoch": 0.11, "learning_rate": 0.0002837824338709759, "loss": 0.0311, "step": 21430 }, { "epoch": 0.11, "learning_rate": 0.00028377486617796186, "loss": 0.0293, "step": 21440 }, { "epoch": 0.11, "learning_rate": 0.00028376729848494784, "loss": 0.0297, "step": 21450 }, { "epoch": 0.11, "learning_rate": 0.0002837597307919338, "loss": 0.032, "step": 21460 }, { "epoch": 0.11, "learning_rate": 0.0002837521630989198, "loss": 0.0243, "step": 21470 }, { "epoch": 0.11, "learning_rate": 0.0002837445954059058, "loss": 0.0277, "step": 21480 }, { "epoch": 0.11, "learning_rate": 0.0002837370277128918, "loss": 0.0269, "step": 21490 }, { "epoch": 0.11, "learning_rate": 0.0002837294600198778, "loss": 0.0302, "step": 21500 }, { "epoch": 0.11, "learning_rate": 0.0002837218923268638, "loss": 0.0276, "step": 21510 }, { "epoch": 0.11, "learning_rate": 0.00028371432463384976, "loss": 0.0306, "step": 21520 }, { "epoch": 0.11, "learning_rate": 0.00028370675694083575, "loss": 0.0309, "step": 21530 }, { "epoch": 0.11, "learning_rate": 0.00028369918924782173, "loss": 0.029, "step": 21540 }, { "epoch": 0.11, "learning_rate": 0.0002836916215548077, "loss": 0.0354, "step": 21550 }, { "epoch": 0.11, "learning_rate": 0.00028368405386179374, "loss": 0.039, "step": 21560 }, { "epoch": 0.11, "learning_rate": 0.0002836764861687797, "loss": 0.0296, "step": 21570 }, { "epoch": 0.11, "learning_rate": 0.0002836689184757657, "loss": 0.0278, "step": 21580 }, { "epoch": 0.11, "learning_rate": 0.0002836613507827517, "loss": 0.0293, "step": 21590 }, { "epoch": 0.11, "learning_rate": 0.00028365378308973767, "loss": 0.0288, "step": 21600 }, { "epoch": 0.11, "learning_rate": 0.00028364621539672365, "loss": 0.0281, "step": 21610 }, { "epoch": 0.11, "learning_rate": 0.0002836386477037097, "loss": 0.0231, "step": 21620 }, { "epoch": 0.11, "learning_rate": 0.00028363108001069567, "loss": 0.0244, "step": 21630 }, { "epoch": 0.11, "learning_rate": 0.00028362351231768165, "loss": 0.0288, "step": 21640 }, { "epoch": 0.11, "learning_rate": 0.00028361594462466763, "loss": 0.0277, "step": 21650 }, { "epoch": 0.11, "learning_rate": 0.0002836083769316536, "loss": 0.0264, "step": 21660 }, { "epoch": 0.11, "learning_rate": 0.0002836008092386396, "loss": 0.0247, "step": 21670 }, { "epoch": 0.11, "learning_rate": 0.00028359324154562563, "loss": 0.0261, "step": 21680 }, { "epoch": 0.11, "learning_rate": 0.0002835856738526116, "loss": 0.0295, "step": 21690 }, { "epoch": 0.11, "learning_rate": 0.0002835781061595976, "loss": 0.0298, "step": 21700 }, { "epoch": 0.11, "learning_rate": 0.0002835705384665836, "loss": 0.0272, "step": 21710 }, { "epoch": 0.11, "learning_rate": 0.00028356297077356956, "loss": 0.0324, "step": 21720 }, { "epoch": 0.11, "learning_rate": 0.00028355540308055554, "loss": 0.0303, "step": 21730 }, { "epoch": 0.11, "learning_rate": 0.0002835478353875415, "loss": 0.0288, "step": 21740 }, { "epoch": 0.11, "learning_rate": 0.00028354026769452755, "loss": 0.0307, "step": 21750 }, { "epoch": 0.11, "learning_rate": 0.00028353270000151354, "loss": 0.0302, "step": 21760 }, { "epoch": 0.11, "learning_rate": 0.0002835251323084995, "loss": 0.0283, "step": 21770 }, { "epoch": 0.11, "learning_rate": 0.0002835175646154855, "loss": 0.0261, "step": 21780 }, { "epoch": 0.11, "learning_rate": 0.0002835099969224715, "loss": 0.033, "step": 21790 }, { "epoch": 0.11, "learning_rate": 0.00028350242922945746, "loss": 0.0286, "step": 21800 }, { "epoch": 0.11, "learning_rate": 0.0002834948615364435, "loss": 0.0291, "step": 21810 }, { "epoch": 0.11, "learning_rate": 0.0002834872938434295, "loss": 0.0286, "step": 21820 }, { "epoch": 0.11, "learning_rate": 0.00028347972615041546, "loss": 0.0283, "step": 21830 }, { "epoch": 0.11, "learning_rate": 0.00028347215845740144, "loss": 0.0422, "step": 21840 }, { "epoch": 0.11, "learning_rate": 0.0002834645907643874, "loss": 0.0347, "step": 21850 }, { "epoch": 0.11, "learning_rate": 0.0002834570230713734, "loss": 0.0353, "step": 21860 }, { "epoch": 0.11, "learning_rate": 0.00028344945537835944, "loss": 0.0305, "step": 21870 }, { "epoch": 0.11, "learning_rate": 0.0002834418876853454, "loss": 0.0271, "step": 21880 }, { "epoch": 0.11, "learning_rate": 0.0002834343199923314, "loss": 0.0306, "step": 21890 }, { "epoch": 0.11, "learning_rate": 0.0002834267522993174, "loss": 0.03, "step": 21900 }, { "epoch": 0.11, "learning_rate": 0.00028341918460630337, "loss": 0.0346, "step": 21910 }, { "epoch": 0.11, "learning_rate": 0.00028341161691328935, "loss": 0.03, "step": 21920 }, { "epoch": 0.11, "learning_rate": 0.00028340404922027533, "loss": 0.0244, "step": 21930 }, { "epoch": 0.11, "learning_rate": 0.00028339648152726136, "loss": 0.0304, "step": 21940 }, { "epoch": 0.11, "learning_rate": 0.00028338891383424735, "loss": 0.0304, "step": 21950 }, { "epoch": 0.11, "learning_rate": 0.00028338134614123333, "loss": 0.0289, "step": 21960 }, { "epoch": 0.11, "learning_rate": 0.0002833737784482193, "loss": 0.0245, "step": 21970 }, { "epoch": 0.11, "learning_rate": 0.0002833662107552053, "loss": 0.0291, "step": 21980 }, { "epoch": 0.11, "learning_rate": 0.00028335864306219127, "loss": 0.0277, "step": 21990 }, { "epoch": 0.11, "learning_rate": 0.00028335107536917725, "loss": 0.026, "step": 22000 }, { "epoch": 0.11, "eval_cer": 0.9144663743186606, "eval_loss": 0.021011509001255035, "eval_runtime": 117.4912, "eval_samples_per_second": 17.023, "eval_steps_per_second": 4.256, "step": 22000 }, { "epoch": 0.11, "learning_rate": 0.00028334350767616323, "loss": 0.0327, "step": 22010 }, { "epoch": 0.11, "learning_rate": 0.0002833359399831492, "loss": 0.0257, "step": 22020 }, { "epoch": 0.11, "learning_rate": 0.0002833283722901352, "loss": 0.0277, "step": 22030 }, { "epoch": 0.11, "learning_rate": 0.00028332080459712123, "loss": 0.0319, "step": 22040 }, { "epoch": 0.11, "learning_rate": 0.0002833132369041072, "loss": 0.0257, "step": 22050 }, { "epoch": 0.11, "learning_rate": 0.0002833056692110932, "loss": 0.0284, "step": 22060 }, { "epoch": 0.11, "learning_rate": 0.0002832981015180792, "loss": 0.0336, "step": 22070 }, { "epoch": 0.11, "learning_rate": 0.00028329053382506516, "loss": 0.0331, "step": 22080 }, { "epoch": 0.11, "learning_rate": 0.00028328296613205114, "loss": 0.0259, "step": 22090 }, { "epoch": 0.11, "learning_rate": 0.0002832753984390371, "loss": 0.03, "step": 22100 }, { "epoch": 0.11, "learning_rate": 0.00028326783074602316, "loss": 0.0331, "step": 22110 }, { "epoch": 0.11, "learning_rate": 0.00028326026305300914, "loss": 0.0306, "step": 22120 }, { "epoch": 0.11, "learning_rate": 0.0002832526953599951, "loss": 0.0292, "step": 22130 }, { "epoch": 0.11, "learning_rate": 0.0002832451276669811, "loss": 0.0302, "step": 22140 }, { "epoch": 0.11, "learning_rate": 0.0002832375599739671, "loss": 0.0326, "step": 22150 }, { "epoch": 0.11, "learning_rate": 0.00028322999228095306, "loss": 0.0353, "step": 22160 }, { "epoch": 0.11, "learning_rate": 0.0002832224245879391, "loss": 0.0253, "step": 22170 }, { "epoch": 0.11, "learning_rate": 0.0002832148568949251, "loss": 0.0283, "step": 22180 }, { "epoch": 0.11, "learning_rate": 0.00028320728920191106, "loss": 0.0256, "step": 22190 }, { "epoch": 0.11, "learning_rate": 0.00028319972150889704, "loss": 0.031, "step": 22200 }, { "epoch": 0.11, "learning_rate": 0.000283192153815883, "loss": 0.0296, "step": 22210 }, { "epoch": 0.11, "learning_rate": 0.000283184586122869, "loss": 0.027, "step": 22220 }, { "epoch": 0.11, "learning_rate": 0.00028317701842985504, "loss": 0.0318, "step": 22230 }, { "epoch": 0.11, "learning_rate": 0.000283169450736841, "loss": 0.0297, "step": 22240 }, { "epoch": 0.11, "learning_rate": 0.000283161883043827, "loss": 0.0266, "step": 22250 }, { "epoch": 0.11, "learning_rate": 0.000283154315350813, "loss": 0.0307, "step": 22260 }, { "epoch": 0.11, "learning_rate": 0.00028314674765779897, "loss": 0.0264, "step": 22270 }, { "epoch": 0.11, "learning_rate": 0.00028313917996478495, "loss": 0.028, "step": 22280 }, { "epoch": 0.11, "learning_rate": 0.00028313161227177093, "loss": 0.0313, "step": 22290 }, { "epoch": 0.11, "learning_rate": 0.00028312404457875697, "loss": 0.0223, "step": 22300 }, { "epoch": 0.11, "learning_rate": 0.00028311647688574295, "loss": 0.0285, "step": 22310 }, { "epoch": 0.11, "learning_rate": 0.00028310890919272893, "loss": 0.0331, "step": 22320 }, { "epoch": 0.11, "learning_rate": 0.0002831013414997149, "loss": 0.0389, "step": 22330 }, { "epoch": 0.11, "learning_rate": 0.0002830937738067009, "loss": 0.037, "step": 22340 }, { "epoch": 0.11, "learning_rate": 0.0002830862061136869, "loss": 0.0304, "step": 22350 }, { "epoch": 0.11, "learning_rate": 0.0002830786384206729, "loss": 0.0333, "step": 22360 }, { "epoch": 0.11, "learning_rate": 0.0002830710707276589, "loss": 0.0416, "step": 22370 }, { "epoch": 0.11, "learning_rate": 0.0002830635030346449, "loss": 0.0273, "step": 22380 }, { "epoch": 0.11, "learning_rate": 0.00028305593534163085, "loss": 0.0299, "step": 22390 }, { "epoch": 0.11, "learning_rate": 0.00028304836764861684, "loss": 0.0309, "step": 22400 }, { "epoch": 0.11, "learning_rate": 0.0002830407999556028, "loss": 0.0304, "step": 22410 }, { "epoch": 0.11, "learning_rate": 0.00028303323226258885, "loss": 0.0312, "step": 22420 }, { "epoch": 0.11, "learning_rate": 0.00028302566456957483, "loss": 0.0316, "step": 22430 }, { "epoch": 0.11, "learning_rate": 0.0002830180968765608, "loss": 0.0328, "step": 22440 }, { "epoch": 0.11, "learning_rate": 0.0002830105291835468, "loss": 0.0317, "step": 22450 }, { "epoch": 0.11, "learning_rate": 0.0002830029614905328, "loss": 0.0324, "step": 22460 }, { "epoch": 0.11, "learning_rate": 0.00028299539379751876, "loss": 0.0302, "step": 22470 }, { "epoch": 0.11, "learning_rate": 0.00028298782610450474, "loss": 0.0318, "step": 22480 }, { "epoch": 0.11, "learning_rate": 0.0002829802584114908, "loss": 0.0316, "step": 22490 }, { "epoch": 0.11, "learning_rate": 0.00028297269071847676, "loss": 0.0309, "step": 22500 }, { "epoch": 0.11, "learning_rate": 0.00028296512302546274, "loss": 0.0304, "step": 22510 }, { "epoch": 0.11, "learning_rate": 0.0002829575553324487, "loss": 0.0312, "step": 22520 }, { "epoch": 0.11, "learning_rate": 0.0002829499876394347, "loss": 0.0314, "step": 22530 }, { "epoch": 0.11, "learning_rate": 0.0002829424199464207, "loss": 0.035, "step": 22540 }, { "epoch": 0.11, "learning_rate": 0.0002829348522534067, "loss": 0.0283, "step": 22550 }, { "epoch": 0.11, "learning_rate": 0.0002829272845603927, "loss": 0.0304, "step": 22560 }, { "epoch": 0.11, "learning_rate": 0.0002829197168673787, "loss": 0.03, "step": 22570 }, { "epoch": 0.11, "learning_rate": 0.00028291214917436466, "loss": 0.0296, "step": 22580 }, { "epoch": 0.11, "learning_rate": 0.00028290458148135065, "loss": 0.0294, "step": 22590 }, { "epoch": 0.11, "learning_rate": 0.00028289701378833663, "loss": 0.0285, "step": 22600 }, { "epoch": 0.11, "learning_rate": 0.0002828894460953226, "loss": 0.028, "step": 22610 }, { "epoch": 0.11, "learning_rate": 0.00028288187840230864, "loss": 0.0311, "step": 22620 }, { "epoch": 0.11, "learning_rate": 0.0002828743107092946, "loss": 0.029, "step": 22630 }, { "epoch": 0.11, "learning_rate": 0.0002828667430162806, "loss": 0.0341, "step": 22640 }, { "epoch": 0.11, "learning_rate": 0.0002828591753232666, "loss": 0.0317, "step": 22650 }, { "epoch": 0.11, "learning_rate": 0.00028285160763025257, "loss": 0.0263, "step": 22660 }, { "epoch": 0.11, "learning_rate": 0.00028284403993723855, "loss": 0.0257, "step": 22670 }, { "epoch": 0.11, "learning_rate": 0.0002828364722442246, "loss": 0.0298, "step": 22680 }, { "epoch": 0.11, "learning_rate": 0.00028282890455121057, "loss": 0.0329, "step": 22690 }, { "epoch": 0.11, "learning_rate": 0.00028282133685819655, "loss": 0.0311, "step": 22700 }, { "epoch": 0.11, "learning_rate": 0.00028281376916518253, "loss": 0.0481, "step": 22710 }, { "epoch": 0.11, "learning_rate": 0.0002828062014721685, "loss": 0.0289, "step": 22720 }, { "epoch": 0.11, "learning_rate": 0.0002827986337791545, "loss": 0.0321, "step": 22730 }, { "epoch": 0.11, "learning_rate": 0.00028279106608614053, "loss": 0.0291, "step": 22740 }, { "epoch": 0.11, "learning_rate": 0.0002827834983931265, "loss": 0.0326, "step": 22750 }, { "epoch": 0.11, "learning_rate": 0.0002827759307001125, "loss": 0.0284, "step": 22760 }, { "epoch": 0.11, "learning_rate": 0.0002827683630070985, "loss": 0.0327, "step": 22770 }, { "epoch": 0.11, "learning_rate": 0.00028276079531408446, "loss": 0.0308, "step": 22780 }, { "epoch": 0.11, "learning_rate": 0.00028275322762107044, "loss": 0.0304, "step": 22790 }, { "epoch": 0.12, "learning_rate": 0.0002827456599280564, "loss": 0.0265, "step": 22800 }, { "epoch": 0.12, "learning_rate": 0.00028273809223504246, "loss": 0.032, "step": 22810 }, { "epoch": 0.12, "learning_rate": 0.00028273052454202844, "loss": 0.0385, "step": 22820 }, { "epoch": 0.12, "learning_rate": 0.0002827229568490144, "loss": 0.03, "step": 22830 }, { "epoch": 0.12, "learning_rate": 0.0002827153891560004, "loss": 0.0387, "step": 22840 }, { "epoch": 0.12, "learning_rate": 0.0002827078214629864, "loss": 0.0367, "step": 22850 }, { "epoch": 0.12, "learning_rate": 0.00028270025376997236, "loss": 0.0381, "step": 22860 }, { "epoch": 0.12, "learning_rate": 0.0002826926860769584, "loss": 0.0264, "step": 22870 }, { "epoch": 0.12, "learning_rate": 0.0002826851183839444, "loss": 0.0268, "step": 22880 }, { "epoch": 0.12, "learning_rate": 0.00028267755069093036, "loss": 0.0304, "step": 22890 }, { "epoch": 0.12, "learning_rate": 0.00028266998299791634, "loss": 0.0339, "step": 22900 }, { "epoch": 0.12, "learning_rate": 0.0002826624153049023, "loss": 0.0295, "step": 22910 }, { "epoch": 0.12, "learning_rate": 0.0002826548476118883, "loss": 0.0362, "step": 22920 }, { "epoch": 0.12, "learning_rate": 0.00028264727991887434, "loss": 0.0312, "step": 22930 }, { "epoch": 0.12, "learning_rate": 0.0002826397122258603, "loss": 0.0301, "step": 22940 }, { "epoch": 0.12, "learning_rate": 0.0002826321445328463, "loss": 0.0318, "step": 22950 }, { "epoch": 0.12, "learning_rate": 0.0002826245768398323, "loss": 0.0324, "step": 22960 }, { "epoch": 0.12, "learning_rate": 0.00028261700914681827, "loss": 0.0326, "step": 22970 }, { "epoch": 0.12, "learning_rate": 0.00028260944145380425, "loss": 0.0282, "step": 22980 }, { "epoch": 0.12, "learning_rate": 0.00028260187376079023, "loss": 0.0255, "step": 22990 }, { "epoch": 0.12, "learning_rate": 0.00028259430606777627, "loss": 0.0325, "step": 23000 }, { "epoch": 0.12, "eval_cer": 0.9145051901636767, "eval_loss": 0.02104305848479271, "eval_runtime": 117.2879, "eval_samples_per_second": 17.052, "eval_steps_per_second": 4.263, "step": 23000 }, { "epoch": 0.12, "learning_rate": 0.00028258673837476225, "loss": 0.0284, "step": 23010 }, { "epoch": 0.12, "learning_rate": 0.00028257917068174823, "loss": 0.0292, "step": 23020 }, { "epoch": 0.12, "learning_rate": 0.0002825716029887342, "loss": 0.0379, "step": 23030 }, { "epoch": 0.12, "learning_rate": 0.0002825640352957202, "loss": 0.0286, "step": 23040 }, { "epoch": 0.12, "learning_rate": 0.00028255646760270617, "loss": 0.028, "step": 23050 }, { "epoch": 0.12, "learning_rate": 0.0002825488999096922, "loss": 0.0265, "step": 23060 }, { "epoch": 0.12, "learning_rate": 0.0002825413322166782, "loss": 0.0265, "step": 23070 }, { "epoch": 0.12, "learning_rate": 0.00028253376452366417, "loss": 0.0236, "step": 23080 }, { "epoch": 0.12, "learning_rate": 0.00028252619683065015, "loss": 0.0313, "step": 23090 }, { "epoch": 0.12, "learning_rate": 0.00028251862913763613, "loss": 0.0322, "step": 23100 }, { "epoch": 0.12, "learning_rate": 0.0002825110614446221, "loss": 0.0246, "step": 23110 }, { "epoch": 0.12, "learning_rate": 0.0002825034937516081, "loss": 0.0267, "step": 23120 }, { "epoch": 0.12, "learning_rate": 0.00028249592605859413, "loss": 0.0279, "step": 23130 }, { "epoch": 0.12, "learning_rate": 0.0002824883583655801, "loss": 0.0299, "step": 23140 }, { "epoch": 0.12, "learning_rate": 0.0002824807906725661, "loss": 0.0319, "step": 23150 }, { "epoch": 0.12, "learning_rate": 0.0002824732229795521, "loss": 0.0298, "step": 23160 }, { "epoch": 0.12, "learning_rate": 0.00028246565528653806, "loss": 0.0317, "step": 23170 }, { "epoch": 0.12, "learning_rate": 0.00028245808759352404, "loss": 0.0303, "step": 23180 }, { "epoch": 0.12, "learning_rate": 0.0002824505199005101, "loss": 0.0286, "step": 23190 }, { "epoch": 0.12, "learning_rate": 0.00028244295220749606, "loss": 0.0312, "step": 23200 }, { "epoch": 0.12, "learning_rate": 0.00028243538451448204, "loss": 0.033, "step": 23210 }, { "epoch": 0.12, "learning_rate": 0.000282427816821468, "loss": 0.0292, "step": 23220 }, { "epoch": 0.12, "learning_rate": 0.000282420249128454, "loss": 0.0307, "step": 23230 }, { "epoch": 0.12, "learning_rate": 0.00028241268143544, "loss": 0.0273, "step": 23240 }, { "epoch": 0.12, "learning_rate": 0.000282405113742426, "loss": 0.0331, "step": 23250 }, { "epoch": 0.12, "learning_rate": 0.00028239754604941195, "loss": 0.028, "step": 23260 }, { "epoch": 0.12, "learning_rate": 0.0002823899783563979, "loss": 0.0332, "step": 23270 }, { "epoch": 0.12, "learning_rate": 0.0002823824106633839, "loss": 0.026, "step": 23280 }, { "epoch": 0.12, "learning_rate": 0.00028237484297036994, "loss": 0.0326, "step": 23290 }, { "epoch": 0.12, "learning_rate": 0.0002823672752773559, "loss": 0.0301, "step": 23300 }, { "epoch": 0.12, "learning_rate": 0.0002823597075843419, "loss": 0.0236, "step": 23310 }, { "epoch": 0.12, "learning_rate": 0.0002823521398913279, "loss": 0.0281, "step": 23320 }, { "epoch": 0.12, "learning_rate": 0.00028234457219831387, "loss": 0.0325, "step": 23330 }, { "epoch": 0.12, "learning_rate": 0.00028233700450529985, "loss": 0.0255, "step": 23340 }, { "epoch": 0.12, "learning_rate": 0.00028232943681228583, "loss": 0.0332, "step": 23350 }, { "epoch": 0.12, "learning_rate": 0.00028232186911927187, "loss": 0.0365, "step": 23360 }, { "epoch": 0.12, "learning_rate": 0.00028231430142625785, "loss": 0.0262, "step": 23370 }, { "epoch": 0.12, "learning_rate": 0.00028230673373324383, "loss": 0.03, "step": 23380 }, { "epoch": 0.12, "learning_rate": 0.0002822991660402298, "loss": 0.0291, "step": 23390 }, { "epoch": 0.12, "learning_rate": 0.0002822915983472158, "loss": 0.0318, "step": 23400 }, { "epoch": 0.12, "learning_rate": 0.0002822840306542018, "loss": 0.027, "step": 23410 }, { "epoch": 0.12, "learning_rate": 0.0002822764629611878, "loss": 0.0291, "step": 23420 }, { "epoch": 0.12, "learning_rate": 0.0002822688952681738, "loss": 0.0266, "step": 23430 }, { "epoch": 0.12, "learning_rate": 0.0002822613275751598, "loss": 0.0257, "step": 23440 }, { "epoch": 0.12, "learning_rate": 0.00028225375988214576, "loss": 0.0247, "step": 23450 }, { "epoch": 0.12, "learning_rate": 0.00028224619218913174, "loss": 0.0295, "step": 23460 }, { "epoch": 0.12, "learning_rate": 0.0002822386244961177, "loss": 0.0279, "step": 23470 }, { "epoch": 0.12, "learning_rate": 0.00028223105680310375, "loss": 0.0316, "step": 23480 }, { "epoch": 0.12, "learning_rate": 0.00028222348911008974, "loss": 0.0258, "step": 23490 }, { "epoch": 0.12, "learning_rate": 0.0002822159214170757, "loss": 0.0262, "step": 23500 }, { "epoch": 0.12, "learning_rate": 0.0002822083537240617, "loss": 0.033, "step": 23510 }, { "epoch": 0.12, "learning_rate": 0.0002822007860310477, "loss": 0.0299, "step": 23520 }, { "epoch": 0.12, "learning_rate": 0.00028219321833803366, "loss": 0.0252, "step": 23530 }, { "epoch": 0.12, "learning_rate": 0.00028218565064501964, "loss": 0.0287, "step": 23540 }, { "epoch": 0.12, "learning_rate": 0.0002821780829520057, "loss": 0.1276, "step": 23550 }, { "epoch": 0.12, "learning_rate": 0.00028217051525899166, "loss": 0.0328, "step": 23560 }, { "epoch": 0.12, "learning_rate": 0.00028216294756597764, "loss": 0.0346, "step": 23570 }, { "epoch": 0.12, "learning_rate": 0.0002821553798729636, "loss": 0.0323, "step": 23580 }, { "epoch": 0.12, "learning_rate": 0.0002821478121799496, "loss": 0.0339, "step": 23590 }, { "epoch": 0.12, "learning_rate": 0.0002821402444869356, "loss": 0.0294, "step": 23600 }, { "epoch": 0.12, "learning_rate": 0.0002821326767939216, "loss": 0.0275, "step": 23610 }, { "epoch": 0.12, "learning_rate": 0.0002821251091009076, "loss": 0.0323, "step": 23620 }, { "epoch": 0.12, "learning_rate": 0.0002821175414078936, "loss": 0.0292, "step": 23630 }, { "epoch": 0.12, "learning_rate": 0.00028210997371487957, "loss": 0.0291, "step": 23640 }, { "epoch": 0.12, "learning_rate": 0.00028210240602186555, "loss": 0.0379, "step": 23650 }, { "epoch": 0.12, "learning_rate": 0.00028209483832885153, "loss": 0.0279, "step": 23660 }, { "epoch": 0.12, "learning_rate": 0.00028208727063583756, "loss": 0.0226, "step": 23670 }, { "epoch": 0.12, "learning_rate": 0.00028207970294282355, "loss": 0.0285, "step": 23680 }, { "epoch": 0.12, "learning_rate": 0.0002820721352498095, "loss": 0.0275, "step": 23690 }, { "epoch": 0.12, "learning_rate": 0.0002820645675567955, "loss": 0.0252, "step": 23700 }, { "epoch": 0.12, "learning_rate": 0.0002820569998637815, "loss": 0.0279, "step": 23710 }, { "epoch": 0.12, "learning_rate": 0.00028204943217076747, "loss": 0.0306, "step": 23720 }, { "epoch": 0.12, "learning_rate": 0.00028204186447775345, "loss": 0.0272, "step": 23730 }, { "epoch": 0.12, "learning_rate": 0.0002820342967847395, "loss": 0.0456, "step": 23740 }, { "epoch": 0.12, "learning_rate": 0.00028202672909172547, "loss": 0.0343, "step": 23750 }, { "epoch": 0.12, "learning_rate": 0.00028201916139871145, "loss": 0.0281, "step": 23760 }, { "epoch": 0.12, "learning_rate": 0.00028201159370569743, "loss": 0.0254, "step": 23770 }, { "epoch": 0.12, "learning_rate": 0.0002820040260126834, "loss": 0.0322, "step": 23780 }, { "epoch": 0.12, "learning_rate": 0.0002819964583196694, "loss": 0.03, "step": 23790 }, { "epoch": 0.12, "learning_rate": 0.00028198889062665543, "loss": 0.0271, "step": 23800 }, { "epoch": 0.12, "learning_rate": 0.0002819813229336414, "loss": 0.029, "step": 23810 }, { "epoch": 0.12, "learning_rate": 0.0002819737552406274, "loss": 0.0246, "step": 23820 }, { "epoch": 0.12, "learning_rate": 0.0002819661875476134, "loss": 0.0308, "step": 23830 }, { "epoch": 0.12, "learning_rate": 0.00028195861985459936, "loss": 0.027, "step": 23840 }, { "epoch": 0.12, "learning_rate": 0.00028195105216158534, "loss": 0.0289, "step": 23850 }, { "epoch": 0.12, "learning_rate": 0.0002819434844685713, "loss": 0.0263, "step": 23860 }, { "epoch": 0.12, "learning_rate": 0.00028193591677555736, "loss": 0.0278, "step": 23870 }, { "epoch": 0.12, "learning_rate": 0.00028192834908254334, "loss": 0.0247, "step": 23880 }, { "epoch": 0.12, "learning_rate": 0.0002819207813895293, "loss": 0.03, "step": 23890 }, { "epoch": 0.12, "learning_rate": 0.0002819132136965153, "loss": 0.031, "step": 23900 }, { "epoch": 0.12, "learning_rate": 0.0002819056460035013, "loss": 0.0288, "step": 23910 }, { "epoch": 0.12, "learning_rate": 0.00028189807831048726, "loss": 0.0339, "step": 23920 }, { "epoch": 0.12, "learning_rate": 0.0002818905106174733, "loss": 0.0262, "step": 23930 }, { "epoch": 0.12, "learning_rate": 0.0002818829429244593, "loss": 0.0301, "step": 23940 }, { "epoch": 0.12, "learning_rate": 0.00028187537523144526, "loss": 0.0292, "step": 23950 }, { "epoch": 0.12, "learning_rate": 0.00028186780753843124, "loss": 0.0291, "step": 23960 }, { "epoch": 0.12, "learning_rate": 0.0002818602398454172, "loss": 0.0244, "step": 23970 }, { "epoch": 0.12, "learning_rate": 0.0002818526721524032, "loss": 0.0304, "step": 23980 }, { "epoch": 0.12, "learning_rate": 0.00028184510445938924, "loss": 0.0227, "step": 23990 }, { "epoch": 0.12, "learning_rate": 0.0002818375367663752, "loss": 0.0285, "step": 24000 }, { "epoch": 0.12, "eval_cer": 0.9144692855070369, "eval_loss": 0.02072213776409626, "eval_runtime": 117.2385, "eval_samples_per_second": 17.059, "eval_steps_per_second": 4.265, "step": 24000 }, { "epoch": 0.12, "learning_rate": 0.0002818299690733612, "loss": 0.0287, "step": 24010 }, { "epoch": 0.12, "learning_rate": 0.0002818224013803472, "loss": 0.0316, "step": 24020 }, { "epoch": 0.12, "learning_rate": 0.00028181483368733317, "loss": 0.0248, "step": 24030 }, { "epoch": 0.12, "learning_rate": 0.00028180726599431915, "loss": 0.0284, "step": 24040 }, { "epoch": 0.12, "learning_rate": 0.00028179969830130513, "loss": 0.0252, "step": 24050 }, { "epoch": 0.12, "learning_rate": 0.00028179213060829117, "loss": 0.0277, "step": 24060 }, { "epoch": 0.12, "learning_rate": 0.00028178456291527715, "loss": 0.0269, "step": 24070 }, { "epoch": 0.12, "learning_rate": 0.00028177699522226313, "loss": 0.0237, "step": 24080 }, { "epoch": 0.12, "learning_rate": 0.0002817694275292491, "loss": 0.0218, "step": 24090 }, { "epoch": 0.12, "learning_rate": 0.0002817618598362351, "loss": 0.0265, "step": 24100 }, { "epoch": 0.12, "learning_rate": 0.00028175429214322107, "loss": 0.0265, "step": 24110 }, { "epoch": 0.12, "learning_rate": 0.0002817467244502071, "loss": 0.0246, "step": 24120 }, { "epoch": 0.12, "learning_rate": 0.0002817391567571931, "loss": 0.032, "step": 24130 }, { "epoch": 0.12, "learning_rate": 0.00028173158906417907, "loss": 0.0256, "step": 24140 }, { "epoch": 0.12, "learning_rate": 0.00028172402137116505, "loss": 0.028, "step": 24150 }, { "epoch": 0.12, "learning_rate": 0.00028171645367815103, "loss": 0.0244, "step": 24160 }, { "epoch": 0.12, "learning_rate": 0.000281708885985137, "loss": 0.0364, "step": 24170 }, { "epoch": 0.12, "learning_rate": 0.000281701318292123, "loss": 0.0286, "step": 24180 }, { "epoch": 0.12, "learning_rate": 0.00028169375059910903, "loss": 0.0318, "step": 24190 }, { "epoch": 0.12, "learning_rate": 0.000281686182906095, "loss": 0.027, "step": 24200 }, { "epoch": 0.12, "learning_rate": 0.000281678615213081, "loss": 0.0287, "step": 24210 }, { "epoch": 0.12, "learning_rate": 0.000281671047520067, "loss": 0.0317, "step": 24220 }, { "epoch": 0.12, "learning_rate": 0.00028166347982705296, "loss": 0.0302, "step": 24230 }, { "epoch": 0.12, "learning_rate": 0.00028165591213403894, "loss": 0.0272, "step": 24240 }, { "epoch": 0.12, "learning_rate": 0.000281648344441025, "loss": 0.0273, "step": 24250 }, { "epoch": 0.12, "learning_rate": 0.00028164077674801096, "loss": 0.0303, "step": 24260 }, { "epoch": 0.12, "learning_rate": 0.00028163320905499694, "loss": 0.0329, "step": 24270 }, { "epoch": 0.12, "learning_rate": 0.0002816256413619829, "loss": 0.0332, "step": 24280 }, { "epoch": 0.12, "learning_rate": 0.0002816180736689689, "loss": 0.0362, "step": 24290 }, { "epoch": 0.12, "learning_rate": 0.0002816105059759549, "loss": 0.0304, "step": 24300 }, { "epoch": 0.12, "learning_rate": 0.0002816029382829409, "loss": 0.0287, "step": 24310 }, { "epoch": 0.12, "learning_rate": 0.0002815953705899269, "loss": 0.0327, "step": 24320 }, { "epoch": 0.12, "learning_rate": 0.0002815878028969129, "loss": 0.0282, "step": 24330 }, { "epoch": 0.12, "learning_rate": 0.00028158023520389886, "loss": 0.0288, "step": 24340 }, { "epoch": 0.12, "learning_rate": 0.00028157266751088484, "loss": 0.0349, "step": 24350 }, { "epoch": 0.12, "learning_rate": 0.0002815650998178708, "loss": 0.0319, "step": 24360 }, { "epoch": 0.12, "learning_rate": 0.0002815575321248568, "loss": 0.0286, "step": 24370 }, { "epoch": 0.12, "learning_rate": 0.00028154996443184284, "loss": 0.0275, "step": 24380 }, { "epoch": 0.12, "learning_rate": 0.0002815423967388288, "loss": 0.0355, "step": 24390 }, { "epoch": 0.12, "learning_rate": 0.0002815348290458148, "loss": 0.0302, "step": 24400 }, { "epoch": 0.12, "learning_rate": 0.0002815272613528008, "loss": 0.0293, "step": 24410 }, { "epoch": 0.12, "learning_rate": 0.00028151969365978677, "loss": 0.0315, "step": 24420 }, { "epoch": 0.12, "learning_rate": 0.00028151212596677275, "loss": 0.0235, "step": 24430 }, { "epoch": 0.12, "learning_rate": 0.0002815045582737588, "loss": 0.0301, "step": 24440 }, { "epoch": 0.12, "learning_rate": 0.00028149699058074477, "loss": 0.029, "step": 24450 }, { "epoch": 0.12, "learning_rate": 0.00028148942288773075, "loss": 0.0302, "step": 24460 }, { "epoch": 0.12, "learning_rate": 0.00028148185519471673, "loss": 0.0273, "step": 24470 }, { "epoch": 0.12, "learning_rate": 0.0002814742875017027, "loss": 0.0269, "step": 24480 }, { "epoch": 0.12, "learning_rate": 0.0002814667198086887, "loss": 0.0247, "step": 24490 }, { "epoch": 0.12, "learning_rate": 0.00028145915211567473, "loss": 0.026, "step": 24500 }, { "epoch": 0.12, "learning_rate": 0.00028145158442266066, "loss": 0.0294, "step": 24510 }, { "epoch": 0.12, "learning_rate": 0.00028144401672964664, "loss": 0.0272, "step": 24520 }, { "epoch": 0.12, "learning_rate": 0.0002814364490366326, "loss": 0.0217, "step": 24530 }, { "epoch": 0.12, "learning_rate": 0.00028142888134361865, "loss": 0.0293, "step": 24540 }, { "epoch": 0.12, "learning_rate": 0.00028142131365060464, "loss": 0.0248, "step": 24550 }, { "epoch": 0.12, "learning_rate": 0.0002814137459575906, "loss": 0.0291, "step": 24560 }, { "epoch": 0.12, "learning_rate": 0.0002814061782645766, "loss": 0.0301, "step": 24570 }, { "epoch": 0.12, "learning_rate": 0.0002813986105715626, "loss": 0.027, "step": 24580 }, { "epoch": 0.12, "learning_rate": 0.00028139104287854856, "loss": 0.0261, "step": 24590 }, { "epoch": 0.12, "learning_rate": 0.00028138347518553454, "loss": 0.034, "step": 24600 }, { "epoch": 0.12, "learning_rate": 0.0002813759074925206, "loss": 0.028, "step": 24610 }, { "epoch": 0.12, "learning_rate": 0.00028136833979950656, "loss": 0.0271, "step": 24620 }, { "epoch": 0.12, "learning_rate": 0.00028136077210649254, "loss": 0.0243, "step": 24630 }, { "epoch": 0.12, "learning_rate": 0.0002813532044134785, "loss": 0.0262, "step": 24640 }, { "epoch": 0.12, "learning_rate": 0.0002813456367204645, "loss": 0.0321, "step": 24650 }, { "epoch": 0.12, "learning_rate": 0.0002813380690274505, "loss": 0.0278, "step": 24660 }, { "epoch": 0.12, "learning_rate": 0.0002813305013344365, "loss": 0.0268, "step": 24670 }, { "epoch": 0.12, "learning_rate": 0.0002813229336414225, "loss": 0.0261, "step": 24680 }, { "epoch": 0.12, "learning_rate": 0.0002813153659484085, "loss": 0.0272, "step": 24690 }, { "epoch": 0.12, "learning_rate": 0.00028130779825539447, "loss": 0.0261, "step": 24700 }, { "epoch": 0.12, "learning_rate": 0.00028130023056238045, "loss": 0.0262, "step": 24710 }, { "epoch": 0.12, "learning_rate": 0.00028129266286936643, "loss": 0.0257, "step": 24720 }, { "epoch": 0.12, "learning_rate": 0.00028128509517635246, "loss": 0.0253, "step": 24730 }, { "epoch": 0.12, "learning_rate": 0.00028127752748333845, "loss": 0.0288, "step": 24740 }, { "epoch": 0.12, "learning_rate": 0.0002812699597903244, "loss": 0.0277, "step": 24750 }, { "epoch": 0.12, "learning_rate": 0.0002812623920973104, "loss": 0.0255, "step": 24760 }, { "epoch": 0.12, "learning_rate": 0.0002812548244042964, "loss": 0.0246, "step": 24770 }, { "epoch": 0.13, "learning_rate": 0.00028124725671128237, "loss": 0.0251, "step": 24780 }, { "epoch": 0.13, "learning_rate": 0.00028123968901826835, "loss": 0.0291, "step": 24790 }, { "epoch": 0.13, "learning_rate": 0.0002812321213252544, "loss": 0.0275, "step": 24800 }, { "epoch": 0.13, "learning_rate": 0.00028122455363224037, "loss": 0.0207, "step": 24810 }, { "epoch": 0.13, "learning_rate": 0.00028121698593922635, "loss": 0.023, "step": 24820 }, { "epoch": 0.13, "learning_rate": 0.00028120941824621233, "loss": 0.0244, "step": 24830 }, { "epoch": 0.13, "learning_rate": 0.0002812018505531983, "loss": 0.0243, "step": 24840 }, { "epoch": 0.13, "learning_rate": 0.0002811942828601843, "loss": 0.0252, "step": 24850 }, { "epoch": 0.13, "learning_rate": 0.00028118671516717033, "loss": 0.0266, "step": 24860 }, { "epoch": 0.13, "learning_rate": 0.0002811791474741563, "loss": 0.0278, "step": 24870 }, { "epoch": 0.13, "learning_rate": 0.0002811715797811423, "loss": 0.0258, "step": 24880 }, { "epoch": 0.13, "learning_rate": 0.0002811640120881283, "loss": 0.0303, "step": 24890 }, { "epoch": 0.13, "learning_rate": 0.00028115644439511426, "loss": 0.0255, "step": 24900 }, { "epoch": 0.13, "learning_rate": 0.00028114887670210024, "loss": 0.0287, "step": 24910 }, { "epoch": 0.13, "learning_rate": 0.0002811413090090862, "loss": 0.0292, "step": 24920 }, { "epoch": 0.13, "learning_rate": 0.00028113374131607226, "loss": 0.0314, "step": 24930 }, { "epoch": 0.13, "learning_rate": 0.00028112617362305824, "loss": 0.0283, "step": 24940 }, { "epoch": 0.13, "learning_rate": 0.0002811186059300442, "loss": 0.0254, "step": 24950 }, { "epoch": 0.13, "learning_rate": 0.0002811110382370302, "loss": 0.0273, "step": 24960 }, { "epoch": 0.13, "learning_rate": 0.0002811034705440162, "loss": 0.0274, "step": 24970 }, { "epoch": 0.13, "learning_rate": 0.00028109590285100216, "loss": 0.0304, "step": 24980 }, { "epoch": 0.13, "learning_rate": 0.0002810883351579882, "loss": 0.0299, "step": 24990 }, { "epoch": 0.13, "learning_rate": 0.0002810807674649742, "loss": 0.0289, "step": 25000 }, { "epoch": 0.13, "eval_cer": 0.9144751078837893, "eval_loss": 0.01934368908405304, "eval_runtime": 117.2646, "eval_samples_per_second": 17.055, "eval_steps_per_second": 4.264, "step": 25000 }, { "epoch": 0.13, "learning_rate": 0.00028107319977196016, "loss": 0.032, "step": 25010 }, { "epoch": 0.13, "learning_rate": 0.00028106563207894614, "loss": 0.0244, "step": 25020 }, { "epoch": 0.13, "learning_rate": 0.0002810580643859321, "loss": 0.0296, "step": 25030 }, { "epoch": 0.13, "learning_rate": 0.0002810504966929181, "loss": 0.0274, "step": 25040 }, { "epoch": 0.13, "learning_rate": 0.00028104292899990414, "loss": 0.0288, "step": 25050 }, { "epoch": 0.13, "learning_rate": 0.0002810353613068901, "loss": 0.0311, "step": 25060 }, { "epoch": 0.13, "learning_rate": 0.0002810277936138761, "loss": 0.0269, "step": 25070 }, { "epoch": 0.13, "learning_rate": 0.0002810202259208621, "loss": 0.0316, "step": 25080 }, { "epoch": 0.13, "learning_rate": 0.00028101265822784807, "loss": 0.0299, "step": 25090 }, { "epoch": 0.13, "learning_rate": 0.00028100509053483405, "loss": 0.0291, "step": 25100 }, { "epoch": 0.13, "learning_rate": 0.00028099752284182003, "loss": 0.0313, "step": 25110 }, { "epoch": 0.13, "learning_rate": 0.00028098995514880607, "loss": 0.031, "step": 25120 }, { "epoch": 0.13, "learning_rate": 0.00028098238745579205, "loss": 0.028, "step": 25130 }, { "epoch": 0.13, "learning_rate": 0.00028097481976277803, "loss": 0.025, "step": 25140 }, { "epoch": 0.13, "learning_rate": 0.000280967252069764, "loss": 0.0181, "step": 25150 }, { "epoch": 0.13, "learning_rate": 0.00028095968437675, "loss": 0.027, "step": 25160 }, { "epoch": 0.13, "learning_rate": 0.00028095211668373597, "loss": 0.0255, "step": 25170 }, { "epoch": 0.13, "learning_rate": 0.000280944548990722, "loss": 0.0309, "step": 25180 }, { "epoch": 0.13, "learning_rate": 0.000280936981297708, "loss": 0.0269, "step": 25190 }, { "epoch": 0.13, "learning_rate": 0.00028092941360469397, "loss": 0.0306, "step": 25200 }, { "epoch": 0.13, "learning_rate": 0.00028092184591167995, "loss": 0.0282, "step": 25210 }, { "epoch": 0.13, "learning_rate": 0.00028091427821866593, "loss": 0.0253, "step": 25220 }, { "epoch": 0.13, "learning_rate": 0.0002809067105256519, "loss": 0.0256, "step": 25230 }, { "epoch": 0.13, "learning_rate": 0.00028089914283263795, "loss": 0.0316, "step": 25240 }, { "epoch": 0.13, "learning_rate": 0.00028089157513962393, "loss": 0.0256, "step": 25250 }, { "epoch": 0.13, "learning_rate": 0.0002808840074466099, "loss": 0.0257, "step": 25260 }, { "epoch": 0.13, "learning_rate": 0.0002808764397535959, "loss": 0.0248, "step": 25270 }, { "epoch": 0.13, "learning_rate": 0.0002808688720605819, "loss": 0.0261, "step": 25280 }, { "epoch": 0.13, "learning_rate": 0.00028086130436756786, "loss": 0.0283, "step": 25290 }, { "epoch": 0.13, "learning_rate": 0.00028085373667455384, "loss": 0.0252, "step": 25300 }, { "epoch": 0.13, "learning_rate": 0.0002808461689815399, "loss": 0.0266, "step": 25310 }, { "epoch": 0.13, "learning_rate": 0.00028083860128852586, "loss": 0.0215, "step": 25320 }, { "epoch": 0.13, "learning_rate": 0.00028083103359551184, "loss": 0.0299, "step": 25330 }, { "epoch": 0.13, "learning_rate": 0.0002808234659024978, "loss": 0.0243, "step": 25340 }, { "epoch": 0.13, "learning_rate": 0.0002808158982094838, "loss": 0.0348, "step": 25350 }, { "epoch": 0.13, "learning_rate": 0.0002808083305164698, "loss": 0.0266, "step": 25360 }, { "epoch": 0.13, "learning_rate": 0.0002808007628234558, "loss": 0.0305, "step": 25370 }, { "epoch": 0.13, "learning_rate": 0.0002807931951304418, "loss": 0.0269, "step": 25380 }, { "epoch": 0.13, "learning_rate": 0.0002807856274374278, "loss": 0.0313, "step": 25390 }, { "epoch": 0.13, "learning_rate": 0.00028077805974441376, "loss": 0.03, "step": 25400 }, { "epoch": 0.13, "learning_rate": 0.00028077049205139974, "loss": 0.0283, "step": 25410 }, { "epoch": 0.13, "learning_rate": 0.0002807629243583857, "loss": 0.0247, "step": 25420 }, { "epoch": 0.13, "learning_rate": 0.0002807553566653717, "loss": 0.0282, "step": 25430 }, { "epoch": 0.13, "learning_rate": 0.00028074778897235774, "loss": 0.0228, "step": 25440 }, { "epoch": 0.13, "learning_rate": 0.0002807402212793437, "loss": 0.027, "step": 25450 }, { "epoch": 0.13, "learning_rate": 0.0002807326535863297, "loss": 0.0335, "step": 25460 }, { "epoch": 0.13, "learning_rate": 0.0002807250858933157, "loss": 0.0284, "step": 25470 }, { "epoch": 0.13, "learning_rate": 0.00028071751820030167, "loss": 0.03, "step": 25480 }, { "epoch": 0.13, "learning_rate": 0.00028070995050728765, "loss": 0.0267, "step": 25490 }, { "epoch": 0.13, "learning_rate": 0.0002807023828142737, "loss": 0.0261, "step": 25500 }, { "epoch": 0.13, "learning_rate": 0.00028069481512125967, "loss": 0.0282, "step": 25510 }, { "epoch": 0.13, "learning_rate": 0.00028068724742824565, "loss": 0.0257, "step": 25520 }, { "epoch": 0.13, "learning_rate": 0.00028067967973523163, "loss": 0.0275, "step": 25530 }, { "epoch": 0.13, "learning_rate": 0.0002806721120422176, "loss": 0.0248, "step": 25540 }, { "epoch": 0.13, "learning_rate": 0.0002806645443492036, "loss": 0.0252, "step": 25550 }, { "epoch": 0.13, "learning_rate": 0.00028065697665618963, "loss": 0.0278, "step": 25560 }, { "epoch": 0.13, "learning_rate": 0.0002806494089631756, "loss": 0.0305, "step": 25570 }, { "epoch": 0.13, "learning_rate": 0.0002806418412701616, "loss": 0.0253, "step": 25580 }, { "epoch": 0.13, "learning_rate": 0.00028063427357714757, "loss": 0.0302, "step": 25590 }, { "epoch": 0.13, "learning_rate": 0.00028062670588413355, "loss": 0.0312, "step": 25600 }, { "epoch": 0.13, "learning_rate": 0.00028061913819111954, "loss": 0.0293, "step": 25610 }, { "epoch": 0.13, "learning_rate": 0.0002806115704981055, "loss": 0.0286, "step": 25620 }, { "epoch": 0.13, "learning_rate": 0.00028060400280509155, "loss": 0.0266, "step": 25630 }, { "epoch": 0.13, "learning_rate": 0.00028059643511207753, "loss": 0.0245, "step": 25640 }, { "epoch": 0.13, "learning_rate": 0.0002805888674190635, "loss": 0.0277, "step": 25650 }, { "epoch": 0.13, "learning_rate": 0.0002805812997260495, "loss": 0.0281, "step": 25660 }, { "epoch": 0.13, "learning_rate": 0.0002805737320330355, "loss": 0.0347, "step": 25670 }, { "epoch": 0.13, "learning_rate": 0.00028056616434002146, "loss": 0.0276, "step": 25680 }, { "epoch": 0.13, "learning_rate": 0.0002805585966470075, "loss": 0.03, "step": 25690 }, { "epoch": 0.13, "learning_rate": 0.0002805510289539935, "loss": 0.0271, "step": 25700 }, { "epoch": 0.13, "learning_rate": 0.00028054346126097946, "loss": 0.0377, "step": 25710 }, { "epoch": 0.13, "learning_rate": 0.00028053589356796544, "loss": 0.0605, "step": 25720 }, { "epoch": 0.13, "learning_rate": 0.0002805283258749514, "loss": 0.032, "step": 25730 }, { "epoch": 0.13, "learning_rate": 0.0002805207581819374, "loss": 0.0337, "step": 25740 }, { "epoch": 0.13, "learning_rate": 0.00028051319048892344, "loss": 0.0272, "step": 25750 }, { "epoch": 0.13, "learning_rate": 0.0002805056227959094, "loss": 0.0316, "step": 25760 }, { "epoch": 0.13, "learning_rate": 0.00028049805510289535, "loss": 0.0249, "step": 25770 }, { "epoch": 0.13, "learning_rate": 0.00028049048740988133, "loss": 0.0272, "step": 25780 }, { "epoch": 0.13, "learning_rate": 0.00028048291971686736, "loss": 0.0345, "step": 25790 }, { "epoch": 0.13, "learning_rate": 0.00028047535202385335, "loss": 0.0284, "step": 25800 }, { "epoch": 0.13, "learning_rate": 0.00028046778433083933, "loss": 0.0267, "step": 25810 }, { "epoch": 0.13, "learning_rate": 0.0002804602166378253, "loss": 0.0271, "step": 25820 }, { "epoch": 0.13, "learning_rate": 0.0002804526489448113, "loss": 0.0298, "step": 25830 }, { "epoch": 0.13, "learning_rate": 0.00028044508125179727, "loss": 0.0277, "step": 25840 }, { "epoch": 0.13, "learning_rate": 0.00028043751355878325, "loss": 0.0267, "step": 25850 }, { "epoch": 0.13, "learning_rate": 0.0002804299458657693, "loss": 0.0267, "step": 25860 }, { "epoch": 0.13, "learning_rate": 0.00028042237817275527, "loss": 0.024, "step": 25870 }, { "epoch": 0.13, "learning_rate": 0.00028041481047974125, "loss": 0.0263, "step": 25880 }, { "epoch": 0.13, "learning_rate": 0.00028040724278672723, "loss": 0.0284, "step": 25890 }, { "epoch": 0.13, "learning_rate": 0.0002803996750937132, "loss": 0.0283, "step": 25900 }, { "epoch": 0.13, "learning_rate": 0.0002803921074006992, "loss": 0.0398, "step": 25910 }, { "epoch": 0.13, "learning_rate": 0.00028038453970768523, "loss": 0.0498, "step": 25920 }, { "epoch": 0.13, "learning_rate": 0.0002803769720146712, "loss": 0.03, "step": 25930 }, { "epoch": 0.13, "learning_rate": 0.0002803694043216572, "loss": 0.0254, "step": 25940 }, { "epoch": 0.13, "learning_rate": 0.0002803618366286432, "loss": 0.027, "step": 25950 }, { "epoch": 0.13, "learning_rate": 0.00028035426893562916, "loss": 0.0304, "step": 25960 }, { "epoch": 0.13, "learning_rate": 0.00028034670124261514, "loss": 0.0237, "step": 25970 }, { "epoch": 0.13, "learning_rate": 0.0002803391335496011, "loss": 0.0255, "step": 25980 }, { "epoch": 0.13, "learning_rate": 0.00028033156585658716, "loss": 0.0223, "step": 25990 }, { "epoch": 0.13, "learning_rate": 0.00028032399816357314, "loss": 0.0258, "step": 26000 }, { "epoch": 0.13, "eval_cer": 0.9144799598644162, "eval_loss": 0.019629212096333504, "eval_runtime": 117.332, "eval_samples_per_second": 17.046, "eval_steps_per_second": 4.261, "step": 26000 }, { "epoch": 0.13, "learning_rate": 0.0002803164304705591, "loss": 0.0294, "step": 26010 }, { "epoch": 0.13, "learning_rate": 0.0002803088627775451, "loss": 0.028, "step": 26020 }, { "epoch": 0.13, "learning_rate": 0.0002803012950845311, "loss": 0.0272, "step": 26030 }, { "epoch": 0.13, "learning_rate": 0.00028029372739151706, "loss": 0.0292, "step": 26040 }, { "epoch": 0.13, "learning_rate": 0.0002802861596985031, "loss": 0.0327, "step": 26050 }, { "epoch": 0.13, "learning_rate": 0.0002802785920054891, "loss": 0.0273, "step": 26060 }, { "epoch": 0.13, "learning_rate": 0.00028027102431247506, "loss": 0.0342, "step": 26070 }, { "epoch": 0.13, "learning_rate": 0.00028026345661946104, "loss": 0.0319, "step": 26080 }, { "epoch": 0.13, "learning_rate": 0.000280255888926447, "loss": 0.031, "step": 26090 }, { "epoch": 0.13, "learning_rate": 0.000280248321233433, "loss": 0.0213, "step": 26100 }, { "epoch": 0.13, "learning_rate": 0.00028024075354041904, "loss": 0.0271, "step": 26110 }, { "epoch": 0.13, "learning_rate": 0.000280233185847405, "loss": 0.0279, "step": 26120 }, { "epoch": 0.13, "learning_rate": 0.000280225618154391, "loss": 0.0244, "step": 26130 }, { "epoch": 0.13, "learning_rate": 0.000280218050461377, "loss": 0.0294, "step": 26140 }, { "epoch": 0.13, "learning_rate": 0.00028021048276836297, "loss": 0.0253, "step": 26150 }, { "epoch": 0.13, "learning_rate": 0.00028020291507534895, "loss": 0.0221, "step": 26160 }, { "epoch": 0.13, "learning_rate": 0.00028019534738233493, "loss": 0.0235, "step": 26170 }, { "epoch": 0.13, "learning_rate": 0.00028018777968932097, "loss": 0.0256, "step": 26180 }, { "epoch": 0.13, "learning_rate": 0.00028018021199630695, "loss": 0.0281, "step": 26190 }, { "epoch": 0.13, "learning_rate": 0.00028017264430329293, "loss": 0.0277, "step": 26200 }, { "epoch": 0.13, "learning_rate": 0.0002801650766102789, "loss": 0.0247, "step": 26210 }, { "epoch": 0.13, "learning_rate": 0.0002801575089172649, "loss": 0.0251, "step": 26220 }, { "epoch": 0.13, "learning_rate": 0.0002801499412242509, "loss": 0.0261, "step": 26230 }, { "epoch": 0.13, "learning_rate": 0.0002801423735312369, "loss": 0.0286, "step": 26240 }, { "epoch": 0.13, "learning_rate": 0.0002801348058382229, "loss": 0.0289, "step": 26250 }, { "epoch": 0.13, "learning_rate": 0.00028012723814520887, "loss": 0.0265, "step": 26260 }, { "epoch": 0.13, "learning_rate": 0.00028011967045219485, "loss": 0.0294, "step": 26270 }, { "epoch": 0.13, "learning_rate": 0.00028011210275918083, "loss": 0.0306, "step": 26280 }, { "epoch": 0.13, "learning_rate": 0.0002801045350661668, "loss": 0.0267, "step": 26290 }, { "epoch": 0.13, "learning_rate": 0.00028009696737315285, "loss": 0.0307, "step": 26300 }, { "epoch": 0.13, "learning_rate": 0.00028008939968013883, "loss": 0.027, "step": 26310 }, { "epoch": 0.13, "learning_rate": 0.0002800818319871248, "loss": 0.0289, "step": 26320 }, { "epoch": 0.13, "learning_rate": 0.0002800742642941108, "loss": 0.0275, "step": 26330 }, { "epoch": 0.13, "learning_rate": 0.0002800666966010968, "loss": 0.0258, "step": 26340 }, { "epoch": 0.13, "learning_rate": 0.00028005912890808276, "loss": 0.0311, "step": 26350 }, { "epoch": 0.13, "learning_rate": 0.00028005156121506874, "loss": 0.0253, "step": 26360 }, { "epoch": 0.13, "learning_rate": 0.0002800439935220548, "loss": 0.0236, "step": 26370 }, { "epoch": 0.13, "learning_rate": 0.00028003642582904076, "loss": 0.0235, "step": 26380 }, { "epoch": 0.13, "learning_rate": 0.00028002885813602674, "loss": 0.0272, "step": 26390 }, { "epoch": 0.13, "learning_rate": 0.0002800212904430127, "loss": 0.0229, "step": 26400 }, { "epoch": 0.13, "learning_rate": 0.0002800137227499987, "loss": 0.0255, "step": 26410 }, { "epoch": 0.13, "learning_rate": 0.0002800061550569847, "loss": 0.0301, "step": 26420 }, { "epoch": 0.13, "learning_rate": 0.0002799985873639707, "loss": 0.0259, "step": 26430 }, { "epoch": 0.13, "learning_rate": 0.0002799910196709567, "loss": 0.0226, "step": 26440 }, { "epoch": 0.13, "learning_rate": 0.0002799834519779427, "loss": 0.0285, "step": 26450 }, { "epoch": 0.13, "learning_rate": 0.00027997588428492866, "loss": 0.0286, "step": 26460 }, { "epoch": 0.13, "learning_rate": 0.00027996831659191464, "loss": 0.027, "step": 26470 }, { "epoch": 0.13, "learning_rate": 0.0002799607488989006, "loss": 0.0276, "step": 26480 }, { "epoch": 0.13, "learning_rate": 0.0002799531812058866, "loss": 0.0285, "step": 26490 }, { "epoch": 0.13, "learning_rate": 0.00027994561351287264, "loss": 0.0327, "step": 26500 }, { "epoch": 0.13, "learning_rate": 0.0002799380458198586, "loss": 0.0265, "step": 26510 }, { "epoch": 0.13, "learning_rate": 0.0002799304781268446, "loss": 0.0286, "step": 26520 }, { "epoch": 0.13, "learning_rate": 0.0002799229104338306, "loss": 0.0261, "step": 26530 }, { "epoch": 0.13, "learning_rate": 0.00027991534274081657, "loss": 0.0244, "step": 26540 }, { "epoch": 0.13, "learning_rate": 0.00027990777504780255, "loss": 0.0262, "step": 26550 }, { "epoch": 0.13, "learning_rate": 0.0002799002073547886, "loss": 0.0246, "step": 26560 }, { "epoch": 0.13, "learning_rate": 0.00027989263966177457, "loss": 0.0241, "step": 26570 }, { "epoch": 0.13, "learning_rate": 0.00027988507196876055, "loss": 0.0267, "step": 26580 }, { "epoch": 0.13, "learning_rate": 0.00027987750427574653, "loss": 0.0271, "step": 26590 }, { "epoch": 0.13, "learning_rate": 0.0002798699365827325, "loss": 0.0289, "step": 26600 }, { "epoch": 0.13, "learning_rate": 0.0002798623688897185, "loss": 0.0224, "step": 26610 }, { "epoch": 0.13, "learning_rate": 0.00027985480119670453, "loss": 0.0345, "step": 26620 }, { "epoch": 0.13, "learning_rate": 0.0002798472335036905, "loss": 0.0268, "step": 26630 }, { "epoch": 0.13, "learning_rate": 0.0002798396658106765, "loss": 0.0274, "step": 26640 }, { "epoch": 0.13, "learning_rate": 0.0002798320981176625, "loss": 0.0272, "step": 26650 }, { "epoch": 0.13, "learning_rate": 0.00027982453042464845, "loss": 0.0246, "step": 26660 }, { "epoch": 0.13, "learning_rate": 0.00027981696273163444, "loss": 0.0257, "step": 26670 }, { "epoch": 0.13, "learning_rate": 0.0002798093950386204, "loss": 0.0251, "step": 26680 }, { "epoch": 0.13, "learning_rate": 0.00027980182734560645, "loss": 0.0335, "step": 26690 }, { "epoch": 0.13, "learning_rate": 0.00027979425965259243, "loss": 0.0317, "step": 26700 }, { "epoch": 0.13, "learning_rate": 0.0002797866919595784, "loss": 0.029, "step": 26710 }, { "epoch": 0.13, "learning_rate": 0.0002797791242665644, "loss": 0.0285, "step": 26720 }, { "epoch": 0.13, "learning_rate": 0.0002797715565735504, "loss": 0.0266, "step": 26730 }, { "epoch": 0.13, "learning_rate": 0.00027976398888053636, "loss": 0.0233, "step": 26740 }, { "epoch": 0.13, "learning_rate": 0.0002797564211875224, "loss": 0.0269, "step": 26750 }, { "epoch": 0.14, "learning_rate": 0.0002797488534945084, "loss": 0.0241, "step": 26760 }, { "epoch": 0.14, "learning_rate": 0.00027974128580149436, "loss": 0.0285, "step": 26770 }, { "epoch": 0.14, "learning_rate": 0.00027973371810848034, "loss": 0.0314, "step": 26780 }, { "epoch": 0.14, "learning_rate": 0.0002797261504154663, "loss": 0.0305, "step": 26790 }, { "epoch": 0.14, "learning_rate": 0.0002797185827224523, "loss": 0.0261, "step": 26800 }, { "epoch": 0.14, "learning_rate": 0.00027971101502943834, "loss": 0.0316, "step": 26810 }, { "epoch": 0.14, "learning_rate": 0.0002797034473364243, "loss": 0.0237, "step": 26820 }, { "epoch": 0.14, "learning_rate": 0.0002796958796434103, "loss": 0.0287, "step": 26830 }, { "epoch": 0.14, "learning_rate": 0.0002796883119503963, "loss": 0.024, "step": 26840 }, { "epoch": 0.14, "learning_rate": 0.00027968074425738226, "loss": 0.0314, "step": 26850 }, { "epoch": 0.14, "learning_rate": 0.00027967317656436825, "loss": 0.0315, "step": 26860 }, { "epoch": 0.14, "learning_rate": 0.00027966560887135423, "loss": 0.0268, "step": 26870 }, { "epoch": 0.14, "learning_rate": 0.00027965804117834026, "loss": 0.0279, "step": 26880 }, { "epoch": 0.14, "learning_rate": 0.00027965047348532624, "loss": 0.0324, "step": 26890 }, { "epoch": 0.14, "learning_rate": 0.0002796429057923122, "loss": 0.0249, "step": 26900 }, { "epoch": 0.14, "learning_rate": 0.0002796353380992982, "loss": 0.0301, "step": 26910 }, { "epoch": 0.14, "learning_rate": 0.0002796277704062842, "loss": 0.0246, "step": 26920 }, { "epoch": 0.14, "learning_rate": 0.00027962020271327017, "loss": 0.0289, "step": 26930 }, { "epoch": 0.14, "learning_rate": 0.0002796126350202562, "loss": 0.0264, "step": 26940 }, { "epoch": 0.14, "learning_rate": 0.0002796050673272422, "loss": 0.0234, "step": 26950 }, { "epoch": 0.14, "learning_rate": 0.00027959749963422817, "loss": 0.0335, "step": 26960 }, { "epoch": 0.14, "learning_rate": 0.00027958993194121415, "loss": 0.0256, "step": 26970 }, { "epoch": 0.14, "learning_rate": 0.00027958236424820013, "loss": 0.0356, "step": 26980 }, { "epoch": 0.14, "learning_rate": 0.0002795747965551861, "loss": 0.0252, "step": 26990 }, { "epoch": 0.14, "learning_rate": 0.0002795672288621721, "loss": 0.0255, "step": 27000 }, { "epoch": 0.14, "eval_cer": 0.9144469663961525, "eval_loss": 0.020766137167811394, "eval_runtime": 117.1709, "eval_samples_per_second": 17.069, "eval_steps_per_second": 4.267, "step": 27000 }, { "epoch": 0.14, "learning_rate": 0.00027955966116915813, "loss": 0.0269, "step": 27010 }, { "epoch": 0.14, "learning_rate": 0.0002795520934761441, "loss": 0.0345, "step": 27020 }, { "epoch": 0.14, "learning_rate": 0.00027954452578313004, "loss": 0.0293, "step": 27030 }, { "epoch": 0.14, "learning_rate": 0.0002795369580901161, "loss": 0.0293, "step": 27040 }, { "epoch": 0.14, "learning_rate": 0.00027952939039710206, "loss": 0.0265, "step": 27050 }, { "epoch": 0.14, "learning_rate": 0.00027952182270408804, "loss": 0.0272, "step": 27060 }, { "epoch": 0.14, "learning_rate": 0.000279514255011074, "loss": 0.0266, "step": 27070 }, { "epoch": 0.14, "learning_rate": 0.00027950668731806, "loss": 0.0241, "step": 27080 }, { "epoch": 0.14, "learning_rate": 0.000279499119625046, "loss": 0.0265, "step": 27090 }, { "epoch": 0.14, "learning_rate": 0.00027949155193203196, "loss": 0.0272, "step": 27100 }, { "epoch": 0.14, "learning_rate": 0.000279483984239018, "loss": 0.033, "step": 27110 }, { "epoch": 0.14, "learning_rate": 0.000279476416546004, "loss": 0.0283, "step": 27120 }, { "epoch": 0.14, "learning_rate": 0.00027946884885298996, "loss": 0.0311, "step": 27130 }, { "epoch": 0.14, "learning_rate": 0.00027946128115997594, "loss": 0.0304, "step": 27140 }, { "epoch": 0.14, "learning_rate": 0.0002794537134669619, "loss": 0.0269, "step": 27150 }, { "epoch": 0.14, "learning_rate": 0.0002794461457739479, "loss": 0.0238, "step": 27160 }, { "epoch": 0.14, "learning_rate": 0.00027943857808093394, "loss": 0.0255, "step": 27170 }, { "epoch": 0.14, "learning_rate": 0.0002794310103879199, "loss": 0.0229, "step": 27180 }, { "epoch": 0.14, "learning_rate": 0.0002794234426949059, "loss": 0.026, "step": 27190 }, { "epoch": 0.14, "learning_rate": 0.0002794158750018919, "loss": 0.0263, "step": 27200 }, { "epoch": 0.14, "learning_rate": 0.00027940830730887787, "loss": 0.0264, "step": 27210 }, { "epoch": 0.14, "learning_rate": 0.00027940073961586385, "loss": 0.0274, "step": 27220 }, { "epoch": 0.14, "learning_rate": 0.00027939317192284983, "loss": 0.0254, "step": 27230 }, { "epoch": 0.14, "learning_rate": 0.00027938560422983587, "loss": 0.0266, "step": 27240 }, { "epoch": 0.14, "learning_rate": 0.00027937803653682185, "loss": 0.0252, "step": 27250 }, { "epoch": 0.14, "learning_rate": 0.00027937046884380783, "loss": 0.0275, "step": 27260 }, { "epoch": 0.14, "learning_rate": 0.0002793629011507938, "loss": 0.023, "step": 27270 }, { "epoch": 0.14, "learning_rate": 0.0002793553334577798, "loss": 0.0264, "step": 27280 }, { "epoch": 0.14, "learning_rate": 0.0002793477657647658, "loss": 0.0249, "step": 27290 }, { "epoch": 0.14, "learning_rate": 0.0002793401980717518, "loss": 0.0292, "step": 27300 }, { "epoch": 0.14, "learning_rate": 0.0002793326303787378, "loss": 0.0271, "step": 27310 }, { "epoch": 0.14, "learning_rate": 0.00027932506268572377, "loss": 0.0252, "step": 27320 }, { "epoch": 0.14, "learning_rate": 0.00027931749499270975, "loss": 0.0293, "step": 27330 }, { "epoch": 0.14, "learning_rate": 0.00027930992729969573, "loss": 0.027, "step": 27340 }, { "epoch": 0.14, "learning_rate": 0.0002793023596066817, "loss": 0.0279, "step": 27350 }, { "epoch": 0.14, "learning_rate": 0.00027929479191366775, "loss": 0.0275, "step": 27360 }, { "epoch": 0.14, "learning_rate": 0.00027928722422065373, "loss": 0.0384, "step": 27370 }, { "epoch": 0.14, "learning_rate": 0.0002792796565276397, "loss": 0.0245, "step": 27380 }, { "epoch": 0.14, "learning_rate": 0.0002792720888346257, "loss": 0.0309, "step": 27390 }, { "epoch": 0.14, "learning_rate": 0.0002792645211416117, "loss": 0.0259, "step": 27400 }, { "epoch": 0.14, "learning_rate": 0.00027925695344859766, "loss": 0.0272, "step": 27410 }, { "epoch": 0.14, "learning_rate": 0.00027924938575558364, "loss": 0.0263, "step": 27420 }, { "epoch": 0.14, "learning_rate": 0.0002792418180625697, "loss": 0.0229, "step": 27430 }, { "epoch": 0.14, "learning_rate": 0.00027923425036955566, "loss": 0.0285, "step": 27440 }, { "epoch": 0.14, "learning_rate": 0.00027922668267654164, "loss": 0.0271, "step": 27450 }, { "epoch": 0.14, "learning_rate": 0.0002792191149835276, "loss": 0.0283, "step": 27460 }, { "epoch": 0.14, "learning_rate": 0.0002792115472905136, "loss": 0.0266, "step": 27470 }, { "epoch": 0.14, "learning_rate": 0.0002792039795974996, "loss": 0.0267, "step": 27480 }, { "epoch": 0.14, "learning_rate": 0.0002791964119044856, "loss": 0.0275, "step": 27490 }, { "epoch": 0.14, "learning_rate": 0.0002791888442114716, "loss": 0.0313, "step": 27500 }, { "epoch": 0.14, "learning_rate": 0.0002791812765184576, "loss": 0.0277, "step": 27510 }, { "epoch": 0.14, "learning_rate": 0.00027917370882544356, "loss": 0.0307, "step": 27520 }, { "epoch": 0.14, "learning_rate": 0.00027916614113242954, "loss": 0.0735, "step": 27530 }, { "epoch": 0.14, "learning_rate": 0.0002791585734394155, "loss": 0.0338, "step": 27540 }, { "epoch": 0.14, "learning_rate": 0.00027915100574640156, "loss": 0.0304, "step": 27550 }, { "epoch": 0.14, "learning_rate": 0.00027914343805338754, "loss": 0.036, "step": 27560 }, { "epoch": 0.14, "learning_rate": 0.0002791358703603735, "loss": 0.0325, "step": 27570 }, { "epoch": 0.14, "learning_rate": 0.0002791283026673595, "loss": 0.0392, "step": 27580 }, { "epoch": 0.14, "learning_rate": 0.0002791207349743455, "loss": 0.0254, "step": 27590 }, { "epoch": 0.14, "learning_rate": 0.00027911316728133147, "loss": 0.0372, "step": 27600 }, { "epoch": 0.14, "learning_rate": 0.00027910559958831745, "loss": 0.0293, "step": 27610 }, { "epoch": 0.14, "learning_rate": 0.0002790980318953035, "loss": 0.0353, "step": 27620 }, { "epoch": 0.14, "learning_rate": 0.00027909046420228947, "loss": 0.0362, "step": 27630 }, { "epoch": 0.14, "learning_rate": 0.00027908289650927545, "loss": 0.0291, "step": 27640 }, { "epoch": 0.14, "learning_rate": 0.00027907532881626143, "loss": 0.0336, "step": 27650 }, { "epoch": 0.14, "learning_rate": 0.0002790677611232474, "loss": 0.0239, "step": 27660 }, { "epoch": 0.14, "learning_rate": 0.0002790601934302334, "loss": 0.0268, "step": 27670 }, { "epoch": 0.14, "learning_rate": 0.00027905262573721943, "loss": 0.026, "step": 27680 }, { "epoch": 0.14, "learning_rate": 0.0002790450580442054, "loss": 0.0304, "step": 27690 }, { "epoch": 0.14, "learning_rate": 0.0002790374903511914, "loss": 0.0298, "step": 27700 }, { "epoch": 0.14, "learning_rate": 0.0002790299226581774, "loss": 0.0302, "step": 27710 }, { "epoch": 0.14, "learning_rate": 0.00027902235496516335, "loss": 0.0229, "step": 27720 }, { "epoch": 0.14, "learning_rate": 0.00027901478727214934, "loss": 0.0303, "step": 27730 }, { "epoch": 0.14, "learning_rate": 0.0002790072195791353, "loss": 0.0267, "step": 27740 }, { "epoch": 0.14, "learning_rate": 0.00027899965188612135, "loss": 0.0317, "step": 27750 }, { "epoch": 0.14, "learning_rate": 0.00027899208419310733, "loss": 0.028, "step": 27760 }, { "epoch": 0.14, "learning_rate": 0.0002789845165000933, "loss": 0.0281, "step": 27770 }, { "epoch": 0.14, "learning_rate": 0.0002789769488070793, "loss": 0.0298, "step": 27780 }, { "epoch": 0.14, "learning_rate": 0.0002789693811140653, "loss": 0.0308, "step": 27790 }, { "epoch": 0.14, "learning_rate": 0.00027896181342105126, "loss": 0.0301, "step": 27800 }, { "epoch": 0.14, "learning_rate": 0.0002789542457280373, "loss": 0.0275, "step": 27810 }, { "epoch": 0.14, "learning_rate": 0.0002789466780350233, "loss": 0.0259, "step": 27820 }, { "epoch": 0.14, "learning_rate": 0.00027893911034200926, "loss": 0.0266, "step": 27830 }, { "epoch": 0.14, "learning_rate": 0.00027893154264899524, "loss": 0.022, "step": 27840 }, { "epoch": 0.14, "learning_rate": 0.0002789239749559812, "loss": 0.0281, "step": 27850 }, { "epoch": 0.14, "learning_rate": 0.0002789164072629672, "loss": 0.0254, "step": 27860 }, { "epoch": 0.14, "learning_rate": 0.00027890883956995324, "loss": 0.0222, "step": 27870 }, { "epoch": 0.14, "learning_rate": 0.0002789012718769392, "loss": 0.0244, "step": 27880 }, { "epoch": 0.14, "learning_rate": 0.0002788937041839252, "loss": 0.023, "step": 27890 }, { "epoch": 0.14, "learning_rate": 0.0002788861364909112, "loss": 0.0324, "step": 27900 }, { "epoch": 0.14, "learning_rate": 0.00027887856879789716, "loss": 0.025, "step": 27910 }, { "epoch": 0.14, "learning_rate": 0.00027887100110488315, "loss": 0.0321, "step": 27920 }, { "epoch": 0.14, "learning_rate": 0.00027886343341186913, "loss": 0.0259, "step": 27930 }, { "epoch": 0.14, "learning_rate": 0.00027885586571885516, "loss": 0.0302, "step": 27940 }, { "epoch": 0.14, "learning_rate": 0.00027884829802584114, "loss": 0.0277, "step": 27950 }, { "epoch": 0.14, "learning_rate": 0.0002788407303328271, "loss": 0.0261, "step": 27960 }, { "epoch": 0.14, "learning_rate": 0.0002788331626398131, "loss": 0.0243, "step": 27970 }, { "epoch": 0.14, "learning_rate": 0.0002788255949467991, "loss": 0.0271, "step": 27980 }, { "epoch": 0.14, "learning_rate": 0.00027881802725378507, "loss": 0.0277, "step": 27990 }, { "epoch": 0.14, "learning_rate": 0.0002788104595607711, "loss": 0.0278, "step": 28000 }, { "epoch": 0.14, "eval_cer": 0.9144489071884033, "eval_loss": 0.019581960514187813, "eval_runtime": 117.2391, "eval_samples_per_second": 17.059, "eval_steps_per_second": 4.265, "step": 28000 }, { "epoch": 0.14, "learning_rate": 0.0002788028918677571, "loss": 0.026, "step": 28010 }, { "epoch": 0.14, "learning_rate": 0.00027879532417474307, "loss": 0.0265, "step": 28020 }, { "epoch": 0.14, "learning_rate": 0.00027878775648172905, "loss": 0.0289, "step": 28030 }, { "epoch": 0.14, "learning_rate": 0.00027878018878871503, "loss": 0.0244, "step": 28040 }, { "epoch": 0.14, "learning_rate": 0.000278772621095701, "loss": 0.026, "step": 28050 }, { "epoch": 0.14, "learning_rate": 0.000278765053402687, "loss": 0.0308, "step": 28060 }, { "epoch": 0.14, "learning_rate": 0.00027875748570967303, "loss": 0.0273, "step": 28070 }, { "epoch": 0.14, "learning_rate": 0.000278749918016659, "loss": 0.0355, "step": 28080 }, { "epoch": 0.14, "learning_rate": 0.000278742350323645, "loss": 0.0232, "step": 28090 }, { "epoch": 0.14, "learning_rate": 0.000278734782630631, "loss": 0.0242, "step": 28100 }, { "epoch": 0.14, "learning_rate": 0.00027872721493761696, "loss": 0.024, "step": 28110 }, { "epoch": 0.14, "learning_rate": 0.00027871964724460294, "loss": 0.0248, "step": 28120 }, { "epoch": 0.14, "learning_rate": 0.000278712079551589, "loss": 0.0276, "step": 28130 }, { "epoch": 0.14, "learning_rate": 0.00027870451185857495, "loss": 0.0257, "step": 28140 }, { "epoch": 0.14, "learning_rate": 0.00027869694416556094, "loss": 0.0262, "step": 28150 }, { "epoch": 0.14, "learning_rate": 0.0002786893764725469, "loss": 0.0285, "step": 28160 }, { "epoch": 0.14, "learning_rate": 0.0002786818087795329, "loss": 0.0277, "step": 28170 }, { "epoch": 0.14, "learning_rate": 0.0002786742410865189, "loss": 0.0282, "step": 28180 }, { "epoch": 0.14, "learning_rate": 0.0002786666733935049, "loss": 0.0276, "step": 28190 }, { "epoch": 0.14, "learning_rate": 0.0002786591057004909, "loss": 0.0262, "step": 28200 }, { "epoch": 0.14, "learning_rate": 0.0002786515380074769, "loss": 0.0309, "step": 28210 }, { "epoch": 0.14, "learning_rate": 0.00027864397031446286, "loss": 0.027, "step": 28220 }, { "epoch": 0.14, "learning_rate": 0.00027863640262144884, "loss": 0.028, "step": 28230 }, { "epoch": 0.14, "learning_rate": 0.0002786288349284348, "loss": 0.0263, "step": 28240 }, { "epoch": 0.14, "learning_rate": 0.0002786212672354208, "loss": 0.0252, "step": 28250 }, { "epoch": 0.14, "learning_rate": 0.00027861369954240684, "loss": 0.0231, "step": 28260 }, { "epoch": 0.14, "learning_rate": 0.0002786061318493928, "loss": 0.0324, "step": 28270 }, { "epoch": 0.14, "learning_rate": 0.00027859856415637875, "loss": 0.0271, "step": 28280 }, { "epoch": 0.14, "learning_rate": 0.00027859099646336473, "loss": 0.0323, "step": 28290 }, { "epoch": 0.14, "learning_rate": 0.00027858342877035077, "loss": 0.0298, "step": 28300 }, { "epoch": 0.14, "learning_rate": 0.00027857586107733675, "loss": 0.0259, "step": 28310 }, { "epoch": 0.14, "learning_rate": 0.00027856829338432273, "loss": 0.0275, "step": 28320 }, { "epoch": 0.14, "learning_rate": 0.0002785607256913087, "loss": 0.0289, "step": 28330 }, { "epoch": 0.14, "learning_rate": 0.0002785531579982947, "loss": 0.0295, "step": 28340 }, { "epoch": 0.14, "learning_rate": 0.0002785455903052807, "loss": 0.0278, "step": 28350 }, { "epoch": 0.14, "learning_rate": 0.0002785380226122667, "loss": 0.0243, "step": 28360 }, { "epoch": 0.14, "learning_rate": 0.0002785304549192527, "loss": 0.0245, "step": 28370 }, { "epoch": 0.14, "learning_rate": 0.00027852288722623867, "loss": 0.0259, "step": 28380 }, { "epoch": 0.14, "learning_rate": 0.00027851531953322465, "loss": 0.0271, "step": 28390 }, { "epoch": 0.14, "learning_rate": 0.00027850775184021064, "loss": 0.0339, "step": 28400 }, { "epoch": 0.14, "learning_rate": 0.0002785001841471966, "loss": 0.0302, "step": 28410 }, { "epoch": 0.14, "learning_rate": 0.00027849261645418265, "loss": 0.0254, "step": 28420 }, { "epoch": 0.14, "learning_rate": 0.00027848504876116863, "loss": 0.0304, "step": 28430 }, { "epoch": 0.14, "learning_rate": 0.0002784774810681546, "loss": 0.0308, "step": 28440 }, { "epoch": 0.14, "learning_rate": 0.0002784699133751406, "loss": 0.0263, "step": 28450 }, { "epoch": 0.14, "learning_rate": 0.0002784623456821266, "loss": 0.0257, "step": 28460 }, { "epoch": 0.14, "learning_rate": 0.00027845477798911256, "loss": 0.0271, "step": 28470 }, { "epoch": 0.14, "learning_rate": 0.00027844721029609854, "loss": 0.0242, "step": 28480 }, { "epoch": 0.14, "learning_rate": 0.0002784396426030846, "loss": 0.0299, "step": 28490 }, { "epoch": 0.14, "learning_rate": 0.00027843207491007056, "loss": 0.0269, "step": 28500 }, { "epoch": 0.14, "learning_rate": 0.00027842450721705654, "loss": 0.0218, "step": 28510 }, { "epoch": 0.14, "learning_rate": 0.0002784169395240425, "loss": 0.0264, "step": 28520 }, { "epoch": 0.14, "learning_rate": 0.0002784093718310285, "loss": 0.0277, "step": 28530 }, { "epoch": 0.14, "learning_rate": 0.0002784018041380145, "loss": 0.022, "step": 28540 }, { "epoch": 0.14, "learning_rate": 0.0002783942364450005, "loss": 0.0259, "step": 28550 }, { "epoch": 0.14, "learning_rate": 0.0002783866687519865, "loss": 0.0247, "step": 28560 }, { "epoch": 0.14, "learning_rate": 0.0002783791010589725, "loss": 0.0326, "step": 28570 }, { "epoch": 0.14, "learning_rate": 0.00027837153336595846, "loss": 0.0264, "step": 28580 }, { "epoch": 0.14, "learning_rate": 0.00027836396567294445, "loss": 0.0302, "step": 28590 }, { "epoch": 0.14, "learning_rate": 0.0002783563979799304, "loss": 0.0238, "step": 28600 }, { "epoch": 0.14, "learning_rate": 0.00027834883028691646, "loss": 0.0248, "step": 28610 }, { "epoch": 0.14, "learning_rate": 0.00027834126259390244, "loss": 0.0241, "step": 28620 }, { "epoch": 0.14, "learning_rate": 0.0002783336949008884, "loss": 0.0256, "step": 28630 }, { "epoch": 0.14, "learning_rate": 0.0002783261272078744, "loss": 0.0241, "step": 28640 }, { "epoch": 0.14, "learning_rate": 0.0002783185595148604, "loss": 0.0243, "step": 28650 }, { "epoch": 0.14, "learning_rate": 0.00027831099182184637, "loss": 0.0278, "step": 28660 }, { "epoch": 0.14, "learning_rate": 0.00027830342412883235, "loss": 0.0215, "step": 28670 }, { "epoch": 0.14, "learning_rate": 0.0002782958564358184, "loss": 0.0272, "step": 28680 }, { "epoch": 0.14, "learning_rate": 0.00027828828874280437, "loss": 0.0275, "step": 28690 }, { "epoch": 0.14, "learning_rate": 0.00027828072104979035, "loss": 0.0244, "step": 28700 }, { "epoch": 0.14, "learning_rate": 0.00027827315335677633, "loss": 0.0249, "step": 28710 }, { "epoch": 0.14, "learning_rate": 0.0002782655856637623, "loss": 0.0267, "step": 28720 }, { "epoch": 0.14, "learning_rate": 0.0002782580179707483, "loss": 0.0328, "step": 28730 }, { "epoch": 0.14, "learning_rate": 0.00027825045027773433, "loss": 0.0308, "step": 28740 }, { "epoch": 0.15, "learning_rate": 0.0002782428825847203, "loss": 0.0261, "step": 28750 }, { "epoch": 0.15, "learning_rate": 0.0002782353148917063, "loss": 0.0326, "step": 28760 }, { "epoch": 0.15, "learning_rate": 0.0002782277471986923, "loss": 0.0281, "step": 28770 }, { "epoch": 0.15, "learning_rate": 0.00027822017950567826, "loss": 0.0258, "step": 28780 }, { "epoch": 0.15, "learning_rate": 0.00027821261181266424, "loss": 0.0279, "step": 28790 }, { "epoch": 0.15, "learning_rate": 0.0002782050441196502, "loss": 0.0553, "step": 28800 }, { "epoch": 0.15, "learning_rate": 0.00027819747642663625, "loss": 0.0291, "step": 28810 }, { "epoch": 0.15, "learning_rate": 0.00027818990873362224, "loss": 0.0254, "step": 28820 }, { "epoch": 0.15, "learning_rate": 0.0002781823410406082, "loss": 0.0298, "step": 28830 }, { "epoch": 0.15, "learning_rate": 0.0002781747733475942, "loss": 0.0266, "step": 28840 }, { "epoch": 0.15, "learning_rate": 0.0002781672056545802, "loss": 0.025, "step": 28850 }, { "epoch": 0.15, "learning_rate": 0.00027815963796156616, "loss": 0.0223, "step": 28860 }, { "epoch": 0.15, "learning_rate": 0.0002781520702685522, "loss": 0.0274, "step": 28870 }, { "epoch": 0.15, "learning_rate": 0.0002781445025755382, "loss": 0.0294, "step": 28880 }, { "epoch": 0.15, "learning_rate": 0.00027813693488252416, "loss": 0.021, "step": 28890 }, { "epoch": 0.15, "learning_rate": 0.00027812936718951014, "loss": 0.0343, "step": 28900 }, { "epoch": 0.15, "learning_rate": 0.0002781217994964961, "loss": 0.0349, "step": 28910 }, { "epoch": 0.15, "learning_rate": 0.0002781142318034821, "loss": 0.028, "step": 28920 }, { "epoch": 0.15, "learning_rate": 0.00027810666411046814, "loss": 0.0245, "step": 28930 }, { "epoch": 0.15, "learning_rate": 0.0002780990964174541, "loss": 0.0247, "step": 28940 }, { "epoch": 0.15, "learning_rate": 0.0002780915287244401, "loss": 0.0269, "step": 28950 }, { "epoch": 0.15, "learning_rate": 0.0002780839610314261, "loss": 0.0236, "step": 28960 }, { "epoch": 0.15, "learning_rate": 0.00027807639333841207, "loss": 0.0265, "step": 28970 }, { "epoch": 0.15, "learning_rate": 0.00027806882564539805, "loss": 0.0263, "step": 28980 }, { "epoch": 0.15, "learning_rate": 0.00027806125795238403, "loss": 0.0232, "step": 28990 }, { "epoch": 0.15, "learning_rate": 0.00027805369025937006, "loss": 0.0245, "step": 29000 }, { "epoch": 0.15, "eval_cer": 0.914481900656667, "eval_loss": 0.019330712035298347, "eval_runtime": 117.3753, "eval_samples_per_second": 17.039, "eval_steps_per_second": 4.26, "step": 29000 }, { "epoch": 0.15, "learning_rate": 0.00027804612256635605, "loss": 0.0274, "step": 29010 }, { "epoch": 0.15, "learning_rate": 0.000278038554873342, "loss": 0.0276, "step": 29020 }, { "epoch": 0.15, "learning_rate": 0.000278030987180328, "loss": 0.0246, "step": 29030 }, { "epoch": 0.15, "learning_rate": 0.000278023419487314, "loss": 0.0309, "step": 29040 }, { "epoch": 0.15, "learning_rate": 0.00027801585179429997, "loss": 0.0265, "step": 29050 }, { "epoch": 0.15, "learning_rate": 0.000278008284101286, "loss": 0.0284, "step": 29060 }, { "epoch": 0.15, "learning_rate": 0.000278000716408272, "loss": 0.0239, "step": 29070 }, { "epoch": 0.15, "learning_rate": 0.00027799314871525797, "loss": 0.0235, "step": 29080 }, { "epoch": 0.15, "learning_rate": 0.00027798558102224395, "loss": 0.0256, "step": 29090 }, { "epoch": 0.15, "learning_rate": 0.00027797801332922993, "loss": 0.0255, "step": 29100 }, { "epoch": 0.15, "learning_rate": 0.0002779704456362159, "loss": 0.0223, "step": 29110 }, { "epoch": 0.15, "learning_rate": 0.00027796287794320195, "loss": 0.025, "step": 29120 }, { "epoch": 0.15, "learning_rate": 0.00027795531025018793, "loss": 0.027, "step": 29130 }, { "epoch": 0.15, "learning_rate": 0.0002779477425571739, "loss": 0.0279, "step": 29140 }, { "epoch": 0.15, "learning_rate": 0.0002779401748641599, "loss": 0.0236, "step": 29150 }, { "epoch": 0.15, "learning_rate": 0.0002779326071711459, "loss": 0.0221, "step": 29160 }, { "epoch": 0.15, "learning_rate": 0.00027792503947813186, "loss": 0.0285, "step": 29170 }, { "epoch": 0.15, "learning_rate": 0.00027791747178511784, "loss": 0.0282, "step": 29180 }, { "epoch": 0.15, "learning_rate": 0.0002779099040921039, "loss": 0.0262, "step": 29190 }, { "epoch": 0.15, "learning_rate": 0.00027790233639908986, "loss": 0.0262, "step": 29200 }, { "epoch": 0.15, "learning_rate": 0.00027789476870607584, "loss": 0.0211, "step": 29210 }, { "epoch": 0.15, "learning_rate": 0.0002778872010130618, "loss": 0.0244, "step": 29220 }, { "epoch": 0.15, "learning_rate": 0.0002778796333200478, "loss": 0.0257, "step": 29230 }, { "epoch": 0.15, "learning_rate": 0.0002778720656270338, "loss": 0.0246, "step": 29240 }, { "epoch": 0.15, "learning_rate": 0.0002778644979340198, "loss": 0.026, "step": 29250 }, { "epoch": 0.15, "learning_rate": 0.0002778569302410058, "loss": 0.0239, "step": 29260 }, { "epoch": 0.15, "learning_rate": 0.0002778493625479918, "loss": 0.0322, "step": 29270 }, { "epoch": 0.15, "learning_rate": 0.00027784179485497776, "loss": 0.0275, "step": 29280 }, { "epoch": 0.15, "learning_rate": 0.00027783422716196374, "loss": 0.038, "step": 29290 }, { "epoch": 0.15, "learning_rate": 0.0002778266594689497, "loss": 0.0285, "step": 29300 }, { "epoch": 0.15, "learning_rate": 0.0002778190917759357, "loss": 0.0286, "step": 29310 }, { "epoch": 0.15, "learning_rate": 0.00027781152408292174, "loss": 0.0296, "step": 29320 }, { "epoch": 0.15, "learning_rate": 0.0002778039563899077, "loss": 0.0242, "step": 29330 }, { "epoch": 0.15, "learning_rate": 0.0002777963886968937, "loss": 0.0275, "step": 29340 }, { "epoch": 0.15, "learning_rate": 0.0002777888210038797, "loss": 0.0258, "step": 29350 }, { "epoch": 0.15, "learning_rate": 0.00027778125331086567, "loss": 0.025, "step": 29360 }, { "epoch": 0.15, "learning_rate": 0.00027777368561785165, "loss": 0.0303, "step": 29370 }, { "epoch": 0.15, "learning_rate": 0.0002777661179248377, "loss": 0.0265, "step": 29380 }, { "epoch": 0.15, "learning_rate": 0.00027775855023182367, "loss": 0.0271, "step": 29390 }, { "epoch": 0.15, "learning_rate": 0.00027775098253880965, "loss": 0.0256, "step": 29400 }, { "epoch": 0.15, "learning_rate": 0.00027774341484579563, "loss": 0.0277, "step": 29410 }, { "epoch": 0.15, "learning_rate": 0.0002777358471527816, "loss": 0.023, "step": 29420 }, { "epoch": 0.15, "learning_rate": 0.0002777282794597676, "loss": 0.0252, "step": 29430 }, { "epoch": 0.15, "learning_rate": 0.0002777207117667536, "loss": 0.027, "step": 29440 }, { "epoch": 0.15, "learning_rate": 0.0002777131440737396, "loss": 0.027, "step": 29450 }, { "epoch": 0.15, "learning_rate": 0.0002777055763807256, "loss": 0.0269, "step": 29460 }, { "epoch": 0.15, "learning_rate": 0.00027769800868771157, "loss": 0.0234, "step": 29470 }, { "epoch": 0.15, "learning_rate": 0.00027769044099469755, "loss": 0.0261, "step": 29480 }, { "epoch": 0.15, "learning_rate": 0.00027768287330168353, "loss": 0.026, "step": 29490 }, { "epoch": 0.15, "learning_rate": 0.0002776753056086695, "loss": 0.0213, "step": 29500 }, { "epoch": 0.15, "learning_rate": 0.00027766773791565555, "loss": 0.0267, "step": 29510 }, { "epoch": 0.15, "learning_rate": 0.00027766017022264153, "loss": 0.0263, "step": 29520 }, { "epoch": 0.15, "learning_rate": 0.0002776526025296275, "loss": 0.026, "step": 29530 }, { "epoch": 0.15, "learning_rate": 0.00027764503483661344, "loss": 0.0273, "step": 29540 }, { "epoch": 0.15, "learning_rate": 0.0002776374671435995, "loss": 0.0258, "step": 29550 }, { "epoch": 0.15, "learning_rate": 0.00027762989945058546, "loss": 0.0249, "step": 29560 }, { "epoch": 0.15, "learning_rate": 0.00027762233175757144, "loss": 0.0302, "step": 29570 }, { "epoch": 0.15, "learning_rate": 0.0002776147640645574, "loss": 0.034, "step": 29580 }, { "epoch": 0.15, "learning_rate": 0.0002776071963715434, "loss": 0.0244, "step": 29590 }, { "epoch": 0.15, "learning_rate": 0.0002775996286785294, "loss": 0.0234, "step": 29600 }, { "epoch": 0.15, "learning_rate": 0.0002775920609855154, "loss": 0.0261, "step": 29610 }, { "epoch": 0.15, "learning_rate": 0.0002775844932925014, "loss": 0.0279, "step": 29620 }, { "epoch": 0.15, "learning_rate": 0.0002775769255994874, "loss": 0.0277, "step": 29630 }, { "epoch": 0.15, "learning_rate": 0.00027756935790647336, "loss": 0.0304, "step": 29640 }, { "epoch": 0.15, "learning_rate": 0.00027756179021345935, "loss": 0.0272, "step": 29650 }, { "epoch": 0.15, "learning_rate": 0.0002775542225204453, "loss": 0.0267, "step": 29660 }, { "epoch": 0.15, "learning_rate": 0.00027754665482743136, "loss": 0.0304, "step": 29670 }, { "epoch": 0.15, "learning_rate": 0.00027753908713441734, "loss": 0.024, "step": 29680 }, { "epoch": 0.15, "learning_rate": 0.0002775315194414033, "loss": 0.0297, "step": 29690 }, { "epoch": 0.15, "learning_rate": 0.0002775239517483893, "loss": 0.0217, "step": 29700 }, { "epoch": 0.15, "learning_rate": 0.0002775163840553753, "loss": 0.0248, "step": 29710 }, { "epoch": 0.15, "learning_rate": 0.00027750881636236127, "loss": 0.0237, "step": 29720 }, { "epoch": 0.15, "learning_rate": 0.00027750124866934725, "loss": 0.0281, "step": 29730 }, { "epoch": 0.15, "learning_rate": 0.0002774936809763333, "loss": 0.0284, "step": 29740 }, { "epoch": 0.15, "learning_rate": 0.00027748611328331927, "loss": 0.0239, "step": 29750 }, { "epoch": 0.15, "learning_rate": 0.00027747854559030525, "loss": 0.0253, "step": 29760 }, { "epoch": 0.15, "learning_rate": 0.00027747097789729123, "loss": 0.026, "step": 29770 }, { "epoch": 0.15, "learning_rate": 0.0002774634102042772, "loss": 0.0258, "step": 29780 }, { "epoch": 0.15, "learning_rate": 0.0002774558425112632, "loss": 0.0239, "step": 29790 }, { "epoch": 0.15, "learning_rate": 0.00027744827481824923, "loss": 0.0196, "step": 29800 }, { "epoch": 0.15, "learning_rate": 0.0002774407071252352, "loss": 0.0255, "step": 29810 }, { "epoch": 0.15, "learning_rate": 0.0002774331394322212, "loss": 0.0267, "step": 29820 }, { "epoch": 0.15, "learning_rate": 0.0002774255717392072, "loss": 0.0261, "step": 29830 }, { "epoch": 0.15, "learning_rate": 0.00027741800404619316, "loss": 0.0263, "step": 29840 }, { "epoch": 0.15, "learning_rate": 0.00027741043635317914, "loss": 0.0293, "step": 29850 }, { "epoch": 0.15, "learning_rate": 0.0002774028686601651, "loss": 0.0241, "step": 29860 }, { "epoch": 0.15, "learning_rate": 0.00027739530096715115, "loss": 0.0231, "step": 29870 }, { "epoch": 0.15, "learning_rate": 0.00027738773327413714, "loss": 0.0228, "step": 29880 }, { "epoch": 0.15, "learning_rate": 0.0002773801655811231, "loss": 0.026, "step": 29890 }, { "epoch": 0.15, "learning_rate": 0.0002773725978881091, "loss": 0.027, "step": 29900 }, { "epoch": 0.15, "learning_rate": 0.0002773650301950951, "loss": 0.0249, "step": 29910 }, { "epoch": 0.15, "learning_rate": 0.00027735746250208106, "loss": 0.0291, "step": 29920 }, { "epoch": 0.15, "learning_rate": 0.0002773498948090671, "loss": 0.0242, "step": 29930 }, { "epoch": 0.15, "learning_rate": 0.0002773423271160531, "loss": 0.0272, "step": 29940 }, { "epoch": 0.15, "learning_rate": 0.00027733475942303906, "loss": 0.0286, "step": 29950 }, { "epoch": 0.15, "learning_rate": 0.00027732719173002504, "loss": 0.0244, "step": 29960 }, { "epoch": 0.15, "learning_rate": 0.000277319624037011, "loss": 0.0281, "step": 29970 }, { "epoch": 0.15, "learning_rate": 0.000277312056343997, "loss": 0.0295, "step": 29980 }, { "epoch": 0.15, "learning_rate": 0.00027730448865098304, "loss": 0.0313, "step": 29990 }, { "epoch": 0.15, "learning_rate": 0.000277296920957969, "loss": 0.0226, "step": 30000 }, { "epoch": 0.15, "eval_cer": 0.9144518183767796, "eval_loss": 0.019204232841730118, "eval_runtime": 117.3422, "eval_samples_per_second": 17.044, "eval_steps_per_second": 4.261, "step": 30000 }, { "epoch": 0.15, "learning_rate": 0.000277289353264955, "loss": 0.0214, "step": 30010 }, { "epoch": 0.15, "learning_rate": 0.000277281785571941, "loss": 0.0318, "step": 30020 }, { "epoch": 0.15, "learning_rate": 0.00027727421787892697, "loss": 0.0273, "step": 30030 }, { "epoch": 0.15, "learning_rate": 0.00027726665018591295, "loss": 0.025, "step": 30040 }, { "epoch": 0.15, "learning_rate": 0.00027725908249289893, "loss": 0.0252, "step": 30050 }, { "epoch": 0.15, "learning_rate": 0.00027725151479988496, "loss": 0.0308, "step": 30060 }, { "epoch": 0.15, "learning_rate": 0.00027724394710687095, "loss": 0.0281, "step": 30070 }, { "epoch": 0.15, "learning_rate": 0.0002772363794138569, "loss": 0.0299, "step": 30080 }, { "epoch": 0.15, "learning_rate": 0.0002772288117208429, "loss": 0.03, "step": 30090 }, { "epoch": 0.15, "learning_rate": 0.0002772212440278289, "loss": 0.0269, "step": 30100 }, { "epoch": 0.15, "learning_rate": 0.00027721367633481487, "loss": 0.0316, "step": 30110 }, { "epoch": 0.15, "learning_rate": 0.0002772061086418009, "loss": 0.0249, "step": 30120 }, { "epoch": 0.15, "learning_rate": 0.0002771985409487869, "loss": 0.0273, "step": 30130 }, { "epoch": 0.15, "learning_rate": 0.00027719097325577287, "loss": 0.0247, "step": 30140 }, { "epoch": 0.15, "learning_rate": 0.00027718340556275885, "loss": 0.0259, "step": 30150 }, { "epoch": 0.15, "learning_rate": 0.00027717583786974483, "loss": 0.0293, "step": 30160 }, { "epoch": 0.15, "learning_rate": 0.0002771682701767308, "loss": 0.0249, "step": 30170 }, { "epoch": 0.15, "learning_rate": 0.00027716070248371685, "loss": 0.0281, "step": 30180 }, { "epoch": 0.15, "learning_rate": 0.00027715313479070283, "loss": 0.0224, "step": 30190 }, { "epoch": 0.15, "learning_rate": 0.0002771455670976888, "loss": 0.0264, "step": 30200 }, { "epoch": 0.15, "learning_rate": 0.0002771379994046748, "loss": 0.0284, "step": 30210 }, { "epoch": 0.15, "learning_rate": 0.0002771304317116608, "loss": 0.0267, "step": 30220 }, { "epoch": 0.15, "learning_rate": 0.00027712286401864676, "loss": 0.0297, "step": 30230 }, { "epoch": 0.15, "learning_rate": 0.00027711529632563274, "loss": 0.0244, "step": 30240 }, { "epoch": 0.15, "learning_rate": 0.0002771077286326188, "loss": 0.0247, "step": 30250 }, { "epoch": 0.15, "learning_rate": 0.00027710016093960476, "loss": 0.026, "step": 30260 }, { "epoch": 0.15, "learning_rate": 0.00027709259324659074, "loss": 0.0262, "step": 30270 }, { "epoch": 0.15, "learning_rate": 0.0002770850255535767, "loss": 0.0253, "step": 30280 }, { "epoch": 0.15, "learning_rate": 0.0002770774578605627, "loss": 0.0328, "step": 30290 }, { "epoch": 0.15, "learning_rate": 0.0002770698901675487, "loss": 0.0283, "step": 30300 }, { "epoch": 0.15, "learning_rate": 0.0002770623224745347, "loss": 0.0256, "step": 30310 }, { "epoch": 0.15, "learning_rate": 0.0002770547547815207, "loss": 0.0247, "step": 30320 }, { "epoch": 0.15, "learning_rate": 0.0002770471870885067, "loss": 0.0259, "step": 30330 }, { "epoch": 0.15, "learning_rate": 0.00027703961939549266, "loss": 0.0289, "step": 30340 }, { "epoch": 0.15, "learning_rate": 0.00027703205170247864, "loss": 0.0257, "step": 30350 }, { "epoch": 0.15, "learning_rate": 0.0002770244840094646, "loss": 0.031, "step": 30360 }, { "epoch": 0.15, "learning_rate": 0.0002770169163164506, "loss": 0.0309, "step": 30370 }, { "epoch": 0.15, "learning_rate": 0.00027700934862343664, "loss": 0.0271, "step": 30380 }, { "epoch": 0.15, "learning_rate": 0.0002770017809304226, "loss": 0.0275, "step": 30390 }, { "epoch": 0.15, "learning_rate": 0.0002769942132374086, "loss": 0.0253, "step": 30400 }, { "epoch": 0.15, "learning_rate": 0.0002769866455443946, "loss": 0.0263, "step": 30410 }, { "epoch": 0.15, "learning_rate": 0.00027697907785138057, "loss": 0.0239, "step": 30420 }, { "epoch": 0.15, "learning_rate": 0.00027697151015836655, "loss": 0.039, "step": 30430 }, { "epoch": 0.15, "learning_rate": 0.0002769639424653526, "loss": 0.0278, "step": 30440 }, { "epoch": 0.15, "learning_rate": 0.00027695637477233857, "loss": 0.0306, "step": 30450 }, { "epoch": 0.15, "learning_rate": 0.00027694880707932455, "loss": 0.0284, "step": 30460 }, { "epoch": 0.15, "learning_rate": 0.00027694123938631053, "loss": 0.0228, "step": 30470 }, { "epoch": 0.15, "learning_rate": 0.0002769336716932965, "loss": 0.0214, "step": 30480 }, { "epoch": 0.15, "learning_rate": 0.0002769261040002825, "loss": 0.0261, "step": 30490 }, { "epoch": 0.15, "learning_rate": 0.0002769185363072685, "loss": 0.0256, "step": 30500 }, { "epoch": 0.15, "learning_rate": 0.0002769109686142545, "loss": 0.0233, "step": 30510 }, { "epoch": 0.15, "learning_rate": 0.0002769034009212405, "loss": 0.027, "step": 30520 }, { "epoch": 0.15, "learning_rate": 0.00027689583322822647, "loss": 0.0232, "step": 30530 }, { "epoch": 0.15, "learning_rate": 0.00027688826553521245, "loss": 0.0211, "step": 30540 }, { "epoch": 0.15, "learning_rate": 0.00027688069784219843, "loss": 0.0259, "step": 30550 }, { "epoch": 0.15, "learning_rate": 0.0002768731301491844, "loss": 0.0233, "step": 30560 }, { "epoch": 0.15, "learning_rate": 0.00027686556245617045, "loss": 0.0195, "step": 30570 }, { "epoch": 0.15, "learning_rate": 0.00027685799476315643, "loss": 0.0276, "step": 30580 }, { "epoch": 0.15, "learning_rate": 0.0002768504270701424, "loss": 0.0213, "step": 30590 }, { "epoch": 0.15, "learning_rate": 0.0002768428593771284, "loss": 0.0234, "step": 30600 }, { "epoch": 0.15, "learning_rate": 0.0002768352916841144, "loss": 0.0259, "step": 30610 }, { "epoch": 0.15, "learning_rate": 0.00027682772399110036, "loss": 0.0246, "step": 30620 }, { "epoch": 0.15, "learning_rate": 0.0002768201562980864, "loss": 0.0295, "step": 30630 }, { "epoch": 0.15, "learning_rate": 0.0002768125886050724, "loss": 0.0258, "step": 30640 }, { "epoch": 0.15, "learning_rate": 0.00027680502091205836, "loss": 0.0265, "step": 30650 }, { "epoch": 0.15, "learning_rate": 0.00027679745321904434, "loss": 0.0241, "step": 30660 }, { "epoch": 0.15, "learning_rate": 0.0002767898855260303, "loss": 0.0441, "step": 30670 }, { "epoch": 0.15, "learning_rate": 0.0002767823178330163, "loss": 0.0257, "step": 30680 }, { "epoch": 0.15, "learning_rate": 0.00027677475014000234, "loss": 0.029, "step": 30690 }, { "epoch": 0.15, "learning_rate": 0.0002767671824469883, "loss": 0.0312, "step": 30700 }, { "epoch": 0.15, "learning_rate": 0.0002767596147539743, "loss": 0.0256, "step": 30710 }, { "epoch": 0.15, "learning_rate": 0.0002767520470609603, "loss": 0.0256, "step": 30720 }, { "epoch": 0.16, "learning_rate": 0.00027674447936794626, "loss": 0.0235, "step": 30730 }, { "epoch": 0.16, "learning_rate": 0.00027673691167493224, "loss": 0.0247, "step": 30740 }, { "epoch": 0.16, "learning_rate": 0.0002767293439819182, "loss": 0.0266, "step": 30750 }, { "epoch": 0.16, "learning_rate": 0.00027672177628890426, "loss": 0.0233, "step": 30760 }, { "epoch": 0.16, "learning_rate": 0.00027671420859589024, "loss": 0.0232, "step": 30770 }, { "epoch": 0.16, "learning_rate": 0.0002767066409028762, "loss": 0.0239, "step": 30780 }, { "epoch": 0.16, "learning_rate": 0.0002766990732098622, "loss": 0.0255, "step": 30790 }, { "epoch": 0.16, "learning_rate": 0.0002766915055168482, "loss": 0.0253, "step": 30800 }, { "epoch": 0.16, "learning_rate": 0.00027668393782383417, "loss": 0.0265, "step": 30810 }, { "epoch": 0.16, "learning_rate": 0.00027667637013082015, "loss": 0.0232, "step": 30820 }, { "epoch": 0.16, "learning_rate": 0.00027666880243780613, "loss": 0.0303, "step": 30830 }, { "epoch": 0.16, "learning_rate": 0.0002766612347447921, "loss": 0.0239, "step": 30840 }, { "epoch": 0.16, "learning_rate": 0.0002766536670517781, "loss": 0.0263, "step": 30850 }, { "epoch": 0.16, "learning_rate": 0.00027664609935876413, "loss": 0.0243, "step": 30860 }, { "epoch": 0.16, "learning_rate": 0.0002766385316657501, "loss": 0.0242, "step": 30870 }, { "epoch": 0.16, "learning_rate": 0.0002766309639727361, "loss": 0.0213, "step": 30880 }, { "epoch": 0.16, "learning_rate": 0.0002766233962797221, "loss": 0.0252, "step": 30890 }, { "epoch": 0.16, "learning_rate": 0.00027661582858670806, "loss": 0.0249, "step": 30900 }, { "epoch": 0.16, "learning_rate": 0.00027660826089369404, "loss": 0.0239, "step": 30910 }, { "epoch": 0.16, "learning_rate": 0.00027660069320068007, "loss": 0.0233, "step": 30920 }, { "epoch": 0.16, "learning_rate": 0.00027659312550766605, "loss": 0.0233, "step": 30930 }, { "epoch": 0.16, "learning_rate": 0.00027658555781465204, "loss": 0.0249, "step": 30940 }, { "epoch": 0.16, "learning_rate": 0.000276577990121638, "loss": 0.0231, "step": 30950 }, { "epoch": 0.16, "learning_rate": 0.000276570422428624, "loss": 0.0243, "step": 30960 }, { "epoch": 0.16, "learning_rate": 0.00027656285473561, "loss": 0.032, "step": 30970 }, { "epoch": 0.16, "learning_rate": 0.00027655528704259596, "loss": 0.0222, "step": 30980 }, { "epoch": 0.16, "learning_rate": 0.000276547719349582, "loss": 0.0229, "step": 30990 }, { "epoch": 0.16, "learning_rate": 0.000276540151656568, "loss": 0.0259, "step": 31000 }, { "epoch": 0.16, "eval_cer": 0.914447936792278, "eval_loss": 0.018999282270669937, "eval_runtime": 117.1152, "eval_samples_per_second": 17.077, "eval_steps_per_second": 4.269, "step": 31000 }, { "epoch": 0.16, "learning_rate": 0.00027653258396355396, "loss": 0.0254, "step": 31010 }, { "epoch": 0.16, "learning_rate": 0.00027652501627053994, "loss": 0.0239, "step": 31020 }, { "epoch": 0.16, "learning_rate": 0.0002765174485775259, "loss": 0.0342, "step": 31030 }, { "epoch": 0.16, "learning_rate": 0.0002765098808845119, "loss": 0.0252, "step": 31040 }, { "epoch": 0.16, "learning_rate": 0.00027650231319149794, "loss": 0.0225, "step": 31050 }, { "epoch": 0.16, "learning_rate": 0.0002764947454984839, "loss": 0.0251, "step": 31060 }, { "epoch": 0.16, "learning_rate": 0.0002764871778054699, "loss": 0.0287, "step": 31070 }, { "epoch": 0.16, "learning_rate": 0.0002764796101124559, "loss": 0.0304, "step": 31080 }, { "epoch": 0.16, "learning_rate": 0.00027647204241944187, "loss": 0.0259, "step": 31090 }, { "epoch": 0.16, "learning_rate": 0.00027646447472642785, "loss": 0.0233, "step": 31100 }, { "epoch": 0.16, "learning_rate": 0.00027645690703341383, "loss": 0.0262, "step": 31110 }, { "epoch": 0.16, "learning_rate": 0.00027644933934039986, "loss": 0.0269, "step": 31120 }, { "epoch": 0.16, "learning_rate": 0.00027644177164738585, "loss": 0.0222, "step": 31130 }, { "epoch": 0.16, "learning_rate": 0.0002764342039543718, "loss": 0.0196, "step": 31140 }, { "epoch": 0.16, "learning_rate": 0.0002764266362613578, "loss": 0.0283, "step": 31150 }, { "epoch": 0.16, "learning_rate": 0.0002764190685683438, "loss": 0.024, "step": 31160 }, { "epoch": 0.16, "learning_rate": 0.00027641150087532977, "loss": 0.0239, "step": 31170 }, { "epoch": 0.16, "learning_rate": 0.0002764039331823158, "loss": 0.0208, "step": 31180 }, { "epoch": 0.16, "learning_rate": 0.0002763963654893018, "loss": 0.024, "step": 31190 }, { "epoch": 0.16, "learning_rate": 0.00027638879779628777, "loss": 0.0275, "step": 31200 }, { "epoch": 0.16, "learning_rate": 0.00027638123010327375, "loss": 0.0274, "step": 31210 }, { "epoch": 0.16, "learning_rate": 0.00027637366241025973, "loss": 0.0258, "step": 31220 }, { "epoch": 0.16, "learning_rate": 0.0002763660947172457, "loss": 0.0258, "step": 31230 }, { "epoch": 0.16, "learning_rate": 0.00027635852702423175, "loss": 0.0236, "step": 31240 }, { "epoch": 0.16, "learning_rate": 0.00027635095933121773, "loss": 0.0244, "step": 31250 }, { "epoch": 0.16, "learning_rate": 0.0002763433916382037, "loss": 0.0262, "step": 31260 }, { "epoch": 0.16, "learning_rate": 0.0002763358239451897, "loss": 0.0266, "step": 31270 }, { "epoch": 0.16, "learning_rate": 0.0002763282562521757, "loss": 0.0286, "step": 31280 }, { "epoch": 0.16, "learning_rate": 0.00027632068855916166, "loss": 0.0289, "step": 31290 }, { "epoch": 0.16, "learning_rate": 0.00027631312086614764, "loss": 0.0289, "step": 31300 }, { "epoch": 0.16, "learning_rate": 0.0002763055531731337, "loss": 0.0294, "step": 31310 }, { "epoch": 0.16, "learning_rate": 0.00027629798548011966, "loss": 0.0253, "step": 31320 }, { "epoch": 0.16, "learning_rate": 0.00027629041778710564, "loss": 0.0262, "step": 31330 }, { "epoch": 0.16, "learning_rate": 0.0002762828500940916, "loss": 0.0199, "step": 31340 }, { "epoch": 0.16, "learning_rate": 0.0002762752824010776, "loss": 0.024, "step": 31350 }, { "epoch": 0.16, "learning_rate": 0.0002762677147080636, "loss": 0.0228, "step": 31360 }, { "epoch": 0.16, "learning_rate": 0.0002762601470150496, "loss": 0.0392, "step": 31370 }, { "epoch": 0.16, "learning_rate": 0.0002762525793220356, "loss": 0.0231, "step": 31380 }, { "epoch": 0.16, "learning_rate": 0.0002762450116290216, "loss": 0.0297, "step": 31390 }, { "epoch": 0.16, "learning_rate": 0.00027623744393600756, "loss": 0.0354, "step": 31400 }, { "epoch": 0.16, "learning_rate": 0.00027622987624299354, "loss": 0.0284, "step": 31410 }, { "epoch": 0.16, "learning_rate": 0.0002762223085499795, "loss": 0.0366, "step": 31420 }, { "epoch": 0.16, "learning_rate": 0.00027621474085696556, "loss": 0.0256, "step": 31430 }, { "epoch": 0.16, "learning_rate": 0.00027620717316395154, "loss": 0.0294, "step": 31440 }, { "epoch": 0.16, "learning_rate": 0.0002761996054709375, "loss": 0.0249, "step": 31450 }, { "epoch": 0.16, "learning_rate": 0.0002761920377779235, "loss": 0.0317, "step": 31460 }, { "epoch": 0.16, "learning_rate": 0.0002761844700849095, "loss": 0.0279, "step": 31470 }, { "epoch": 0.16, "learning_rate": 0.00027617690239189547, "loss": 0.0217, "step": 31480 }, { "epoch": 0.16, "learning_rate": 0.00027616933469888145, "loss": 0.0259, "step": 31490 }, { "epoch": 0.16, "learning_rate": 0.0002761617670058675, "loss": 0.0209, "step": 31500 }, { "epoch": 0.16, "learning_rate": 0.00027615419931285347, "loss": 0.0255, "step": 31510 }, { "epoch": 0.16, "learning_rate": 0.00027614663161983945, "loss": 0.0325, "step": 31520 }, { "epoch": 0.16, "learning_rate": 0.00027613906392682543, "loss": 0.0311, "step": 31530 }, { "epoch": 0.16, "learning_rate": 0.0002761314962338114, "loss": 0.0289, "step": 31540 }, { "epoch": 0.16, "learning_rate": 0.0002761239285407974, "loss": 0.0283, "step": 31550 }, { "epoch": 0.16, "learning_rate": 0.00027611636084778343, "loss": 0.0269, "step": 31560 }, { "epoch": 0.16, "learning_rate": 0.0002761087931547694, "loss": 0.027, "step": 31570 }, { "epoch": 0.16, "learning_rate": 0.0002761012254617554, "loss": 0.0232, "step": 31580 }, { "epoch": 0.16, "learning_rate": 0.00027609365776874137, "loss": 0.025, "step": 31590 }, { "epoch": 0.16, "learning_rate": 0.00027608609007572735, "loss": 0.025, "step": 31600 }, { "epoch": 0.16, "learning_rate": 0.00027607852238271333, "loss": 0.0265, "step": 31610 }, { "epoch": 0.16, "learning_rate": 0.0002760709546896993, "loss": 0.0258, "step": 31620 }, { "epoch": 0.16, "learning_rate": 0.00027606338699668535, "loss": 0.0225, "step": 31630 }, { "epoch": 0.16, "learning_rate": 0.00027605581930367133, "loss": 0.0229, "step": 31640 }, { "epoch": 0.16, "learning_rate": 0.0002760482516106573, "loss": 0.0274, "step": 31650 }, { "epoch": 0.16, "learning_rate": 0.0002760406839176433, "loss": 0.0216, "step": 31660 }, { "epoch": 0.16, "learning_rate": 0.0002760331162246293, "loss": 0.0267, "step": 31670 }, { "epoch": 0.16, "learning_rate": 0.00027602554853161526, "loss": 0.0232, "step": 31680 }, { "epoch": 0.16, "learning_rate": 0.0002760179808386013, "loss": 0.0241, "step": 31690 }, { "epoch": 0.16, "learning_rate": 0.0002760104131455873, "loss": 0.0282, "step": 31700 }, { "epoch": 0.16, "learning_rate": 0.00027600284545257326, "loss": 0.0242, "step": 31710 }, { "epoch": 0.16, "learning_rate": 0.00027599527775955924, "loss": 0.0243, "step": 31720 }, { "epoch": 0.16, "learning_rate": 0.0002759877100665452, "loss": 0.027, "step": 31730 }, { "epoch": 0.16, "learning_rate": 0.0002759801423735312, "loss": 0.0262, "step": 31740 }, { "epoch": 0.16, "learning_rate": 0.00027597257468051724, "loss": 0.0339, "step": 31750 }, { "epoch": 0.16, "learning_rate": 0.0002759650069875032, "loss": 0.0257, "step": 31760 }, { "epoch": 0.16, "learning_rate": 0.0002759574392944892, "loss": 0.0305, "step": 31770 }, { "epoch": 0.16, "learning_rate": 0.0002759498716014752, "loss": 0.0229, "step": 31780 }, { "epoch": 0.16, "learning_rate": 0.00027594230390846116, "loss": 0.0226, "step": 31790 }, { "epoch": 0.16, "learning_rate": 0.00027593473621544714, "loss": 0.0289, "step": 31800 }, { "epoch": 0.16, "learning_rate": 0.0002759271685224331, "loss": 0.0262, "step": 31810 }, { "epoch": 0.16, "learning_rate": 0.00027591960082941916, "loss": 0.0232, "step": 31820 }, { "epoch": 0.16, "learning_rate": 0.00027591203313640514, "loss": 0.0242, "step": 31830 }, { "epoch": 0.16, "learning_rate": 0.0002759044654433911, "loss": 0.0299, "step": 31840 }, { "epoch": 0.16, "learning_rate": 0.0002758968977503771, "loss": 0.0288, "step": 31850 }, { "epoch": 0.16, "learning_rate": 0.0002758893300573631, "loss": 0.0235, "step": 31860 }, { "epoch": 0.16, "learning_rate": 0.00027588176236434907, "loss": 0.0263, "step": 31870 }, { "epoch": 0.16, "learning_rate": 0.0002758741946713351, "loss": 0.0336, "step": 31880 }, { "epoch": 0.16, "learning_rate": 0.0002758666269783211, "loss": 0.0238, "step": 31890 }, { "epoch": 0.16, "learning_rate": 0.00027585905928530707, "loss": 0.0272, "step": 31900 }, { "epoch": 0.16, "learning_rate": 0.00027585149159229305, "loss": 0.0237, "step": 31910 }, { "epoch": 0.16, "learning_rate": 0.00027584392389927903, "loss": 0.0236, "step": 31920 }, { "epoch": 0.16, "learning_rate": 0.000275836356206265, "loss": 0.0247, "step": 31930 }, { "epoch": 0.16, "learning_rate": 0.000275828788513251, "loss": 0.0271, "step": 31940 }, { "epoch": 0.16, "learning_rate": 0.00027582122082023703, "loss": 0.0268, "step": 31950 }, { "epoch": 0.16, "learning_rate": 0.000275813653127223, "loss": 0.0238, "step": 31960 }, { "epoch": 0.16, "learning_rate": 0.000275806085434209, "loss": 0.0258, "step": 31970 }, { "epoch": 0.16, "learning_rate": 0.000275798517741195, "loss": 0.0256, "step": 31980 }, { "epoch": 0.16, "learning_rate": 0.00027579095004818095, "loss": 0.0247, "step": 31990 }, { "epoch": 0.16, "learning_rate": 0.00027578338235516694, "loss": 0.0273, "step": 32000 }, { "epoch": 0.16, "eval_cer": 0.9144896638256703, "eval_loss": 0.017893997952342033, "eval_runtime": 117.1916, "eval_samples_per_second": 17.066, "eval_steps_per_second": 4.267, "step": 32000 }, { "epoch": 0.16, "learning_rate": 0.00027577581466215297, "loss": 0.0236, "step": 32010 }, { "epoch": 0.16, "learning_rate": 0.00027576824696913895, "loss": 0.0283, "step": 32020 }, { "epoch": 0.16, "learning_rate": 0.00027576067927612493, "loss": 0.025, "step": 32030 }, { "epoch": 0.16, "learning_rate": 0.0002757531115831109, "loss": 0.0208, "step": 32040 }, { "epoch": 0.16, "learning_rate": 0.0002757455438900969, "loss": 0.025, "step": 32050 }, { "epoch": 0.16, "learning_rate": 0.0002757379761970829, "loss": 0.023, "step": 32060 }, { "epoch": 0.16, "learning_rate": 0.00027573040850406886, "loss": 0.0272, "step": 32070 }, { "epoch": 0.16, "learning_rate": 0.00027572284081105484, "loss": 0.0225, "step": 32080 }, { "epoch": 0.16, "learning_rate": 0.0002757152731180408, "loss": 0.0277, "step": 32090 }, { "epoch": 0.16, "learning_rate": 0.0002757077054250268, "loss": 0.0251, "step": 32100 }, { "epoch": 0.16, "learning_rate": 0.00027570013773201284, "loss": 0.0266, "step": 32110 }, { "epoch": 0.16, "learning_rate": 0.0002756925700389988, "loss": 0.0257, "step": 32120 }, { "epoch": 0.16, "learning_rate": 0.0002756850023459848, "loss": 0.0245, "step": 32130 }, { "epoch": 0.16, "learning_rate": 0.0002756774346529708, "loss": 0.0266, "step": 32140 }, { "epoch": 0.16, "learning_rate": 0.00027566986695995677, "loss": 0.0264, "step": 32150 }, { "epoch": 0.16, "learning_rate": 0.00027566229926694275, "loss": 0.0255, "step": 32160 }, { "epoch": 0.16, "learning_rate": 0.00027565473157392873, "loss": 0.0344, "step": 32170 }, { "epoch": 0.16, "learning_rate": 0.00027564716388091476, "loss": 0.0269, "step": 32180 }, { "epoch": 0.16, "learning_rate": 0.00027563959618790075, "loss": 0.0241, "step": 32190 }, { "epoch": 0.16, "learning_rate": 0.00027563202849488673, "loss": 0.0234, "step": 32200 }, { "epoch": 0.16, "learning_rate": 0.0002756244608018727, "loss": 0.028, "step": 32210 }, { "epoch": 0.16, "learning_rate": 0.0002756168931088587, "loss": 0.0252, "step": 32220 }, { "epoch": 0.16, "learning_rate": 0.00027560932541584467, "loss": 0.0261, "step": 32230 }, { "epoch": 0.16, "learning_rate": 0.0002756017577228307, "loss": 0.0281, "step": 32240 }, { "epoch": 0.16, "learning_rate": 0.0002755941900298167, "loss": 0.0255, "step": 32250 }, { "epoch": 0.16, "learning_rate": 0.00027558662233680267, "loss": 0.0309, "step": 32260 }, { "epoch": 0.16, "learning_rate": 0.00027557905464378865, "loss": 0.0308, "step": 32270 }, { "epoch": 0.16, "learning_rate": 0.00027557148695077463, "loss": 0.0274, "step": 32280 }, { "epoch": 0.16, "learning_rate": 0.0002755639192577606, "loss": 0.0283, "step": 32290 }, { "epoch": 0.16, "learning_rate": 0.00027555635156474665, "loss": 0.0241, "step": 32300 }, { "epoch": 0.16, "learning_rate": 0.00027554878387173263, "loss": 0.0299, "step": 32310 }, { "epoch": 0.16, "learning_rate": 0.0002755412161787186, "loss": 0.0252, "step": 32320 }, { "epoch": 0.16, "learning_rate": 0.0002755336484857046, "loss": 0.0258, "step": 32330 }, { "epoch": 0.16, "learning_rate": 0.0002755260807926906, "loss": 0.0216, "step": 32340 }, { "epoch": 0.16, "learning_rate": 0.00027551851309967656, "loss": 0.0266, "step": 32350 }, { "epoch": 0.16, "learning_rate": 0.00027551094540666254, "loss": 0.0251, "step": 32360 }, { "epoch": 0.16, "learning_rate": 0.0002755033777136486, "loss": 0.0318, "step": 32370 }, { "epoch": 0.16, "learning_rate": 0.00027549581002063456, "loss": 0.0237, "step": 32380 }, { "epoch": 0.16, "learning_rate": 0.00027548824232762054, "loss": 0.0221, "step": 32390 }, { "epoch": 0.16, "learning_rate": 0.0002754806746346065, "loss": 0.0226, "step": 32400 }, { "epoch": 0.16, "learning_rate": 0.0002754731069415925, "loss": 0.0262, "step": 32410 }, { "epoch": 0.16, "learning_rate": 0.0002754655392485785, "loss": 0.0233, "step": 32420 }, { "epoch": 0.16, "learning_rate": 0.0002754579715555645, "loss": 0.0227, "step": 32430 }, { "epoch": 0.16, "learning_rate": 0.0002754504038625505, "loss": 0.0267, "step": 32440 }, { "epoch": 0.16, "learning_rate": 0.0002754428361695365, "loss": 0.0282, "step": 32450 }, { "epoch": 0.16, "learning_rate": 0.00027543526847652246, "loss": 0.0243, "step": 32460 }, { "epoch": 0.16, "learning_rate": 0.00027542770078350844, "loss": 0.0223, "step": 32470 }, { "epoch": 0.16, "learning_rate": 0.0002754201330904944, "loss": 0.0243, "step": 32480 }, { "epoch": 0.16, "learning_rate": 0.00027541256539748046, "loss": 0.0246, "step": 32490 }, { "epoch": 0.16, "learning_rate": 0.00027540499770446644, "loss": 0.0247, "step": 32500 }, { "epoch": 0.16, "learning_rate": 0.0002753974300114524, "loss": 0.0245, "step": 32510 }, { "epoch": 0.16, "learning_rate": 0.0002753898623184384, "loss": 0.0256, "step": 32520 }, { "epoch": 0.16, "learning_rate": 0.0002753822946254244, "loss": 0.0232, "step": 32530 }, { "epoch": 0.16, "learning_rate": 0.00027537472693241037, "loss": 0.0264, "step": 32540 }, { "epoch": 0.16, "learning_rate": 0.00027536715923939635, "loss": 0.024, "step": 32550 }, { "epoch": 0.16, "learning_rate": 0.0002753595915463824, "loss": 0.026, "step": 32560 }, { "epoch": 0.16, "learning_rate": 0.00027535202385336837, "loss": 0.0236, "step": 32570 }, { "epoch": 0.16, "learning_rate": 0.00027534445616035435, "loss": 0.0233, "step": 32580 }, { "epoch": 0.16, "learning_rate": 0.00027533688846734033, "loss": 0.0288, "step": 32590 }, { "epoch": 0.16, "learning_rate": 0.0002753293207743263, "loss": 0.026, "step": 32600 }, { "epoch": 0.16, "learning_rate": 0.0002753217530813123, "loss": 0.0255, "step": 32610 }, { "epoch": 0.16, "learning_rate": 0.00027531418538829833, "loss": 0.0266, "step": 32620 }, { "epoch": 0.16, "learning_rate": 0.0002753066176952843, "loss": 0.0249, "step": 32630 }, { "epoch": 0.16, "learning_rate": 0.0002752990500022703, "loss": 0.0277, "step": 32640 }, { "epoch": 0.16, "learning_rate": 0.00027529148230925627, "loss": 0.0321, "step": 32650 }, { "epoch": 0.16, "learning_rate": 0.00027528391461624225, "loss": 0.026, "step": 32660 }, { "epoch": 0.16, "learning_rate": 0.00027527634692322823, "loss": 0.0227, "step": 32670 }, { "epoch": 0.16, "learning_rate": 0.0002752687792302142, "loss": 0.0266, "step": 32680 }, { "epoch": 0.16, "learning_rate": 0.00027526121153720025, "loss": 0.0263, "step": 32690 }, { "epoch": 0.16, "learning_rate": 0.00027525364384418623, "loss": 0.0239, "step": 32700 }, { "epoch": 0.17, "learning_rate": 0.0002752460761511722, "loss": 0.0281, "step": 32710 }, { "epoch": 0.17, "learning_rate": 0.0002752385084581582, "loss": 0.0254, "step": 32720 }, { "epoch": 0.17, "learning_rate": 0.0002752309407651442, "loss": 0.0253, "step": 32730 }, { "epoch": 0.17, "learning_rate": 0.00027522337307213016, "loss": 0.0253, "step": 32740 }, { "epoch": 0.17, "learning_rate": 0.0002752158053791162, "loss": 0.0266, "step": 32750 }, { "epoch": 0.17, "learning_rate": 0.0002752082376861022, "loss": 0.028, "step": 32760 }, { "epoch": 0.17, "learning_rate": 0.00027520066999308816, "loss": 0.0268, "step": 32770 }, { "epoch": 0.17, "learning_rate": 0.00027519310230007414, "loss": 0.0232, "step": 32780 }, { "epoch": 0.17, "learning_rate": 0.0002751855346070601, "loss": 0.0297, "step": 32790 }, { "epoch": 0.17, "learning_rate": 0.0002751779669140461, "loss": 0.0244, "step": 32800 }, { "epoch": 0.17, "learning_rate": 0.00027517039922103214, "loss": 0.0301, "step": 32810 }, { "epoch": 0.17, "learning_rate": 0.0002751628315280181, "loss": 0.03, "step": 32820 }, { "epoch": 0.17, "learning_rate": 0.0002751552638350041, "loss": 0.0269, "step": 32830 }, { "epoch": 0.17, "learning_rate": 0.0002751476961419901, "loss": 0.0339, "step": 32840 }, { "epoch": 0.17, "learning_rate": 0.00027514012844897606, "loss": 0.0306, "step": 32850 }, { "epoch": 0.17, "learning_rate": 0.00027513256075596204, "loss": 0.0241, "step": 32860 }, { "epoch": 0.17, "learning_rate": 0.000275124993062948, "loss": 0.0235, "step": 32870 }, { "epoch": 0.17, "learning_rate": 0.00027511742536993406, "loss": 0.0263, "step": 32880 }, { "epoch": 0.17, "learning_rate": 0.00027510985767692004, "loss": 0.023, "step": 32890 }, { "epoch": 0.17, "learning_rate": 0.000275102289983906, "loss": 0.0251, "step": 32900 }, { "epoch": 0.17, "learning_rate": 0.000275094722290892, "loss": 0.0289, "step": 32910 }, { "epoch": 0.17, "learning_rate": 0.000275087154597878, "loss": 0.0268, "step": 32920 }, { "epoch": 0.17, "learning_rate": 0.00027507958690486397, "loss": 0.0261, "step": 32930 }, { "epoch": 0.17, "learning_rate": 0.00027507201921185, "loss": 0.0416, "step": 32940 }, { "epoch": 0.17, "learning_rate": 0.000275064451518836, "loss": 0.0258, "step": 32950 }, { "epoch": 0.17, "learning_rate": 0.00027505688382582197, "loss": 0.0251, "step": 32960 }, { "epoch": 0.17, "learning_rate": 0.00027504931613280795, "loss": 0.0262, "step": 32970 }, { "epoch": 0.17, "learning_rate": 0.00027504174843979393, "loss": 0.0235, "step": 32980 }, { "epoch": 0.17, "learning_rate": 0.0002750341807467799, "loss": 0.023, "step": 32990 }, { "epoch": 0.17, "learning_rate": 0.00027502661305376595, "loss": 0.0284, "step": 33000 }, { "epoch": 0.17, "eval_cer": 0.9144838414489178, "eval_loss": 0.018402038142085075, "eval_runtime": 117.2116, "eval_samples_per_second": 17.063, "eval_steps_per_second": 4.266, "step": 33000 }, { "epoch": 0.17, "learning_rate": 0.00027501904536075193, "loss": 0.0259, "step": 33010 }, { "epoch": 0.17, "learning_rate": 0.0002750114776677379, "loss": 0.0246, "step": 33020 }, { "epoch": 0.17, "learning_rate": 0.0002750039099747239, "loss": 0.0264, "step": 33030 }, { "epoch": 0.17, "learning_rate": 0.0002749963422817099, "loss": 0.0245, "step": 33040 }, { "epoch": 0.17, "learning_rate": 0.00027498877458869585, "loss": 0.0211, "step": 33050 }, { "epoch": 0.17, "learning_rate": 0.00027498120689568184, "loss": 0.021, "step": 33060 }, { "epoch": 0.17, "learning_rate": 0.00027497363920266787, "loss": 0.0223, "step": 33070 }, { "epoch": 0.17, "learning_rate": 0.00027496607150965385, "loss": 0.0232, "step": 33080 }, { "epoch": 0.17, "learning_rate": 0.00027495850381663983, "loss": 0.0241, "step": 33090 }, { "epoch": 0.17, "learning_rate": 0.0002749509361236258, "loss": 0.0265, "step": 33100 }, { "epoch": 0.17, "learning_rate": 0.0002749433684306118, "loss": 0.0264, "step": 33110 }, { "epoch": 0.17, "learning_rate": 0.0002749358007375978, "loss": 0.026, "step": 33120 }, { "epoch": 0.17, "learning_rate": 0.0002749282330445838, "loss": 0.0317, "step": 33130 }, { "epoch": 0.17, "learning_rate": 0.0002749206653515698, "loss": 0.0236, "step": 33140 }, { "epoch": 0.17, "learning_rate": 0.0002749130976585558, "loss": 0.0231, "step": 33150 }, { "epoch": 0.17, "learning_rate": 0.00027490552996554176, "loss": 0.0312, "step": 33160 }, { "epoch": 0.17, "learning_rate": 0.00027489796227252774, "loss": 0.026, "step": 33170 }, { "epoch": 0.17, "learning_rate": 0.0002748903945795137, "loss": 0.0219, "step": 33180 }, { "epoch": 0.17, "learning_rate": 0.0002748828268864997, "loss": 0.023, "step": 33190 }, { "epoch": 0.17, "learning_rate": 0.00027487525919348574, "loss": 0.0482, "step": 33200 }, { "epoch": 0.17, "learning_rate": 0.0002748676915004717, "loss": 0.0344, "step": 33210 }, { "epoch": 0.17, "learning_rate": 0.0002748601238074577, "loss": 0.0282, "step": 33220 }, { "epoch": 0.17, "learning_rate": 0.0002748525561144437, "loss": 0.0291, "step": 33230 }, { "epoch": 0.17, "learning_rate": 0.00027484498842142966, "loss": 0.0255, "step": 33240 }, { "epoch": 0.17, "learning_rate": 0.00027483742072841565, "loss": 0.0249, "step": 33250 }, { "epoch": 0.17, "learning_rate": 0.0002748298530354017, "loss": 0.0304, "step": 33260 }, { "epoch": 0.17, "learning_rate": 0.00027482228534238766, "loss": 0.0233, "step": 33270 }, { "epoch": 0.17, "learning_rate": 0.00027481471764937364, "loss": 0.0265, "step": 33280 }, { "epoch": 0.17, "learning_rate": 0.0002748071499563596, "loss": 0.0249, "step": 33290 }, { "epoch": 0.17, "learning_rate": 0.0002747995822633456, "loss": 0.024, "step": 33300 }, { "epoch": 0.17, "learning_rate": 0.0002747920145703316, "loss": 0.0461, "step": 33310 }, { "epoch": 0.17, "learning_rate": 0.00027478444687731757, "loss": 0.0418, "step": 33320 }, { "epoch": 0.17, "learning_rate": 0.00027477687918430355, "loss": 0.024, "step": 33330 }, { "epoch": 0.17, "learning_rate": 0.00027476931149128953, "loss": 0.0279, "step": 33340 }, { "epoch": 0.17, "learning_rate": 0.0002747617437982755, "loss": 0.0224, "step": 33350 }, { "epoch": 0.17, "learning_rate": 0.00027475417610526155, "loss": 0.0258, "step": 33360 }, { "epoch": 0.17, "learning_rate": 0.00027474660841224753, "loss": 0.0233, "step": 33370 }, { "epoch": 0.17, "learning_rate": 0.0002747390407192335, "loss": 0.0235, "step": 33380 }, { "epoch": 0.17, "learning_rate": 0.0002747314730262195, "loss": 0.0258, "step": 33390 }, { "epoch": 0.17, "learning_rate": 0.0002747239053332055, "loss": 0.0259, "step": 33400 }, { "epoch": 0.17, "learning_rate": 0.00027471633764019146, "loss": 0.0227, "step": 33410 }, { "epoch": 0.17, "learning_rate": 0.00027470876994717744, "loss": 0.0265, "step": 33420 }, { "epoch": 0.17, "learning_rate": 0.0002747012022541635, "loss": 0.0227, "step": 33430 }, { "epoch": 0.17, "learning_rate": 0.00027469363456114946, "loss": 0.026, "step": 33440 }, { "epoch": 0.17, "learning_rate": 0.00027468606686813544, "loss": 0.031, "step": 33450 }, { "epoch": 0.17, "learning_rate": 0.0002746784991751214, "loss": 0.0264, "step": 33460 }, { "epoch": 0.17, "learning_rate": 0.0002746709314821074, "loss": 0.0224, "step": 33470 }, { "epoch": 0.17, "learning_rate": 0.0002746633637890934, "loss": 0.0261, "step": 33480 }, { "epoch": 0.17, "learning_rate": 0.0002746557960960794, "loss": 0.026, "step": 33490 }, { "epoch": 0.17, "learning_rate": 0.0002746482284030654, "loss": 0.0263, "step": 33500 }, { "epoch": 0.17, "learning_rate": 0.0002746406607100514, "loss": 0.0246, "step": 33510 }, { "epoch": 0.17, "learning_rate": 0.00027463309301703736, "loss": 0.0218, "step": 33520 }, { "epoch": 0.17, "learning_rate": 0.00027462552532402334, "loss": 0.0232, "step": 33530 }, { "epoch": 0.17, "learning_rate": 0.0002746179576310093, "loss": 0.0267, "step": 33540 }, { "epoch": 0.17, "learning_rate": 0.00027461038993799536, "loss": 0.0298, "step": 33550 }, { "epoch": 0.17, "learning_rate": 0.00027460282224498134, "loss": 0.0277, "step": 33560 }, { "epoch": 0.17, "learning_rate": 0.0002745952545519673, "loss": 0.0324, "step": 33570 }, { "epoch": 0.17, "learning_rate": 0.0002745876868589533, "loss": 0.0339, "step": 33580 }, { "epoch": 0.17, "learning_rate": 0.0002745801191659393, "loss": 0.0385, "step": 33590 }, { "epoch": 0.17, "learning_rate": 0.00027457255147292527, "loss": 0.0297, "step": 33600 }, { "epoch": 0.17, "learning_rate": 0.00027456498377991125, "loss": 0.0355, "step": 33610 }, { "epoch": 0.17, "learning_rate": 0.0002745574160868973, "loss": 0.0277, "step": 33620 }, { "epoch": 0.17, "learning_rate": 0.00027454984839388327, "loss": 0.0244, "step": 33630 }, { "epoch": 0.17, "learning_rate": 0.00027454228070086925, "loss": 0.0249, "step": 33640 }, { "epoch": 0.17, "learning_rate": 0.00027453471300785523, "loss": 0.0265, "step": 33650 }, { "epoch": 0.17, "learning_rate": 0.0002745271453148412, "loss": 0.0274, "step": 33660 }, { "epoch": 0.17, "learning_rate": 0.0002745195776218272, "loss": 0.0221, "step": 33670 }, { "epoch": 0.17, "learning_rate": 0.00027451200992881323, "loss": 0.0293, "step": 33680 }, { "epoch": 0.17, "learning_rate": 0.0002745044422357992, "loss": 0.031, "step": 33690 }, { "epoch": 0.17, "learning_rate": 0.0002744968745427852, "loss": 0.0247, "step": 33700 }, { "epoch": 0.17, "learning_rate": 0.00027448930684977117, "loss": 0.0258, "step": 33710 }, { "epoch": 0.17, "learning_rate": 0.00027448173915675715, "loss": 0.0284, "step": 33720 }, { "epoch": 0.17, "learning_rate": 0.00027447417146374313, "loss": 0.0239, "step": 33730 }, { "epoch": 0.17, "learning_rate": 0.0002744666037707291, "loss": 0.0254, "step": 33740 }, { "epoch": 0.17, "learning_rate": 0.00027445903607771515, "loss": 0.0232, "step": 33750 }, { "epoch": 0.17, "learning_rate": 0.00027445146838470113, "loss": 0.0246, "step": 33760 }, { "epoch": 0.17, "learning_rate": 0.0002744439006916871, "loss": 0.0247, "step": 33770 }, { "epoch": 0.17, "learning_rate": 0.0002744363329986731, "loss": 0.0282, "step": 33780 }, { "epoch": 0.17, "learning_rate": 0.0002744287653056591, "loss": 0.021, "step": 33790 }, { "epoch": 0.17, "learning_rate": 0.00027442119761264506, "loss": 0.0207, "step": 33800 }, { "epoch": 0.17, "learning_rate": 0.0002744136299196311, "loss": 0.0308, "step": 33810 }, { "epoch": 0.17, "learning_rate": 0.0002744060622266171, "loss": 0.0278, "step": 33820 }, { "epoch": 0.17, "learning_rate": 0.00027439849453360306, "loss": 0.0252, "step": 33830 }, { "epoch": 0.17, "learning_rate": 0.00027439092684058904, "loss": 0.025, "step": 33840 }, { "epoch": 0.17, "learning_rate": 0.000274383359147575, "loss": 0.0246, "step": 33850 }, { "epoch": 0.17, "learning_rate": 0.000274375791454561, "loss": 0.0229, "step": 33860 }, { "epoch": 0.17, "learning_rate": 0.00027436822376154704, "loss": 0.027, "step": 33870 }, { "epoch": 0.17, "learning_rate": 0.000274360656068533, "loss": 0.028, "step": 33880 }, { "epoch": 0.17, "learning_rate": 0.000274353088375519, "loss": 0.0222, "step": 33890 }, { "epoch": 0.17, "learning_rate": 0.000274345520682505, "loss": 0.0245, "step": 33900 }, { "epoch": 0.17, "learning_rate": 0.00027433795298949096, "loss": 0.029, "step": 33910 }, { "epoch": 0.17, "learning_rate": 0.00027433038529647694, "loss": 0.0274, "step": 33920 }, { "epoch": 0.17, "learning_rate": 0.0002743228176034629, "loss": 0.0244, "step": 33930 }, { "epoch": 0.17, "learning_rate": 0.00027431524991044896, "loss": 0.0235, "step": 33940 }, { "epoch": 0.17, "learning_rate": 0.00027430768221743494, "loss": 0.0224, "step": 33950 }, { "epoch": 0.17, "learning_rate": 0.0002743001145244209, "loss": 0.0215, "step": 33960 }, { "epoch": 0.17, "learning_rate": 0.0002742925468314069, "loss": 0.0234, "step": 33970 }, { "epoch": 0.17, "learning_rate": 0.0002742849791383929, "loss": 0.021, "step": 33980 }, { "epoch": 0.17, "learning_rate": 0.00027427741144537887, "loss": 0.0245, "step": 33990 }, { "epoch": 0.17, "learning_rate": 0.0002742698437523649, "loss": 0.0264, "step": 34000 }, { "epoch": 0.17, "eval_cer": 0.9144916046179211, "eval_loss": 0.017292475327849388, "eval_runtime": 117.3012, "eval_samples_per_second": 17.05, "eval_steps_per_second": 4.263, "step": 34000 }, { "epoch": 0.17, "learning_rate": 0.0002742622760593509, "loss": 0.0221, "step": 34010 }, { "epoch": 0.17, "learning_rate": 0.00027425470836633687, "loss": 0.0193, "step": 34020 }, { "epoch": 0.17, "learning_rate": 0.00027424714067332285, "loss": 0.0214, "step": 34030 }, { "epoch": 0.17, "learning_rate": 0.00027423957298030883, "loss": 0.0213, "step": 34040 }, { "epoch": 0.17, "learning_rate": 0.0002742320052872948, "loss": 0.026, "step": 34050 }, { "epoch": 0.17, "learning_rate": 0.00027422443759428085, "loss": 0.0271, "step": 34060 }, { "epoch": 0.17, "learning_rate": 0.00027421686990126683, "loss": 0.0249, "step": 34070 }, { "epoch": 0.17, "learning_rate": 0.0002742093022082528, "loss": 0.0263, "step": 34080 }, { "epoch": 0.17, "learning_rate": 0.0002742017345152388, "loss": 0.0283, "step": 34090 }, { "epoch": 0.17, "learning_rate": 0.0002741941668222248, "loss": 0.0274, "step": 34100 }, { "epoch": 0.17, "learning_rate": 0.00027418659912921075, "loss": 0.0246, "step": 34110 }, { "epoch": 0.17, "learning_rate": 0.00027417903143619674, "loss": 0.032, "step": 34120 }, { "epoch": 0.17, "learning_rate": 0.00027417146374318277, "loss": 0.0216, "step": 34130 }, { "epoch": 0.17, "learning_rate": 0.00027416389605016875, "loss": 0.0195, "step": 34140 }, { "epoch": 0.17, "learning_rate": 0.00027415632835715473, "loss": 0.0229, "step": 34150 }, { "epoch": 0.17, "learning_rate": 0.0002741487606641407, "loss": 0.023, "step": 34160 }, { "epoch": 0.17, "learning_rate": 0.0002741411929711267, "loss": 0.0224, "step": 34170 }, { "epoch": 0.17, "learning_rate": 0.0002741336252781127, "loss": 0.0255, "step": 34180 }, { "epoch": 0.17, "learning_rate": 0.0002741260575850987, "loss": 0.0225, "step": 34190 }, { "epoch": 0.17, "learning_rate": 0.0002741184898920847, "loss": 0.0278, "step": 34200 }, { "epoch": 0.17, "learning_rate": 0.0002741109221990707, "loss": 0.024, "step": 34210 }, { "epoch": 0.17, "learning_rate": 0.00027410335450605666, "loss": 0.0245, "step": 34220 }, { "epoch": 0.17, "learning_rate": 0.00027409578681304264, "loss": 0.0246, "step": 34230 }, { "epoch": 0.17, "learning_rate": 0.0002740882191200286, "loss": 0.0223, "step": 34240 }, { "epoch": 0.17, "learning_rate": 0.0002740806514270146, "loss": 0.0229, "step": 34250 }, { "epoch": 0.17, "learning_rate": 0.00027407308373400064, "loss": 0.0231, "step": 34260 }, { "epoch": 0.17, "learning_rate": 0.0002740655160409866, "loss": 0.0233, "step": 34270 }, { "epoch": 0.17, "learning_rate": 0.0002740579483479726, "loss": 0.0288, "step": 34280 }, { "epoch": 0.17, "learning_rate": 0.0002740503806549586, "loss": 0.0272, "step": 34290 }, { "epoch": 0.17, "learning_rate": 0.00027404281296194457, "loss": 0.0274, "step": 34300 }, { "epoch": 0.17, "learning_rate": 0.00027403524526893055, "loss": 0.0286, "step": 34310 }, { "epoch": 0.17, "learning_rate": 0.0002740276775759166, "loss": 0.0246, "step": 34320 }, { "epoch": 0.17, "learning_rate": 0.00027402010988290256, "loss": 0.0235, "step": 34330 }, { "epoch": 0.17, "learning_rate": 0.00027401254218988854, "loss": 0.0323, "step": 34340 }, { "epoch": 0.17, "learning_rate": 0.0002740049744968745, "loss": 0.0235, "step": 34350 }, { "epoch": 0.17, "learning_rate": 0.0002739974068038605, "loss": 0.0277, "step": 34360 }, { "epoch": 0.17, "learning_rate": 0.0002739898391108465, "loss": 0.0265, "step": 34370 }, { "epoch": 0.17, "learning_rate": 0.0002739822714178325, "loss": 0.025, "step": 34380 }, { "epoch": 0.17, "learning_rate": 0.0002739747037248185, "loss": 0.025, "step": 34390 }, { "epoch": 0.17, "learning_rate": 0.0002739671360318045, "loss": 0.0258, "step": 34400 }, { "epoch": 0.17, "learning_rate": 0.00027395956833879047, "loss": 0.0213, "step": 34410 }, { "epoch": 0.17, "learning_rate": 0.00027395200064577645, "loss": 0.0279, "step": 34420 }, { "epoch": 0.17, "learning_rate": 0.00027394443295276243, "loss": 0.0225, "step": 34430 }, { "epoch": 0.17, "learning_rate": 0.0002739368652597484, "loss": 0.0276, "step": 34440 }, { "epoch": 0.17, "learning_rate": 0.00027392929756673445, "loss": 0.0242, "step": 34450 }, { "epoch": 0.17, "learning_rate": 0.00027392172987372043, "loss": 0.0296, "step": 34460 }, { "epoch": 0.17, "learning_rate": 0.0002739141621807064, "loss": 0.0247, "step": 34470 }, { "epoch": 0.17, "learning_rate": 0.0002739065944876924, "loss": 0.0257, "step": 34480 }, { "epoch": 0.17, "learning_rate": 0.0002738990267946784, "loss": 0.0237, "step": 34490 }, { "epoch": 0.17, "learning_rate": 0.00027389145910166436, "loss": 0.0226, "step": 34500 }, { "epoch": 0.17, "learning_rate": 0.0002738838914086504, "loss": 0.0243, "step": 34510 }, { "epoch": 0.17, "learning_rate": 0.0002738763237156364, "loss": 0.0301, "step": 34520 }, { "epoch": 0.17, "learning_rate": 0.00027386875602262236, "loss": 0.0272, "step": 34530 }, { "epoch": 0.17, "learning_rate": 0.00027386118832960834, "loss": 0.0241, "step": 34540 }, { "epoch": 0.17, "learning_rate": 0.0002738536206365943, "loss": 0.0273, "step": 34550 }, { "epoch": 0.17, "learning_rate": 0.0002738460529435803, "loss": 0.0228, "step": 34560 }, { "epoch": 0.17, "learning_rate": 0.0002738384852505663, "loss": 0.0235, "step": 34570 }, { "epoch": 0.17, "learning_rate": 0.00027383091755755226, "loss": 0.0268, "step": 34580 }, { "epoch": 0.17, "learning_rate": 0.00027382334986453824, "loss": 0.0245, "step": 34590 }, { "epoch": 0.17, "learning_rate": 0.0002738157821715242, "loss": 0.0313, "step": 34600 }, { "epoch": 0.17, "learning_rate": 0.00027380821447851026, "loss": 0.0229, "step": 34610 }, { "epoch": 0.17, "learning_rate": 0.00027380064678549624, "loss": 0.0182, "step": 34620 }, { "epoch": 0.17, "learning_rate": 0.0002737930790924822, "loss": 0.0224, "step": 34630 }, { "epoch": 0.17, "learning_rate": 0.0002737855113994682, "loss": 0.026, "step": 34640 }, { "epoch": 0.17, "learning_rate": 0.0002737779437064542, "loss": 0.0218, "step": 34650 }, { "epoch": 0.17, "learning_rate": 0.00027377037601344017, "loss": 0.024, "step": 34660 }, { "epoch": 0.17, "learning_rate": 0.00027376280832042615, "loss": 0.0258, "step": 34670 }, { "epoch": 0.17, "learning_rate": 0.0002737552406274122, "loss": 0.0192, "step": 34680 }, { "epoch": 0.18, "learning_rate": 0.00027374767293439817, "loss": 0.0239, "step": 34690 }, { "epoch": 0.18, "learning_rate": 0.00027374010524138415, "loss": 0.0198, "step": 34700 }, { "epoch": 0.18, "learning_rate": 0.00027373253754837013, "loss": 0.0267, "step": 34710 }, { "epoch": 0.18, "learning_rate": 0.0002737249698553561, "loss": 0.0285, "step": 34720 }, { "epoch": 0.18, "learning_rate": 0.0002737174021623421, "loss": 0.0223, "step": 34730 }, { "epoch": 0.18, "learning_rate": 0.00027370983446932813, "loss": 0.0228, "step": 34740 }, { "epoch": 0.18, "learning_rate": 0.0002737022667763141, "loss": 0.0204, "step": 34750 }, { "epoch": 0.18, "learning_rate": 0.0002736946990833001, "loss": 0.0211, "step": 34760 }, { "epoch": 0.18, "learning_rate": 0.00027368713139028607, "loss": 0.0231, "step": 34770 }, { "epoch": 0.18, "learning_rate": 0.00027367956369727205, "loss": 0.0251, "step": 34780 }, { "epoch": 0.18, "learning_rate": 0.00027367199600425804, "loss": 0.0243, "step": 34790 }, { "epoch": 0.18, "learning_rate": 0.00027366442831124407, "loss": 0.0338, "step": 34800 }, { "epoch": 0.18, "learning_rate": 0.00027365686061823005, "loss": 0.026, "step": 34810 }, { "epoch": 0.18, "learning_rate": 0.00027364929292521603, "loss": 0.0304, "step": 34820 }, { "epoch": 0.18, "learning_rate": 0.000273641725232202, "loss": 0.0239, "step": 34830 }, { "epoch": 0.18, "learning_rate": 0.000273634157539188, "loss": 0.0232, "step": 34840 }, { "epoch": 0.18, "learning_rate": 0.000273626589846174, "loss": 0.0273, "step": 34850 }, { "epoch": 0.18, "learning_rate": 0.00027361902215315996, "loss": 0.0241, "step": 34860 }, { "epoch": 0.18, "learning_rate": 0.000273611454460146, "loss": 0.0213, "step": 34870 }, { "epoch": 0.18, "learning_rate": 0.000273603886767132, "loss": 0.0225, "step": 34880 }, { "epoch": 0.18, "learning_rate": 0.00027359631907411796, "loss": 0.0259, "step": 34890 }, { "epoch": 0.18, "learning_rate": 0.00027358875138110394, "loss": 0.0226, "step": 34900 }, { "epoch": 0.18, "learning_rate": 0.0002735811836880899, "loss": 0.0247, "step": 34910 }, { "epoch": 0.18, "learning_rate": 0.0002735736159950759, "loss": 0.0255, "step": 34920 }, { "epoch": 0.18, "learning_rate": 0.00027356604830206194, "loss": 0.0268, "step": 34930 }, { "epoch": 0.18, "learning_rate": 0.0002735584806090479, "loss": 0.0275, "step": 34940 }, { "epoch": 0.18, "learning_rate": 0.0002735509129160339, "loss": 0.0252, "step": 34950 }, { "epoch": 0.18, "learning_rate": 0.0002735433452230199, "loss": 0.0232, "step": 34960 }, { "epoch": 0.18, "learning_rate": 0.00027353577753000586, "loss": 0.0231, "step": 34970 }, { "epoch": 0.18, "learning_rate": 0.00027352820983699185, "loss": 0.0299, "step": 34980 }, { "epoch": 0.18, "learning_rate": 0.0002735206421439778, "loss": 0.0257, "step": 34990 }, { "epoch": 0.18, "learning_rate": 0.00027351307445096386, "loss": 0.0209, "step": 35000 }, { "epoch": 0.18, "eval_cer": 0.9144683151109114, "eval_loss": 0.01787448488175869, "eval_runtime": 117.4101, "eval_samples_per_second": 17.034, "eval_steps_per_second": 4.259, "step": 35000 }, { "epoch": 0.18, "learning_rate": 0.00027350550675794984, "loss": 0.0287, "step": 35010 }, { "epoch": 0.18, "learning_rate": 0.0002734979390649358, "loss": 0.0266, "step": 35020 }, { "epoch": 0.18, "learning_rate": 0.0002734903713719218, "loss": 0.0211, "step": 35030 }, { "epoch": 0.18, "learning_rate": 0.0002734828036789078, "loss": 0.0224, "step": 35040 }, { "epoch": 0.18, "learning_rate": 0.00027347523598589377, "loss": 0.0237, "step": 35050 }, { "epoch": 0.18, "learning_rate": 0.0002734676682928798, "loss": 0.0263, "step": 35060 }, { "epoch": 0.18, "learning_rate": 0.0002734601005998658, "loss": 0.0274, "step": 35070 }, { "epoch": 0.18, "learning_rate": 0.00027345253290685177, "loss": 0.0227, "step": 35080 }, { "epoch": 0.18, "learning_rate": 0.00027344496521383775, "loss": 0.0284, "step": 35090 }, { "epoch": 0.18, "learning_rate": 0.00027343739752082373, "loss": 0.0232, "step": 35100 }, { "epoch": 0.18, "learning_rate": 0.0002734298298278097, "loss": 0.0241, "step": 35110 }, { "epoch": 0.18, "learning_rate": 0.00027342226213479575, "loss": 0.025, "step": 35120 }, { "epoch": 0.18, "learning_rate": 0.00027341469444178173, "loss": 0.0251, "step": 35130 }, { "epoch": 0.18, "learning_rate": 0.0002734071267487677, "loss": 0.0227, "step": 35140 }, { "epoch": 0.18, "learning_rate": 0.0002733995590557537, "loss": 0.0239, "step": 35150 }, { "epoch": 0.18, "learning_rate": 0.0002733919913627397, "loss": 0.0263, "step": 35160 }, { "epoch": 0.18, "learning_rate": 0.00027338442366972566, "loss": 0.0257, "step": 35170 }, { "epoch": 0.18, "learning_rate": 0.00027337685597671164, "loss": 0.0263, "step": 35180 }, { "epoch": 0.18, "learning_rate": 0.00027336928828369767, "loss": 0.0274, "step": 35190 }, { "epoch": 0.18, "learning_rate": 0.00027336172059068365, "loss": 0.0238, "step": 35200 }, { "epoch": 0.18, "learning_rate": 0.00027335415289766964, "loss": 0.0302, "step": 35210 }, { "epoch": 0.18, "learning_rate": 0.0002733465852046556, "loss": 0.0245, "step": 35220 }, { "epoch": 0.18, "learning_rate": 0.0002733390175116416, "loss": 0.0286, "step": 35230 }, { "epoch": 0.18, "learning_rate": 0.0002733314498186276, "loss": 0.028, "step": 35240 }, { "epoch": 0.18, "learning_rate": 0.0002733238821256136, "loss": 0.0231, "step": 35250 }, { "epoch": 0.18, "learning_rate": 0.0002733163144325996, "loss": 0.0244, "step": 35260 }, { "epoch": 0.18, "learning_rate": 0.0002733087467395856, "loss": 0.0279, "step": 35270 }, { "epoch": 0.18, "learning_rate": 0.00027330117904657156, "loss": 0.0198, "step": 35280 }, { "epoch": 0.18, "learning_rate": 0.00027329361135355754, "loss": 0.0243, "step": 35290 }, { "epoch": 0.18, "learning_rate": 0.0002732860436605435, "loss": 0.0212, "step": 35300 }, { "epoch": 0.18, "learning_rate": 0.00027327847596752956, "loss": 0.0283, "step": 35310 }, { "epoch": 0.18, "learning_rate": 0.00027327090827451554, "loss": 0.0241, "step": 35320 }, { "epoch": 0.18, "learning_rate": 0.0002732633405815015, "loss": 0.0221, "step": 35330 }, { "epoch": 0.18, "learning_rate": 0.0002732557728884875, "loss": 0.023, "step": 35340 }, { "epoch": 0.18, "learning_rate": 0.0002732482051954735, "loss": 0.0209, "step": 35350 }, { "epoch": 0.18, "learning_rate": 0.00027324063750245947, "loss": 0.0215, "step": 35360 }, { "epoch": 0.18, "learning_rate": 0.00027323306980944545, "loss": 0.0196, "step": 35370 }, { "epoch": 0.18, "learning_rate": 0.0002732255021164315, "loss": 0.0241, "step": 35380 }, { "epoch": 0.18, "learning_rate": 0.00027321793442341746, "loss": 0.0289, "step": 35390 }, { "epoch": 0.18, "learning_rate": 0.00027321036673040345, "loss": 0.0303, "step": 35400 }, { "epoch": 0.18, "learning_rate": 0.0002732027990373894, "loss": 0.0211, "step": 35410 }, { "epoch": 0.18, "learning_rate": 0.0002731952313443754, "loss": 0.025, "step": 35420 }, { "epoch": 0.18, "learning_rate": 0.0002731876636513614, "loss": 0.0214, "step": 35430 }, { "epoch": 0.18, "learning_rate": 0.0002731800959583474, "loss": 0.0198, "step": 35440 }, { "epoch": 0.18, "learning_rate": 0.0002731725282653334, "loss": 0.0235, "step": 35450 }, { "epoch": 0.18, "learning_rate": 0.0002731649605723194, "loss": 0.0231, "step": 35460 }, { "epoch": 0.18, "learning_rate": 0.00027315739287930537, "loss": 0.0221, "step": 35470 }, { "epoch": 0.18, "learning_rate": 0.00027314982518629135, "loss": 0.0224, "step": 35480 }, { "epoch": 0.18, "learning_rate": 0.00027314225749327733, "loss": 0.0221, "step": 35490 }, { "epoch": 0.18, "learning_rate": 0.0002731346898002633, "loss": 0.024, "step": 35500 }, { "epoch": 0.18, "learning_rate": 0.00027312712210724935, "loss": 0.0291, "step": 35510 }, { "epoch": 0.18, "learning_rate": 0.00027311955441423533, "loss": 0.0322, "step": 35520 }, { "epoch": 0.18, "learning_rate": 0.0002731119867212213, "loss": 0.0227, "step": 35530 }, { "epoch": 0.18, "learning_rate": 0.0002731044190282073, "loss": 0.026, "step": 35540 }, { "epoch": 0.18, "learning_rate": 0.0002730968513351933, "loss": 0.0252, "step": 35550 }, { "epoch": 0.18, "learning_rate": 0.00027308928364217926, "loss": 0.0342, "step": 35560 }, { "epoch": 0.18, "learning_rate": 0.0002730817159491653, "loss": 0.0298, "step": 35570 }, { "epoch": 0.18, "learning_rate": 0.0002730741482561513, "loss": 0.0258, "step": 35580 }, { "epoch": 0.18, "learning_rate": 0.00027306658056313726, "loss": 0.0257, "step": 35590 }, { "epoch": 0.18, "learning_rate": 0.00027305901287012324, "loss": 0.0302, "step": 35600 }, { "epoch": 0.18, "learning_rate": 0.0002730514451771092, "loss": 0.0247, "step": 35610 }, { "epoch": 0.18, "learning_rate": 0.0002730438774840952, "loss": 0.0255, "step": 35620 }, { "epoch": 0.18, "learning_rate": 0.00027303630979108124, "loss": 0.0271, "step": 35630 }, { "epoch": 0.18, "learning_rate": 0.0002730287420980672, "loss": 0.0264, "step": 35640 }, { "epoch": 0.18, "learning_rate": 0.0002730211744050532, "loss": 0.0195, "step": 35650 }, { "epoch": 0.18, "learning_rate": 0.0002730136067120392, "loss": 0.0241, "step": 35660 }, { "epoch": 0.18, "learning_rate": 0.00027300603901902516, "loss": 0.0244, "step": 35670 }, { "epoch": 0.18, "learning_rate": 0.00027299847132601114, "loss": 0.0245, "step": 35680 }, { "epoch": 0.18, "learning_rate": 0.0002729909036329971, "loss": 0.0234, "step": 35690 }, { "epoch": 0.18, "learning_rate": 0.00027298333593998316, "loss": 0.0209, "step": 35700 }, { "epoch": 0.18, "learning_rate": 0.00027297576824696914, "loss": 0.0244, "step": 35710 }, { "epoch": 0.18, "learning_rate": 0.0002729682005539551, "loss": 0.0224, "step": 35720 }, { "epoch": 0.18, "learning_rate": 0.0002729606328609411, "loss": 0.0231, "step": 35730 }, { "epoch": 0.18, "learning_rate": 0.0002729530651679271, "loss": 0.0246, "step": 35740 }, { "epoch": 0.18, "learning_rate": 0.00027294549747491307, "loss": 0.0195, "step": 35750 }, { "epoch": 0.18, "learning_rate": 0.0002729379297818991, "loss": 0.0239, "step": 35760 }, { "epoch": 0.18, "learning_rate": 0.0002729303620888851, "loss": 0.0248, "step": 35770 }, { "epoch": 0.18, "learning_rate": 0.00027292279439587107, "loss": 0.0257, "step": 35780 }, { "epoch": 0.18, "learning_rate": 0.00027291522670285705, "loss": 0.0179, "step": 35790 }, { "epoch": 0.18, "learning_rate": 0.00027290765900984303, "loss": 0.0221, "step": 35800 }, { "epoch": 0.18, "learning_rate": 0.000272900091316829, "loss": 0.0205, "step": 35810 }, { "epoch": 0.18, "learning_rate": 0.000272892523623815, "loss": 0.0231, "step": 35820 }, { "epoch": 0.18, "learning_rate": 0.00027288495593080097, "loss": 0.0268, "step": 35830 }, { "epoch": 0.18, "learning_rate": 0.00027287738823778695, "loss": 0.0242, "step": 35840 }, { "epoch": 0.18, "learning_rate": 0.00027286982054477294, "loss": 0.0212, "step": 35850 }, { "epoch": 0.18, "learning_rate": 0.00027286225285175897, "loss": 0.0261, "step": 35860 }, { "epoch": 0.18, "learning_rate": 0.00027285468515874495, "loss": 0.0323, "step": 35870 }, { "epoch": 0.18, "learning_rate": 0.00027284711746573093, "loss": 0.0225, "step": 35880 }, { "epoch": 0.18, "learning_rate": 0.0002728395497727169, "loss": 0.0265, "step": 35890 }, { "epoch": 0.18, "learning_rate": 0.0002728319820797029, "loss": 0.0262, "step": 35900 }, { "epoch": 0.18, "learning_rate": 0.0002728244143866889, "loss": 0.0237, "step": 35910 }, { "epoch": 0.18, "learning_rate": 0.00027281684669367486, "loss": 0.0243, "step": 35920 }, { "epoch": 0.18, "learning_rate": 0.0002728092790006609, "loss": 0.0249, "step": 35930 }, { "epoch": 0.18, "learning_rate": 0.0002728017113076469, "loss": 0.0273, "step": 35940 }, { "epoch": 0.18, "learning_rate": 0.00027279414361463286, "loss": 0.0284, "step": 35950 }, { "epoch": 0.18, "learning_rate": 0.00027278657592161884, "loss": 0.0232, "step": 35960 }, { "epoch": 0.18, "learning_rate": 0.0002727790082286048, "loss": 0.0257, "step": 35970 }, { "epoch": 0.18, "learning_rate": 0.0002727714405355908, "loss": 0.0219, "step": 35980 }, { "epoch": 0.18, "learning_rate": 0.00027276387284257684, "loss": 0.0303, "step": 35990 }, { "epoch": 0.18, "learning_rate": 0.0002727563051495628, "loss": 0.0288, "step": 36000 }, { "epoch": 0.18, "eval_cer": 0.9144993677869243, "eval_loss": 0.017736734822392464, "eval_runtime": 117.3015, "eval_samples_per_second": 17.05, "eval_steps_per_second": 4.263, "step": 36000 }, { "epoch": 0.18, "learning_rate": 0.0002727487374565488, "loss": 0.024, "step": 36010 }, { "epoch": 0.18, "learning_rate": 0.0002727411697635348, "loss": 0.0263, "step": 36020 }, { "epoch": 0.18, "learning_rate": 0.00027273360207052076, "loss": 0.0304, "step": 36030 }, { "epoch": 0.18, "learning_rate": 0.00027272603437750675, "loss": 0.0227, "step": 36040 }, { "epoch": 0.18, "learning_rate": 0.0002727184666844927, "loss": 0.0254, "step": 36050 }, { "epoch": 0.18, "learning_rate": 0.00027271089899147876, "loss": 0.0246, "step": 36060 }, { "epoch": 0.18, "learning_rate": 0.00027270333129846474, "loss": 0.0275, "step": 36070 }, { "epoch": 0.18, "learning_rate": 0.0002726957636054507, "loss": 0.0228, "step": 36080 }, { "epoch": 0.18, "learning_rate": 0.0002726881959124367, "loss": 0.0233, "step": 36090 }, { "epoch": 0.18, "learning_rate": 0.0002726806282194227, "loss": 0.0226, "step": 36100 }, { "epoch": 0.18, "learning_rate": 0.00027267306052640867, "loss": 0.0244, "step": 36110 }, { "epoch": 0.18, "learning_rate": 0.0002726654928333947, "loss": 0.0246, "step": 36120 }, { "epoch": 0.18, "learning_rate": 0.0002726579251403807, "loss": 0.0263, "step": 36130 }, { "epoch": 0.18, "learning_rate": 0.00027265035744736667, "loss": 0.0262, "step": 36140 }, { "epoch": 0.18, "learning_rate": 0.00027264278975435265, "loss": 0.0247, "step": 36150 }, { "epoch": 0.18, "learning_rate": 0.00027263522206133863, "loss": 0.0173, "step": 36160 }, { "epoch": 0.18, "learning_rate": 0.0002726276543683246, "loss": 0.0275, "step": 36170 }, { "epoch": 0.18, "learning_rate": 0.00027262008667531065, "loss": 0.0216, "step": 36180 }, { "epoch": 0.18, "learning_rate": 0.00027261251898229663, "loss": 0.0252, "step": 36190 }, { "epoch": 0.18, "learning_rate": 0.0002726049512892826, "loss": 0.0233, "step": 36200 }, { "epoch": 0.18, "learning_rate": 0.0002725973835962686, "loss": 0.0243, "step": 36210 }, { "epoch": 0.18, "learning_rate": 0.0002725898159032546, "loss": 0.0275, "step": 36220 }, { "epoch": 0.18, "learning_rate": 0.00027258224821024056, "loss": 0.0284, "step": 36230 }, { "epoch": 0.18, "learning_rate": 0.00027257468051722654, "loss": 0.034, "step": 36240 }, { "epoch": 0.18, "learning_rate": 0.00027256711282421257, "loss": 0.024, "step": 36250 }, { "epoch": 0.18, "learning_rate": 0.00027255954513119855, "loss": 0.0281, "step": 36260 }, { "epoch": 0.18, "learning_rate": 0.00027255197743818454, "loss": 0.0238, "step": 36270 }, { "epoch": 0.18, "learning_rate": 0.0002725444097451705, "loss": 0.0279, "step": 36280 }, { "epoch": 0.18, "learning_rate": 0.0002725368420521565, "loss": 0.0303, "step": 36290 }, { "epoch": 0.18, "learning_rate": 0.0002725292743591425, "loss": 0.0305, "step": 36300 }, { "epoch": 0.18, "learning_rate": 0.0002725217066661285, "loss": 0.0226, "step": 36310 }, { "epoch": 0.18, "learning_rate": 0.0002725141389731145, "loss": 0.0211, "step": 36320 }, { "epoch": 0.18, "learning_rate": 0.0002725065712801005, "loss": 0.0224, "step": 36330 }, { "epoch": 0.18, "learning_rate": 0.00027249900358708646, "loss": 0.021, "step": 36340 }, { "epoch": 0.18, "learning_rate": 0.00027249143589407244, "loss": 0.0276, "step": 36350 }, { "epoch": 0.18, "learning_rate": 0.0002724838682010584, "loss": 0.0245, "step": 36360 }, { "epoch": 0.18, "learning_rate": 0.00027247630050804446, "loss": 0.024, "step": 36370 }, { "epoch": 0.18, "learning_rate": 0.00027246873281503044, "loss": 0.0213, "step": 36380 }, { "epoch": 0.18, "learning_rate": 0.0002724611651220164, "loss": 0.0307, "step": 36390 }, { "epoch": 0.18, "learning_rate": 0.0002724535974290024, "loss": 0.0263, "step": 36400 }, { "epoch": 0.18, "learning_rate": 0.0002724460297359884, "loss": 0.0227, "step": 36410 }, { "epoch": 0.18, "learning_rate": 0.00027243846204297437, "loss": 0.0236, "step": 36420 }, { "epoch": 0.18, "learning_rate": 0.00027243089434996035, "loss": 0.026, "step": 36430 }, { "epoch": 0.18, "learning_rate": 0.0002724233266569464, "loss": 0.0254, "step": 36440 }, { "epoch": 0.18, "learning_rate": 0.00027241575896393236, "loss": 0.0281, "step": 36450 }, { "epoch": 0.18, "learning_rate": 0.00027240819127091835, "loss": 0.0232, "step": 36460 }, { "epoch": 0.18, "learning_rate": 0.0002724006235779043, "loss": 0.0223, "step": 36470 }, { "epoch": 0.18, "learning_rate": 0.0002723930558848903, "loss": 0.0208, "step": 36480 }, { "epoch": 0.18, "learning_rate": 0.0002723854881918763, "loss": 0.0249, "step": 36490 }, { "epoch": 0.18, "learning_rate": 0.0002723779204988623, "loss": 0.023, "step": 36500 }, { "epoch": 0.18, "learning_rate": 0.0002723703528058483, "loss": 0.021, "step": 36510 }, { "epoch": 0.18, "learning_rate": 0.0002723627851128343, "loss": 0.03, "step": 36520 }, { "epoch": 0.18, "learning_rate": 0.00027235521741982027, "loss": 0.0234, "step": 36530 }, { "epoch": 0.18, "learning_rate": 0.00027234764972680625, "loss": 0.0242, "step": 36540 }, { "epoch": 0.18, "learning_rate": 0.00027234008203379223, "loss": 0.0294, "step": 36550 }, { "epoch": 0.18, "learning_rate": 0.0002723325143407782, "loss": 0.0256, "step": 36560 }, { "epoch": 0.18, "learning_rate": 0.00027232494664776425, "loss": 0.021, "step": 36570 }, { "epoch": 0.18, "learning_rate": 0.00027231737895475023, "loss": 0.0243, "step": 36580 }, { "epoch": 0.18, "learning_rate": 0.0002723098112617362, "loss": 0.028, "step": 36590 }, { "epoch": 0.18, "learning_rate": 0.0002723022435687222, "loss": 0.0244, "step": 36600 }, { "epoch": 0.18, "learning_rate": 0.0002722946758757082, "loss": 0.0219, "step": 36610 }, { "epoch": 0.18, "learning_rate": 0.00027228710818269416, "loss": 0.026, "step": 36620 }, { "epoch": 0.18, "learning_rate": 0.0002722795404896802, "loss": 0.0216, "step": 36630 }, { "epoch": 0.18, "learning_rate": 0.0002722719727966662, "loss": 0.0226, "step": 36640 }, { "epoch": 0.18, "learning_rate": 0.00027226440510365216, "loss": 0.0201, "step": 36650 }, { "epoch": 0.18, "learning_rate": 0.00027225683741063814, "loss": 0.0263, "step": 36660 }, { "epoch": 0.19, "learning_rate": 0.0002722492697176241, "loss": 0.0205, "step": 36670 }, { "epoch": 0.19, "learning_rate": 0.0002722417020246101, "loss": 0.0231, "step": 36680 }, { "epoch": 0.19, "learning_rate": 0.00027223413433159614, "loss": 0.0238, "step": 36690 }, { "epoch": 0.19, "learning_rate": 0.0002722265666385821, "loss": 0.0249, "step": 36700 }, { "epoch": 0.19, "learning_rate": 0.0002722189989455681, "loss": 0.0224, "step": 36710 }, { "epoch": 0.19, "learning_rate": 0.0002722114312525541, "loss": 0.0221, "step": 36720 }, { "epoch": 0.19, "learning_rate": 0.00027220386355954006, "loss": 0.0247, "step": 36730 }, { "epoch": 0.19, "learning_rate": 0.00027219629586652604, "loss": 0.0195, "step": 36740 }, { "epoch": 0.19, "learning_rate": 0.000272188728173512, "loss": 0.0206, "step": 36750 }, { "epoch": 0.19, "learning_rate": 0.00027218116048049806, "loss": 0.0219, "step": 36760 }, { "epoch": 0.19, "learning_rate": 0.00027217359278748404, "loss": 0.0263, "step": 36770 }, { "epoch": 0.19, "learning_rate": 0.00027216602509447, "loss": 0.0195, "step": 36780 }, { "epoch": 0.19, "learning_rate": 0.000272158457401456, "loss": 0.0277, "step": 36790 }, { "epoch": 0.19, "learning_rate": 0.000272150889708442, "loss": 0.0247, "step": 36800 }, { "epoch": 0.19, "learning_rate": 0.00027214332201542797, "loss": 0.0289, "step": 36810 }, { "epoch": 0.19, "learning_rate": 0.000272135754322414, "loss": 0.0276, "step": 36820 }, { "epoch": 0.19, "learning_rate": 0.0002721281866294, "loss": 0.0266, "step": 36830 }, { "epoch": 0.19, "learning_rate": 0.00027212061893638597, "loss": 0.0258, "step": 36840 }, { "epoch": 0.19, "learning_rate": 0.00027211305124337195, "loss": 0.0262, "step": 36850 }, { "epoch": 0.19, "learning_rate": 0.00027210548355035793, "loss": 0.0253, "step": 36860 }, { "epoch": 0.19, "learning_rate": 0.0002720979158573439, "loss": 0.028, "step": 36870 }, { "epoch": 0.19, "learning_rate": 0.00027209034816432995, "loss": 0.0239, "step": 36880 }, { "epoch": 0.19, "learning_rate": 0.0002720827804713159, "loss": 0.0191, "step": 36890 }, { "epoch": 0.19, "learning_rate": 0.0002720752127783019, "loss": 0.0267, "step": 36900 }, { "epoch": 0.19, "learning_rate": 0.0002720676450852879, "loss": 0.0195, "step": 36910 }, { "epoch": 0.19, "learning_rate": 0.00027206007739227387, "loss": 0.0199, "step": 36920 }, { "epoch": 0.19, "learning_rate": 0.00027205250969925985, "loss": 0.02, "step": 36930 }, { "epoch": 0.19, "learning_rate": 0.00027204494200624583, "loss": 0.0271, "step": 36940 }, { "epoch": 0.19, "learning_rate": 0.00027203737431323187, "loss": 0.021, "step": 36950 }, { "epoch": 0.19, "learning_rate": 0.00027202980662021785, "loss": 0.0229, "step": 36960 }, { "epoch": 0.19, "learning_rate": 0.00027202223892720383, "loss": 0.0295, "step": 36970 }, { "epoch": 0.19, "learning_rate": 0.0002720146712341898, "loss": 0.0239, "step": 36980 }, { "epoch": 0.19, "learning_rate": 0.0002720071035411758, "loss": 0.0301, "step": 36990 }, { "epoch": 0.19, "learning_rate": 0.0002719995358481618, "loss": 0.0227, "step": 37000 }, { "epoch": 0.19, "eval_cer": 0.9144654039225352, "eval_loss": 0.018076682463288307, "eval_runtime": 117.2546, "eval_samples_per_second": 17.057, "eval_steps_per_second": 4.264, "step": 37000 }, { "epoch": 0.19, "learning_rate": 0.0002719919681551478, "loss": 0.0242, "step": 37010 }, { "epoch": 0.19, "learning_rate": 0.0002719844004621338, "loss": 0.0248, "step": 37020 }, { "epoch": 0.19, "learning_rate": 0.0002719768327691198, "loss": 0.0234, "step": 37030 }, { "epoch": 0.19, "learning_rate": 0.00027196926507610576, "loss": 0.0233, "step": 37040 }, { "epoch": 0.19, "learning_rate": 0.00027196169738309174, "loss": 0.022, "step": 37050 }, { "epoch": 0.19, "learning_rate": 0.0002719541296900777, "loss": 0.0241, "step": 37060 }, { "epoch": 0.19, "learning_rate": 0.0002719465619970637, "loss": 0.0235, "step": 37070 }, { "epoch": 0.19, "learning_rate": 0.0002719389943040497, "loss": 0.0225, "step": 37080 }, { "epoch": 0.19, "learning_rate": 0.00027193142661103566, "loss": 0.0228, "step": 37090 }, { "epoch": 0.19, "learning_rate": 0.00027192385891802165, "loss": 0.0285, "step": 37100 }, { "epoch": 0.19, "learning_rate": 0.00027191629122500763, "loss": 0.0269, "step": 37110 }, { "epoch": 0.19, "learning_rate": 0.00027190872353199366, "loss": 0.0351, "step": 37120 }, { "epoch": 0.19, "learning_rate": 0.00027190115583897964, "loss": 0.022, "step": 37130 }, { "epoch": 0.19, "learning_rate": 0.0002718935881459656, "loss": 0.0265, "step": 37140 }, { "epoch": 0.19, "learning_rate": 0.0002718860204529516, "loss": 0.0259, "step": 37150 }, { "epoch": 0.19, "learning_rate": 0.0002718784527599376, "loss": 0.0287, "step": 37160 }, { "epoch": 0.19, "learning_rate": 0.00027187088506692357, "loss": 0.0231, "step": 37170 }, { "epoch": 0.19, "learning_rate": 0.0002718633173739096, "loss": 0.0226, "step": 37180 }, { "epoch": 0.19, "learning_rate": 0.0002718557496808956, "loss": 0.0229, "step": 37190 }, { "epoch": 0.19, "learning_rate": 0.00027184818198788157, "loss": 0.0229, "step": 37200 }, { "epoch": 0.19, "learning_rate": 0.00027184061429486755, "loss": 0.0209, "step": 37210 }, { "epoch": 0.19, "learning_rate": 0.00027183304660185353, "loss": 0.0271, "step": 37220 }, { "epoch": 0.19, "learning_rate": 0.0002718254789088395, "loss": 0.0244, "step": 37230 }, { "epoch": 0.19, "learning_rate": 0.00027181791121582555, "loss": 0.0243, "step": 37240 }, { "epoch": 0.19, "learning_rate": 0.00027181034352281153, "loss": 0.0232, "step": 37250 }, { "epoch": 0.19, "learning_rate": 0.0002718027758297975, "loss": 0.0268, "step": 37260 }, { "epoch": 0.19, "learning_rate": 0.0002717952081367835, "loss": 0.0252, "step": 37270 }, { "epoch": 0.19, "learning_rate": 0.0002717876404437695, "loss": 0.0229, "step": 37280 }, { "epoch": 0.19, "learning_rate": 0.00027178007275075546, "loss": 0.0231, "step": 37290 }, { "epoch": 0.19, "learning_rate": 0.00027177250505774144, "loss": 0.0274, "step": 37300 }, { "epoch": 0.19, "learning_rate": 0.00027176493736472747, "loss": 0.0264, "step": 37310 }, { "epoch": 0.19, "learning_rate": 0.00027175736967171345, "loss": 0.0235, "step": 37320 }, { "epoch": 0.19, "learning_rate": 0.00027174980197869944, "loss": 0.0239, "step": 37330 }, { "epoch": 0.19, "learning_rate": 0.0002717422342856854, "loss": 0.0247, "step": 37340 }, { "epoch": 0.19, "learning_rate": 0.0002717346665926714, "loss": 0.0207, "step": 37350 }, { "epoch": 0.19, "learning_rate": 0.0002717270988996574, "loss": 0.024, "step": 37360 }, { "epoch": 0.19, "learning_rate": 0.0002717195312066434, "loss": 0.023, "step": 37370 }, { "epoch": 0.19, "learning_rate": 0.0002717119635136294, "loss": 0.0235, "step": 37380 }, { "epoch": 0.19, "learning_rate": 0.0002717043958206154, "loss": 0.0214, "step": 37390 }, { "epoch": 0.19, "learning_rate": 0.00027169682812760136, "loss": 0.0215, "step": 37400 }, { "epoch": 0.19, "learning_rate": 0.00027168926043458734, "loss": 0.0285, "step": 37410 }, { "epoch": 0.19, "learning_rate": 0.0002716816927415733, "loss": 0.0205, "step": 37420 }, { "epoch": 0.19, "learning_rate": 0.00027167412504855936, "loss": 0.0256, "step": 37430 }, { "epoch": 0.19, "learning_rate": 0.00027166655735554534, "loss": 0.0243, "step": 37440 }, { "epoch": 0.19, "learning_rate": 0.0002716589896625313, "loss": 0.0226, "step": 37450 }, { "epoch": 0.19, "learning_rate": 0.0002716514219695173, "loss": 0.0223, "step": 37460 }, { "epoch": 0.19, "learning_rate": 0.0002716438542765033, "loss": 0.0222, "step": 37470 }, { "epoch": 0.19, "learning_rate": 0.00027163628658348927, "loss": 0.0239, "step": 37480 }, { "epoch": 0.19, "learning_rate": 0.00027162871889047525, "loss": 0.0225, "step": 37490 }, { "epoch": 0.19, "learning_rate": 0.0002716211511974613, "loss": 0.0236, "step": 37500 }, { "epoch": 0.19, "learning_rate": 0.00027161358350444726, "loss": 0.0356, "step": 37510 }, { "epoch": 0.19, "learning_rate": 0.00027160601581143325, "loss": 0.0258, "step": 37520 }, { "epoch": 0.19, "learning_rate": 0.00027159844811841923, "loss": 0.0573, "step": 37530 }, { "epoch": 0.19, "learning_rate": 0.0002715908804254052, "loss": 0.0224, "step": 37540 }, { "epoch": 0.19, "learning_rate": 0.0002715833127323912, "loss": 0.029, "step": 37550 }, { "epoch": 0.19, "learning_rate": 0.0002715757450393772, "loss": 0.0239, "step": 37560 }, { "epoch": 0.19, "learning_rate": 0.0002715681773463632, "loss": 0.0277, "step": 37570 }, { "epoch": 0.19, "learning_rate": 0.0002715606096533492, "loss": 0.0256, "step": 37580 }, { "epoch": 0.19, "learning_rate": 0.00027155304196033517, "loss": 0.0228, "step": 37590 }, { "epoch": 0.19, "learning_rate": 0.00027154547426732115, "loss": 0.0249, "step": 37600 }, { "epoch": 0.19, "learning_rate": 0.00027153790657430713, "loss": 0.0267, "step": 37610 }, { "epoch": 0.19, "learning_rate": 0.0002715303388812931, "loss": 0.0274, "step": 37620 }, { "epoch": 0.19, "learning_rate": 0.00027152277118827915, "loss": 0.0216, "step": 37630 }, { "epoch": 0.19, "learning_rate": 0.00027151520349526513, "loss": 0.0267, "step": 37640 }, { "epoch": 0.19, "learning_rate": 0.0002715076358022511, "loss": 0.0227, "step": 37650 }, { "epoch": 0.19, "learning_rate": 0.0002715000681092371, "loss": 0.0254, "step": 37660 }, { "epoch": 0.19, "learning_rate": 0.0002714925004162231, "loss": 0.0251, "step": 37670 }, { "epoch": 0.19, "learning_rate": 0.00027148493272320906, "loss": 0.0245, "step": 37680 }, { "epoch": 0.19, "learning_rate": 0.0002714773650301951, "loss": 0.0204, "step": 37690 }, { "epoch": 0.19, "learning_rate": 0.0002714697973371811, "loss": 0.0244, "step": 37700 }, { "epoch": 0.19, "learning_rate": 0.00027146222964416706, "loss": 0.0219, "step": 37710 }, { "epoch": 0.19, "learning_rate": 0.00027145466195115304, "loss": 0.0314, "step": 37720 }, { "epoch": 0.19, "learning_rate": 0.000271447094258139, "loss": 0.0242, "step": 37730 }, { "epoch": 0.19, "learning_rate": 0.000271439526565125, "loss": 0.0268, "step": 37740 }, { "epoch": 0.19, "learning_rate": 0.00027143195887211104, "loss": 0.0227, "step": 37750 }, { "epoch": 0.19, "learning_rate": 0.000271424391179097, "loss": 0.0201, "step": 37760 }, { "epoch": 0.19, "learning_rate": 0.000271416823486083, "loss": 0.0246, "step": 37770 }, { "epoch": 0.19, "learning_rate": 0.000271409255793069, "loss": 0.0236, "step": 37780 }, { "epoch": 0.19, "learning_rate": 0.00027140168810005496, "loss": 0.0226, "step": 37790 }, { "epoch": 0.19, "learning_rate": 0.00027139412040704094, "loss": 0.0216, "step": 37800 }, { "epoch": 0.19, "learning_rate": 0.0002713865527140269, "loss": 0.0255, "step": 37810 }, { "epoch": 0.19, "learning_rate": 0.00027137898502101296, "loss": 0.0256, "step": 37820 }, { "epoch": 0.19, "learning_rate": 0.00027137141732799894, "loss": 0.0245, "step": 37830 }, { "epoch": 0.19, "learning_rate": 0.0002713638496349849, "loss": 0.0247, "step": 37840 }, { "epoch": 0.19, "learning_rate": 0.0002713562819419709, "loss": 0.0286, "step": 37850 }, { "epoch": 0.19, "learning_rate": 0.0002713487142489569, "loss": 0.0241, "step": 37860 }, { "epoch": 0.19, "learning_rate": 0.00027134114655594287, "loss": 0.0217, "step": 37870 }, { "epoch": 0.19, "learning_rate": 0.0002713335788629289, "loss": 0.0241, "step": 37880 }, { "epoch": 0.19, "learning_rate": 0.0002713260111699149, "loss": 0.0218, "step": 37890 }, { "epoch": 0.19, "learning_rate": 0.00027131844347690087, "loss": 0.0275, "step": 37900 }, { "epoch": 0.19, "learning_rate": 0.00027131087578388685, "loss": 0.0215, "step": 37910 }, { "epoch": 0.19, "learning_rate": 0.00027130330809087283, "loss": 0.0254, "step": 37920 }, { "epoch": 0.19, "learning_rate": 0.0002712957403978588, "loss": 0.0232, "step": 37930 }, { "epoch": 0.19, "learning_rate": 0.00027128817270484485, "loss": 0.024, "step": 37940 }, { "epoch": 0.19, "learning_rate": 0.00027128060501183083, "loss": 0.0253, "step": 37950 }, { "epoch": 0.19, "learning_rate": 0.0002712730373188168, "loss": 0.0263, "step": 37960 }, { "epoch": 0.19, "learning_rate": 0.0002712654696258028, "loss": 0.0271, "step": 37970 }, { "epoch": 0.19, "learning_rate": 0.00027125790193278877, "loss": 0.028, "step": 37980 }, { "epoch": 0.19, "learning_rate": 0.00027125033423977475, "loss": 0.0321, "step": 37990 }, { "epoch": 0.19, "learning_rate": 0.00027124276654676073, "loss": 0.0245, "step": 38000 }, { "epoch": 0.19, "eval_cer": 0.9144780190721654, "eval_loss": 0.018160896375775337, "eval_runtime": 117.0624, "eval_samples_per_second": 17.085, "eval_steps_per_second": 4.271, "step": 38000 }, { "epoch": 0.19, "learning_rate": 0.00027123519885374677, "loss": 0.0257, "step": 38010 }, { "epoch": 0.19, "learning_rate": 0.00027122763116073275, "loss": 0.0244, "step": 38020 }, { "epoch": 0.19, "learning_rate": 0.00027122006346771873, "loss": 0.0204, "step": 38030 }, { "epoch": 0.19, "learning_rate": 0.0002712124957747047, "loss": 0.0242, "step": 38040 }, { "epoch": 0.19, "learning_rate": 0.0002712049280816907, "loss": 0.0324, "step": 38050 }, { "epoch": 0.19, "learning_rate": 0.0002711973603886767, "loss": 0.0269, "step": 38060 }, { "epoch": 0.19, "learning_rate": 0.0002711897926956627, "loss": 0.0237, "step": 38070 }, { "epoch": 0.19, "learning_rate": 0.0002711822250026487, "loss": 0.0293, "step": 38080 }, { "epoch": 0.19, "learning_rate": 0.0002711746573096347, "loss": 0.0288, "step": 38090 }, { "epoch": 0.19, "learning_rate": 0.00027116708961662066, "loss": 0.0234, "step": 38100 }, { "epoch": 0.19, "learning_rate": 0.00027115952192360664, "loss": 0.0216, "step": 38110 }, { "epoch": 0.19, "learning_rate": 0.0002711519542305926, "loss": 0.0203, "step": 38120 }, { "epoch": 0.19, "learning_rate": 0.0002711443865375786, "loss": 0.0267, "step": 38130 }, { "epoch": 0.19, "learning_rate": 0.00027113681884456464, "loss": 0.0253, "step": 38140 }, { "epoch": 0.19, "learning_rate": 0.0002711292511515506, "loss": 0.0211, "step": 38150 }, { "epoch": 0.19, "learning_rate": 0.0002711216834585366, "loss": 0.0251, "step": 38160 }, { "epoch": 0.19, "learning_rate": 0.0002711141157655226, "loss": 0.0225, "step": 38170 }, { "epoch": 0.19, "learning_rate": 0.00027110654807250856, "loss": 0.024, "step": 38180 }, { "epoch": 0.19, "learning_rate": 0.00027109898037949454, "loss": 0.0287, "step": 38190 }, { "epoch": 0.19, "learning_rate": 0.0002710914126864806, "loss": 0.0216, "step": 38200 }, { "epoch": 0.19, "learning_rate": 0.00027108384499346656, "loss": 0.0233, "step": 38210 }, { "epoch": 0.19, "learning_rate": 0.00027107627730045254, "loss": 0.0227, "step": 38220 }, { "epoch": 0.19, "learning_rate": 0.0002710687096074385, "loss": 0.0231, "step": 38230 }, { "epoch": 0.19, "learning_rate": 0.0002710611419144245, "loss": 0.0255, "step": 38240 }, { "epoch": 0.19, "learning_rate": 0.0002710535742214105, "loss": 0.0211, "step": 38250 }, { "epoch": 0.19, "learning_rate": 0.0002710460065283965, "loss": 0.0203, "step": 38260 }, { "epoch": 0.19, "learning_rate": 0.0002710384388353825, "loss": 0.0245, "step": 38270 }, { "epoch": 0.19, "learning_rate": 0.0002710308711423685, "loss": 0.025, "step": 38280 }, { "epoch": 0.19, "learning_rate": 0.00027102330344935447, "loss": 0.0281, "step": 38290 }, { "epoch": 0.19, "learning_rate": 0.00027101573575634045, "loss": 0.021, "step": 38300 }, { "epoch": 0.19, "learning_rate": 0.00027100816806332643, "loss": 0.023, "step": 38310 }, { "epoch": 0.19, "learning_rate": 0.0002710006003703124, "loss": 0.0235, "step": 38320 }, { "epoch": 0.19, "learning_rate": 0.00027099303267729845, "loss": 0.0246, "step": 38330 }, { "epoch": 0.19, "learning_rate": 0.0002709854649842844, "loss": 0.0232, "step": 38340 }, { "epoch": 0.19, "learning_rate": 0.00027097789729127036, "loss": 0.0277, "step": 38350 }, { "epoch": 0.19, "learning_rate": 0.00027097032959825634, "loss": 0.0221, "step": 38360 }, { "epoch": 0.19, "learning_rate": 0.0002709627619052424, "loss": 0.0253, "step": 38370 }, { "epoch": 0.19, "learning_rate": 0.00027095519421222835, "loss": 0.0246, "step": 38380 }, { "epoch": 0.19, "learning_rate": 0.00027094762651921434, "loss": 0.0213, "step": 38390 }, { "epoch": 0.19, "learning_rate": 0.0002709400588262003, "loss": 0.0234, "step": 38400 }, { "epoch": 0.19, "learning_rate": 0.0002709324911331863, "loss": 0.0238, "step": 38410 }, { "epoch": 0.19, "learning_rate": 0.0002709249234401723, "loss": 0.0233, "step": 38420 }, { "epoch": 0.19, "learning_rate": 0.0002709173557471583, "loss": 0.0229, "step": 38430 }, { "epoch": 0.19, "learning_rate": 0.0002709097880541443, "loss": 0.0246, "step": 38440 }, { "epoch": 0.19, "learning_rate": 0.0002709022203611303, "loss": 0.0203, "step": 38450 }, { "epoch": 0.19, "learning_rate": 0.00027089465266811626, "loss": 0.0255, "step": 38460 }, { "epoch": 0.19, "learning_rate": 0.00027088708497510224, "loss": 0.0275, "step": 38470 }, { "epoch": 0.19, "learning_rate": 0.0002708795172820882, "loss": 0.0227, "step": 38480 }, { "epoch": 0.19, "learning_rate": 0.00027087194958907426, "loss": 0.0208, "step": 38490 }, { "epoch": 0.19, "learning_rate": 0.00027086438189606024, "loss": 0.027, "step": 38500 }, { "epoch": 0.19, "learning_rate": 0.0002708568142030462, "loss": 0.0239, "step": 38510 }, { "epoch": 0.19, "learning_rate": 0.0002708492465100322, "loss": 0.0232, "step": 38520 }, { "epoch": 0.19, "learning_rate": 0.0002708416788170182, "loss": 0.0218, "step": 38530 }, { "epoch": 0.19, "learning_rate": 0.00027083411112400417, "loss": 0.023, "step": 38540 }, { "epoch": 0.19, "learning_rate": 0.00027082654343099015, "loss": 0.0222, "step": 38550 }, { "epoch": 0.19, "learning_rate": 0.0002708189757379762, "loss": 0.024, "step": 38560 }, { "epoch": 0.19, "learning_rate": 0.00027081140804496216, "loss": 0.026, "step": 38570 }, { "epoch": 0.19, "learning_rate": 0.00027080384035194815, "loss": 0.0221, "step": 38580 }, { "epoch": 0.19, "learning_rate": 0.00027079627265893413, "loss": 0.0228, "step": 38590 }, { "epoch": 0.19, "learning_rate": 0.0002707887049659201, "loss": 0.0223, "step": 38600 }, { "epoch": 0.19, "learning_rate": 0.0002707811372729061, "loss": 0.0238, "step": 38610 }, { "epoch": 0.19, "learning_rate": 0.0002707735695798921, "loss": 0.0237, "step": 38620 }, { "epoch": 0.19, "learning_rate": 0.0002707660018868781, "loss": 0.0234, "step": 38630 }, { "epoch": 0.19, "learning_rate": 0.0002707584341938641, "loss": 0.0358, "step": 38640 }, { "epoch": 0.19, "learning_rate": 0.00027075086650085007, "loss": 0.023, "step": 38650 }, { "epoch": 0.2, "learning_rate": 0.00027074329880783605, "loss": 0.0247, "step": 38660 }, { "epoch": 0.2, "learning_rate": 0.00027073573111482203, "loss": 0.023, "step": 38670 }, { "epoch": 0.2, "learning_rate": 0.00027072816342180807, "loss": 0.0261, "step": 38680 }, { "epoch": 0.2, "learning_rate": 0.00027072059572879405, "loss": 0.0218, "step": 38690 }, { "epoch": 0.2, "learning_rate": 0.00027071302803578003, "loss": 0.0213, "step": 38700 }, { "epoch": 0.2, "learning_rate": 0.000270705460342766, "loss": 0.0222, "step": 38710 }, { "epoch": 0.2, "learning_rate": 0.000270697892649752, "loss": 0.0201, "step": 38720 }, { "epoch": 0.2, "learning_rate": 0.000270690324956738, "loss": 0.0257, "step": 38730 }, { "epoch": 0.2, "learning_rate": 0.00027068275726372396, "loss": 0.0273, "step": 38740 }, { "epoch": 0.2, "learning_rate": 0.00027067518957071, "loss": 0.0246, "step": 38750 }, { "epoch": 0.2, "learning_rate": 0.000270667621877696, "loss": 0.0204, "step": 38760 }, { "epoch": 0.2, "learning_rate": 0.00027066005418468196, "loss": 0.0256, "step": 38770 }, { "epoch": 0.2, "learning_rate": 0.00027065248649166794, "loss": 0.0281, "step": 38780 }, { "epoch": 0.2, "learning_rate": 0.0002706449187986539, "loss": 0.025, "step": 38790 }, { "epoch": 0.2, "learning_rate": 0.0002706373511056399, "loss": 0.0248, "step": 38800 }, { "epoch": 0.2, "learning_rate": 0.00027062978341262594, "loss": 0.021, "step": 38810 }, { "epoch": 0.2, "learning_rate": 0.0002706222157196119, "loss": 0.022, "step": 38820 }, { "epoch": 0.2, "learning_rate": 0.0002706146480265979, "loss": 0.0228, "step": 38830 }, { "epoch": 0.2, "learning_rate": 0.0002706070803335839, "loss": 0.025, "step": 38840 }, { "epoch": 0.2, "learning_rate": 0.00027059951264056986, "loss": 0.0249, "step": 38850 }, { "epoch": 0.2, "learning_rate": 0.00027059194494755584, "loss": 0.0241, "step": 38860 }, { "epoch": 0.2, "learning_rate": 0.0002705843772545418, "loss": 0.0215, "step": 38870 }, { "epoch": 0.2, "learning_rate": 0.00027057680956152786, "loss": 0.0224, "step": 38880 }, { "epoch": 0.2, "learning_rate": 0.00027056924186851384, "loss": 0.0258, "step": 38890 }, { "epoch": 0.2, "learning_rate": 0.0002705616741754998, "loss": 0.0223, "step": 38900 }, { "epoch": 0.2, "learning_rate": 0.0002705541064824858, "loss": 0.0228, "step": 38910 }, { "epoch": 0.2, "learning_rate": 0.0002705465387894718, "loss": 0.0234, "step": 38920 }, { "epoch": 0.2, "learning_rate": 0.00027053897109645777, "loss": 0.0203, "step": 38930 }, { "epoch": 0.2, "learning_rate": 0.0002705314034034438, "loss": 0.0235, "step": 38940 }, { "epoch": 0.2, "learning_rate": 0.0002705238357104298, "loss": 0.0233, "step": 38950 }, { "epoch": 0.2, "learning_rate": 0.00027051626801741577, "loss": 0.0212, "step": 38960 }, { "epoch": 0.2, "learning_rate": 0.00027050870032440175, "loss": 0.024, "step": 38970 }, { "epoch": 0.2, "learning_rate": 0.00027050113263138773, "loss": 0.0266, "step": 38980 }, { "epoch": 0.2, "learning_rate": 0.0002704935649383737, "loss": 0.0206, "step": 38990 }, { "epoch": 0.2, "learning_rate": 0.00027048599724535975, "loss": 0.0195, "step": 39000 }, { "epoch": 0.2, "eval_cer": 0.9144702559031622, "eval_loss": 0.017209572717547417, "eval_runtime": 117.1365, "eval_samples_per_second": 17.074, "eval_steps_per_second": 4.269, "step": 39000 }, { "epoch": 0.2, "learning_rate": 0.00027047842955234573, "loss": 0.0312, "step": 39010 }, { "epoch": 0.2, "learning_rate": 0.0002704708618593317, "loss": 0.0205, "step": 39020 }, { "epoch": 0.2, "learning_rate": 0.0002704632941663177, "loss": 0.0229, "step": 39030 }, { "epoch": 0.2, "learning_rate": 0.00027045572647330367, "loss": 0.0261, "step": 39040 }, { "epoch": 0.2, "learning_rate": 0.00027044815878028965, "loss": 0.0239, "step": 39050 }, { "epoch": 0.2, "learning_rate": 0.00027044059108727563, "loss": 0.0226, "step": 39060 }, { "epoch": 0.2, "learning_rate": 0.00027043302339426167, "loss": 0.02, "step": 39070 }, { "epoch": 0.2, "learning_rate": 0.00027042545570124765, "loss": 0.0231, "step": 39080 }, { "epoch": 0.2, "learning_rate": 0.00027041788800823363, "loss": 0.0229, "step": 39090 }, { "epoch": 0.2, "learning_rate": 0.0002704103203152196, "loss": 0.0216, "step": 39100 }, { "epoch": 0.2, "learning_rate": 0.0002704027526222056, "loss": 0.0231, "step": 39110 }, { "epoch": 0.2, "learning_rate": 0.0002703951849291916, "loss": 0.0219, "step": 39120 }, { "epoch": 0.2, "learning_rate": 0.0002703876172361776, "loss": 0.0231, "step": 39130 }, { "epoch": 0.2, "learning_rate": 0.0002703800495431636, "loss": 0.0235, "step": 39140 }, { "epoch": 0.2, "learning_rate": 0.0002703724818501496, "loss": 0.0223, "step": 39150 }, { "epoch": 0.2, "learning_rate": 0.00027036491415713556, "loss": 0.0233, "step": 39160 }, { "epoch": 0.2, "learning_rate": 0.00027035734646412154, "loss": 0.0252, "step": 39170 }, { "epoch": 0.2, "learning_rate": 0.0002703497787711075, "loss": 0.0246, "step": 39180 }, { "epoch": 0.2, "learning_rate": 0.00027034221107809356, "loss": 0.0284, "step": 39190 }, { "epoch": 0.2, "learning_rate": 0.00027033464338507954, "loss": 0.0259, "step": 39200 }, { "epoch": 0.2, "learning_rate": 0.0002703270756920655, "loss": 0.0266, "step": 39210 }, { "epoch": 0.2, "learning_rate": 0.0002703195079990515, "loss": 0.0246, "step": 39220 }, { "epoch": 0.2, "learning_rate": 0.0002703119403060375, "loss": 0.0243, "step": 39230 }, { "epoch": 0.2, "learning_rate": 0.00027030437261302346, "loss": 0.024, "step": 39240 }, { "epoch": 0.2, "learning_rate": 0.00027029680492000944, "loss": 0.021, "step": 39250 }, { "epoch": 0.2, "learning_rate": 0.0002702892372269955, "loss": 0.0294, "step": 39260 }, { "epoch": 0.2, "learning_rate": 0.00027028166953398146, "loss": 0.0238, "step": 39270 }, { "epoch": 0.2, "learning_rate": 0.00027027410184096744, "loss": 0.0232, "step": 39280 }, { "epoch": 0.2, "learning_rate": 0.0002702665341479534, "loss": 0.0227, "step": 39290 }, { "epoch": 0.2, "learning_rate": 0.0002702589664549394, "loss": 0.023, "step": 39300 }, { "epoch": 0.2, "learning_rate": 0.0002702513987619254, "loss": 0.0287, "step": 39310 }, { "epoch": 0.2, "learning_rate": 0.0002702438310689114, "loss": 0.0228, "step": 39320 }, { "epoch": 0.2, "learning_rate": 0.0002702362633758974, "loss": 0.0206, "step": 39330 }, { "epoch": 0.2, "learning_rate": 0.0002702286956828834, "loss": 0.0241, "step": 39340 }, { "epoch": 0.2, "learning_rate": 0.00027022112798986937, "loss": 0.0253, "step": 39350 }, { "epoch": 0.2, "learning_rate": 0.00027021356029685535, "loss": 0.0273, "step": 39360 }, { "epoch": 0.2, "learning_rate": 0.00027020599260384133, "loss": 0.0271, "step": 39370 }, { "epoch": 0.2, "learning_rate": 0.0002701984249108273, "loss": 0.0256, "step": 39380 }, { "epoch": 0.2, "learning_rate": 0.00027019085721781335, "loss": 0.0234, "step": 39390 }, { "epoch": 0.2, "learning_rate": 0.00027018328952479933, "loss": 0.0229, "step": 39400 }, { "epoch": 0.2, "learning_rate": 0.0002701757218317853, "loss": 0.025, "step": 39410 }, { "epoch": 0.2, "learning_rate": 0.0002701681541387713, "loss": 0.0244, "step": 39420 }, { "epoch": 0.2, "learning_rate": 0.0002701605864457573, "loss": 0.0249, "step": 39430 }, { "epoch": 0.2, "learning_rate": 0.00027015301875274325, "loss": 0.0284, "step": 39440 }, { "epoch": 0.2, "learning_rate": 0.0002701454510597293, "loss": 0.0252, "step": 39450 }, { "epoch": 0.2, "learning_rate": 0.00027013788336671527, "loss": 0.023, "step": 39460 }, { "epoch": 0.2, "learning_rate": 0.00027013031567370125, "loss": 0.0229, "step": 39470 }, { "epoch": 0.2, "learning_rate": 0.00027012274798068723, "loss": 0.025, "step": 39480 }, { "epoch": 0.2, "learning_rate": 0.0002701151802876732, "loss": 0.0308, "step": 39490 }, { "epoch": 0.2, "learning_rate": 0.0002701076125946592, "loss": 0.0258, "step": 39500 }, { "epoch": 0.2, "learning_rate": 0.00027010004490164523, "loss": 0.024, "step": 39510 }, { "epoch": 0.2, "learning_rate": 0.0002700924772086312, "loss": 0.0216, "step": 39520 }, { "epoch": 0.2, "learning_rate": 0.0002700849095156172, "loss": 0.0224, "step": 39530 }, { "epoch": 0.2, "learning_rate": 0.0002700773418226032, "loss": 0.0296, "step": 39540 }, { "epoch": 0.2, "learning_rate": 0.00027006977412958916, "loss": 0.0229, "step": 39550 }, { "epoch": 0.2, "learning_rate": 0.00027006220643657514, "loss": 0.0238, "step": 39560 }, { "epoch": 0.2, "learning_rate": 0.0002700546387435611, "loss": 0.0227, "step": 39570 }, { "epoch": 0.2, "learning_rate": 0.00027004707105054716, "loss": 0.0227, "step": 39580 }, { "epoch": 0.2, "learning_rate": 0.00027003950335753314, "loss": 0.0235, "step": 39590 }, { "epoch": 0.2, "learning_rate": 0.00027003193566451907, "loss": 0.0265, "step": 39600 }, { "epoch": 0.2, "learning_rate": 0.00027002436797150505, "loss": 0.0229, "step": 39610 }, { "epoch": 0.2, "learning_rate": 0.0002700168002784911, "loss": 0.0259, "step": 39620 }, { "epoch": 0.2, "learning_rate": 0.00027000923258547706, "loss": 0.021, "step": 39630 }, { "epoch": 0.2, "learning_rate": 0.00027000166489246305, "loss": 0.0199, "step": 39640 }, { "epoch": 0.2, "learning_rate": 0.00026999409719944903, "loss": 0.0248, "step": 39650 }, { "epoch": 0.2, "learning_rate": 0.000269986529506435, "loss": 0.0259, "step": 39660 }, { "epoch": 0.2, "learning_rate": 0.000269978961813421, "loss": 0.0222, "step": 39670 }, { "epoch": 0.2, "learning_rate": 0.000269971394120407, "loss": 0.0292, "step": 39680 }, { "epoch": 0.2, "learning_rate": 0.000269963826427393, "loss": 0.0235, "step": 39690 }, { "epoch": 0.2, "learning_rate": 0.000269956258734379, "loss": 0.0219, "step": 39700 }, { "epoch": 0.2, "learning_rate": 0.00026994869104136497, "loss": 0.0204, "step": 39710 }, { "epoch": 0.2, "learning_rate": 0.00026994112334835095, "loss": 0.0247, "step": 39720 }, { "epoch": 0.2, "learning_rate": 0.00026993355565533693, "loss": 0.0252, "step": 39730 }, { "epoch": 0.2, "learning_rate": 0.00026992598796232297, "loss": 0.0226, "step": 39740 }, { "epoch": 0.2, "learning_rate": 0.00026991842026930895, "loss": 0.0288, "step": 39750 }, { "epoch": 0.2, "learning_rate": 0.00026991085257629493, "loss": 0.0283, "step": 39760 }, { "epoch": 0.2, "learning_rate": 0.0002699032848832809, "loss": 0.0258, "step": 39770 }, { "epoch": 0.2, "learning_rate": 0.0002698957171902669, "loss": 0.0237, "step": 39780 }, { "epoch": 0.2, "learning_rate": 0.0002698881494972529, "loss": 0.0233, "step": 39790 }, { "epoch": 0.2, "learning_rate": 0.00026988058180423886, "loss": 0.0244, "step": 39800 }, { "epoch": 0.2, "learning_rate": 0.0002698730141112249, "loss": 0.0241, "step": 39810 }, { "epoch": 0.2, "learning_rate": 0.0002698654464182109, "loss": 0.0213, "step": 39820 }, { "epoch": 0.2, "learning_rate": 0.00026985787872519686, "loss": 0.0202, "step": 39830 }, { "epoch": 0.2, "learning_rate": 0.00026985031103218284, "loss": 0.0214, "step": 39840 }, { "epoch": 0.2, "learning_rate": 0.0002698427433391688, "loss": 0.0229, "step": 39850 }, { "epoch": 0.2, "learning_rate": 0.0002698351756461548, "loss": 0.0242, "step": 39860 }, { "epoch": 0.2, "learning_rate": 0.00026982760795314084, "loss": 0.024, "step": 39870 }, { "epoch": 0.2, "learning_rate": 0.0002698200402601268, "loss": 0.0255, "step": 39880 }, { "epoch": 0.2, "learning_rate": 0.0002698124725671128, "loss": 0.0256, "step": 39890 }, { "epoch": 0.2, "learning_rate": 0.0002698049048740988, "loss": 0.0242, "step": 39900 }, { "epoch": 0.2, "learning_rate": 0.00026979733718108476, "loss": 0.0215, "step": 39910 }, { "epoch": 0.2, "learning_rate": 0.00026978976948807074, "loss": 0.0348, "step": 39920 }, { "epoch": 0.2, "learning_rate": 0.0002697822017950567, "loss": 0.0344, "step": 39930 }, { "epoch": 0.2, "learning_rate": 0.00026977463410204276, "loss": 0.0237, "step": 39940 }, { "epoch": 0.2, "learning_rate": 0.00026976706640902874, "loss": 0.0288, "step": 39950 }, { "epoch": 0.2, "learning_rate": 0.0002697594987160147, "loss": 0.0227, "step": 39960 }, { "epoch": 0.2, "learning_rate": 0.0002697519310230007, "loss": 0.0276, "step": 39970 }, { "epoch": 0.2, "learning_rate": 0.0002697443633299867, "loss": 0.0226, "step": 39980 }, { "epoch": 0.2, "learning_rate": 0.00026973679563697267, "loss": 0.0191, "step": 39990 }, { "epoch": 0.2, "learning_rate": 0.0002697292279439587, "loss": 0.0253, "step": 40000 }, { "epoch": 0.2, "eval_cer": 0.9144896638256703, "eval_loss": 0.017527606338262558, "eval_runtime": 117.0438, "eval_samples_per_second": 17.088, "eval_steps_per_second": 4.272, "step": 40000 }, { "epoch": 0.2, "learning_rate": 0.0002697216602509447, "loss": 0.0219, "step": 40010 }, { "epoch": 0.2, "learning_rate": 0.00026971409255793067, "loss": 0.024, "step": 40020 }, { "epoch": 0.2, "learning_rate": 0.00026970652486491665, "loss": 0.0232, "step": 40030 }, { "epoch": 0.2, "learning_rate": 0.00026969895717190263, "loss": 0.0238, "step": 40040 }, { "epoch": 0.2, "learning_rate": 0.0002696913894788886, "loss": 0.0242, "step": 40050 }, { "epoch": 0.2, "learning_rate": 0.00026968382178587465, "loss": 0.0253, "step": 40060 }, { "epoch": 0.2, "learning_rate": 0.00026967625409286063, "loss": 0.0212, "step": 40070 }, { "epoch": 0.2, "learning_rate": 0.0002696686863998466, "loss": 0.0224, "step": 40080 }, { "epoch": 0.2, "learning_rate": 0.0002696611187068326, "loss": 0.0264, "step": 40090 }, { "epoch": 0.2, "learning_rate": 0.00026965355101381857, "loss": 0.0214, "step": 40100 }, { "epoch": 0.2, "learning_rate": 0.00026964598332080455, "loss": 0.0193, "step": 40110 }, { "epoch": 0.2, "learning_rate": 0.00026963841562779054, "loss": 0.023, "step": 40120 }, { "epoch": 0.2, "learning_rate": 0.00026963084793477657, "loss": 0.0233, "step": 40130 }, { "epoch": 0.2, "learning_rate": 0.00026962328024176255, "loss": 0.0214, "step": 40140 }, { "epoch": 0.2, "learning_rate": 0.00026961571254874853, "loss": 0.0225, "step": 40150 }, { "epoch": 0.2, "learning_rate": 0.0002696081448557345, "loss": 0.0234, "step": 40160 }, { "epoch": 0.2, "learning_rate": 0.0002696005771627205, "loss": 0.0214, "step": 40170 }, { "epoch": 0.2, "learning_rate": 0.0002695930094697065, "loss": 0.021, "step": 40180 }, { "epoch": 0.2, "learning_rate": 0.0002695854417766925, "loss": 0.0198, "step": 40190 }, { "epoch": 0.2, "learning_rate": 0.0002695778740836785, "loss": 0.023, "step": 40200 }, { "epoch": 0.2, "learning_rate": 0.0002695703063906645, "loss": 0.0218, "step": 40210 }, { "epoch": 0.2, "learning_rate": 0.00026956273869765046, "loss": 0.021, "step": 40220 }, { "epoch": 0.2, "learning_rate": 0.00026955517100463644, "loss": 0.021, "step": 40230 }, { "epoch": 0.2, "learning_rate": 0.0002695476033116224, "loss": 0.0228, "step": 40240 }, { "epoch": 0.2, "learning_rate": 0.00026954003561860846, "loss": 0.018, "step": 40250 }, { "epoch": 0.2, "learning_rate": 0.00026953246792559444, "loss": 0.0233, "step": 40260 }, { "epoch": 0.2, "learning_rate": 0.0002695249002325804, "loss": 0.0248, "step": 40270 }, { "epoch": 0.2, "learning_rate": 0.0002695173325395664, "loss": 0.0231, "step": 40280 }, { "epoch": 0.2, "learning_rate": 0.0002695097648465524, "loss": 0.0194, "step": 40290 }, { "epoch": 0.2, "learning_rate": 0.00026950219715353836, "loss": 0.0268, "step": 40300 }, { "epoch": 0.2, "learning_rate": 0.00026949462946052435, "loss": 0.0225, "step": 40310 }, { "epoch": 0.2, "learning_rate": 0.0002694870617675104, "loss": 0.021, "step": 40320 }, { "epoch": 0.2, "learning_rate": 0.00026947949407449636, "loss": 0.0212, "step": 40330 }, { "epoch": 0.2, "learning_rate": 0.00026947192638148234, "loss": 0.0196, "step": 40340 }, { "epoch": 0.2, "learning_rate": 0.0002694643586884683, "loss": 0.0207, "step": 40350 }, { "epoch": 0.2, "learning_rate": 0.0002694567909954543, "loss": 0.0239, "step": 40360 }, { "epoch": 0.2, "learning_rate": 0.0002694492233024403, "loss": 0.0247, "step": 40370 }, { "epoch": 0.2, "learning_rate": 0.0002694416556094263, "loss": 0.0192, "step": 40380 }, { "epoch": 0.2, "learning_rate": 0.0002694340879164123, "loss": 0.023, "step": 40390 }, { "epoch": 0.2, "learning_rate": 0.0002694265202233983, "loss": 0.0229, "step": 40400 }, { "epoch": 0.2, "learning_rate": 0.00026941895253038427, "loss": 0.0219, "step": 40410 }, { "epoch": 0.2, "learning_rate": 0.00026941138483737025, "loss": 0.0203, "step": 40420 }, { "epoch": 0.2, "learning_rate": 0.00026940381714435623, "loss": 0.0248, "step": 40430 }, { "epoch": 0.2, "learning_rate": 0.0002693962494513422, "loss": 0.0201, "step": 40440 }, { "epoch": 0.2, "learning_rate": 0.00026938868175832825, "loss": 0.0244, "step": 40450 }, { "epoch": 0.2, "learning_rate": 0.00026938111406531423, "loss": 0.0253, "step": 40460 }, { "epoch": 0.2, "learning_rate": 0.0002693735463723002, "loss": 0.0213, "step": 40470 }, { "epoch": 0.2, "learning_rate": 0.0002693659786792862, "loss": 0.0182, "step": 40480 }, { "epoch": 0.2, "learning_rate": 0.0002693584109862722, "loss": 0.0214, "step": 40490 }, { "epoch": 0.2, "learning_rate": 0.00026935084329325816, "loss": 0.0233, "step": 40500 }, { "epoch": 0.2, "learning_rate": 0.0002693432756002442, "loss": 0.0219, "step": 40510 }, { "epoch": 0.2, "learning_rate": 0.00026933570790723017, "loss": 0.0238, "step": 40520 }, { "epoch": 0.2, "learning_rate": 0.00026932814021421615, "loss": 0.0237, "step": 40530 }, { "epoch": 0.2, "learning_rate": 0.00026932057252120214, "loss": 0.027, "step": 40540 }, { "epoch": 0.2, "learning_rate": 0.0002693130048281881, "loss": 0.027, "step": 40550 }, { "epoch": 0.2, "learning_rate": 0.0002693054371351741, "loss": 0.0249, "step": 40560 }, { "epoch": 0.2, "learning_rate": 0.00026929786944216013, "loss": 0.0266, "step": 40570 }, { "epoch": 0.2, "learning_rate": 0.0002692903017491461, "loss": 0.0279, "step": 40580 }, { "epoch": 0.2, "learning_rate": 0.0002692827340561321, "loss": 0.0205, "step": 40590 }, { "epoch": 0.2, "learning_rate": 0.0002692751663631181, "loss": 0.0219, "step": 40600 }, { "epoch": 0.2, "learning_rate": 0.00026926759867010406, "loss": 0.0209, "step": 40610 }, { "epoch": 0.2, "learning_rate": 0.00026926003097709004, "loss": 0.0262, "step": 40620 }, { "epoch": 0.2, "learning_rate": 0.000269252463284076, "loss": 0.022, "step": 40630 }, { "epoch": 0.21, "learning_rate": 0.00026924489559106206, "loss": 0.0214, "step": 40640 }, { "epoch": 0.21, "learning_rate": 0.00026923732789804804, "loss": 0.0227, "step": 40650 }, { "epoch": 0.21, "learning_rate": 0.000269229760205034, "loss": 0.0242, "step": 40660 }, { "epoch": 0.21, "learning_rate": 0.00026922219251202, "loss": 0.0278, "step": 40670 }, { "epoch": 0.21, "learning_rate": 0.000269214624819006, "loss": 0.0184, "step": 40680 }, { "epoch": 0.21, "learning_rate": 0.00026920705712599197, "loss": 0.0232, "step": 40690 }, { "epoch": 0.21, "learning_rate": 0.000269199489432978, "loss": 0.0224, "step": 40700 }, { "epoch": 0.21, "learning_rate": 0.000269191921739964, "loss": 0.0214, "step": 40710 }, { "epoch": 0.21, "learning_rate": 0.00026918435404694996, "loss": 0.0192, "step": 40720 }, { "epoch": 0.21, "learning_rate": 0.00026917678635393595, "loss": 0.0214, "step": 40730 }, { "epoch": 0.21, "learning_rate": 0.0002691692186609219, "loss": 0.0217, "step": 40740 }, { "epoch": 0.21, "learning_rate": 0.0002691616509679079, "loss": 0.0259, "step": 40750 }, { "epoch": 0.21, "learning_rate": 0.00026915408327489394, "loss": 0.0215, "step": 40760 }, { "epoch": 0.21, "learning_rate": 0.0002691465155818799, "loss": 0.0231, "step": 40770 }, { "epoch": 0.21, "learning_rate": 0.0002691389478888659, "loss": 0.0236, "step": 40780 }, { "epoch": 0.21, "learning_rate": 0.0002691313801958519, "loss": 0.0194, "step": 40790 }, { "epoch": 0.21, "learning_rate": 0.00026912381250283787, "loss": 0.0237, "step": 40800 }, { "epoch": 0.21, "learning_rate": 0.00026911624480982385, "loss": 0.0226, "step": 40810 }, { "epoch": 0.21, "learning_rate": 0.00026910867711680983, "loss": 0.0246, "step": 40820 }, { "epoch": 0.21, "learning_rate": 0.00026910110942379587, "loss": 0.0228, "step": 40830 }, { "epoch": 0.21, "learning_rate": 0.00026909354173078185, "loss": 0.0255, "step": 40840 }, { "epoch": 0.21, "learning_rate": 0.0002690859740377678, "loss": 0.0248, "step": 40850 }, { "epoch": 0.21, "learning_rate": 0.00026907840634475376, "loss": 0.0238, "step": 40860 }, { "epoch": 0.21, "learning_rate": 0.0002690708386517398, "loss": 0.0216, "step": 40870 }, { "epoch": 0.21, "learning_rate": 0.0002690632709587258, "loss": 0.0244, "step": 40880 }, { "epoch": 0.21, "learning_rate": 0.00026905570326571176, "loss": 0.0219, "step": 40890 }, { "epoch": 0.21, "learning_rate": 0.00026904813557269774, "loss": 0.024, "step": 40900 }, { "epoch": 0.21, "learning_rate": 0.0002690405678796837, "loss": 0.0252, "step": 40910 }, { "epoch": 0.21, "learning_rate": 0.0002690330001866697, "loss": 0.0234, "step": 40920 }, { "epoch": 0.21, "learning_rate": 0.00026902543249365574, "loss": 0.0234, "step": 40930 }, { "epoch": 0.21, "learning_rate": 0.0002690178648006417, "loss": 0.0217, "step": 40940 }, { "epoch": 0.21, "learning_rate": 0.0002690102971076277, "loss": 0.0212, "step": 40950 }, { "epoch": 0.21, "learning_rate": 0.0002690027294146137, "loss": 0.0267, "step": 40960 }, { "epoch": 0.21, "learning_rate": 0.00026899516172159966, "loss": 0.0248, "step": 40970 }, { "epoch": 0.21, "learning_rate": 0.00026898759402858564, "loss": 0.025, "step": 40980 }, { "epoch": 0.21, "learning_rate": 0.0002689800263355716, "loss": 0.0233, "step": 40990 }, { "epoch": 0.21, "learning_rate": 0.00026897245864255766, "loss": 0.0207, "step": 41000 }, { "epoch": 0.21, "eval_cer": 0.914467344714786, "eval_loss": 0.01699613220989704, "eval_runtime": 117.194, "eval_samples_per_second": 17.066, "eval_steps_per_second": 4.266, "step": 41000 }, { "epoch": 0.21, "learning_rate": 0.00026896489094954364, "loss": 0.0217, "step": 41010 }, { "epoch": 0.21, "learning_rate": 0.0002689573232565296, "loss": 0.0221, "step": 41020 }, { "epoch": 0.21, "learning_rate": 0.0002689497555635156, "loss": 0.023, "step": 41030 }, { "epoch": 0.21, "learning_rate": 0.0002689421878705016, "loss": 0.0222, "step": 41040 }, { "epoch": 0.21, "learning_rate": 0.00026893462017748757, "loss": 0.0222, "step": 41050 }, { "epoch": 0.21, "learning_rate": 0.0002689270524844736, "loss": 0.0221, "step": 41060 }, { "epoch": 0.21, "learning_rate": 0.0002689194847914596, "loss": 0.0231, "step": 41070 }, { "epoch": 0.21, "learning_rate": 0.00026891191709844557, "loss": 0.0243, "step": 41080 }, { "epoch": 0.21, "learning_rate": 0.00026890434940543155, "loss": 0.023, "step": 41090 }, { "epoch": 0.21, "learning_rate": 0.00026889678171241753, "loss": 0.0216, "step": 41100 }, { "epoch": 0.21, "learning_rate": 0.0002688892140194035, "loss": 0.0208, "step": 41110 }, { "epoch": 0.21, "learning_rate": 0.00026888164632638955, "loss": 0.0247, "step": 41120 }, { "epoch": 0.21, "learning_rate": 0.00026887407863337553, "loss": 0.0211, "step": 41130 }, { "epoch": 0.21, "learning_rate": 0.0002688665109403615, "loss": 0.0257, "step": 41140 }, { "epoch": 0.21, "learning_rate": 0.0002688589432473475, "loss": 0.025, "step": 41150 }, { "epoch": 0.21, "learning_rate": 0.00026885137555433347, "loss": 0.0201, "step": 41160 }, { "epoch": 0.21, "learning_rate": 0.00026884380786131945, "loss": 0.0224, "step": 41170 }, { "epoch": 0.21, "learning_rate": 0.00026883624016830544, "loss": 0.0261, "step": 41180 }, { "epoch": 0.21, "learning_rate": 0.00026882867247529147, "loss": 0.0214, "step": 41190 }, { "epoch": 0.21, "learning_rate": 0.00026882110478227745, "loss": 0.0231, "step": 41200 }, { "epoch": 0.21, "learning_rate": 0.00026881353708926343, "loss": 0.0228, "step": 41210 }, { "epoch": 0.21, "learning_rate": 0.0002688059693962494, "loss": 0.0238, "step": 41220 }, { "epoch": 0.21, "learning_rate": 0.0002687984017032354, "loss": 0.023, "step": 41230 }, { "epoch": 0.21, "learning_rate": 0.0002687908340102214, "loss": 0.022, "step": 41240 }, { "epoch": 0.21, "learning_rate": 0.0002687832663172074, "loss": 0.0272, "step": 41250 }, { "epoch": 0.21, "learning_rate": 0.0002687756986241934, "loss": 0.0235, "step": 41260 }, { "epoch": 0.21, "learning_rate": 0.0002687681309311794, "loss": 0.0283, "step": 41270 }, { "epoch": 0.21, "learning_rate": 0.00026876056323816536, "loss": 0.0257, "step": 41280 }, { "epoch": 0.21, "learning_rate": 0.00026875299554515134, "loss": 0.0235, "step": 41290 }, { "epoch": 0.21, "learning_rate": 0.0002687454278521373, "loss": 0.0202, "step": 41300 }, { "epoch": 0.21, "learning_rate": 0.00026873786015912336, "loss": 0.0221, "step": 41310 }, { "epoch": 0.21, "learning_rate": 0.00026873029246610934, "loss": 0.029, "step": 41320 }, { "epoch": 0.21, "learning_rate": 0.0002687227247730953, "loss": 0.0238, "step": 41330 }, { "epoch": 0.21, "learning_rate": 0.0002687151570800813, "loss": 0.024, "step": 41340 }, { "epoch": 0.21, "learning_rate": 0.0002687075893870673, "loss": 0.0215, "step": 41350 }, { "epoch": 0.21, "learning_rate": 0.00026870002169405326, "loss": 0.0202, "step": 41360 }, { "epoch": 0.21, "learning_rate": 0.00026869245400103925, "loss": 0.026, "step": 41370 }, { "epoch": 0.21, "learning_rate": 0.0002686848863080253, "loss": 0.026, "step": 41380 }, { "epoch": 0.21, "learning_rate": 0.00026867731861501126, "loss": 0.0239, "step": 41390 }, { "epoch": 0.21, "learning_rate": 0.00026866975092199724, "loss": 0.0218, "step": 41400 }, { "epoch": 0.21, "learning_rate": 0.0002686621832289832, "loss": 0.0221, "step": 41410 }, { "epoch": 0.21, "learning_rate": 0.0002686546155359692, "loss": 0.0244, "step": 41420 }, { "epoch": 0.21, "learning_rate": 0.0002686470478429552, "loss": 0.0188, "step": 41430 }, { "epoch": 0.21, "learning_rate": 0.0002686394801499412, "loss": 0.0235, "step": 41440 }, { "epoch": 0.21, "learning_rate": 0.0002686319124569272, "loss": 0.0242, "step": 41450 }, { "epoch": 0.21, "learning_rate": 0.0002686243447639132, "loss": 0.0242, "step": 41460 }, { "epoch": 0.21, "learning_rate": 0.00026861677707089917, "loss": 0.02, "step": 41470 }, { "epoch": 0.21, "learning_rate": 0.00026860920937788515, "loss": 0.0226, "step": 41480 }, { "epoch": 0.21, "learning_rate": 0.00026860164168487113, "loss": 0.0202, "step": 41490 }, { "epoch": 0.21, "learning_rate": 0.0002685940739918571, "loss": 0.0231, "step": 41500 }, { "epoch": 0.21, "learning_rate": 0.00026858650629884315, "loss": 0.0227, "step": 41510 }, { "epoch": 0.21, "learning_rate": 0.00026857893860582913, "loss": 0.0243, "step": 41520 }, { "epoch": 0.21, "learning_rate": 0.0002685713709128151, "loss": 0.0223, "step": 41530 }, { "epoch": 0.21, "learning_rate": 0.0002685638032198011, "loss": 0.0314, "step": 41540 }, { "epoch": 0.21, "learning_rate": 0.0002685562355267871, "loss": 0.0217, "step": 41550 }, { "epoch": 0.21, "learning_rate": 0.00026854866783377306, "loss": 0.0286, "step": 41560 }, { "epoch": 0.21, "learning_rate": 0.0002685411001407591, "loss": 0.0293, "step": 41570 }, { "epoch": 0.21, "learning_rate": 0.00026853353244774507, "loss": 0.0253, "step": 41580 }, { "epoch": 0.21, "learning_rate": 0.00026852596475473105, "loss": 0.0232, "step": 41590 }, { "epoch": 0.21, "learning_rate": 0.00026851839706171704, "loss": 0.0243, "step": 41600 }, { "epoch": 0.21, "learning_rate": 0.000268510829368703, "loss": 0.0246, "step": 41610 }, { "epoch": 0.21, "learning_rate": 0.000268503261675689, "loss": 0.0231, "step": 41620 }, { "epoch": 0.21, "learning_rate": 0.00026849569398267503, "loss": 0.0237, "step": 41630 }, { "epoch": 0.21, "learning_rate": 0.000268488126289661, "loss": 0.0277, "step": 41640 }, { "epoch": 0.21, "learning_rate": 0.000268480558596647, "loss": 0.0246, "step": 41650 }, { "epoch": 0.21, "learning_rate": 0.000268472990903633, "loss": 0.0216, "step": 41660 }, { "epoch": 0.21, "learning_rate": 0.00026846542321061896, "loss": 0.0244, "step": 41670 }, { "epoch": 0.21, "learning_rate": 0.00026845785551760494, "loss": 0.0221, "step": 41680 }, { "epoch": 0.21, "learning_rate": 0.0002684502878245909, "loss": 0.0221, "step": 41690 }, { "epoch": 0.21, "learning_rate": 0.00026844272013157696, "loss": 0.026, "step": 41700 }, { "epoch": 0.21, "learning_rate": 0.00026843515243856294, "loss": 0.0245, "step": 41710 }, { "epoch": 0.21, "learning_rate": 0.0002684275847455489, "loss": 0.0195, "step": 41720 }, { "epoch": 0.21, "learning_rate": 0.0002684200170525349, "loss": 0.0212, "step": 41730 }, { "epoch": 0.21, "learning_rate": 0.0002684124493595209, "loss": 0.0242, "step": 41740 }, { "epoch": 0.21, "learning_rate": 0.00026840488166650687, "loss": 0.0231, "step": 41750 }, { "epoch": 0.21, "learning_rate": 0.0002683973139734929, "loss": 0.0249, "step": 41760 }, { "epoch": 0.21, "learning_rate": 0.0002683897462804789, "loss": 0.0244, "step": 41770 }, { "epoch": 0.21, "learning_rate": 0.00026838217858746486, "loss": 0.0243, "step": 41780 }, { "epoch": 0.21, "learning_rate": 0.00026837461089445085, "loss": 0.0263, "step": 41790 }, { "epoch": 0.21, "learning_rate": 0.0002683670432014368, "loss": 0.0243, "step": 41800 }, { "epoch": 0.21, "learning_rate": 0.0002683594755084228, "loss": 0.0245, "step": 41810 }, { "epoch": 0.21, "learning_rate": 0.00026835190781540884, "loss": 0.0203, "step": 41820 }, { "epoch": 0.21, "learning_rate": 0.0002683443401223948, "loss": 0.0245, "step": 41830 }, { "epoch": 0.21, "learning_rate": 0.0002683367724293808, "loss": 0.0206, "step": 41840 }, { "epoch": 0.21, "learning_rate": 0.0002683292047363668, "loss": 0.0231, "step": 41850 }, { "epoch": 0.21, "learning_rate": 0.00026832163704335277, "loss": 0.0256, "step": 41860 }, { "epoch": 0.21, "learning_rate": 0.00026831406935033875, "loss": 0.0225, "step": 41870 }, { "epoch": 0.21, "learning_rate": 0.00026830650165732473, "loss": 0.022, "step": 41880 }, { "epoch": 0.21, "learning_rate": 0.00026829893396431077, "loss": 0.0211, "step": 41890 }, { "epoch": 0.21, "learning_rate": 0.00026829136627129675, "loss": 0.0196, "step": 41900 }, { "epoch": 0.21, "learning_rate": 0.00026828379857828273, "loss": 0.0222, "step": 41910 }, { "epoch": 0.21, "learning_rate": 0.0002682762308852687, "loss": 0.0221, "step": 41920 }, { "epoch": 0.21, "learning_rate": 0.0002682686631922547, "loss": 0.0218, "step": 41930 }, { "epoch": 0.21, "learning_rate": 0.0002682610954992407, "loss": 0.0212, "step": 41940 }, { "epoch": 0.21, "learning_rate": 0.0002682535278062267, "loss": 0.0238, "step": 41950 }, { "epoch": 0.21, "learning_rate": 0.0002682459601132127, "loss": 0.0307, "step": 41960 }, { "epoch": 0.21, "learning_rate": 0.0002682383924201987, "loss": 0.0334, "step": 41970 }, { "epoch": 0.21, "learning_rate": 0.00026823082472718466, "loss": 0.0275, "step": 41980 }, { "epoch": 0.21, "learning_rate": 0.00026822325703417064, "loss": 0.0235, "step": 41990 }, { "epoch": 0.21, "learning_rate": 0.0002682156893411566, "loss": 0.0311, "step": 42000 }, { "epoch": 0.21, "eval_cer": 0.9144421144155256, "eval_loss": 0.01655089110136032, "eval_runtime": 117.2639, "eval_samples_per_second": 17.056, "eval_steps_per_second": 4.264, "step": 42000 }, { "epoch": 0.21, "learning_rate": 0.0002682081216481426, "loss": 0.0264, "step": 42010 }, { "epoch": 0.21, "learning_rate": 0.00026820055395512864, "loss": 0.0291, "step": 42020 }, { "epoch": 0.21, "learning_rate": 0.0002681929862621146, "loss": 0.0261, "step": 42030 }, { "epoch": 0.21, "learning_rate": 0.0002681854185691006, "loss": 0.0209, "step": 42040 }, { "epoch": 0.21, "learning_rate": 0.0002681778508760866, "loss": 0.0226, "step": 42050 }, { "epoch": 0.21, "learning_rate": 0.00026817028318307256, "loss": 0.0231, "step": 42060 }, { "epoch": 0.21, "learning_rate": 0.00026816271549005854, "loss": 0.0239, "step": 42070 }, { "epoch": 0.21, "learning_rate": 0.0002681551477970446, "loss": 0.0293, "step": 42080 }, { "epoch": 0.21, "learning_rate": 0.00026814758010403056, "loss": 0.0192, "step": 42090 }, { "epoch": 0.21, "learning_rate": 0.00026814001241101654, "loss": 0.0228, "step": 42100 }, { "epoch": 0.21, "learning_rate": 0.00026813244471800247, "loss": 0.0269, "step": 42110 }, { "epoch": 0.21, "learning_rate": 0.0002681248770249885, "loss": 0.0225, "step": 42120 }, { "epoch": 0.21, "learning_rate": 0.0002681173093319745, "loss": 0.024, "step": 42130 }, { "epoch": 0.21, "learning_rate": 0.00026810974163896047, "loss": 0.0257, "step": 42140 }, { "epoch": 0.21, "learning_rate": 0.00026810217394594645, "loss": 0.0231, "step": 42150 }, { "epoch": 0.21, "learning_rate": 0.00026809460625293243, "loss": 0.0231, "step": 42160 }, { "epoch": 0.21, "learning_rate": 0.0002680870385599184, "loss": 0.0223, "step": 42170 }, { "epoch": 0.21, "learning_rate": 0.00026807947086690445, "loss": 0.0225, "step": 42180 }, { "epoch": 0.21, "learning_rate": 0.00026807190317389043, "loss": 0.02, "step": 42190 }, { "epoch": 0.21, "learning_rate": 0.0002680643354808764, "loss": 0.0242, "step": 42200 }, { "epoch": 0.21, "learning_rate": 0.0002680567677878624, "loss": 0.0179, "step": 42210 }, { "epoch": 0.21, "learning_rate": 0.00026804920009484837, "loss": 0.0194, "step": 42220 }, { "epoch": 0.21, "learning_rate": 0.00026804163240183435, "loss": 0.021, "step": 42230 }, { "epoch": 0.21, "learning_rate": 0.00026803406470882034, "loss": 0.018, "step": 42240 }, { "epoch": 0.21, "learning_rate": 0.00026802649701580637, "loss": 0.0221, "step": 42250 }, { "epoch": 0.21, "learning_rate": 0.00026801892932279235, "loss": 0.0242, "step": 42260 }, { "epoch": 0.21, "learning_rate": 0.00026801136162977833, "loss": 0.0258, "step": 42270 }, { "epoch": 0.21, "learning_rate": 0.0002680037939367643, "loss": 0.0204, "step": 42280 }, { "epoch": 0.21, "learning_rate": 0.0002679962262437503, "loss": 0.023, "step": 42290 }, { "epoch": 0.21, "learning_rate": 0.0002679886585507363, "loss": 0.0242, "step": 42300 }, { "epoch": 0.21, "learning_rate": 0.0002679810908577223, "loss": 0.0187, "step": 42310 }, { "epoch": 0.21, "learning_rate": 0.0002679735231647083, "loss": 0.019, "step": 42320 }, { "epoch": 0.21, "learning_rate": 0.0002679659554716943, "loss": 0.0214, "step": 42330 }, { "epoch": 0.21, "learning_rate": 0.00026795838777868026, "loss": 0.0222, "step": 42340 }, { "epoch": 0.21, "learning_rate": 0.00026795082008566624, "loss": 0.0202, "step": 42350 }, { "epoch": 0.21, "learning_rate": 0.0002679432523926522, "loss": 0.0223, "step": 42360 }, { "epoch": 0.21, "learning_rate": 0.00026793568469963826, "loss": 0.0238, "step": 42370 }, { "epoch": 0.21, "learning_rate": 0.00026792811700662424, "loss": 0.0199, "step": 42380 }, { "epoch": 0.21, "learning_rate": 0.0002679205493136102, "loss": 0.021, "step": 42390 }, { "epoch": 0.21, "learning_rate": 0.0002679129816205962, "loss": 0.0234, "step": 42400 }, { "epoch": 0.21, "learning_rate": 0.0002679054139275822, "loss": 0.0234, "step": 42410 }, { "epoch": 0.21, "learning_rate": 0.00026789784623456816, "loss": 0.0229, "step": 42420 }, { "epoch": 0.21, "learning_rate": 0.00026789027854155415, "loss": 0.0213, "step": 42430 }, { "epoch": 0.21, "learning_rate": 0.0002678827108485402, "loss": 0.0188, "step": 42440 }, { "epoch": 0.21, "learning_rate": 0.00026787514315552616, "loss": 0.0209, "step": 42450 }, { "epoch": 0.21, "learning_rate": 0.00026786757546251214, "loss": 0.0246, "step": 42460 }, { "epoch": 0.21, "learning_rate": 0.0002678600077694981, "loss": 0.0231, "step": 42470 }, { "epoch": 0.21, "learning_rate": 0.0002678524400764841, "loss": 0.0214, "step": 42480 }, { "epoch": 0.21, "learning_rate": 0.0002678448723834701, "loss": 0.0195, "step": 42490 }, { "epoch": 0.21, "learning_rate": 0.0002678373046904561, "loss": 0.0219, "step": 42500 }, { "epoch": 0.21, "learning_rate": 0.0002678297369974421, "loss": 0.0203, "step": 42510 }, { "epoch": 0.21, "learning_rate": 0.0002678221693044281, "loss": 0.0226, "step": 42520 }, { "epoch": 0.21, "learning_rate": 0.00026781460161141407, "loss": 0.0229, "step": 42530 }, { "epoch": 0.21, "learning_rate": 0.00026780703391840005, "loss": 0.0261, "step": 42540 }, { "epoch": 0.21, "learning_rate": 0.00026779946622538603, "loss": 0.0243, "step": 42550 }, { "epoch": 0.21, "learning_rate": 0.00026779189853237207, "loss": 0.0204, "step": 42560 }, { "epoch": 0.21, "learning_rate": 0.00026778433083935805, "loss": 0.0246, "step": 42570 }, { "epoch": 0.21, "learning_rate": 0.00026777676314634403, "loss": 0.0189, "step": 42580 }, { "epoch": 0.21, "learning_rate": 0.00026776919545333, "loss": 0.0214, "step": 42590 }, { "epoch": 0.21, "learning_rate": 0.000267761627760316, "loss": 0.022, "step": 42600 }, { "epoch": 0.21, "learning_rate": 0.000267754060067302, "loss": 0.0232, "step": 42610 }, { "epoch": 0.22, "learning_rate": 0.00026774649237428796, "loss": 0.022, "step": 42620 }, { "epoch": 0.22, "learning_rate": 0.000267738924681274, "loss": 0.0212, "step": 42630 }, { "epoch": 0.22, "learning_rate": 0.00026773135698825997, "loss": 0.0227, "step": 42640 }, { "epoch": 0.22, "learning_rate": 0.00026772378929524595, "loss": 0.0223, "step": 42650 }, { "epoch": 0.22, "learning_rate": 0.00026771622160223194, "loss": 0.022, "step": 42660 }, { "epoch": 0.22, "learning_rate": 0.0002677086539092179, "loss": 0.0231, "step": 42670 }, { "epoch": 0.22, "learning_rate": 0.0002677010862162039, "loss": 0.0209, "step": 42680 }, { "epoch": 0.22, "learning_rate": 0.00026769351852318993, "loss": 0.0256, "step": 42690 }, { "epoch": 0.22, "learning_rate": 0.0002676859508301759, "loss": 0.0274, "step": 42700 }, { "epoch": 0.22, "learning_rate": 0.0002676783831371619, "loss": 0.024, "step": 42710 }, { "epoch": 0.22, "learning_rate": 0.0002676708154441479, "loss": 0.0265, "step": 42720 }, { "epoch": 0.22, "learning_rate": 0.00026766324775113386, "loss": 0.0192, "step": 42730 }, { "epoch": 0.22, "learning_rate": 0.00026765568005811984, "loss": 0.0212, "step": 42740 }, { "epoch": 0.22, "learning_rate": 0.0002676481123651058, "loss": 0.0235, "step": 42750 }, { "epoch": 0.22, "learning_rate": 0.00026764054467209186, "loss": 0.0211, "step": 42760 }, { "epoch": 0.22, "learning_rate": 0.00026763297697907784, "loss": 0.0212, "step": 42770 }, { "epoch": 0.22, "learning_rate": 0.0002676254092860638, "loss": 0.022, "step": 42780 }, { "epoch": 0.22, "learning_rate": 0.0002676178415930498, "loss": 0.0222, "step": 42790 }, { "epoch": 0.22, "learning_rate": 0.0002676102739000358, "loss": 0.0208, "step": 42800 }, { "epoch": 0.22, "learning_rate": 0.00026760270620702177, "loss": 0.0224, "step": 42810 }, { "epoch": 0.22, "learning_rate": 0.0002675951385140078, "loss": 0.0195, "step": 42820 }, { "epoch": 0.22, "learning_rate": 0.0002675875708209938, "loss": 0.0269, "step": 42830 }, { "epoch": 0.22, "learning_rate": 0.00026758000312797976, "loss": 0.0266, "step": 42840 }, { "epoch": 0.22, "learning_rate": 0.00026757243543496575, "loss": 0.0244, "step": 42850 }, { "epoch": 0.22, "learning_rate": 0.00026756486774195173, "loss": 0.0231, "step": 42860 }, { "epoch": 0.22, "learning_rate": 0.0002675573000489377, "loss": 0.0253, "step": 42870 }, { "epoch": 0.22, "learning_rate": 0.00026754973235592374, "loss": 0.0207, "step": 42880 }, { "epoch": 0.22, "learning_rate": 0.0002675421646629097, "loss": 0.0204, "step": 42890 }, { "epoch": 0.22, "learning_rate": 0.0002675345969698957, "loss": 0.0212, "step": 42900 }, { "epoch": 0.22, "learning_rate": 0.0002675270292768817, "loss": 0.0285, "step": 42910 }, { "epoch": 0.22, "learning_rate": 0.00026751946158386767, "loss": 0.0214, "step": 42920 }, { "epoch": 0.22, "learning_rate": 0.00026751189389085365, "loss": 0.0294, "step": 42930 }, { "epoch": 0.22, "learning_rate": 0.00026750432619783963, "loss": 0.0213, "step": 42940 }, { "epoch": 0.22, "learning_rate": 0.00026749675850482567, "loss": 0.0254, "step": 42950 }, { "epoch": 0.22, "learning_rate": 0.00026748919081181165, "loss": 0.0196, "step": 42960 }, { "epoch": 0.22, "learning_rate": 0.00026748162311879763, "loss": 0.0287, "step": 42970 }, { "epoch": 0.22, "learning_rate": 0.0002674740554257836, "loss": 0.0214, "step": 42980 }, { "epoch": 0.22, "learning_rate": 0.0002674664877327696, "loss": 0.0244, "step": 42990 }, { "epoch": 0.22, "learning_rate": 0.0002674589200397556, "loss": 0.024, "step": 43000 }, { "epoch": 0.22, "eval_cer": 0.9144954862024227, "eval_loss": 0.01679139770567417, "eval_runtime": 117.1853, "eval_samples_per_second": 17.067, "eval_steps_per_second": 4.267, "step": 43000 }, { "epoch": 0.22, "learning_rate": 0.0002674513523467416, "loss": 0.0234, "step": 43010 }, { "epoch": 0.22, "learning_rate": 0.0002674437846537276, "loss": 0.0265, "step": 43020 }, { "epoch": 0.22, "learning_rate": 0.0002674362169607136, "loss": 0.0239, "step": 43030 }, { "epoch": 0.22, "learning_rate": 0.00026742864926769956, "loss": 0.0224, "step": 43040 }, { "epoch": 0.22, "learning_rate": 0.00026742108157468554, "loss": 0.0224, "step": 43050 }, { "epoch": 0.22, "learning_rate": 0.0002674135138816715, "loss": 0.0209, "step": 43060 }, { "epoch": 0.22, "learning_rate": 0.00026740594618865755, "loss": 0.0221, "step": 43070 }, { "epoch": 0.22, "learning_rate": 0.00026739837849564354, "loss": 0.0219, "step": 43080 }, { "epoch": 0.22, "learning_rate": 0.0002673908108026295, "loss": 0.02, "step": 43090 }, { "epoch": 0.22, "learning_rate": 0.0002673832431096155, "loss": 0.0235, "step": 43100 }, { "epoch": 0.22, "learning_rate": 0.0002673756754166015, "loss": 0.0226, "step": 43110 }, { "epoch": 0.22, "learning_rate": 0.00026736810772358746, "loss": 0.0228, "step": 43120 }, { "epoch": 0.22, "learning_rate": 0.00026736054003057344, "loss": 0.0192, "step": 43130 }, { "epoch": 0.22, "learning_rate": 0.0002673529723375595, "loss": 0.022, "step": 43140 }, { "epoch": 0.22, "learning_rate": 0.00026734540464454546, "loss": 0.0229, "step": 43150 }, { "epoch": 0.22, "learning_rate": 0.00026733783695153144, "loss": 0.0224, "step": 43160 }, { "epoch": 0.22, "learning_rate": 0.0002673302692585174, "loss": 0.021, "step": 43170 }, { "epoch": 0.22, "learning_rate": 0.0002673227015655034, "loss": 0.025, "step": 43180 }, { "epoch": 0.22, "learning_rate": 0.0002673151338724894, "loss": 0.0229, "step": 43190 }, { "epoch": 0.22, "learning_rate": 0.0002673075661794754, "loss": 0.0237, "step": 43200 }, { "epoch": 0.22, "learning_rate": 0.0002672999984864614, "loss": 0.0209, "step": 43210 }, { "epoch": 0.22, "learning_rate": 0.0002672924307934474, "loss": 0.021, "step": 43220 }, { "epoch": 0.22, "learning_rate": 0.00026728486310043337, "loss": 0.0237, "step": 43230 }, { "epoch": 0.22, "learning_rate": 0.00026727729540741935, "loss": 0.0241, "step": 43240 }, { "epoch": 0.22, "learning_rate": 0.00026726972771440533, "loss": 0.0254, "step": 43250 }, { "epoch": 0.22, "learning_rate": 0.0002672621600213913, "loss": 0.0236, "step": 43260 }, { "epoch": 0.22, "learning_rate": 0.00026725459232837735, "loss": 0.0281, "step": 43270 }, { "epoch": 0.22, "learning_rate": 0.00026724702463536333, "loss": 0.023, "step": 43280 }, { "epoch": 0.22, "learning_rate": 0.0002672394569423493, "loss": 0.023, "step": 43290 }, { "epoch": 0.22, "learning_rate": 0.0002672318892493353, "loss": 0.0235, "step": 43300 }, { "epoch": 0.22, "learning_rate": 0.00026722432155632127, "loss": 0.0212, "step": 43310 }, { "epoch": 0.22, "learning_rate": 0.00026721675386330725, "loss": 0.0237, "step": 43320 }, { "epoch": 0.22, "learning_rate": 0.0002672091861702933, "loss": 0.0194, "step": 43330 }, { "epoch": 0.22, "learning_rate": 0.00026720161847727927, "loss": 0.0216, "step": 43340 }, { "epoch": 0.22, "learning_rate": 0.00026719405078426525, "loss": 0.0227, "step": 43350 }, { "epoch": 0.22, "learning_rate": 0.00026718648309125123, "loss": 0.0219, "step": 43360 }, { "epoch": 0.22, "learning_rate": 0.0002671789153982372, "loss": 0.0226, "step": 43370 }, { "epoch": 0.22, "learning_rate": 0.0002671713477052232, "loss": 0.0236, "step": 43380 }, { "epoch": 0.22, "learning_rate": 0.0002671637800122092, "loss": 0.0223, "step": 43390 }, { "epoch": 0.22, "learning_rate": 0.00026715621231919516, "loss": 0.0216, "step": 43400 }, { "epoch": 0.22, "learning_rate": 0.00026714864462618114, "loss": 0.0199, "step": 43410 }, { "epoch": 0.22, "learning_rate": 0.0002671410769331671, "loss": 0.0257, "step": 43420 }, { "epoch": 0.22, "learning_rate": 0.00026713350924015316, "loss": 0.0252, "step": 43430 }, { "epoch": 0.22, "learning_rate": 0.00026712594154713914, "loss": 0.023, "step": 43440 }, { "epoch": 0.22, "learning_rate": 0.0002671183738541251, "loss": 0.0199, "step": 43450 }, { "epoch": 0.22, "learning_rate": 0.0002671108061611111, "loss": 0.0217, "step": 43460 }, { "epoch": 0.22, "learning_rate": 0.0002671032384680971, "loss": 0.0195, "step": 43470 }, { "epoch": 0.22, "learning_rate": 0.00026709567077508306, "loss": 0.0232, "step": 43480 }, { "epoch": 0.22, "learning_rate": 0.00026708810308206905, "loss": 0.0198, "step": 43490 }, { "epoch": 0.22, "learning_rate": 0.0002670805353890551, "loss": 0.0285, "step": 43500 }, { "epoch": 0.22, "learning_rate": 0.00026707296769604106, "loss": 0.0255, "step": 43510 }, { "epoch": 0.22, "learning_rate": 0.00026706540000302704, "loss": 0.0238, "step": 43520 }, { "epoch": 0.22, "learning_rate": 0.000267057832310013, "loss": 0.022, "step": 43530 }, { "epoch": 0.22, "learning_rate": 0.000267050264616999, "loss": 0.0227, "step": 43540 }, { "epoch": 0.22, "learning_rate": 0.000267042696923985, "loss": 0.0226, "step": 43550 }, { "epoch": 0.22, "learning_rate": 0.000267035129230971, "loss": 0.0207, "step": 43560 }, { "epoch": 0.22, "learning_rate": 0.000267027561537957, "loss": 0.0234, "step": 43570 }, { "epoch": 0.22, "learning_rate": 0.000267019993844943, "loss": 0.0204, "step": 43580 }, { "epoch": 0.22, "learning_rate": 0.00026701242615192897, "loss": 0.0212, "step": 43590 }, { "epoch": 0.22, "learning_rate": 0.00026700485845891495, "loss": 0.022, "step": 43600 }, { "epoch": 0.22, "learning_rate": 0.00026699729076590093, "loss": 0.0504, "step": 43610 }, { "epoch": 0.22, "learning_rate": 0.00026698972307288697, "loss": 0.0199, "step": 43620 }, { "epoch": 0.22, "learning_rate": 0.00026698215537987295, "loss": 0.0281, "step": 43630 }, { "epoch": 0.22, "learning_rate": 0.00026697458768685893, "loss": 0.0217, "step": 43640 }, { "epoch": 0.22, "learning_rate": 0.0002669670199938449, "loss": 0.0236, "step": 43650 }, { "epoch": 0.22, "learning_rate": 0.0002669594523008309, "loss": 0.0211, "step": 43660 }, { "epoch": 0.22, "learning_rate": 0.0002669518846078169, "loss": 0.0208, "step": 43670 }, { "epoch": 0.22, "learning_rate": 0.00026694431691480286, "loss": 0.0253, "step": 43680 }, { "epoch": 0.22, "learning_rate": 0.0002669367492217889, "loss": 0.0202, "step": 43690 }, { "epoch": 0.22, "learning_rate": 0.0002669291815287749, "loss": 0.0228, "step": 43700 }, { "epoch": 0.22, "learning_rate": 0.00026692161383576085, "loss": 0.0259, "step": 43710 }, { "epoch": 0.22, "learning_rate": 0.00026691404614274684, "loss": 0.0252, "step": 43720 }, { "epoch": 0.22, "learning_rate": 0.0002669064784497328, "loss": 0.0236, "step": 43730 }, { "epoch": 0.22, "learning_rate": 0.0002668989107567188, "loss": 0.0253, "step": 43740 }, { "epoch": 0.22, "learning_rate": 0.00026689134306370483, "loss": 0.0205, "step": 43750 }, { "epoch": 0.22, "learning_rate": 0.0002668837753706908, "loss": 0.0192, "step": 43760 }, { "epoch": 0.22, "learning_rate": 0.0002668762076776768, "loss": 0.0189, "step": 43770 }, { "epoch": 0.22, "learning_rate": 0.0002668686399846628, "loss": 0.0208, "step": 43780 }, { "epoch": 0.22, "learning_rate": 0.00026686107229164876, "loss": 0.021, "step": 43790 }, { "epoch": 0.22, "learning_rate": 0.00026685350459863474, "loss": 0.0204, "step": 43800 }, { "epoch": 0.22, "learning_rate": 0.0002668459369056207, "loss": 0.021, "step": 43810 }, { "epoch": 0.22, "learning_rate": 0.00026683836921260676, "loss": 0.0225, "step": 43820 }, { "epoch": 0.22, "learning_rate": 0.00026683080151959274, "loss": 0.0263, "step": 43830 }, { "epoch": 0.22, "learning_rate": 0.0002668232338265787, "loss": 0.0205, "step": 43840 }, { "epoch": 0.22, "learning_rate": 0.0002668156661335647, "loss": 0.0266, "step": 43850 }, { "epoch": 0.22, "learning_rate": 0.0002668080984405507, "loss": 0.0246, "step": 43860 }, { "epoch": 0.22, "learning_rate": 0.00026680053074753667, "loss": 0.023, "step": 43870 }, { "epoch": 0.22, "learning_rate": 0.0002667929630545227, "loss": 0.0242, "step": 43880 }, { "epoch": 0.22, "learning_rate": 0.0002667853953615087, "loss": 0.0225, "step": 43890 }, { "epoch": 0.22, "learning_rate": 0.00026677782766849466, "loss": 0.0233, "step": 43900 }, { "epoch": 0.22, "learning_rate": 0.00026677025997548065, "loss": 0.0208, "step": 43910 }, { "epoch": 0.22, "learning_rate": 0.00026676269228246663, "loss": 0.0248, "step": 43920 }, { "epoch": 0.22, "learning_rate": 0.0002667551245894526, "loss": 0.0218, "step": 43930 }, { "epoch": 0.22, "learning_rate": 0.00026674755689643864, "loss": 0.02, "step": 43940 }, { "epoch": 0.22, "learning_rate": 0.0002667399892034246, "loss": 0.0161, "step": 43950 }, { "epoch": 0.22, "learning_rate": 0.0002667324215104106, "loss": 0.0226, "step": 43960 }, { "epoch": 0.22, "learning_rate": 0.0002667248538173966, "loss": 0.0182, "step": 43970 }, { "epoch": 0.22, "learning_rate": 0.00026671728612438257, "loss": 0.0228, "step": 43980 }, { "epoch": 0.22, "learning_rate": 0.00026670971843136855, "loss": 0.0189, "step": 43990 }, { "epoch": 0.22, "learning_rate": 0.00026670215073835453, "loss": 0.0206, "step": 44000 }, { "epoch": 0.22, "eval_cer": 0.914452788772905, "eval_loss": 0.01625337265431881, "eval_runtime": 117.269, "eval_samples_per_second": 17.055, "eval_steps_per_second": 4.264, "step": 44000 }, { "epoch": 0.22, "learning_rate": 0.00026669458304534057, "loss": 0.0252, "step": 44010 }, { "epoch": 0.22, "learning_rate": 0.00026668701535232655, "loss": 0.026, "step": 44020 }, { "epoch": 0.22, "learning_rate": 0.00026667944765931253, "loss": 0.0212, "step": 44030 }, { "epoch": 0.22, "learning_rate": 0.0002666718799662985, "loss": 0.0205, "step": 44040 }, { "epoch": 0.22, "learning_rate": 0.0002666643122732845, "loss": 0.0271, "step": 44050 }, { "epoch": 0.22, "learning_rate": 0.0002666567445802705, "loss": 0.0234, "step": 44060 }, { "epoch": 0.22, "learning_rate": 0.0002666491768872565, "loss": 0.0242, "step": 44070 }, { "epoch": 0.22, "learning_rate": 0.0002666416091942425, "loss": 0.0203, "step": 44080 }, { "epoch": 0.22, "learning_rate": 0.0002666340415012285, "loss": 0.0196, "step": 44090 }, { "epoch": 0.22, "learning_rate": 0.00026662647380821446, "loss": 0.0214, "step": 44100 }, { "epoch": 0.22, "learning_rate": 0.00026661890611520044, "loss": 0.0276, "step": 44110 }, { "epoch": 0.22, "learning_rate": 0.0002666113384221864, "loss": 0.0215, "step": 44120 }, { "epoch": 0.22, "learning_rate": 0.00026660377072917245, "loss": 0.0233, "step": 44130 }, { "epoch": 0.22, "learning_rate": 0.00026659620303615844, "loss": 0.0246, "step": 44140 }, { "epoch": 0.22, "learning_rate": 0.0002665886353431444, "loss": 0.0191, "step": 44150 }, { "epoch": 0.22, "learning_rate": 0.0002665810676501304, "loss": 0.0241, "step": 44160 }, { "epoch": 0.22, "learning_rate": 0.0002665734999571164, "loss": 0.0196, "step": 44170 }, { "epoch": 0.22, "learning_rate": 0.00026656593226410236, "loss": 0.0297, "step": 44180 }, { "epoch": 0.22, "learning_rate": 0.00026655836457108834, "loss": 0.0272, "step": 44190 }, { "epoch": 0.22, "learning_rate": 0.0002665507968780744, "loss": 0.0298, "step": 44200 }, { "epoch": 0.22, "learning_rate": 0.00026654322918506036, "loss": 0.0241, "step": 44210 }, { "epoch": 0.22, "learning_rate": 0.00026653566149204634, "loss": 0.0249, "step": 44220 }, { "epoch": 0.22, "learning_rate": 0.0002665280937990323, "loss": 0.0265, "step": 44230 }, { "epoch": 0.22, "learning_rate": 0.0002665205261060183, "loss": 0.021, "step": 44240 }, { "epoch": 0.22, "learning_rate": 0.0002665129584130043, "loss": 0.0226, "step": 44250 }, { "epoch": 0.22, "learning_rate": 0.0002665053907199903, "loss": 0.023, "step": 44260 }, { "epoch": 0.22, "learning_rate": 0.0002664978230269763, "loss": 0.0364, "step": 44270 }, { "epoch": 0.22, "learning_rate": 0.0002664902553339623, "loss": 0.0259, "step": 44280 }, { "epoch": 0.22, "learning_rate": 0.00026648268764094827, "loss": 0.0238, "step": 44290 }, { "epoch": 0.22, "learning_rate": 0.00026647511994793425, "loss": 0.0234, "step": 44300 }, { "epoch": 0.22, "learning_rate": 0.00026646755225492023, "loss": 0.0217, "step": 44310 }, { "epoch": 0.22, "learning_rate": 0.0002664599845619062, "loss": 0.0233, "step": 44320 }, { "epoch": 0.22, "learning_rate": 0.00026645241686889225, "loss": 0.023, "step": 44330 }, { "epoch": 0.22, "learning_rate": 0.00026644484917587823, "loss": 0.0219, "step": 44340 }, { "epoch": 0.22, "learning_rate": 0.0002664372814828642, "loss": 0.0251, "step": 44350 }, { "epoch": 0.22, "learning_rate": 0.0002664297137898502, "loss": 0.0248, "step": 44360 }, { "epoch": 0.22, "learning_rate": 0.00026642214609683617, "loss": 0.023, "step": 44370 }, { "epoch": 0.22, "learning_rate": 0.00026641457840382215, "loss": 0.0293, "step": 44380 }, { "epoch": 0.22, "learning_rate": 0.0002664070107108082, "loss": 0.0262, "step": 44390 }, { "epoch": 0.22, "learning_rate": 0.00026639944301779417, "loss": 0.0255, "step": 44400 }, { "epoch": 0.22, "learning_rate": 0.00026639187532478015, "loss": 0.024, "step": 44410 }, { "epoch": 0.22, "learning_rate": 0.00026638430763176613, "loss": 0.0228, "step": 44420 }, { "epoch": 0.22, "learning_rate": 0.0002663767399387521, "loss": 0.0215, "step": 44430 }, { "epoch": 0.22, "learning_rate": 0.0002663691722457381, "loss": 0.0208, "step": 44440 }, { "epoch": 0.22, "learning_rate": 0.00026636160455272413, "loss": 0.0209, "step": 44450 }, { "epoch": 0.22, "learning_rate": 0.0002663540368597101, "loss": 0.0235, "step": 44460 }, { "epoch": 0.22, "learning_rate": 0.0002663464691666961, "loss": 0.026, "step": 44470 }, { "epoch": 0.22, "learning_rate": 0.0002663389014736821, "loss": 0.0173, "step": 44480 }, { "epoch": 0.22, "learning_rate": 0.00026633133378066806, "loss": 0.0225, "step": 44490 }, { "epoch": 0.22, "learning_rate": 0.00026632376608765404, "loss": 0.0256, "step": 44500 }, { "epoch": 0.22, "learning_rate": 0.00026631619839464, "loss": 0.0221, "step": 44510 }, { "epoch": 0.22, "learning_rate": 0.00026630863070162606, "loss": 0.0248, "step": 44520 }, { "epoch": 0.22, "learning_rate": 0.00026630106300861204, "loss": 0.0199, "step": 44530 }, { "epoch": 0.22, "learning_rate": 0.000266293495315598, "loss": 0.0219, "step": 44540 }, { "epoch": 0.22, "learning_rate": 0.000266285927622584, "loss": 0.0223, "step": 44550 }, { "epoch": 0.22, "learning_rate": 0.00026627835992957, "loss": 0.0214, "step": 44560 }, { "epoch": 0.22, "learning_rate": 0.00026627079223655596, "loss": 0.027, "step": 44570 }, { "epoch": 0.22, "learning_rate": 0.000266263224543542, "loss": 0.0207, "step": 44580 }, { "epoch": 0.22, "learning_rate": 0.000266255656850528, "loss": 0.0189, "step": 44590 }, { "epoch": 0.23, "learning_rate": 0.00026624808915751396, "loss": 0.0237, "step": 44600 }, { "epoch": 0.23, "learning_rate": 0.00026624052146449994, "loss": 0.0242, "step": 44610 }, { "epoch": 0.23, "learning_rate": 0.0002662329537714859, "loss": 0.0203, "step": 44620 }, { "epoch": 0.23, "learning_rate": 0.0002662253860784719, "loss": 0.025, "step": 44630 }, { "epoch": 0.23, "learning_rate": 0.0002662178183854579, "loss": 0.0227, "step": 44640 }, { "epoch": 0.23, "learning_rate": 0.00026621025069244387, "loss": 0.0208, "step": 44650 }, { "epoch": 0.23, "learning_rate": 0.00026620268299942985, "loss": 0.0214, "step": 44660 }, { "epoch": 0.23, "learning_rate": 0.00026619511530641583, "loss": 0.0225, "step": 44670 }, { "epoch": 0.23, "learning_rate": 0.00026618754761340187, "loss": 0.0193, "step": 44680 }, { "epoch": 0.23, "learning_rate": 0.00026617997992038785, "loss": 0.0233, "step": 44690 }, { "epoch": 0.23, "learning_rate": 0.00026617241222737383, "loss": 0.0205, "step": 44700 }, { "epoch": 0.23, "learning_rate": 0.0002661648445343598, "loss": 0.0236, "step": 44710 }, { "epoch": 0.23, "learning_rate": 0.0002661572768413458, "loss": 0.0216, "step": 44720 }, { "epoch": 0.23, "learning_rate": 0.0002661497091483318, "loss": 0.0232, "step": 44730 }, { "epoch": 0.23, "learning_rate": 0.00026614214145531776, "loss": 0.0252, "step": 44740 }, { "epoch": 0.23, "learning_rate": 0.0002661345737623038, "loss": 0.0228, "step": 44750 }, { "epoch": 0.23, "learning_rate": 0.0002661270060692898, "loss": 0.0239, "step": 44760 }, { "epoch": 0.23, "learning_rate": 0.00026611943837627575, "loss": 0.0185, "step": 44770 }, { "epoch": 0.23, "learning_rate": 0.00026611187068326174, "loss": 0.0217, "step": 44780 }, { "epoch": 0.23, "learning_rate": 0.0002661043029902477, "loss": 0.0229, "step": 44790 }, { "epoch": 0.23, "learning_rate": 0.0002660967352972337, "loss": 0.0223, "step": 44800 }, { "epoch": 0.23, "learning_rate": 0.00026608916760421973, "loss": 0.0278, "step": 44810 }, { "epoch": 0.23, "learning_rate": 0.0002660815999112057, "loss": 0.0196, "step": 44820 }, { "epoch": 0.23, "learning_rate": 0.0002660740322181917, "loss": 0.0175, "step": 44830 }, { "epoch": 0.23, "learning_rate": 0.0002660664645251777, "loss": 0.0179, "step": 44840 }, { "epoch": 0.23, "learning_rate": 0.00026605889683216366, "loss": 0.0223, "step": 44850 }, { "epoch": 0.23, "learning_rate": 0.00026605132913914964, "loss": 0.0259, "step": 44860 }, { "epoch": 0.23, "learning_rate": 0.0002660437614461356, "loss": 0.0212, "step": 44870 }, { "epoch": 0.23, "learning_rate": 0.00026603619375312166, "loss": 0.0186, "step": 44880 }, { "epoch": 0.23, "learning_rate": 0.00026602862606010764, "loss": 0.024, "step": 44890 }, { "epoch": 0.23, "learning_rate": 0.0002660210583670936, "loss": 0.0233, "step": 44900 }, { "epoch": 0.23, "learning_rate": 0.0002660134906740796, "loss": 0.0251, "step": 44910 }, { "epoch": 0.23, "learning_rate": 0.0002660059229810656, "loss": 0.0229, "step": 44920 }, { "epoch": 0.23, "learning_rate": 0.00026599835528805157, "loss": 0.0251, "step": 44930 }, { "epoch": 0.23, "learning_rate": 0.0002659907875950376, "loss": 0.02, "step": 44940 }, { "epoch": 0.23, "learning_rate": 0.0002659832199020236, "loss": 0.0213, "step": 44950 }, { "epoch": 0.23, "learning_rate": 0.00026597565220900956, "loss": 0.0212, "step": 44960 }, { "epoch": 0.23, "learning_rate": 0.00026596808451599555, "loss": 0.0219, "step": 44970 }, { "epoch": 0.23, "learning_rate": 0.00026596051682298153, "loss": 0.026, "step": 44980 }, { "epoch": 0.23, "learning_rate": 0.0002659529491299675, "loss": 0.0202, "step": 44990 }, { "epoch": 0.23, "learning_rate": 0.00026594538143695354, "loss": 0.024, "step": 45000 }, { "epoch": 0.23, "eval_cer": 0.9144896638256703, "eval_loss": 0.016492534428834915, "eval_runtime": 117.0086, "eval_samples_per_second": 17.093, "eval_steps_per_second": 4.273, "step": 45000 }, { "epoch": 0.23, "learning_rate": 0.0002659378137439395, "loss": 0.0231, "step": 45010 }, { "epoch": 0.23, "learning_rate": 0.0002659302460509255, "loss": 0.0235, "step": 45020 }, { "epoch": 0.23, "learning_rate": 0.0002659226783579115, "loss": 0.0237, "step": 45030 }, { "epoch": 0.23, "learning_rate": 0.00026591511066489747, "loss": 0.0202, "step": 45040 }, { "epoch": 0.23, "learning_rate": 0.00026590754297188345, "loss": 0.0213, "step": 45050 }, { "epoch": 0.23, "learning_rate": 0.00026589997527886943, "loss": 0.019, "step": 45060 }, { "epoch": 0.23, "learning_rate": 0.00026589240758585547, "loss": 0.0231, "step": 45070 }, { "epoch": 0.23, "learning_rate": 0.00026588483989284145, "loss": 0.0309, "step": 45080 }, { "epoch": 0.23, "learning_rate": 0.00026587727219982743, "loss": 0.0219, "step": 45090 }, { "epoch": 0.23, "learning_rate": 0.0002658697045068134, "loss": 0.0226, "step": 45100 }, { "epoch": 0.23, "learning_rate": 0.0002658621368137994, "loss": 0.0203, "step": 45110 }, { "epoch": 0.23, "learning_rate": 0.0002658545691207854, "loss": 0.0228, "step": 45120 }, { "epoch": 0.23, "learning_rate": 0.0002658470014277714, "loss": 0.0229, "step": 45130 }, { "epoch": 0.23, "learning_rate": 0.0002658394337347574, "loss": 0.0204, "step": 45140 }, { "epoch": 0.23, "learning_rate": 0.0002658318660417434, "loss": 0.0221, "step": 45150 }, { "epoch": 0.23, "learning_rate": 0.00026582429834872936, "loss": 0.022, "step": 45160 }, { "epoch": 0.23, "learning_rate": 0.00026581673065571534, "loss": 0.0216, "step": 45170 }, { "epoch": 0.23, "learning_rate": 0.0002658091629627013, "loss": 0.0224, "step": 45180 }, { "epoch": 0.23, "learning_rate": 0.00026580159526968735, "loss": 0.0237, "step": 45190 }, { "epoch": 0.23, "learning_rate": 0.00026579402757667334, "loss": 0.0245, "step": 45200 }, { "epoch": 0.23, "learning_rate": 0.0002657864598836593, "loss": 0.023, "step": 45210 }, { "epoch": 0.23, "learning_rate": 0.0002657788921906453, "loss": 0.027, "step": 45220 }, { "epoch": 0.23, "learning_rate": 0.0002657713244976313, "loss": 0.0214, "step": 45230 }, { "epoch": 0.23, "learning_rate": 0.00026576375680461726, "loss": 0.0209, "step": 45240 }, { "epoch": 0.23, "learning_rate": 0.00026575618911160324, "loss": 0.0208, "step": 45250 }, { "epoch": 0.23, "learning_rate": 0.0002657486214185893, "loss": 0.0224, "step": 45260 }, { "epoch": 0.23, "learning_rate": 0.00026574105372557526, "loss": 0.024, "step": 45270 }, { "epoch": 0.23, "learning_rate": 0.00026573348603256124, "loss": 0.0253, "step": 45280 }, { "epoch": 0.23, "learning_rate": 0.0002657259183395472, "loss": 0.0235, "step": 45290 }, { "epoch": 0.23, "learning_rate": 0.0002657183506465332, "loss": 0.0219, "step": 45300 }, { "epoch": 0.23, "learning_rate": 0.0002657107829535192, "loss": 0.0227, "step": 45310 }, { "epoch": 0.23, "learning_rate": 0.0002657032152605052, "loss": 0.0265, "step": 45320 }, { "epoch": 0.23, "learning_rate": 0.0002656956475674912, "loss": 0.0194, "step": 45330 }, { "epoch": 0.23, "learning_rate": 0.0002656880798744772, "loss": 0.0212, "step": 45340 }, { "epoch": 0.23, "learning_rate": 0.00026568051218146317, "loss": 0.0228, "step": 45350 }, { "epoch": 0.23, "learning_rate": 0.00026567294448844915, "loss": 0.0227, "step": 45360 }, { "epoch": 0.23, "learning_rate": 0.00026566537679543513, "loss": 0.0268, "step": 45370 }, { "epoch": 0.23, "learning_rate": 0.0002656578091024211, "loss": 0.0272, "step": 45380 }, { "epoch": 0.23, "learning_rate": 0.00026565024140940715, "loss": 0.021, "step": 45390 }, { "epoch": 0.23, "learning_rate": 0.00026564267371639313, "loss": 0.0236, "step": 45400 }, { "epoch": 0.23, "learning_rate": 0.0002656351060233791, "loss": 0.024, "step": 45410 }, { "epoch": 0.23, "learning_rate": 0.0002656275383303651, "loss": 0.022, "step": 45420 }, { "epoch": 0.23, "learning_rate": 0.00026561997063735107, "loss": 0.0226, "step": 45430 }, { "epoch": 0.23, "learning_rate": 0.00026561240294433705, "loss": 0.0266, "step": 45440 }, { "epoch": 0.23, "learning_rate": 0.0002656048352513231, "loss": 0.0282, "step": 45450 }, { "epoch": 0.23, "learning_rate": 0.00026559726755830907, "loss": 0.0231, "step": 45460 }, { "epoch": 0.23, "learning_rate": 0.00026558969986529505, "loss": 0.0223, "step": 45470 }, { "epoch": 0.23, "learning_rate": 0.00026558213217228103, "loss": 0.0209, "step": 45480 }, { "epoch": 0.23, "learning_rate": 0.000265574564479267, "loss": 0.0216, "step": 45490 }, { "epoch": 0.23, "learning_rate": 0.000265566996786253, "loss": 0.0232, "step": 45500 }, { "epoch": 0.23, "learning_rate": 0.00026555942909323903, "loss": 0.0253, "step": 45510 }, { "epoch": 0.23, "learning_rate": 0.000265551861400225, "loss": 0.0236, "step": 45520 }, { "epoch": 0.23, "learning_rate": 0.000265544293707211, "loss": 0.0222, "step": 45530 }, { "epoch": 0.23, "learning_rate": 0.000265536726014197, "loss": 0.0205, "step": 45540 }, { "epoch": 0.23, "learning_rate": 0.00026552915832118296, "loss": 0.0195, "step": 45550 }, { "epoch": 0.23, "learning_rate": 0.00026552159062816894, "loss": 0.0212, "step": 45560 }, { "epoch": 0.23, "learning_rate": 0.0002655140229351549, "loss": 0.0227, "step": 45570 }, { "epoch": 0.23, "learning_rate": 0.00026550645524214096, "loss": 0.0243, "step": 45580 }, { "epoch": 0.23, "learning_rate": 0.00026549888754912694, "loss": 0.0207, "step": 45590 }, { "epoch": 0.23, "learning_rate": 0.0002654913198561129, "loss": 0.0222, "step": 45600 }, { "epoch": 0.23, "learning_rate": 0.0002654837521630989, "loss": 0.0198, "step": 45610 }, { "epoch": 0.23, "learning_rate": 0.0002654761844700849, "loss": 0.0216, "step": 45620 }, { "epoch": 0.23, "learning_rate": 0.00026546861677707086, "loss": 0.0186, "step": 45630 }, { "epoch": 0.23, "learning_rate": 0.0002654610490840569, "loss": 0.0205, "step": 45640 }, { "epoch": 0.23, "learning_rate": 0.0002654534813910429, "loss": 0.0279, "step": 45650 }, { "epoch": 0.23, "learning_rate": 0.00026544591369802886, "loss": 0.0211, "step": 45660 }, { "epoch": 0.23, "learning_rate": 0.00026543834600501484, "loss": 0.019, "step": 45670 }, { "epoch": 0.23, "learning_rate": 0.0002654307783120008, "loss": 0.0247, "step": 45680 }, { "epoch": 0.23, "learning_rate": 0.0002654232106189868, "loss": 0.0187, "step": 45690 }, { "epoch": 0.23, "learning_rate": 0.00026541564292597284, "loss": 0.0231, "step": 45700 }, { "epoch": 0.23, "learning_rate": 0.0002654080752329588, "loss": 0.0282, "step": 45710 }, { "epoch": 0.23, "learning_rate": 0.0002654005075399448, "loss": 0.0182, "step": 45720 }, { "epoch": 0.23, "learning_rate": 0.0002653929398469308, "loss": 0.0236, "step": 45730 }, { "epoch": 0.23, "learning_rate": 0.00026538537215391677, "loss": 0.0195, "step": 45740 }, { "epoch": 0.23, "learning_rate": 0.00026537780446090275, "loss": 0.0247, "step": 45750 }, { "epoch": 0.23, "learning_rate": 0.00026537023676788873, "loss": 0.0208, "step": 45760 }, { "epoch": 0.23, "learning_rate": 0.00026536266907487477, "loss": 0.0218, "step": 45770 }, { "epoch": 0.23, "learning_rate": 0.00026535510138186075, "loss": 0.0249, "step": 45780 }, { "epoch": 0.23, "learning_rate": 0.00026534753368884673, "loss": 0.0209, "step": 45790 }, { "epoch": 0.23, "learning_rate": 0.0002653399659958327, "loss": 0.023, "step": 45800 }, { "epoch": 0.23, "learning_rate": 0.0002653323983028187, "loss": 0.0184, "step": 45810 }, { "epoch": 0.23, "learning_rate": 0.0002653248306098047, "loss": 0.0246, "step": 45820 }, { "epoch": 0.23, "learning_rate": 0.0002653172629167907, "loss": 0.0245, "step": 45830 }, { "epoch": 0.23, "learning_rate": 0.0002653096952237767, "loss": 0.0209, "step": 45840 }, { "epoch": 0.23, "learning_rate": 0.00026530212753076267, "loss": 0.0254, "step": 45850 }, { "epoch": 0.23, "learning_rate": 0.00026529455983774865, "loss": 0.0221, "step": 45860 }, { "epoch": 0.23, "learning_rate": 0.00026528699214473463, "loss": 0.0208, "step": 45870 }, { "epoch": 0.23, "learning_rate": 0.0002652794244517206, "loss": 0.0242, "step": 45880 }, { "epoch": 0.23, "learning_rate": 0.0002652718567587066, "loss": 0.0208, "step": 45890 }, { "epoch": 0.23, "learning_rate": 0.0002652642890656926, "loss": 0.0223, "step": 45900 }, { "epoch": 0.23, "learning_rate": 0.00026525672137267856, "loss": 0.0214, "step": 45910 }, { "epoch": 0.23, "learning_rate": 0.00026524915367966454, "loss": 0.0258, "step": 45920 }, { "epoch": 0.23, "learning_rate": 0.0002652415859866506, "loss": 0.0216, "step": 45930 }, { "epoch": 0.23, "learning_rate": 0.00026523401829363656, "loss": 0.0246, "step": 45940 }, { "epoch": 0.23, "learning_rate": 0.00026522645060062254, "loss": 0.0233, "step": 45950 }, { "epoch": 0.23, "learning_rate": 0.0002652188829076085, "loss": 0.0182, "step": 45960 }, { "epoch": 0.23, "learning_rate": 0.0002652113152145945, "loss": 0.0225, "step": 45970 }, { "epoch": 0.23, "learning_rate": 0.0002652037475215805, "loss": 0.0192, "step": 45980 }, { "epoch": 0.23, "learning_rate": 0.00026519617982856647, "loss": 0.0246, "step": 45990 }, { "epoch": 0.23, "learning_rate": 0.0002651886121355525, "loss": 0.0228, "step": 46000 }, { "epoch": 0.23, "eval_cer": 0.9144877230334195, "eval_loss": 0.016304470598697662, "eval_runtime": 117.0909, "eval_samples_per_second": 17.081, "eval_steps_per_second": 4.27, "step": 46000 }, { "epoch": 0.23, "learning_rate": 0.0002651810444425385, "loss": 0.0214, "step": 46010 }, { "epoch": 0.23, "learning_rate": 0.00026517347674952447, "loss": 0.0216, "step": 46020 }, { "epoch": 0.23, "learning_rate": 0.00026516590905651045, "loss": 0.0235, "step": 46030 }, { "epoch": 0.23, "learning_rate": 0.00026515834136349643, "loss": 0.0227, "step": 46040 }, { "epoch": 0.23, "learning_rate": 0.0002651507736704824, "loss": 0.0207, "step": 46050 }, { "epoch": 0.23, "learning_rate": 0.00026514320597746845, "loss": 0.0197, "step": 46060 }, { "epoch": 0.23, "learning_rate": 0.0002651356382844544, "loss": 0.0191, "step": 46070 }, { "epoch": 0.23, "learning_rate": 0.0002651280705914404, "loss": 0.0204, "step": 46080 }, { "epoch": 0.23, "learning_rate": 0.0002651205028984264, "loss": 0.0198, "step": 46090 }, { "epoch": 0.23, "learning_rate": 0.00026511293520541237, "loss": 0.0197, "step": 46100 }, { "epoch": 0.23, "learning_rate": 0.00026510536751239835, "loss": 0.0199, "step": 46110 }, { "epoch": 0.23, "learning_rate": 0.00026509779981938433, "loss": 0.023, "step": 46120 }, { "epoch": 0.23, "learning_rate": 0.00026509023212637037, "loss": 0.0263, "step": 46130 }, { "epoch": 0.23, "learning_rate": 0.00026508266443335635, "loss": 0.0235, "step": 46140 }, { "epoch": 0.23, "learning_rate": 0.00026507509674034233, "loss": 0.026, "step": 46150 }, { "epoch": 0.23, "learning_rate": 0.0002650675290473283, "loss": 0.0229, "step": 46160 }, { "epoch": 0.23, "learning_rate": 0.0002650599613543143, "loss": 0.0249, "step": 46170 }, { "epoch": 0.23, "learning_rate": 0.0002650523936613003, "loss": 0.0269, "step": 46180 }, { "epoch": 0.23, "learning_rate": 0.0002650448259682863, "loss": 0.0199, "step": 46190 }, { "epoch": 0.23, "learning_rate": 0.0002650372582752723, "loss": 0.0235, "step": 46200 }, { "epoch": 0.23, "learning_rate": 0.0002650296905822583, "loss": 0.0305, "step": 46210 }, { "epoch": 0.23, "learning_rate": 0.00026502212288924426, "loss": 0.0246, "step": 46220 }, { "epoch": 0.23, "learning_rate": 0.00026501455519623024, "loss": 0.0207, "step": 46230 }, { "epoch": 0.23, "learning_rate": 0.0002650069875032162, "loss": 0.0205, "step": 46240 }, { "epoch": 0.23, "learning_rate": 0.00026499941981020226, "loss": 0.0233, "step": 46250 }, { "epoch": 0.23, "learning_rate": 0.00026499185211718824, "loss": 0.0228, "step": 46260 }, { "epoch": 0.23, "learning_rate": 0.0002649842844241742, "loss": 0.0191, "step": 46270 }, { "epoch": 0.23, "learning_rate": 0.0002649767167311602, "loss": 0.0205, "step": 46280 }, { "epoch": 0.23, "learning_rate": 0.0002649691490381462, "loss": 0.0187, "step": 46290 }, { "epoch": 0.23, "learning_rate": 0.00026496158134513216, "loss": 0.0212, "step": 46300 }, { "epoch": 0.23, "learning_rate": 0.00026495401365211814, "loss": 0.0185, "step": 46310 }, { "epoch": 0.23, "learning_rate": 0.0002649464459591042, "loss": 0.0228, "step": 46320 }, { "epoch": 0.23, "learning_rate": 0.00026493887826609016, "loss": 0.0214, "step": 46330 }, { "epoch": 0.23, "learning_rate": 0.00026493131057307614, "loss": 0.0189, "step": 46340 }, { "epoch": 0.23, "learning_rate": 0.0002649237428800621, "loss": 0.0188, "step": 46350 }, { "epoch": 0.23, "learning_rate": 0.0002649161751870481, "loss": 0.0262, "step": 46360 }, { "epoch": 0.23, "learning_rate": 0.0002649086074940341, "loss": 0.0203, "step": 46370 }, { "epoch": 0.23, "learning_rate": 0.0002649010398010201, "loss": 0.0235, "step": 46380 }, { "epoch": 0.23, "learning_rate": 0.0002648934721080061, "loss": 0.0184, "step": 46390 }, { "epoch": 0.23, "learning_rate": 0.0002648859044149921, "loss": 0.0214, "step": 46400 }, { "epoch": 0.23, "learning_rate": 0.00026487833672197807, "loss": 0.0194, "step": 46410 }, { "epoch": 0.23, "learning_rate": 0.00026487076902896405, "loss": 0.0244, "step": 46420 }, { "epoch": 0.23, "learning_rate": 0.00026486320133595003, "loss": 0.022, "step": 46430 }, { "epoch": 0.23, "learning_rate": 0.00026485563364293607, "loss": 0.0233, "step": 46440 }, { "epoch": 0.23, "learning_rate": 0.00026484806594992205, "loss": 0.0217, "step": 46450 }, { "epoch": 0.23, "learning_rate": 0.00026484049825690803, "loss": 0.0219, "step": 46460 }, { "epoch": 0.23, "learning_rate": 0.000264832930563894, "loss": 0.0162, "step": 46470 }, { "epoch": 0.23, "learning_rate": 0.00026482536287088, "loss": 0.0231, "step": 46480 }, { "epoch": 0.23, "learning_rate": 0.00026481779517786597, "loss": 0.0209, "step": 46490 }, { "epoch": 0.23, "learning_rate": 0.00026481022748485195, "loss": 0.0207, "step": 46500 }, { "epoch": 0.23, "learning_rate": 0.000264802659791838, "loss": 0.0205, "step": 46510 }, { "epoch": 0.23, "learning_rate": 0.00026479509209882397, "loss": 0.022, "step": 46520 }, { "epoch": 0.23, "learning_rate": 0.00026478752440580995, "loss": 0.0227, "step": 46530 }, { "epoch": 0.23, "learning_rate": 0.00026477995671279593, "loss": 0.0235, "step": 46540 }, { "epoch": 0.23, "learning_rate": 0.0002647723890197819, "loss": 0.0246, "step": 46550 }, { "epoch": 0.23, "learning_rate": 0.0002647648213267679, "loss": 0.0276, "step": 46560 }, { "epoch": 0.23, "learning_rate": 0.00026475725363375393, "loss": 0.022, "step": 46570 }, { "epoch": 0.24, "learning_rate": 0.0002647496859407399, "loss": 0.0196, "step": 46580 }, { "epoch": 0.24, "learning_rate": 0.0002647421182477259, "loss": 0.0196, "step": 46590 }, { "epoch": 0.24, "learning_rate": 0.0002647345505547119, "loss": 0.0203, "step": 46600 }, { "epoch": 0.24, "learning_rate": 0.00026472698286169786, "loss": 0.0207, "step": 46610 }, { "epoch": 0.24, "learning_rate": 0.00026471941516868384, "loss": 0.0217, "step": 46620 }, { "epoch": 0.24, "learning_rate": 0.0002647118474756698, "loss": 0.0185, "step": 46630 }, { "epoch": 0.24, "learning_rate": 0.00026470427978265586, "loss": 0.0215, "step": 46640 }, { "epoch": 0.24, "learning_rate": 0.00026469671208964184, "loss": 0.0194, "step": 46650 }, { "epoch": 0.24, "learning_rate": 0.0002646891443966278, "loss": 0.0238, "step": 46660 }, { "epoch": 0.24, "learning_rate": 0.0002646815767036138, "loss": 0.0205, "step": 46670 }, { "epoch": 0.24, "learning_rate": 0.0002646740090105998, "loss": 0.0214, "step": 46680 }, { "epoch": 0.24, "learning_rate": 0.00026466644131758576, "loss": 0.0189, "step": 46690 }, { "epoch": 0.24, "learning_rate": 0.0002646588736245718, "loss": 0.0191, "step": 46700 }, { "epoch": 0.24, "learning_rate": 0.0002646513059315578, "loss": 0.0238, "step": 46710 }, { "epoch": 0.24, "learning_rate": 0.00026464373823854376, "loss": 0.0209, "step": 46720 }, { "epoch": 0.24, "learning_rate": 0.00026463617054552974, "loss": 0.023, "step": 46730 }, { "epoch": 0.24, "learning_rate": 0.0002646286028525157, "loss": 0.0222, "step": 46740 }, { "epoch": 0.24, "learning_rate": 0.0002646210351595017, "loss": 0.0259, "step": 46750 }, { "epoch": 0.24, "learning_rate": 0.00026461346746648774, "loss": 0.0206, "step": 46760 }, { "epoch": 0.24, "learning_rate": 0.0002646058997734737, "loss": 0.0267, "step": 46770 }, { "epoch": 0.24, "learning_rate": 0.0002645983320804597, "loss": 0.0238, "step": 46780 }, { "epoch": 0.24, "learning_rate": 0.0002645907643874457, "loss": 0.026, "step": 46790 }, { "epoch": 0.24, "learning_rate": 0.00026458319669443167, "loss": 0.023, "step": 46800 }, { "epoch": 0.24, "learning_rate": 0.00026457562900141765, "loss": 0.0181, "step": 46810 }, { "epoch": 0.24, "learning_rate": 0.00026456806130840363, "loss": 0.023, "step": 46820 }, { "epoch": 0.24, "learning_rate": 0.00026456049361538967, "loss": 0.0237, "step": 46830 }, { "epoch": 0.24, "learning_rate": 0.00026455292592237565, "loss": 0.0209, "step": 46840 }, { "epoch": 0.24, "learning_rate": 0.00026454535822936163, "loss": 0.0234, "step": 46850 }, { "epoch": 0.24, "learning_rate": 0.0002645377905363476, "loss": 0.0178, "step": 46860 }, { "epoch": 0.24, "learning_rate": 0.0002645302228433336, "loss": 0.0219, "step": 46870 }, { "epoch": 0.24, "learning_rate": 0.0002645226551503196, "loss": 0.0225, "step": 46880 }, { "epoch": 0.24, "learning_rate": 0.0002645150874573056, "loss": 0.0207, "step": 46890 }, { "epoch": 0.24, "learning_rate": 0.0002645075197642916, "loss": 0.0211, "step": 46900 }, { "epoch": 0.24, "learning_rate": 0.00026449995207127757, "loss": 0.0274, "step": 46910 }, { "epoch": 0.24, "learning_rate": 0.00026449238437826355, "loss": 0.0229, "step": 46920 }, { "epoch": 0.24, "learning_rate": 0.00026448481668524954, "loss": 0.0243, "step": 46930 }, { "epoch": 0.24, "learning_rate": 0.0002644772489922355, "loss": 0.0228, "step": 46940 }, { "epoch": 0.24, "learning_rate": 0.00026446968129922155, "loss": 0.0171, "step": 46950 }, { "epoch": 0.24, "learning_rate": 0.00026446211360620753, "loss": 0.0219, "step": 46960 }, { "epoch": 0.24, "learning_rate": 0.0002644545459131935, "loss": 0.0197, "step": 46970 }, { "epoch": 0.24, "learning_rate": 0.0002644469782201795, "loss": 0.0285, "step": 46980 }, { "epoch": 0.24, "learning_rate": 0.0002644394105271655, "loss": 0.0208, "step": 46990 }, { "epoch": 0.24, "learning_rate": 0.00026443184283415146, "loss": 0.0222, "step": 47000 }, { "epoch": 0.24, "eval_cer": 0.9145042197675514, "eval_loss": 0.01637718454003334, "eval_runtime": 117.1859, "eval_samples_per_second": 17.067, "eval_steps_per_second": 4.267, "step": 47000 }, { "epoch": 0.24, "learning_rate": 0.00026442427514113744, "loss": 0.0188, "step": 47010 }, { "epoch": 0.24, "learning_rate": 0.0002644167074481235, "loss": 0.0246, "step": 47020 }, { "epoch": 0.24, "learning_rate": 0.00026440913975510946, "loss": 0.0251, "step": 47030 }, { "epoch": 0.24, "learning_rate": 0.00026440157206209544, "loss": 0.0211, "step": 47040 }, { "epoch": 0.24, "learning_rate": 0.0002643940043690814, "loss": 0.0213, "step": 47050 }, { "epoch": 0.24, "learning_rate": 0.0002643864366760674, "loss": 0.0222, "step": 47060 }, { "epoch": 0.24, "learning_rate": 0.0002643788689830534, "loss": 0.0188, "step": 47070 }, { "epoch": 0.24, "learning_rate": 0.0002643713012900394, "loss": 0.0238, "step": 47080 }, { "epoch": 0.24, "learning_rate": 0.0002643637335970254, "loss": 0.0224, "step": 47090 }, { "epoch": 0.24, "learning_rate": 0.0002643561659040114, "loss": 0.0182, "step": 47100 }, { "epoch": 0.24, "learning_rate": 0.00026434859821099736, "loss": 0.0235, "step": 47110 }, { "epoch": 0.24, "learning_rate": 0.00026434103051798335, "loss": 0.0206, "step": 47120 }, { "epoch": 0.24, "learning_rate": 0.0002643334628249693, "loss": 0.0196, "step": 47130 }, { "epoch": 0.24, "learning_rate": 0.0002643258951319553, "loss": 0.0266, "step": 47140 }, { "epoch": 0.24, "learning_rate": 0.0002643183274389413, "loss": 0.0225, "step": 47150 }, { "epoch": 0.24, "learning_rate": 0.00026431075974592727, "loss": 0.0224, "step": 47160 }, { "epoch": 0.24, "learning_rate": 0.00026430319205291325, "loss": 0.0199, "step": 47170 }, { "epoch": 0.24, "learning_rate": 0.00026429562435989923, "loss": 0.0187, "step": 47180 }, { "epoch": 0.24, "learning_rate": 0.00026428805666688527, "loss": 0.0233, "step": 47190 }, { "epoch": 0.24, "learning_rate": 0.00026428048897387125, "loss": 0.0248, "step": 47200 }, { "epoch": 0.24, "learning_rate": 0.00026427292128085723, "loss": 0.0197, "step": 47210 }, { "epoch": 0.24, "learning_rate": 0.0002642653535878432, "loss": 0.027, "step": 47220 }, { "epoch": 0.24, "learning_rate": 0.0002642577858948292, "loss": 0.0225, "step": 47230 }, { "epoch": 0.24, "learning_rate": 0.0002642502182018152, "loss": 0.0343, "step": 47240 }, { "epoch": 0.24, "learning_rate": 0.0002642426505088012, "loss": 0.0245, "step": 47250 }, { "epoch": 0.24, "learning_rate": 0.0002642350828157872, "loss": 0.0214, "step": 47260 }, { "epoch": 0.24, "learning_rate": 0.0002642275151227732, "loss": 0.0239, "step": 47270 }, { "epoch": 0.24, "learning_rate": 0.00026421994742975916, "loss": 0.0241, "step": 47280 }, { "epoch": 0.24, "learning_rate": 0.00026421237973674514, "loss": 0.0199, "step": 47290 }, { "epoch": 0.24, "learning_rate": 0.0002642048120437311, "loss": 0.0254, "step": 47300 }, { "epoch": 0.24, "learning_rate": 0.00026419724435071716, "loss": 0.0212, "step": 47310 }, { "epoch": 0.24, "learning_rate": 0.00026418967665770314, "loss": 0.019, "step": 47320 }, { "epoch": 0.24, "learning_rate": 0.0002641821089646891, "loss": 0.0199, "step": 47330 }, { "epoch": 0.24, "learning_rate": 0.0002641745412716751, "loss": 0.0228, "step": 47340 }, { "epoch": 0.24, "learning_rate": 0.0002641669735786611, "loss": 0.0224, "step": 47350 }, { "epoch": 0.24, "learning_rate": 0.00026415940588564706, "loss": 0.0274, "step": 47360 }, { "epoch": 0.24, "learning_rate": 0.00026415183819263304, "loss": 0.0212, "step": 47370 }, { "epoch": 0.24, "learning_rate": 0.0002641442704996191, "loss": 0.0212, "step": 47380 }, { "epoch": 0.24, "learning_rate": 0.00026413670280660506, "loss": 0.0193, "step": 47390 }, { "epoch": 0.24, "learning_rate": 0.00026412913511359104, "loss": 0.0199, "step": 47400 }, { "epoch": 0.24, "learning_rate": 0.000264121567420577, "loss": 0.0196, "step": 47410 }, { "epoch": 0.24, "learning_rate": 0.000264113999727563, "loss": 0.024, "step": 47420 }, { "epoch": 0.24, "learning_rate": 0.000264106432034549, "loss": 0.0214, "step": 47430 }, { "epoch": 0.24, "learning_rate": 0.000264098864341535, "loss": 0.0207, "step": 47440 }, { "epoch": 0.24, "learning_rate": 0.000264091296648521, "loss": 0.0191, "step": 47450 }, { "epoch": 0.24, "learning_rate": 0.000264083728955507, "loss": 0.0182, "step": 47460 }, { "epoch": 0.24, "learning_rate": 0.00026407616126249297, "loss": 0.0216, "step": 47470 }, { "epoch": 0.24, "learning_rate": 0.00026406859356947895, "loss": 0.02, "step": 47480 }, { "epoch": 0.24, "learning_rate": 0.00026406102587646493, "loss": 0.0159, "step": 47490 }, { "epoch": 0.24, "learning_rate": 0.00026405345818345097, "loss": 0.0212, "step": 47500 }, { "epoch": 0.24, "learning_rate": 0.00026404589049043695, "loss": 0.0226, "step": 47510 }, { "epoch": 0.24, "learning_rate": 0.00026403832279742293, "loss": 0.0201, "step": 47520 }, { "epoch": 0.24, "learning_rate": 0.0002640307551044089, "loss": 0.0164, "step": 47530 }, { "epoch": 0.24, "learning_rate": 0.0002640231874113949, "loss": 0.0229, "step": 47540 }, { "epoch": 0.24, "learning_rate": 0.00026401561971838087, "loss": 0.0247, "step": 47550 }, { "epoch": 0.24, "learning_rate": 0.00026400805202536685, "loss": 0.0194, "step": 47560 }, { "epoch": 0.24, "learning_rate": 0.0002640004843323529, "loss": 0.0219, "step": 47570 }, { "epoch": 0.24, "learning_rate": 0.00026399291663933887, "loss": 0.0188, "step": 47580 }, { "epoch": 0.24, "learning_rate": 0.00026398534894632485, "loss": 0.0244, "step": 47590 }, { "epoch": 0.24, "learning_rate": 0.00026397778125331083, "loss": 0.0197, "step": 47600 }, { "epoch": 0.24, "learning_rate": 0.0002639702135602968, "loss": 0.0221, "step": 47610 }, { "epoch": 0.24, "learning_rate": 0.0002639626458672828, "loss": 0.0216, "step": 47620 }, { "epoch": 0.24, "learning_rate": 0.00026395507817426883, "loss": 0.0227, "step": 47630 }, { "epoch": 0.24, "learning_rate": 0.0002639475104812548, "loss": 0.0247, "step": 47640 }, { "epoch": 0.24, "learning_rate": 0.0002639399427882408, "loss": 0.0204, "step": 47650 }, { "epoch": 0.24, "learning_rate": 0.0002639323750952268, "loss": 0.026, "step": 47660 }, { "epoch": 0.24, "learning_rate": 0.00026392480740221276, "loss": 0.0216, "step": 47670 }, { "epoch": 0.24, "learning_rate": 0.00026391723970919874, "loss": 0.022, "step": 47680 }, { "epoch": 0.24, "learning_rate": 0.0002639096720161847, "loss": 0.0216, "step": 47690 }, { "epoch": 0.24, "learning_rate": 0.00026390210432317076, "loss": 0.0209, "step": 47700 }, { "epoch": 0.24, "learning_rate": 0.00026389453663015674, "loss": 0.0277, "step": 47710 }, { "epoch": 0.24, "learning_rate": 0.0002638869689371427, "loss": 0.0262, "step": 47720 }, { "epoch": 0.24, "learning_rate": 0.0002638794012441287, "loss": 0.0212, "step": 47730 }, { "epoch": 0.24, "learning_rate": 0.0002638718335511147, "loss": 0.0265, "step": 47740 }, { "epoch": 0.24, "learning_rate": 0.00026386426585810066, "loss": 0.0204, "step": 47750 }, { "epoch": 0.24, "learning_rate": 0.0002638566981650867, "loss": 0.0244, "step": 47760 }, { "epoch": 0.24, "learning_rate": 0.0002638491304720727, "loss": 0.0235, "step": 47770 }, { "epoch": 0.24, "learning_rate": 0.00026384156277905866, "loss": 0.0228, "step": 47780 }, { "epoch": 0.24, "learning_rate": 0.00026383399508604464, "loss": 0.0228, "step": 47790 }, { "epoch": 0.24, "learning_rate": 0.0002638264273930306, "loss": 0.0253, "step": 47800 }, { "epoch": 0.24, "learning_rate": 0.0002638188597000166, "loss": 0.0205, "step": 47810 }, { "epoch": 0.24, "learning_rate": 0.00026381129200700264, "loss": 0.0226, "step": 47820 }, { "epoch": 0.24, "learning_rate": 0.0002638037243139886, "loss": 0.0198, "step": 47830 }, { "epoch": 0.24, "learning_rate": 0.0002637961566209746, "loss": 0.0209, "step": 47840 }, { "epoch": 0.24, "learning_rate": 0.0002637885889279606, "loss": 0.0246, "step": 47850 }, { "epoch": 0.24, "learning_rate": 0.00026378102123494657, "loss": 0.0185, "step": 47860 }, { "epoch": 0.24, "learning_rate": 0.00026377345354193255, "loss": 0.0212, "step": 47870 }, { "epoch": 0.24, "learning_rate": 0.00026376588584891853, "loss": 0.0234, "step": 47880 }, { "epoch": 0.24, "learning_rate": 0.00026375831815590457, "loss": 0.0225, "step": 47890 }, { "epoch": 0.24, "learning_rate": 0.00026375075046289055, "loss": 0.0246, "step": 47900 }, { "epoch": 0.24, "learning_rate": 0.00026374318276987653, "loss": 0.0237, "step": 47910 }, { "epoch": 0.24, "learning_rate": 0.0002637356150768625, "loss": 0.0229, "step": 47920 }, { "epoch": 0.24, "learning_rate": 0.0002637280473838485, "loss": 0.0238, "step": 47930 }, { "epoch": 0.24, "learning_rate": 0.0002637204796908345, "loss": 0.023, "step": 47940 }, { "epoch": 0.24, "learning_rate": 0.0002637129119978205, "loss": 0.0245, "step": 47950 }, { "epoch": 0.24, "learning_rate": 0.0002637053443048065, "loss": 0.024, "step": 47960 }, { "epoch": 0.24, "learning_rate": 0.00026369777661179247, "loss": 0.0206, "step": 47970 }, { "epoch": 0.24, "learning_rate": 0.00026369020891877845, "loss": 0.0229, "step": 47980 }, { "epoch": 0.24, "learning_rate": 0.00026368264122576444, "loss": 0.0198, "step": 47990 }, { "epoch": 0.24, "learning_rate": 0.0002636750735327504, "loss": 0.0226, "step": 48000 }, { "epoch": 0.24, "eval_cer": 0.9144945158062973, "eval_loss": 0.015514707192778587, "eval_runtime": 117.0856, "eval_samples_per_second": 17.082, "eval_steps_per_second": 4.27, "step": 48000 }, { "epoch": 0.24, "learning_rate": 0.00026366750583973645, "loss": 0.0243, "step": 48010 }, { "epoch": 0.24, "learning_rate": 0.00026365993814672243, "loss": 0.0214, "step": 48020 }, { "epoch": 0.24, "learning_rate": 0.0002636523704537084, "loss": 0.0243, "step": 48030 }, { "epoch": 0.24, "learning_rate": 0.0002636448027606944, "loss": 0.0254, "step": 48040 }, { "epoch": 0.24, "learning_rate": 0.0002636372350676804, "loss": 0.023, "step": 48050 }, { "epoch": 0.24, "learning_rate": 0.00026362966737466636, "loss": 0.0218, "step": 48060 }, { "epoch": 0.24, "learning_rate": 0.00026362209968165234, "loss": 0.0228, "step": 48070 }, { "epoch": 0.24, "learning_rate": 0.0002636145319886384, "loss": 0.0219, "step": 48080 }, { "epoch": 0.24, "learning_rate": 0.00026360696429562436, "loss": 0.0156, "step": 48090 }, { "epoch": 0.24, "learning_rate": 0.00026359939660261034, "loss": 0.0239, "step": 48100 }, { "epoch": 0.24, "learning_rate": 0.0002635918289095963, "loss": 0.0257, "step": 48110 }, { "epoch": 0.24, "learning_rate": 0.0002635842612165823, "loss": 0.0211, "step": 48120 }, { "epoch": 0.24, "learning_rate": 0.0002635766935235683, "loss": 0.0273, "step": 48130 }, { "epoch": 0.24, "learning_rate": 0.0002635691258305543, "loss": 0.0219, "step": 48140 }, { "epoch": 0.24, "learning_rate": 0.0002635615581375403, "loss": 0.0251, "step": 48150 }, { "epoch": 0.24, "learning_rate": 0.0002635539904445263, "loss": 0.0212, "step": 48160 }, { "epoch": 0.24, "learning_rate": 0.00026354642275151226, "loss": 0.0205, "step": 48170 }, { "epoch": 0.24, "learning_rate": 0.00026353885505849825, "loss": 0.0199, "step": 48180 }, { "epoch": 0.24, "learning_rate": 0.0002635312873654842, "loss": 0.0203, "step": 48190 }, { "epoch": 0.24, "learning_rate": 0.0002635237196724702, "loss": 0.0216, "step": 48200 }, { "epoch": 0.24, "learning_rate": 0.00026351615197945624, "loss": 0.0198, "step": 48210 }, { "epoch": 0.24, "learning_rate": 0.0002635085842864422, "loss": 0.0235, "step": 48220 }, { "epoch": 0.24, "learning_rate": 0.0002635010165934282, "loss": 0.0244, "step": 48230 }, { "epoch": 0.24, "learning_rate": 0.0002634934489004142, "loss": 0.0211, "step": 48240 }, { "epoch": 0.24, "learning_rate": 0.00026348588120740017, "loss": 0.0189, "step": 48250 }, { "epoch": 0.24, "learning_rate": 0.00026347831351438615, "loss": 0.0228, "step": 48260 }, { "epoch": 0.24, "learning_rate": 0.0002634707458213722, "loss": 0.0208, "step": 48270 }, { "epoch": 0.24, "learning_rate": 0.00026346317812835817, "loss": 0.024, "step": 48280 }, { "epoch": 0.24, "learning_rate": 0.00026345561043534415, "loss": 0.0229, "step": 48290 }, { "epoch": 0.24, "learning_rate": 0.00026344804274233013, "loss": 0.0207, "step": 48300 }, { "epoch": 0.24, "learning_rate": 0.0002634404750493161, "loss": 0.0215, "step": 48310 }, { "epoch": 0.24, "learning_rate": 0.0002634329073563021, "loss": 0.0354, "step": 48320 }, { "epoch": 0.24, "learning_rate": 0.00026342533966328813, "loss": 0.0351, "step": 48330 }, { "epoch": 0.24, "learning_rate": 0.0002634177719702741, "loss": 0.0239, "step": 48340 }, { "epoch": 0.24, "learning_rate": 0.0002634102042772601, "loss": 0.0199, "step": 48350 }, { "epoch": 0.24, "learning_rate": 0.0002634026365842461, "loss": 0.0196, "step": 48360 }, { "epoch": 0.24, "learning_rate": 0.00026339506889123206, "loss": 0.0282, "step": 48370 }, { "epoch": 0.24, "learning_rate": 0.00026338750119821804, "loss": 0.0207, "step": 48380 }, { "epoch": 0.24, "learning_rate": 0.000263379933505204, "loss": 0.0238, "step": 48390 }, { "epoch": 0.24, "learning_rate": 0.00026337236581219, "loss": 0.0243, "step": 48400 }, { "epoch": 0.24, "learning_rate": 0.000263364798119176, "loss": 0.0196, "step": 48410 }, { "epoch": 0.24, "learning_rate": 0.00026335723042616196, "loss": 0.0195, "step": 48420 }, { "epoch": 0.24, "learning_rate": 0.00026334966273314794, "loss": 0.0169, "step": 48430 }, { "epoch": 0.24, "learning_rate": 0.000263342095040134, "loss": 0.0239, "step": 48440 }, { "epoch": 0.24, "learning_rate": 0.00026333452734711996, "loss": 0.0218, "step": 48450 }, { "epoch": 0.24, "learning_rate": 0.00026332695965410594, "loss": 0.0185, "step": 48460 }, { "epoch": 0.24, "learning_rate": 0.0002633193919610919, "loss": 0.0182, "step": 48470 }, { "epoch": 0.24, "learning_rate": 0.0002633118242680779, "loss": 0.0219, "step": 48480 }, { "epoch": 0.24, "learning_rate": 0.0002633042565750639, "loss": 0.0188, "step": 48490 }, { "epoch": 0.24, "learning_rate": 0.0002632966888820499, "loss": 0.0259, "step": 48500 }, { "epoch": 0.24, "learning_rate": 0.0002632891211890359, "loss": 0.0259, "step": 48510 }, { "epoch": 0.24, "learning_rate": 0.0002632815534960219, "loss": 0.0211, "step": 48520 }, { "epoch": 0.24, "learning_rate": 0.00026327398580300787, "loss": 0.0176, "step": 48530 }, { "epoch": 0.24, "learning_rate": 0.00026326641810999385, "loss": 0.0215, "step": 48540 }, { "epoch": 0.24, "learning_rate": 0.00026325885041697983, "loss": 0.0193, "step": 48550 }, { "epoch": 0.24, "learning_rate": 0.00026325128272396587, "loss": 0.0211, "step": 48560 }, { "epoch": 0.25, "learning_rate": 0.00026324371503095185, "loss": 0.0204, "step": 48570 }, { "epoch": 0.25, "learning_rate": 0.00026323614733793783, "loss": 0.0194, "step": 48580 }, { "epoch": 0.25, "learning_rate": 0.0002632285796449238, "loss": 0.0161, "step": 48590 }, { "epoch": 0.25, "learning_rate": 0.0002632210119519098, "loss": 0.0273, "step": 48600 }, { "epoch": 0.25, "learning_rate": 0.00026321344425889577, "loss": 0.0227, "step": 48610 }, { "epoch": 0.25, "learning_rate": 0.00026320587656588175, "loss": 0.0217, "step": 48620 }, { "epoch": 0.25, "learning_rate": 0.0002631983088728678, "loss": 0.0256, "step": 48630 }, { "epoch": 0.25, "learning_rate": 0.00026319074117985377, "loss": 0.0195, "step": 48640 }, { "epoch": 0.25, "learning_rate": 0.00026318317348683975, "loss": 0.0206, "step": 48650 }, { "epoch": 0.25, "learning_rate": 0.00026317560579382573, "loss": 0.0203, "step": 48660 }, { "epoch": 0.25, "learning_rate": 0.0002631680381008117, "loss": 0.0292, "step": 48670 }, { "epoch": 0.25, "learning_rate": 0.0002631604704077977, "loss": 0.0227, "step": 48680 }, { "epoch": 0.25, "learning_rate": 0.00026315290271478373, "loss": 0.0221, "step": 48690 }, { "epoch": 0.25, "learning_rate": 0.0002631453350217697, "loss": 0.0199, "step": 48700 }, { "epoch": 0.25, "learning_rate": 0.0002631377673287557, "loss": 0.0205, "step": 48710 }, { "epoch": 0.25, "learning_rate": 0.0002631301996357417, "loss": 0.0198, "step": 48720 }, { "epoch": 0.25, "learning_rate": 0.00026312263194272766, "loss": 0.0239, "step": 48730 }, { "epoch": 0.25, "learning_rate": 0.00026311506424971364, "loss": 0.0193, "step": 48740 }, { "epoch": 0.25, "learning_rate": 0.0002631074965566996, "loss": 0.0203, "step": 48750 }, { "epoch": 0.25, "learning_rate": 0.00026309992886368566, "loss": 0.0259, "step": 48760 }, { "epoch": 0.25, "learning_rate": 0.00026309236117067164, "loss": 0.0228, "step": 48770 }, { "epoch": 0.25, "learning_rate": 0.0002630847934776576, "loss": 0.0207, "step": 48780 }, { "epoch": 0.25, "learning_rate": 0.0002630772257846436, "loss": 0.0235, "step": 48790 }, { "epoch": 0.25, "learning_rate": 0.0002630696580916296, "loss": 0.0219, "step": 48800 }, { "epoch": 0.25, "learning_rate": 0.00026306209039861556, "loss": 0.0228, "step": 48810 }, { "epoch": 0.25, "learning_rate": 0.0002630545227056016, "loss": 0.021, "step": 48820 }, { "epoch": 0.25, "learning_rate": 0.0002630469550125876, "loss": 0.0212, "step": 48830 }, { "epoch": 0.25, "learning_rate": 0.00026303938731957356, "loss": 0.0202, "step": 48840 }, { "epoch": 0.25, "learning_rate": 0.00026303181962655954, "loss": 0.0193, "step": 48850 }, { "epoch": 0.25, "learning_rate": 0.0002630242519335455, "loss": 0.0174, "step": 48860 }, { "epoch": 0.25, "learning_rate": 0.0002630166842405315, "loss": 0.0211, "step": 48870 }, { "epoch": 0.25, "learning_rate": 0.00026300911654751754, "loss": 0.0255, "step": 48880 }, { "epoch": 0.25, "learning_rate": 0.0002630015488545035, "loss": 0.0251, "step": 48890 }, { "epoch": 0.25, "learning_rate": 0.0002629939811614895, "loss": 0.0213, "step": 48900 }, { "epoch": 0.25, "learning_rate": 0.0002629864134684755, "loss": 0.0236, "step": 48910 }, { "epoch": 0.25, "learning_rate": 0.00026297884577546147, "loss": 0.0214, "step": 48920 }, { "epoch": 0.25, "learning_rate": 0.00026297127808244745, "loss": 0.0194, "step": 48930 }, { "epoch": 0.25, "learning_rate": 0.00026296371038943343, "loss": 0.0219, "step": 48940 }, { "epoch": 0.25, "learning_rate": 0.00026295614269641947, "loss": 0.0216, "step": 48950 }, { "epoch": 0.25, "learning_rate": 0.00026294857500340545, "loss": 0.0219, "step": 48960 }, { "epoch": 0.25, "learning_rate": 0.00026294100731039143, "loss": 0.0237, "step": 48970 }, { "epoch": 0.25, "learning_rate": 0.0002629334396173774, "loss": 0.0216, "step": 48980 }, { "epoch": 0.25, "learning_rate": 0.0002629258719243634, "loss": 0.0226, "step": 48990 }, { "epoch": 0.25, "learning_rate": 0.0002629183042313494, "loss": 0.0171, "step": 49000 }, { "epoch": 0.25, "eval_cer": 0.914452788772905, "eval_loss": 0.01547841913998127, "eval_runtime": 116.9106, "eval_samples_per_second": 17.107, "eval_steps_per_second": 4.277, "step": 49000 }, { "epoch": 0.25, "learning_rate": 0.0002629107365383354, "loss": 0.0207, "step": 49010 }, { "epoch": 0.25, "learning_rate": 0.0002629031688453214, "loss": 0.0196, "step": 49020 }, { "epoch": 0.25, "learning_rate": 0.0002628956011523074, "loss": 0.0228, "step": 49030 }, { "epoch": 0.25, "learning_rate": 0.00026288803345929335, "loss": 0.0224, "step": 49040 }, { "epoch": 0.25, "learning_rate": 0.00026288046576627934, "loss": 0.0213, "step": 49050 }, { "epoch": 0.25, "learning_rate": 0.0002628728980732653, "loss": 0.02, "step": 49060 }, { "epoch": 0.25, "learning_rate": 0.00026286533038025135, "loss": 0.0183, "step": 49070 }, { "epoch": 0.25, "learning_rate": 0.00026285776268723733, "loss": 0.023, "step": 49080 }, { "epoch": 0.25, "learning_rate": 0.0002628501949942233, "loss": 0.0184, "step": 49090 }, { "epoch": 0.25, "learning_rate": 0.0002628426273012093, "loss": 0.0265, "step": 49100 }, { "epoch": 0.25, "learning_rate": 0.0002628350596081953, "loss": 0.023, "step": 49110 }, { "epoch": 0.25, "learning_rate": 0.00026282749191518126, "loss": 0.0267, "step": 49120 }, { "epoch": 0.25, "learning_rate": 0.00026281992422216724, "loss": 0.021, "step": 49130 }, { "epoch": 0.25, "learning_rate": 0.0002628123565291533, "loss": 0.0201, "step": 49140 }, { "epoch": 0.25, "learning_rate": 0.00026280478883613926, "loss": 0.023, "step": 49150 }, { "epoch": 0.25, "learning_rate": 0.00026279722114312524, "loss": 0.0224, "step": 49160 }, { "epoch": 0.25, "learning_rate": 0.0002627896534501112, "loss": 0.0228, "step": 49170 }, { "epoch": 0.25, "learning_rate": 0.0002627820857570972, "loss": 0.022, "step": 49180 }, { "epoch": 0.25, "learning_rate": 0.0002627745180640832, "loss": 0.0164, "step": 49190 }, { "epoch": 0.25, "learning_rate": 0.0002627669503710692, "loss": 0.018, "step": 49200 }, { "epoch": 0.25, "learning_rate": 0.0002627593826780552, "loss": 0.0173, "step": 49210 }, { "epoch": 0.25, "learning_rate": 0.0002627518149850412, "loss": 0.0205, "step": 49220 }, { "epoch": 0.25, "learning_rate": 0.00026274424729202716, "loss": 0.0234, "step": 49230 }, { "epoch": 0.25, "learning_rate": 0.00026273667959901315, "loss": 0.0218, "step": 49240 }, { "epoch": 0.25, "learning_rate": 0.00026272911190599913, "loss": 0.0169, "step": 49250 }, { "epoch": 0.25, "learning_rate": 0.0002627215442129851, "loss": 0.0187, "step": 49260 }, { "epoch": 0.25, "learning_rate": 0.00026271397651997114, "loss": 0.0195, "step": 49270 }, { "epoch": 0.25, "learning_rate": 0.0002627064088269571, "loss": 0.0175, "step": 49280 }, { "epoch": 0.25, "learning_rate": 0.0002626988411339431, "loss": 0.0215, "step": 49290 }, { "epoch": 0.25, "learning_rate": 0.0002626912734409291, "loss": 0.0204, "step": 49300 }, { "epoch": 0.25, "learning_rate": 0.00026268370574791507, "loss": 0.0264, "step": 49310 }, { "epoch": 0.25, "learning_rate": 0.00026267613805490105, "loss": 0.0278, "step": 49320 }, { "epoch": 0.25, "learning_rate": 0.0002626685703618871, "loss": 0.0248, "step": 49330 }, { "epoch": 0.25, "learning_rate": 0.00026266100266887307, "loss": 0.0231, "step": 49340 }, { "epoch": 0.25, "learning_rate": 0.00026265343497585905, "loss": 0.0239, "step": 49350 }, { "epoch": 0.25, "learning_rate": 0.00026264586728284503, "loss": 0.0204, "step": 49360 }, { "epoch": 0.25, "learning_rate": 0.000262638299589831, "loss": 0.021, "step": 49370 }, { "epoch": 0.25, "learning_rate": 0.000262630731896817, "loss": 0.0216, "step": 49380 }, { "epoch": 0.25, "learning_rate": 0.00026262316420380303, "loss": 0.022, "step": 49390 }, { "epoch": 0.25, "learning_rate": 0.000262615596510789, "loss": 0.02, "step": 49400 }, { "epoch": 0.25, "learning_rate": 0.000262608028817775, "loss": 0.0201, "step": 49410 }, { "epoch": 0.25, "learning_rate": 0.000262600461124761, "loss": 0.0203, "step": 49420 }, { "epoch": 0.25, "learning_rate": 0.00026259289343174696, "loss": 0.0205, "step": 49430 }, { "epoch": 0.25, "learning_rate": 0.00026258532573873294, "loss": 0.0223, "step": 49440 }, { "epoch": 0.25, "learning_rate": 0.0002625777580457189, "loss": 0.0216, "step": 49450 }, { "epoch": 0.25, "learning_rate": 0.00026257019035270495, "loss": 0.0212, "step": 49460 }, { "epoch": 0.25, "learning_rate": 0.00026256262265969094, "loss": 0.0207, "step": 49470 }, { "epoch": 0.25, "learning_rate": 0.0002625550549666769, "loss": 0.0235, "step": 49480 }, { "epoch": 0.25, "learning_rate": 0.0002625474872736629, "loss": 0.0181, "step": 49490 }, { "epoch": 0.25, "learning_rate": 0.0002625399195806489, "loss": 0.0182, "step": 49500 }, { "epoch": 0.25, "learning_rate": 0.00026253235188763486, "loss": 0.0221, "step": 49510 }, { "epoch": 0.25, "learning_rate": 0.0002625247841946209, "loss": 0.0301, "step": 49520 }, { "epoch": 0.25, "learning_rate": 0.0002625172165016069, "loss": 0.0225, "step": 49530 }, { "epoch": 0.25, "learning_rate": 0.00026250964880859286, "loss": 0.0241, "step": 49540 }, { "epoch": 0.25, "learning_rate": 0.00026250208111557884, "loss": 0.0226, "step": 49550 }, { "epoch": 0.25, "learning_rate": 0.0002624945134225648, "loss": 0.0236, "step": 49560 }, { "epoch": 0.25, "learning_rate": 0.0002624869457295508, "loss": 0.0215, "step": 49570 }, { "epoch": 0.25, "learning_rate": 0.00026247937803653684, "loss": 0.0232, "step": 49580 }, { "epoch": 0.25, "learning_rate": 0.0002624718103435228, "loss": 0.02, "step": 49590 }, { "epoch": 0.25, "learning_rate": 0.0002624642426505088, "loss": 0.0189, "step": 49600 }, { "epoch": 0.25, "learning_rate": 0.0002624566749574948, "loss": 0.0234, "step": 49610 }, { "epoch": 0.25, "learning_rate": 0.00026244910726448077, "loss": 0.0208, "step": 49620 }, { "epoch": 0.25, "learning_rate": 0.00026244153957146675, "loss": 0.0176, "step": 49630 }, { "epoch": 0.25, "learning_rate": 0.00026243397187845273, "loss": 0.0277, "step": 49640 }, { "epoch": 0.25, "learning_rate": 0.0002624264041854387, "loss": 0.0259, "step": 49650 }, { "epoch": 0.25, "learning_rate": 0.0002624188364924247, "loss": 0.0293, "step": 49660 }, { "epoch": 0.25, "learning_rate": 0.0002624112687994107, "loss": 0.0237, "step": 49670 }, { "epoch": 0.25, "learning_rate": 0.00026240370110639665, "loss": 0.0198, "step": 49680 }, { "epoch": 0.25, "learning_rate": 0.0002623961334133827, "loss": 0.0218, "step": 49690 }, { "epoch": 0.25, "learning_rate": 0.00026238856572036867, "loss": 0.0217, "step": 49700 }, { "epoch": 0.25, "learning_rate": 0.00026238099802735465, "loss": 0.0206, "step": 49710 }, { "epoch": 0.25, "learning_rate": 0.00026237343033434063, "loss": 0.0174, "step": 49720 }, { "epoch": 0.25, "learning_rate": 0.0002623658626413266, "loss": 0.0238, "step": 49730 }, { "epoch": 0.25, "learning_rate": 0.0002623582949483126, "loss": 0.0251, "step": 49740 }, { "epoch": 0.25, "learning_rate": 0.00026235072725529863, "loss": 0.0189, "step": 49750 }, { "epoch": 0.25, "learning_rate": 0.0002623431595622846, "loss": 0.019, "step": 49760 }, { "epoch": 0.25, "learning_rate": 0.0002623355918692706, "loss": 0.0216, "step": 49770 }, { "epoch": 0.25, "learning_rate": 0.0002623280241762566, "loss": 0.0211, "step": 49780 }, { "epoch": 0.25, "learning_rate": 0.00026232045648324256, "loss": 0.0243, "step": 49790 }, { "epoch": 0.25, "learning_rate": 0.00026231288879022854, "loss": 0.0228, "step": 49800 }, { "epoch": 0.25, "learning_rate": 0.0002623053210972146, "loss": 0.0223, "step": 49810 }, { "epoch": 0.25, "learning_rate": 0.00026229775340420056, "loss": 0.0203, "step": 49820 }, { "epoch": 0.25, "learning_rate": 0.00026229018571118654, "loss": 0.0194, "step": 49830 }, { "epoch": 0.25, "learning_rate": 0.0002622826180181725, "loss": 0.0225, "step": 49840 }, { "epoch": 0.25, "learning_rate": 0.0002622750503251585, "loss": 0.0241, "step": 49850 }, { "epoch": 0.25, "learning_rate": 0.0002622674826321445, "loss": 0.0213, "step": 49860 }, { "epoch": 0.25, "learning_rate": 0.00026225991493913046, "loss": 0.0197, "step": 49870 }, { "epoch": 0.25, "learning_rate": 0.0002622523472461165, "loss": 0.0223, "step": 49880 }, { "epoch": 0.25, "learning_rate": 0.0002622447795531025, "loss": 0.0208, "step": 49890 }, { "epoch": 0.25, "learning_rate": 0.00026223721186008846, "loss": 0.0244, "step": 49900 }, { "epoch": 0.25, "learning_rate": 0.00026222964416707444, "loss": 0.0235, "step": 49910 }, { "epoch": 0.25, "learning_rate": 0.0002622220764740604, "loss": 0.0244, "step": 49920 }, { "epoch": 0.25, "learning_rate": 0.0002622145087810464, "loss": 0.0262, "step": 49930 }, { "epoch": 0.25, "learning_rate": 0.00026220694108803244, "loss": 0.0229, "step": 49940 }, { "epoch": 0.25, "learning_rate": 0.0002621993733950184, "loss": 0.0204, "step": 49950 }, { "epoch": 0.25, "learning_rate": 0.0002621918057020044, "loss": 0.0185, "step": 49960 }, { "epoch": 0.25, "learning_rate": 0.0002621842380089904, "loss": 0.0206, "step": 49970 }, { "epoch": 0.25, "learning_rate": 0.00026217667031597637, "loss": 0.0246, "step": 49980 }, { "epoch": 0.25, "learning_rate": 0.00026216910262296235, "loss": 0.0191, "step": 49990 }, { "epoch": 0.25, "learning_rate": 0.00026216153492994833, "loss": 0.0225, "step": 50000 }, { "epoch": 0.25, "eval_cer": 0.9144683151109114, "eval_loss": 0.015245326794683933, "eval_runtime": 117.0207, "eval_samples_per_second": 17.091, "eval_steps_per_second": 4.273, "step": 50000 }, { "epoch": 0.25, "learning_rate": 0.00026215396723693437, "loss": 0.0215, "step": 50010 }, { "epoch": 0.25, "learning_rate": 0.00026214639954392035, "loss": 0.0214, "step": 50020 }, { "epoch": 0.25, "learning_rate": 0.00026213883185090633, "loss": 0.0212, "step": 50030 }, { "epoch": 0.25, "learning_rate": 0.0002621312641578923, "loss": 0.0178, "step": 50040 }, { "epoch": 0.25, "learning_rate": 0.0002621236964648783, "loss": 0.023, "step": 50050 }, { "epoch": 0.25, "learning_rate": 0.0002621161287718643, "loss": 0.0211, "step": 50060 }, { "epoch": 0.25, "learning_rate": 0.0002621085610788503, "loss": 0.0221, "step": 50070 }, { "epoch": 0.25, "learning_rate": 0.0002621009933858363, "loss": 0.0188, "step": 50080 }, { "epoch": 0.25, "learning_rate": 0.0002620934256928223, "loss": 0.0233, "step": 50090 }, { "epoch": 0.25, "learning_rate": 0.00026208585799980825, "loss": 0.0258, "step": 50100 }, { "epoch": 0.25, "learning_rate": 0.00026207829030679424, "loss": 0.0252, "step": 50110 }, { "epoch": 0.25, "learning_rate": 0.0002620707226137802, "loss": 0.0217, "step": 50120 }, { "epoch": 0.25, "learning_rate": 0.00026206315492076625, "loss": 0.0236, "step": 50130 }, { "epoch": 0.25, "learning_rate": 0.00026205558722775223, "loss": 0.0214, "step": 50140 }, { "epoch": 0.25, "learning_rate": 0.0002620480195347382, "loss": 0.0196, "step": 50150 }, { "epoch": 0.25, "learning_rate": 0.0002620404518417242, "loss": 0.0211, "step": 50160 }, { "epoch": 0.25, "learning_rate": 0.0002620328841487102, "loss": 0.0217, "step": 50170 }, { "epoch": 0.25, "learning_rate": 0.00026202531645569616, "loss": 0.0216, "step": 50180 }, { "epoch": 0.25, "learning_rate": 0.00026201774876268214, "loss": 0.0212, "step": 50190 }, { "epoch": 0.25, "learning_rate": 0.0002620101810696682, "loss": 0.0194, "step": 50200 }, { "epoch": 0.25, "learning_rate": 0.00026200261337665416, "loss": 0.0253, "step": 50210 }, { "epoch": 0.25, "learning_rate": 0.00026199504568364014, "loss": 0.0251, "step": 50220 }, { "epoch": 0.25, "learning_rate": 0.0002619874779906261, "loss": 0.02, "step": 50230 }, { "epoch": 0.25, "learning_rate": 0.0002619799102976121, "loss": 0.0204, "step": 50240 }, { "epoch": 0.25, "learning_rate": 0.0002619723426045981, "loss": 0.0262, "step": 50250 }, { "epoch": 0.25, "learning_rate": 0.0002619647749115841, "loss": 0.0199, "step": 50260 }, { "epoch": 0.25, "learning_rate": 0.0002619572072185701, "loss": 0.0235, "step": 50270 }, { "epoch": 0.25, "learning_rate": 0.0002619496395255561, "loss": 0.0206, "step": 50280 }, { "epoch": 0.25, "learning_rate": 0.00026194207183254206, "loss": 0.0196, "step": 50290 }, { "epoch": 0.25, "learning_rate": 0.00026193450413952805, "loss": 0.019, "step": 50300 }, { "epoch": 0.25, "learning_rate": 0.00026192693644651403, "loss": 0.0215, "step": 50310 }, { "epoch": 0.25, "learning_rate": 0.00026191936875350006, "loss": 0.0218, "step": 50320 }, { "epoch": 0.25, "learning_rate": 0.00026191180106048604, "loss": 0.0237, "step": 50330 }, { "epoch": 0.25, "learning_rate": 0.000261904233367472, "loss": 0.0252, "step": 50340 }, { "epoch": 0.25, "learning_rate": 0.000261896665674458, "loss": 0.0229, "step": 50350 }, { "epoch": 0.25, "learning_rate": 0.000261889097981444, "loss": 0.0208, "step": 50360 }, { "epoch": 0.25, "learning_rate": 0.00026188153028842997, "loss": 0.021, "step": 50370 }, { "epoch": 0.25, "learning_rate": 0.00026187396259541595, "loss": 0.0233, "step": 50380 }, { "epoch": 0.25, "learning_rate": 0.000261866394902402, "loss": 0.0215, "step": 50390 }, { "epoch": 0.25, "learning_rate": 0.00026185882720938797, "loss": 0.0213, "step": 50400 }, { "epoch": 0.25, "learning_rate": 0.00026185125951637395, "loss": 0.0197, "step": 50410 }, { "epoch": 0.25, "learning_rate": 0.00026184369182335993, "loss": 0.0214, "step": 50420 }, { "epoch": 0.25, "learning_rate": 0.0002618361241303459, "loss": 0.0183, "step": 50430 }, { "epoch": 0.25, "learning_rate": 0.0002618285564373319, "loss": 0.0213, "step": 50440 }, { "epoch": 0.25, "learning_rate": 0.00026182098874431793, "loss": 0.0207, "step": 50450 }, { "epoch": 0.25, "learning_rate": 0.0002618134210513039, "loss": 0.019, "step": 50460 }, { "epoch": 0.25, "learning_rate": 0.0002618058533582899, "loss": 0.0195, "step": 50470 }, { "epoch": 0.25, "learning_rate": 0.0002617982856652759, "loss": 0.0182, "step": 50480 }, { "epoch": 0.25, "learning_rate": 0.00026179071797226186, "loss": 0.022, "step": 50490 }, { "epoch": 0.25, "learning_rate": 0.00026178315027924784, "loss": 0.0216, "step": 50500 }, { "epoch": 0.25, "learning_rate": 0.0002617755825862338, "loss": 0.0211, "step": 50510 }, { "epoch": 0.25, "learning_rate": 0.00026176801489321985, "loss": 0.0225, "step": 50520 }, { "epoch": 0.25, "learning_rate": 0.00026176044720020584, "loss": 0.0247, "step": 50530 }, { "epoch": 0.25, "learning_rate": 0.0002617528795071918, "loss": 0.0167, "step": 50540 }, { "epoch": 0.26, "learning_rate": 0.0002617453118141778, "loss": 0.0208, "step": 50550 }, { "epoch": 0.26, "learning_rate": 0.0002617377441211638, "loss": 0.0187, "step": 50560 }, { "epoch": 0.26, "learning_rate": 0.00026173017642814976, "loss": 0.0207, "step": 50570 }, { "epoch": 0.26, "learning_rate": 0.0002617226087351358, "loss": 0.0205, "step": 50580 }, { "epoch": 0.26, "learning_rate": 0.0002617150410421218, "loss": 0.0193, "step": 50590 }, { "epoch": 0.26, "learning_rate": 0.00026170747334910776, "loss": 0.0202, "step": 50600 }, { "epoch": 0.26, "learning_rate": 0.00026169990565609374, "loss": 0.0174, "step": 50610 }, { "epoch": 0.26, "learning_rate": 0.0002616923379630797, "loss": 0.0223, "step": 50620 }, { "epoch": 0.26, "learning_rate": 0.0002616847702700657, "loss": 0.0233, "step": 50630 }, { "epoch": 0.26, "learning_rate": 0.00026167720257705174, "loss": 0.0248, "step": 50640 }, { "epoch": 0.26, "learning_rate": 0.0002616696348840377, "loss": 0.0214, "step": 50650 }, { "epoch": 0.26, "learning_rate": 0.0002616620671910237, "loss": 0.0205, "step": 50660 }, { "epoch": 0.26, "learning_rate": 0.0002616544994980097, "loss": 0.0223, "step": 50670 }, { "epoch": 0.26, "learning_rate": 0.00026164693180499567, "loss": 0.0222, "step": 50680 }, { "epoch": 0.26, "learning_rate": 0.00026163936411198165, "loss": 0.024, "step": 50690 }, { "epoch": 0.26, "learning_rate": 0.00026163179641896763, "loss": 0.0229, "step": 50700 }, { "epoch": 0.26, "learning_rate": 0.00026162422872595366, "loss": 0.022, "step": 50710 }, { "epoch": 0.26, "learning_rate": 0.00026161666103293965, "loss": 0.021, "step": 50720 }, { "epoch": 0.26, "learning_rate": 0.00026160909333992563, "loss": 0.0199, "step": 50730 }, { "epoch": 0.26, "learning_rate": 0.0002616015256469116, "loss": 0.0206, "step": 50740 }, { "epoch": 0.26, "learning_rate": 0.0002615939579538976, "loss": 0.022, "step": 50750 }, { "epoch": 0.26, "learning_rate": 0.00026158639026088357, "loss": 0.0206, "step": 50760 }, { "epoch": 0.26, "learning_rate": 0.0002615788225678696, "loss": 0.0215, "step": 50770 }, { "epoch": 0.26, "learning_rate": 0.0002615712548748556, "loss": 0.0254, "step": 50780 }, { "epoch": 0.26, "learning_rate": 0.00026156368718184157, "loss": 0.021, "step": 50790 }, { "epoch": 0.26, "learning_rate": 0.00026155611948882755, "loss": 0.0202, "step": 50800 }, { "epoch": 0.26, "learning_rate": 0.00026154855179581353, "loss": 0.0216, "step": 50810 }, { "epoch": 0.26, "learning_rate": 0.0002615409841027995, "loss": 0.0244, "step": 50820 }, { "epoch": 0.26, "learning_rate": 0.00026153341640978555, "loss": 0.0193, "step": 50830 }, { "epoch": 0.26, "learning_rate": 0.00026152584871677153, "loss": 0.0197, "step": 50840 }, { "epoch": 0.26, "learning_rate": 0.0002615182810237575, "loss": 0.0207, "step": 50850 }, { "epoch": 0.26, "learning_rate": 0.0002615107133307435, "loss": 0.021, "step": 50860 }, { "epoch": 0.26, "learning_rate": 0.0002615031456377295, "loss": 0.023, "step": 50870 }, { "epoch": 0.26, "learning_rate": 0.00026149557794471546, "loss": 0.0209, "step": 50880 }, { "epoch": 0.26, "learning_rate": 0.00026148801025170144, "loss": 0.022, "step": 50890 }, { "epoch": 0.26, "learning_rate": 0.0002614804425586875, "loss": 0.0198, "step": 50900 }, { "epoch": 0.26, "learning_rate": 0.0002614728748656734, "loss": 0.0215, "step": 50910 }, { "epoch": 0.26, "learning_rate": 0.0002614653071726594, "loss": 0.023, "step": 50920 }, { "epoch": 0.26, "learning_rate": 0.00026145773947964536, "loss": 0.0217, "step": 50930 }, { "epoch": 0.26, "learning_rate": 0.0002614501717866314, "loss": 0.0229, "step": 50940 }, { "epoch": 0.26, "learning_rate": 0.0002614426040936174, "loss": 0.0212, "step": 50950 }, { "epoch": 0.26, "learning_rate": 0.00026143503640060336, "loss": 0.018, "step": 50960 }, { "epoch": 0.26, "learning_rate": 0.00026142746870758934, "loss": 0.0183, "step": 50970 }, { "epoch": 0.26, "learning_rate": 0.0002614199010145753, "loss": 0.018, "step": 50980 }, { "epoch": 0.26, "learning_rate": 0.0002614123333215613, "loss": 0.0205, "step": 50990 }, { "epoch": 0.26, "learning_rate": 0.00026140476562854734, "loss": 0.022, "step": 51000 }, { "epoch": 0.26, "eval_cer": 0.9144770486760401, "eval_loss": 0.01605140045285225, "eval_runtime": 117.035, "eval_samples_per_second": 17.089, "eval_steps_per_second": 4.272, "step": 51000 }, { "epoch": 0.26, "learning_rate": 0.0002613971979355333, "loss": 0.019, "step": 51010 }, { "epoch": 0.26, "learning_rate": 0.0002613896302425193, "loss": 0.0237, "step": 51020 }, { "epoch": 0.26, "learning_rate": 0.0002613820625495053, "loss": 0.0232, "step": 51030 }, { "epoch": 0.26, "learning_rate": 0.00026137449485649127, "loss": 0.0221, "step": 51040 }, { "epoch": 0.26, "learning_rate": 0.00026136692716347725, "loss": 0.017, "step": 51050 }, { "epoch": 0.26, "learning_rate": 0.00026135935947046323, "loss": 0.0204, "step": 51060 }, { "epoch": 0.26, "learning_rate": 0.00026135179177744927, "loss": 0.02, "step": 51070 }, { "epoch": 0.26, "learning_rate": 0.00026134422408443525, "loss": 0.0178, "step": 51080 }, { "epoch": 0.26, "learning_rate": 0.00026133665639142123, "loss": 0.0212, "step": 51090 }, { "epoch": 0.26, "learning_rate": 0.0002613290886984072, "loss": 0.0243, "step": 51100 }, { "epoch": 0.26, "learning_rate": 0.0002613215210053932, "loss": 0.0243, "step": 51110 }, { "epoch": 0.26, "learning_rate": 0.0002613139533123792, "loss": 0.0238, "step": 51120 }, { "epoch": 0.26, "learning_rate": 0.0002613063856193652, "loss": 0.0265, "step": 51130 }, { "epoch": 0.26, "learning_rate": 0.0002612988179263512, "loss": 0.0194, "step": 51140 }, { "epoch": 0.26, "learning_rate": 0.0002612912502333372, "loss": 0.0224, "step": 51150 }, { "epoch": 0.26, "learning_rate": 0.00026128368254032315, "loss": 0.0209, "step": 51160 }, { "epoch": 0.26, "learning_rate": 0.00026127611484730914, "loss": 0.0192, "step": 51170 }, { "epoch": 0.26, "learning_rate": 0.0002612685471542951, "loss": 0.0194, "step": 51180 }, { "epoch": 0.26, "learning_rate": 0.00026126097946128115, "loss": 0.023, "step": 51190 }, { "epoch": 0.26, "learning_rate": 0.00026125341176826713, "loss": 0.0234, "step": 51200 }, { "epoch": 0.26, "learning_rate": 0.0002612458440752531, "loss": 0.0201, "step": 51210 }, { "epoch": 0.26, "learning_rate": 0.0002612382763822391, "loss": 0.0248, "step": 51220 }, { "epoch": 0.26, "learning_rate": 0.0002612307086892251, "loss": 0.0214, "step": 51230 }, { "epoch": 0.26, "learning_rate": 0.00026122314099621106, "loss": 0.0203, "step": 51240 }, { "epoch": 0.26, "learning_rate": 0.00026121557330319704, "loss": 0.0187, "step": 51250 }, { "epoch": 0.26, "learning_rate": 0.0002612080056101831, "loss": 0.0227, "step": 51260 }, { "epoch": 0.26, "learning_rate": 0.00026120043791716906, "loss": 0.0194, "step": 51270 }, { "epoch": 0.26, "learning_rate": 0.00026119287022415504, "loss": 0.0226, "step": 51280 }, { "epoch": 0.26, "learning_rate": 0.000261185302531141, "loss": 0.0201, "step": 51290 }, { "epoch": 0.26, "learning_rate": 0.000261177734838127, "loss": 0.0182, "step": 51300 }, { "epoch": 0.26, "learning_rate": 0.000261170167145113, "loss": 0.0282, "step": 51310 }, { "epoch": 0.26, "learning_rate": 0.000261162599452099, "loss": 0.0208, "step": 51320 }, { "epoch": 0.26, "learning_rate": 0.000261155031759085, "loss": 0.0216, "step": 51330 }, { "epoch": 0.26, "learning_rate": 0.000261147464066071, "loss": 0.0241, "step": 51340 }, { "epoch": 0.26, "learning_rate": 0.00026113989637305696, "loss": 0.0197, "step": 51350 }, { "epoch": 0.26, "learning_rate": 0.00026113232868004295, "loss": 0.0178, "step": 51360 }, { "epoch": 0.26, "learning_rate": 0.00026112476098702893, "loss": 0.0197, "step": 51370 }, { "epoch": 0.26, "learning_rate": 0.00026111719329401496, "loss": 0.0244, "step": 51380 }, { "epoch": 0.26, "learning_rate": 0.00026110962560100094, "loss": 0.0223, "step": 51390 }, { "epoch": 0.26, "learning_rate": 0.0002611020579079869, "loss": 0.0218, "step": 51400 }, { "epoch": 0.26, "learning_rate": 0.0002610944902149729, "loss": 0.0206, "step": 51410 }, { "epoch": 0.26, "learning_rate": 0.0002610869225219589, "loss": 0.0204, "step": 51420 }, { "epoch": 0.26, "learning_rate": 0.00026107935482894487, "loss": 0.0269, "step": 51430 }, { "epoch": 0.26, "learning_rate": 0.00026107178713593085, "loss": 0.0278, "step": 51440 }, { "epoch": 0.26, "learning_rate": 0.0002610642194429169, "loss": 0.0228, "step": 51450 }, { "epoch": 0.26, "learning_rate": 0.00026105665174990287, "loss": 0.0213, "step": 51460 }, { "epoch": 0.26, "learning_rate": 0.00026104908405688885, "loss": 0.0199, "step": 51470 }, { "epoch": 0.26, "learning_rate": 0.00026104151636387483, "loss": 0.0218, "step": 51480 }, { "epoch": 0.26, "learning_rate": 0.0002610339486708608, "loss": 0.0202, "step": 51490 }, { "epoch": 0.26, "learning_rate": 0.0002610263809778468, "loss": 0.0209, "step": 51500 }, { "epoch": 0.26, "learning_rate": 0.00026101881328483283, "loss": 0.0213, "step": 51510 }, { "epoch": 0.26, "learning_rate": 0.0002610112455918188, "loss": 0.0222, "step": 51520 }, { "epoch": 0.26, "learning_rate": 0.0002610036778988048, "loss": 0.0191, "step": 51530 }, { "epoch": 0.26, "learning_rate": 0.0002609961102057908, "loss": 0.0196, "step": 51540 }, { "epoch": 0.26, "learning_rate": 0.00026098854251277676, "loss": 0.0214, "step": 51550 }, { "epoch": 0.26, "learning_rate": 0.00026098097481976274, "loss": 0.016, "step": 51560 }, { "epoch": 0.26, "learning_rate": 0.0002609734071267487, "loss": 0.0207, "step": 51570 }, { "epoch": 0.26, "learning_rate": 0.00026096583943373475, "loss": 0.0242, "step": 51580 }, { "epoch": 0.26, "learning_rate": 0.00026095827174072074, "loss": 0.018, "step": 51590 }, { "epoch": 0.26, "learning_rate": 0.0002609507040477067, "loss": 0.0201, "step": 51600 }, { "epoch": 0.26, "learning_rate": 0.0002609431363546927, "loss": 0.0232, "step": 51610 }, { "epoch": 0.26, "learning_rate": 0.0002609355686616787, "loss": 0.0234, "step": 51620 }, { "epoch": 0.26, "learning_rate": 0.00026092800096866466, "loss": 0.0198, "step": 51630 }, { "epoch": 0.26, "learning_rate": 0.0002609204332756507, "loss": 0.0238, "step": 51640 }, { "epoch": 0.26, "learning_rate": 0.0002609128655826367, "loss": 0.0186, "step": 51650 }, { "epoch": 0.26, "learning_rate": 0.00026090529788962266, "loss": 0.019, "step": 51660 }, { "epoch": 0.26, "learning_rate": 0.00026089773019660864, "loss": 0.0186, "step": 51670 }, { "epoch": 0.26, "learning_rate": 0.0002608901625035946, "loss": 0.0225, "step": 51680 }, { "epoch": 0.26, "learning_rate": 0.0002608825948105806, "loss": 0.0175, "step": 51690 }, { "epoch": 0.26, "learning_rate": 0.00026087502711756664, "loss": 0.0212, "step": 51700 }, { "epoch": 0.26, "learning_rate": 0.0002608674594245526, "loss": 0.0241, "step": 51710 }, { "epoch": 0.26, "learning_rate": 0.0002608598917315386, "loss": 0.0191, "step": 51720 }, { "epoch": 0.26, "learning_rate": 0.0002608523240385246, "loss": 0.0188, "step": 51730 }, { "epoch": 0.26, "learning_rate": 0.00026084475634551057, "loss": 0.0208, "step": 51740 }, { "epoch": 0.26, "learning_rate": 0.00026083718865249655, "loss": 0.0202, "step": 51750 }, { "epoch": 0.26, "learning_rate": 0.00026082962095948253, "loss": 0.0199, "step": 51760 }, { "epoch": 0.26, "learning_rate": 0.00026082205326646856, "loss": 0.0393, "step": 51770 }, { "epoch": 0.26, "learning_rate": 0.00026081448557345455, "loss": 0.0419, "step": 51780 }, { "epoch": 0.26, "learning_rate": 0.00026080691788044053, "loss": 0.0159, "step": 51790 }, { "epoch": 0.26, "learning_rate": 0.0002607993501874265, "loss": 0.0194, "step": 51800 }, { "epoch": 0.26, "learning_rate": 0.0002607917824944125, "loss": 0.0199, "step": 51810 }, { "epoch": 0.26, "learning_rate": 0.00026078421480139847, "loss": 0.0203, "step": 51820 }, { "epoch": 0.26, "learning_rate": 0.0002607766471083845, "loss": 0.0208, "step": 51830 }, { "epoch": 0.26, "learning_rate": 0.0002607690794153705, "loss": 0.0246, "step": 51840 }, { "epoch": 0.26, "learning_rate": 0.00026076151172235647, "loss": 0.0209, "step": 51850 }, { "epoch": 0.26, "learning_rate": 0.00026075394402934245, "loss": 0.0238, "step": 51860 }, { "epoch": 0.26, "learning_rate": 0.00026074637633632843, "loss": 0.0219, "step": 51870 }, { "epoch": 0.26, "learning_rate": 0.0002607388086433144, "loss": 0.0247, "step": 51880 }, { "epoch": 0.26, "learning_rate": 0.00026073124095030045, "loss": 0.0211, "step": 51890 }, { "epoch": 0.26, "learning_rate": 0.00026072367325728643, "loss": 0.0167, "step": 51900 }, { "epoch": 0.26, "learning_rate": 0.0002607161055642724, "loss": 0.0237, "step": 51910 }, { "epoch": 0.26, "learning_rate": 0.0002607085378712584, "loss": 0.0207, "step": 51920 }, { "epoch": 0.26, "learning_rate": 0.0002607009701782444, "loss": 0.0234, "step": 51930 }, { "epoch": 0.26, "learning_rate": 0.00026069340248523036, "loss": 0.0232, "step": 51940 }, { "epoch": 0.26, "learning_rate": 0.00026068583479221634, "loss": 0.0213, "step": 51950 }, { "epoch": 0.26, "learning_rate": 0.0002606782670992024, "loss": 0.0221, "step": 51960 }, { "epoch": 0.26, "learning_rate": 0.00026067069940618836, "loss": 0.0236, "step": 51970 }, { "epoch": 0.26, "learning_rate": 0.00026066313171317434, "loss": 0.0219, "step": 51980 }, { "epoch": 0.26, "learning_rate": 0.0002606555640201603, "loss": 0.0223, "step": 51990 }, { "epoch": 0.26, "learning_rate": 0.0002606479963271463, "loss": 0.0231, "step": 52000 }, { "epoch": 0.26, "eval_cer": 0.9145013085791751, "eval_loss": 0.015823883935809135, "eval_runtime": 116.6377, "eval_samples_per_second": 17.147, "eval_steps_per_second": 4.287, "step": 52000 }, { "epoch": 0.26, "learning_rate": 0.0002606404286341323, "loss": 0.0225, "step": 52010 }, { "epoch": 0.26, "learning_rate": 0.0002606328609411183, "loss": 0.0197, "step": 52020 }, { "epoch": 0.26, "learning_rate": 0.0002606252932481043, "loss": 0.0207, "step": 52030 }, { "epoch": 0.26, "learning_rate": 0.0002606177255550903, "loss": 0.0181, "step": 52040 }, { "epoch": 0.26, "learning_rate": 0.00026061015786207626, "loss": 0.0194, "step": 52050 }, { "epoch": 0.26, "learning_rate": 0.00026060259016906224, "loss": 0.0248, "step": 52060 }, { "epoch": 0.26, "learning_rate": 0.0002605950224760482, "loss": 0.0233, "step": 52070 }, { "epoch": 0.26, "learning_rate": 0.0002605874547830342, "loss": 0.0234, "step": 52080 }, { "epoch": 0.26, "learning_rate": 0.00026057988709002024, "loss": 0.0198, "step": 52090 }, { "epoch": 0.26, "learning_rate": 0.0002605723193970062, "loss": 0.0197, "step": 52100 }, { "epoch": 0.26, "learning_rate": 0.0002605647517039922, "loss": 0.0186, "step": 52110 }, { "epoch": 0.26, "learning_rate": 0.0002605571840109782, "loss": 0.0216, "step": 52120 }, { "epoch": 0.26, "learning_rate": 0.00026054961631796417, "loss": 0.0231, "step": 52130 }, { "epoch": 0.26, "learning_rate": 0.00026054204862495015, "loss": 0.0219, "step": 52140 }, { "epoch": 0.26, "learning_rate": 0.0002605344809319362, "loss": 0.0209, "step": 52150 }, { "epoch": 0.26, "learning_rate": 0.00026052691323892217, "loss": 0.0191, "step": 52160 }, { "epoch": 0.26, "learning_rate": 0.0002605193455459081, "loss": 0.0205, "step": 52170 }, { "epoch": 0.26, "learning_rate": 0.0002605117778528941, "loss": 0.0268, "step": 52180 }, { "epoch": 0.26, "learning_rate": 0.0002605042101598801, "loss": 0.019, "step": 52190 }, { "epoch": 0.26, "learning_rate": 0.0002604966424668661, "loss": 0.0191, "step": 52200 }, { "epoch": 0.26, "learning_rate": 0.0002604890747738521, "loss": 0.0197, "step": 52210 }, { "epoch": 0.26, "learning_rate": 0.00026048150708083806, "loss": 0.0232, "step": 52220 }, { "epoch": 0.26, "learning_rate": 0.00026047393938782404, "loss": 0.0213, "step": 52230 }, { "epoch": 0.26, "learning_rate": 0.00026046637169481, "loss": 0.0238, "step": 52240 }, { "epoch": 0.26, "learning_rate": 0.00026045880400179605, "loss": 0.0203, "step": 52250 }, { "epoch": 0.26, "learning_rate": 0.00026045123630878204, "loss": 0.0217, "step": 52260 }, { "epoch": 0.26, "learning_rate": 0.000260443668615768, "loss": 0.024, "step": 52270 }, { "epoch": 0.26, "learning_rate": 0.000260436100922754, "loss": 0.019, "step": 52280 }, { "epoch": 0.26, "learning_rate": 0.00026042853322974, "loss": 0.0183, "step": 52290 }, { "epoch": 0.26, "learning_rate": 0.00026042096553672596, "loss": 0.0207, "step": 52300 }, { "epoch": 0.26, "learning_rate": 0.00026041339784371194, "loss": 0.0191, "step": 52310 }, { "epoch": 0.26, "learning_rate": 0.000260405830150698, "loss": 0.0196, "step": 52320 }, { "epoch": 0.26, "learning_rate": 0.00026039826245768396, "loss": 0.0229, "step": 52330 }, { "epoch": 0.26, "learning_rate": 0.00026039069476466994, "loss": 0.02, "step": 52340 }, { "epoch": 0.26, "learning_rate": 0.0002603831270716559, "loss": 0.0205, "step": 52350 }, { "epoch": 0.26, "learning_rate": 0.0002603755593786419, "loss": 0.0192, "step": 52360 }, { "epoch": 0.26, "learning_rate": 0.0002603679916856279, "loss": 0.02, "step": 52370 }, { "epoch": 0.26, "learning_rate": 0.0002603604239926139, "loss": 0.0292, "step": 52380 }, { "epoch": 0.26, "learning_rate": 0.0002603528562995999, "loss": 0.0183, "step": 52390 }, { "epoch": 0.26, "learning_rate": 0.0002603452886065859, "loss": 0.0249, "step": 52400 }, { "epoch": 0.26, "learning_rate": 0.00026033772091357187, "loss": 0.0192, "step": 52410 }, { "epoch": 0.26, "learning_rate": 0.00026033015322055785, "loss": 0.0211, "step": 52420 }, { "epoch": 0.26, "learning_rate": 0.00026032258552754383, "loss": 0.0222, "step": 52430 }, { "epoch": 0.26, "learning_rate": 0.00026031501783452986, "loss": 0.0232, "step": 52440 }, { "epoch": 0.26, "learning_rate": 0.00026030745014151585, "loss": 0.0258, "step": 52450 }, { "epoch": 0.26, "learning_rate": 0.0002602998824485018, "loss": 0.021, "step": 52460 }, { "epoch": 0.26, "learning_rate": 0.0002602923147554878, "loss": 0.0185, "step": 52470 }, { "epoch": 0.26, "learning_rate": 0.0002602847470624738, "loss": 0.0182, "step": 52480 }, { "epoch": 0.26, "learning_rate": 0.00026027717936945977, "loss": 0.0181, "step": 52490 }, { "epoch": 0.26, "learning_rate": 0.00026026961167644575, "loss": 0.0193, "step": 52500 }, { "epoch": 0.26, "learning_rate": 0.0002602620439834318, "loss": 0.0241, "step": 52510 }, { "epoch": 0.26, "learning_rate": 0.00026025447629041777, "loss": 0.0183, "step": 52520 }, { "epoch": 0.27, "learning_rate": 0.00026024690859740375, "loss": 0.0205, "step": 52530 }, { "epoch": 0.27, "learning_rate": 0.00026023934090438973, "loss": 0.0189, "step": 52540 }, { "epoch": 0.27, "learning_rate": 0.0002602317732113757, "loss": 0.0187, "step": 52550 }, { "epoch": 0.27, "learning_rate": 0.0002602242055183617, "loss": 0.0214, "step": 52560 }, { "epoch": 0.27, "learning_rate": 0.00026021663782534773, "loss": 0.0204, "step": 52570 }, { "epoch": 0.27, "learning_rate": 0.0002602090701323337, "loss": 0.0226, "step": 52580 }, { "epoch": 0.27, "learning_rate": 0.0002602015024393197, "loss": 0.0285, "step": 52590 }, { "epoch": 0.27, "learning_rate": 0.0002601939347463057, "loss": 0.0269, "step": 52600 }, { "epoch": 0.27, "learning_rate": 0.00026018636705329166, "loss": 0.0216, "step": 52610 }, { "epoch": 0.27, "learning_rate": 0.00026017879936027764, "loss": 0.021, "step": 52620 }, { "epoch": 0.27, "learning_rate": 0.0002601712316672636, "loss": 0.0208, "step": 52630 }, { "epoch": 0.27, "learning_rate": 0.00026016366397424966, "loss": 0.0242, "step": 52640 }, { "epoch": 0.27, "learning_rate": 0.00026015609628123564, "loss": 0.0206, "step": 52650 }, { "epoch": 0.27, "learning_rate": 0.0002601485285882216, "loss": 0.0181, "step": 52660 }, { "epoch": 0.27, "learning_rate": 0.0002601409608952076, "loss": 0.0177, "step": 52670 }, { "epoch": 0.27, "learning_rate": 0.0002601333932021936, "loss": 0.0231, "step": 52680 }, { "epoch": 0.27, "learning_rate": 0.00026012582550917956, "loss": 0.0209, "step": 52690 }, { "epoch": 0.27, "learning_rate": 0.0002601182578161656, "loss": 0.0232, "step": 52700 }, { "epoch": 0.27, "learning_rate": 0.0002601106901231516, "loss": 0.0216, "step": 52710 }, { "epoch": 0.27, "learning_rate": 0.00026010312243013756, "loss": 0.0172, "step": 52720 }, { "epoch": 0.27, "learning_rate": 0.00026009555473712354, "loss": 0.0181, "step": 52730 }, { "epoch": 0.27, "learning_rate": 0.0002600879870441095, "loss": 0.0199, "step": 52740 }, { "epoch": 0.27, "learning_rate": 0.0002600804193510955, "loss": 0.0209, "step": 52750 }, { "epoch": 0.27, "learning_rate": 0.00026007285165808154, "loss": 0.0196, "step": 52760 }, { "epoch": 0.27, "learning_rate": 0.0002600652839650675, "loss": 0.0218, "step": 52770 }, { "epoch": 0.27, "learning_rate": 0.0002600577162720535, "loss": 0.0219, "step": 52780 }, { "epoch": 0.27, "learning_rate": 0.0002600501485790395, "loss": 0.0209, "step": 52790 }, { "epoch": 0.27, "learning_rate": 0.00026004258088602547, "loss": 0.0178, "step": 52800 }, { "epoch": 0.27, "learning_rate": 0.00026003501319301145, "loss": 0.0203, "step": 52810 }, { "epoch": 0.27, "learning_rate": 0.00026002744549999743, "loss": 0.0229, "step": 52820 }, { "epoch": 0.27, "learning_rate": 0.00026001987780698347, "loss": 0.0202, "step": 52830 }, { "epoch": 0.27, "learning_rate": 0.00026001231011396945, "loss": 0.0215, "step": 52840 }, { "epoch": 0.27, "learning_rate": 0.00026000474242095543, "loss": 0.019, "step": 52850 }, { "epoch": 0.27, "learning_rate": 0.0002599971747279414, "loss": 0.0201, "step": 52860 }, { "epoch": 0.27, "learning_rate": 0.0002599896070349274, "loss": 0.0209, "step": 52870 }, { "epoch": 0.27, "learning_rate": 0.00025998203934191337, "loss": 0.0205, "step": 52880 }, { "epoch": 0.27, "learning_rate": 0.0002599744716488994, "loss": 0.023, "step": 52890 }, { "epoch": 0.27, "learning_rate": 0.0002599669039558854, "loss": 0.02, "step": 52900 }, { "epoch": 0.27, "learning_rate": 0.00025995933626287137, "loss": 0.0205, "step": 52910 }, { "epoch": 0.27, "learning_rate": 0.00025995176856985735, "loss": 0.0192, "step": 52920 }, { "epoch": 0.27, "learning_rate": 0.00025994420087684333, "loss": 0.022, "step": 52930 }, { "epoch": 0.27, "learning_rate": 0.0002599366331838293, "loss": 0.0226, "step": 52940 }, { "epoch": 0.27, "learning_rate": 0.00025992906549081535, "loss": 0.0185, "step": 52950 }, { "epoch": 0.27, "learning_rate": 0.00025992149779780133, "loss": 0.0218, "step": 52960 }, { "epoch": 0.27, "learning_rate": 0.0002599139301047873, "loss": 0.0222, "step": 52970 }, { "epoch": 0.27, "learning_rate": 0.0002599063624117733, "loss": 0.0201, "step": 52980 }, { "epoch": 0.27, "learning_rate": 0.0002598987947187593, "loss": 0.0221, "step": 52990 }, { "epoch": 0.27, "learning_rate": 0.00025989122702574526, "loss": 0.0175, "step": 53000 }, { "epoch": 0.27, "eval_cer": 0.9145139237288054, "eval_loss": 0.015266528353095055, "eval_runtime": 115.681, "eval_samples_per_second": 17.289, "eval_steps_per_second": 4.322, "step": 53000 }, { "epoch": 0.27, "learning_rate": 0.00025988365933273124, "loss": 0.0195, "step": 53010 }, { "epoch": 0.27, "learning_rate": 0.0002598760916397173, "loss": 0.0184, "step": 53020 }, { "epoch": 0.27, "learning_rate": 0.00025986852394670326, "loss": 0.0241, "step": 53030 }, { "epoch": 0.27, "learning_rate": 0.00025986095625368924, "loss": 0.0221, "step": 53040 }, { "epoch": 0.27, "learning_rate": 0.0002598533885606752, "loss": 0.0205, "step": 53050 }, { "epoch": 0.27, "learning_rate": 0.0002598458208676612, "loss": 0.0233, "step": 53060 }, { "epoch": 0.27, "learning_rate": 0.0002598382531746472, "loss": 0.0203, "step": 53070 }, { "epoch": 0.27, "learning_rate": 0.0002598306854816332, "loss": 0.0199, "step": 53080 }, { "epoch": 0.27, "learning_rate": 0.0002598231177886192, "loss": 0.021, "step": 53090 }, { "epoch": 0.27, "learning_rate": 0.0002598155500956052, "loss": 0.0176, "step": 53100 }, { "epoch": 0.27, "learning_rate": 0.00025980798240259116, "loss": 0.0187, "step": 53110 }, { "epoch": 0.27, "learning_rate": 0.00025980041470957714, "loss": 0.0223, "step": 53120 }, { "epoch": 0.27, "learning_rate": 0.0002597928470165631, "loss": 0.0216, "step": 53130 }, { "epoch": 0.27, "learning_rate": 0.0002597852793235491, "loss": 0.0224, "step": 53140 }, { "epoch": 0.27, "learning_rate": 0.00025977771163053514, "loss": 0.0224, "step": 53150 }, { "epoch": 0.27, "learning_rate": 0.0002597701439375211, "loss": 0.0199, "step": 53160 }, { "epoch": 0.27, "learning_rate": 0.0002597625762445071, "loss": 0.0199, "step": 53170 }, { "epoch": 0.27, "learning_rate": 0.0002597550085514931, "loss": 0.0261, "step": 53180 }, { "epoch": 0.27, "learning_rate": 0.00025974744085847907, "loss": 0.0254, "step": 53190 }, { "epoch": 0.27, "learning_rate": 0.00025973987316546505, "loss": 0.024, "step": 53200 }, { "epoch": 0.27, "learning_rate": 0.0002597323054724511, "loss": 0.0212, "step": 53210 }, { "epoch": 0.27, "learning_rate": 0.00025972473777943707, "loss": 0.0167, "step": 53220 }, { "epoch": 0.27, "learning_rate": 0.00025971717008642305, "loss": 0.0234, "step": 53230 }, { "epoch": 0.27, "learning_rate": 0.00025970960239340903, "loss": 0.0207, "step": 53240 }, { "epoch": 0.27, "learning_rate": 0.000259702034700395, "loss": 0.0243, "step": 53250 }, { "epoch": 0.27, "learning_rate": 0.000259694467007381, "loss": 0.0201, "step": 53260 }, { "epoch": 0.27, "learning_rate": 0.00025968689931436703, "loss": 0.019, "step": 53270 }, { "epoch": 0.27, "learning_rate": 0.000259679331621353, "loss": 0.0231, "step": 53280 }, { "epoch": 0.27, "learning_rate": 0.000259671763928339, "loss": 0.0202, "step": 53290 }, { "epoch": 0.27, "learning_rate": 0.00025966419623532497, "loss": 0.022, "step": 53300 }, { "epoch": 0.27, "learning_rate": 0.00025965662854231095, "loss": 0.021, "step": 53310 }, { "epoch": 0.27, "learning_rate": 0.00025964906084929694, "loss": 0.0198, "step": 53320 }, { "epoch": 0.27, "learning_rate": 0.0002596414931562829, "loss": 0.0193, "step": 53330 }, { "epoch": 0.27, "learning_rate": 0.00025963392546326895, "loss": 0.0194, "step": 53340 }, { "epoch": 0.27, "learning_rate": 0.00025962635777025493, "loss": 0.0188, "step": 53350 }, { "epoch": 0.27, "learning_rate": 0.0002596187900772409, "loss": 0.0222, "step": 53360 }, { "epoch": 0.27, "learning_rate": 0.0002596112223842269, "loss": 0.0222, "step": 53370 }, { "epoch": 0.27, "learning_rate": 0.0002596036546912129, "loss": 0.0183, "step": 53380 }, { "epoch": 0.27, "learning_rate": 0.00025959608699819886, "loss": 0.0209, "step": 53390 }, { "epoch": 0.27, "learning_rate": 0.0002595885193051849, "loss": 0.0216, "step": 53400 }, { "epoch": 0.27, "learning_rate": 0.0002595809516121709, "loss": 0.0195, "step": 53410 }, { "epoch": 0.27, "learning_rate": 0.0002595733839191568, "loss": 0.02, "step": 53420 }, { "epoch": 0.27, "learning_rate": 0.0002595658162261428, "loss": 0.0177, "step": 53430 }, { "epoch": 0.27, "learning_rate": 0.0002595582485331288, "loss": 0.0191, "step": 53440 }, { "epoch": 0.27, "learning_rate": 0.0002595506808401148, "loss": 0.0245, "step": 53450 }, { "epoch": 0.27, "learning_rate": 0.0002595431131471008, "loss": 0.0175, "step": 53460 }, { "epoch": 0.27, "learning_rate": 0.00025953554545408677, "loss": 0.0199, "step": 53470 }, { "epoch": 0.27, "learning_rate": 0.00025952797776107275, "loss": 0.0222, "step": 53480 }, { "epoch": 0.27, "learning_rate": 0.00025952041006805873, "loss": 0.0218, "step": 53490 }, { "epoch": 0.27, "learning_rate": 0.00025951284237504476, "loss": 0.0183, "step": 53500 }, { "epoch": 0.27, "learning_rate": 0.00025950527468203075, "loss": 0.0208, "step": 53510 }, { "epoch": 0.27, "learning_rate": 0.0002594977069890167, "loss": 0.0213, "step": 53520 }, { "epoch": 0.27, "learning_rate": 0.0002594901392960027, "loss": 0.0182, "step": 53530 }, { "epoch": 0.27, "learning_rate": 0.0002594825716029887, "loss": 0.0207, "step": 53540 }, { "epoch": 0.27, "learning_rate": 0.00025947500390997467, "loss": 0.0188, "step": 53550 }, { "epoch": 0.27, "learning_rate": 0.00025946743621696065, "loss": 0.0212, "step": 53560 }, { "epoch": 0.27, "learning_rate": 0.0002594598685239467, "loss": 0.0211, "step": 53570 }, { "epoch": 0.27, "learning_rate": 0.00025945230083093267, "loss": 0.0185, "step": 53580 }, { "epoch": 0.27, "learning_rate": 0.00025944473313791865, "loss": 0.0217, "step": 53590 }, { "epoch": 0.27, "learning_rate": 0.00025943716544490463, "loss": 0.0209, "step": 53600 }, { "epoch": 0.27, "learning_rate": 0.0002594295977518906, "loss": 0.0213, "step": 53610 }, { "epoch": 0.27, "learning_rate": 0.0002594220300588766, "loss": 0.0195, "step": 53620 }, { "epoch": 0.27, "learning_rate": 0.00025941446236586263, "loss": 0.0239, "step": 53630 }, { "epoch": 0.27, "learning_rate": 0.0002594068946728486, "loss": 0.0188, "step": 53640 }, { "epoch": 0.27, "learning_rate": 0.0002593993269798346, "loss": 0.0215, "step": 53650 }, { "epoch": 0.27, "learning_rate": 0.0002593917592868206, "loss": 0.0215, "step": 53660 }, { "epoch": 0.27, "learning_rate": 0.00025938419159380656, "loss": 0.0234, "step": 53670 }, { "epoch": 0.27, "learning_rate": 0.00025937662390079254, "loss": 0.0191, "step": 53680 }, { "epoch": 0.27, "learning_rate": 0.0002593690562077786, "loss": 0.021, "step": 53690 }, { "epoch": 0.27, "learning_rate": 0.00025936148851476456, "loss": 0.0237, "step": 53700 }, { "epoch": 0.27, "learning_rate": 0.00025935392082175054, "loss": 0.0247, "step": 53710 }, { "epoch": 0.27, "learning_rate": 0.0002593463531287365, "loss": 0.0222, "step": 53720 }, { "epoch": 0.27, "learning_rate": 0.0002593387854357225, "loss": 0.025, "step": 53730 }, { "epoch": 0.27, "learning_rate": 0.0002593312177427085, "loss": 0.023, "step": 53740 }, { "epoch": 0.27, "learning_rate": 0.00025932365004969446, "loss": 0.0198, "step": 53750 }, { "epoch": 0.27, "learning_rate": 0.0002593160823566805, "loss": 0.0187, "step": 53760 }, { "epoch": 0.27, "learning_rate": 0.0002593085146636665, "loss": 0.0211, "step": 53770 }, { "epoch": 0.27, "learning_rate": 0.00025930094697065246, "loss": 0.018, "step": 53780 }, { "epoch": 0.27, "learning_rate": 0.00025929337927763844, "loss": 0.0223, "step": 53790 }, { "epoch": 0.27, "learning_rate": 0.0002592858115846244, "loss": 0.0201, "step": 53800 }, { "epoch": 0.27, "learning_rate": 0.0002592782438916104, "loss": 0.0215, "step": 53810 }, { "epoch": 0.27, "learning_rate": 0.00025927067619859644, "loss": 0.0229, "step": 53820 }, { "epoch": 0.27, "learning_rate": 0.0002592631085055824, "loss": 0.02, "step": 53830 }, { "epoch": 0.27, "learning_rate": 0.0002592555408125684, "loss": 0.0187, "step": 53840 }, { "epoch": 0.27, "learning_rate": 0.0002592479731195544, "loss": 0.0186, "step": 53850 }, { "epoch": 0.27, "learning_rate": 0.00025924040542654037, "loss": 0.0216, "step": 53860 }, { "epoch": 0.27, "learning_rate": 0.00025923283773352635, "loss": 0.0201, "step": 53870 }, { "epoch": 0.27, "learning_rate": 0.00025922527004051233, "loss": 0.0207, "step": 53880 }, { "epoch": 0.27, "learning_rate": 0.00025921770234749837, "loss": 0.0211, "step": 53890 }, { "epoch": 0.27, "learning_rate": 0.00025921013465448435, "loss": 0.0197, "step": 53900 }, { "epoch": 0.27, "learning_rate": 0.00025920256696147033, "loss": 0.0213, "step": 53910 }, { "epoch": 0.27, "learning_rate": 0.0002591949992684563, "loss": 0.0166, "step": 53920 }, { "epoch": 0.27, "learning_rate": 0.0002591874315754423, "loss": 0.0223, "step": 53930 }, { "epoch": 0.27, "learning_rate": 0.00025917986388242827, "loss": 0.0161, "step": 53940 }, { "epoch": 0.27, "learning_rate": 0.0002591722961894143, "loss": 0.0202, "step": 53950 }, { "epoch": 0.27, "learning_rate": 0.0002591647284964003, "loss": 0.0214, "step": 53960 }, { "epoch": 0.27, "learning_rate": 0.00025915716080338627, "loss": 0.0167, "step": 53970 }, { "epoch": 0.27, "learning_rate": 0.00025914959311037225, "loss": 0.0202, "step": 53980 }, { "epoch": 0.27, "learning_rate": 0.00025914202541735823, "loss": 0.0219, "step": 53990 }, { "epoch": 0.27, "learning_rate": 0.0002591344577243442, "loss": 0.0209, "step": 54000 }, { "epoch": 0.27, "eval_cer": 0.9144857822411687, "eval_loss": 0.014917539432644844, "eval_runtime": 115.9864, "eval_samples_per_second": 17.243, "eval_steps_per_second": 4.311, "step": 54000 }, { "epoch": 0.27, "learning_rate": 0.00025912689003133025, "loss": 0.0213, "step": 54010 }, { "epoch": 0.27, "learning_rate": 0.00025911932233831623, "loss": 0.0186, "step": 54020 }, { "epoch": 0.27, "learning_rate": 0.0002591117546453022, "loss": 0.0197, "step": 54030 }, { "epoch": 0.27, "learning_rate": 0.0002591041869522882, "loss": 0.0207, "step": 54040 }, { "epoch": 0.27, "learning_rate": 0.0002590966192592742, "loss": 0.0218, "step": 54050 }, { "epoch": 0.27, "learning_rate": 0.00025908905156626016, "loss": 0.022, "step": 54060 }, { "epoch": 0.27, "learning_rate": 0.00025908148387324614, "loss": 0.0279, "step": 54070 }, { "epoch": 0.27, "learning_rate": 0.0002590739161802322, "loss": 0.0219, "step": 54080 }, { "epoch": 0.27, "learning_rate": 0.00025906634848721816, "loss": 0.0769, "step": 54090 }, { "epoch": 0.27, "learning_rate": 0.00025905878079420414, "loss": 0.0249, "step": 54100 }, { "epoch": 0.27, "learning_rate": 0.0002590512131011901, "loss": 0.0208, "step": 54110 }, { "epoch": 0.27, "learning_rate": 0.0002590436454081761, "loss": 0.0231, "step": 54120 }, { "epoch": 0.27, "learning_rate": 0.0002590360777151621, "loss": 0.025, "step": 54130 }, { "epoch": 0.27, "learning_rate": 0.0002590285100221481, "loss": 0.0341, "step": 54140 }, { "epoch": 0.27, "learning_rate": 0.0002590209423291341, "loss": 0.0182, "step": 54150 }, { "epoch": 0.27, "learning_rate": 0.0002590133746361201, "loss": 0.0226, "step": 54160 }, { "epoch": 0.27, "learning_rate": 0.00025900580694310606, "loss": 0.0229, "step": 54170 }, { "epoch": 0.27, "learning_rate": 0.00025899823925009204, "loss": 0.0222, "step": 54180 }, { "epoch": 0.27, "learning_rate": 0.000258990671557078, "loss": 0.0165, "step": 54190 }, { "epoch": 0.27, "learning_rate": 0.00025898310386406406, "loss": 0.0272, "step": 54200 }, { "epoch": 0.27, "learning_rate": 0.00025897553617105004, "loss": 0.0251, "step": 54210 }, { "epoch": 0.27, "learning_rate": 0.000258967968478036, "loss": 0.0219, "step": 54220 }, { "epoch": 0.27, "learning_rate": 0.000258960400785022, "loss": 0.0223, "step": 54230 }, { "epoch": 0.27, "learning_rate": 0.000258952833092008, "loss": 0.0248, "step": 54240 }, { "epoch": 0.27, "learning_rate": 0.00025894526539899397, "loss": 0.0204, "step": 54250 }, { "epoch": 0.27, "learning_rate": 0.00025893769770597995, "loss": 0.0218, "step": 54260 }, { "epoch": 0.27, "learning_rate": 0.000258930130012966, "loss": 0.0197, "step": 54270 }, { "epoch": 0.27, "learning_rate": 0.00025892256231995197, "loss": 0.0206, "step": 54280 }, { "epoch": 0.27, "learning_rate": 0.00025891499462693795, "loss": 0.0197, "step": 54290 }, { "epoch": 0.27, "learning_rate": 0.00025890742693392393, "loss": 0.019, "step": 54300 }, { "epoch": 0.27, "learning_rate": 0.0002588998592409099, "loss": 0.0159, "step": 54310 }, { "epoch": 0.27, "learning_rate": 0.0002588922915478959, "loss": 0.0225, "step": 54320 }, { "epoch": 0.27, "learning_rate": 0.00025888472385488193, "loss": 0.0188, "step": 54330 }, { "epoch": 0.27, "learning_rate": 0.0002588771561618679, "loss": 0.0232, "step": 54340 }, { "epoch": 0.27, "learning_rate": 0.0002588695884688539, "loss": 0.0184, "step": 54350 }, { "epoch": 0.27, "learning_rate": 0.00025886202077583987, "loss": 0.0213, "step": 54360 }, { "epoch": 0.27, "learning_rate": 0.00025885445308282585, "loss": 0.0231, "step": 54370 }, { "epoch": 0.27, "learning_rate": 0.00025884688538981184, "loss": 0.02, "step": 54380 }, { "epoch": 0.27, "learning_rate": 0.0002588393176967978, "loss": 0.022, "step": 54390 }, { "epoch": 0.27, "learning_rate": 0.00025883175000378385, "loss": 0.0253, "step": 54400 }, { "epoch": 0.27, "learning_rate": 0.00025882418231076983, "loss": 0.025, "step": 54410 }, { "epoch": 0.27, "learning_rate": 0.0002588166146177558, "loss": 0.0224, "step": 54420 }, { "epoch": 0.27, "learning_rate": 0.0002588090469247418, "loss": 0.0216, "step": 54430 }, { "epoch": 0.27, "learning_rate": 0.0002588014792317278, "loss": 0.0204, "step": 54440 }, { "epoch": 0.27, "learning_rate": 0.00025879391153871376, "loss": 0.0228, "step": 54450 }, { "epoch": 0.27, "learning_rate": 0.0002587863438456998, "loss": 0.0173, "step": 54460 }, { "epoch": 0.27, "learning_rate": 0.0002587787761526858, "loss": 0.0179, "step": 54470 }, { "epoch": 0.27, "learning_rate": 0.00025877120845967176, "loss": 0.0294, "step": 54480 }, { "epoch": 0.27, "learning_rate": 0.00025876364076665774, "loss": 0.023, "step": 54490 }, { "epoch": 0.27, "learning_rate": 0.0002587560730736437, "loss": 0.0196, "step": 54500 }, { "epoch": 0.28, "learning_rate": 0.0002587485053806297, "loss": 0.0192, "step": 54510 }, { "epoch": 0.28, "learning_rate": 0.00025874093768761574, "loss": 0.0216, "step": 54520 }, { "epoch": 0.28, "learning_rate": 0.0002587333699946017, "loss": 0.0189, "step": 54530 }, { "epoch": 0.28, "learning_rate": 0.0002587258023015877, "loss": 0.022, "step": 54540 }, { "epoch": 0.28, "learning_rate": 0.0002587182346085737, "loss": 0.0242, "step": 54550 }, { "epoch": 0.28, "learning_rate": 0.00025871066691555966, "loss": 0.0205, "step": 54560 }, { "epoch": 0.28, "learning_rate": 0.00025870309922254565, "loss": 0.0198, "step": 54570 }, { "epoch": 0.28, "learning_rate": 0.00025869553152953163, "loss": 0.0218, "step": 54580 }, { "epoch": 0.28, "learning_rate": 0.00025868796383651766, "loss": 0.0232, "step": 54590 }, { "epoch": 0.28, "learning_rate": 0.00025868039614350364, "loss": 0.0253, "step": 54600 }, { "epoch": 0.28, "learning_rate": 0.0002586728284504896, "loss": 0.0187, "step": 54610 }, { "epoch": 0.28, "learning_rate": 0.0002586652607574756, "loss": 0.0187, "step": 54620 }, { "epoch": 0.28, "learning_rate": 0.0002586576930644616, "loss": 0.0231, "step": 54630 }, { "epoch": 0.28, "learning_rate": 0.00025865012537144757, "loss": 0.0232, "step": 54640 }, { "epoch": 0.28, "learning_rate": 0.0002586425576784336, "loss": 0.0191, "step": 54650 }, { "epoch": 0.28, "learning_rate": 0.0002586349899854196, "loss": 0.0203, "step": 54660 }, { "epoch": 0.28, "learning_rate": 0.00025862742229240557, "loss": 0.0224, "step": 54670 }, { "epoch": 0.28, "learning_rate": 0.0002586198545993915, "loss": 0.0187, "step": 54680 }, { "epoch": 0.28, "learning_rate": 0.00025861228690637753, "loss": 0.0215, "step": 54690 }, { "epoch": 0.28, "learning_rate": 0.0002586047192133635, "loss": 0.0227, "step": 54700 }, { "epoch": 0.28, "learning_rate": 0.0002585971515203495, "loss": 0.0164, "step": 54710 }, { "epoch": 0.28, "learning_rate": 0.0002585895838273355, "loss": 0.0203, "step": 54720 }, { "epoch": 0.28, "learning_rate": 0.00025858201613432146, "loss": 0.0224, "step": 54730 }, { "epoch": 0.28, "learning_rate": 0.00025857444844130744, "loss": 0.0213, "step": 54740 }, { "epoch": 0.28, "learning_rate": 0.0002585668807482935, "loss": 0.0192, "step": 54750 }, { "epoch": 0.28, "learning_rate": 0.00025855931305527946, "loss": 0.0183, "step": 54760 }, { "epoch": 0.28, "learning_rate": 0.00025855174536226544, "loss": 0.0232, "step": 54770 }, { "epoch": 0.28, "learning_rate": 0.0002585441776692514, "loss": 0.0258, "step": 54780 }, { "epoch": 0.28, "learning_rate": 0.0002585366099762374, "loss": 0.0201, "step": 54790 }, { "epoch": 0.28, "learning_rate": 0.0002585290422832234, "loss": 0.0201, "step": 54800 }, { "epoch": 0.28, "learning_rate": 0.00025852147459020936, "loss": 0.0246, "step": 54810 }, { "epoch": 0.28, "learning_rate": 0.0002585139068971954, "loss": 0.019, "step": 54820 }, { "epoch": 0.28, "learning_rate": 0.0002585063392041814, "loss": 0.0237, "step": 54830 }, { "epoch": 0.28, "learning_rate": 0.00025849877151116736, "loss": 0.0224, "step": 54840 }, { "epoch": 0.28, "learning_rate": 0.00025849120381815334, "loss": 0.0289, "step": 54850 }, { "epoch": 0.28, "learning_rate": 0.0002584836361251393, "loss": 0.0304, "step": 54860 }, { "epoch": 0.28, "learning_rate": 0.0002584760684321253, "loss": 0.0211, "step": 54870 }, { "epoch": 0.28, "learning_rate": 0.00025846850073911134, "loss": 0.0244, "step": 54880 }, { "epoch": 0.28, "learning_rate": 0.0002584609330460973, "loss": 0.0233, "step": 54890 }, { "epoch": 0.28, "learning_rate": 0.0002584533653530833, "loss": 0.0176, "step": 54900 }, { "epoch": 0.28, "learning_rate": 0.0002584457976600693, "loss": 0.019, "step": 54910 }, { "epoch": 0.28, "learning_rate": 0.00025843822996705527, "loss": 0.0249, "step": 54920 }, { "epoch": 0.28, "learning_rate": 0.00025843066227404125, "loss": 0.0194, "step": 54930 }, { "epoch": 0.28, "learning_rate": 0.00025842309458102723, "loss": 0.0208, "step": 54940 }, { "epoch": 0.28, "learning_rate": 0.00025841552688801327, "loss": 0.0183, "step": 54950 }, { "epoch": 0.28, "learning_rate": 0.00025840795919499925, "loss": 0.0209, "step": 54960 }, { "epoch": 0.28, "learning_rate": 0.00025840039150198523, "loss": 0.0214, "step": 54970 }, { "epoch": 0.28, "learning_rate": 0.0002583928238089712, "loss": 0.0222, "step": 54980 }, { "epoch": 0.28, "learning_rate": 0.0002583852561159572, "loss": 0.0208, "step": 54990 }, { "epoch": 0.28, "learning_rate": 0.0002583776884229432, "loss": 0.0218, "step": 55000 }, { "epoch": 0.28, "eval_cer": 0.914472196695413, "eval_loss": 0.014595328830182552, "eval_runtime": 116.9041, "eval_samples_per_second": 17.108, "eval_steps_per_second": 4.277, "step": 55000 }, { "epoch": 0.28, "learning_rate": 0.0002583701207299292, "loss": 0.019, "step": 55010 }, { "epoch": 0.28, "learning_rate": 0.0002583625530369152, "loss": 0.0263, "step": 55020 }, { "epoch": 0.28, "learning_rate": 0.00025835498534390117, "loss": 0.0244, "step": 55030 }, { "epoch": 0.28, "learning_rate": 0.00025834741765088715, "loss": 0.0189, "step": 55040 }, { "epoch": 0.28, "learning_rate": 0.00025833984995787313, "loss": 0.0207, "step": 55050 }, { "epoch": 0.28, "learning_rate": 0.0002583322822648591, "loss": 0.0205, "step": 55060 }, { "epoch": 0.28, "learning_rate": 0.00025832471457184515, "loss": 0.0225, "step": 55070 }, { "epoch": 0.28, "learning_rate": 0.00025831714687883113, "loss": 0.0212, "step": 55080 }, { "epoch": 0.28, "learning_rate": 0.0002583095791858171, "loss": 0.0208, "step": 55090 }, { "epoch": 0.28, "learning_rate": 0.0002583020114928031, "loss": 0.0224, "step": 55100 }, { "epoch": 0.28, "learning_rate": 0.0002582944437997891, "loss": 0.0239, "step": 55110 }, { "epoch": 0.28, "learning_rate": 0.00025828687610677506, "loss": 0.0173, "step": 55120 }, { "epoch": 0.28, "learning_rate": 0.00025827930841376104, "loss": 0.0308, "step": 55130 }, { "epoch": 0.28, "learning_rate": 0.0002582717407207471, "loss": 0.0244, "step": 55140 }, { "epoch": 0.28, "learning_rate": 0.00025826417302773306, "loss": 0.0239, "step": 55150 }, { "epoch": 0.28, "learning_rate": 0.00025825660533471904, "loss": 0.025, "step": 55160 }, { "epoch": 0.28, "learning_rate": 0.000258249037641705, "loss": 0.0309, "step": 55170 }, { "epoch": 0.28, "learning_rate": 0.000258241469948691, "loss": 0.024, "step": 55180 }, { "epoch": 0.28, "learning_rate": 0.000258233902255677, "loss": 0.0204, "step": 55190 }, { "epoch": 0.28, "learning_rate": 0.000258226334562663, "loss": 0.0193, "step": 55200 }, { "epoch": 0.28, "learning_rate": 0.000258218766869649, "loss": 0.0225, "step": 55210 }, { "epoch": 0.28, "learning_rate": 0.000258211199176635, "loss": 0.02, "step": 55220 }, { "epoch": 0.28, "learning_rate": 0.00025820363148362096, "loss": 0.0266, "step": 55230 }, { "epoch": 0.28, "learning_rate": 0.00025819606379060694, "loss": 0.0234, "step": 55240 }, { "epoch": 0.28, "learning_rate": 0.0002581884960975929, "loss": 0.0198, "step": 55250 }, { "epoch": 0.28, "learning_rate": 0.00025818092840457896, "loss": 0.0241, "step": 55260 }, { "epoch": 0.28, "learning_rate": 0.00025817336071156494, "loss": 0.0204, "step": 55270 }, { "epoch": 0.28, "learning_rate": 0.0002581657930185509, "loss": 0.0225, "step": 55280 }, { "epoch": 0.28, "learning_rate": 0.0002581582253255369, "loss": 0.0206, "step": 55290 }, { "epoch": 0.28, "learning_rate": 0.0002581506576325229, "loss": 0.0208, "step": 55300 }, { "epoch": 0.28, "learning_rate": 0.00025814308993950887, "loss": 0.0211, "step": 55310 }, { "epoch": 0.28, "learning_rate": 0.00025813552224649485, "loss": 0.0247, "step": 55320 }, { "epoch": 0.28, "learning_rate": 0.0002581279545534809, "loss": 0.0197, "step": 55330 }, { "epoch": 0.28, "learning_rate": 0.00025812038686046687, "loss": 0.0199, "step": 55340 }, { "epoch": 0.28, "learning_rate": 0.00025811281916745285, "loss": 0.0182, "step": 55350 }, { "epoch": 0.28, "learning_rate": 0.00025810525147443883, "loss": 0.0203, "step": 55360 }, { "epoch": 0.28, "learning_rate": 0.0002580976837814248, "loss": 0.018, "step": 55370 }, { "epoch": 0.28, "learning_rate": 0.0002580901160884108, "loss": 0.0194, "step": 55380 }, { "epoch": 0.28, "learning_rate": 0.00025808254839539683, "loss": 0.0196, "step": 55390 }, { "epoch": 0.28, "learning_rate": 0.0002580749807023828, "loss": 0.0212, "step": 55400 }, { "epoch": 0.28, "learning_rate": 0.0002580674130093688, "loss": 0.025, "step": 55410 }, { "epoch": 0.28, "learning_rate": 0.0002580598453163548, "loss": 0.0202, "step": 55420 }, { "epoch": 0.28, "learning_rate": 0.00025805227762334075, "loss": 0.0212, "step": 55430 }, { "epoch": 0.28, "learning_rate": 0.00025804470993032674, "loss": 0.0207, "step": 55440 }, { "epoch": 0.28, "learning_rate": 0.0002580371422373127, "loss": 0.0199, "step": 55450 }, { "epoch": 0.28, "learning_rate": 0.00025802957454429875, "loss": 0.0186, "step": 55460 }, { "epoch": 0.28, "learning_rate": 0.00025802200685128473, "loss": 0.0188, "step": 55470 }, { "epoch": 0.28, "learning_rate": 0.0002580144391582707, "loss": 0.0219, "step": 55480 }, { "epoch": 0.28, "learning_rate": 0.0002580068714652567, "loss": 0.0261, "step": 55490 }, { "epoch": 0.28, "learning_rate": 0.0002579993037722427, "loss": 0.0177, "step": 55500 }, { "epoch": 0.28, "learning_rate": 0.00025799173607922866, "loss": 0.0188, "step": 55510 }, { "epoch": 0.28, "learning_rate": 0.0002579841683862147, "loss": 0.0184, "step": 55520 }, { "epoch": 0.28, "learning_rate": 0.0002579766006932007, "loss": 0.021, "step": 55530 }, { "epoch": 0.28, "learning_rate": 0.00025796903300018666, "loss": 0.0221, "step": 55540 }, { "epoch": 0.28, "learning_rate": 0.00025796146530717264, "loss": 0.0187, "step": 55550 }, { "epoch": 0.28, "learning_rate": 0.0002579538976141586, "loss": 0.0187, "step": 55560 }, { "epoch": 0.28, "learning_rate": 0.0002579463299211446, "loss": 0.0199, "step": 55570 }, { "epoch": 0.28, "learning_rate": 0.00025793876222813064, "loss": 0.0181, "step": 55580 }, { "epoch": 0.28, "learning_rate": 0.0002579311945351166, "loss": 0.0181, "step": 55590 }, { "epoch": 0.28, "learning_rate": 0.0002579236268421026, "loss": 0.0198, "step": 55600 }, { "epoch": 0.28, "learning_rate": 0.0002579160591490886, "loss": 0.0223, "step": 55610 }, { "epoch": 0.28, "learning_rate": 0.00025790849145607456, "loss": 0.0208, "step": 55620 }, { "epoch": 0.28, "learning_rate": 0.00025790092376306055, "loss": 0.0192, "step": 55630 }, { "epoch": 0.28, "learning_rate": 0.00025789335607004653, "loss": 0.0182, "step": 55640 }, { "epoch": 0.28, "learning_rate": 0.00025788578837703256, "loss": 0.0224, "step": 55650 }, { "epoch": 0.28, "learning_rate": 0.00025787822068401854, "loss": 0.0204, "step": 55660 }, { "epoch": 0.28, "learning_rate": 0.0002578706529910045, "loss": 0.0186, "step": 55670 }, { "epoch": 0.28, "learning_rate": 0.0002578630852979905, "loss": 0.023, "step": 55680 }, { "epoch": 0.28, "learning_rate": 0.0002578555176049765, "loss": 0.0216, "step": 55690 }, { "epoch": 0.28, "learning_rate": 0.00025784794991196247, "loss": 0.0186, "step": 55700 }, { "epoch": 0.28, "learning_rate": 0.0002578403822189485, "loss": 0.0194, "step": 55710 }, { "epoch": 0.28, "learning_rate": 0.0002578328145259345, "loss": 0.0233, "step": 55720 }, { "epoch": 0.28, "learning_rate": 0.00025782524683292047, "loss": 0.0215, "step": 55730 }, { "epoch": 0.28, "learning_rate": 0.00025781767913990645, "loss": 0.0178, "step": 55740 }, { "epoch": 0.28, "learning_rate": 0.00025781011144689243, "loss": 0.0205, "step": 55750 }, { "epoch": 0.28, "learning_rate": 0.0002578025437538784, "loss": 0.0231, "step": 55760 }, { "epoch": 0.28, "learning_rate": 0.00025779497606086445, "loss": 0.0192, "step": 55770 }, { "epoch": 0.28, "learning_rate": 0.00025778740836785043, "loss": 0.0209, "step": 55780 }, { "epoch": 0.28, "learning_rate": 0.0002577798406748364, "loss": 0.0225, "step": 55790 }, { "epoch": 0.28, "learning_rate": 0.0002577722729818224, "loss": 0.0188, "step": 55800 }, { "epoch": 0.28, "learning_rate": 0.0002577647052888084, "loss": 0.0206, "step": 55810 }, { "epoch": 0.28, "learning_rate": 0.00025775713759579436, "loss": 0.0156, "step": 55820 }, { "epoch": 0.28, "learning_rate": 0.00025774956990278034, "loss": 0.0205, "step": 55830 }, { "epoch": 0.28, "learning_rate": 0.0002577420022097664, "loss": 0.0191, "step": 55840 }, { "epoch": 0.28, "learning_rate": 0.00025773443451675235, "loss": 0.0242, "step": 55850 }, { "epoch": 0.28, "learning_rate": 0.00025772686682373834, "loss": 0.0188, "step": 55860 }, { "epoch": 0.28, "learning_rate": 0.0002577192991307243, "loss": 0.0188, "step": 55870 }, { "epoch": 0.28, "learning_rate": 0.0002577117314377103, "loss": 0.0239, "step": 55880 }, { "epoch": 0.28, "learning_rate": 0.0002577041637446963, "loss": 0.0209, "step": 55890 }, { "epoch": 0.28, "learning_rate": 0.0002576965960516823, "loss": 0.0239, "step": 55900 }, { "epoch": 0.28, "learning_rate": 0.0002576890283586683, "loss": 0.0183, "step": 55910 }, { "epoch": 0.28, "learning_rate": 0.0002576814606656543, "loss": 0.0171, "step": 55920 }, { "epoch": 0.28, "learning_rate": 0.00025767389297264026, "loss": 0.0187, "step": 55930 }, { "epoch": 0.28, "learning_rate": 0.00025766632527962624, "loss": 0.0229, "step": 55940 }, { "epoch": 0.28, "learning_rate": 0.0002576587575866122, "loss": 0.0203, "step": 55950 }, { "epoch": 0.28, "learning_rate": 0.0002576511898935982, "loss": 0.0193, "step": 55960 }, { "epoch": 0.28, "learning_rate": 0.0002576436222005842, "loss": 0.0203, "step": 55970 }, { "epoch": 0.28, "learning_rate": 0.00025763605450757017, "loss": 0.0202, "step": 55980 }, { "epoch": 0.28, "learning_rate": 0.00025762848681455615, "loss": 0.0217, "step": 55990 }, { "epoch": 0.28, "learning_rate": 0.0002576209191215422, "loss": 0.0231, "step": 56000 }, { "epoch": 0.28, "eval_cer": 0.9144886934295449, "eval_loss": 0.014846866950392723, "eval_runtime": 116.7024, "eval_samples_per_second": 17.138, "eval_steps_per_second": 4.284, "step": 56000 }, { "epoch": 0.28, "learning_rate": 0.00025761335142852817, "loss": 0.0217, "step": 56010 }, { "epoch": 0.28, "learning_rate": 0.00025760578373551415, "loss": 0.0188, "step": 56020 }, { "epoch": 0.28, "learning_rate": 0.00025759821604250013, "loss": 0.0211, "step": 56030 }, { "epoch": 0.28, "learning_rate": 0.0002575906483494861, "loss": 0.0206, "step": 56040 }, { "epoch": 0.28, "learning_rate": 0.0002575830806564721, "loss": 0.0159, "step": 56050 }, { "epoch": 0.28, "learning_rate": 0.0002575755129634581, "loss": 0.0219, "step": 56060 }, { "epoch": 0.28, "learning_rate": 0.0002575679452704441, "loss": 0.0194, "step": 56070 }, { "epoch": 0.28, "learning_rate": 0.0002575603775774301, "loss": 0.0193, "step": 56080 }, { "epoch": 0.28, "learning_rate": 0.00025755280988441607, "loss": 0.0166, "step": 56090 }, { "epoch": 0.28, "learning_rate": 0.00025754524219140205, "loss": 0.0205, "step": 56100 }, { "epoch": 0.28, "learning_rate": 0.00025753767449838803, "loss": 0.0187, "step": 56110 }, { "epoch": 0.28, "learning_rate": 0.000257530106805374, "loss": 0.022, "step": 56120 }, { "epoch": 0.28, "learning_rate": 0.00025752253911236005, "loss": 0.0186, "step": 56130 }, { "epoch": 0.28, "learning_rate": 0.00025751497141934603, "loss": 0.0186, "step": 56140 }, { "epoch": 0.28, "learning_rate": 0.000257507403726332, "loss": 0.0208, "step": 56150 }, { "epoch": 0.28, "learning_rate": 0.000257499836033318, "loss": 0.0181, "step": 56160 }, { "epoch": 0.28, "learning_rate": 0.000257492268340304, "loss": 0.021, "step": 56170 }, { "epoch": 0.28, "learning_rate": 0.00025748470064728996, "loss": 0.0231, "step": 56180 }, { "epoch": 0.28, "learning_rate": 0.00025747713295427594, "loss": 0.0215, "step": 56190 }, { "epoch": 0.28, "learning_rate": 0.000257469565261262, "loss": 0.0171, "step": 56200 }, { "epoch": 0.28, "learning_rate": 0.00025746199756824796, "loss": 0.0192, "step": 56210 }, { "epoch": 0.28, "learning_rate": 0.00025745442987523394, "loss": 0.0196, "step": 56220 }, { "epoch": 0.28, "learning_rate": 0.0002574468621822199, "loss": 0.0239, "step": 56230 }, { "epoch": 0.28, "learning_rate": 0.0002574392944892059, "loss": 0.0216, "step": 56240 }, { "epoch": 0.28, "learning_rate": 0.0002574317267961919, "loss": 0.0229, "step": 56250 }, { "epoch": 0.28, "learning_rate": 0.0002574241591031779, "loss": 0.0239, "step": 56260 }, { "epoch": 0.28, "learning_rate": 0.0002574165914101639, "loss": 0.0189, "step": 56270 }, { "epoch": 0.28, "learning_rate": 0.0002574090237171499, "loss": 0.0235, "step": 56280 }, { "epoch": 0.28, "learning_rate": 0.00025740145602413586, "loss": 0.0223, "step": 56290 }, { "epoch": 0.28, "learning_rate": 0.00025739388833112184, "loss": 0.0204, "step": 56300 }, { "epoch": 0.28, "learning_rate": 0.0002573863206381078, "loss": 0.0243, "step": 56310 }, { "epoch": 0.28, "learning_rate": 0.00025737875294509386, "loss": 0.0205, "step": 56320 }, { "epoch": 0.28, "learning_rate": 0.00025737118525207984, "loss": 0.0221, "step": 56330 }, { "epoch": 0.28, "learning_rate": 0.0002573636175590658, "loss": 0.0257, "step": 56340 }, { "epoch": 0.28, "learning_rate": 0.0002573560498660518, "loss": 0.0195, "step": 56350 }, { "epoch": 0.28, "learning_rate": 0.0002573484821730378, "loss": 0.0186, "step": 56360 }, { "epoch": 0.28, "learning_rate": 0.00025734091448002377, "loss": 0.0191, "step": 56370 }, { "epoch": 0.28, "learning_rate": 0.00025733334678700975, "loss": 0.02, "step": 56380 }, { "epoch": 0.28, "learning_rate": 0.0002573257790939958, "loss": 0.0203, "step": 56390 }, { "epoch": 0.28, "learning_rate": 0.00025731821140098177, "loss": 0.0212, "step": 56400 }, { "epoch": 0.28, "learning_rate": 0.00025731064370796775, "loss": 0.0216, "step": 56410 }, { "epoch": 0.28, "learning_rate": 0.00025730307601495373, "loss": 0.0271, "step": 56420 }, { "epoch": 0.28, "learning_rate": 0.0002572955083219397, "loss": 0.0196, "step": 56430 }, { "epoch": 0.28, "learning_rate": 0.0002572879406289257, "loss": 0.0235, "step": 56440 }, { "epoch": 0.28, "learning_rate": 0.00025728037293591173, "loss": 0.0213, "step": 56450 }, { "epoch": 0.28, "learning_rate": 0.0002572728052428977, "loss": 0.037, "step": 56460 }, { "epoch": 0.28, "learning_rate": 0.0002572652375498837, "loss": 0.0182, "step": 56470 }, { "epoch": 0.28, "learning_rate": 0.0002572576698568697, "loss": 0.0186, "step": 56480 }, { "epoch": 0.28, "learning_rate": 0.00025725010216385565, "loss": 0.0186, "step": 56490 }, { "epoch": 0.29, "learning_rate": 0.00025724253447084164, "loss": 0.0252, "step": 56500 }, { "epoch": 0.29, "learning_rate": 0.0002572349667778276, "loss": 0.0242, "step": 56510 }, { "epoch": 0.29, "learning_rate": 0.00025722739908481365, "loss": 0.0204, "step": 56520 }, { "epoch": 0.29, "learning_rate": 0.00025721983139179963, "loss": 0.0236, "step": 56530 }, { "epoch": 0.29, "learning_rate": 0.0002572122636987856, "loss": 0.0248, "step": 56540 }, { "epoch": 0.29, "learning_rate": 0.0002572046960057716, "loss": 0.0227, "step": 56550 }, { "epoch": 0.29, "learning_rate": 0.0002571971283127576, "loss": 0.0206, "step": 56560 }, { "epoch": 0.29, "learning_rate": 0.00025718956061974356, "loss": 0.0212, "step": 56570 }, { "epoch": 0.29, "learning_rate": 0.0002571819929267296, "loss": 0.0183, "step": 56580 }, { "epoch": 0.29, "learning_rate": 0.0002571744252337156, "loss": 0.0237, "step": 56590 }, { "epoch": 0.29, "learning_rate": 0.00025716685754070156, "loss": 0.0188, "step": 56600 }, { "epoch": 0.29, "learning_rate": 0.00025715928984768754, "loss": 0.0202, "step": 56610 }, { "epoch": 0.29, "learning_rate": 0.0002571517221546735, "loss": 0.02, "step": 56620 }, { "epoch": 0.29, "learning_rate": 0.0002571441544616595, "loss": 0.0222, "step": 56630 }, { "epoch": 0.29, "learning_rate": 0.00025713658676864554, "loss": 0.0181, "step": 56640 }, { "epoch": 0.29, "learning_rate": 0.0002571290190756315, "loss": 0.0193, "step": 56650 }, { "epoch": 0.29, "learning_rate": 0.0002571214513826175, "loss": 0.0206, "step": 56660 }, { "epoch": 0.29, "learning_rate": 0.0002571138836896035, "loss": 0.0208, "step": 56670 }, { "epoch": 0.29, "learning_rate": 0.00025710631599658946, "loss": 0.0205, "step": 56680 }, { "epoch": 0.29, "learning_rate": 0.00025709874830357545, "loss": 0.0229, "step": 56690 }, { "epoch": 0.29, "learning_rate": 0.00025709118061056143, "loss": 0.0234, "step": 56700 }, { "epoch": 0.29, "learning_rate": 0.00025708361291754746, "loss": 0.027, "step": 56710 }, { "epoch": 0.29, "learning_rate": 0.00025707604522453344, "loss": 0.0241, "step": 56720 }, { "epoch": 0.29, "learning_rate": 0.0002570684775315194, "loss": 0.0194, "step": 56730 }, { "epoch": 0.29, "learning_rate": 0.0002570609098385054, "loss": 0.0168, "step": 56740 }, { "epoch": 0.29, "learning_rate": 0.0002570533421454914, "loss": 0.0177, "step": 56750 }, { "epoch": 0.29, "learning_rate": 0.00025704577445247737, "loss": 0.0176, "step": 56760 }, { "epoch": 0.29, "learning_rate": 0.0002570382067594634, "loss": 0.0233, "step": 56770 }, { "epoch": 0.29, "learning_rate": 0.0002570306390664494, "loss": 0.0194, "step": 56780 }, { "epoch": 0.29, "learning_rate": 0.00025702307137343537, "loss": 0.0209, "step": 56790 }, { "epoch": 0.29, "learning_rate": 0.00025701550368042135, "loss": 0.0257, "step": 56800 }, { "epoch": 0.29, "learning_rate": 0.00025700793598740733, "loss": 0.0195, "step": 56810 }, { "epoch": 0.29, "learning_rate": 0.0002570003682943933, "loss": 0.0198, "step": 56820 }, { "epoch": 0.29, "learning_rate": 0.00025699280060137935, "loss": 0.0229, "step": 56830 }, { "epoch": 0.29, "learning_rate": 0.00025698523290836533, "loss": 0.0193, "step": 56840 }, { "epoch": 0.29, "learning_rate": 0.0002569776652153513, "loss": 0.0187, "step": 56850 }, { "epoch": 0.29, "learning_rate": 0.0002569700975223373, "loss": 0.0213, "step": 56860 }, { "epoch": 0.29, "learning_rate": 0.0002569625298293233, "loss": 0.0171, "step": 56870 }, { "epoch": 0.29, "learning_rate": 0.00025695496213630926, "loss": 0.0196, "step": 56880 }, { "epoch": 0.29, "learning_rate": 0.00025694739444329524, "loss": 0.017, "step": 56890 }, { "epoch": 0.29, "learning_rate": 0.0002569398267502813, "loss": 0.0427, "step": 56900 }, { "epoch": 0.29, "learning_rate": 0.00025693225905726725, "loss": 0.0221, "step": 56910 }, { "epoch": 0.29, "learning_rate": 0.00025692469136425324, "loss": 0.0206, "step": 56920 }, { "epoch": 0.29, "learning_rate": 0.0002569171236712392, "loss": 0.03, "step": 56930 }, { "epoch": 0.29, "learning_rate": 0.0002569095559782252, "loss": 0.02, "step": 56940 }, { "epoch": 0.29, "learning_rate": 0.0002569019882852112, "loss": 0.0199, "step": 56950 }, { "epoch": 0.29, "learning_rate": 0.0002568944205921972, "loss": 0.0206, "step": 56960 }, { "epoch": 0.29, "learning_rate": 0.0002568868528991832, "loss": 0.022, "step": 56970 }, { "epoch": 0.29, "learning_rate": 0.0002568792852061692, "loss": 0.028, "step": 56980 }, { "epoch": 0.29, "learning_rate": 0.00025687171751315516, "loss": 0.0209, "step": 56990 }, { "epoch": 0.29, "learning_rate": 0.00025686414982014114, "loss": 0.0217, "step": 57000 }, { "epoch": 0.29, "eval_cer": 0.9144644335264098, "eval_loss": 0.014634103514254093, "eval_runtime": 116.5702, "eval_samples_per_second": 17.157, "eval_steps_per_second": 4.289, "step": 57000 }, { "epoch": 0.29, "learning_rate": 0.0002568565821271271, "loss": 0.0183, "step": 57010 }, { "epoch": 0.29, "learning_rate": 0.0002568490144341131, "loss": 0.0169, "step": 57020 }, { "epoch": 0.29, "learning_rate": 0.00025684144674109914, "loss": 0.0273, "step": 57030 }, { "epoch": 0.29, "learning_rate": 0.0002568338790480851, "loss": 0.0249, "step": 57040 }, { "epoch": 0.29, "learning_rate": 0.0002568263113550711, "loss": 0.0195, "step": 57050 }, { "epoch": 0.29, "learning_rate": 0.0002568187436620571, "loss": 0.0171, "step": 57060 }, { "epoch": 0.29, "learning_rate": 0.00025681117596904307, "loss": 0.0186, "step": 57070 }, { "epoch": 0.29, "learning_rate": 0.00025680360827602905, "loss": 0.0236, "step": 57080 }, { "epoch": 0.29, "learning_rate": 0.0002567960405830151, "loss": 0.019, "step": 57090 }, { "epoch": 0.29, "learning_rate": 0.00025678847289000106, "loss": 0.0243, "step": 57100 }, { "epoch": 0.29, "learning_rate": 0.00025678090519698705, "loss": 0.0207, "step": 57110 }, { "epoch": 0.29, "learning_rate": 0.00025677333750397303, "loss": 0.0199, "step": 57120 }, { "epoch": 0.29, "learning_rate": 0.000256765769810959, "loss": 0.0218, "step": 57130 }, { "epoch": 0.29, "learning_rate": 0.000256758202117945, "loss": 0.0233, "step": 57140 }, { "epoch": 0.29, "learning_rate": 0.000256750634424931, "loss": 0.0202, "step": 57150 }, { "epoch": 0.29, "learning_rate": 0.000256743066731917, "loss": 0.0222, "step": 57160 }, { "epoch": 0.29, "learning_rate": 0.000256735499038903, "loss": 0.0229, "step": 57170 }, { "epoch": 0.29, "learning_rate": 0.00025672793134588897, "loss": 0.0185, "step": 57180 }, { "epoch": 0.29, "learning_rate": 0.00025672036365287495, "loss": 0.0251, "step": 57190 }, { "epoch": 0.29, "learning_rate": 0.00025671279595986093, "loss": 0.0174, "step": 57200 }, { "epoch": 0.29, "learning_rate": 0.0002567052282668469, "loss": 0.0226, "step": 57210 }, { "epoch": 0.29, "learning_rate": 0.0002566976605738329, "loss": 0.0242, "step": 57220 }, { "epoch": 0.29, "learning_rate": 0.0002566900928808189, "loss": 0.0263, "step": 57230 }, { "epoch": 0.29, "learning_rate": 0.00025668252518780486, "loss": 0.0278, "step": 57240 }, { "epoch": 0.29, "learning_rate": 0.00025667495749479084, "loss": 0.0207, "step": 57250 }, { "epoch": 0.29, "learning_rate": 0.0002566673898017769, "loss": 0.0209, "step": 57260 }, { "epoch": 0.29, "learning_rate": 0.00025665982210876286, "loss": 0.0188, "step": 57270 }, { "epoch": 0.29, "learning_rate": 0.00025665225441574884, "loss": 0.0194, "step": 57280 }, { "epoch": 0.29, "learning_rate": 0.0002566446867227348, "loss": 0.021, "step": 57290 }, { "epoch": 0.29, "learning_rate": 0.0002566371190297208, "loss": 0.0245, "step": 57300 }, { "epoch": 0.29, "learning_rate": 0.0002566295513367068, "loss": 0.0265, "step": 57310 }, { "epoch": 0.29, "learning_rate": 0.0002566219836436928, "loss": 0.0186, "step": 57320 }, { "epoch": 0.29, "learning_rate": 0.0002566144159506788, "loss": 0.0239, "step": 57330 }, { "epoch": 0.29, "learning_rate": 0.0002566068482576648, "loss": 0.0198, "step": 57340 }, { "epoch": 0.29, "learning_rate": 0.00025659928056465076, "loss": 0.0241, "step": 57350 }, { "epoch": 0.29, "learning_rate": 0.00025659171287163674, "loss": 0.0189, "step": 57360 }, { "epoch": 0.29, "learning_rate": 0.0002565841451786227, "loss": 0.0187, "step": 57370 }, { "epoch": 0.29, "learning_rate": 0.00025657657748560876, "loss": 0.0195, "step": 57380 }, { "epoch": 0.29, "learning_rate": 0.00025656900979259474, "loss": 0.0241, "step": 57390 }, { "epoch": 0.29, "learning_rate": 0.0002565614420995807, "loss": 0.0166, "step": 57400 }, { "epoch": 0.29, "learning_rate": 0.0002565538744065667, "loss": 0.0163, "step": 57410 }, { "epoch": 0.29, "learning_rate": 0.0002565463067135527, "loss": 0.0186, "step": 57420 }, { "epoch": 0.29, "learning_rate": 0.00025653873902053867, "loss": 0.0186, "step": 57430 }, { "epoch": 0.29, "learning_rate": 0.00025653117132752465, "loss": 0.0214, "step": 57440 }, { "epoch": 0.29, "learning_rate": 0.0002565236036345107, "loss": 0.0215, "step": 57450 }, { "epoch": 0.29, "learning_rate": 0.00025651603594149667, "loss": 0.0198, "step": 57460 }, { "epoch": 0.29, "learning_rate": 0.00025650846824848265, "loss": 0.0209, "step": 57470 }, { "epoch": 0.29, "learning_rate": 0.00025650090055546863, "loss": 0.0219, "step": 57480 }, { "epoch": 0.29, "learning_rate": 0.0002564933328624546, "loss": 0.0249, "step": 57490 }, { "epoch": 0.29, "learning_rate": 0.0002564857651694406, "loss": 0.0168, "step": 57500 }, { "epoch": 0.29, "learning_rate": 0.00025647819747642663, "loss": 0.0211, "step": 57510 }, { "epoch": 0.29, "learning_rate": 0.0002564706297834126, "loss": 0.0206, "step": 57520 }, { "epoch": 0.29, "learning_rate": 0.0002564630620903986, "loss": 0.0218, "step": 57530 }, { "epoch": 0.29, "learning_rate": 0.0002564554943973846, "loss": 0.0201, "step": 57540 }, { "epoch": 0.29, "learning_rate": 0.00025644792670437056, "loss": 0.0209, "step": 57550 }, { "epoch": 0.29, "learning_rate": 0.00025644035901135654, "loss": 0.0171, "step": 57560 }, { "epoch": 0.29, "learning_rate": 0.00025643279131834257, "loss": 0.0197, "step": 57570 }, { "epoch": 0.29, "learning_rate": 0.00025642522362532855, "loss": 0.0187, "step": 57580 }, { "epoch": 0.29, "learning_rate": 0.00025641765593231454, "loss": 0.0191, "step": 57590 }, { "epoch": 0.29, "learning_rate": 0.0002564100882393005, "loss": 0.0213, "step": 57600 }, { "epoch": 0.29, "learning_rate": 0.0002564025205462865, "loss": 0.0176, "step": 57610 }, { "epoch": 0.29, "learning_rate": 0.0002563949528532725, "loss": 0.0206, "step": 57620 }, { "epoch": 0.29, "learning_rate": 0.00025638738516025846, "loss": 0.0181, "step": 57630 }, { "epoch": 0.29, "learning_rate": 0.0002563798174672445, "loss": 0.0229, "step": 57640 }, { "epoch": 0.29, "learning_rate": 0.0002563722497742305, "loss": 0.0235, "step": 57650 }, { "epoch": 0.29, "learning_rate": 0.00025636468208121646, "loss": 0.0192, "step": 57660 }, { "epoch": 0.29, "learning_rate": 0.00025635711438820244, "loss": 0.017, "step": 57670 }, { "epoch": 0.29, "learning_rate": 0.0002563495466951884, "loss": 0.0178, "step": 57680 }, { "epoch": 0.29, "learning_rate": 0.0002563419790021744, "loss": 0.0167, "step": 57690 }, { "epoch": 0.29, "learning_rate": 0.00025633441130916044, "loss": 0.017, "step": 57700 }, { "epoch": 0.29, "learning_rate": 0.0002563268436161464, "loss": 0.0176, "step": 57710 }, { "epoch": 0.29, "learning_rate": 0.0002563192759231324, "loss": 0.0204, "step": 57720 }, { "epoch": 0.29, "learning_rate": 0.0002563117082301184, "loss": 0.024, "step": 57730 }, { "epoch": 0.29, "learning_rate": 0.00025630414053710437, "loss": 0.0171, "step": 57740 }, { "epoch": 0.29, "learning_rate": 0.00025629657284409035, "loss": 0.0136, "step": 57750 }, { "epoch": 0.29, "learning_rate": 0.00025628900515107633, "loss": 0.0175, "step": 57760 }, { "epoch": 0.29, "learning_rate": 0.00025628143745806236, "loss": 0.0213, "step": 57770 }, { "epoch": 0.29, "learning_rate": 0.00025627386976504835, "loss": 0.0175, "step": 57780 }, { "epoch": 0.29, "learning_rate": 0.0002562663020720343, "loss": 0.0196, "step": 57790 }, { "epoch": 0.29, "learning_rate": 0.0002562587343790203, "loss": 0.0179, "step": 57800 }, { "epoch": 0.29, "learning_rate": 0.0002562511666860063, "loss": 0.0197, "step": 57810 }, { "epoch": 0.29, "learning_rate": 0.00025624359899299227, "loss": 0.0187, "step": 57820 }, { "epoch": 0.29, "learning_rate": 0.0002562360312999783, "loss": 0.0199, "step": 57830 }, { "epoch": 0.29, "learning_rate": 0.0002562284636069643, "loss": 0.0206, "step": 57840 }, { "epoch": 0.29, "learning_rate": 0.00025622089591395027, "loss": 0.0188, "step": 57850 }, { "epoch": 0.29, "learning_rate": 0.00025621332822093625, "loss": 0.017, "step": 57860 }, { "epoch": 0.29, "learning_rate": 0.00025620576052792223, "loss": 0.0177, "step": 57870 }, { "epoch": 0.29, "learning_rate": 0.0002561981928349082, "loss": 0.0188, "step": 57880 }, { "epoch": 0.29, "learning_rate": 0.00025619062514189425, "loss": 0.0194, "step": 57890 }, { "epoch": 0.29, "learning_rate": 0.00025618305744888023, "loss": 0.0226, "step": 57900 }, { "epoch": 0.29, "learning_rate": 0.0002561754897558662, "loss": 0.0199, "step": 57910 }, { "epoch": 0.29, "learning_rate": 0.0002561679220628522, "loss": 0.0172, "step": 57920 }, { "epoch": 0.29, "learning_rate": 0.0002561603543698382, "loss": 0.0197, "step": 57930 }, { "epoch": 0.29, "learning_rate": 0.00025615278667682416, "loss": 0.0196, "step": 57940 }, { "epoch": 0.29, "learning_rate": 0.00025614521898381014, "loss": 0.0179, "step": 57950 }, { "epoch": 0.29, "learning_rate": 0.0002561376512907962, "loss": 0.0268, "step": 57960 }, { "epoch": 0.29, "learning_rate": 0.00025613008359778216, "loss": 0.0231, "step": 57970 }, { "epoch": 0.29, "learning_rate": 0.00025612251590476814, "loss": 0.0186, "step": 57980 }, { "epoch": 0.29, "learning_rate": 0.0002561149482117541, "loss": 0.0204, "step": 57990 }, { "epoch": 0.29, "learning_rate": 0.0002561073805187401, "loss": 0.019, "step": 58000 }, { "epoch": 0.29, "eval_cer": 0.914472196695413, "eval_loss": 0.014296288602054119, "eval_runtime": 116.695, "eval_samples_per_second": 17.139, "eval_steps_per_second": 4.285, "step": 58000 }, { "epoch": 0.29, "learning_rate": 0.0002560998128257261, "loss": 0.0212, "step": 58010 }, { "epoch": 0.29, "learning_rate": 0.0002560922451327121, "loss": 0.0204, "step": 58020 }, { "epoch": 0.29, "learning_rate": 0.0002560846774396981, "loss": 0.015, "step": 58030 }, { "epoch": 0.29, "learning_rate": 0.0002560771097466841, "loss": 0.0206, "step": 58040 }, { "epoch": 0.29, "learning_rate": 0.00025606954205367006, "loss": 0.0218, "step": 58050 }, { "epoch": 0.29, "learning_rate": 0.00025606197436065604, "loss": 0.0192, "step": 58060 }, { "epoch": 0.29, "learning_rate": 0.000256054406667642, "loss": 0.0203, "step": 58070 }, { "epoch": 0.29, "learning_rate": 0.00025604683897462806, "loss": 0.0193, "step": 58080 }, { "epoch": 0.29, "learning_rate": 0.00025603927128161404, "loss": 0.019, "step": 58090 }, { "epoch": 0.29, "learning_rate": 0.0002560317035886, "loss": 0.0174, "step": 58100 }, { "epoch": 0.29, "learning_rate": 0.000256024135895586, "loss": 0.0199, "step": 58110 }, { "epoch": 0.29, "learning_rate": 0.000256016568202572, "loss": 0.02, "step": 58120 }, { "epoch": 0.29, "learning_rate": 0.00025600900050955797, "loss": 0.0179, "step": 58130 }, { "epoch": 0.29, "learning_rate": 0.00025600143281654395, "loss": 0.0192, "step": 58140 }, { "epoch": 0.29, "learning_rate": 0.00025599386512353, "loss": 0.0195, "step": 58150 }, { "epoch": 0.29, "learning_rate": 0.00025598629743051597, "loss": 0.0211, "step": 58160 }, { "epoch": 0.29, "learning_rate": 0.00025597872973750195, "loss": 0.0255, "step": 58170 }, { "epoch": 0.29, "learning_rate": 0.00025597116204448793, "loss": 0.0201, "step": 58180 }, { "epoch": 0.29, "learning_rate": 0.0002559635943514739, "loss": 0.0198, "step": 58190 }, { "epoch": 0.29, "learning_rate": 0.0002559560266584599, "loss": 0.0187, "step": 58200 }, { "epoch": 0.29, "learning_rate": 0.0002559484589654459, "loss": 0.0221, "step": 58210 }, { "epoch": 0.29, "learning_rate": 0.0002559408912724319, "loss": 0.0192, "step": 58220 }, { "epoch": 0.29, "learning_rate": 0.0002559333235794179, "loss": 0.0217, "step": 58230 }, { "epoch": 0.29, "learning_rate": 0.00025592575588640387, "loss": 0.0174, "step": 58240 }, { "epoch": 0.29, "learning_rate": 0.00025591818819338985, "loss": 0.0188, "step": 58250 }, { "epoch": 0.29, "learning_rate": 0.00025591062050037583, "loss": 0.0195, "step": 58260 }, { "epoch": 0.29, "learning_rate": 0.0002559030528073618, "loss": 0.0199, "step": 58270 }, { "epoch": 0.29, "learning_rate": 0.00025589548511434785, "loss": 0.0215, "step": 58280 }, { "epoch": 0.29, "learning_rate": 0.00025588791742133383, "loss": 0.0226, "step": 58290 }, { "epoch": 0.29, "learning_rate": 0.0002558803497283198, "loss": 0.0203, "step": 58300 }, { "epoch": 0.29, "learning_rate": 0.0002558727820353058, "loss": 0.0201, "step": 58310 }, { "epoch": 0.29, "learning_rate": 0.0002558652143422918, "loss": 0.0253, "step": 58320 }, { "epoch": 0.29, "learning_rate": 0.00025585764664927776, "loss": 0.018, "step": 58330 }, { "epoch": 0.29, "learning_rate": 0.0002558500789562638, "loss": 0.0206, "step": 58340 }, { "epoch": 0.29, "learning_rate": 0.0002558425112632498, "loss": 0.0159, "step": 58350 }, { "epoch": 0.29, "learning_rate": 0.00025583494357023576, "loss": 0.0183, "step": 58360 }, { "epoch": 0.29, "learning_rate": 0.00025582737587722174, "loss": 0.0208, "step": 58370 }, { "epoch": 0.29, "learning_rate": 0.0002558198081842077, "loss": 0.018, "step": 58380 }, { "epoch": 0.29, "learning_rate": 0.0002558122404911937, "loss": 0.0215, "step": 58390 }, { "epoch": 0.29, "learning_rate": 0.00025580467279817974, "loss": 0.0199, "step": 58400 }, { "epoch": 0.29, "learning_rate": 0.0002557971051051657, "loss": 0.0212, "step": 58410 }, { "epoch": 0.29, "learning_rate": 0.0002557895374121517, "loss": 0.0298, "step": 58420 }, { "epoch": 0.29, "learning_rate": 0.0002557819697191377, "loss": 0.0216, "step": 58430 }, { "epoch": 0.29, "learning_rate": 0.00025577440202612366, "loss": 0.0188, "step": 58440 }, { "epoch": 0.29, "learning_rate": 0.00025576683433310964, "loss": 0.0182, "step": 58450 }, { "epoch": 0.29, "learning_rate": 0.0002557592666400956, "loss": 0.0166, "step": 58460 }, { "epoch": 0.29, "learning_rate": 0.0002557516989470816, "loss": 0.0229, "step": 58470 }, { "epoch": 0.3, "learning_rate": 0.0002557441312540676, "loss": 0.0194, "step": 58480 }, { "epoch": 0.3, "learning_rate": 0.00025573656356105357, "loss": 0.0227, "step": 58490 }, { "epoch": 0.3, "learning_rate": 0.00025572899586803955, "loss": 0.0189, "step": 58500 }, { "epoch": 0.3, "learning_rate": 0.0002557214281750256, "loss": 0.0191, "step": 58510 }, { "epoch": 0.3, "learning_rate": 0.00025571386048201157, "loss": 0.019, "step": 58520 }, { "epoch": 0.3, "learning_rate": 0.00025570629278899755, "loss": 0.019, "step": 58530 }, { "epoch": 0.3, "learning_rate": 0.00025569872509598353, "loss": 0.0174, "step": 58540 }, { "epoch": 0.3, "learning_rate": 0.0002556911574029695, "loss": 0.0252, "step": 58550 }, { "epoch": 0.3, "learning_rate": 0.0002556835897099555, "loss": 0.0192, "step": 58560 }, { "epoch": 0.3, "learning_rate": 0.00025567602201694153, "loss": 0.0203, "step": 58570 }, { "epoch": 0.3, "learning_rate": 0.0002556684543239275, "loss": 0.018, "step": 58580 }, { "epoch": 0.3, "learning_rate": 0.0002556608866309135, "loss": 0.0187, "step": 58590 }, { "epoch": 0.3, "learning_rate": 0.0002556533189378995, "loss": 0.02, "step": 58600 }, { "epoch": 0.3, "learning_rate": 0.00025564575124488546, "loss": 0.0192, "step": 58610 }, { "epoch": 0.3, "learning_rate": 0.00025563818355187144, "loss": 0.0189, "step": 58620 }, { "epoch": 0.3, "learning_rate": 0.00025563061585885747, "loss": 0.0226, "step": 58630 }, { "epoch": 0.3, "learning_rate": 0.00025562304816584345, "loss": 0.02, "step": 58640 }, { "epoch": 0.3, "learning_rate": 0.00025561548047282944, "loss": 0.0194, "step": 58650 }, { "epoch": 0.3, "learning_rate": 0.0002556079127798154, "loss": 0.0212, "step": 58660 }, { "epoch": 0.3, "learning_rate": 0.0002556003450868014, "loss": 0.0214, "step": 58670 }, { "epoch": 0.3, "learning_rate": 0.0002555927773937874, "loss": 0.0227, "step": 58680 }, { "epoch": 0.3, "learning_rate": 0.00025558520970077336, "loss": 0.0171, "step": 58690 }, { "epoch": 0.3, "learning_rate": 0.0002555776420077594, "loss": 0.0217, "step": 58700 }, { "epoch": 0.3, "learning_rate": 0.0002555700743147454, "loss": 0.0233, "step": 58710 }, { "epoch": 0.3, "learning_rate": 0.00025556250662173136, "loss": 0.0233, "step": 58720 }, { "epoch": 0.3, "learning_rate": 0.00025555493892871734, "loss": 0.0195, "step": 58730 }, { "epoch": 0.3, "learning_rate": 0.0002555473712357033, "loss": 0.0206, "step": 58740 }, { "epoch": 0.3, "learning_rate": 0.0002555398035426893, "loss": 0.0236, "step": 58750 }, { "epoch": 0.3, "learning_rate": 0.00025553223584967534, "loss": 0.0218, "step": 58760 }, { "epoch": 0.3, "learning_rate": 0.0002555246681566613, "loss": 0.0205, "step": 58770 }, { "epoch": 0.3, "learning_rate": 0.0002555171004636473, "loss": 0.0196, "step": 58780 }, { "epoch": 0.3, "learning_rate": 0.0002555095327706333, "loss": 0.0209, "step": 58790 }, { "epoch": 0.3, "learning_rate": 0.00025550196507761927, "loss": 0.0205, "step": 58800 }, { "epoch": 0.3, "learning_rate": 0.00025549439738460525, "loss": 0.0206, "step": 58810 }, { "epoch": 0.3, "learning_rate": 0.00025548682969159123, "loss": 0.021, "step": 58820 }, { "epoch": 0.3, "learning_rate": 0.00025547926199857726, "loss": 0.0188, "step": 58830 }, { "epoch": 0.3, "learning_rate": 0.00025547169430556325, "loss": 0.0202, "step": 58840 }, { "epoch": 0.3, "learning_rate": 0.0002554641266125492, "loss": 0.0244, "step": 58850 }, { "epoch": 0.3, "learning_rate": 0.0002554565589195352, "loss": 0.053, "step": 58860 }, { "epoch": 0.3, "learning_rate": 0.0002554489912265212, "loss": 0.0232, "step": 58870 }, { "epoch": 0.3, "learning_rate": 0.00025544142353350717, "loss": 0.0183, "step": 58880 }, { "epoch": 0.3, "learning_rate": 0.0002554338558404932, "loss": 0.0426, "step": 58890 }, { "epoch": 0.3, "learning_rate": 0.0002554262881474792, "loss": 0.0177, "step": 58900 }, { "epoch": 0.3, "learning_rate": 0.00025541872045446517, "loss": 0.0179, "step": 58910 }, { "epoch": 0.3, "learning_rate": 0.00025541115276145115, "loss": 0.0202, "step": 58920 }, { "epoch": 0.3, "learning_rate": 0.00025540358506843713, "loss": 0.0236, "step": 58930 }, { "epoch": 0.3, "learning_rate": 0.0002553960173754231, "loss": 0.0213, "step": 58940 }, { "epoch": 0.3, "learning_rate": 0.00025538844968240915, "loss": 0.0203, "step": 58950 }, { "epoch": 0.3, "learning_rate": 0.00025538088198939513, "loss": 0.022, "step": 58960 }, { "epoch": 0.3, "learning_rate": 0.0002553733142963811, "loss": 0.0185, "step": 58970 }, { "epoch": 0.3, "learning_rate": 0.0002553657466033671, "loss": 0.0215, "step": 58980 }, { "epoch": 0.3, "learning_rate": 0.0002553581789103531, "loss": 0.0176, "step": 58990 }, { "epoch": 0.3, "learning_rate": 0.00025535061121733906, "loss": 0.0179, "step": 59000 }, { "epoch": 0.3, "eval_cer": 0.9144916046179211, "eval_loss": 0.014513496309518814, "eval_runtime": 116.7004, "eval_samples_per_second": 17.138, "eval_steps_per_second": 4.284, "step": 59000 }, { "epoch": 0.3, "learning_rate": 0.00025534304352432504, "loss": 0.024, "step": 59010 }, { "epoch": 0.3, "learning_rate": 0.0002553354758313111, "loss": 0.0185, "step": 59020 }, { "epoch": 0.3, "learning_rate": 0.00025532790813829706, "loss": 0.0185, "step": 59030 }, { "epoch": 0.3, "learning_rate": 0.00025532034044528304, "loss": 0.0213, "step": 59040 }, { "epoch": 0.3, "learning_rate": 0.000255312772752269, "loss": 0.0171, "step": 59050 }, { "epoch": 0.3, "learning_rate": 0.000255305205059255, "loss": 0.0214, "step": 59060 }, { "epoch": 0.3, "learning_rate": 0.000255297637366241, "loss": 0.0191, "step": 59070 }, { "epoch": 0.3, "learning_rate": 0.000255290069673227, "loss": 0.0181, "step": 59080 }, { "epoch": 0.3, "learning_rate": 0.000255282501980213, "loss": 0.019, "step": 59090 }, { "epoch": 0.3, "learning_rate": 0.000255274934287199, "loss": 0.0217, "step": 59100 }, { "epoch": 0.3, "learning_rate": 0.00025526736659418496, "loss": 0.0169, "step": 59110 }, { "epoch": 0.3, "learning_rate": 0.00025525979890117094, "loss": 0.0203, "step": 59120 }, { "epoch": 0.3, "learning_rate": 0.0002552522312081569, "loss": 0.0228, "step": 59130 }, { "epoch": 0.3, "learning_rate": 0.00025524466351514296, "loss": 0.0209, "step": 59140 }, { "epoch": 0.3, "learning_rate": 0.00025523709582212894, "loss": 0.025, "step": 59150 }, { "epoch": 0.3, "learning_rate": 0.0002552295281291149, "loss": 0.0197, "step": 59160 }, { "epoch": 0.3, "learning_rate": 0.0002552219604361009, "loss": 0.0191, "step": 59170 }, { "epoch": 0.3, "learning_rate": 0.0002552143927430869, "loss": 0.0208, "step": 59180 }, { "epoch": 0.3, "learning_rate": 0.00025520682505007287, "loss": 0.0202, "step": 59190 }, { "epoch": 0.3, "learning_rate": 0.00025519925735705885, "loss": 0.0194, "step": 59200 }, { "epoch": 0.3, "learning_rate": 0.0002551916896640449, "loss": 0.0189, "step": 59210 }, { "epoch": 0.3, "learning_rate": 0.00025518412197103087, "loss": 0.0223, "step": 59220 }, { "epoch": 0.3, "learning_rate": 0.00025517655427801685, "loss": 0.0222, "step": 59230 }, { "epoch": 0.3, "learning_rate": 0.00025516898658500283, "loss": 0.0189, "step": 59240 }, { "epoch": 0.3, "learning_rate": 0.0002551614188919888, "loss": 0.0214, "step": 59250 }, { "epoch": 0.3, "learning_rate": 0.0002551538511989748, "loss": 0.0198, "step": 59260 }, { "epoch": 0.3, "learning_rate": 0.0002551462835059608, "loss": 0.0212, "step": 59270 }, { "epoch": 0.3, "learning_rate": 0.0002551387158129468, "loss": 0.0223, "step": 59280 }, { "epoch": 0.3, "learning_rate": 0.0002551311481199328, "loss": 0.0205, "step": 59290 }, { "epoch": 0.3, "learning_rate": 0.00025512358042691877, "loss": 0.0179, "step": 59300 }, { "epoch": 0.3, "learning_rate": 0.00025511601273390475, "loss": 0.0182, "step": 59310 }, { "epoch": 0.3, "learning_rate": 0.00025510844504089073, "loss": 0.0184, "step": 59320 }, { "epoch": 0.3, "learning_rate": 0.0002551008773478767, "loss": 0.0181, "step": 59330 }, { "epoch": 0.3, "learning_rate": 0.00025509330965486275, "loss": 0.0206, "step": 59340 }, { "epoch": 0.3, "learning_rate": 0.00025508574196184873, "loss": 0.0164, "step": 59350 }, { "epoch": 0.3, "learning_rate": 0.0002550781742688347, "loss": 0.0216, "step": 59360 }, { "epoch": 0.3, "learning_rate": 0.0002550706065758207, "loss": 0.0213, "step": 59370 }, { "epoch": 0.3, "learning_rate": 0.0002550630388828067, "loss": 0.0218, "step": 59380 }, { "epoch": 0.3, "learning_rate": 0.00025505547118979266, "loss": 0.0208, "step": 59390 }, { "epoch": 0.3, "learning_rate": 0.0002550479034967787, "loss": 0.0233, "step": 59400 }, { "epoch": 0.3, "learning_rate": 0.0002550403358037647, "loss": 0.0239, "step": 59410 }, { "epoch": 0.3, "learning_rate": 0.00025503276811075066, "loss": 0.0208, "step": 59420 }, { "epoch": 0.3, "learning_rate": 0.00025502520041773664, "loss": 0.0208, "step": 59430 }, { "epoch": 0.3, "learning_rate": 0.0002550176327247226, "loss": 0.0222, "step": 59440 }, { "epoch": 0.3, "learning_rate": 0.0002550100650317086, "loss": 0.0214, "step": 59450 }, { "epoch": 0.3, "learning_rate": 0.00025500249733869464, "loss": 0.0329, "step": 59460 }, { "epoch": 0.3, "learning_rate": 0.0002549949296456806, "loss": 0.0242, "step": 59470 }, { "epoch": 0.3, "learning_rate": 0.0002549873619526666, "loss": 0.0266, "step": 59480 }, { "epoch": 0.3, "learning_rate": 0.0002549797942596526, "loss": 0.0795, "step": 59490 }, { "epoch": 0.3, "learning_rate": 0.00025497222656663856, "loss": 0.0277, "step": 59500 }, { "epoch": 0.3, "learning_rate": 0.00025496465887362454, "loss": 0.02, "step": 59510 }, { "epoch": 0.3, "learning_rate": 0.0002549570911806105, "loss": 0.0209, "step": 59520 }, { "epoch": 0.3, "learning_rate": 0.00025494952348759656, "loss": 0.0174, "step": 59530 }, { "epoch": 0.3, "learning_rate": 0.00025494195579458254, "loss": 0.0194, "step": 59540 }, { "epoch": 0.3, "learning_rate": 0.0002549343881015685, "loss": 0.0272, "step": 59550 }, { "epoch": 0.3, "learning_rate": 0.0002549268204085545, "loss": 0.0196, "step": 59560 }, { "epoch": 0.3, "learning_rate": 0.0002549192527155405, "loss": 0.022, "step": 59570 }, { "epoch": 0.3, "learning_rate": 0.00025491168502252647, "loss": 0.0221, "step": 59580 }, { "epoch": 0.3, "learning_rate": 0.0002549041173295125, "loss": 0.0304, "step": 59590 }, { "epoch": 0.3, "learning_rate": 0.0002548965496364985, "loss": 0.0214, "step": 59600 }, { "epoch": 0.3, "learning_rate": 0.00025488898194348447, "loss": 0.0246, "step": 59610 }, { "epoch": 0.3, "learning_rate": 0.00025488141425047045, "loss": 0.0211, "step": 59620 }, { "epoch": 0.3, "learning_rate": 0.00025487384655745643, "loss": 0.0215, "step": 59630 }, { "epoch": 0.3, "learning_rate": 0.0002548662788644424, "loss": 0.0218, "step": 59640 }, { "epoch": 0.3, "learning_rate": 0.00025485871117142845, "loss": 0.0214, "step": 59650 }, { "epoch": 0.3, "learning_rate": 0.00025485114347841443, "loss": 0.0248, "step": 59660 }, { "epoch": 0.3, "learning_rate": 0.0002548435757854004, "loss": 0.022, "step": 59670 }, { "epoch": 0.3, "learning_rate": 0.0002548360080923864, "loss": 0.0206, "step": 59680 }, { "epoch": 0.3, "learning_rate": 0.00025482844039937237, "loss": 0.0213, "step": 59690 }, { "epoch": 0.3, "learning_rate": 0.00025482087270635835, "loss": 0.0178, "step": 59700 }, { "epoch": 0.3, "learning_rate": 0.00025481330501334434, "loss": 0.0318, "step": 59710 }, { "epoch": 0.3, "learning_rate": 0.0002548057373203303, "loss": 0.0239, "step": 59720 }, { "epoch": 0.3, "learning_rate": 0.0002547981696273163, "loss": 0.0198, "step": 59730 }, { "epoch": 0.3, "learning_rate": 0.0002547906019343023, "loss": 0.0214, "step": 59740 }, { "epoch": 0.3, "learning_rate": 0.00025478303424128826, "loss": 0.0176, "step": 59750 }, { "epoch": 0.3, "learning_rate": 0.0002547754665482743, "loss": 0.021, "step": 59760 }, { "epoch": 0.3, "learning_rate": 0.0002547678988552603, "loss": 0.0196, "step": 59770 }, { "epoch": 0.3, "learning_rate": 0.00025476033116224626, "loss": 0.0192, "step": 59780 }, { "epoch": 0.3, "learning_rate": 0.00025475276346923224, "loss": 0.025, "step": 59790 }, { "epoch": 0.3, "learning_rate": 0.0002547451957762182, "loss": 0.019, "step": 59800 }, { "epoch": 0.3, "learning_rate": 0.0002547376280832042, "loss": 0.0182, "step": 59810 }, { "epoch": 0.3, "learning_rate": 0.00025473006039019024, "loss": 0.0199, "step": 59820 }, { "epoch": 0.3, "learning_rate": 0.0002547224926971762, "loss": 0.02, "step": 59830 }, { "epoch": 0.3, "learning_rate": 0.0002547149250041622, "loss": 0.0212, "step": 59840 }, { "epoch": 0.3, "learning_rate": 0.0002547073573111482, "loss": 0.016, "step": 59850 }, { "epoch": 0.3, "learning_rate": 0.00025469978961813417, "loss": 0.0213, "step": 59860 }, { "epoch": 0.3, "learning_rate": 0.00025469222192512015, "loss": 0.0211, "step": 59870 }, { "epoch": 0.3, "learning_rate": 0.0002546846542321062, "loss": 0.0208, "step": 59880 }, { "epoch": 0.3, "learning_rate": 0.00025467708653909216, "loss": 0.0223, "step": 59890 }, { "epoch": 0.3, "learning_rate": 0.00025466951884607815, "loss": 0.0217, "step": 59900 }, { "epoch": 0.3, "learning_rate": 0.0002546619511530641, "loss": 0.0192, "step": 59910 }, { "epoch": 0.3, "learning_rate": 0.0002546543834600501, "loss": 0.0191, "step": 59920 }, { "epoch": 0.3, "learning_rate": 0.0002546468157670361, "loss": 0.0181, "step": 59930 }, { "epoch": 0.3, "learning_rate": 0.00025463924807402207, "loss": 0.0208, "step": 59940 }, { "epoch": 0.3, "learning_rate": 0.0002546316803810081, "loss": 0.0267, "step": 59950 }, { "epoch": 0.3, "learning_rate": 0.0002546241126879941, "loss": 0.0264, "step": 59960 }, { "epoch": 0.3, "learning_rate": 0.00025461654499498007, "loss": 0.0235, "step": 59970 }, { "epoch": 0.3, "learning_rate": 0.00025460897730196605, "loss": 0.0181, "step": 59980 }, { "epoch": 0.3, "learning_rate": 0.00025460140960895203, "loss": 0.0188, "step": 59990 }, { "epoch": 0.3, "learning_rate": 0.000254593841915938, "loss": 0.0241, "step": 60000 }, { "epoch": 0.3, "eval_cer": 0.9145197461055578, "eval_loss": 0.01466525811702013, "eval_runtime": 116.7343, "eval_samples_per_second": 17.133, "eval_steps_per_second": 4.283, "step": 60000 }, { "epoch": 0.3, "learning_rate": 0.00025458627422292405, "loss": 0.0222, "step": 60010 }, { "epoch": 0.3, "learning_rate": 0.00025457870652991003, "loss": 0.022, "step": 60020 }, { "epoch": 0.3, "learning_rate": 0.000254571138836896, "loss": 0.025, "step": 60030 }, { "epoch": 0.3, "learning_rate": 0.000254563571143882, "loss": 0.0254, "step": 60040 }, { "epoch": 0.3, "learning_rate": 0.000254556003450868, "loss": 0.0161, "step": 60050 }, { "epoch": 0.3, "learning_rate": 0.00025454843575785396, "loss": 0.0222, "step": 60060 }, { "epoch": 0.3, "learning_rate": 0.00025454086806483994, "loss": 0.0249, "step": 60070 }, { "epoch": 0.3, "learning_rate": 0.000254533300371826, "loss": 0.0201, "step": 60080 }, { "epoch": 0.3, "learning_rate": 0.00025452573267881196, "loss": 0.0251, "step": 60090 }, { "epoch": 0.3, "learning_rate": 0.00025451816498579794, "loss": 0.0184, "step": 60100 }, { "epoch": 0.3, "learning_rate": 0.0002545105972927839, "loss": 0.0202, "step": 60110 }, { "epoch": 0.3, "learning_rate": 0.0002545030295997699, "loss": 0.0188, "step": 60120 }, { "epoch": 0.3, "learning_rate": 0.0002544954619067559, "loss": 0.0217, "step": 60130 }, { "epoch": 0.3, "learning_rate": 0.0002544878942137419, "loss": 0.0195, "step": 60140 }, { "epoch": 0.3, "learning_rate": 0.0002544803265207279, "loss": 0.0158, "step": 60150 }, { "epoch": 0.3, "learning_rate": 0.0002544727588277139, "loss": 0.0186, "step": 60160 }, { "epoch": 0.3, "learning_rate": 0.00025446519113469986, "loss": 0.0186, "step": 60170 }, { "epoch": 0.3, "learning_rate": 0.00025445762344168584, "loss": 0.0174, "step": 60180 }, { "epoch": 0.3, "learning_rate": 0.0002544500557486718, "loss": 0.0219, "step": 60190 }, { "epoch": 0.3, "learning_rate": 0.00025444248805565786, "loss": 0.0207, "step": 60200 }, { "epoch": 0.3, "learning_rate": 0.00025443492036264384, "loss": 0.0172, "step": 60210 }, { "epoch": 0.3, "learning_rate": 0.0002544273526696298, "loss": 0.0183, "step": 60220 }, { "epoch": 0.3, "learning_rate": 0.0002544197849766158, "loss": 0.0178, "step": 60230 }, { "epoch": 0.3, "learning_rate": 0.0002544122172836018, "loss": 0.0183, "step": 60240 }, { "epoch": 0.3, "learning_rate": 0.00025440464959058777, "loss": 0.0244, "step": 60250 }, { "epoch": 0.3, "learning_rate": 0.00025439708189757375, "loss": 0.0236, "step": 60260 }, { "epoch": 0.3, "learning_rate": 0.0002543895142045598, "loss": 0.0188, "step": 60270 }, { "epoch": 0.3, "learning_rate": 0.00025438194651154577, "loss": 0.0188, "step": 60280 }, { "epoch": 0.3, "learning_rate": 0.00025437437881853175, "loss": 0.0232, "step": 60290 }, { "epoch": 0.3, "learning_rate": 0.00025436681112551773, "loss": 0.0174, "step": 60300 }, { "epoch": 0.3, "learning_rate": 0.0002543592434325037, "loss": 0.0225, "step": 60310 }, { "epoch": 0.3, "learning_rate": 0.0002543516757394897, "loss": 0.02, "step": 60320 }, { "epoch": 0.3, "learning_rate": 0.0002543441080464757, "loss": 0.0178, "step": 60330 }, { "epoch": 0.3, "learning_rate": 0.0002543365403534617, "loss": 0.0174, "step": 60340 }, { "epoch": 0.3, "learning_rate": 0.0002543289726604477, "loss": 0.0205, "step": 60350 }, { "epoch": 0.3, "learning_rate": 0.00025432140496743367, "loss": 0.0188, "step": 60360 }, { "epoch": 0.3, "learning_rate": 0.00025431383727441965, "loss": 0.0151, "step": 60370 }, { "epoch": 0.3, "learning_rate": 0.00025430626958140563, "loss": 0.0177, "step": 60380 }, { "epoch": 0.3, "learning_rate": 0.0002542987018883916, "loss": 0.0193, "step": 60390 }, { "epoch": 0.3, "learning_rate": 0.00025429113419537765, "loss": 0.0221, "step": 60400 }, { "epoch": 0.3, "learning_rate": 0.00025428356650236363, "loss": 0.0209, "step": 60410 }, { "epoch": 0.3, "learning_rate": 0.0002542759988093496, "loss": 0.0216, "step": 60420 }, { "epoch": 0.3, "learning_rate": 0.0002542684311163356, "loss": 0.0209, "step": 60430 }, { "epoch": 0.3, "learning_rate": 0.0002542608634233216, "loss": 0.0154, "step": 60440 }, { "epoch": 0.3, "learning_rate": 0.00025425329573030756, "loss": 0.0193, "step": 60450 }, { "epoch": 0.31, "learning_rate": 0.0002542457280372936, "loss": 0.0172, "step": 60460 }, { "epoch": 0.31, "learning_rate": 0.0002542381603442796, "loss": 0.0191, "step": 60470 }, { "epoch": 0.31, "learning_rate": 0.00025423059265126556, "loss": 0.0174, "step": 60480 }, { "epoch": 0.31, "learning_rate": 0.00025422302495825154, "loss": 0.0192, "step": 60490 }, { "epoch": 0.31, "learning_rate": 0.0002542154572652375, "loss": 0.0193, "step": 60500 }, { "epoch": 0.31, "learning_rate": 0.0002542078895722235, "loss": 0.0244, "step": 60510 }, { "epoch": 0.31, "learning_rate": 0.00025420032187920954, "loss": 0.0176, "step": 60520 }, { "epoch": 0.31, "learning_rate": 0.0002541927541861955, "loss": 0.0243, "step": 60530 }, { "epoch": 0.31, "learning_rate": 0.0002541851864931815, "loss": 0.0201, "step": 60540 }, { "epoch": 0.31, "learning_rate": 0.0002541776188001675, "loss": 0.0217, "step": 60550 }, { "epoch": 0.31, "learning_rate": 0.00025417005110715346, "loss": 0.0192, "step": 60560 }, { "epoch": 0.31, "learning_rate": 0.00025416248341413944, "loss": 0.0218, "step": 60570 }, { "epoch": 0.31, "learning_rate": 0.0002541549157211254, "loss": 0.0238, "step": 60580 }, { "epoch": 0.31, "learning_rate": 0.00025414734802811146, "loss": 0.0173, "step": 60590 }, { "epoch": 0.31, "learning_rate": 0.00025413978033509744, "loss": 0.0186, "step": 60600 }, { "epoch": 0.31, "learning_rate": 0.0002541322126420834, "loss": 0.0208, "step": 60610 }, { "epoch": 0.31, "learning_rate": 0.0002541246449490694, "loss": 0.0211, "step": 60620 }, { "epoch": 0.31, "learning_rate": 0.0002541170772560554, "loss": 0.0186, "step": 60630 }, { "epoch": 0.31, "learning_rate": 0.00025410950956304137, "loss": 0.0186, "step": 60640 }, { "epoch": 0.31, "learning_rate": 0.0002541019418700274, "loss": 0.0193, "step": 60650 }, { "epoch": 0.31, "learning_rate": 0.0002540943741770134, "loss": 0.0182, "step": 60660 }, { "epoch": 0.31, "learning_rate": 0.00025408680648399937, "loss": 0.0217, "step": 60670 }, { "epoch": 0.31, "learning_rate": 0.00025407923879098535, "loss": 0.0216, "step": 60680 }, { "epoch": 0.31, "learning_rate": 0.00025407167109797133, "loss": 0.0203, "step": 60690 }, { "epoch": 0.31, "learning_rate": 0.0002540641034049573, "loss": 0.0189, "step": 60700 }, { "epoch": 0.31, "learning_rate": 0.00025405653571194335, "loss": 0.0223, "step": 60710 }, { "epoch": 0.31, "learning_rate": 0.00025404896801892933, "loss": 0.0173, "step": 60720 }, { "epoch": 0.31, "learning_rate": 0.0002540414003259153, "loss": 0.0181, "step": 60730 }, { "epoch": 0.31, "learning_rate": 0.0002540338326329013, "loss": 0.0196, "step": 60740 }, { "epoch": 0.31, "learning_rate": 0.0002540262649398873, "loss": 0.0158, "step": 60750 }, { "epoch": 0.31, "learning_rate": 0.00025401869724687325, "loss": 0.0215, "step": 60760 }, { "epoch": 0.31, "learning_rate": 0.00025401112955385924, "loss": 0.018, "step": 60770 }, { "epoch": 0.31, "learning_rate": 0.00025400356186084527, "loss": 0.0185, "step": 60780 }, { "epoch": 0.31, "learning_rate": 0.00025399599416783125, "loss": 0.0197, "step": 60790 }, { "epoch": 0.31, "learning_rate": 0.00025398842647481723, "loss": 0.0205, "step": 60800 }, { "epoch": 0.31, "learning_rate": 0.0002539808587818032, "loss": 0.0225, "step": 60810 }, { "epoch": 0.31, "learning_rate": 0.0002539732910887892, "loss": 0.0179, "step": 60820 }, { "epoch": 0.31, "learning_rate": 0.0002539657233957752, "loss": 0.019, "step": 60830 }, { "epoch": 0.31, "learning_rate": 0.0002539581557027612, "loss": 0.0205, "step": 60840 }, { "epoch": 0.31, "learning_rate": 0.0002539505880097472, "loss": 0.0215, "step": 60850 }, { "epoch": 0.31, "learning_rate": 0.0002539430203167332, "loss": 0.0189, "step": 60860 }, { "epoch": 0.31, "learning_rate": 0.00025393545262371916, "loss": 0.0186, "step": 60870 }, { "epoch": 0.31, "learning_rate": 0.00025392788493070514, "loss": 0.0246, "step": 60880 }, { "epoch": 0.31, "learning_rate": 0.0002539203172376911, "loss": 0.0224, "step": 60890 }, { "epoch": 0.31, "learning_rate": 0.0002539127495446771, "loss": 0.0181, "step": 60900 }, { "epoch": 0.31, "learning_rate": 0.00025390518185166314, "loss": 0.0198, "step": 60910 }, { "epoch": 0.31, "learning_rate": 0.0002538976141586491, "loss": 0.0235, "step": 60920 }, { "epoch": 0.31, "learning_rate": 0.0002538900464656351, "loss": 0.0185, "step": 60930 }, { "epoch": 0.31, "learning_rate": 0.0002538824787726211, "loss": 0.0187, "step": 60940 }, { "epoch": 0.31, "learning_rate": 0.00025387491107960706, "loss": 0.02, "step": 60950 }, { "epoch": 0.31, "learning_rate": 0.00025386734338659305, "loss": 0.0174, "step": 60960 }, { "epoch": 0.31, "learning_rate": 0.00025385977569357903, "loss": 0.018, "step": 60970 }, { "epoch": 0.31, "learning_rate": 0.000253852208000565, "loss": 0.0197, "step": 60980 }, { "epoch": 0.31, "learning_rate": 0.000253844640307551, "loss": 0.0193, "step": 60990 }, { "epoch": 0.31, "learning_rate": 0.00025383707261453697, "loss": 0.02, "step": 61000 }, { "epoch": 0.31, "eval_cer": 0.9144615223380336, "eval_loss": 0.01344729121774435, "eval_runtime": 116.7714, "eval_samples_per_second": 17.127, "eval_steps_per_second": 4.282, "step": 61000 }, { "epoch": 0.31, "learning_rate": 0.000253829504921523, "loss": 0.0177, "step": 61010 }, { "epoch": 0.31, "learning_rate": 0.000253821937228509, "loss": 0.0203, "step": 61020 }, { "epoch": 0.31, "learning_rate": 0.00025381436953549497, "loss": 0.0181, "step": 61030 }, { "epoch": 0.31, "learning_rate": 0.00025380680184248095, "loss": 0.0181, "step": 61040 }, { "epoch": 0.31, "learning_rate": 0.00025379923414946693, "loss": 0.0211, "step": 61050 }, { "epoch": 0.31, "learning_rate": 0.0002537916664564529, "loss": 0.0216, "step": 61060 }, { "epoch": 0.31, "learning_rate": 0.00025378409876343895, "loss": 0.0188, "step": 61070 }, { "epoch": 0.31, "learning_rate": 0.00025377653107042493, "loss": 0.0202, "step": 61080 }, { "epoch": 0.31, "learning_rate": 0.0002537689633774109, "loss": 0.0203, "step": 61090 }, { "epoch": 0.31, "learning_rate": 0.0002537613956843969, "loss": 0.0198, "step": 61100 }, { "epoch": 0.31, "learning_rate": 0.0002537538279913829, "loss": 0.0193, "step": 61110 }, { "epoch": 0.31, "learning_rate": 0.00025374626029836886, "loss": 0.0154, "step": 61120 }, { "epoch": 0.31, "learning_rate": 0.00025373869260535484, "loss": 0.0201, "step": 61130 }, { "epoch": 0.31, "learning_rate": 0.0002537311249123409, "loss": 0.0212, "step": 61140 }, { "epoch": 0.31, "learning_rate": 0.00025372355721932686, "loss": 0.0196, "step": 61150 }, { "epoch": 0.31, "learning_rate": 0.00025371598952631284, "loss": 0.0204, "step": 61160 }, { "epoch": 0.31, "learning_rate": 0.0002537084218332988, "loss": 0.0205, "step": 61170 }, { "epoch": 0.31, "learning_rate": 0.0002537008541402848, "loss": 0.0203, "step": 61180 }, { "epoch": 0.31, "learning_rate": 0.0002536932864472708, "loss": 0.0142, "step": 61190 }, { "epoch": 0.31, "learning_rate": 0.0002536857187542568, "loss": 0.0162, "step": 61200 }, { "epoch": 0.31, "learning_rate": 0.0002536781510612428, "loss": 0.0192, "step": 61210 }, { "epoch": 0.31, "learning_rate": 0.0002536705833682288, "loss": 0.0198, "step": 61220 }, { "epoch": 0.31, "learning_rate": 0.00025366301567521476, "loss": 0.0182, "step": 61230 }, { "epoch": 0.31, "learning_rate": 0.00025365544798220074, "loss": 0.0196, "step": 61240 }, { "epoch": 0.31, "learning_rate": 0.0002536478802891867, "loss": 0.0201, "step": 61250 }, { "epoch": 0.31, "learning_rate": 0.00025364031259617276, "loss": 0.0217, "step": 61260 }, { "epoch": 0.31, "learning_rate": 0.00025363274490315874, "loss": 0.021, "step": 61270 }, { "epoch": 0.31, "learning_rate": 0.0002536251772101447, "loss": 0.019, "step": 61280 }, { "epoch": 0.31, "learning_rate": 0.0002536176095171307, "loss": 0.0201, "step": 61290 }, { "epoch": 0.31, "learning_rate": 0.0002536100418241167, "loss": 0.0178, "step": 61300 }, { "epoch": 0.31, "learning_rate": 0.00025360247413110267, "loss": 0.0185, "step": 61310 }, { "epoch": 0.31, "learning_rate": 0.00025359490643808865, "loss": 0.0179, "step": 61320 }, { "epoch": 0.31, "learning_rate": 0.0002535873387450747, "loss": 0.0179, "step": 61330 }, { "epoch": 0.31, "learning_rate": 0.00025357977105206067, "loss": 0.0223, "step": 61340 }, { "epoch": 0.31, "learning_rate": 0.00025357220335904665, "loss": 0.0179, "step": 61350 }, { "epoch": 0.31, "learning_rate": 0.00025356463566603263, "loss": 0.0219, "step": 61360 }, { "epoch": 0.31, "learning_rate": 0.0002535570679730186, "loss": 0.0226, "step": 61370 }, { "epoch": 0.31, "learning_rate": 0.0002535495002800046, "loss": 0.0179, "step": 61380 }, { "epoch": 0.31, "learning_rate": 0.00025354193258699063, "loss": 0.0198, "step": 61390 }, { "epoch": 0.31, "learning_rate": 0.0002535343648939766, "loss": 0.019, "step": 61400 }, { "epoch": 0.31, "learning_rate": 0.0002535267972009626, "loss": 0.0229, "step": 61410 }, { "epoch": 0.31, "learning_rate": 0.00025351922950794857, "loss": 0.0246, "step": 61420 }, { "epoch": 0.31, "learning_rate": 0.00025351166181493455, "loss": 0.0162, "step": 61430 }, { "epoch": 0.31, "learning_rate": 0.00025350409412192053, "loss": 0.0236, "step": 61440 }, { "epoch": 0.31, "learning_rate": 0.00025349652642890657, "loss": 0.0207, "step": 61450 }, { "epoch": 0.31, "learning_rate": 0.00025348895873589255, "loss": 0.0217, "step": 61460 }, { "epoch": 0.31, "learning_rate": 0.00025348139104287853, "loss": 0.0222, "step": 61470 }, { "epoch": 0.31, "learning_rate": 0.0002534738233498645, "loss": 0.0188, "step": 61480 }, { "epoch": 0.31, "learning_rate": 0.0002534662556568505, "loss": 0.0183, "step": 61490 }, { "epoch": 0.31, "learning_rate": 0.0002534586879638365, "loss": 0.0163, "step": 61500 }, { "epoch": 0.31, "learning_rate": 0.00025345112027082246, "loss": 0.0176, "step": 61510 }, { "epoch": 0.31, "learning_rate": 0.0002534435525778085, "loss": 0.0193, "step": 61520 }, { "epoch": 0.31, "learning_rate": 0.0002534359848847945, "loss": 0.017, "step": 61530 }, { "epoch": 0.31, "learning_rate": 0.00025342841719178046, "loss": 0.0197, "step": 61540 }, { "epoch": 0.31, "learning_rate": 0.00025342084949876644, "loss": 0.0206, "step": 61550 }, { "epoch": 0.31, "learning_rate": 0.0002534132818057524, "loss": 0.0192, "step": 61560 }, { "epoch": 0.31, "learning_rate": 0.0002534057141127384, "loss": 0.0209, "step": 61570 }, { "epoch": 0.31, "learning_rate": 0.00025339814641972444, "loss": 0.0215, "step": 61580 }, { "epoch": 0.31, "learning_rate": 0.0002533905787267104, "loss": 0.0207, "step": 61590 }, { "epoch": 0.31, "learning_rate": 0.0002533830110336964, "loss": 0.0207, "step": 61600 }, { "epoch": 0.31, "learning_rate": 0.0002533754433406824, "loss": 0.0199, "step": 61610 }, { "epoch": 0.31, "learning_rate": 0.00025336787564766836, "loss": 0.0169, "step": 61620 }, { "epoch": 0.31, "learning_rate": 0.00025336030795465434, "loss": 0.0215, "step": 61630 }, { "epoch": 0.31, "learning_rate": 0.0002533527402616403, "loss": 0.0189, "step": 61640 }, { "epoch": 0.31, "learning_rate": 0.00025334517256862636, "loss": 0.0171, "step": 61650 }, { "epoch": 0.31, "learning_rate": 0.00025333760487561234, "loss": 0.0195, "step": 61660 }, { "epoch": 0.31, "learning_rate": 0.0002533300371825983, "loss": 0.0215, "step": 61670 }, { "epoch": 0.31, "learning_rate": 0.0002533224694895843, "loss": 0.0208, "step": 61680 }, { "epoch": 0.31, "learning_rate": 0.0002533149017965703, "loss": 0.0219, "step": 61690 }, { "epoch": 0.31, "learning_rate": 0.00025330733410355627, "loss": 0.021, "step": 61700 }, { "epoch": 0.31, "learning_rate": 0.0002532997664105423, "loss": 0.0225, "step": 61710 }, { "epoch": 0.31, "learning_rate": 0.0002532921987175283, "loss": 0.024, "step": 61720 }, { "epoch": 0.31, "learning_rate": 0.00025328463102451427, "loss": 0.018, "step": 61730 }, { "epoch": 0.31, "learning_rate": 0.00025327706333150025, "loss": 0.0191, "step": 61740 }, { "epoch": 0.31, "learning_rate": 0.00025326949563848623, "loss": 0.0177, "step": 61750 }, { "epoch": 0.31, "learning_rate": 0.0002532619279454722, "loss": 0.0208, "step": 61760 }, { "epoch": 0.31, "learning_rate": 0.00025325436025245825, "loss": 0.0175, "step": 61770 }, { "epoch": 0.31, "learning_rate": 0.00025324679255944423, "loss": 0.0175, "step": 61780 }, { "epoch": 0.31, "learning_rate": 0.0002532392248664302, "loss": 0.0203, "step": 61790 }, { "epoch": 0.31, "learning_rate": 0.0002532316571734162, "loss": 0.0211, "step": 61800 }, { "epoch": 0.31, "learning_rate": 0.0002532240894804022, "loss": 0.0191, "step": 61810 }, { "epoch": 0.31, "learning_rate": 0.00025321652178738815, "loss": 0.0181, "step": 61820 }, { "epoch": 0.31, "learning_rate": 0.00025320895409437414, "loss": 0.0227, "step": 61830 }, { "epoch": 0.31, "learning_rate": 0.00025320138640136017, "loss": 0.0221, "step": 61840 }, { "epoch": 0.31, "learning_rate": 0.00025319381870834615, "loss": 0.0198, "step": 61850 }, { "epoch": 0.31, "learning_rate": 0.00025318625101533213, "loss": 0.0188, "step": 61860 }, { "epoch": 0.31, "learning_rate": 0.0002531786833223181, "loss": 0.0216, "step": 61870 }, { "epoch": 0.31, "learning_rate": 0.0002531711156293041, "loss": 0.0242, "step": 61880 }, { "epoch": 0.31, "learning_rate": 0.0002531635479362901, "loss": 0.0194, "step": 61890 }, { "epoch": 0.31, "learning_rate": 0.0002531559802432761, "loss": 0.0158, "step": 61900 }, { "epoch": 0.31, "learning_rate": 0.0002531484125502621, "loss": 0.0187, "step": 61910 }, { "epoch": 0.31, "learning_rate": 0.0002531408448572481, "loss": 0.0213, "step": 61920 }, { "epoch": 0.31, "learning_rate": 0.00025313327716423406, "loss": 0.0252, "step": 61930 }, { "epoch": 0.31, "learning_rate": 0.00025312570947122004, "loss": 0.0224, "step": 61940 }, { "epoch": 0.31, "learning_rate": 0.000253118141778206, "loss": 0.0216, "step": 61950 }, { "epoch": 0.31, "learning_rate": 0.00025311057408519206, "loss": 0.0215, "step": 61960 }, { "epoch": 0.31, "learning_rate": 0.00025310300639217804, "loss": 0.0189, "step": 61970 }, { "epoch": 0.31, "learning_rate": 0.000253095438699164, "loss": 0.0195, "step": 61980 }, { "epoch": 0.31, "learning_rate": 0.00025308787100615, "loss": 0.0169, "step": 61990 }, { "epoch": 0.31, "learning_rate": 0.000253080303313136, "loss": 0.024, "step": 62000 }, { "epoch": 0.31, "eval_cer": 0.9144838414489178, "eval_loss": 0.014024483039975166, "eval_runtime": 116.7957, "eval_samples_per_second": 17.124, "eval_steps_per_second": 4.281, "step": 62000 }, { "epoch": 0.31, "learning_rate": 0.00025307273562012196, "loss": 0.0204, "step": 62010 }, { "epoch": 0.31, "learning_rate": 0.00025306516792710795, "loss": 0.0195, "step": 62020 }, { "epoch": 0.31, "learning_rate": 0.000253057600234094, "loss": 0.0199, "step": 62030 }, { "epoch": 0.31, "learning_rate": 0.00025305003254107996, "loss": 0.0215, "step": 62040 }, { "epoch": 0.31, "learning_rate": 0.00025304246484806594, "loss": 0.0183, "step": 62050 }, { "epoch": 0.31, "learning_rate": 0.0002530348971550519, "loss": 0.0228, "step": 62060 }, { "epoch": 0.31, "learning_rate": 0.0002530273294620379, "loss": 0.022, "step": 62070 }, { "epoch": 0.31, "learning_rate": 0.0002530197617690239, "loss": 0.0208, "step": 62080 }, { "epoch": 0.31, "learning_rate": 0.0002530121940760099, "loss": 0.0275, "step": 62090 }, { "epoch": 0.31, "learning_rate": 0.0002530046263829959, "loss": 0.0203, "step": 62100 }, { "epoch": 0.31, "learning_rate": 0.0002529970586899819, "loss": 0.0219, "step": 62110 }, { "epoch": 0.31, "learning_rate": 0.00025298949099696787, "loss": 0.0225, "step": 62120 }, { "epoch": 0.31, "learning_rate": 0.00025298192330395385, "loss": 0.0185, "step": 62130 }, { "epoch": 0.31, "learning_rate": 0.00025297435561093983, "loss": 0.0206, "step": 62140 }, { "epoch": 0.31, "learning_rate": 0.0002529667879179258, "loss": 0.0213, "step": 62150 }, { "epoch": 0.31, "learning_rate": 0.00025295922022491185, "loss": 0.0231, "step": 62160 }, { "epoch": 0.31, "learning_rate": 0.00025295165253189783, "loss": 0.0182, "step": 62170 }, { "epoch": 0.31, "learning_rate": 0.0002529440848388838, "loss": 0.0204, "step": 62180 }, { "epoch": 0.31, "learning_rate": 0.0002529365171458698, "loss": 0.02, "step": 62190 }, { "epoch": 0.31, "learning_rate": 0.0002529289494528558, "loss": 0.0219, "step": 62200 }, { "epoch": 0.31, "learning_rate": 0.00025292138175984176, "loss": 0.0212, "step": 62210 }, { "epoch": 0.31, "learning_rate": 0.00025291381406682774, "loss": 0.0237, "step": 62220 }, { "epoch": 0.31, "learning_rate": 0.0002529062463738137, "loss": 0.019, "step": 62230 }, { "epoch": 0.31, "learning_rate": 0.0002528986786807997, "loss": 0.0195, "step": 62240 }, { "epoch": 0.31, "learning_rate": 0.0002528911109877857, "loss": 0.0205, "step": 62250 }, { "epoch": 0.31, "learning_rate": 0.0002528835432947717, "loss": 0.0231, "step": 62260 }, { "epoch": 0.31, "learning_rate": 0.0002528759756017577, "loss": 0.02, "step": 62270 }, { "epoch": 0.31, "learning_rate": 0.0002528684079087437, "loss": 0.0196, "step": 62280 }, { "epoch": 0.31, "learning_rate": 0.00025286084021572966, "loss": 0.0176, "step": 62290 }, { "epoch": 0.31, "learning_rate": 0.00025285327252271564, "loss": 0.0196, "step": 62300 }, { "epoch": 0.31, "learning_rate": 0.0002528457048297016, "loss": 0.0173, "step": 62310 }, { "epoch": 0.31, "learning_rate": 0.00025283813713668766, "loss": 0.0189, "step": 62320 }, { "epoch": 0.31, "learning_rate": 0.00025283056944367364, "loss": 0.0228, "step": 62330 }, { "epoch": 0.31, "learning_rate": 0.0002528230017506596, "loss": 0.0182, "step": 62340 }, { "epoch": 0.31, "learning_rate": 0.0002528154340576456, "loss": 0.0232, "step": 62350 }, { "epoch": 0.31, "learning_rate": 0.0002528078663646316, "loss": 0.0159, "step": 62360 }, { "epoch": 0.31, "learning_rate": 0.00025280029867161757, "loss": 0.019, "step": 62370 }, { "epoch": 0.31, "learning_rate": 0.00025279273097860355, "loss": 0.0198, "step": 62380 }, { "epoch": 0.31, "learning_rate": 0.0002527851632855896, "loss": 0.023, "step": 62390 }, { "epoch": 0.31, "learning_rate": 0.00025277759559257557, "loss": 0.0207, "step": 62400 }, { "epoch": 0.31, "learning_rate": 0.00025277002789956155, "loss": 0.0182, "step": 62410 }, { "epoch": 0.31, "learning_rate": 0.00025276246020654753, "loss": 0.0205, "step": 62420 }, { "epoch": 0.31, "learning_rate": 0.0002527548925135335, "loss": 0.0204, "step": 62430 }, { "epoch": 0.32, "learning_rate": 0.0002527473248205195, "loss": 0.0217, "step": 62440 }, { "epoch": 0.32, "learning_rate": 0.00025273975712750553, "loss": 0.0245, "step": 62450 }, { "epoch": 0.32, "learning_rate": 0.0002527321894344915, "loss": 0.0216, "step": 62460 }, { "epoch": 0.32, "learning_rate": 0.0002527246217414775, "loss": 0.0215, "step": 62470 }, { "epoch": 0.32, "learning_rate": 0.00025271705404846347, "loss": 0.0223, "step": 62480 }, { "epoch": 0.32, "learning_rate": 0.00025270948635544945, "loss": 0.0195, "step": 62490 }, { "epoch": 0.32, "learning_rate": 0.00025270191866243543, "loss": 0.0208, "step": 62500 }, { "epoch": 0.32, "learning_rate": 0.00025269435096942147, "loss": 0.0197, "step": 62510 }, { "epoch": 0.32, "learning_rate": 0.00025268678327640745, "loss": 0.0188, "step": 62520 }, { "epoch": 0.32, "learning_rate": 0.00025267921558339343, "loss": 0.0197, "step": 62530 }, { "epoch": 0.32, "learning_rate": 0.0002526716478903794, "loss": 0.0204, "step": 62540 }, { "epoch": 0.32, "learning_rate": 0.0002526640801973654, "loss": 0.0155, "step": 62550 }, { "epoch": 0.32, "learning_rate": 0.0002526565125043514, "loss": 0.0229, "step": 62560 }, { "epoch": 0.32, "learning_rate": 0.00025264894481133736, "loss": 0.0238, "step": 62570 }, { "epoch": 0.32, "learning_rate": 0.0002526413771183234, "loss": 0.0245, "step": 62580 }, { "epoch": 0.32, "learning_rate": 0.0002526338094253094, "loss": 0.0196, "step": 62590 }, { "epoch": 0.32, "learning_rate": 0.00025262624173229536, "loss": 0.0206, "step": 62600 }, { "epoch": 0.32, "learning_rate": 0.00025261867403928134, "loss": 0.0193, "step": 62610 }, { "epoch": 0.32, "learning_rate": 0.0002526111063462673, "loss": 0.0186, "step": 62620 }, { "epoch": 0.32, "learning_rate": 0.0002526035386532533, "loss": 0.0173, "step": 62630 }, { "epoch": 0.32, "learning_rate": 0.00025259597096023934, "loss": 0.0172, "step": 62640 }, { "epoch": 0.32, "learning_rate": 0.0002525884032672253, "loss": 0.0247, "step": 62650 }, { "epoch": 0.32, "learning_rate": 0.0002525808355742113, "loss": 0.0177, "step": 62660 }, { "epoch": 0.32, "learning_rate": 0.0002525732678811973, "loss": 0.0206, "step": 62670 }, { "epoch": 0.32, "learning_rate": 0.00025256570018818326, "loss": 0.0188, "step": 62680 }, { "epoch": 0.32, "learning_rate": 0.00025255813249516924, "loss": 0.0219, "step": 62690 }, { "epoch": 0.32, "learning_rate": 0.0002525505648021552, "loss": 0.0219, "step": 62700 }, { "epoch": 0.32, "learning_rate": 0.00025254299710914126, "loss": 0.0178, "step": 62710 }, { "epoch": 0.32, "learning_rate": 0.00025253542941612724, "loss": 0.02, "step": 62720 }, { "epoch": 0.32, "learning_rate": 0.0002525278617231132, "loss": 0.0183, "step": 62730 }, { "epoch": 0.32, "learning_rate": 0.0002525202940300992, "loss": 0.0189, "step": 62740 }, { "epoch": 0.32, "learning_rate": 0.0002525127263370852, "loss": 0.0273, "step": 62750 }, { "epoch": 0.32, "learning_rate": 0.00025250515864407117, "loss": 0.0189, "step": 62760 }, { "epoch": 0.32, "learning_rate": 0.0002524975909510572, "loss": 0.0171, "step": 62770 }, { "epoch": 0.32, "learning_rate": 0.0002524900232580432, "loss": 0.0194, "step": 62780 }, { "epoch": 0.32, "learning_rate": 0.00025248245556502917, "loss": 0.0194, "step": 62790 }, { "epoch": 0.32, "learning_rate": 0.00025247488787201515, "loss": 0.0205, "step": 62800 }, { "epoch": 0.32, "learning_rate": 0.00025246732017900113, "loss": 0.0176, "step": 62810 }, { "epoch": 0.32, "learning_rate": 0.0002524597524859871, "loss": 0.0207, "step": 62820 }, { "epoch": 0.32, "learning_rate": 0.00025245218479297315, "loss": 0.0213, "step": 62830 }, { "epoch": 0.32, "learning_rate": 0.00025244461709995913, "loss": 0.0184, "step": 62840 }, { "epoch": 0.32, "learning_rate": 0.0002524370494069451, "loss": 0.0177, "step": 62850 }, { "epoch": 0.32, "learning_rate": 0.0002524294817139311, "loss": 0.0194, "step": 62860 }, { "epoch": 0.32, "learning_rate": 0.0002524219140209171, "loss": 0.0198, "step": 62870 }, { "epoch": 0.32, "learning_rate": 0.00025241434632790305, "loss": 0.0249, "step": 62880 }, { "epoch": 0.32, "learning_rate": 0.00025240677863488904, "loss": 0.0195, "step": 62890 }, { "epoch": 0.32, "learning_rate": 0.00025239921094187507, "loss": 0.0195, "step": 62900 }, { "epoch": 0.32, "learning_rate": 0.00025239164324886105, "loss": 0.0169, "step": 62910 }, { "epoch": 0.32, "learning_rate": 0.00025238407555584703, "loss": 0.0203, "step": 62920 }, { "epoch": 0.32, "learning_rate": 0.000252376507862833, "loss": 0.0181, "step": 62930 }, { "epoch": 0.32, "learning_rate": 0.000252368940169819, "loss": 0.0179, "step": 62940 }, { "epoch": 0.32, "learning_rate": 0.000252361372476805, "loss": 0.0204, "step": 62950 }, { "epoch": 0.32, "learning_rate": 0.000252353804783791, "loss": 0.0172, "step": 62960 }, { "epoch": 0.32, "learning_rate": 0.000252346237090777, "loss": 0.0169, "step": 62970 }, { "epoch": 0.32, "learning_rate": 0.000252338669397763, "loss": 0.0185, "step": 62980 }, { "epoch": 0.32, "learning_rate": 0.00025233110170474896, "loss": 0.0192, "step": 62990 }, { "epoch": 0.32, "learning_rate": 0.00025232353401173494, "loss": 0.0175, "step": 63000 }, { "epoch": 0.32, "eval_cer": 0.9144712262992877, "eval_loss": 0.013699725270271301, "eval_runtime": 116.7034, "eval_samples_per_second": 17.137, "eval_steps_per_second": 4.284, "step": 63000 }, { "epoch": 0.32, "learning_rate": 0.0002523159663187209, "loss": 0.0179, "step": 63010 }, { "epoch": 0.32, "learning_rate": 0.00025230839862570696, "loss": 0.0182, "step": 63020 }, { "epoch": 0.32, "learning_rate": 0.00025230083093269294, "loss": 0.0214, "step": 63030 }, { "epoch": 0.32, "learning_rate": 0.0002522932632396789, "loss": 0.0225, "step": 63040 }, { "epoch": 0.32, "learning_rate": 0.0002522856955466649, "loss": 0.0154, "step": 63050 }, { "epoch": 0.32, "learning_rate": 0.0002522781278536509, "loss": 0.0199, "step": 63060 }, { "epoch": 0.32, "learning_rate": 0.00025227056016063686, "loss": 0.017, "step": 63070 }, { "epoch": 0.32, "learning_rate": 0.00025226299246762285, "loss": 0.0253, "step": 63080 }, { "epoch": 0.32, "learning_rate": 0.0002522554247746089, "loss": 0.0208, "step": 63090 }, { "epoch": 0.32, "learning_rate": 0.00025224785708159486, "loss": 0.0201, "step": 63100 }, { "epoch": 0.32, "learning_rate": 0.00025224028938858084, "loss": 0.0207, "step": 63110 }, { "epoch": 0.32, "learning_rate": 0.0002522327216955668, "loss": 0.0171, "step": 63120 }, { "epoch": 0.32, "learning_rate": 0.0002522251540025528, "loss": 0.0183, "step": 63130 }, { "epoch": 0.32, "learning_rate": 0.0002522175863095388, "loss": 0.0175, "step": 63140 }, { "epoch": 0.32, "learning_rate": 0.0002522100186165248, "loss": 0.0194, "step": 63150 }, { "epoch": 0.32, "learning_rate": 0.0002522024509235108, "loss": 0.0233, "step": 63160 }, { "epoch": 0.32, "learning_rate": 0.0002521948832304968, "loss": 0.0177, "step": 63170 }, { "epoch": 0.32, "learning_rate": 0.00025218731553748277, "loss": 0.018, "step": 63180 }, { "epoch": 0.32, "learning_rate": 0.00025217974784446875, "loss": 0.0212, "step": 63190 }, { "epoch": 0.32, "learning_rate": 0.00025217218015145473, "loss": 0.0184, "step": 63200 }, { "epoch": 0.32, "learning_rate": 0.0002521646124584407, "loss": 0.0193, "step": 63210 }, { "epoch": 0.32, "learning_rate": 0.00025215704476542675, "loss": 0.0268, "step": 63220 }, { "epoch": 0.32, "learning_rate": 0.00025214947707241273, "loss": 0.0197, "step": 63230 }, { "epoch": 0.32, "learning_rate": 0.0002521419093793987, "loss": 0.019, "step": 63240 }, { "epoch": 0.32, "learning_rate": 0.0002521343416863847, "loss": 0.0178, "step": 63250 }, { "epoch": 0.32, "learning_rate": 0.0002521267739933707, "loss": 0.0218, "step": 63260 }, { "epoch": 0.32, "learning_rate": 0.00025211920630035666, "loss": 0.0217, "step": 63270 }, { "epoch": 0.32, "learning_rate": 0.0002521116386073427, "loss": 0.0218, "step": 63280 }, { "epoch": 0.32, "learning_rate": 0.0002521040709143287, "loss": 0.02, "step": 63290 }, { "epoch": 0.32, "learning_rate": 0.00025209650322131465, "loss": 0.0262, "step": 63300 }, { "epoch": 0.32, "learning_rate": 0.00025208893552830064, "loss": 0.0206, "step": 63310 }, { "epoch": 0.32, "learning_rate": 0.0002520813678352866, "loss": 0.019, "step": 63320 }, { "epoch": 0.32, "learning_rate": 0.0002520738001422726, "loss": 0.017, "step": 63330 }, { "epoch": 0.32, "learning_rate": 0.00025206623244925863, "loss": 0.0216, "step": 63340 }, { "epoch": 0.32, "learning_rate": 0.0002520586647562446, "loss": 0.0183, "step": 63350 }, { "epoch": 0.32, "learning_rate": 0.0002520510970632306, "loss": 0.018, "step": 63360 }, { "epoch": 0.32, "learning_rate": 0.0002520435293702166, "loss": 0.0185, "step": 63370 }, { "epoch": 0.32, "learning_rate": 0.00025203596167720256, "loss": 0.0206, "step": 63380 }, { "epoch": 0.32, "learning_rate": 0.00025202839398418854, "loss": 0.0194, "step": 63390 }, { "epoch": 0.32, "learning_rate": 0.0002520208262911745, "loss": 0.0273, "step": 63400 }, { "epoch": 0.32, "learning_rate": 0.00025201325859816056, "loss": 0.0179, "step": 63410 }, { "epoch": 0.32, "learning_rate": 0.00025200569090514654, "loss": 0.0242, "step": 63420 }, { "epoch": 0.32, "learning_rate": 0.0002519981232121325, "loss": 0.0193, "step": 63430 }, { "epoch": 0.32, "learning_rate": 0.0002519905555191185, "loss": 0.0194, "step": 63440 }, { "epoch": 0.32, "learning_rate": 0.0002519829878261045, "loss": 0.0235, "step": 63450 }, { "epoch": 0.32, "learning_rate": 0.00025197542013309047, "loss": 0.0206, "step": 63460 }, { "epoch": 0.32, "learning_rate": 0.0002519678524400765, "loss": 0.0165, "step": 63470 }, { "epoch": 0.32, "learning_rate": 0.00025196028474706243, "loss": 0.0186, "step": 63480 }, { "epoch": 0.32, "learning_rate": 0.0002519527170540484, "loss": 0.0216, "step": 63490 }, { "epoch": 0.32, "learning_rate": 0.0002519451493610344, "loss": 0.0175, "step": 63500 }, { "epoch": 0.32, "learning_rate": 0.00025193758166802043, "loss": 0.0144, "step": 63510 }, { "epoch": 0.32, "learning_rate": 0.0002519300139750064, "loss": 0.0219, "step": 63520 }, { "epoch": 0.32, "learning_rate": 0.0002519224462819924, "loss": 0.0196, "step": 63530 }, { "epoch": 0.32, "learning_rate": 0.00025191487858897837, "loss": 0.0194, "step": 63540 }, { "epoch": 0.32, "learning_rate": 0.00025190731089596435, "loss": 0.0176, "step": 63550 }, { "epoch": 0.32, "learning_rate": 0.00025189974320295034, "loss": 0.0203, "step": 63560 }, { "epoch": 0.32, "learning_rate": 0.00025189217550993637, "loss": 0.0162, "step": 63570 }, { "epoch": 0.32, "learning_rate": 0.00025188460781692235, "loss": 0.0185, "step": 63580 }, { "epoch": 0.32, "learning_rate": 0.00025187704012390833, "loss": 0.0205, "step": 63590 }, { "epoch": 0.32, "learning_rate": 0.0002518694724308943, "loss": 0.023, "step": 63600 }, { "epoch": 0.32, "learning_rate": 0.0002518619047378803, "loss": 0.0245, "step": 63610 }, { "epoch": 0.32, "learning_rate": 0.0002518543370448663, "loss": 0.0177, "step": 63620 }, { "epoch": 0.32, "learning_rate": 0.00025184676935185226, "loss": 0.0182, "step": 63630 }, { "epoch": 0.32, "learning_rate": 0.0002518392016588383, "loss": 0.0235, "step": 63640 }, { "epoch": 0.32, "learning_rate": 0.0002518316339658243, "loss": 0.0185, "step": 63650 }, { "epoch": 0.32, "learning_rate": 0.00025182406627281026, "loss": 0.02, "step": 63660 }, { "epoch": 0.32, "learning_rate": 0.00025181649857979624, "loss": 0.0162, "step": 63670 }, { "epoch": 0.32, "learning_rate": 0.0002518089308867822, "loss": 0.0181, "step": 63680 }, { "epoch": 0.32, "learning_rate": 0.0002518013631937682, "loss": 0.0192, "step": 63690 }, { "epoch": 0.32, "learning_rate": 0.00025179379550075424, "loss": 0.0192, "step": 63700 }, { "epoch": 0.32, "learning_rate": 0.0002517862278077402, "loss": 0.0164, "step": 63710 }, { "epoch": 0.32, "learning_rate": 0.0002517786601147262, "loss": 0.0164, "step": 63720 }, { "epoch": 0.32, "learning_rate": 0.0002517710924217122, "loss": 0.0245, "step": 63730 }, { "epoch": 0.32, "learning_rate": 0.00025176352472869816, "loss": 0.0178, "step": 63740 }, { "epoch": 0.32, "learning_rate": 0.00025175595703568415, "loss": 0.0236, "step": 63750 }, { "epoch": 0.32, "learning_rate": 0.0002517483893426702, "loss": 0.026, "step": 63760 }, { "epoch": 0.32, "learning_rate": 0.00025174082164965616, "loss": 0.0185, "step": 63770 }, { "epoch": 0.32, "learning_rate": 0.00025173325395664214, "loss": 0.021, "step": 63780 }, { "epoch": 0.32, "learning_rate": 0.0002517256862636281, "loss": 0.026, "step": 63790 }, { "epoch": 0.32, "learning_rate": 0.0002517181185706141, "loss": 0.0196, "step": 63800 }, { "epoch": 0.32, "learning_rate": 0.0002517105508776001, "loss": 0.0189, "step": 63810 }, { "epoch": 0.32, "learning_rate": 0.00025170298318458607, "loss": 0.0193, "step": 63820 }, { "epoch": 0.32, "learning_rate": 0.0002516954154915721, "loss": 0.0167, "step": 63830 }, { "epoch": 0.32, "learning_rate": 0.0002516878477985581, "loss": 0.0204, "step": 63840 }, { "epoch": 0.32, "learning_rate": 0.00025168028010554407, "loss": 0.0162, "step": 63850 }, { "epoch": 0.32, "learning_rate": 0.00025167271241253005, "loss": 0.0192, "step": 63860 }, { "epoch": 0.32, "learning_rate": 0.00025166514471951603, "loss": 0.0227, "step": 63870 }, { "epoch": 0.32, "learning_rate": 0.000251657577026502, "loss": 0.0194, "step": 63880 }, { "epoch": 0.32, "learning_rate": 0.00025165000933348805, "loss": 0.0164, "step": 63890 }, { "epoch": 0.32, "learning_rate": 0.00025164244164047403, "loss": 0.0176, "step": 63900 }, { "epoch": 0.32, "learning_rate": 0.00025163487394746, "loss": 0.0207, "step": 63910 }, { "epoch": 0.32, "learning_rate": 0.000251627306254446, "loss": 0.019, "step": 63920 }, { "epoch": 0.32, "learning_rate": 0.000251619738561432, "loss": 0.021, "step": 63930 }, { "epoch": 0.32, "learning_rate": 0.00025161217086841796, "loss": 0.0194, "step": 63940 }, { "epoch": 0.32, "learning_rate": 0.00025160460317540394, "loss": 0.0205, "step": 63950 }, { "epoch": 0.32, "learning_rate": 0.00025159703548238997, "loss": 0.02, "step": 63960 }, { "epoch": 0.32, "learning_rate": 0.00025158946778937595, "loss": 0.026, "step": 63970 }, { "epoch": 0.32, "learning_rate": 0.00025158190009636194, "loss": 0.0201, "step": 63980 }, { "epoch": 0.32, "learning_rate": 0.0002515743324033479, "loss": 0.0206, "step": 63990 }, { "epoch": 0.32, "learning_rate": 0.0002515667647103339, "loss": 0.0207, "step": 64000 }, { "epoch": 0.32, "eval_cer": 0.9144692855070369, "eval_loss": 0.01427229680120945, "eval_runtime": 116.7184, "eval_samples_per_second": 17.135, "eval_steps_per_second": 4.284, "step": 64000 }, { "epoch": 0.32, "learning_rate": 0.0002515591970173199, "loss": 0.0165, "step": 64010 }, { "epoch": 0.32, "learning_rate": 0.0002515516293243059, "loss": 0.0222, "step": 64020 }, { "epoch": 0.32, "learning_rate": 0.0002515440616312919, "loss": 0.0173, "step": 64030 }, { "epoch": 0.32, "learning_rate": 0.0002515364939382779, "loss": 0.0215, "step": 64040 }, { "epoch": 0.32, "learning_rate": 0.00025152892624526386, "loss": 0.0197, "step": 64050 }, { "epoch": 0.32, "learning_rate": 0.00025152135855224984, "loss": 0.0208, "step": 64060 }, { "epoch": 0.32, "learning_rate": 0.0002515137908592358, "loss": 0.0194, "step": 64070 }, { "epoch": 0.32, "learning_rate": 0.00025150622316622186, "loss": 0.023, "step": 64080 }, { "epoch": 0.32, "learning_rate": 0.00025149865547320784, "loss": 0.0217, "step": 64090 }, { "epoch": 0.32, "learning_rate": 0.0002514910877801938, "loss": 0.0243, "step": 64100 }, { "epoch": 0.32, "learning_rate": 0.0002514835200871798, "loss": 0.0202, "step": 64110 }, { "epoch": 0.32, "learning_rate": 0.0002514759523941658, "loss": 0.0224, "step": 64120 }, { "epoch": 0.32, "learning_rate": 0.00025146838470115177, "loss": 0.0198, "step": 64130 }, { "epoch": 0.32, "learning_rate": 0.00025146081700813775, "loss": 0.0193, "step": 64140 }, { "epoch": 0.32, "learning_rate": 0.0002514532493151238, "loss": 0.0202, "step": 64150 }, { "epoch": 0.32, "learning_rate": 0.00025144568162210976, "loss": 0.0202, "step": 64160 }, { "epoch": 0.32, "learning_rate": 0.00025143811392909575, "loss": 0.0187, "step": 64170 }, { "epoch": 0.32, "learning_rate": 0.0002514305462360817, "loss": 0.0184, "step": 64180 }, { "epoch": 0.32, "learning_rate": 0.0002514229785430677, "loss": 0.02, "step": 64190 }, { "epoch": 0.32, "learning_rate": 0.0002514154108500537, "loss": 0.025, "step": 64200 }, { "epoch": 0.32, "learning_rate": 0.0002514078431570397, "loss": 0.0195, "step": 64210 }, { "epoch": 0.32, "learning_rate": 0.0002514002754640257, "loss": 0.0231, "step": 64220 }, { "epoch": 0.32, "learning_rate": 0.0002513927077710117, "loss": 0.0199, "step": 64230 }, { "epoch": 0.32, "learning_rate": 0.00025138514007799767, "loss": 0.0214, "step": 64240 }, { "epoch": 0.32, "learning_rate": 0.00025137757238498365, "loss": 0.0217, "step": 64250 }, { "epoch": 0.32, "learning_rate": 0.00025137000469196963, "loss": 0.0174, "step": 64260 }, { "epoch": 0.32, "learning_rate": 0.0002513624369989556, "loss": 0.0192, "step": 64270 }, { "epoch": 0.32, "learning_rate": 0.00025135486930594165, "loss": 0.0185, "step": 64280 }, { "epoch": 0.32, "learning_rate": 0.00025134730161292763, "loss": 0.0229, "step": 64290 }, { "epoch": 0.32, "learning_rate": 0.0002513397339199136, "loss": 0.017, "step": 64300 }, { "epoch": 0.32, "learning_rate": 0.0002513321662268996, "loss": 0.0185, "step": 64310 }, { "epoch": 0.32, "learning_rate": 0.0002513245985338856, "loss": 0.0183, "step": 64320 }, { "epoch": 0.32, "learning_rate": 0.00025131703084087156, "loss": 0.0173, "step": 64330 }, { "epoch": 0.32, "learning_rate": 0.0002513094631478576, "loss": 0.0164, "step": 64340 }, { "epoch": 0.32, "learning_rate": 0.0002513018954548436, "loss": 0.0207, "step": 64350 }, { "epoch": 0.32, "learning_rate": 0.00025129432776182956, "loss": 0.0264, "step": 64360 }, { "epoch": 0.32, "learning_rate": 0.00025128676006881554, "loss": 0.0207, "step": 64370 }, { "epoch": 0.32, "learning_rate": 0.0002512791923758015, "loss": 0.0179, "step": 64380 }, { "epoch": 0.32, "learning_rate": 0.0002512716246827875, "loss": 0.0248, "step": 64390 }, { "epoch": 0.32, "learning_rate": 0.00025126405698977354, "loss": 0.0193, "step": 64400 }, { "epoch": 0.32, "learning_rate": 0.0002512564892967595, "loss": 0.0179, "step": 64410 }, { "epoch": 0.33, "learning_rate": 0.0002512489216037455, "loss": 0.0197, "step": 64420 }, { "epoch": 0.33, "learning_rate": 0.0002512413539107315, "loss": 0.0235, "step": 64430 }, { "epoch": 0.33, "learning_rate": 0.00025123378621771746, "loss": 0.0195, "step": 64440 }, { "epoch": 0.33, "learning_rate": 0.00025122621852470344, "loss": 0.0293, "step": 64450 }, { "epoch": 0.33, "learning_rate": 0.0002512186508316894, "loss": 0.0289, "step": 64460 }, { "epoch": 0.33, "learning_rate": 0.00025121108313867546, "loss": 0.0181, "step": 64470 }, { "epoch": 0.33, "learning_rate": 0.00025120351544566144, "loss": 0.0183, "step": 64480 }, { "epoch": 0.33, "learning_rate": 0.0002511959477526474, "loss": 0.0162, "step": 64490 }, { "epoch": 0.33, "learning_rate": 0.0002511883800596334, "loss": 0.0201, "step": 64500 }, { "epoch": 0.33, "learning_rate": 0.0002511808123666194, "loss": 0.0186, "step": 64510 }, { "epoch": 0.33, "learning_rate": 0.00025117324467360537, "loss": 0.0194, "step": 64520 }, { "epoch": 0.33, "learning_rate": 0.0002511656769805914, "loss": 0.0168, "step": 64530 }, { "epoch": 0.33, "learning_rate": 0.0002511581092875774, "loss": 0.0238, "step": 64540 }, { "epoch": 0.33, "learning_rate": 0.00025115054159456337, "loss": 0.0161, "step": 64550 }, { "epoch": 0.33, "learning_rate": 0.00025114297390154935, "loss": 0.0203, "step": 64560 }, { "epoch": 0.33, "learning_rate": 0.00025113540620853533, "loss": 0.0205, "step": 64570 }, { "epoch": 0.33, "learning_rate": 0.0002511278385155213, "loss": 0.0244, "step": 64580 }, { "epoch": 0.33, "learning_rate": 0.00025112027082250735, "loss": 0.0203, "step": 64590 }, { "epoch": 0.33, "learning_rate": 0.0002511127031294933, "loss": 0.0182, "step": 64600 }, { "epoch": 0.33, "learning_rate": 0.0002511051354364793, "loss": 0.0192, "step": 64610 }, { "epoch": 0.33, "learning_rate": 0.0002510975677434653, "loss": 0.0247, "step": 64620 }, { "epoch": 0.33, "learning_rate": 0.00025109000005045127, "loss": 0.019, "step": 64630 }, { "epoch": 0.33, "learning_rate": 0.00025108243235743725, "loss": 0.0199, "step": 64640 }, { "epoch": 0.33, "learning_rate": 0.00025107486466442323, "loss": 0.0221, "step": 64650 }, { "epoch": 0.33, "learning_rate": 0.00025106729697140927, "loss": 0.022, "step": 64660 }, { "epoch": 0.33, "learning_rate": 0.00025105972927839525, "loss": 0.0178, "step": 64670 }, { "epoch": 0.33, "learning_rate": 0.00025105216158538123, "loss": 0.0156, "step": 64680 }, { "epoch": 0.33, "learning_rate": 0.0002510445938923672, "loss": 0.0192, "step": 64690 }, { "epoch": 0.33, "learning_rate": 0.0002510370261993532, "loss": 0.017, "step": 64700 }, { "epoch": 0.33, "learning_rate": 0.0002510294585063392, "loss": 0.02, "step": 64710 }, { "epoch": 0.33, "learning_rate": 0.0002510218908133252, "loss": 0.0199, "step": 64720 }, { "epoch": 0.33, "learning_rate": 0.00025101432312031114, "loss": 0.0203, "step": 64730 }, { "epoch": 0.33, "learning_rate": 0.0002510067554272971, "loss": 0.0215, "step": 64740 }, { "epoch": 0.33, "learning_rate": 0.0002509991877342831, "loss": 0.0181, "step": 64750 }, { "epoch": 0.33, "learning_rate": 0.00025099162004126914, "loss": 0.0206, "step": 64760 }, { "epoch": 0.33, "learning_rate": 0.0002509840523482551, "loss": 0.0202, "step": 64770 }, { "epoch": 0.33, "learning_rate": 0.0002509764846552411, "loss": 0.0167, "step": 64780 }, { "epoch": 0.33, "learning_rate": 0.0002509689169622271, "loss": 0.0165, "step": 64790 }, { "epoch": 0.33, "learning_rate": 0.00025096134926921306, "loss": 0.022, "step": 64800 }, { "epoch": 0.33, "learning_rate": 0.00025095378157619905, "loss": 0.018, "step": 64810 }, { "epoch": 0.33, "learning_rate": 0.0002509462138831851, "loss": 0.0163, "step": 64820 }, { "epoch": 0.33, "learning_rate": 0.00025093864619017106, "loss": 0.0179, "step": 64830 }, { "epoch": 0.33, "learning_rate": 0.00025093107849715704, "loss": 0.0198, "step": 64840 }, { "epoch": 0.33, "learning_rate": 0.000250923510804143, "loss": 0.015, "step": 64850 }, { "epoch": 0.33, "learning_rate": 0.000250915943111129, "loss": 0.0222, "step": 64860 }, { "epoch": 0.33, "learning_rate": 0.000250908375418115, "loss": 0.022, "step": 64870 }, { "epoch": 0.33, "learning_rate": 0.00025090080772510097, "loss": 0.0169, "step": 64880 }, { "epoch": 0.33, "learning_rate": 0.000250893240032087, "loss": 0.0217, "step": 64890 }, { "epoch": 0.33, "learning_rate": 0.000250885672339073, "loss": 0.0205, "step": 64900 }, { "epoch": 0.33, "learning_rate": 0.00025087810464605897, "loss": 0.0174, "step": 64910 }, { "epoch": 0.33, "learning_rate": 0.00025087053695304495, "loss": 0.0171, "step": 64920 }, { "epoch": 0.33, "learning_rate": 0.00025086296926003093, "loss": 0.0178, "step": 64930 }, { "epoch": 0.33, "learning_rate": 0.0002508554015670169, "loss": 0.0178, "step": 64940 }, { "epoch": 0.33, "learning_rate": 0.00025084783387400295, "loss": 0.0192, "step": 64950 }, { "epoch": 0.33, "learning_rate": 0.00025084026618098893, "loss": 0.0181, "step": 64960 }, { "epoch": 0.33, "learning_rate": 0.0002508326984879749, "loss": 0.0183, "step": 64970 }, { "epoch": 0.33, "learning_rate": 0.0002508251307949609, "loss": 0.0263, "step": 64980 }, { "epoch": 0.33, "learning_rate": 0.0002508175631019469, "loss": 0.0171, "step": 64990 }, { "epoch": 0.33, "learning_rate": 0.00025080999540893286, "loss": 0.021, "step": 65000 }, { "epoch": 0.33, "eval_cer": 0.9144857822411687, "eval_loss": 0.013442865572869778, "eval_runtime": 116.7164, "eval_samples_per_second": 17.136, "eval_steps_per_second": 4.284, "step": 65000 }, { "epoch": 0.33, "learning_rate": 0.00025080242771591884, "loss": 0.022, "step": 65010 }, { "epoch": 0.33, "learning_rate": 0.00025079486002290487, "loss": 0.0164, "step": 65020 }, { "epoch": 0.33, "learning_rate": 0.00025078729232989085, "loss": 0.0209, "step": 65030 }, { "epoch": 0.33, "learning_rate": 0.00025077972463687684, "loss": 0.0224, "step": 65040 }, { "epoch": 0.33, "learning_rate": 0.0002507721569438628, "loss": 0.0178, "step": 65050 }, { "epoch": 0.33, "learning_rate": 0.0002507645892508488, "loss": 0.0205, "step": 65060 }, { "epoch": 0.33, "learning_rate": 0.0002507570215578348, "loss": 0.0205, "step": 65070 }, { "epoch": 0.33, "learning_rate": 0.0002507494538648208, "loss": 0.0166, "step": 65080 }, { "epoch": 0.33, "learning_rate": 0.0002507418861718068, "loss": 0.0141, "step": 65090 }, { "epoch": 0.33, "learning_rate": 0.0002507343184787928, "loss": 0.0224, "step": 65100 }, { "epoch": 0.33, "learning_rate": 0.00025072675078577876, "loss": 0.0191, "step": 65110 }, { "epoch": 0.33, "learning_rate": 0.00025071918309276474, "loss": 0.0214, "step": 65120 }, { "epoch": 0.33, "learning_rate": 0.0002507116153997507, "loss": 0.0147, "step": 65130 }, { "epoch": 0.33, "learning_rate": 0.00025070404770673676, "loss": 0.0176, "step": 65140 }, { "epoch": 0.33, "learning_rate": 0.00025069648001372274, "loss": 0.0168, "step": 65150 }, { "epoch": 0.33, "learning_rate": 0.0002506889123207087, "loss": 0.0155, "step": 65160 }, { "epoch": 0.33, "learning_rate": 0.0002506813446276947, "loss": 0.0203, "step": 65170 }, { "epoch": 0.33, "learning_rate": 0.0002506737769346807, "loss": 0.0213, "step": 65180 }, { "epoch": 0.33, "learning_rate": 0.00025066620924166667, "loss": 0.0169, "step": 65190 }, { "epoch": 0.33, "learning_rate": 0.00025065864154865265, "loss": 0.0197, "step": 65200 }, { "epoch": 0.33, "learning_rate": 0.0002506510738556387, "loss": 0.0235, "step": 65210 }, { "epoch": 0.33, "learning_rate": 0.00025064350616262466, "loss": 0.016, "step": 65220 }, { "epoch": 0.33, "learning_rate": 0.00025063593846961065, "loss": 0.0189, "step": 65230 }, { "epoch": 0.33, "learning_rate": 0.0002506283707765966, "loss": 0.0181, "step": 65240 }, { "epoch": 0.33, "learning_rate": 0.0002506208030835826, "loss": 0.0201, "step": 65250 }, { "epoch": 0.33, "learning_rate": 0.0002506132353905686, "loss": 0.0207, "step": 65260 }, { "epoch": 0.33, "learning_rate": 0.0002506056676975546, "loss": 0.018, "step": 65270 }, { "epoch": 0.33, "learning_rate": 0.0002505981000045406, "loss": 0.0186, "step": 65280 }, { "epoch": 0.33, "learning_rate": 0.0002505905323115266, "loss": 0.0237, "step": 65290 }, { "epoch": 0.33, "learning_rate": 0.00025058296461851257, "loss": 0.0265, "step": 65300 }, { "epoch": 0.33, "learning_rate": 0.00025057539692549855, "loss": 0.0166, "step": 65310 }, { "epoch": 0.33, "learning_rate": 0.00025056782923248453, "loss": 0.0183, "step": 65320 }, { "epoch": 0.33, "learning_rate": 0.00025056026153947057, "loss": 0.016, "step": 65330 }, { "epoch": 0.33, "learning_rate": 0.00025055269384645655, "loss": 0.0151, "step": 65340 }, { "epoch": 0.33, "learning_rate": 0.00025054512615344253, "loss": 0.0191, "step": 65350 }, { "epoch": 0.33, "learning_rate": 0.0002505375584604285, "loss": 0.0159, "step": 65360 }, { "epoch": 0.33, "learning_rate": 0.0002505299907674145, "loss": 0.019, "step": 65370 }, { "epoch": 0.33, "learning_rate": 0.0002505224230744005, "loss": 0.0195, "step": 65380 }, { "epoch": 0.33, "learning_rate": 0.00025051485538138646, "loss": 0.0228, "step": 65390 }, { "epoch": 0.33, "learning_rate": 0.0002505072876883725, "loss": 0.0193, "step": 65400 }, { "epoch": 0.33, "learning_rate": 0.0002504997199953585, "loss": 0.0173, "step": 65410 }, { "epoch": 0.33, "learning_rate": 0.00025049215230234446, "loss": 0.0188, "step": 65420 }, { "epoch": 0.33, "learning_rate": 0.00025048458460933044, "loss": 0.0192, "step": 65430 }, { "epoch": 0.33, "learning_rate": 0.0002504770169163164, "loss": 0.0198, "step": 65440 }, { "epoch": 0.33, "learning_rate": 0.0002504694492233024, "loss": 0.0222, "step": 65450 }, { "epoch": 0.33, "learning_rate": 0.00025046188153028844, "loss": 0.0185, "step": 65460 }, { "epoch": 0.33, "learning_rate": 0.0002504543138372744, "loss": 0.0213, "step": 65470 }, { "epoch": 0.33, "learning_rate": 0.0002504467461442604, "loss": 0.0182, "step": 65480 }, { "epoch": 0.33, "learning_rate": 0.0002504391784512464, "loss": 0.0168, "step": 65490 }, { "epoch": 0.33, "learning_rate": 0.00025043161075823236, "loss": 0.0178, "step": 65500 }, { "epoch": 0.33, "learning_rate": 0.00025042404306521834, "loss": 0.023, "step": 65510 }, { "epoch": 0.33, "learning_rate": 0.0002504164753722043, "loss": 0.0213, "step": 65520 }, { "epoch": 0.33, "learning_rate": 0.00025040890767919036, "loss": 0.0199, "step": 65530 }, { "epoch": 0.33, "learning_rate": 0.00025040133998617634, "loss": 0.0193, "step": 65540 }, { "epoch": 0.33, "learning_rate": 0.0002503937722931623, "loss": 0.018, "step": 65550 }, { "epoch": 0.33, "learning_rate": 0.0002503862046001483, "loss": 0.0307, "step": 65560 }, { "epoch": 0.33, "learning_rate": 0.0002503786369071343, "loss": 0.0172, "step": 65570 }, { "epoch": 0.33, "learning_rate": 0.00025037106921412027, "loss": 0.0179, "step": 65580 }, { "epoch": 0.33, "learning_rate": 0.0002503635015211063, "loss": 0.0171, "step": 65590 }, { "epoch": 0.33, "learning_rate": 0.0002503559338280923, "loss": 0.0225, "step": 65600 }, { "epoch": 0.33, "learning_rate": 0.00025034836613507827, "loss": 0.0174, "step": 65610 }, { "epoch": 0.33, "learning_rate": 0.00025034079844206425, "loss": 0.0236, "step": 65620 }, { "epoch": 0.33, "learning_rate": 0.00025033323074905023, "loss": 0.0174, "step": 65630 }, { "epoch": 0.33, "learning_rate": 0.0002503256630560362, "loss": 0.0196, "step": 65640 }, { "epoch": 0.33, "learning_rate": 0.00025031809536302225, "loss": 0.0177, "step": 65650 }, { "epoch": 0.33, "learning_rate": 0.0002503105276700082, "loss": 0.0194, "step": 65660 }, { "epoch": 0.33, "learning_rate": 0.0002503029599769942, "loss": 0.0185, "step": 65670 }, { "epoch": 0.33, "learning_rate": 0.0002502953922839802, "loss": 0.0229, "step": 65680 }, { "epoch": 0.33, "learning_rate": 0.00025028782459096617, "loss": 0.0224, "step": 65690 }, { "epoch": 0.33, "learning_rate": 0.00025028025689795215, "loss": 0.023, "step": 65700 }, { "epoch": 0.33, "learning_rate": 0.00025027268920493813, "loss": 0.0197, "step": 65710 }, { "epoch": 0.33, "learning_rate": 0.00025026512151192417, "loss": 0.0159, "step": 65720 }, { "epoch": 0.33, "learning_rate": 0.00025025755381891015, "loss": 0.0251, "step": 65730 }, { "epoch": 0.33, "learning_rate": 0.00025024998612589613, "loss": 0.0197, "step": 65740 }, { "epoch": 0.33, "learning_rate": 0.0002502424184328821, "loss": 0.0168, "step": 65750 }, { "epoch": 0.33, "learning_rate": 0.0002502348507398681, "loss": 0.019, "step": 65760 }, { "epoch": 0.33, "learning_rate": 0.0002502272830468541, "loss": 0.0175, "step": 65770 }, { "epoch": 0.33, "learning_rate": 0.0002502197153538401, "loss": 0.02, "step": 65780 }, { "epoch": 0.33, "learning_rate": 0.0002502121476608261, "loss": 0.0203, "step": 65790 }, { "epoch": 0.33, "learning_rate": 0.0002502045799678121, "loss": 0.023, "step": 65800 }, { "epoch": 0.33, "learning_rate": 0.00025019701227479806, "loss": 0.0184, "step": 65810 }, { "epoch": 0.33, "learning_rate": 0.00025018944458178404, "loss": 0.0244, "step": 65820 }, { "epoch": 0.33, "learning_rate": 0.00025018187688877, "loss": 0.0201, "step": 65830 }, { "epoch": 0.33, "learning_rate": 0.00025017430919575606, "loss": 0.0162, "step": 65840 }, { "epoch": 0.33, "learning_rate": 0.00025016674150274204, "loss": 0.0206, "step": 65850 }, { "epoch": 0.33, "learning_rate": 0.000250159173809728, "loss": 0.015, "step": 65860 }, { "epoch": 0.33, "learning_rate": 0.000250151606116714, "loss": 0.0178, "step": 65870 }, { "epoch": 0.33, "learning_rate": 0.0002501440384237, "loss": 0.0303, "step": 65880 }, { "epoch": 0.33, "learning_rate": 0.00025013647073068596, "loss": 0.0197, "step": 65890 }, { "epoch": 0.33, "learning_rate": 0.00025012890303767194, "loss": 0.0178, "step": 65900 }, { "epoch": 0.33, "learning_rate": 0.000250121335344658, "loss": 0.0179, "step": 65910 }, { "epoch": 0.33, "learning_rate": 0.00025011376765164396, "loss": 0.0201, "step": 65920 }, { "epoch": 0.33, "learning_rate": 0.00025010619995862994, "loss": 0.0211, "step": 65930 }, { "epoch": 0.33, "learning_rate": 0.0002500986322656159, "loss": 0.0188, "step": 65940 }, { "epoch": 0.33, "learning_rate": 0.0002500910645726019, "loss": 0.0166, "step": 65950 }, { "epoch": 0.33, "learning_rate": 0.0002500834968795879, "loss": 0.0192, "step": 65960 }, { "epoch": 0.33, "learning_rate": 0.0002500759291865739, "loss": 0.0177, "step": 65970 }, { "epoch": 0.33, "learning_rate": 0.0002500683614935599, "loss": 0.0149, "step": 65980 }, { "epoch": 0.33, "learning_rate": 0.00025006079380054583, "loss": 0.0199, "step": 65990 }, { "epoch": 0.33, "learning_rate": 0.0002500532261075318, "loss": 0.0174, "step": 66000 }, { "epoch": 0.33, "eval_cer": 0.9144324104542716, "eval_loss": 0.01361939124763012, "eval_runtime": 116.6985, "eval_samples_per_second": 17.138, "eval_steps_per_second": 4.285, "step": 66000 }, { "epoch": 0.33, "learning_rate": 0.00025004565841451785, "loss": 0.0174, "step": 66010 }, { "epoch": 0.33, "learning_rate": 0.00025003809072150383, "loss": 0.0191, "step": 66020 }, { "epoch": 0.33, "learning_rate": 0.0002500305230284898, "loss": 0.0187, "step": 66030 }, { "epoch": 0.33, "learning_rate": 0.0002500229553354758, "loss": 0.0169, "step": 66040 }, { "epoch": 0.33, "learning_rate": 0.0002500153876424618, "loss": 0.0237, "step": 66050 }, { "epoch": 0.33, "learning_rate": 0.00025000781994944776, "loss": 0.0186, "step": 66060 }, { "epoch": 0.33, "learning_rate": 0.00025000025225643374, "loss": 0.0148, "step": 66070 }, { "epoch": 0.33, "learning_rate": 0.00024999268456341977, "loss": 0.0197, "step": 66080 }, { "epoch": 0.33, "learning_rate": 0.00024998511687040575, "loss": 0.0197, "step": 66090 }, { "epoch": 0.33, "learning_rate": 0.00024997754917739174, "loss": 0.0172, "step": 66100 }, { "epoch": 0.33, "learning_rate": 0.0002499699814843777, "loss": 0.0189, "step": 66110 }, { "epoch": 0.33, "learning_rate": 0.0002499624137913637, "loss": 0.0187, "step": 66120 }, { "epoch": 0.33, "learning_rate": 0.0002499548460983497, "loss": 0.0218, "step": 66130 }, { "epoch": 0.33, "learning_rate": 0.0002499472784053357, "loss": 0.0229, "step": 66140 }, { "epoch": 0.33, "learning_rate": 0.0002499397107123217, "loss": 0.0175, "step": 66150 }, { "epoch": 0.33, "learning_rate": 0.0002499321430193077, "loss": 0.0179, "step": 66160 }, { "epoch": 0.33, "learning_rate": 0.00024992457532629366, "loss": 0.0172, "step": 66170 }, { "epoch": 0.33, "learning_rate": 0.00024991700763327964, "loss": 0.0197, "step": 66180 }, { "epoch": 0.33, "learning_rate": 0.0002499094399402656, "loss": 0.0192, "step": 66190 }, { "epoch": 0.33, "learning_rate": 0.00024990187224725166, "loss": 0.0175, "step": 66200 }, { "epoch": 0.33, "learning_rate": 0.00024989430455423764, "loss": 0.0204, "step": 66210 }, { "epoch": 0.33, "learning_rate": 0.0002498867368612236, "loss": 0.0195, "step": 66220 }, { "epoch": 0.33, "learning_rate": 0.0002498791691682096, "loss": 0.0178, "step": 66230 }, { "epoch": 0.33, "learning_rate": 0.0002498716014751956, "loss": 0.0247, "step": 66240 }, { "epoch": 0.33, "learning_rate": 0.00024986403378218157, "loss": 0.0201, "step": 66250 }, { "epoch": 0.33, "learning_rate": 0.00024985646608916755, "loss": 0.0181, "step": 66260 }, { "epoch": 0.33, "learning_rate": 0.0002498488983961536, "loss": 0.0232, "step": 66270 }, { "epoch": 0.33, "learning_rate": 0.00024984133070313956, "loss": 0.0173, "step": 66280 }, { "epoch": 0.33, "learning_rate": 0.00024983376301012555, "loss": 0.0189, "step": 66290 }, { "epoch": 0.33, "learning_rate": 0.00024982619531711153, "loss": 0.0189, "step": 66300 }, { "epoch": 0.33, "learning_rate": 0.0002498186276240975, "loss": 0.0176, "step": 66310 }, { "epoch": 0.33, "learning_rate": 0.0002498110599310835, "loss": 0.0174, "step": 66320 }, { "epoch": 0.33, "learning_rate": 0.0002498034922380695, "loss": 0.0159, "step": 66330 }, { "epoch": 0.33, "learning_rate": 0.0002497959245450555, "loss": 0.0198, "step": 66340 }, { "epoch": 0.33, "learning_rate": 0.0002497883568520415, "loss": 0.0191, "step": 66350 }, { "epoch": 0.33, "learning_rate": 0.00024978078915902747, "loss": 0.0234, "step": 66360 }, { "epoch": 0.33, "learning_rate": 0.00024977322146601345, "loss": 0.0172, "step": 66370 }, { "epoch": 0.33, "learning_rate": 0.00024976565377299943, "loss": 0.0188, "step": 66380 }, { "epoch": 0.33, "learning_rate": 0.00024975808607998547, "loss": 0.0183, "step": 66390 }, { "epoch": 0.33, "learning_rate": 0.00024975051838697145, "loss": 0.0193, "step": 66400 }, { "epoch": 0.34, "learning_rate": 0.00024974295069395743, "loss": 0.02, "step": 66410 }, { "epoch": 0.34, "learning_rate": 0.0002497353830009434, "loss": 0.0176, "step": 66420 }, { "epoch": 0.34, "learning_rate": 0.0002497278153079294, "loss": 0.0213, "step": 66430 }, { "epoch": 0.34, "learning_rate": 0.0002497202476149154, "loss": 0.0188, "step": 66440 }, { "epoch": 0.34, "learning_rate": 0.00024971267992190136, "loss": 0.018, "step": 66450 }, { "epoch": 0.34, "learning_rate": 0.0002497051122288874, "loss": 0.0194, "step": 66460 }, { "epoch": 0.34, "learning_rate": 0.0002496975445358734, "loss": 0.0144, "step": 66470 }, { "epoch": 0.34, "learning_rate": 0.00024968997684285936, "loss": 0.0178, "step": 66480 }, { "epoch": 0.34, "learning_rate": 0.00024968240914984534, "loss": 0.018, "step": 66490 }, { "epoch": 0.34, "learning_rate": 0.0002496748414568313, "loss": 0.0167, "step": 66500 }, { "epoch": 0.34, "learning_rate": 0.0002496672737638173, "loss": 0.0173, "step": 66510 }, { "epoch": 0.34, "learning_rate": 0.00024965970607080334, "loss": 0.0172, "step": 66520 }, { "epoch": 0.34, "learning_rate": 0.0002496521383777893, "loss": 0.0181, "step": 66530 }, { "epoch": 0.34, "learning_rate": 0.0002496445706847753, "loss": 0.0283, "step": 66540 }, { "epoch": 0.34, "learning_rate": 0.0002496370029917613, "loss": 0.0203, "step": 66550 }, { "epoch": 0.34, "learning_rate": 0.00024962943529874726, "loss": 0.0215, "step": 66560 }, { "epoch": 0.34, "learning_rate": 0.00024962186760573324, "loss": 0.0156, "step": 66570 }, { "epoch": 0.34, "learning_rate": 0.0002496142999127192, "loss": 0.0211, "step": 66580 }, { "epoch": 0.34, "learning_rate": 0.00024960673221970526, "loss": 0.0181, "step": 66590 }, { "epoch": 0.34, "learning_rate": 0.00024959916452669124, "loss": 0.0197, "step": 66600 }, { "epoch": 0.34, "learning_rate": 0.0002495915968336772, "loss": 0.0229, "step": 66610 }, { "epoch": 0.34, "learning_rate": 0.0002495840291406632, "loss": 0.0154, "step": 66620 }, { "epoch": 0.34, "learning_rate": 0.0002495764614476492, "loss": 0.0183, "step": 66630 }, { "epoch": 0.34, "learning_rate": 0.00024956889375463517, "loss": 0.0215, "step": 66640 }, { "epoch": 0.34, "learning_rate": 0.0002495613260616212, "loss": 0.0231, "step": 66650 }, { "epoch": 0.34, "learning_rate": 0.0002495537583686072, "loss": 0.0234, "step": 66660 }, { "epoch": 0.34, "learning_rate": 0.00024954619067559317, "loss": 0.0229, "step": 66670 }, { "epoch": 0.34, "learning_rate": 0.00024953862298257915, "loss": 0.0206, "step": 66680 }, { "epoch": 0.34, "learning_rate": 0.00024953105528956513, "loss": 0.0227, "step": 66690 }, { "epoch": 0.34, "learning_rate": 0.0002495234875965511, "loss": 0.0218, "step": 66700 }, { "epoch": 0.34, "learning_rate": 0.00024951591990353715, "loss": 0.0181, "step": 66710 }, { "epoch": 0.34, "learning_rate": 0.00024950835221052313, "loss": 0.018, "step": 66720 }, { "epoch": 0.34, "learning_rate": 0.0002495007845175091, "loss": 0.0198, "step": 66730 }, { "epoch": 0.34, "learning_rate": 0.0002494932168244951, "loss": 0.0192, "step": 66740 }, { "epoch": 0.34, "learning_rate": 0.00024948564913148107, "loss": 0.017, "step": 66750 }, { "epoch": 0.34, "learning_rate": 0.00024947808143846705, "loss": 0.0216, "step": 66760 }, { "epoch": 0.34, "learning_rate": 0.00024947051374545303, "loss": 0.0171, "step": 66770 }, { "epoch": 0.34, "learning_rate": 0.00024946294605243907, "loss": 0.0186, "step": 66780 }, { "epoch": 0.34, "learning_rate": 0.00024945537835942505, "loss": 0.0214, "step": 66790 }, { "epoch": 0.34, "learning_rate": 0.00024944781066641103, "loss": 0.0191, "step": 66800 }, { "epoch": 0.34, "learning_rate": 0.000249440242973397, "loss": 0.0166, "step": 66810 }, { "epoch": 0.34, "learning_rate": 0.000249432675280383, "loss": 0.0183, "step": 66820 }, { "epoch": 0.34, "learning_rate": 0.000249425107587369, "loss": 0.0182, "step": 66830 }, { "epoch": 0.34, "learning_rate": 0.000249417539894355, "loss": 0.019, "step": 66840 }, { "epoch": 0.34, "learning_rate": 0.000249409972201341, "loss": 0.0244, "step": 66850 }, { "epoch": 0.34, "learning_rate": 0.000249402404508327, "loss": 0.0206, "step": 66860 }, { "epoch": 0.34, "learning_rate": 0.00024939483681531296, "loss": 0.0177, "step": 66870 }, { "epoch": 0.34, "learning_rate": 0.00024938726912229894, "loss": 0.0174, "step": 66880 }, { "epoch": 0.34, "learning_rate": 0.0002493797014292849, "loss": 0.021, "step": 66890 }, { "epoch": 0.34, "learning_rate": 0.00024937213373627096, "loss": 0.0209, "step": 66900 }, { "epoch": 0.34, "learning_rate": 0.00024936456604325694, "loss": 0.0182, "step": 66910 }, { "epoch": 0.34, "learning_rate": 0.0002493569983502429, "loss": 0.0161, "step": 66920 }, { "epoch": 0.34, "learning_rate": 0.0002493494306572289, "loss": 0.0236, "step": 66930 }, { "epoch": 0.34, "learning_rate": 0.0002493418629642149, "loss": 0.0182, "step": 66940 }, { "epoch": 0.34, "learning_rate": 0.00024933429527120086, "loss": 0.0189, "step": 66950 }, { "epoch": 0.34, "learning_rate": 0.00024932672757818684, "loss": 0.0187, "step": 66960 }, { "epoch": 0.34, "learning_rate": 0.0002493191598851729, "loss": 0.0196, "step": 66970 }, { "epoch": 0.34, "learning_rate": 0.00024931159219215886, "loss": 0.0187, "step": 66980 }, { "epoch": 0.34, "learning_rate": 0.00024930402449914484, "loss": 0.0195, "step": 66990 }, { "epoch": 0.34, "learning_rate": 0.0002492964568061308, "loss": 0.017, "step": 67000 }, { "epoch": 0.34, "eval_cer": 0.9144518183767796, "eval_loss": 0.013345795683562756, "eval_runtime": 116.5962, "eval_samples_per_second": 17.153, "eval_steps_per_second": 4.288, "step": 67000 }, { "epoch": 0.34, "learning_rate": 0.0002492888891131168, "loss": 0.0192, "step": 67010 }, { "epoch": 0.34, "learning_rate": 0.0002492813214201028, "loss": 0.0234, "step": 67020 }, { "epoch": 0.34, "learning_rate": 0.0002492737537270888, "loss": 0.0155, "step": 67030 }, { "epoch": 0.34, "learning_rate": 0.0002492661860340748, "loss": 0.0181, "step": 67040 }, { "epoch": 0.34, "learning_rate": 0.0002492586183410608, "loss": 0.0186, "step": 67050 }, { "epoch": 0.34, "learning_rate": 0.00024925105064804677, "loss": 0.0213, "step": 67060 }, { "epoch": 0.34, "learning_rate": 0.00024924348295503275, "loss": 0.019, "step": 67070 }, { "epoch": 0.34, "learning_rate": 0.00024923591526201873, "loss": 0.0205, "step": 67080 }, { "epoch": 0.34, "learning_rate": 0.0002492283475690047, "loss": 0.024, "step": 67090 }, { "epoch": 0.34, "learning_rate": 0.00024922077987599075, "loss": 0.0229, "step": 67100 }, { "epoch": 0.34, "learning_rate": 0.00024921321218297673, "loss": 0.0218, "step": 67110 }, { "epoch": 0.34, "learning_rate": 0.0002492056444899627, "loss": 0.0178, "step": 67120 }, { "epoch": 0.34, "learning_rate": 0.0002491980767969487, "loss": 0.021, "step": 67130 }, { "epoch": 0.34, "learning_rate": 0.0002491905091039347, "loss": 0.0172, "step": 67140 }, { "epoch": 0.34, "learning_rate": 0.00024918294141092065, "loss": 0.0164, "step": 67150 }, { "epoch": 0.34, "learning_rate": 0.0002491753737179067, "loss": 0.0202, "step": 67160 }, { "epoch": 0.34, "learning_rate": 0.00024916780602489267, "loss": 0.0182, "step": 67170 }, { "epoch": 0.34, "learning_rate": 0.00024916023833187865, "loss": 0.0182, "step": 67180 }, { "epoch": 0.34, "learning_rate": 0.00024915267063886463, "loss": 0.0179, "step": 67190 }, { "epoch": 0.34, "learning_rate": 0.0002491451029458506, "loss": 0.0194, "step": 67200 }, { "epoch": 0.34, "learning_rate": 0.0002491375352528366, "loss": 0.0171, "step": 67210 }, { "epoch": 0.34, "learning_rate": 0.00024912996755982263, "loss": 0.0198, "step": 67220 }, { "epoch": 0.34, "learning_rate": 0.0002491223998668086, "loss": 0.0203, "step": 67230 }, { "epoch": 0.34, "learning_rate": 0.0002491148321737946, "loss": 0.0192, "step": 67240 }, { "epoch": 0.34, "learning_rate": 0.0002491072644807805, "loss": 0.0199, "step": 67250 }, { "epoch": 0.34, "learning_rate": 0.00024909969678776656, "loss": 0.0191, "step": 67260 }, { "epoch": 0.34, "learning_rate": 0.00024909212909475254, "loss": 0.0163, "step": 67270 }, { "epoch": 0.34, "learning_rate": 0.0002490845614017385, "loss": 0.0163, "step": 67280 }, { "epoch": 0.34, "learning_rate": 0.0002490769937087245, "loss": 0.017, "step": 67290 }, { "epoch": 0.34, "learning_rate": 0.0002490694260157105, "loss": 0.0186, "step": 67300 }, { "epoch": 0.34, "learning_rate": 0.00024906185832269647, "loss": 0.02, "step": 67310 }, { "epoch": 0.34, "learning_rate": 0.00024905429062968245, "loss": 0.0191, "step": 67320 }, { "epoch": 0.34, "learning_rate": 0.0002490467229366685, "loss": 0.0148, "step": 67330 }, { "epoch": 0.34, "learning_rate": 0.00024903915524365446, "loss": 0.0195, "step": 67340 }, { "epoch": 0.34, "learning_rate": 0.00024903158755064045, "loss": 0.0175, "step": 67350 }, { "epoch": 0.34, "learning_rate": 0.00024902401985762643, "loss": 0.017, "step": 67360 }, { "epoch": 0.34, "learning_rate": 0.0002490164521646124, "loss": 0.022, "step": 67370 }, { "epoch": 0.34, "learning_rate": 0.0002490088844715984, "loss": 0.02, "step": 67380 }, { "epoch": 0.34, "learning_rate": 0.0002490013167785844, "loss": 0.0252, "step": 67390 }, { "epoch": 0.34, "learning_rate": 0.0002489937490855704, "loss": 0.0201, "step": 67400 }, { "epoch": 0.34, "learning_rate": 0.0002489861813925564, "loss": 0.0216, "step": 67410 }, { "epoch": 0.34, "learning_rate": 0.00024897861369954237, "loss": 0.0163, "step": 67420 }, { "epoch": 0.34, "learning_rate": 0.00024897104600652835, "loss": 0.0193, "step": 67430 }, { "epoch": 0.34, "learning_rate": 0.00024896347831351433, "loss": 0.0193, "step": 67440 }, { "epoch": 0.34, "learning_rate": 0.00024895591062050037, "loss": 0.0163, "step": 67450 }, { "epoch": 0.34, "learning_rate": 0.00024894834292748635, "loss": 0.0163, "step": 67460 }, { "epoch": 0.34, "learning_rate": 0.00024894077523447233, "loss": 0.0185, "step": 67470 }, { "epoch": 0.34, "learning_rate": 0.0002489332075414583, "loss": 0.0225, "step": 67480 }, { "epoch": 0.34, "learning_rate": 0.0002489256398484443, "loss": 0.0176, "step": 67490 }, { "epoch": 0.34, "learning_rate": 0.0002489180721554303, "loss": 0.0166, "step": 67500 }, { "epoch": 0.34, "learning_rate": 0.00024891050446241626, "loss": 0.0199, "step": 67510 }, { "epoch": 0.34, "learning_rate": 0.0002489029367694023, "loss": 0.0205, "step": 67520 }, { "epoch": 0.34, "learning_rate": 0.0002488953690763883, "loss": 0.0201, "step": 67530 }, { "epoch": 0.34, "learning_rate": 0.00024888780138337426, "loss": 0.0173, "step": 67540 }, { "epoch": 0.34, "learning_rate": 0.00024888023369036024, "loss": 0.02, "step": 67550 }, { "epoch": 0.34, "learning_rate": 0.0002488726659973462, "loss": 0.0188, "step": 67560 }, { "epoch": 0.34, "learning_rate": 0.0002488650983043322, "loss": 0.0218, "step": 67570 }, { "epoch": 0.34, "learning_rate": 0.00024885753061131824, "loss": 0.015, "step": 67580 }, { "epoch": 0.34, "learning_rate": 0.0002488499629183042, "loss": 0.0174, "step": 67590 }, { "epoch": 0.34, "learning_rate": 0.0002488423952252902, "loss": 0.0237, "step": 67600 }, { "epoch": 0.34, "learning_rate": 0.0002488348275322762, "loss": 0.0171, "step": 67610 }, { "epoch": 0.34, "learning_rate": 0.00024882725983926216, "loss": 0.0203, "step": 67620 }, { "epoch": 0.34, "learning_rate": 0.00024881969214624814, "loss": 0.0142, "step": 67630 }, { "epoch": 0.34, "learning_rate": 0.0002488121244532342, "loss": 0.0177, "step": 67640 }, { "epoch": 0.34, "learning_rate": 0.00024880455676022016, "loss": 0.0195, "step": 67650 }, { "epoch": 0.34, "learning_rate": 0.00024879698906720614, "loss": 0.021, "step": 67660 }, { "epoch": 0.34, "learning_rate": 0.0002487894213741921, "loss": 0.0204, "step": 67670 }, { "epoch": 0.34, "learning_rate": 0.0002487818536811781, "loss": 0.0162, "step": 67680 }, { "epoch": 0.34, "learning_rate": 0.0002487742859881641, "loss": 0.0174, "step": 67690 }, { "epoch": 0.34, "learning_rate": 0.00024876671829515007, "loss": 0.0177, "step": 67700 }, { "epoch": 0.34, "learning_rate": 0.0002487591506021361, "loss": 0.0166, "step": 67710 }, { "epoch": 0.34, "learning_rate": 0.0002487515829091221, "loss": 0.0178, "step": 67720 }, { "epoch": 0.34, "learning_rate": 0.00024874401521610807, "loss": 0.0189, "step": 67730 }, { "epoch": 0.34, "learning_rate": 0.00024873644752309405, "loss": 0.0148, "step": 67740 }, { "epoch": 0.34, "learning_rate": 0.00024872887983008003, "loss": 0.0177, "step": 67750 }, { "epoch": 0.34, "learning_rate": 0.000248721312137066, "loss": 0.0181, "step": 67760 }, { "epoch": 0.34, "learning_rate": 0.00024871374444405205, "loss": 0.0165, "step": 67770 }, { "epoch": 0.34, "learning_rate": 0.00024870617675103803, "loss": 0.0261, "step": 67780 }, { "epoch": 0.34, "learning_rate": 0.000248698609058024, "loss": 0.0199, "step": 67790 }, { "epoch": 0.34, "learning_rate": 0.00024869104136501, "loss": 0.02, "step": 67800 }, { "epoch": 0.34, "learning_rate": 0.00024868347367199597, "loss": 0.0217, "step": 67810 }, { "epoch": 0.34, "learning_rate": 0.00024867590597898195, "loss": 0.0202, "step": 67820 }, { "epoch": 0.34, "learning_rate": 0.00024866833828596793, "loss": 0.0166, "step": 67830 }, { "epoch": 0.34, "learning_rate": 0.00024866077059295397, "loss": 0.0191, "step": 67840 }, { "epoch": 0.34, "learning_rate": 0.00024865320289993995, "loss": 0.0181, "step": 67850 }, { "epoch": 0.34, "learning_rate": 0.00024864563520692593, "loss": 0.0199, "step": 67860 }, { "epoch": 0.34, "learning_rate": 0.0002486380675139119, "loss": 0.019, "step": 67870 }, { "epoch": 0.34, "learning_rate": 0.0002486304998208979, "loss": 0.0182, "step": 67880 }, { "epoch": 0.34, "learning_rate": 0.0002486229321278839, "loss": 0.0155, "step": 67890 }, { "epoch": 0.34, "learning_rate": 0.0002486153644348699, "loss": 0.0169, "step": 67900 }, { "epoch": 0.34, "learning_rate": 0.0002486077967418559, "loss": 0.0171, "step": 67910 }, { "epoch": 0.34, "learning_rate": 0.0002486002290488419, "loss": 0.0227, "step": 67920 }, { "epoch": 0.34, "learning_rate": 0.00024859266135582786, "loss": 0.0201, "step": 67930 }, { "epoch": 0.34, "learning_rate": 0.00024858509366281384, "loss": 0.0165, "step": 67940 }, { "epoch": 0.34, "learning_rate": 0.0002485775259697998, "loss": 0.0154, "step": 67950 }, { "epoch": 0.34, "learning_rate": 0.00024856995827678586, "loss": 0.0165, "step": 67960 }, { "epoch": 0.34, "learning_rate": 0.00024856239058377184, "loss": 0.0199, "step": 67970 }, { "epoch": 0.34, "learning_rate": 0.0002485548228907578, "loss": 0.0166, "step": 67980 }, { "epoch": 0.34, "learning_rate": 0.0002485472551977438, "loss": 0.0178, "step": 67990 }, { "epoch": 0.34, "learning_rate": 0.0002485396875047298, "loss": 0.0206, "step": 68000 }, { "epoch": 0.34, "eval_cer": 0.9144692855070369, "eval_loss": 0.013180240988731384, "eval_runtime": 116.7123, "eval_samples_per_second": 17.136, "eval_steps_per_second": 4.284, "step": 68000 }, { "epoch": 0.34, "learning_rate": 0.00024853211981171576, "loss": 0.0169, "step": 68010 }, { "epoch": 0.34, "learning_rate": 0.00024852455211870174, "loss": 0.0189, "step": 68020 }, { "epoch": 0.34, "learning_rate": 0.0002485169844256878, "loss": 0.0172, "step": 68030 }, { "epoch": 0.34, "learning_rate": 0.00024850941673267376, "loss": 0.019, "step": 68040 }, { "epoch": 0.34, "learning_rate": 0.00024850184903965974, "loss": 0.0184, "step": 68050 }, { "epoch": 0.34, "learning_rate": 0.0002484942813466457, "loss": 0.015, "step": 68060 }, { "epoch": 0.34, "learning_rate": 0.0002484867136536317, "loss": 0.0175, "step": 68070 }, { "epoch": 0.34, "learning_rate": 0.0002484791459606177, "loss": 0.0203, "step": 68080 }, { "epoch": 0.34, "learning_rate": 0.0002484715782676037, "loss": 0.0184, "step": 68090 }, { "epoch": 0.34, "learning_rate": 0.0002484640105745897, "loss": 0.021, "step": 68100 }, { "epoch": 0.34, "learning_rate": 0.0002484564428815757, "loss": 0.0204, "step": 68110 }, { "epoch": 0.34, "learning_rate": 0.00024844887518856167, "loss": 0.0199, "step": 68120 }, { "epoch": 0.34, "learning_rate": 0.00024844130749554765, "loss": 0.0175, "step": 68130 }, { "epoch": 0.34, "learning_rate": 0.00024843373980253363, "loss": 0.0201, "step": 68140 }, { "epoch": 0.34, "learning_rate": 0.0002484261721095196, "loss": 0.0196, "step": 68150 }, { "epoch": 0.34, "learning_rate": 0.00024841860441650565, "loss": 0.0186, "step": 68160 }, { "epoch": 0.34, "learning_rate": 0.00024841103672349163, "loss": 0.0208, "step": 68170 }, { "epoch": 0.34, "learning_rate": 0.0002484034690304776, "loss": 0.0244, "step": 68180 }, { "epoch": 0.34, "learning_rate": 0.0002483959013374636, "loss": 0.0239, "step": 68190 }, { "epoch": 0.34, "learning_rate": 0.0002483883336444496, "loss": 0.0216, "step": 68200 }, { "epoch": 0.34, "learning_rate": 0.00024838076595143555, "loss": 0.0191, "step": 68210 }, { "epoch": 0.34, "learning_rate": 0.0002483731982584216, "loss": 0.0216, "step": 68220 }, { "epoch": 0.34, "learning_rate": 0.00024836563056540757, "loss": 0.0223, "step": 68230 }, { "epoch": 0.34, "learning_rate": 0.00024835806287239355, "loss": 0.0246, "step": 68240 }, { "epoch": 0.34, "learning_rate": 0.00024835049517937953, "loss": 0.0193, "step": 68250 }, { "epoch": 0.34, "learning_rate": 0.0002483429274863655, "loss": 0.0206, "step": 68260 }, { "epoch": 0.34, "learning_rate": 0.0002483353597933515, "loss": 0.0176, "step": 68270 }, { "epoch": 0.34, "learning_rate": 0.00024832779210033753, "loss": 0.0206, "step": 68280 }, { "epoch": 0.34, "learning_rate": 0.0002483202244073235, "loss": 0.0177, "step": 68290 }, { "epoch": 0.34, "learning_rate": 0.0002483126567143095, "loss": 0.0207, "step": 68300 }, { "epoch": 0.34, "learning_rate": 0.0002483050890212955, "loss": 0.0214, "step": 68310 }, { "epoch": 0.34, "learning_rate": 0.00024829752132828146, "loss": 0.0199, "step": 68320 }, { "epoch": 0.34, "learning_rate": 0.00024828995363526744, "loss": 0.0216, "step": 68330 }, { "epoch": 0.34, "learning_rate": 0.0002482823859422534, "loss": 0.0187, "step": 68340 }, { "epoch": 0.34, "learning_rate": 0.00024827481824923946, "loss": 0.0205, "step": 68350 }, { "epoch": 0.34, "learning_rate": 0.00024826725055622544, "loss": 0.0198, "step": 68360 }, { "epoch": 0.34, "learning_rate": 0.0002482596828632114, "loss": 0.0172, "step": 68370 }, { "epoch": 0.34, "learning_rate": 0.0002482521151701974, "loss": 0.0191, "step": 68380 }, { "epoch": 0.35, "learning_rate": 0.0002482445474771834, "loss": 0.0183, "step": 68390 }, { "epoch": 0.35, "learning_rate": 0.00024823697978416936, "loss": 0.0167, "step": 68400 }, { "epoch": 0.35, "learning_rate": 0.0002482294120911554, "loss": 0.0175, "step": 68410 }, { "epoch": 0.35, "learning_rate": 0.0002482218443981414, "loss": 0.0226, "step": 68420 }, { "epoch": 0.35, "learning_rate": 0.00024821427670512736, "loss": 0.0181, "step": 68430 }, { "epoch": 0.35, "learning_rate": 0.00024820670901211334, "loss": 0.0177, "step": 68440 }, { "epoch": 0.35, "learning_rate": 0.0002481991413190993, "loss": 0.0178, "step": 68450 }, { "epoch": 0.35, "learning_rate": 0.0002481915736260853, "loss": 0.0184, "step": 68460 }, { "epoch": 0.35, "learning_rate": 0.00024818400593307134, "loss": 0.0159, "step": 68470 }, { "epoch": 0.35, "learning_rate": 0.0002481764382400573, "loss": 0.0201, "step": 68480 }, { "epoch": 0.35, "learning_rate": 0.0002481688705470433, "loss": 0.0196, "step": 68490 }, { "epoch": 0.35, "learning_rate": 0.0002481613028540293, "loss": 0.0198, "step": 68500 }, { "epoch": 0.35, "learning_rate": 0.00024815373516101527, "loss": 0.0162, "step": 68510 }, { "epoch": 0.35, "learning_rate": 0.00024814616746800125, "loss": 0.0233, "step": 68520 }, { "epoch": 0.35, "learning_rate": 0.00024813859977498723, "loss": 0.0157, "step": 68530 }, { "epoch": 0.35, "learning_rate": 0.0002481310320819732, "loss": 0.0198, "step": 68540 }, { "epoch": 0.35, "learning_rate": 0.0002481234643889592, "loss": 0.0187, "step": 68550 }, { "epoch": 0.35, "learning_rate": 0.0002481158966959452, "loss": 0.0171, "step": 68560 }, { "epoch": 0.35, "learning_rate": 0.00024810832900293116, "loss": 0.014, "step": 68570 }, { "epoch": 0.35, "learning_rate": 0.0002481007613099172, "loss": 0.0164, "step": 68580 }, { "epoch": 0.35, "learning_rate": 0.0002480931936169032, "loss": 0.0158, "step": 68590 }, { "epoch": 0.35, "learning_rate": 0.00024808562592388916, "loss": 0.0178, "step": 68600 }, { "epoch": 0.35, "learning_rate": 0.00024807805823087514, "loss": 0.0215, "step": 68610 }, { "epoch": 0.35, "learning_rate": 0.0002480704905378611, "loss": 0.0182, "step": 68620 }, { "epoch": 0.35, "learning_rate": 0.0002480629228448471, "loss": 0.019, "step": 68630 }, { "epoch": 0.35, "learning_rate": 0.00024805535515183314, "loss": 0.0183, "step": 68640 }, { "epoch": 0.35, "learning_rate": 0.0002480477874588191, "loss": 0.0185, "step": 68650 }, { "epoch": 0.35, "learning_rate": 0.0002480402197658051, "loss": 0.0205, "step": 68660 }, { "epoch": 0.35, "learning_rate": 0.0002480326520727911, "loss": 0.019, "step": 68670 }, { "epoch": 0.35, "learning_rate": 0.00024802508437977706, "loss": 0.0174, "step": 68680 }, { "epoch": 0.35, "learning_rate": 0.00024801751668676304, "loss": 0.0223, "step": 68690 }, { "epoch": 0.35, "learning_rate": 0.0002480099489937491, "loss": 0.0172, "step": 68700 }, { "epoch": 0.35, "learning_rate": 0.00024800238130073506, "loss": 0.019, "step": 68710 }, { "epoch": 0.35, "learning_rate": 0.00024799481360772104, "loss": 0.0165, "step": 68720 }, { "epoch": 0.35, "learning_rate": 0.000247987245914707, "loss": 0.0224, "step": 68730 }, { "epoch": 0.35, "learning_rate": 0.000247979678221693, "loss": 0.0159, "step": 68740 }, { "epoch": 0.35, "learning_rate": 0.000247972110528679, "loss": 0.0246, "step": 68750 }, { "epoch": 0.35, "learning_rate": 0.00024796454283566497, "loss": 0.0189, "step": 68760 }, { "epoch": 0.35, "learning_rate": 0.000247956975142651, "loss": 0.0204, "step": 68770 }, { "epoch": 0.35, "learning_rate": 0.000247949407449637, "loss": 0.0139, "step": 68780 }, { "epoch": 0.35, "learning_rate": 0.00024794183975662297, "loss": 0.0155, "step": 68790 }, { "epoch": 0.35, "learning_rate": 0.00024793427206360895, "loss": 0.0197, "step": 68800 }, { "epoch": 0.35, "learning_rate": 0.00024792670437059493, "loss": 0.0176, "step": 68810 }, { "epoch": 0.35, "learning_rate": 0.0002479191366775809, "loss": 0.0352, "step": 68820 }, { "epoch": 0.35, "learning_rate": 0.00024791156898456695, "loss": 0.021, "step": 68830 }, { "epoch": 0.35, "learning_rate": 0.00024790400129155293, "loss": 0.0193, "step": 68840 }, { "epoch": 0.35, "learning_rate": 0.0002478964335985389, "loss": 0.0245, "step": 68850 }, { "epoch": 0.35, "learning_rate": 0.0002478888659055249, "loss": 0.0221, "step": 68860 }, { "epoch": 0.35, "learning_rate": 0.00024788129821251087, "loss": 0.0198, "step": 68870 }, { "epoch": 0.35, "learning_rate": 0.00024787373051949685, "loss": 0.022, "step": 68880 }, { "epoch": 0.35, "learning_rate": 0.00024786616282648283, "loss": 0.0186, "step": 68890 }, { "epoch": 0.35, "learning_rate": 0.00024785859513346887, "loss": 0.0228, "step": 68900 }, { "epoch": 0.35, "learning_rate": 0.00024785102744045485, "loss": 0.0237, "step": 68910 }, { "epoch": 0.35, "learning_rate": 0.00024784345974744083, "loss": 0.0238, "step": 68920 }, { "epoch": 0.35, "learning_rate": 0.0002478358920544268, "loss": 0.0186, "step": 68930 }, { "epoch": 0.35, "learning_rate": 0.0002478283243614128, "loss": 0.0199, "step": 68940 }, { "epoch": 0.35, "learning_rate": 0.0002478207566683988, "loss": 0.0207, "step": 68950 }, { "epoch": 0.35, "learning_rate": 0.0002478131889753848, "loss": 0.0246, "step": 68960 }, { "epoch": 0.35, "learning_rate": 0.0002478056212823708, "loss": 0.0194, "step": 68970 }, { "epoch": 0.35, "learning_rate": 0.0002477980535893568, "loss": 0.0235, "step": 68980 }, { "epoch": 0.35, "learning_rate": 0.00024779048589634276, "loss": 0.0227, "step": 68990 }, { "epoch": 0.35, "learning_rate": 0.00024778291820332874, "loss": 0.0194, "step": 69000 }, { "epoch": 0.35, "eval_cer": 0.9145119829365546, "eval_loss": 0.014301990158855915, "eval_runtime": 116.8153, "eval_samples_per_second": 17.121, "eval_steps_per_second": 4.28, "step": 69000 }, { "epoch": 0.35, "learning_rate": 0.0002477753505103147, "loss": 0.0174, "step": 69010 }, { "epoch": 0.35, "learning_rate": 0.00024776778281730076, "loss": 0.0214, "step": 69020 }, { "epoch": 0.35, "learning_rate": 0.00024776021512428674, "loss": 0.0158, "step": 69030 }, { "epoch": 0.35, "learning_rate": 0.0002477526474312727, "loss": 0.0175, "step": 69040 }, { "epoch": 0.35, "learning_rate": 0.0002477450797382587, "loss": 0.0176, "step": 69050 }, { "epoch": 0.35, "learning_rate": 0.0002477375120452447, "loss": 0.0165, "step": 69060 }, { "epoch": 0.35, "learning_rate": 0.00024772994435223066, "loss": 0.0191, "step": 69070 }, { "epoch": 0.35, "learning_rate": 0.00024772237665921665, "loss": 0.019, "step": 69080 }, { "epoch": 0.35, "learning_rate": 0.0002477148089662027, "loss": 0.0206, "step": 69090 }, { "epoch": 0.35, "learning_rate": 0.00024770724127318866, "loss": 0.0244, "step": 69100 }, { "epoch": 0.35, "learning_rate": 0.00024769967358017464, "loss": 0.0197, "step": 69110 }, { "epoch": 0.35, "learning_rate": 0.0002476921058871606, "loss": 0.0204, "step": 69120 }, { "epoch": 0.35, "learning_rate": 0.0002476845381941466, "loss": 0.0234, "step": 69130 }, { "epoch": 0.35, "learning_rate": 0.0002476769705011326, "loss": 0.0166, "step": 69140 }, { "epoch": 0.35, "learning_rate": 0.0002476694028081186, "loss": 0.0201, "step": 69150 }, { "epoch": 0.35, "learning_rate": 0.0002476618351151046, "loss": 0.0182, "step": 69160 }, { "epoch": 0.35, "learning_rate": 0.0002476542674220906, "loss": 0.0224, "step": 69170 }, { "epoch": 0.35, "learning_rate": 0.00024764669972907657, "loss": 0.0181, "step": 69180 }, { "epoch": 0.35, "learning_rate": 0.00024763913203606255, "loss": 0.0172, "step": 69190 }, { "epoch": 0.35, "learning_rate": 0.00024763156434304853, "loss": 0.0215, "step": 69200 }, { "epoch": 0.35, "learning_rate": 0.00024762399665003457, "loss": 0.016, "step": 69210 }, { "epoch": 0.35, "learning_rate": 0.00024761642895702055, "loss": 0.019, "step": 69220 }, { "epoch": 0.35, "learning_rate": 0.00024760886126400653, "loss": 0.0175, "step": 69230 }, { "epoch": 0.35, "learning_rate": 0.0002476012935709925, "loss": 0.0192, "step": 69240 }, { "epoch": 0.35, "learning_rate": 0.0002475937258779785, "loss": 0.0171, "step": 69250 }, { "epoch": 0.35, "learning_rate": 0.0002475861581849645, "loss": 0.016, "step": 69260 }, { "epoch": 0.35, "learning_rate": 0.00024757859049195046, "loss": 0.0192, "step": 69270 }, { "epoch": 0.35, "learning_rate": 0.0002475710227989365, "loss": 0.0171, "step": 69280 }, { "epoch": 0.35, "learning_rate": 0.00024756345510592247, "loss": 0.0179, "step": 69290 }, { "epoch": 0.35, "learning_rate": 0.00024755588741290845, "loss": 0.0191, "step": 69300 }, { "epoch": 0.35, "learning_rate": 0.00024754831971989444, "loss": 0.0194, "step": 69310 }, { "epoch": 0.35, "learning_rate": 0.0002475407520268804, "loss": 0.0206, "step": 69320 }, { "epoch": 0.35, "learning_rate": 0.0002475331843338664, "loss": 0.0214, "step": 69330 }, { "epoch": 0.35, "learning_rate": 0.00024752561664085243, "loss": 0.0208, "step": 69340 }, { "epoch": 0.35, "learning_rate": 0.0002475180489478384, "loss": 0.0184, "step": 69350 }, { "epoch": 0.35, "learning_rate": 0.0002475104812548244, "loss": 0.0172, "step": 69360 }, { "epoch": 0.35, "learning_rate": 0.0002475029135618104, "loss": 0.0237, "step": 69370 }, { "epoch": 0.35, "learning_rate": 0.00024749534586879636, "loss": 0.0197, "step": 69380 }, { "epoch": 0.35, "learning_rate": 0.00024748777817578234, "loss": 0.0217, "step": 69390 }, { "epoch": 0.35, "learning_rate": 0.0002474802104827683, "loss": 0.0231, "step": 69400 }, { "epoch": 0.35, "learning_rate": 0.00024747264278975436, "loss": 0.0189, "step": 69410 }, { "epoch": 0.35, "learning_rate": 0.00024746507509674034, "loss": 0.0188, "step": 69420 }, { "epoch": 0.35, "learning_rate": 0.0002474575074037263, "loss": 0.0446, "step": 69430 }, { "epoch": 0.35, "learning_rate": 0.0002474499397107123, "loss": 0.0461, "step": 69440 }, { "epoch": 0.35, "learning_rate": 0.0002474423720176983, "loss": 0.0163, "step": 69450 }, { "epoch": 0.35, "learning_rate": 0.00024743480432468427, "loss": 0.0194, "step": 69460 }, { "epoch": 0.35, "learning_rate": 0.0002474272366316703, "loss": 0.019, "step": 69470 }, { "epoch": 0.35, "learning_rate": 0.0002474196689386563, "loss": 0.0231, "step": 69480 }, { "epoch": 0.35, "learning_rate": 0.00024741210124564226, "loss": 0.017, "step": 69490 }, { "epoch": 0.35, "learning_rate": 0.00024740453355262825, "loss": 0.0185, "step": 69500 }, { "epoch": 0.35, "learning_rate": 0.0002473969658596142, "loss": 0.0169, "step": 69510 }, { "epoch": 0.35, "learning_rate": 0.0002473893981666002, "loss": 0.0238, "step": 69520 }, { "epoch": 0.35, "learning_rate": 0.00024738183047358624, "loss": 0.021, "step": 69530 }, { "epoch": 0.35, "learning_rate": 0.0002473742627805722, "loss": 0.0167, "step": 69540 }, { "epoch": 0.35, "learning_rate": 0.0002473666950875582, "loss": 0.0204, "step": 69550 }, { "epoch": 0.35, "learning_rate": 0.0002473591273945442, "loss": 0.0204, "step": 69560 }, { "epoch": 0.35, "learning_rate": 0.00024735155970153017, "loss": 0.0176, "step": 69570 }, { "epoch": 0.35, "learning_rate": 0.00024734399200851615, "loss": 0.0191, "step": 69580 }, { "epoch": 0.35, "learning_rate": 0.00024733642431550213, "loss": 0.018, "step": 69590 }, { "epoch": 0.35, "learning_rate": 0.00024732885662248817, "loss": 0.0189, "step": 69600 }, { "epoch": 0.35, "learning_rate": 0.00024732128892947415, "loss": 0.0174, "step": 69610 }, { "epoch": 0.35, "learning_rate": 0.00024731372123646013, "loss": 0.0189, "step": 69620 }, { "epoch": 0.35, "learning_rate": 0.0002473061535434461, "loss": 0.0193, "step": 69630 }, { "epoch": 0.35, "learning_rate": 0.0002472985858504321, "loss": 0.0202, "step": 69640 }, { "epoch": 0.35, "learning_rate": 0.0002472910181574181, "loss": 0.0162, "step": 69650 }, { "epoch": 0.35, "learning_rate": 0.0002472834504644041, "loss": 0.0184, "step": 69660 }, { "epoch": 0.35, "learning_rate": 0.0002472758827713901, "loss": 0.0182, "step": 69670 }, { "epoch": 0.35, "learning_rate": 0.0002472683150783761, "loss": 0.0283, "step": 69680 }, { "epoch": 0.35, "learning_rate": 0.00024726074738536206, "loss": 0.0173, "step": 69690 }, { "epoch": 0.35, "learning_rate": 0.00024725317969234804, "loss": 0.0178, "step": 69700 }, { "epoch": 0.35, "learning_rate": 0.000247245611999334, "loss": 0.0161, "step": 69710 }, { "epoch": 0.35, "learning_rate": 0.00024723804430632005, "loss": 0.0178, "step": 69720 }, { "epoch": 0.35, "learning_rate": 0.00024723047661330604, "loss": 0.0196, "step": 69730 }, { "epoch": 0.35, "learning_rate": 0.000247222908920292, "loss": 0.0208, "step": 69740 }, { "epoch": 0.35, "learning_rate": 0.000247215341227278, "loss": 0.0175, "step": 69750 }, { "epoch": 0.35, "learning_rate": 0.000247207773534264, "loss": 0.021, "step": 69760 }, { "epoch": 0.35, "learning_rate": 0.00024720020584124996, "loss": 0.0157, "step": 69770 }, { "epoch": 0.35, "learning_rate": 0.00024719263814823594, "loss": 0.017, "step": 69780 }, { "epoch": 0.35, "learning_rate": 0.0002471850704552219, "loss": 0.0225, "step": 69790 }, { "epoch": 0.35, "learning_rate": 0.0002471775027622079, "loss": 0.0189, "step": 69800 }, { "epoch": 0.35, "learning_rate": 0.0002471699350691939, "loss": 0.0204, "step": 69810 }, { "epoch": 0.35, "learning_rate": 0.00024716236737617987, "loss": 0.0194, "step": 69820 }, { "epoch": 0.35, "learning_rate": 0.0002471547996831659, "loss": 0.0211, "step": 69830 }, { "epoch": 0.35, "learning_rate": 0.0002471472319901519, "loss": 0.0197, "step": 69840 }, { "epoch": 0.35, "learning_rate": 0.00024713966429713787, "loss": 0.0183, "step": 69850 }, { "epoch": 0.35, "learning_rate": 0.00024713209660412385, "loss": 0.0153, "step": 69860 }, { "epoch": 0.35, "learning_rate": 0.00024712452891110983, "loss": 0.0213, "step": 69870 }, { "epoch": 0.35, "learning_rate": 0.0002471169612180958, "loss": 0.0205, "step": 69880 }, { "epoch": 0.35, "learning_rate": 0.00024710939352508185, "loss": 0.0184, "step": 69890 }, { "epoch": 0.35, "learning_rate": 0.00024710182583206783, "loss": 0.0185, "step": 69900 }, { "epoch": 0.35, "learning_rate": 0.0002470942581390538, "loss": 0.0186, "step": 69910 }, { "epoch": 0.35, "learning_rate": 0.0002470866904460398, "loss": 0.0167, "step": 69920 }, { "epoch": 0.35, "learning_rate": 0.00024707912275302577, "loss": 0.0193, "step": 69930 }, { "epoch": 0.35, "learning_rate": 0.00024707155506001175, "loss": 0.0223, "step": 69940 }, { "epoch": 0.35, "learning_rate": 0.00024706398736699774, "loss": 0.0167, "step": 69950 }, { "epoch": 0.35, "learning_rate": 0.00024705641967398377, "loss": 0.0175, "step": 69960 }, { "epoch": 0.35, "learning_rate": 0.00024704885198096975, "loss": 0.0165, "step": 69970 }, { "epoch": 0.35, "learning_rate": 0.00024704128428795573, "loss": 0.0174, "step": 69980 }, { "epoch": 0.35, "learning_rate": 0.0002470337165949417, "loss": 0.0218, "step": 69990 }, { "epoch": 0.35, "learning_rate": 0.0002470261489019277, "loss": 0.018, "step": 70000 }, { "epoch": 0.35, "eval_cer": 0.9144508479806542, "eval_loss": 0.013182277791202068, "eval_runtime": 116.7197, "eval_samples_per_second": 17.135, "eval_steps_per_second": 4.284, "step": 70000 }, { "epoch": 0.35, "learning_rate": 0.0002470185812089137, "loss": 0.0209, "step": 70010 }, { "epoch": 0.35, "learning_rate": 0.0002470110135158997, "loss": 0.0188, "step": 70020 }, { "epoch": 0.35, "learning_rate": 0.0002470034458228857, "loss": 0.02, "step": 70030 }, { "epoch": 0.35, "learning_rate": 0.0002469958781298717, "loss": 0.0319, "step": 70040 }, { "epoch": 0.35, "learning_rate": 0.00024698831043685766, "loss": 0.0164, "step": 70050 }, { "epoch": 0.35, "learning_rate": 0.00024698074274384364, "loss": 0.0206, "step": 70060 }, { "epoch": 0.35, "learning_rate": 0.0002469731750508296, "loss": 0.0208, "step": 70070 }, { "epoch": 0.35, "learning_rate": 0.00024696560735781566, "loss": 0.0216, "step": 70080 }, { "epoch": 0.35, "learning_rate": 0.00024695803966480164, "loss": 0.0189, "step": 70090 }, { "epoch": 0.35, "learning_rate": 0.0002469504719717876, "loss": 0.024, "step": 70100 }, { "epoch": 0.35, "learning_rate": 0.0002469429042787736, "loss": 0.0176, "step": 70110 }, { "epoch": 0.35, "learning_rate": 0.0002469353365857596, "loss": 0.0181, "step": 70120 }, { "epoch": 0.35, "learning_rate": 0.00024692776889274556, "loss": 0.0192, "step": 70130 }, { "epoch": 0.35, "learning_rate": 0.00024692020119973155, "loss": 0.0241, "step": 70140 }, { "epoch": 0.35, "learning_rate": 0.0002469126335067176, "loss": 0.0196, "step": 70150 }, { "epoch": 0.35, "learning_rate": 0.00024690506581370356, "loss": 0.0185, "step": 70160 }, { "epoch": 0.35, "learning_rate": 0.00024689749812068954, "loss": 0.0178, "step": 70170 }, { "epoch": 0.35, "learning_rate": 0.0002468899304276755, "loss": 0.0179, "step": 70180 }, { "epoch": 0.35, "learning_rate": 0.0002468823627346615, "loss": 0.0232, "step": 70190 }, { "epoch": 0.35, "learning_rate": 0.0002468747950416475, "loss": 0.0184, "step": 70200 }, { "epoch": 0.35, "learning_rate": 0.0002468672273486335, "loss": 0.0163, "step": 70210 }, { "epoch": 0.35, "learning_rate": 0.0002468596596556195, "loss": 0.0159, "step": 70220 }, { "epoch": 0.35, "learning_rate": 0.0002468520919626055, "loss": 0.0198, "step": 70230 }, { "epoch": 0.35, "learning_rate": 0.00024684452426959147, "loss": 0.0188, "step": 70240 }, { "epoch": 0.35, "learning_rate": 0.00024683695657657745, "loss": 0.0212, "step": 70250 }, { "epoch": 0.35, "learning_rate": 0.00024682938888356343, "loss": 0.0175, "step": 70260 }, { "epoch": 0.35, "learning_rate": 0.00024682182119054947, "loss": 0.0172, "step": 70270 }, { "epoch": 0.35, "learning_rate": 0.00024681425349753545, "loss": 0.0191, "step": 70280 }, { "epoch": 0.35, "learning_rate": 0.00024680668580452143, "loss": 0.0196, "step": 70290 }, { "epoch": 0.35, "learning_rate": 0.0002467991181115074, "loss": 0.0184, "step": 70300 }, { "epoch": 0.35, "learning_rate": 0.0002467915504184934, "loss": 0.0172, "step": 70310 }, { "epoch": 0.35, "learning_rate": 0.0002467839827254794, "loss": 0.0198, "step": 70320 }, { "epoch": 0.35, "learning_rate": 0.00024677641503246536, "loss": 0.0193, "step": 70330 }, { "epoch": 0.35, "learning_rate": 0.0002467688473394514, "loss": 0.0177, "step": 70340 }, { "epoch": 0.35, "learning_rate": 0.00024676127964643737, "loss": 0.017, "step": 70350 }, { "epoch": 0.35, "learning_rate": 0.00024675371195342335, "loss": 0.0191, "step": 70360 }, { "epoch": 0.36, "learning_rate": 0.00024674614426040934, "loss": 0.0194, "step": 70370 }, { "epoch": 0.36, "learning_rate": 0.0002467385765673953, "loss": 0.0163, "step": 70380 }, { "epoch": 0.36, "learning_rate": 0.0002467310088743813, "loss": 0.0163, "step": 70390 }, { "epoch": 0.36, "learning_rate": 0.00024672344118136733, "loss": 0.0186, "step": 70400 }, { "epoch": 0.36, "learning_rate": 0.0002467158734883533, "loss": 0.0175, "step": 70410 }, { "epoch": 0.36, "learning_rate": 0.0002467083057953393, "loss": 0.0164, "step": 70420 }, { "epoch": 0.36, "learning_rate": 0.0002467007381023253, "loss": 0.0178, "step": 70430 }, { "epoch": 0.36, "learning_rate": 0.00024669317040931126, "loss": 0.021, "step": 70440 }, { "epoch": 0.36, "learning_rate": 0.00024668560271629724, "loss": 0.0229, "step": 70450 }, { "epoch": 0.36, "learning_rate": 0.0002466780350232832, "loss": 0.0205, "step": 70460 }, { "epoch": 0.36, "learning_rate": 0.00024667046733026926, "loss": 0.0169, "step": 70470 }, { "epoch": 0.36, "learning_rate": 0.00024666289963725524, "loss": 0.0181, "step": 70480 }, { "epoch": 0.36, "learning_rate": 0.0002466553319442412, "loss": 0.0197, "step": 70490 }, { "epoch": 0.36, "learning_rate": 0.0002466477642512272, "loss": 0.0183, "step": 70500 }, { "epoch": 0.36, "learning_rate": 0.0002466401965582132, "loss": 0.0198, "step": 70510 }, { "epoch": 0.36, "learning_rate": 0.00024663262886519917, "loss": 0.0174, "step": 70520 }, { "epoch": 0.36, "learning_rate": 0.0002466250611721852, "loss": 0.0221, "step": 70530 }, { "epoch": 0.36, "learning_rate": 0.0002466174934791712, "loss": 0.0203, "step": 70540 }, { "epoch": 0.36, "learning_rate": 0.00024660992578615716, "loss": 0.0206, "step": 70550 }, { "epoch": 0.36, "learning_rate": 0.00024660235809314315, "loss": 0.0192, "step": 70560 }, { "epoch": 0.36, "learning_rate": 0.0002465947904001291, "loss": 0.0157, "step": 70570 }, { "epoch": 0.36, "learning_rate": 0.0002465872227071151, "loss": 0.0193, "step": 70580 }, { "epoch": 0.36, "learning_rate": 0.00024657965501410114, "loss": 0.0199, "step": 70590 }, { "epoch": 0.36, "learning_rate": 0.0002465720873210871, "loss": 0.0168, "step": 70600 }, { "epoch": 0.36, "learning_rate": 0.0002465645196280731, "loss": 0.0155, "step": 70610 }, { "epoch": 0.36, "learning_rate": 0.0002465569519350591, "loss": 0.0235, "step": 70620 }, { "epoch": 0.36, "learning_rate": 0.00024654938424204507, "loss": 0.0158, "step": 70630 }, { "epoch": 0.36, "learning_rate": 0.00024654181654903105, "loss": 0.0199, "step": 70640 }, { "epoch": 0.36, "learning_rate": 0.00024653424885601703, "loss": 0.02, "step": 70650 }, { "epoch": 0.36, "learning_rate": 0.00024652668116300307, "loss": 0.0156, "step": 70660 }, { "epoch": 0.36, "learning_rate": 0.00024651911346998905, "loss": 0.02, "step": 70670 }, { "epoch": 0.36, "learning_rate": 0.00024651154577697503, "loss": 0.0187, "step": 70680 }, { "epoch": 0.36, "learning_rate": 0.000246503978083961, "loss": 0.0175, "step": 70690 }, { "epoch": 0.36, "learning_rate": 0.000246496410390947, "loss": 0.0217, "step": 70700 }, { "epoch": 0.36, "learning_rate": 0.000246488842697933, "loss": 0.0209, "step": 70710 }, { "epoch": 0.36, "learning_rate": 0.000246481275004919, "loss": 0.0165, "step": 70720 }, { "epoch": 0.36, "learning_rate": 0.000246473707311905, "loss": 0.0153, "step": 70730 }, { "epoch": 0.36, "learning_rate": 0.000246466139618891, "loss": 0.0177, "step": 70740 }, { "epoch": 0.36, "learning_rate": 0.00024645857192587696, "loss": 0.0173, "step": 70750 }, { "epoch": 0.36, "learning_rate": 0.00024645100423286294, "loss": 0.0176, "step": 70760 }, { "epoch": 0.36, "learning_rate": 0.0002464434365398489, "loss": 0.0163, "step": 70770 }, { "epoch": 0.36, "learning_rate": 0.00024643586884683495, "loss": 0.0202, "step": 70780 }, { "epoch": 0.36, "learning_rate": 0.00024642830115382094, "loss": 0.0138, "step": 70790 }, { "epoch": 0.36, "learning_rate": 0.0002464207334608069, "loss": 0.0166, "step": 70800 }, { "epoch": 0.36, "learning_rate": 0.0002464131657677929, "loss": 0.0192, "step": 70810 }, { "epoch": 0.36, "learning_rate": 0.0002464055980747789, "loss": 0.0188, "step": 70820 }, { "epoch": 0.36, "learning_rate": 0.00024639803038176486, "loss": 0.0169, "step": 70830 }, { "epoch": 0.36, "learning_rate": 0.00024639046268875084, "loss": 0.0169, "step": 70840 }, { "epoch": 0.36, "learning_rate": 0.0002463828949957369, "loss": 0.0182, "step": 70850 }, { "epoch": 0.36, "learning_rate": 0.00024637532730272286, "loss": 0.0181, "step": 70860 }, { "epoch": 0.36, "learning_rate": 0.00024636775960970884, "loss": 0.0165, "step": 70870 }, { "epoch": 0.36, "learning_rate": 0.0002463601919166948, "loss": 0.0154, "step": 70880 }, { "epoch": 0.36, "learning_rate": 0.0002463526242236808, "loss": 0.0171, "step": 70890 }, { "epoch": 0.36, "learning_rate": 0.0002463450565306668, "loss": 0.0183, "step": 70900 }, { "epoch": 0.36, "learning_rate": 0.0002463374888376528, "loss": 0.0181, "step": 70910 }, { "epoch": 0.36, "learning_rate": 0.0002463299211446388, "loss": 0.0174, "step": 70920 }, { "epoch": 0.36, "learning_rate": 0.0002463223534516248, "loss": 0.0202, "step": 70930 }, { "epoch": 0.36, "learning_rate": 0.00024631478575861077, "loss": 0.0203, "step": 70940 }, { "epoch": 0.36, "learning_rate": 0.00024630721806559675, "loss": 0.0189, "step": 70950 }, { "epoch": 0.36, "learning_rate": 0.00024629965037258273, "loss": 0.0199, "step": 70960 }, { "epoch": 0.36, "learning_rate": 0.0002462920826795687, "loss": 0.0169, "step": 70970 }, { "epoch": 0.36, "learning_rate": 0.00024628451498655475, "loss": 0.0166, "step": 70980 }, { "epoch": 0.36, "learning_rate": 0.0002462769472935407, "loss": 0.0164, "step": 70990 }, { "epoch": 0.36, "learning_rate": 0.0002462693796005267, "loss": 0.0199, "step": 71000 }, { "epoch": 0.36, "eval_cer": 0.9145042197675514, "eval_loss": 0.013640601187944412, "eval_runtime": 116.7174, "eval_samples_per_second": 17.135, "eval_steps_per_second": 4.284, "step": 71000 }, { "epoch": 0.36, "learning_rate": 0.0002462618119075127, "loss": 0.0179, "step": 71010 }, { "epoch": 0.36, "learning_rate": 0.00024625424421449867, "loss": 0.0169, "step": 71020 }, { "epoch": 0.36, "learning_rate": 0.00024624667652148465, "loss": 0.019, "step": 71030 }, { "epoch": 0.36, "learning_rate": 0.00024623910882847063, "loss": 0.0206, "step": 71040 }, { "epoch": 0.36, "learning_rate": 0.0002462315411354566, "loss": 0.0143, "step": 71050 }, { "epoch": 0.36, "learning_rate": 0.0002462239734424426, "loss": 0.0205, "step": 71060 }, { "epoch": 0.36, "learning_rate": 0.0002462164057494286, "loss": 0.0194, "step": 71070 }, { "epoch": 0.36, "learning_rate": 0.0002462088380564146, "loss": 0.0177, "step": 71080 }, { "epoch": 0.36, "learning_rate": 0.0002462012703634006, "loss": 0.0223, "step": 71090 }, { "epoch": 0.36, "learning_rate": 0.0002461937026703866, "loss": 0.0198, "step": 71100 }, { "epoch": 0.36, "learning_rate": 0.00024618613497737256, "loss": 0.0183, "step": 71110 }, { "epoch": 0.36, "learning_rate": 0.00024617856728435854, "loss": 0.0222, "step": 71120 }, { "epoch": 0.36, "learning_rate": 0.0002461709995913445, "loss": 0.0175, "step": 71130 }, { "epoch": 0.36, "learning_rate": 0.00024616343189833056, "loss": 0.0197, "step": 71140 }, { "epoch": 0.36, "learning_rate": 0.00024615586420531654, "loss": 0.0223, "step": 71150 }, { "epoch": 0.36, "learning_rate": 0.0002461482965123025, "loss": 0.0152, "step": 71160 }, { "epoch": 0.36, "learning_rate": 0.0002461407288192885, "loss": 0.0192, "step": 71170 }, { "epoch": 0.36, "learning_rate": 0.0002461331611262745, "loss": 0.0223, "step": 71180 }, { "epoch": 0.36, "learning_rate": 0.00024612559343326046, "loss": 0.0179, "step": 71190 }, { "epoch": 0.36, "learning_rate": 0.00024611802574024645, "loss": 0.0198, "step": 71200 }, { "epoch": 0.36, "learning_rate": 0.0002461104580472325, "loss": 0.0182, "step": 71210 }, { "epoch": 0.36, "learning_rate": 0.00024610289035421846, "loss": 0.0168, "step": 71220 }, { "epoch": 0.36, "learning_rate": 0.00024609532266120444, "loss": 0.0191, "step": 71230 }, { "epoch": 0.36, "learning_rate": 0.0002460877549681904, "loss": 0.0171, "step": 71240 }, { "epoch": 0.36, "learning_rate": 0.0002460801872751764, "loss": 0.0154, "step": 71250 }, { "epoch": 0.36, "learning_rate": 0.0002460726195821624, "loss": 0.0173, "step": 71260 }, { "epoch": 0.36, "learning_rate": 0.0002460650518891484, "loss": 0.018, "step": 71270 }, { "epoch": 0.36, "learning_rate": 0.0002460574841961344, "loss": 0.018, "step": 71280 }, { "epoch": 0.36, "learning_rate": 0.0002460499165031204, "loss": 0.0166, "step": 71290 }, { "epoch": 0.36, "learning_rate": 0.00024604234881010637, "loss": 0.02, "step": 71300 }, { "epoch": 0.36, "learning_rate": 0.00024603478111709235, "loss": 0.0157, "step": 71310 }, { "epoch": 0.36, "learning_rate": 0.00024602721342407833, "loss": 0.0169, "step": 71320 }, { "epoch": 0.36, "learning_rate": 0.00024601964573106437, "loss": 0.0161, "step": 71330 }, { "epoch": 0.36, "learning_rate": 0.00024601207803805035, "loss": 0.0164, "step": 71340 }, { "epoch": 0.36, "learning_rate": 0.00024600451034503633, "loss": 0.0193, "step": 71350 }, { "epoch": 0.36, "learning_rate": 0.0002459969426520223, "loss": 0.0161, "step": 71360 }, { "epoch": 0.36, "learning_rate": 0.0002459893749590083, "loss": 0.0136, "step": 71370 }, { "epoch": 0.36, "learning_rate": 0.0002459818072659943, "loss": 0.0146, "step": 71380 }, { "epoch": 0.36, "learning_rate": 0.00024597423957298026, "loss": 0.0178, "step": 71390 }, { "epoch": 0.36, "learning_rate": 0.0002459666718799663, "loss": 0.0177, "step": 71400 }, { "epoch": 0.36, "learning_rate": 0.00024595910418695227, "loss": 0.015, "step": 71410 }, { "epoch": 0.36, "learning_rate": 0.00024595153649393825, "loss": 0.0234, "step": 71420 }, { "epoch": 0.36, "learning_rate": 0.00024594396880092424, "loss": 0.0189, "step": 71430 }, { "epoch": 0.36, "learning_rate": 0.0002459364011079102, "loss": 0.0195, "step": 71440 }, { "epoch": 0.36, "learning_rate": 0.0002459288334148962, "loss": 0.018, "step": 71450 }, { "epoch": 0.36, "learning_rate": 0.00024592126572188223, "loss": 0.0142, "step": 71460 }, { "epoch": 0.36, "learning_rate": 0.0002459136980288682, "loss": 0.0171, "step": 71470 }, { "epoch": 0.36, "learning_rate": 0.0002459061303358542, "loss": 0.018, "step": 71480 }, { "epoch": 0.36, "learning_rate": 0.0002458985626428402, "loss": 0.0163, "step": 71490 }, { "epoch": 0.36, "learning_rate": 0.00024589099494982616, "loss": 0.0148, "step": 71500 }, { "epoch": 0.36, "learning_rate": 0.00024588342725681214, "loss": 0.0154, "step": 71510 }, { "epoch": 0.36, "learning_rate": 0.0002458758595637982, "loss": 0.0158, "step": 71520 }, { "epoch": 0.36, "learning_rate": 0.00024586829187078416, "loss": 0.0192, "step": 71530 }, { "epoch": 0.36, "learning_rate": 0.00024586072417777014, "loss": 0.0162, "step": 71540 }, { "epoch": 0.36, "learning_rate": 0.0002458531564847561, "loss": 0.0189, "step": 71550 }, { "epoch": 0.36, "learning_rate": 0.0002458455887917421, "loss": 0.0136, "step": 71560 }, { "epoch": 0.36, "learning_rate": 0.0002458380210987281, "loss": 0.0169, "step": 71570 }, { "epoch": 0.36, "learning_rate": 0.00024583045340571407, "loss": 0.018, "step": 71580 }, { "epoch": 0.36, "learning_rate": 0.0002458228857127001, "loss": 0.0199, "step": 71590 }, { "epoch": 0.36, "learning_rate": 0.0002458153180196861, "loss": 0.0157, "step": 71600 }, { "epoch": 0.36, "learning_rate": 0.00024580775032667206, "loss": 0.0174, "step": 71610 }, { "epoch": 0.36, "learning_rate": 0.00024580018263365805, "loss": 0.0175, "step": 71620 }, { "epoch": 0.36, "learning_rate": 0.000245792614940644, "loss": 0.0184, "step": 71630 }, { "epoch": 0.36, "learning_rate": 0.00024578504724763, "loss": 0.0176, "step": 71640 }, { "epoch": 0.36, "learning_rate": 0.00024577747955461604, "loss": 0.0222, "step": 71650 }, { "epoch": 0.36, "learning_rate": 0.000245769911861602, "loss": 0.0182, "step": 71660 }, { "epoch": 0.36, "learning_rate": 0.000245762344168588, "loss": 0.0146, "step": 71670 }, { "epoch": 0.36, "learning_rate": 0.000245754776475574, "loss": 0.018, "step": 71680 }, { "epoch": 0.36, "learning_rate": 0.00024574720878255997, "loss": 0.0151, "step": 71690 }, { "epoch": 0.36, "learning_rate": 0.00024573964108954595, "loss": 0.0177, "step": 71700 }, { "epoch": 0.36, "learning_rate": 0.00024573207339653193, "loss": 0.0204, "step": 71710 }, { "epoch": 0.36, "learning_rate": 0.00024572450570351797, "loss": 0.0163, "step": 71720 }, { "epoch": 0.36, "learning_rate": 0.00024571693801050395, "loss": 0.0202, "step": 71730 }, { "epoch": 0.36, "learning_rate": 0.00024570937031748993, "loss": 0.017, "step": 71740 }, { "epoch": 0.36, "learning_rate": 0.0002457018026244759, "loss": 0.0207, "step": 71750 }, { "epoch": 0.36, "learning_rate": 0.0002456942349314619, "loss": 0.0169, "step": 71760 }, { "epoch": 0.36, "learning_rate": 0.0002456866672384479, "loss": 0.0184, "step": 71770 }, { "epoch": 0.36, "learning_rate": 0.0002456790995454339, "loss": 0.0186, "step": 71780 }, { "epoch": 0.36, "learning_rate": 0.0002456715318524199, "loss": 0.0152, "step": 71790 }, { "epoch": 0.36, "learning_rate": 0.0002456639641594059, "loss": 0.0157, "step": 71800 }, { "epoch": 0.36, "learning_rate": 0.00024565639646639186, "loss": 0.0204, "step": 71810 }, { "epoch": 0.36, "learning_rate": 0.00024564882877337784, "loss": 0.0197, "step": 71820 }, { "epoch": 0.36, "learning_rate": 0.0002456412610803638, "loss": 0.0185, "step": 71830 }, { "epoch": 0.36, "learning_rate": 0.00024563369338734985, "loss": 0.0177, "step": 71840 }, { "epoch": 0.36, "learning_rate": 0.00024562612569433584, "loss": 0.0259, "step": 71850 }, { "epoch": 0.36, "learning_rate": 0.0002456185580013218, "loss": 0.0205, "step": 71860 }, { "epoch": 0.36, "learning_rate": 0.0002456109903083078, "loss": 0.0149, "step": 71870 }, { "epoch": 0.36, "learning_rate": 0.0002456034226152938, "loss": 0.018, "step": 71880 }, { "epoch": 0.36, "learning_rate": 0.00024559585492227976, "loss": 0.0192, "step": 71890 }, { "epoch": 0.36, "learning_rate": 0.00024558828722926574, "loss": 0.0223, "step": 71900 }, { "epoch": 0.36, "learning_rate": 0.0002455807195362518, "loss": 0.0208, "step": 71910 }, { "epoch": 0.36, "learning_rate": 0.00024557315184323776, "loss": 0.0185, "step": 71920 }, { "epoch": 0.36, "learning_rate": 0.00024556558415022374, "loss": 0.0226, "step": 71930 }, { "epoch": 0.36, "learning_rate": 0.0002455580164572097, "loss": 0.0202, "step": 71940 }, { "epoch": 0.36, "learning_rate": 0.0002455504487641957, "loss": 0.0139, "step": 71950 }, { "epoch": 0.36, "learning_rate": 0.0002455428810711817, "loss": 0.02, "step": 71960 }, { "epoch": 0.36, "learning_rate": 0.0002455353133781677, "loss": 0.0159, "step": 71970 }, { "epoch": 0.36, "learning_rate": 0.0002455277456851537, "loss": 0.0186, "step": 71980 }, { "epoch": 0.36, "learning_rate": 0.0002455201779921397, "loss": 0.0174, "step": 71990 }, { "epoch": 0.36, "learning_rate": 0.00024551261029912567, "loss": 0.0187, "step": 72000 }, { "epoch": 0.36, "eval_cer": 0.9144828710527925, "eval_loss": 0.013233224861323833, "eval_runtime": 116.7335, "eval_samples_per_second": 17.133, "eval_steps_per_second": 4.283, "step": 72000 }, { "epoch": 0.36, "learning_rate": 0.00024550504260611165, "loss": 0.0232, "step": 72010 }, { "epoch": 0.36, "learning_rate": 0.00024549747491309763, "loss": 0.0183, "step": 72020 }, { "epoch": 0.36, "learning_rate": 0.0002454899072200836, "loss": 0.0155, "step": 72030 }, { "epoch": 0.36, "learning_rate": 0.00024548233952706965, "loss": 0.0159, "step": 72040 }, { "epoch": 0.36, "learning_rate": 0.00024547477183405563, "loss": 0.0276, "step": 72050 }, { "epoch": 0.36, "learning_rate": 0.0002454672041410416, "loss": 0.0188, "step": 72060 }, { "epoch": 0.36, "learning_rate": 0.0002454596364480276, "loss": 0.018, "step": 72070 }, { "epoch": 0.36, "learning_rate": 0.00024545206875501357, "loss": 0.0171, "step": 72080 }, { "epoch": 0.36, "learning_rate": 0.00024544450106199955, "loss": 0.0187, "step": 72090 }, { "epoch": 0.36, "learning_rate": 0.0002454369333689856, "loss": 0.0166, "step": 72100 }, { "epoch": 0.36, "learning_rate": 0.00024542936567597157, "loss": 0.0169, "step": 72110 }, { "epoch": 0.36, "learning_rate": 0.00024542179798295755, "loss": 0.0223, "step": 72120 }, { "epoch": 0.36, "learning_rate": 0.00024541423028994353, "loss": 0.016, "step": 72130 }, { "epoch": 0.36, "learning_rate": 0.0002454066625969295, "loss": 0.0205, "step": 72140 }, { "epoch": 0.36, "learning_rate": 0.0002453990949039155, "loss": 0.0174, "step": 72150 }, { "epoch": 0.36, "learning_rate": 0.00024539152721090153, "loss": 0.0176, "step": 72160 }, { "epoch": 0.36, "learning_rate": 0.0002453839595178875, "loss": 0.0159, "step": 72170 }, { "epoch": 0.36, "learning_rate": 0.0002453763918248735, "loss": 0.0234, "step": 72180 }, { "epoch": 0.36, "learning_rate": 0.0002453688241318595, "loss": 0.0204, "step": 72190 }, { "epoch": 0.36, "learning_rate": 0.00024536125643884546, "loss": 0.0193, "step": 72200 }, { "epoch": 0.36, "learning_rate": 0.00024535368874583144, "loss": 0.0159, "step": 72210 }, { "epoch": 0.36, "learning_rate": 0.0002453461210528174, "loss": 0.0206, "step": 72220 }, { "epoch": 0.36, "learning_rate": 0.00024533855335980346, "loss": 0.0177, "step": 72230 }, { "epoch": 0.36, "learning_rate": 0.00024533098566678944, "loss": 0.0162, "step": 72240 }, { "epoch": 0.36, "learning_rate": 0.0002453234179737754, "loss": 0.0202, "step": 72250 }, { "epoch": 0.36, "learning_rate": 0.0002453158502807614, "loss": 0.0214, "step": 72260 }, { "epoch": 0.36, "learning_rate": 0.0002453082825877474, "loss": 0.0204, "step": 72270 }, { "epoch": 0.36, "learning_rate": 0.00024530071489473336, "loss": 0.022, "step": 72280 }, { "epoch": 0.36, "learning_rate": 0.00024529314720171934, "loss": 0.018, "step": 72290 }, { "epoch": 0.36, "learning_rate": 0.0002452855795087053, "loss": 0.0162, "step": 72300 }, { "epoch": 0.36, "learning_rate": 0.0002452780118156913, "loss": 0.0165, "step": 72310 }, { "epoch": 0.36, "learning_rate": 0.0002452704441226773, "loss": 0.0187, "step": 72320 }, { "epoch": 0.36, "learning_rate": 0.0002452628764296633, "loss": 0.0176, "step": 72330 }, { "epoch": 0.36, "learning_rate": 0.0002452553087366493, "loss": 0.0206, "step": 72340 }, { "epoch": 0.37, "learning_rate": 0.0002452477410436353, "loss": 0.0183, "step": 72350 }, { "epoch": 0.37, "learning_rate": 0.00024524017335062127, "loss": 0.0208, "step": 72360 }, { "epoch": 0.37, "learning_rate": 0.00024523260565760725, "loss": 0.0177, "step": 72370 }, { "epoch": 0.37, "learning_rate": 0.00024522503796459323, "loss": 0.0196, "step": 72380 }, { "epoch": 0.37, "learning_rate": 0.00024521747027157927, "loss": 0.0188, "step": 72390 }, { "epoch": 0.37, "learning_rate": 0.00024520990257856525, "loss": 0.0192, "step": 72400 }, { "epoch": 0.37, "learning_rate": 0.00024520233488555123, "loss": 0.0187, "step": 72410 }, { "epoch": 0.37, "learning_rate": 0.0002451947671925372, "loss": 0.0208, "step": 72420 }, { "epoch": 0.37, "learning_rate": 0.0002451871994995232, "loss": 0.0172, "step": 72430 }, { "epoch": 0.37, "learning_rate": 0.0002451796318065092, "loss": 0.014, "step": 72440 }, { "epoch": 0.37, "learning_rate": 0.00024517206411349516, "loss": 0.0155, "step": 72450 }, { "epoch": 0.37, "learning_rate": 0.0002451644964204812, "loss": 0.0216, "step": 72460 }, { "epoch": 0.37, "learning_rate": 0.0002451569287274672, "loss": 0.0186, "step": 72470 }, { "epoch": 0.37, "learning_rate": 0.00024514936103445315, "loss": 0.0172, "step": 72480 }, { "epoch": 0.37, "learning_rate": 0.00024514179334143914, "loss": 0.0171, "step": 72490 }, { "epoch": 0.37, "learning_rate": 0.0002451342256484251, "loss": 0.0176, "step": 72500 }, { "epoch": 0.37, "learning_rate": 0.0002451266579554111, "loss": 0.0187, "step": 72510 }, { "epoch": 0.37, "learning_rate": 0.00024511909026239713, "loss": 0.0176, "step": 72520 }, { "epoch": 0.37, "learning_rate": 0.0002451115225693831, "loss": 0.0181, "step": 72530 }, { "epoch": 0.37, "learning_rate": 0.0002451039548763691, "loss": 0.017, "step": 72540 }, { "epoch": 0.37, "learning_rate": 0.0002450963871833551, "loss": 0.0195, "step": 72550 }, { "epoch": 0.37, "learning_rate": 0.00024508881949034106, "loss": 0.017, "step": 72560 }, { "epoch": 0.37, "learning_rate": 0.00024508125179732704, "loss": 0.0172, "step": 72570 }, { "epoch": 0.37, "learning_rate": 0.0002450736841043131, "loss": 0.0167, "step": 72580 }, { "epoch": 0.37, "learning_rate": 0.00024506611641129906, "loss": 0.0177, "step": 72590 }, { "epoch": 0.37, "learning_rate": 0.00024505854871828504, "loss": 0.0207, "step": 72600 }, { "epoch": 0.37, "learning_rate": 0.000245050981025271, "loss": 0.0173, "step": 72610 }, { "epoch": 0.37, "learning_rate": 0.000245043413332257, "loss": 0.0189, "step": 72620 }, { "epoch": 0.37, "learning_rate": 0.000245035845639243, "loss": 0.0203, "step": 72630 }, { "epoch": 0.37, "learning_rate": 0.00024502827794622897, "loss": 0.0175, "step": 72640 }, { "epoch": 0.37, "learning_rate": 0.000245020710253215, "loss": 0.0169, "step": 72650 }, { "epoch": 0.37, "learning_rate": 0.000245013142560201, "loss": 0.0185, "step": 72660 }, { "epoch": 0.37, "learning_rate": 0.00024500557486718696, "loss": 0.0178, "step": 72670 }, { "epoch": 0.37, "learning_rate": 0.00024499800717417295, "loss": 0.0239, "step": 72680 }, { "epoch": 0.37, "learning_rate": 0.00024499043948115893, "loss": 0.017, "step": 72690 }, { "epoch": 0.37, "learning_rate": 0.0002449828717881449, "loss": 0.0188, "step": 72700 }, { "epoch": 0.37, "learning_rate": 0.00024497530409513094, "loss": 0.0202, "step": 72710 }, { "epoch": 0.37, "learning_rate": 0.0002449677364021169, "loss": 0.019, "step": 72720 }, { "epoch": 0.37, "learning_rate": 0.0002449601687091029, "loss": 0.0186, "step": 72730 }, { "epoch": 0.37, "learning_rate": 0.0002449526010160889, "loss": 0.0184, "step": 72740 }, { "epoch": 0.37, "learning_rate": 0.00024494503332307487, "loss": 0.019, "step": 72750 }, { "epoch": 0.37, "learning_rate": 0.00024493746563006085, "loss": 0.0173, "step": 72760 }, { "epoch": 0.37, "learning_rate": 0.00024492989793704683, "loss": 0.0173, "step": 72770 }, { "epoch": 0.37, "learning_rate": 0.00024492233024403287, "loss": 0.0162, "step": 72780 }, { "epoch": 0.37, "learning_rate": 0.00024491476255101885, "loss": 0.0173, "step": 72790 }, { "epoch": 0.37, "learning_rate": 0.00024490719485800483, "loss": 0.0195, "step": 72800 }, { "epoch": 0.37, "learning_rate": 0.0002448996271649908, "loss": 0.0162, "step": 72810 }, { "epoch": 0.37, "learning_rate": 0.0002448920594719768, "loss": 0.0175, "step": 72820 }, { "epoch": 0.37, "learning_rate": 0.0002448844917789628, "loss": 0.018, "step": 72830 }, { "epoch": 0.37, "learning_rate": 0.0002448769240859488, "loss": 0.0211, "step": 72840 }, { "epoch": 0.37, "learning_rate": 0.0002448693563929348, "loss": 0.0163, "step": 72850 }, { "epoch": 0.37, "learning_rate": 0.0002448617886999208, "loss": 0.0193, "step": 72860 }, { "epoch": 0.37, "learning_rate": 0.00024485422100690676, "loss": 0.0187, "step": 72870 }, { "epoch": 0.37, "learning_rate": 0.00024484665331389274, "loss": 0.0232, "step": 72880 }, { "epoch": 0.37, "learning_rate": 0.0002448390856208787, "loss": 0.0195, "step": 72890 }, { "epoch": 0.37, "learning_rate": 0.00024483151792786475, "loss": 0.0167, "step": 72900 }, { "epoch": 0.37, "learning_rate": 0.00024482395023485074, "loss": 0.0166, "step": 72910 }, { "epoch": 0.37, "learning_rate": 0.0002448163825418367, "loss": 0.0203, "step": 72920 }, { "epoch": 0.37, "learning_rate": 0.0002448088148488227, "loss": 0.0204, "step": 72930 }, { "epoch": 0.37, "learning_rate": 0.0002448012471558087, "loss": 0.0184, "step": 72940 }, { "epoch": 0.37, "learning_rate": 0.00024479367946279466, "loss": 0.0207, "step": 72950 }, { "epoch": 0.37, "learning_rate": 0.00024478611176978064, "loss": 0.0193, "step": 72960 }, { "epoch": 0.37, "learning_rate": 0.0002447785440767667, "loss": 0.0165, "step": 72970 }, { "epoch": 0.37, "learning_rate": 0.00024477097638375266, "loss": 0.0158, "step": 72980 }, { "epoch": 0.37, "learning_rate": 0.00024476340869073864, "loss": 0.0159, "step": 72990 }, { "epoch": 0.37, "learning_rate": 0.0002447558409977246, "loss": 0.02, "step": 73000 }, { "epoch": 0.37, "eval_cer": 0.9145197461055578, "eval_loss": 0.013241157867014408, "eval_runtime": 116.696, "eval_samples_per_second": 17.139, "eval_steps_per_second": 4.285, "step": 73000 }, { "epoch": 0.37, "learning_rate": 0.0002447482733047106, "loss": 0.019, "step": 73010 }, { "epoch": 0.37, "learning_rate": 0.0002447407056116966, "loss": 0.0194, "step": 73020 }, { "epoch": 0.37, "learning_rate": 0.0002447331379186826, "loss": 0.0166, "step": 73030 }, { "epoch": 0.37, "learning_rate": 0.0002447255702256686, "loss": 0.0193, "step": 73040 }, { "epoch": 0.37, "learning_rate": 0.0002447180025326546, "loss": 0.0232, "step": 73050 }, { "epoch": 0.37, "learning_rate": 0.00024471043483964057, "loss": 0.0167, "step": 73060 }, { "epoch": 0.37, "learning_rate": 0.00024470286714662655, "loss": 0.0205, "step": 73070 }, { "epoch": 0.37, "learning_rate": 0.00024469529945361253, "loss": 0.0195, "step": 73080 }, { "epoch": 0.37, "learning_rate": 0.00024468773176059856, "loss": 0.0181, "step": 73090 }, { "epoch": 0.37, "learning_rate": 0.00024468016406758455, "loss": 0.018, "step": 73100 }, { "epoch": 0.37, "learning_rate": 0.00024467259637457053, "loss": 0.0291, "step": 73110 }, { "epoch": 0.37, "learning_rate": 0.0002446650286815565, "loss": 0.0198, "step": 73120 }, { "epoch": 0.37, "learning_rate": 0.0002446574609885425, "loss": 0.0162, "step": 73130 }, { "epoch": 0.37, "learning_rate": 0.00024464989329552847, "loss": 0.0184, "step": 73140 }, { "epoch": 0.37, "learning_rate": 0.00024464232560251445, "loss": 0.0188, "step": 73150 }, { "epoch": 0.37, "learning_rate": 0.0002446347579095005, "loss": 0.0174, "step": 73160 }, { "epoch": 0.37, "learning_rate": 0.00024462719021648647, "loss": 0.0233, "step": 73170 }, { "epoch": 0.37, "learning_rate": 0.00024461962252347245, "loss": 0.0152, "step": 73180 }, { "epoch": 0.37, "learning_rate": 0.00024461205483045843, "loss": 0.0173, "step": 73190 }, { "epoch": 0.37, "learning_rate": 0.0002446044871374444, "loss": 0.0244, "step": 73200 }, { "epoch": 0.37, "learning_rate": 0.0002445969194444304, "loss": 0.0183, "step": 73210 }, { "epoch": 0.37, "learning_rate": 0.00024458935175141643, "loss": 0.0193, "step": 73220 }, { "epoch": 0.37, "learning_rate": 0.0002445817840584024, "loss": 0.0149, "step": 73230 }, { "epoch": 0.37, "learning_rate": 0.0002445742163653884, "loss": 0.0188, "step": 73240 }, { "epoch": 0.37, "learning_rate": 0.0002445666486723744, "loss": 0.0194, "step": 73250 }, { "epoch": 0.37, "learning_rate": 0.00024455908097936036, "loss": 0.0158, "step": 73260 }, { "epoch": 0.37, "learning_rate": 0.00024455151328634634, "loss": 0.0166, "step": 73270 }, { "epoch": 0.37, "learning_rate": 0.0002445439455933323, "loss": 0.014, "step": 73280 }, { "epoch": 0.37, "learning_rate": 0.00024453637790031836, "loss": 0.0207, "step": 73290 }, { "epoch": 0.37, "learning_rate": 0.00024452881020730434, "loss": 0.0232, "step": 73300 }, { "epoch": 0.37, "learning_rate": 0.0002445212425142903, "loss": 0.0151, "step": 73310 }, { "epoch": 0.37, "learning_rate": 0.0002445136748212763, "loss": 0.0191, "step": 73320 }, { "epoch": 0.37, "learning_rate": 0.0002445061071282623, "loss": 0.021, "step": 73330 }, { "epoch": 0.37, "learning_rate": 0.00024449853943524826, "loss": 0.0165, "step": 73340 }, { "epoch": 0.37, "learning_rate": 0.0002444909717422343, "loss": 0.0135, "step": 73350 }, { "epoch": 0.37, "learning_rate": 0.0002444834040492203, "loss": 0.0145, "step": 73360 }, { "epoch": 0.37, "learning_rate": 0.00024447583635620626, "loss": 0.0177, "step": 73370 }, { "epoch": 0.37, "learning_rate": 0.00024446826866319224, "loss": 0.0165, "step": 73380 }, { "epoch": 0.37, "learning_rate": 0.0002444607009701782, "loss": 0.0203, "step": 73390 }, { "epoch": 0.37, "learning_rate": 0.0002444531332771642, "loss": 0.0139, "step": 73400 }, { "epoch": 0.37, "learning_rate": 0.00024444556558415024, "loss": 0.014, "step": 73410 }, { "epoch": 0.37, "learning_rate": 0.0002444379978911362, "loss": 0.019, "step": 73420 }, { "epoch": 0.37, "learning_rate": 0.0002444304301981222, "loss": 0.0149, "step": 73430 }, { "epoch": 0.37, "learning_rate": 0.0002444228625051082, "loss": 0.0173, "step": 73440 }, { "epoch": 0.37, "learning_rate": 0.00024441529481209417, "loss": 0.0219, "step": 73450 }, { "epoch": 0.37, "learning_rate": 0.00024440772711908015, "loss": 0.0178, "step": 73460 }, { "epoch": 0.37, "learning_rate": 0.00024440015942606613, "loss": 0.0198, "step": 73470 }, { "epoch": 0.37, "learning_rate": 0.00024439259173305217, "loss": 0.0182, "step": 73480 }, { "epoch": 0.37, "learning_rate": 0.00024438502404003815, "loss": 0.0175, "step": 73490 }, { "epoch": 0.37, "learning_rate": 0.00024437745634702413, "loss": 0.024, "step": 73500 }, { "epoch": 0.37, "learning_rate": 0.0002443698886540101, "loss": 0.0177, "step": 73510 }, { "epoch": 0.37, "learning_rate": 0.0002443623209609961, "loss": 0.0212, "step": 73520 }, { "epoch": 0.37, "learning_rate": 0.0002443547532679821, "loss": 0.0182, "step": 73530 }, { "epoch": 0.37, "learning_rate": 0.00024434718557496805, "loss": 0.0156, "step": 73540 }, { "epoch": 0.37, "learning_rate": 0.00024433961788195404, "loss": 0.0179, "step": 73550 }, { "epoch": 0.37, "learning_rate": 0.00024433205018894, "loss": 0.0374, "step": 73560 }, { "epoch": 0.37, "learning_rate": 0.000244324482495926, "loss": 0.0162, "step": 73570 }, { "epoch": 0.37, "learning_rate": 0.00024431691480291203, "loss": 0.0173, "step": 73580 }, { "epoch": 0.37, "learning_rate": 0.000244309347109898, "loss": 0.0174, "step": 73590 }, { "epoch": 0.37, "learning_rate": 0.000244301779416884, "loss": 0.0173, "step": 73600 }, { "epoch": 0.37, "learning_rate": 0.00024429421172387, "loss": 0.0218, "step": 73610 }, { "epoch": 0.37, "learning_rate": 0.00024428664403085596, "loss": 0.019, "step": 73620 }, { "epoch": 0.37, "learning_rate": 0.00024427907633784194, "loss": 0.0197, "step": 73630 }, { "epoch": 0.37, "learning_rate": 0.000244271508644828, "loss": 0.0195, "step": 73640 }, { "epoch": 0.37, "learning_rate": 0.00024426394095181396, "loss": 0.0201, "step": 73650 }, { "epoch": 0.37, "learning_rate": 0.00024425637325879994, "loss": 0.0203, "step": 73660 }, { "epoch": 0.37, "learning_rate": 0.0002442488055657859, "loss": 0.02, "step": 73670 }, { "epoch": 0.37, "learning_rate": 0.0002442412378727719, "loss": 0.0148, "step": 73680 }, { "epoch": 0.37, "learning_rate": 0.0002442336701797579, "loss": 0.0149, "step": 73690 }, { "epoch": 0.37, "learning_rate": 0.00024422610248674387, "loss": 0.0186, "step": 73700 }, { "epoch": 0.37, "learning_rate": 0.0002442185347937299, "loss": 0.0163, "step": 73710 }, { "epoch": 0.37, "learning_rate": 0.0002442109671007159, "loss": 0.0183, "step": 73720 }, { "epoch": 0.37, "learning_rate": 0.00024420339940770186, "loss": 0.0192, "step": 73730 }, { "epoch": 0.37, "learning_rate": 0.00024419583171468785, "loss": 0.0192, "step": 73740 }, { "epoch": 0.37, "learning_rate": 0.00024418826402167383, "loss": 0.0179, "step": 73750 }, { "epoch": 0.37, "learning_rate": 0.0002441806963286598, "loss": 0.0192, "step": 73760 }, { "epoch": 0.37, "learning_rate": 0.00024417312863564584, "loss": 0.0169, "step": 73770 }, { "epoch": 0.37, "learning_rate": 0.0002441655609426318, "loss": 0.0166, "step": 73780 }, { "epoch": 0.37, "learning_rate": 0.0002441579932496178, "loss": 0.0153, "step": 73790 }, { "epoch": 0.37, "learning_rate": 0.0002441504255566038, "loss": 0.0178, "step": 73800 }, { "epoch": 0.37, "learning_rate": 0.00024414285786358977, "loss": 0.0184, "step": 73810 }, { "epoch": 0.37, "learning_rate": 0.00024413529017057578, "loss": 0.0177, "step": 73820 }, { "epoch": 0.37, "learning_rate": 0.00024412772247756176, "loss": 0.0185, "step": 73830 }, { "epoch": 0.37, "learning_rate": 0.00024412015478454774, "loss": 0.0203, "step": 73840 }, { "epoch": 0.37, "learning_rate": 0.00024411258709153375, "loss": 0.0168, "step": 73850 }, { "epoch": 0.37, "learning_rate": 0.00024410501939851973, "loss": 0.0186, "step": 73860 }, { "epoch": 0.37, "learning_rate": 0.0002440974517055057, "loss": 0.0192, "step": 73870 }, { "epoch": 0.37, "learning_rate": 0.00024408988401249172, "loss": 0.019, "step": 73880 }, { "epoch": 0.37, "learning_rate": 0.0002440823163194777, "loss": 0.015, "step": 73890 }, { "epoch": 0.37, "learning_rate": 0.00024407474862646368, "loss": 0.0198, "step": 73900 }, { "epoch": 0.37, "learning_rate": 0.00024406718093344967, "loss": 0.0203, "step": 73910 }, { "epoch": 0.37, "learning_rate": 0.00024405961324043567, "loss": 0.0176, "step": 73920 }, { "epoch": 0.37, "learning_rate": 0.00024405204554742166, "loss": 0.0169, "step": 73930 }, { "epoch": 0.37, "learning_rate": 0.00024404447785440764, "loss": 0.017, "step": 73940 }, { "epoch": 0.37, "learning_rate": 0.00024403691016139365, "loss": 0.0188, "step": 73950 }, { "epoch": 0.37, "learning_rate": 0.00024402934246837963, "loss": 0.0181, "step": 73960 }, { "epoch": 0.37, "learning_rate": 0.0002440217747753656, "loss": 0.0174, "step": 73970 }, { "epoch": 0.37, "learning_rate": 0.00024401420708235162, "loss": 0.0171, "step": 73980 }, { "epoch": 0.37, "learning_rate": 0.0002440066393893376, "loss": 0.0221, "step": 73990 }, { "epoch": 0.37, "learning_rate": 0.00024399907169632358, "loss": 0.02, "step": 74000 }, { "epoch": 0.37, "eval_cer": 0.9144848118450433, "eval_loss": 0.012880527414381504, "eval_runtime": 116.6543, "eval_samples_per_second": 17.145, "eval_steps_per_second": 4.286, "step": 74000 }, { "epoch": 0.37, "learning_rate": 0.0002439915040033096, "loss": 0.0215, "step": 74010 }, { "epoch": 0.37, "learning_rate": 0.00024398393631029557, "loss": 0.0181, "step": 74020 }, { "epoch": 0.37, "learning_rate": 0.00024397636861728155, "loss": 0.0187, "step": 74030 }, { "epoch": 0.37, "learning_rate": 0.00024396880092426756, "loss": 0.0162, "step": 74040 }, { "epoch": 0.37, "learning_rate": 0.00024396123323125354, "loss": 0.0164, "step": 74050 }, { "epoch": 0.37, "learning_rate": 0.00024395366553823952, "loss": 0.0189, "step": 74060 }, { "epoch": 0.37, "learning_rate": 0.00024394609784522553, "loss": 0.016, "step": 74070 }, { "epoch": 0.37, "learning_rate": 0.0002439385301522115, "loss": 0.0193, "step": 74080 }, { "epoch": 0.37, "learning_rate": 0.0002439309624591975, "loss": 0.0194, "step": 74090 }, { "epoch": 0.37, "learning_rate": 0.00024392339476618348, "loss": 0.0184, "step": 74100 }, { "epoch": 0.37, "learning_rate": 0.00024391582707316948, "loss": 0.0196, "step": 74110 }, { "epoch": 0.37, "learning_rate": 0.00024390825938015547, "loss": 0.0197, "step": 74120 }, { "epoch": 0.37, "learning_rate": 0.00024390069168714145, "loss": 0.0172, "step": 74130 }, { "epoch": 0.37, "learning_rate": 0.00024389312399412746, "loss": 0.0189, "step": 74140 }, { "epoch": 0.37, "learning_rate": 0.00024388555630111344, "loss": 0.0165, "step": 74150 }, { "epoch": 0.37, "learning_rate": 0.00024387798860809942, "loss": 0.0179, "step": 74160 }, { "epoch": 0.37, "learning_rate": 0.00024387042091508543, "loss": 0.015, "step": 74170 }, { "epoch": 0.37, "learning_rate": 0.0002438628532220714, "loss": 0.0181, "step": 74180 }, { "epoch": 0.37, "learning_rate": 0.0002438552855290574, "loss": 0.0204, "step": 74190 }, { "epoch": 0.37, "learning_rate": 0.0002438477178360434, "loss": 0.0181, "step": 74200 }, { "epoch": 0.37, "learning_rate": 0.00024384015014302938, "loss": 0.0182, "step": 74210 }, { "epoch": 0.37, "learning_rate": 0.00024383258245001536, "loss": 0.0188, "step": 74220 }, { "epoch": 0.37, "learning_rate": 0.00024382501475700137, "loss": 0.0242, "step": 74230 }, { "epoch": 0.37, "learning_rate": 0.00024381744706398735, "loss": 0.0171, "step": 74240 }, { "epoch": 0.37, "learning_rate": 0.00024380987937097333, "loss": 0.0187, "step": 74250 }, { "epoch": 0.37, "learning_rate": 0.00024380231167795931, "loss": 0.0171, "step": 74260 }, { "epoch": 0.37, "learning_rate": 0.00024379474398494532, "loss": 0.0148, "step": 74270 }, { "epoch": 0.37, "learning_rate": 0.0002437871762919313, "loss": 0.0187, "step": 74280 }, { "epoch": 0.37, "learning_rate": 0.00024377960859891729, "loss": 0.0166, "step": 74290 }, { "epoch": 0.37, "learning_rate": 0.0002437720409059033, "loss": 0.018, "step": 74300 }, { "epoch": 0.37, "learning_rate": 0.00024376447321288928, "loss": 0.0141, "step": 74310 }, { "epoch": 0.37, "learning_rate": 0.00024375690551987526, "loss": 0.0173, "step": 74320 }, { "epoch": 0.38, "learning_rate": 0.00024374933782686127, "loss": 0.0209, "step": 74330 }, { "epoch": 0.38, "learning_rate": 0.00024374177013384725, "loss": 0.0183, "step": 74340 }, { "epoch": 0.38, "learning_rate": 0.00024373420244083323, "loss": 0.0157, "step": 74350 }, { "epoch": 0.38, "learning_rate": 0.00024372663474781924, "loss": 0.0167, "step": 74360 }, { "epoch": 0.38, "learning_rate": 0.00024371906705480522, "loss": 0.0168, "step": 74370 }, { "epoch": 0.38, "learning_rate": 0.0002437114993617912, "loss": 0.0158, "step": 74380 }, { "epoch": 0.38, "learning_rate": 0.0002437039316687772, "loss": 0.0216, "step": 74390 }, { "epoch": 0.38, "learning_rate": 0.0002436963639757632, "loss": 0.0217, "step": 74400 }, { "epoch": 0.38, "learning_rate": 0.00024368879628274917, "loss": 0.0187, "step": 74410 }, { "epoch": 0.38, "learning_rate": 0.00024368122858973515, "loss": 0.0217, "step": 74420 }, { "epoch": 0.38, "learning_rate": 0.00024367366089672116, "loss": 0.0231, "step": 74430 }, { "epoch": 0.38, "learning_rate": 0.00024366609320370714, "loss": 0.0163, "step": 74440 }, { "epoch": 0.38, "learning_rate": 0.00024365852551069312, "loss": 0.0169, "step": 74450 }, { "epoch": 0.38, "learning_rate": 0.00024365095781767913, "loss": 0.0225, "step": 74460 }, { "epoch": 0.38, "learning_rate": 0.00024364339012466511, "loss": 0.0206, "step": 74470 }, { "epoch": 0.38, "learning_rate": 0.0002436358224316511, "loss": 0.0202, "step": 74480 }, { "epoch": 0.38, "learning_rate": 0.0002436282547386371, "loss": 0.0168, "step": 74490 }, { "epoch": 0.38, "learning_rate": 0.00024362068704562309, "loss": 0.0195, "step": 74500 }, { "epoch": 0.38, "learning_rate": 0.00024361311935260907, "loss": 0.0196, "step": 74510 }, { "epoch": 0.38, "learning_rate": 0.00024360555165959508, "loss": 0.0178, "step": 74520 }, { "epoch": 0.38, "learning_rate": 0.00024359798396658106, "loss": 0.0168, "step": 74530 }, { "epoch": 0.38, "learning_rate": 0.00024359041627356704, "loss": 0.0194, "step": 74540 }, { "epoch": 0.38, "learning_rate": 0.00024358284858055305, "loss": 0.0216, "step": 74550 }, { "epoch": 0.38, "learning_rate": 0.00024357528088753903, "loss": 0.0178, "step": 74560 }, { "epoch": 0.38, "learning_rate": 0.000243567713194525, "loss": 0.0204, "step": 74570 }, { "epoch": 0.38, "learning_rate": 0.00024356014550151102, "loss": 0.0185, "step": 74580 }, { "epoch": 0.38, "learning_rate": 0.000243552577808497, "loss": 0.0173, "step": 74590 }, { "epoch": 0.38, "learning_rate": 0.00024354501011548298, "loss": 0.0183, "step": 74600 }, { "epoch": 0.38, "learning_rate": 0.00024353744242246896, "loss": 0.0188, "step": 74610 }, { "epoch": 0.38, "learning_rate": 0.00024352987472945497, "loss": 0.0213, "step": 74620 }, { "epoch": 0.38, "learning_rate": 0.00024352230703644095, "loss": 0.0171, "step": 74630 }, { "epoch": 0.38, "learning_rate": 0.00024351473934342693, "loss": 0.0194, "step": 74640 }, { "epoch": 0.38, "learning_rate": 0.00024350717165041294, "loss": 0.0204, "step": 74650 }, { "epoch": 0.38, "learning_rate": 0.00024349960395739892, "loss": 0.0214, "step": 74660 }, { "epoch": 0.38, "learning_rate": 0.0002434920362643849, "loss": 0.0178, "step": 74670 }, { "epoch": 0.38, "learning_rate": 0.00024348446857137091, "loss": 0.0173, "step": 74680 }, { "epoch": 0.38, "learning_rate": 0.0002434769008783569, "loss": 0.0165, "step": 74690 }, { "epoch": 0.38, "learning_rate": 0.00024346933318534288, "loss": 0.0181, "step": 74700 }, { "epoch": 0.38, "learning_rate": 0.00024346176549232889, "loss": 0.0171, "step": 74710 }, { "epoch": 0.38, "learning_rate": 0.00024345419779931487, "loss": 0.0178, "step": 74720 }, { "epoch": 0.38, "learning_rate": 0.00024344663010630085, "loss": 0.017, "step": 74730 }, { "epoch": 0.38, "learning_rate": 0.00024343906241328686, "loss": 0.0205, "step": 74740 }, { "epoch": 0.38, "learning_rate": 0.00024343149472027284, "loss": 0.0173, "step": 74750 }, { "epoch": 0.38, "learning_rate": 0.00024342392702725882, "loss": 0.0185, "step": 74760 }, { "epoch": 0.38, "learning_rate": 0.0002434163593342448, "loss": 0.0179, "step": 74770 }, { "epoch": 0.38, "learning_rate": 0.0002434087916412308, "loss": 0.0176, "step": 74780 }, { "epoch": 0.38, "learning_rate": 0.00024340122394821676, "loss": 0.0205, "step": 74790 }, { "epoch": 0.38, "learning_rate": 0.00024339365625520275, "loss": 0.0175, "step": 74800 }, { "epoch": 0.38, "learning_rate": 0.00024338608856218873, "loss": 0.0168, "step": 74810 }, { "epoch": 0.38, "learning_rate": 0.00024337852086917474, "loss": 0.0211, "step": 74820 }, { "epoch": 0.38, "learning_rate": 0.00024337095317616072, "loss": 0.0186, "step": 74830 }, { "epoch": 0.38, "learning_rate": 0.0002433633854831467, "loss": 0.0184, "step": 74840 }, { "epoch": 0.38, "learning_rate": 0.0002433558177901327, "loss": 0.0167, "step": 74850 }, { "epoch": 0.38, "learning_rate": 0.0002433482500971187, "loss": 0.0211, "step": 74860 }, { "epoch": 0.38, "learning_rate": 0.00024334068240410467, "loss": 0.0193, "step": 74870 }, { "epoch": 0.38, "learning_rate": 0.00024333311471109068, "loss": 0.0197, "step": 74880 }, { "epoch": 0.38, "learning_rate": 0.00024332554701807666, "loss": 0.0151, "step": 74890 }, { "epoch": 0.38, "learning_rate": 0.00024331797932506264, "loss": 0.0191, "step": 74900 }, { "epoch": 0.38, "learning_rate": 0.00024331041163204865, "loss": 0.0204, "step": 74910 }, { "epoch": 0.38, "learning_rate": 0.00024330284393903463, "loss": 0.0217, "step": 74920 }, { "epoch": 0.38, "learning_rate": 0.00024329527624602061, "loss": 0.0208, "step": 74930 }, { "epoch": 0.38, "learning_rate": 0.00024328770855300662, "loss": 0.0187, "step": 74940 }, { "epoch": 0.38, "learning_rate": 0.0002432801408599926, "loss": 0.0184, "step": 74950 }, { "epoch": 0.38, "learning_rate": 0.00024327257316697859, "loss": 0.0186, "step": 74960 }, { "epoch": 0.38, "learning_rate": 0.0002432650054739646, "loss": 0.0217, "step": 74970 }, { "epoch": 0.38, "learning_rate": 0.00024325743778095058, "loss": 0.0188, "step": 74980 }, { "epoch": 0.38, "learning_rate": 0.00024324987008793656, "loss": 0.02, "step": 74990 }, { "epoch": 0.38, "learning_rate": 0.00024324230239492254, "loss": 0.0191, "step": 75000 }, { "epoch": 0.38, "eval_cer": 0.9144935454101719, "eval_loss": 0.013869182206690311, "eval_runtime": 116.7861, "eval_samples_per_second": 17.125, "eval_steps_per_second": 4.281, "step": 75000 }, { "epoch": 0.38, "learning_rate": 0.00024323473470190855, "loss": 0.0208, "step": 75010 }, { "epoch": 0.38, "learning_rate": 0.00024322716700889453, "loss": 0.0217, "step": 75020 }, { "epoch": 0.38, "learning_rate": 0.0002432195993158805, "loss": 0.0162, "step": 75030 }, { "epoch": 0.38, "learning_rate": 0.00024321203162286652, "loss": 0.0162, "step": 75040 }, { "epoch": 0.38, "learning_rate": 0.0002432044639298525, "loss": 0.0242, "step": 75050 }, { "epoch": 0.38, "learning_rate": 0.00024319689623683848, "loss": 0.019, "step": 75060 }, { "epoch": 0.38, "learning_rate": 0.0002431893285438245, "loss": 0.0189, "step": 75070 }, { "epoch": 0.38, "learning_rate": 0.00024318176085081047, "loss": 0.0169, "step": 75080 }, { "epoch": 0.38, "learning_rate": 0.00024317419315779645, "loss": 0.0173, "step": 75090 }, { "epoch": 0.38, "learning_rate": 0.00024316662546478246, "loss": 0.0189, "step": 75100 }, { "epoch": 0.38, "learning_rate": 0.00024315905777176844, "loss": 0.0181, "step": 75110 }, { "epoch": 0.38, "learning_rate": 0.00024315149007875442, "loss": 0.0204, "step": 75120 }, { "epoch": 0.38, "learning_rate": 0.00024314392238574043, "loss": 0.0199, "step": 75130 }, { "epoch": 0.38, "learning_rate": 0.00024313635469272641, "loss": 0.0169, "step": 75140 }, { "epoch": 0.38, "learning_rate": 0.0002431287869997124, "loss": 0.0174, "step": 75150 }, { "epoch": 0.38, "learning_rate": 0.00024312121930669838, "loss": 0.02, "step": 75160 }, { "epoch": 0.38, "learning_rate": 0.00024311365161368439, "loss": 0.0205, "step": 75170 }, { "epoch": 0.38, "learning_rate": 0.00024310608392067037, "loss": 0.0188, "step": 75180 }, { "epoch": 0.38, "learning_rate": 0.00024309851622765635, "loss": 0.0221, "step": 75190 }, { "epoch": 0.38, "learning_rate": 0.00024309094853464236, "loss": 0.0181, "step": 75200 }, { "epoch": 0.38, "learning_rate": 0.00024308338084162834, "loss": 0.018, "step": 75210 }, { "epoch": 0.38, "learning_rate": 0.00024307581314861432, "loss": 0.0225, "step": 75220 }, { "epoch": 0.38, "learning_rate": 0.00024306824545560033, "loss": 0.0168, "step": 75230 }, { "epoch": 0.38, "learning_rate": 0.0002430606777625863, "loss": 0.0179, "step": 75240 }, { "epoch": 0.38, "learning_rate": 0.0002430531100695723, "loss": 0.0173, "step": 75250 }, { "epoch": 0.38, "learning_rate": 0.0002430455423765583, "loss": 0.0203, "step": 75260 }, { "epoch": 0.38, "learning_rate": 0.00024303797468354428, "loss": 0.0186, "step": 75270 }, { "epoch": 0.38, "learning_rate": 0.00024303040699053026, "loss": 0.0168, "step": 75280 }, { "epoch": 0.38, "learning_rate": 0.00024302283929751627, "loss": 0.019, "step": 75290 }, { "epoch": 0.38, "learning_rate": 0.00024301527160450225, "loss": 0.0194, "step": 75300 }, { "epoch": 0.38, "learning_rate": 0.00024300770391148823, "loss": 0.0195, "step": 75310 }, { "epoch": 0.38, "learning_rate": 0.00024300013621847422, "loss": 0.0145, "step": 75320 }, { "epoch": 0.38, "learning_rate": 0.00024299256852546022, "loss": 0.0141, "step": 75330 }, { "epoch": 0.38, "learning_rate": 0.0002429850008324462, "loss": 0.0206, "step": 75340 }, { "epoch": 0.38, "learning_rate": 0.0002429774331394322, "loss": 0.0232, "step": 75350 }, { "epoch": 0.38, "learning_rate": 0.0002429698654464182, "loss": 0.0177, "step": 75360 }, { "epoch": 0.38, "learning_rate": 0.00024296229775340418, "loss": 0.0148, "step": 75370 }, { "epoch": 0.38, "learning_rate": 0.00024295473006039016, "loss": 0.0182, "step": 75380 }, { "epoch": 0.38, "learning_rate": 0.00024294716236737617, "loss": 0.0197, "step": 75390 }, { "epoch": 0.38, "learning_rate": 0.00024293959467436215, "loss": 0.0162, "step": 75400 }, { "epoch": 0.38, "learning_rate": 0.00024293202698134813, "loss": 0.0181, "step": 75410 }, { "epoch": 0.38, "learning_rate": 0.00024292445928833414, "loss": 0.0198, "step": 75420 }, { "epoch": 0.38, "learning_rate": 0.00024291689159532012, "loss": 0.0172, "step": 75430 }, { "epoch": 0.38, "learning_rate": 0.0002429093239023061, "loss": 0.0187, "step": 75440 }, { "epoch": 0.38, "learning_rate": 0.0002429017562092921, "loss": 0.0137, "step": 75450 }, { "epoch": 0.38, "learning_rate": 0.0002428941885162781, "loss": 0.0202, "step": 75460 }, { "epoch": 0.38, "learning_rate": 0.00024288662082326407, "loss": 0.0159, "step": 75470 }, { "epoch": 0.38, "learning_rate": 0.00024287905313025008, "loss": 0.0231, "step": 75480 }, { "epoch": 0.38, "learning_rate": 0.00024287148543723606, "loss": 0.0209, "step": 75490 }, { "epoch": 0.38, "learning_rate": 0.00024286391774422204, "loss": 0.0184, "step": 75500 }, { "epoch": 0.38, "learning_rate": 0.00024285635005120803, "loss": 0.0173, "step": 75510 }, { "epoch": 0.38, "learning_rate": 0.00024284878235819403, "loss": 0.0181, "step": 75520 }, { "epoch": 0.38, "learning_rate": 0.00024284121466518002, "loss": 0.0188, "step": 75530 }, { "epoch": 0.38, "learning_rate": 0.000242833646972166, "loss": 0.0179, "step": 75540 }, { "epoch": 0.38, "learning_rate": 0.000242826079279152, "loss": 0.0158, "step": 75550 }, { "epoch": 0.38, "learning_rate": 0.000242818511586138, "loss": 0.0201, "step": 75560 }, { "epoch": 0.38, "learning_rate": 0.00024281094389312397, "loss": 0.0166, "step": 75570 }, { "epoch": 0.38, "learning_rate": 0.00024280337620010998, "loss": 0.0168, "step": 75580 }, { "epoch": 0.38, "learning_rate": 0.00024279580850709596, "loss": 0.0188, "step": 75590 }, { "epoch": 0.38, "learning_rate": 0.00024278824081408194, "loss": 0.018, "step": 75600 }, { "epoch": 0.38, "learning_rate": 0.00024278067312106795, "loss": 0.0191, "step": 75610 }, { "epoch": 0.38, "learning_rate": 0.00024277310542805393, "loss": 0.0172, "step": 75620 }, { "epoch": 0.38, "learning_rate": 0.0002427655377350399, "loss": 0.0191, "step": 75630 }, { "epoch": 0.38, "learning_rate": 0.00024275797004202592, "loss": 0.0216, "step": 75640 }, { "epoch": 0.38, "learning_rate": 0.0002427504023490119, "loss": 0.018, "step": 75650 }, { "epoch": 0.38, "learning_rate": 0.00024274283465599788, "loss": 0.0179, "step": 75660 }, { "epoch": 0.38, "learning_rate": 0.00024273526696298386, "loss": 0.0238, "step": 75670 }, { "epoch": 0.38, "learning_rate": 0.00024272769926996987, "loss": 0.0177, "step": 75680 }, { "epoch": 0.38, "learning_rate": 0.00024272013157695585, "loss": 0.0169, "step": 75690 }, { "epoch": 0.38, "learning_rate": 0.00024271256388394184, "loss": 0.02, "step": 75700 }, { "epoch": 0.38, "learning_rate": 0.00024270499619092784, "loss": 0.0188, "step": 75710 }, { "epoch": 0.38, "learning_rate": 0.00024269742849791383, "loss": 0.0197, "step": 75720 }, { "epoch": 0.38, "learning_rate": 0.0002426898608048998, "loss": 0.0168, "step": 75730 }, { "epoch": 0.38, "learning_rate": 0.00024268229311188582, "loss": 0.018, "step": 75740 }, { "epoch": 0.38, "learning_rate": 0.0002426747254188718, "loss": 0.0186, "step": 75750 }, { "epoch": 0.38, "learning_rate": 0.00024266715772585778, "loss": 0.019, "step": 75760 }, { "epoch": 0.38, "learning_rate": 0.0002426595900328438, "loss": 0.0165, "step": 75770 }, { "epoch": 0.38, "learning_rate": 0.00024265202233982977, "loss": 0.0161, "step": 75780 }, { "epoch": 0.38, "learning_rate": 0.00024264445464681575, "loss": 0.0233, "step": 75790 }, { "epoch": 0.38, "learning_rate": 0.00024263688695380176, "loss": 0.0207, "step": 75800 }, { "epoch": 0.38, "learning_rate": 0.00024262931926078774, "loss": 0.0291, "step": 75810 }, { "epoch": 0.38, "learning_rate": 0.00024262175156777372, "loss": 0.0234, "step": 75820 }, { "epoch": 0.38, "learning_rate": 0.0002426141838747597, "loss": 0.0198, "step": 75830 }, { "epoch": 0.38, "learning_rate": 0.0002426066161817457, "loss": 0.0192, "step": 75840 }, { "epoch": 0.38, "learning_rate": 0.0002425990484887317, "loss": 0.0206, "step": 75850 }, { "epoch": 0.38, "learning_rate": 0.00024259148079571767, "loss": 0.0199, "step": 75860 }, { "epoch": 0.38, "learning_rate": 0.00024258391310270368, "loss": 0.014, "step": 75870 }, { "epoch": 0.38, "learning_rate": 0.00024257634540968966, "loss": 0.0183, "step": 75880 }, { "epoch": 0.38, "learning_rate": 0.00024256877771667565, "loss": 0.0204, "step": 75890 }, { "epoch": 0.38, "learning_rate": 0.00024256121002366165, "loss": 0.017, "step": 75900 }, { "epoch": 0.38, "learning_rate": 0.00024255364233064764, "loss": 0.0169, "step": 75910 }, { "epoch": 0.38, "learning_rate": 0.00024254607463763362, "loss": 0.0174, "step": 75920 }, { "epoch": 0.38, "learning_rate": 0.00024253850694461963, "loss": 0.0183, "step": 75930 }, { "epoch": 0.38, "learning_rate": 0.0002425309392516056, "loss": 0.0181, "step": 75940 }, { "epoch": 0.38, "learning_rate": 0.0002425233715585916, "loss": 0.0183, "step": 75950 }, { "epoch": 0.38, "learning_rate": 0.0002425158038655776, "loss": 0.0183, "step": 75960 }, { "epoch": 0.38, "learning_rate": 0.00024250823617256358, "loss": 0.0203, "step": 75970 }, { "epoch": 0.38, "learning_rate": 0.00024250066847954956, "loss": 0.0179, "step": 75980 }, { "epoch": 0.38, "learning_rate": 0.00024249310078653557, "loss": 0.0203, "step": 75990 }, { "epoch": 0.38, "learning_rate": 0.00024248553309352155, "loss": 0.0175, "step": 76000 }, { "epoch": 0.38, "eval_cer": 0.9144925750140465, "eval_loss": 0.012879201211035252, "eval_runtime": 116.6021, "eval_samples_per_second": 17.152, "eval_steps_per_second": 4.288, "step": 76000 }, { "epoch": 0.38, "learning_rate": 0.00024247796540050753, "loss": 0.0189, "step": 76010 }, { "epoch": 0.38, "learning_rate": 0.0002424703977074935, "loss": 0.0175, "step": 76020 }, { "epoch": 0.38, "learning_rate": 0.00024246283001447952, "loss": 0.0171, "step": 76030 }, { "epoch": 0.38, "learning_rate": 0.0002424552623214655, "loss": 0.0174, "step": 76040 }, { "epoch": 0.38, "learning_rate": 0.00024244769462845146, "loss": 0.0159, "step": 76050 }, { "epoch": 0.38, "learning_rate": 0.00024244012693543744, "loss": 0.0189, "step": 76060 }, { "epoch": 0.38, "learning_rate": 0.00024243255924242345, "loss": 0.0171, "step": 76070 }, { "epoch": 0.38, "learning_rate": 0.00024242499154940943, "loss": 0.0219, "step": 76080 }, { "epoch": 0.38, "learning_rate": 0.0002424174238563954, "loss": 0.0165, "step": 76090 }, { "epoch": 0.38, "learning_rate": 0.00024240985616338142, "loss": 0.0196, "step": 76100 }, { "epoch": 0.38, "learning_rate": 0.0002424022884703674, "loss": 0.0203, "step": 76110 }, { "epoch": 0.38, "learning_rate": 0.00024239472077735338, "loss": 0.0205, "step": 76120 }, { "epoch": 0.38, "learning_rate": 0.0002423871530843394, "loss": 0.0197, "step": 76130 }, { "epoch": 0.38, "learning_rate": 0.00024237958539132537, "loss": 0.0179, "step": 76140 }, { "epoch": 0.38, "learning_rate": 0.00024237201769831135, "loss": 0.0143, "step": 76150 }, { "epoch": 0.38, "learning_rate": 0.00024236445000529736, "loss": 0.0198, "step": 76160 }, { "epoch": 0.38, "learning_rate": 0.00024235688231228334, "loss": 0.019, "step": 76170 }, { "epoch": 0.38, "learning_rate": 0.00024234931461926932, "loss": 0.0217, "step": 76180 }, { "epoch": 0.38, "learning_rate": 0.00024234174692625533, "loss": 0.0185, "step": 76190 }, { "epoch": 0.38, "learning_rate": 0.00024233417923324131, "loss": 0.0181, "step": 76200 }, { "epoch": 0.38, "learning_rate": 0.0002423266115402273, "loss": 0.0206, "step": 76210 }, { "epoch": 0.38, "learning_rate": 0.00024231904384721328, "loss": 0.0172, "step": 76220 }, { "epoch": 0.38, "learning_rate": 0.00024231147615419929, "loss": 0.0185, "step": 76230 }, { "epoch": 0.38, "learning_rate": 0.00024230390846118527, "loss": 0.0209, "step": 76240 }, { "epoch": 0.38, "learning_rate": 0.00024229634076817125, "loss": 0.0186, "step": 76250 }, { "epoch": 0.38, "learning_rate": 0.00024228877307515726, "loss": 0.0212, "step": 76260 }, { "epoch": 0.38, "learning_rate": 0.00024228120538214324, "loss": 0.0172, "step": 76270 }, { "epoch": 0.38, "learning_rate": 0.00024227363768912922, "loss": 0.0169, "step": 76280 }, { "epoch": 0.38, "learning_rate": 0.00024226606999611523, "loss": 0.0176, "step": 76290 }, { "epoch": 0.38, "learning_rate": 0.0002422585023031012, "loss": 0.0183, "step": 76300 }, { "epoch": 0.38, "learning_rate": 0.0002422509346100872, "loss": 0.0154, "step": 76310 }, { "epoch": 0.39, "learning_rate": 0.0002422433669170732, "loss": 0.0204, "step": 76320 }, { "epoch": 0.39, "learning_rate": 0.00024223579922405918, "loss": 0.018, "step": 76330 }, { "epoch": 0.39, "learning_rate": 0.00024222823153104516, "loss": 0.0238, "step": 76340 }, { "epoch": 0.39, "learning_rate": 0.00024222066383803117, "loss": 0.0168, "step": 76350 }, { "epoch": 0.39, "learning_rate": 0.00024221309614501715, "loss": 0.0149, "step": 76360 }, { "epoch": 0.39, "learning_rate": 0.00024220552845200313, "loss": 0.0194, "step": 76370 }, { "epoch": 0.39, "learning_rate": 0.00024219796075898914, "loss": 0.0177, "step": 76380 }, { "epoch": 0.39, "learning_rate": 0.00024219039306597512, "loss": 0.0185, "step": 76390 }, { "epoch": 0.39, "learning_rate": 0.0002421828253729611, "loss": 0.0173, "step": 76400 }, { "epoch": 0.39, "learning_rate": 0.0002421752576799471, "loss": 0.0188, "step": 76410 }, { "epoch": 0.39, "learning_rate": 0.0002421676899869331, "loss": 0.0212, "step": 76420 }, { "epoch": 0.39, "learning_rate": 0.00024216012229391908, "loss": 0.0176, "step": 76430 }, { "epoch": 0.39, "learning_rate": 0.00024215255460090506, "loss": 0.0186, "step": 76440 }, { "epoch": 0.39, "learning_rate": 0.00024214498690789107, "loss": 0.0174, "step": 76450 }, { "epoch": 0.39, "learning_rate": 0.00024213741921487705, "loss": 0.0178, "step": 76460 }, { "epoch": 0.39, "learning_rate": 0.00024212985152186303, "loss": 0.0196, "step": 76470 }, { "epoch": 0.39, "learning_rate": 0.00024212228382884904, "loss": 0.0174, "step": 76480 }, { "epoch": 0.39, "learning_rate": 0.00024211471613583502, "loss": 0.016, "step": 76490 }, { "epoch": 0.39, "learning_rate": 0.000242107148442821, "loss": 0.0139, "step": 76500 }, { "epoch": 0.39, "learning_rate": 0.000242099580749807, "loss": 0.0174, "step": 76510 }, { "epoch": 0.39, "learning_rate": 0.000242092013056793, "loss": 0.0215, "step": 76520 }, { "epoch": 0.39, "learning_rate": 0.00024208444536377897, "loss": 0.0173, "step": 76530 }, { "epoch": 0.39, "learning_rate": 0.00024207687767076498, "loss": 0.0189, "step": 76540 }, { "epoch": 0.39, "learning_rate": 0.00024206930997775096, "loss": 0.0173, "step": 76550 }, { "epoch": 0.39, "learning_rate": 0.00024206174228473694, "loss": 0.018, "step": 76560 }, { "epoch": 0.39, "learning_rate": 0.00024205417459172293, "loss": 0.055, "step": 76570 }, { "epoch": 0.39, "learning_rate": 0.00024204660689870893, "loss": 0.0154, "step": 76580 }, { "epoch": 0.39, "learning_rate": 0.00024203903920569492, "loss": 0.0182, "step": 76590 }, { "epoch": 0.39, "learning_rate": 0.0002420314715126809, "loss": 0.0171, "step": 76600 }, { "epoch": 0.39, "learning_rate": 0.0002420239038196669, "loss": 0.0193, "step": 76610 }, { "epoch": 0.39, "learning_rate": 0.0002420163361266529, "loss": 0.0184, "step": 76620 }, { "epoch": 0.39, "learning_rate": 0.00024200876843363887, "loss": 0.0205, "step": 76630 }, { "epoch": 0.39, "learning_rate": 0.00024200120074062488, "loss": 0.0199, "step": 76640 }, { "epoch": 0.39, "learning_rate": 0.00024199363304761086, "loss": 0.0182, "step": 76650 }, { "epoch": 0.39, "learning_rate": 0.00024198606535459684, "loss": 0.0166, "step": 76660 }, { "epoch": 0.39, "learning_rate": 0.00024197849766158285, "loss": 0.0187, "step": 76670 }, { "epoch": 0.39, "learning_rate": 0.00024197092996856883, "loss": 0.0168, "step": 76680 }, { "epoch": 0.39, "learning_rate": 0.0002419633622755548, "loss": 0.0145, "step": 76690 }, { "epoch": 0.39, "learning_rate": 0.00024195579458254082, "loss": 0.0157, "step": 76700 }, { "epoch": 0.39, "learning_rate": 0.0002419482268895268, "loss": 0.0168, "step": 76710 }, { "epoch": 0.39, "learning_rate": 0.00024194065919651278, "loss": 0.0172, "step": 76720 }, { "epoch": 0.39, "learning_rate": 0.00024193309150349876, "loss": 0.0186, "step": 76730 }, { "epoch": 0.39, "learning_rate": 0.00024192552381048477, "loss": 0.0141, "step": 76740 }, { "epoch": 0.39, "learning_rate": 0.00024191795611747075, "loss": 0.0183, "step": 76750 }, { "epoch": 0.39, "learning_rate": 0.00024191038842445674, "loss": 0.0196, "step": 76760 }, { "epoch": 0.39, "learning_rate": 0.00024190282073144274, "loss": 0.0201, "step": 76770 }, { "epoch": 0.39, "learning_rate": 0.00024189525303842873, "loss": 0.0201, "step": 76780 }, { "epoch": 0.39, "learning_rate": 0.0002418876853454147, "loss": 0.0148, "step": 76790 }, { "epoch": 0.39, "learning_rate": 0.00024188011765240072, "loss": 0.0211, "step": 76800 }, { "epoch": 0.39, "learning_rate": 0.0002418725499593867, "loss": 0.0213, "step": 76810 }, { "epoch": 0.39, "learning_rate": 0.00024186498226637268, "loss": 0.0161, "step": 76820 }, { "epoch": 0.39, "learning_rate": 0.0002418574145733587, "loss": 0.0179, "step": 76830 }, { "epoch": 0.39, "learning_rate": 0.00024184984688034467, "loss": 0.0152, "step": 76840 }, { "epoch": 0.39, "learning_rate": 0.00024184227918733065, "loss": 0.0195, "step": 76850 }, { "epoch": 0.39, "learning_rate": 0.00024183471149431666, "loss": 0.0214, "step": 76860 }, { "epoch": 0.39, "learning_rate": 0.00024182714380130264, "loss": 0.0268, "step": 76870 }, { "epoch": 0.39, "learning_rate": 0.00024181957610828862, "loss": 0.0213, "step": 76880 }, { "epoch": 0.39, "learning_rate": 0.00024181200841527463, "loss": 0.0185, "step": 76890 }, { "epoch": 0.39, "learning_rate": 0.0002418044407222606, "loss": 0.0198, "step": 76900 }, { "epoch": 0.39, "learning_rate": 0.0002417968730292466, "loss": 0.0206, "step": 76910 }, { "epoch": 0.39, "learning_rate": 0.00024178930533623257, "loss": 0.0165, "step": 76920 }, { "epoch": 0.39, "learning_rate": 0.00024178173764321858, "loss": 0.0171, "step": 76930 }, { "epoch": 0.39, "learning_rate": 0.00024177416995020456, "loss": 0.0183, "step": 76940 }, { "epoch": 0.39, "learning_rate": 0.00024176660225719055, "loss": 0.0224, "step": 76950 }, { "epoch": 0.39, "learning_rate": 0.00024175903456417655, "loss": 0.0219, "step": 76960 }, { "epoch": 0.39, "learning_rate": 0.00024175146687116254, "loss": 0.0175, "step": 76970 }, { "epoch": 0.39, "learning_rate": 0.00024174389917814852, "loss": 0.0131, "step": 76980 }, { "epoch": 0.39, "learning_rate": 0.00024173633148513453, "loss": 0.0148, "step": 76990 }, { "epoch": 0.39, "learning_rate": 0.0002417287637921205, "loss": 0.0143, "step": 77000 }, { "epoch": 0.39, "eval_cer": 0.9144974269946735, "eval_loss": 0.012495556846261024, "eval_runtime": 116.5435, "eval_samples_per_second": 17.161, "eval_steps_per_second": 4.29, "step": 77000 }, { "epoch": 0.39, "learning_rate": 0.0002417211960991065, "loss": 0.0195, "step": 77010 }, { "epoch": 0.39, "learning_rate": 0.0002417136284060925, "loss": 0.0186, "step": 77020 }, { "epoch": 0.39, "learning_rate": 0.00024170606071307848, "loss": 0.0197, "step": 77030 }, { "epoch": 0.39, "learning_rate": 0.00024169849302006446, "loss": 0.0182, "step": 77040 }, { "epoch": 0.39, "learning_rate": 0.00024169092532705047, "loss": 0.0164, "step": 77050 }, { "epoch": 0.39, "learning_rate": 0.00024168335763403645, "loss": 0.0151, "step": 77060 }, { "epoch": 0.39, "learning_rate": 0.00024167578994102243, "loss": 0.0165, "step": 77070 }, { "epoch": 0.39, "learning_rate": 0.0002416682222480084, "loss": 0.019, "step": 77080 }, { "epoch": 0.39, "learning_rate": 0.00024166065455499442, "loss": 0.0179, "step": 77090 }, { "epoch": 0.39, "learning_rate": 0.0002416530868619804, "loss": 0.0245, "step": 77100 }, { "epoch": 0.39, "learning_rate": 0.00024164551916896638, "loss": 0.0208, "step": 77110 }, { "epoch": 0.39, "learning_rate": 0.0002416379514759524, "loss": 0.0195, "step": 77120 }, { "epoch": 0.39, "learning_rate": 0.00024163038378293837, "loss": 0.018, "step": 77130 }, { "epoch": 0.39, "learning_rate": 0.00024162281608992436, "loss": 0.0153, "step": 77140 }, { "epoch": 0.39, "learning_rate": 0.00024161524839691036, "loss": 0.0219, "step": 77150 }, { "epoch": 0.39, "learning_rate": 0.00024160768070389635, "loss": 0.0184, "step": 77160 }, { "epoch": 0.39, "learning_rate": 0.00024160011301088233, "loss": 0.0222, "step": 77170 }, { "epoch": 0.39, "learning_rate": 0.00024159254531786834, "loss": 0.0227, "step": 77180 }, { "epoch": 0.39, "learning_rate": 0.00024158497762485432, "loss": 0.0192, "step": 77190 }, { "epoch": 0.39, "learning_rate": 0.0002415774099318403, "loss": 0.0174, "step": 77200 }, { "epoch": 0.39, "learning_rate": 0.0002415698422388263, "loss": 0.0127, "step": 77210 }, { "epoch": 0.39, "learning_rate": 0.0002415622745458123, "loss": 0.0152, "step": 77220 }, { "epoch": 0.39, "learning_rate": 0.00024155470685279827, "loss": 0.0163, "step": 77230 }, { "epoch": 0.39, "learning_rate": 0.00024154713915978425, "loss": 0.0172, "step": 77240 }, { "epoch": 0.39, "learning_rate": 0.00024153957146677026, "loss": 0.0155, "step": 77250 }, { "epoch": 0.39, "learning_rate": 0.00024153200377375624, "loss": 0.0181, "step": 77260 }, { "epoch": 0.39, "learning_rate": 0.00024152443608074222, "loss": 0.0185, "step": 77270 }, { "epoch": 0.39, "learning_rate": 0.00024151686838772823, "loss": 0.0179, "step": 77280 }, { "epoch": 0.39, "learning_rate": 0.0002415093006947142, "loss": 0.0157, "step": 77290 }, { "epoch": 0.39, "learning_rate": 0.00024150173300170017, "loss": 0.0166, "step": 77300 }, { "epoch": 0.39, "learning_rate": 0.00024149416530868615, "loss": 0.0131, "step": 77310 }, { "epoch": 0.39, "learning_rate": 0.00024148659761567216, "loss": 0.0155, "step": 77320 }, { "epoch": 0.39, "learning_rate": 0.00024147902992265814, "loss": 0.0166, "step": 77330 }, { "epoch": 0.39, "learning_rate": 0.00024147146222964412, "loss": 0.0178, "step": 77340 }, { "epoch": 0.39, "learning_rate": 0.00024146389453663013, "loss": 0.0167, "step": 77350 }, { "epoch": 0.39, "learning_rate": 0.0002414563268436161, "loss": 0.0167, "step": 77360 }, { "epoch": 0.39, "learning_rate": 0.0002414487591506021, "loss": 0.0177, "step": 77370 }, { "epoch": 0.39, "learning_rate": 0.0002414411914575881, "loss": 0.0204, "step": 77380 }, { "epoch": 0.39, "learning_rate": 0.00024143362376457408, "loss": 0.0167, "step": 77390 }, { "epoch": 0.39, "learning_rate": 0.00024142605607156006, "loss": 0.0173, "step": 77400 }, { "epoch": 0.39, "learning_rate": 0.00024141848837854607, "loss": 0.0181, "step": 77410 }, { "epoch": 0.39, "learning_rate": 0.00024141092068553205, "loss": 0.0166, "step": 77420 }, { "epoch": 0.39, "learning_rate": 0.00024140335299251803, "loss": 0.0169, "step": 77430 }, { "epoch": 0.39, "learning_rate": 0.00024139578529950404, "loss": 0.0234, "step": 77440 }, { "epoch": 0.39, "learning_rate": 0.00024138821760649002, "loss": 0.0164, "step": 77450 }, { "epoch": 0.39, "learning_rate": 0.000241380649913476, "loss": 0.0178, "step": 77460 }, { "epoch": 0.39, "learning_rate": 0.000241373082220462, "loss": 0.0183, "step": 77470 }, { "epoch": 0.39, "learning_rate": 0.000241365514527448, "loss": 0.0161, "step": 77480 }, { "epoch": 0.39, "learning_rate": 0.00024135794683443398, "loss": 0.0137, "step": 77490 }, { "epoch": 0.39, "learning_rate": 0.00024135037914141996, "loss": 0.0194, "step": 77500 }, { "epoch": 0.39, "learning_rate": 0.00024134281144840597, "loss": 0.021, "step": 77510 }, { "epoch": 0.39, "learning_rate": 0.00024133524375539195, "loss": 0.0157, "step": 77520 }, { "epoch": 0.39, "learning_rate": 0.00024132767606237793, "loss": 0.0172, "step": 77530 }, { "epoch": 0.39, "learning_rate": 0.00024132010836936394, "loss": 0.0174, "step": 77540 }, { "epoch": 0.39, "learning_rate": 0.00024131254067634992, "loss": 0.017, "step": 77550 }, { "epoch": 0.39, "learning_rate": 0.0002413049729833359, "loss": 0.0159, "step": 77560 }, { "epoch": 0.39, "learning_rate": 0.0002412974052903219, "loss": 0.0197, "step": 77570 }, { "epoch": 0.39, "learning_rate": 0.0002412898375973079, "loss": 0.0176, "step": 77580 }, { "epoch": 0.39, "learning_rate": 0.00024128226990429387, "loss": 0.0166, "step": 77590 }, { "epoch": 0.39, "learning_rate": 0.00024127470221127988, "loss": 0.019, "step": 77600 }, { "epoch": 0.39, "learning_rate": 0.00024126713451826586, "loss": 0.018, "step": 77610 }, { "epoch": 0.39, "learning_rate": 0.00024125956682525184, "loss": 0.0185, "step": 77620 }, { "epoch": 0.39, "learning_rate": 0.00024125199913223783, "loss": 0.0178, "step": 77630 }, { "epoch": 0.39, "learning_rate": 0.00024124443143922383, "loss": 0.02, "step": 77640 }, { "epoch": 0.39, "learning_rate": 0.00024123686374620982, "loss": 0.0173, "step": 77650 }, { "epoch": 0.39, "learning_rate": 0.0002412292960531958, "loss": 0.019, "step": 77660 }, { "epoch": 0.39, "learning_rate": 0.0002412217283601818, "loss": 0.0242, "step": 77670 }, { "epoch": 0.39, "learning_rate": 0.0002412141606671678, "loss": 0.0186, "step": 77680 }, { "epoch": 0.39, "learning_rate": 0.00024120659297415377, "loss": 0.0184, "step": 77690 }, { "epoch": 0.39, "learning_rate": 0.00024119902528113978, "loss": 0.0165, "step": 77700 }, { "epoch": 0.39, "learning_rate": 0.00024119145758812576, "loss": 0.0163, "step": 77710 }, { "epoch": 0.39, "learning_rate": 0.00024118388989511174, "loss": 0.0174, "step": 77720 }, { "epoch": 0.39, "learning_rate": 0.00024117632220209775, "loss": 0.0169, "step": 77730 }, { "epoch": 0.39, "learning_rate": 0.00024116875450908373, "loss": 0.0202, "step": 77740 }, { "epoch": 0.39, "learning_rate": 0.0002411611868160697, "loss": 0.0165, "step": 77750 }, { "epoch": 0.39, "learning_rate": 0.00024115361912305572, "loss": 0.0176, "step": 77760 }, { "epoch": 0.39, "learning_rate": 0.0002411460514300417, "loss": 0.0178, "step": 77770 }, { "epoch": 0.39, "learning_rate": 0.00024113848373702768, "loss": 0.0193, "step": 77780 }, { "epoch": 0.39, "learning_rate": 0.00024113091604401366, "loss": 0.0189, "step": 77790 }, { "epoch": 0.39, "learning_rate": 0.00024112334835099967, "loss": 0.0208, "step": 77800 }, { "epoch": 0.39, "learning_rate": 0.00024111578065798565, "loss": 0.0158, "step": 77810 }, { "epoch": 0.39, "learning_rate": 0.00024110821296497164, "loss": 0.0181, "step": 77820 }, { "epoch": 0.39, "learning_rate": 0.00024110064527195764, "loss": 0.0172, "step": 77830 }, { "epoch": 0.39, "learning_rate": 0.00024109307757894363, "loss": 0.0158, "step": 77840 }, { "epoch": 0.39, "learning_rate": 0.0002410855098859296, "loss": 0.0172, "step": 77850 }, { "epoch": 0.39, "learning_rate": 0.00024107794219291562, "loss": 0.0149, "step": 77860 }, { "epoch": 0.39, "learning_rate": 0.0002410703744999016, "loss": 0.0178, "step": 77870 }, { "epoch": 0.39, "learning_rate": 0.00024106280680688758, "loss": 0.0178, "step": 77880 }, { "epoch": 0.39, "learning_rate": 0.0002410552391138736, "loss": 0.0159, "step": 77890 }, { "epoch": 0.39, "learning_rate": 0.00024104767142085957, "loss": 0.0159, "step": 77900 }, { "epoch": 0.39, "learning_rate": 0.00024104010372784555, "loss": 0.0179, "step": 77910 }, { "epoch": 0.39, "learning_rate": 0.00024103253603483156, "loss": 0.0185, "step": 77920 }, { "epoch": 0.39, "learning_rate": 0.00024102496834181754, "loss": 0.017, "step": 77930 }, { "epoch": 0.39, "learning_rate": 0.00024101740064880352, "loss": 0.0189, "step": 77940 }, { "epoch": 0.39, "learning_rate": 0.00024100983295578953, "loss": 0.015, "step": 77950 }, { "epoch": 0.39, "learning_rate": 0.0002410022652627755, "loss": 0.0157, "step": 77960 }, { "epoch": 0.39, "learning_rate": 0.0002409946975697615, "loss": 0.0185, "step": 77970 }, { "epoch": 0.39, "learning_rate": 0.00024098712987674747, "loss": 0.0163, "step": 77980 }, { "epoch": 0.39, "learning_rate": 0.00024097956218373348, "loss": 0.0163, "step": 77990 }, { "epoch": 0.39, "learning_rate": 0.00024097199449071946, "loss": 0.0178, "step": 78000 }, { "epoch": 0.39, "eval_cer": 0.9145148941249307, "eval_loss": 0.012463193386793137, "eval_runtime": 116.5238, "eval_samples_per_second": 17.164, "eval_steps_per_second": 4.291, "step": 78000 }, { "epoch": 0.39, "learning_rate": 0.00024096442679770545, "loss": 0.0181, "step": 78010 }, { "epoch": 0.39, "learning_rate": 0.00024095685910469145, "loss": 0.016, "step": 78020 }, { "epoch": 0.39, "learning_rate": 0.00024094929141167744, "loss": 0.019, "step": 78030 }, { "epoch": 0.39, "learning_rate": 0.00024094172371866342, "loss": 0.0137, "step": 78040 }, { "epoch": 0.39, "learning_rate": 0.00024093415602564943, "loss": 0.0163, "step": 78050 }, { "epoch": 0.39, "learning_rate": 0.0002409265883326354, "loss": 0.0176, "step": 78060 }, { "epoch": 0.39, "learning_rate": 0.0002409190206396214, "loss": 0.0183, "step": 78070 }, { "epoch": 0.39, "learning_rate": 0.0002409114529466074, "loss": 0.0196, "step": 78080 }, { "epoch": 0.39, "learning_rate": 0.00024090388525359338, "loss": 0.0175, "step": 78090 }, { "epoch": 0.39, "learning_rate": 0.00024089631756057936, "loss": 0.0183, "step": 78100 }, { "epoch": 0.39, "learning_rate": 0.00024088874986756537, "loss": 0.0202, "step": 78110 }, { "epoch": 0.39, "learning_rate": 0.00024088118217455135, "loss": 0.0204, "step": 78120 }, { "epoch": 0.39, "learning_rate": 0.00024087361448153733, "loss": 0.0167, "step": 78130 }, { "epoch": 0.39, "learning_rate": 0.0002408660467885233, "loss": 0.0173, "step": 78140 }, { "epoch": 0.39, "learning_rate": 0.00024085847909550932, "loss": 0.0217, "step": 78150 }, { "epoch": 0.39, "learning_rate": 0.0002408509114024953, "loss": 0.0189, "step": 78160 }, { "epoch": 0.39, "learning_rate": 0.00024084334370948128, "loss": 0.0177, "step": 78170 }, { "epoch": 0.39, "learning_rate": 0.0002408357760164673, "loss": 0.0162, "step": 78180 }, { "epoch": 0.39, "learning_rate": 0.00024082820832345327, "loss": 0.0171, "step": 78190 }, { "epoch": 0.39, "learning_rate": 0.00024082064063043926, "loss": 0.0177, "step": 78200 }, { "epoch": 0.39, "learning_rate": 0.00024081307293742526, "loss": 0.018, "step": 78210 }, { "epoch": 0.39, "learning_rate": 0.00024080550524441125, "loss": 0.0202, "step": 78220 }, { "epoch": 0.39, "learning_rate": 0.00024079793755139723, "loss": 0.015, "step": 78230 }, { "epoch": 0.39, "learning_rate": 0.00024079036985838324, "loss": 0.0211, "step": 78240 }, { "epoch": 0.39, "learning_rate": 0.00024078280216536922, "loss": 0.0216, "step": 78250 }, { "epoch": 0.39, "learning_rate": 0.0002407752344723552, "loss": 0.015, "step": 78260 }, { "epoch": 0.39, "learning_rate": 0.0002407676667793412, "loss": 0.017, "step": 78270 }, { "epoch": 0.39, "learning_rate": 0.0002407600990863272, "loss": 0.0243, "step": 78280 }, { "epoch": 0.39, "learning_rate": 0.00024075253139331317, "loss": 0.0165, "step": 78290 }, { "epoch": 0.4, "learning_rate": 0.00024074496370029915, "loss": 0.0172, "step": 78300 }, { "epoch": 0.4, "learning_rate": 0.00024073739600728516, "loss": 0.0185, "step": 78310 }, { "epoch": 0.4, "learning_rate": 0.00024072982831427114, "loss": 0.0184, "step": 78320 }, { "epoch": 0.4, "learning_rate": 0.00024072226062125712, "loss": 0.019, "step": 78330 }, { "epoch": 0.4, "learning_rate": 0.00024071469292824313, "loss": 0.0224, "step": 78340 }, { "epoch": 0.4, "learning_rate": 0.0002407071252352291, "loss": 0.0212, "step": 78350 }, { "epoch": 0.4, "learning_rate": 0.0002406995575422151, "loss": 0.0187, "step": 78360 }, { "epoch": 0.4, "learning_rate": 0.0002406919898492011, "loss": 0.0203, "step": 78370 }, { "epoch": 0.4, "learning_rate": 0.00024068442215618708, "loss": 0.0144, "step": 78380 }, { "epoch": 0.4, "learning_rate": 0.00024067685446317307, "loss": 0.016, "step": 78390 }, { "epoch": 0.4, "learning_rate": 0.00024066928677015907, "loss": 0.0171, "step": 78400 }, { "epoch": 0.4, "learning_rate": 0.00024066171907714506, "loss": 0.0171, "step": 78410 }, { "epoch": 0.4, "learning_rate": 0.00024065415138413104, "loss": 0.0146, "step": 78420 }, { "epoch": 0.4, "learning_rate": 0.00024064658369111705, "loss": 0.0157, "step": 78430 }, { "epoch": 0.4, "learning_rate": 0.00024063901599810303, "loss": 0.0161, "step": 78440 }, { "epoch": 0.4, "learning_rate": 0.000240631448305089, "loss": 0.0175, "step": 78450 }, { "epoch": 0.4, "learning_rate": 0.00024062388061207502, "loss": 0.0152, "step": 78460 }, { "epoch": 0.4, "learning_rate": 0.000240616312919061, "loss": 0.0184, "step": 78470 }, { "epoch": 0.4, "learning_rate": 0.00024060874522604698, "loss": 0.0223, "step": 78480 }, { "epoch": 0.4, "learning_rate": 0.00024060117753303296, "loss": 0.027, "step": 78490 }, { "epoch": 0.4, "learning_rate": 0.00024059360984001897, "loss": 0.0212, "step": 78500 }, { "epoch": 0.4, "learning_rate": 0.00024058604214700495, "loss": 0.0158, "step": 78510 }, { "epoch": 0.4, "learning_rate": 0.00024057847445399093, "loss": 0.0192, "step": 78520 }, { "epoch": 0.4, "learning_rate": 0.00024057090676097694, "loss": 0.0138, "step": 78530 }, { "epoch": 0.4, "learning_rate": 0.00024056333906796292, "loss": 0.0198, "step": 78540 }, { "epoch": 0.4, "learning_rate": 0.0002405557713749489, "loss": 0.0174, "step": 78550 }, { "epoch": 0.4, "learning_rate": 0.00024054820368193486, "loss": 0.019, "step": 78560 }, { "epoch": 0.4, "learning_rate": 0.00024054063598892087, "loss": 0.0217, "step": 78570 }, { "epoch": 0.4, "learning_rate": 0.00024053306829590685, "loss": 0.0209, "step": 78580 }, { "epoch": 0.4, "learning_rate": 0.00024052550060289283, "loss": 0.0179, "step": 78590 }, { "epoch": 0.4, "learning_rate": 0.00024051793290987884, "loss": 0.0198, "step": 78600 }, { "epoch": 0.4, "learning_rate": 0.00024051036521686482, "loss": 0.0189, "step": 78610 }, { "epoch": 0.4, "learning_rate": 0.0002405027975238508, "loss": 0.0174, "step": 78620 }, { "epoch": 0.4, "learning_rate": 0.0002404952298308368, "loss": 0.0171, "step": 78630 }, { "epoch": 0.4, "learning_rate": 0.0002404876621378228, "loss": 0.0176, "step": 78640 }, { "epoch": 0.4, "learning_rate": 0.00024048009444480877, "loss": 0.0177, "step": 78650 }, { "epoch": 0.4, "learning_rate": 0.00024047252675179478, "loss": 0.0181, "step": 78660 }, { "epoch": 0.4, "learning_rate": 0.00024046495905878076, "loss": 0.0197, "step": 78670 }, { "epoch": 0.4, "learning_rate": 0.00024045739136576674, "loss": 0.0211, "step": 78680 }, { "epoch": 0.4, "learning_rate": 0.00024044982367275273, "loss": 0.0175, "step": 78690 }, { "epoch": 0.4, "learning_rate": 0.00024044225597973873, "loss": 0.0195, "step": 78700 }, { "epoch": 0.4, "learning_rate": 0.00024043468828672472, "loss": 0.0188, "step": 78710 }, { "epoch": 0.4, "learning_rate": 0.0002404271205937107, "loss": 0.0165, "step": 78720 }, { "epoch": 0.4, "learning_rate": 0.0002404195529006967, "loss": 0.0172, "step": 78730 }, { "epoch": 0.4, "learning_rate": 0.0002404119852076827, "loss": 0.019, "step": 78740 }, { "epoch": 0.4, "learning_rate": 0.00024040441751466867, "loss": 0.0166, "step": 78750 }, { "epoch": 0.4, "learning_rate": 0.00024039684982165468, "loss": 0.0156, "step": 78760 }, { "epoch": 0.4, "learning_rate": 0.00024038928212864066, "loss": 0.0173, "step": 78770 }, { "epoch": 0.4, "learning_rate": 0.00024038171443562664, "loss": 0.0184, "step": 78780 }, { "epoch": 0.4, "learning_rate": 0.00024037414674261265, "loss": 0.0189, "step": 78790 }, { "epoch": 0.4, "learning_rate": 0.00024036657904959863, "loss": 0.0171, "step": 78800 }, { "epoch": 0.4, "learning_rate": 0.0002403590113565846, "loss": 0.0196, "step": 78810 }, { "epoch": 0.4, "learning_rate": 0.00024035144366357062, "loss": 0.0153, "step": 78820 }, { "epoch": 0.4, "learning_rate": 0.0002403438759705566, "loss": 0.0188, "step": 78830 }, { "epoch": 0.4, "learning_rate": 0.00024033630827754258, "loss": 0.0178, "step": 78840 }, { "epoch": 0.4, "learning_rate": 0.0002403287405845286, "loss": 0.0221, "step": 78850 }, { "epoch": 0.4, "learning_rate": 0.00024032117289151457, "loss": 0.0166, "step": 78860 }, { "epoch": 0.4, "learning_rate": 0.00024031360519850055, "loss": 0.0216, "step": 78870 }, { "epoch": 0.4, "learning_rate": 0.00024030603750548654, "loss": 0.0176, "step": 78880 }, { "epoch": 0.4, "learning_rate": 0.00024029846981247254, "loss": 0.0192, "step": 78890 }, { "epoch": 0.4, "learning_rate": 0.00024029090211945853, "loss": 0.0182, "step": 78900 }, { "epoch": 0.4, "learning_rate": 0.0002402833344264445, "loss": 0.0208, "step": 78910 }, { "epoch": 0.4, "learning_rate": 0.00024027576673343052, "loss": 0.0182, "step": 78920 }, { "epoch": 0.4, "learning_rate": 0.0002402681990404165, "loss": 0.0192, "step": 78930 }, { "epoch": 0.4, "learning_rate": 0.00024026063134740248, "loss": 0.0141, "step": 78940 }, { "epoch": 0.4, "learning_rate": 0.0002402530636543885, "loss": 0.0166, "step": 78950 }, { "epoch": 0.4, "learning_rate": 0.00024024549596137447, "loss": 0.0179, "step": 78960 }, { "epoch": 0.4, "learning_rate": 0.00024023792826836045, "loss": 0.0154, "step": 78970 }, { "epoch": 0.4, "learning_rate": 0.00024023036057534646, "loss": 0.0157, "step": 78980 }, { "epoch": 0.4, "learning_rate": 0.00024022279288233244, "loss": 0.0167, "step": 78990 }, { "epoch": 0.4, "learning_rate": 0.00024021522518931842, "loss": 0.0181, "step": 79000 }, { "epoch": 0.4, "eval_cer": 0.914508101352053, "eval_loss": 0.012615088373422623, "eval_runtime": 116.5859, "eval_samples_per_second": 17.155, "eval_steps_per_second": 4.289, "step": 79000 }, { "epoch": 0.4, "learning_rate": 0.00024020765749630443, "loss": 0.0181, "step": 79010 }, { "epoch": 0.4, "learning_rate": 0.0002402000898032904, "loss": 0.0182, "step": 79020 }, { "epoch": 0.4, "learning_rate": 0.0002401925221102764, "loss": 0.0178, "step": 79030 }, { "epoch": 0.4, "learning_rate": 0.00024018495441726237, "loss": 0.019, "step": 79040 }, { "epoch": 0.4, "learning_rate": 0.00024017738672424838, "loss": 0.0146, "step": 79050 }, { "epoch": 0.4, "learning_rate": 0.00024016981903123436, "loss": 0.0158, "step": 79060 }, { "epoch": 0.4, "learning_rate": 0.00024016225133822035, "loss": 0.018, "step": 79070 }, { "epoch": 0.4, "learning_rate": 0.00024015468364520635, "loss": 0.0188, "step": 79080 }, { "epoch": 0.4, "learning_rate": 0.00024014711595219234, "loss": 0.0198, "step": 79090 }, { "epoch": 0.4, "learning_rate": 0.00024013954825917832, "loss": 0.02, "step": 79100 }, { "epoch": 0.4, "learning_rate": 0.00024013198056616433, "loss": 0.0146, "step": 79110 }, { "epoch": 0.4, "learning_rate": 0.0002401244128731503, "loss": 0.0169, "step": 79120 }, { "epoch": 0.4, "learning_rate": 0.0002401168451801363, "loss": 0.0132, "step": 79130 }, { "epoch": 0.4, "learning_rate": 0.0002401092774871223, "loss": 0.0181, "step": 79140 }, { "epoch": 0.4, "learning_rate": 0.00024010170979410828, "loss": 0.019, "step": 79150 }, { "epoch": 0.4, "learning_rate": 0.00024009414210109426, "loss": 0.022, "step": 79160 }, { "epoch": 0.4, "learning_rate": 0.00024008657440808027, "loss": 0.02, "step": 79170 }, { "epoch": 0.4, "learning_rate": 0.00024007900671506625, "loss": 0.0159, "step": 79180 }, { "epoch": 0.4, "learning_rate": 0.00024007143902205223, "loss": 0.0208, "step": 79190 }, { "epoch": 0.4, "learning_rate": 0.0002400638713290382, "loss": 0.0177, "step": 79200 }, { "epoch": 0.4, "learning_rate": 0.00024005630363602422, "loss": 0.0155, "step": 79210 }, { "epoch": 0.4, "learning_rate": 0.0002400487359430102, "loss": 0.0171, "step": 79220 }, { "epoch": 0.4, "learning_rate": 0.00024004116824999618, "loss": 0.0201, "step": 79230 }, { "epoch": 0.4, "learning_rate": 0.0002400336005569822, "loss": 0.0184, "step": 79240 }, { "epoch": 0.4, "learning_rate": 0.00024002603286396817, "loss": 0.021, "step": 79250 }, { "epoch": 0.4, "learning_rate": 0.00024001846517095416, "loss": 0.0165, "step": 79260 }, { "epoch": 0.4, "learning_rate": 0.00024001089747794016, "loss": 0.0173, "step": 79270 }, { "epoch": 0.4, "learning_rate": 0.00024000332978492615, "loss": 0.0199, "step": 79280 }, { "epoch": 0.4, "learning_rate": 0.00023999576209191213, "loss": 0.019, "step": 79290 }, { "epoch": 0.4, "learning_rate": 0.00023998819439889814, "loss": 0.018, "step": 79300 }, { "epoch": 0.4, "learning_rate": 0.00023998062670588412, "loss": 0.0199, "step": 79310 }, { "epoch": 0.4, "learning_rate": 0.0002399730590128701, "loss": 0.017, "step": 79320 }, { "epoch": 0.4, "learning_rate": 0.0002399654913198561, "loss": 0.0181, "step": 79330 }, { "epoch": 0.4, "learning_rate": 0.0002399579236268421, "loss": 0.0147, "step": 79340 }, { "epoch": 0.4, "learning_rate": 0.00023995035593382807, "loss": 0.0157, "step": 79350 }, { "epoch": 0.4, "learning_rate": 0.00023994278824081408, "loss": 0.0157, "step": 79360 }, { "epoch": 0.4, "learning_rate": 0.00023993522054780006, "loss": 0.0178, "step": 79370 }, { "epoch": 0.4, "learning_rate": 0.00023992765285478604, "loss": 0.0152, "step": 79380 }, { "epoch": 0.4, "learning_rate": 0.00023992008516177202, "loss": 0.0155, "step": 79390 }, { "epoch": 0.4, "learning_rate": 0.00023991251746875803, "loss": 0.017, "step": 79400 }, { "epoch": 0.4, "learning_rate": 0.000239904949775744, "loss": 0.0179, "step": 79410 }, { "epoch": 0.4, "learning_rate": 0.00023989738208273, "loss": 0.0212, "step": 79420 }, { "epoch": 0.4, "learning_rate": 0.000239889814389716, "loss": 0.0262, "step": 79430 }, { "epoch": 0.4, "learning_rate": 0.00023988224669670198, "loss": 0.0186, "step": 79440 }, { "epoch": 0.4, "learning_rate": 0.00023987467900368797, "loss": 0.0187, "step": 79450 }, { "epoch": 0.4, "learning_rate": 0.00023986711131067397, "loss": 0.0218, "step": 79460 }, { "epoch": 0.4, "learning_rate": 0.00023985954361765996, "loss": 0.0167, "step": 79470 }, { "epoch": 0.4, "learning_rate": 0.00023985197592464594, "loss": 0.02, "step": 79480 }, { "epoch": 0.4, "learning_rate": 0.00023984440823163195, "loss": 0.0144, "step": 79490 }, { "epoch": 0.4, "learning_rate": 0.00023983684053861793, "loss": 0.0187, "step": 79500 }, { "epoch": 0.4, "learning_rate": 0.0002398292728456039, "loss": 0.0156, "step": 79510 }, { "epoch": 0.4, "learning_rate": 0.00023982170515258992, "loss": 0.0184, "step": 79520 }, { "epoch": 0.4, "learning_rate": 0.0002398141374595759, "loss": 0.0161, "step": 79530 }, { "epoch": 0.4, "learning_rate": 0.00023980656976656188, "loss": 0.0204, "step": 79540 }, { "epoch": 0.4, "learning_rate": 0.00023979900207354786, "loss": 0.0165, "step": 79550 }, { "epoch": 0.4, "learning_rate": 0.00023979143438053387, "loss": 0.0173, "step": 79560 }, { "epoch": 0.4, "learning_rate": 0.00023978386668751985, "loss": 0.0168, "step": 79570 }, { "epoch": 0.4, "learning_rate": 0.00023977629899450583, "loss": 0.0165, "step": 79580 }, { "epoch": 0.4, "learning_rate": 0.00023976873130149184, "loss": 0.0189, "step": 79590 }, { "epoch": 0.4, "learning_rate": 0.00023976116360847782, "loss": 0.0212, "step": 79600 }, { "epoch": 0.4, "learning_rate": 0.0002397535959154638, "loss": 0.0217, "step": 79610 }, { "epoch": 0.4, "learning_rate": 0.0002397460282224498, "loss": 0.02, "step": 79620 }, { "epoch": 0.4, "learning_rate": 0.0002397384605294358, "loss": 0.0183, "step": 79630 }, { "epoch": 0.4, "learning_rate": 0.00023973089283642178, "loss": 0.0191, "step": 79640 }, { "epoch": 0.4, "learning_rate": 0.00023972332514340778, "loss": 0.0192, "step": 79650 }, { "epoch": 0.4, "learning_rate": 0.00023971575745039377, "loss": 0.021, "step": 79660 }, { "epoch": 0.4, "learning_rate": 0.00023970818975737975, "loss": 0.0147, "step": 79670 }, { "epoch": 0.4, "learning_rate": 0.00023970062206436576, "loss": 0.0186, "step": 79680 }, { "epoch": 0.4, "learning_rate": 0.00023969305437135174, "loss": 0.0195, "step": 79690 }, { "epoch": 0.4, "learning_rate": 0.00023968548667833772, "loss": 0.0194, "step": 79700 }, { "epoch": 0.4, "learning_rate": 0.0002396779189853237, "loss": 0.0176, "step": 79710 }, { "epoch": 0.4, "learning_rate": 0.0002396703512923097, "loss": 0.0189, "step": 79720 }, { "epoch": 0.4, "learning_rate": 0.0002396627835992957, "loss": 0.0164, "step": 79730 }, { "epoch": 0.4, "learning_rate": 0.00023965521590628167, "loss": 0.0141, "step": 79740 }, { "epoch": 0.4, "learning_rate": 0.00023964764821326768, "loss": 0.0162, "step": 79750 }, { "epoch": 0.4, "learning_rate": 0.00023964008052025366, "loss": 0.017, "step": 79760 }, { "epoch": 0.4, "learning_rate": 0.00023963251282723964, "loss": 0.0156, "step": 79770 }, { "epoch": 0.4, "learning_rate": 0.00023962494513422565, "loss": 0.0193, "step": 79780 }, { "epoch": 0.4, "learning_rate": 0.00023961737744121163, "loss": 0.0144, "step": 79790 }, { "epoch": 0.4, "learning_rate": 0.00023960980974819761, "loss": 0.0179, "step": 79800 }, { "epoch": 0.4, "learning_rate": 0.00023960224205518362, "loss": 0.0191, "step": 79810 }, { "epoch": 0.4, "learning_rate": 0.00023959467436216958, "loss": 0.019, "step": 79820 }, { "epoch": 0.4, "learning_rate": 0.00023958710666915556, "loss": 0.0188, "step": 79830 }, { "epoch": 0.4, "learning_rate": 0.00023957953897614154, "loss": 0.0194, "step": 79840 }, { "epoch": 0.4, "learning_rate": 0.00023957197128312755, "loss": 0.0162, "step": 79850 }, { "epoch": 0.4, "learning_rate": 0.00023956440359011353, "loss": 0.0175, "step": 79860 }, { "epoch": 0.4, "learning_rate": 0.0002395568358970995, "loss": 0.0164, "step": 79870 }, { "epoch": 0.4, "learning_rate": 0.00023954926820408552, "loss": 0.0181, "step": 79880 }, { "epoch": 0.4, "learning_rate": 0.0002395417005110715, "loss": 0.0226, "step": 79890 }, { "epoch": 0.4, "learning_rate": 0.00023953413281805748, "loss": 0.0207, "step": 79900 }, { "epoch": 0.4, "learning_rate": 0.0002395265651250435, "loss": 0.018, "step": 79910 }, { "epoch": 0.4, "learning_rate": 0.00023951899743202947, "loss": 0.0194, "step": 79920 }, { "epoch": 0.4, "learning_rate": 0.00023951142973901545, "loss": 0.0228, "step": 79930 }, { "epoch": 0.4, "learning_rate": 0.00023950386204600144, "loss": 0.0186, "step": 79940 }, { "epoch": 0.4, "learning_rate": 0.00023949629435298744, "loss": 0.0176, "step": 79950 }, { "epoch": 0.4, "learning_rate": 0.00023948872665997343, "loss": 0.0185, "step": 79960 }, { "epoch": 0.4, "learning_rate": 0.0002394811589669594, "loss": 0.0174, "step": 79970 }, { "epoch": 0.4, "learning_rate": 0.00023947359127394542, "loss": 0.0178, "step": 79980 }, { "epoch": 0.4, "learning_rate": 0.0002394660235809314, "loss": 0.0189, "step": 79990 }, { "epoch": 0.4, "learning_rate": 0.00023945845588791738, "loss": 0.0193, "step": 80000 }, { "epoch": 0.4, "eval_cer": 0.9145207165016832, "eval_loss": 0.012683646753430367, "eval_runtime": 116.5374, "eval_samples_per_second": 17.162, "eval_steps_per_second": 4.29, "step": 80000 }, { "epoch": 0.4, "learning_rate": 0.0002394508881949034, "loss": 0.021, "step": 80010 }, { "epoch": 0.4, "learning_rate": 0.00023944332050188937, "loss": 0.0137, "step": 80020 }, { "epoch": 0.4, "learning_rate": 0.00023943575280887535, "loss": 0.0192, "step": 80030 }, { "epoch": 0.4, "learning_rate": 0.00023942818511586136, "loss": 0.0183, "step": 80040 }, { "epoch": 0.4, "learning_rate": 0.00023942061742284734, "loss": 0.0167, "step": 80050 }, { "epoch": 0.4, "learning_rate": 0.00023941304972983332, "loss": 0.0149, "step": 80060 }, { "epoch": 0.4, "learning_rate": 0.00023940548203681933, "loss": 0.0176, "step": 80070 }, { "epoch": 0.4, "learning_rate": 0.0002393979143438053, "loss": 0.0176, "step": 80080 }, { "epoch": 0.4, "learning_rate": 0.0002393903466507913, "loss": 0.0201, "step": 80090 }, { "epoch": 0.4, "learning_rate": 0.00023938277895777727, "loss": 0.02, "step": 80100 }, { "epoch": 0.4, "learning_rate": 0.00023937521126476328, "loss": 0.0158, "step": 80110 }, { "epoch": 0.4, "learning_rate": 0.00023936764357174926, "loss": 0.0187, "step": 80120 }, { "epoch": 0.4, "learning_rate": 0.00023936007587873525, "loss": 0.0198, "step": 80130 }, { "epoch": 0.4, "learning_rate": 0.00023935250818572125, "loss": 0.02, "step": 80140 }, { "epoch": 0.4, "learning_rate": 0.00023934494049270724, "loss": 0.0166, "step": 80150 }, { "epoch": 0.4, "learning_rate": 0.00023933737279969322, "loss": 0.0193, "step": 80160 }, { "epoch": 0.4, "learning_rate": 0.00023932980510667923, "loss": 0.0182, "step": 80170 }, { "epoch": 0.4, "learning_rate": 0.0002393222374136652, "loss": 0.0185, "step": 80180 }, { "epoch": 0.4, "learning_rate": 0.0002393146697206512, "loss": 0.0176, "step": 80190 }, { "epoch": 0.4, "learning_rate": 0.0002393071020276372, "loss": 0.0157, "step": 80200 }, { "epoch": 0.4, "learning_rate": 0.00023929953433462318, "loss": 0.0172, "step": 80210 }, { "epoch": 0.4, "learning_rate": 0.00023929196664160916, "loss": 0.0128, "step": 80220 }, { "epoch": 0.4, "learning_rate": 0.00023928439894859517, "loss": 0.0185, "step": 80230 }, { "epoch": 0.4, "learning_rate": 0.00023927683125558115, "loss": 0.0202, "step": 80240 }, { "epoch": 0.4, "learning_rate": 0.00023926926356256713, "loss": 0.0162, "step": 80250 }, { "epoch": 0.4, "learning_rate": 0.00023926169586955314, "loss": 0.0162, "step": 80260 }, { "epoch": 0.4, "learning_rate": 0.00023925412817653912, "loss": 0.0159, "step": 80270 }, { "epoch": 0.41, "learning_rate": 0.0002392465604835251, "loss": 0.0347, "step": 80280 }, { "epoch": 0.41, "learning_rate": 0.00023923899279051108, "loss": 0.0174, "step": 80290 }, { "epoch": 0.41, "learning_rate": 0.0002392314250974971, "loss": 0.0184, "step": 80300 }, { "epoch": 0.41, "learning_rate": 0.00023922385740448307, "loss": 0.0195, "step": 80310 }, { "epoch": 0.41, "learning_rate": 0.00023921628971146906, "loss": 0.0182, "step": 80320 }, { "epoch": 0.41, "learning_rate": 0.00023920872201845506, "loss": 0.0161, "step": 80330 }, { "epoch": 0.41, "learning_rate": 0.00023920115432544105, "loss": 0.0174, "step": 80340 }, { "epoch": 0.41, "learning_rate": 0.00023919358663242703, "loss": 0.0167, "step": 80350 }, { "epoch": 0.41, "learning_rate": 0.00023918601893941304, "loss": 0.0167, "step": 80360 }, { "epoch": 0.41, "learning_rate": 0.00023917845124639902, "loss": 0.0205, "step": 80370 }, { "epoch": 0.41, "learning_rate": 0.000239170883553385, "loss": 0.02, "step": 80380 }, { "epoch": 0.41, "learning_rate": 0.000239163315860371, "loss": 0.0207, "step": 80390 }, { "epoch": 0.41, "learning_rate": 0.000239155748167357, "loss": 0.019, "step": 80400 }, { "epoch": 0.41, "learning_rate": 0.00023914818047434297, "loss": 0.0211, "step": 80410 }, { "epoch": 0.41, "learning_rate": 0.00023914061278132898, "loss": 0.0202, "step": 80420 }, { "epoch": 0.41, "learning_rate": 0.00023913304508831496, "loss": 0.0183, "step": 80430 }, { "epoch": 0.41, "learning_rate": 0.00023912547739530094, "loss": 0.018, "step": 80440 }, { "epoch": 0.41, "learning_rate": 0.00023911790970228692, "loss": 0.0182, "step": 80450 }, { "epoch": 0.41, "learning_rate": 0.00023911034200927293, "loss": 0.0173, "step": 80460 }, { "epoch": 0.41, "learning_rate": 0.0002391027743162589, "loss": 0.0227, "step": 80470 }, { "epoch": 0.41, "learning_rate": 0.0002390952066232449, "loss": 0.0166, "step": 80480 }, { "epoch": 0.41, "learning_rate": 0.0002390876389302309, "loss": 0.0164, "step": 80490 }, { "epoch": 0.41, "learning_rate": 0.00023908007123721688, "loss": 0.0159, "step": 80500 }, { "epoch": 0.41, "learning_rate": 0.00023907250354420287, "loss": 0.0175, "step": 80510 }, { "epoch": 0.41, "learning_rate": 0.00023906493585118887, "loss": 0.0194, "step": 80520 }, { "epoch": 0.41, "learning_rate": 0.00023905736815817486, "loss": 0.0196, "step": 80530 }, { "epoch": 0.41, "learning_rate": 0.00023904980046516084, "loss": 0.019, "step": 80540 }, { "epoch": 0.41, "learning_rate": 0.00023904223277214685, "loss": 0.0174, "step": 80550 }, { "epoch": 0.41, "learning_rate": 0.00023903466507913283, "loss": 0.0157, "step": 80560 }, { "epoch": 0.41, "learning_rate": 0.0002390270973861188, "loss": 0.0161, "step": 80570 }, { "epoch": 0.41, "learning_rate": 0.00023901952969310482, "loss": 0.0181, "step": 80580 }, { "epoch": 0.41, "learning_rate": 0.0002390119620000908, "loss": 0.0172, "step": 80590 }, { "epoch": 0.41, "learning_rate": 0.00023900439430707678, "loss": 0.0153, "step": 80600 }, { "epoch": 0.41, "learning_rate": 0.00023899682661406276, "loss": 0.0189, "step": 80610 }, { "epoch": 0.41, "learning_rate": 0.00023898925892104877, "loss": 0.0187, "step": 80620 }, { "epoch": 0.41, "learning_rate": 0.00023898169122803475, "loss": 0.0185, "step": 80630 }, { "epoch": 0.41, "learning_rate": 0.00023897412353502073, "loss": 0.015, "step": 80640 }, { "epoch": 0.41, "learning_rate": 0.00023896655584200674, "loss": 0.0205, "step": 80650 }, { "epoch": 0.41, "learning_rate": 0.00023895898814899272, "loss": 0.018, "step": 80660 }, { "epoch": 0.41, "learning_rate": 0.0002389514204559787, "loss": 0.0161, "step": 80670 }, { "epoch": 0.41, "learning_rate": 0.0002389438527629647, "loss": 0.0176, "step": 80680 }, { "epoch": 0.41, "learning_rate": 0.0002389362850699507, "loss": 0.0181, "step": 80690 }, { "epoch": 0.41, "learning_rate": 0.00023892871737693668, "loss": 0.015, "step": 80700 }, { "epoch": 0.41, "learning_rate": 0.00023892114968392268, "loss": 0.0183, "step": 80710 }, { "epoch": 0.41, "learning_rate": 0.00023891358199090867, "loss": 0.0204, "step": 80720 }, { "epoch": 0.41, "learning_rate": 0.00023890601429789465, "loss": 0.019, "step": 80730 }, { "epoch": 0.41, "learning_rate": 0.00023889844660488066, "loss": 0.0166, "step": 80740 }, { "epoch": 0.41, "learning_rate": 0.00023889087891186664, "loss": 0.0178, "step": 80750 }, { "epoch": 0.41, "learning_rate": 0.00023888331121885262, "loss": 0.0178, "step": 80760 }, { "epoch": 0.41, "learning_rate": 0.00023887574352583863, "loss": 0.0189, "step": 80770 }, { "epoch": 0.41, "learning_rate": 0.0002388681758328246, "loss": 0.016, "step": 80780 }, { "epoch": 0.41, "learning_rate": 0.0002388606081398106, "loss": 0.0165, "step": 80790 }, { "epoch": 0.41, "learning_rate": 0.00023885304044679657, "loss": 0.0181, "step": 80800 }, { "epoch": 0.41, "learning_rate": 0.00023884547275378258, "loss": 0.0173, "step": 80810 }, { "epoch": 0.41, "learning_rate": 0.00023883790506076856, "loss": 0.0173, "step": 80820 }, { "epoch": 0.41, "learning_rate": 0.00023883033736775454, "loss": 0.0159, "step": 80830 }, { "epoch": 0.41, "learning_rate": 0.00023882276967474055, "loss": 0.0154, "step": 80840 }, { "epoch": 0.41, "learning_rate": 0.00023881520198172653, "loss": 0.0167, "step": 80850 }, { "epoch": 0.41, "learning_rate": 0.00023880763428871252, "loss": 0.0255, "step": 80860 }, { "epoch": 0.41, "learning_rate": 0.00023880006659569852, "loss": 0.0181, "step": 80870 }, { "epoch": 0.41, "learning_rate": 0.0002387924989026845, "loss": 0.0139, "step": 80880 }, { "epoch": 0.41, "learning_rate": 0.0002387849312096705, "loss": 0.0164, "step": 80890 }, { "epoch": 0.41, "learning_rate": 0.0002387773635166565, "loss": 0.0188, "step": 80900 }, { "epoch": 0.41, "learning_rate": 0.00023876979582364248, "loss": 0.0154, "step": 80910 }, { "epoch": 0.41, "learning_rate": 0.00023876222813062846, "loss": 0.0137, "step": 80920 }, { "epoch": 0.41, "learning_rate": 0.00023875466043761447, "loss": 0.0185, "step": 80930 }, { "epoch": 0.41, "learning_rate": 0.00023874709274460045, "loss": 0.015, "step": 80940 }, { "epoch": 0.41, "learning_rate": 0.00023873952505158643, "loss": 0.0162, "step": 80950 }, { "epoch": 0.41, "learning_rate": 0.0002387319573585724, "loss": 0.0192, "step": 80960 }, { "epoch": 0.41, "learning_rate": 0.00023872438966555842, "loss": 0.0209, "step": 80970 }, { "epoch": 0.41, "learning_rate": 0.0002387168219725444, "loss": 0.0182, "step": 80980 }, { "epoch": 0.41, "learning_rate": 0.00023870925427953038, "loss": 0.0168, "step": 80990 }, { "epoch": 0.41, "learning_rate": 0.0002387016865865164, "loss": 0.016, "step": 81000 }, { "epoch": 0.41, "eval_cer": 0.9145090717481783, "eval_loss": 0.012487111613154411, "eval_runtime": 116.7617, "eval_samples_per_second": 17.129, "eval_steps_per_second": 4.282, "step": 81000 }, { "epoch": 0.41, "learning_rate": 0.00023869411889350237, "loss": 0.0197, "step": 81010 }, { "epoch": 0.41, "learning_rate": 0.00023868655120048835, "loss": 0.0159, "step": 81020 }, { "epoch": 0.41, "learning_rate": 0.00023867898350747436, "loss": 0.0203, "step": 81030 }, { "epoch": 0.41, "learning_rate": 0.00023867141581446034, "loss": 0.0169, "step": 81040 }, { "epoch": 0.41, "learning_rate": 0.00023866384812144633, "loss": 0.0194, "step": 81050 }, { "epoch": 0.41, "learning_rate": 0.00023865628042843233, "loss": 0.0174, "step": 81060 }, { "epoch": 0.41, "learning_rate": 0.0002386487127354183, "loss": 0.0177, "step": 81070 }, { "epoch": 0.41, "learning_rate": 0.00023864114504240427, "loss": 0.0169, "step": 81080 }, { "epoch": 0.41, "learning_rate": 0.00023863357734939025, "loss": 0.0198, "step": 81090 }, { "epoch": 0.41, "learning_rate": 0.00023862600965637626, "loss": 0.0161, "step": 81100 }, { "epoch": 0.41, "learning_rate": 0.00023861844196336224, "loss": 0.0203, "step": 81110 }, { "epoch": 0.41, "learning_rate": 0.00023861087427034822, "loss": 0.0186, "step": 81120 }, { "epoch": 0.41, "learning_rate": 0.00023860330657733423, "loss": 0.0194, "step": 81130 }, { "epoch": 0.41, "learning_rate": 0.0002385957388843202, "loss": 0.0222, "step": 81140 }, { "epoch": 0.41, "learning_rate": 0.0002385881711913062, "loss": 0.0179, "step": 81150 }, { "epoch": 0.41, "learning_rate": 0.0002385806034982922, "loss": 0.0176, "step": 81160 }, { "epoch": 0.41, "learning_rate": 0.00023857303580527818, "loss": 0.0206, "step": 81170 }, { "epoch": 0.41, "learning_rate": 0.00023856546811226417, "loss": 0.0173, "step": 81180 }, { "epoch": 0.41, "learning_rate": 0.00023855790041925015, "loss": 0.0187, "step": 81190 }, { "epoch": 0.41, "learning_rate": 0.00023855033272623616, "loss": 0.0167, "step": 81200 }, { "epoch": 0.41, "learning_rate": 0.00023854276503322214, "loss": 0.0172, "step": 81210 }, { "epoch": 0.41, "learning_rate": 0.00023853519734020812, "loss": 0.0161, "step": 81220 }, { "epoch": 0.41, "learning_rate": 0.00023852762964719413, "loss": 0.0163, "step": 81230 }, { "epoch": 0.41, "learning_rate": 0.0002385200619541801, "loss": 0.0138, "step": 81240 }, { "epoch": 0.41, "learning_rate": 0.0002385124942611661, "loss": 0.0166, "step": 81250 }, { "epoch": 0.41, "learning_rate": 0.0002385049265681521, "loss": 0.0182, "step": 81260 }, { "epoch": 0.41, "learning_rate": 0.00023849735887513808, "loss": 0.0202, "step": 81270 }, { "epoch": 0.41, "learning_rate": 0.00023848979118212406, "loss": 0.0228, "step": 81280 }, { "epoch": 0.41, "learning_rate": 0.00023848222348911007, "loss": 0.0169, "step": 81290 }, { "epoch": 0.41, "learning_rate": 0.00023847465579609605, "loss": 0.016, "step": 81300 }, { "epoch": 0.41, "learning_rate": 0.00023846708810308203, "loss": 0.0159, "step": 81310 }, { "epoch": 0.41, "learning_rate": 0.00023845952041006804, "loss": 0.0159, "step": 81320 }, { "epoch": 0.41, "learning_rate": 0.00023845195271705402, "loss": 0.0175, "step": 81330 }, { "epoch": 0.41, "learning_rate": 0.00023844438502404, "loss": 0.0187, "step": 81340 }, { "epoch": 0.41, "learning_rate": 0.00023843681733102599, "loss": 0.0149, "step": 81350 }, { "epoch": 0.41, "learning_rate": 0.000238429249638012, "loss": 0.0195, "step": 81360 }, { "epoch": 0.41, "learning_rate": 0.00023842168194499798, "loss": 0.0214, "step": 81370 }, { "epoch": 0.41, "learning_rate": 0.00023841411425198396, "loss": 0.0185, "step": 81380 }, { "epoch": 0.41, "learning_rate": 0.00023840654655896997, "loss": 0.0145, "step": 81390 }, { "epoch": 0.41, "learning_rate": 0.00023839897886595595, "loss": 0.0149, "step": 81400 }, { "epoch": 0.41, "learning_rate": 0.00023839141117294193, "loss": 0.0151, "step": 81410 }, { "epoch": 0.41, "learning_rate": 0.00023838384347992794, "loss": 0.0137, "step": 81420 }, { "epoch": 0.41, "learning_rate": 0.00023837627578691392, "loss": 0.0121, "step": 81430 }, { "epoch": 0.41, "learning_rate": 0.0002383687080938999, "loss": 0.0143, "step": 81440 }, { "epoch": 0.41, "learning_rate": 0.0002383611404008859, "loss": 0.0172, "step": 81450 }, { "epoch": 0.41, "learning_rate": 0.0002383535727078719, "loss": 0.0164, "step": 81460 }, { "epoch": 0.41, "learning_rate": 0.00023834600501485787, "loss": 0.0186, "step": 81470 }, { "epoch": 0.41, "learning_rate": 0.00023833843732184388, "loss": 0.0154, "step": 81480 }, { "epoch": 0.41, "learning_rate": 0.00023833086962882986, "loss": 0.013, "step": 81490 }, { "epoch": 0.41, "learning_rate": 0.00023832330193581584, "loss": 0.0175, "step": 81500 }, { "epoch": 0.41, "learning_rate": 0.00023831573424280182, "loss": 0.0172, "step": 81510 }, { "epoch": 0.41, "learning_rate": 0.00023830816654978783, "loss": 0.0157, "step": 81520 }, { "epoch": 0.41, "learning_rate": 0.00023830059885677381, "loss": 0.0181, "step": 81530 }, { "epoch": 0.41, "learning_rate": 0.0002382930311637598, "loss": 0.0198, "step": 81540 }, { "epoch": 0.41, "learning_rate": 0.0002382854634707458, "loss": 0.0143, "step": 81550 }, { "epoch": 0.41, "learning_rate": 0.00023827789577773179, "loss": 0.0163, "step": 81560 }, { "epoch": 0.41, "learning_rate": 0.00023827032808471777, "loss": 0.0148, "step": 81570 }, { "epoch": 0.41, "learning_rate": 0.00023826276039170378, "loss": 0.0155, "step": 81580 }, { "epoch": 0.41, "learning_rate": 0.00023825519269868976, "loss": 0.0201, "step": 81590 }, { "epoch": 0.41, "learning_rate": 0.00023824762500567574, "loss": 0.0193, "step": 81600 }, { "epoch": 0.41, "learning_rate": 0.00023824005731266175, "loss": 0.0149, "step": 81610 }, { "epoch": 0.41, "learning_rate": 0.00023823248961964773, "loss": 0.0212, "step": 81620 }, { "epoch": 0.41, "learning_rate": 0.0002382249219266337, "loss": 0.0181, "step": 81630 }, { "epoch": 0.41, "learning_rate": 0.00023821735423361972, "loss": 0.0172, "step": 81640 }, { "epoch": 0.41, "learning_rate": 0.0002382097865406057, "loss": 0.0236, "step": 81650 }, { "epoch": 0.41, "learning_rate": 0.00023820221884759168, "loss": 0.0255, "step": 81660 }, { "epoch": 0.41, "learning_rate": 0.00023819465115457766, "loss": 0.0179, "step": 81670 }, { "epoch": 0.41, "learning_rate": 0.00023818708346156367, "loss": 0.0173, "step": 81680 }, { "epoch": 0.41, "learning_rate": 0.00023817951576854965, "loss": 0.0176, "step": 81690 }, { "epoch": 0.41, "learning_rate": 0.00023817194807553563, "loss": 0.0169, "step": 81700 }, { "epoch": 0.41, "learning_rate": 0.00023816438038252164, "loss": 0.0199, "step": 81710 }, { "epoch": 0.41, "learning_rate": 0.00023815681268950762, "loss": 0.016, "step": 81720 }, { "epoch": 0.41, "learning_rate": 0.0002381492449964936, "loss": 0.0171, "step": 81730 }, { "epoch": 0.41, "learning_rate": 0.00023814167730347961, "loss": 0.0189, "step": 81740 }, { "epoch": 0.41, "learning_rate": 0.0002381341096104656, "loss": 0.018, "step": 81750 }, { "epoch": 0.41, "learning_rate": 0.00023812654191745158, "loss": 0.0158, "step": 81760 }, { "epoch": 0.41, "learning_rate": 0.00023811897422443759, "loss": 0.0141, "step": 81770 }, { "epoch": 0.41, "learning_rate": 0.00023811140653142357, "loss": 0.0172, "step": 81780 }, { "epoch": 0.41, "learning_rate": 0.00023810383883840955, "loss": 0.0135, "step": 81790 }, { "epoch": 0.41, "learning_rate": 0.00023809627114539556, "loss": 0.0158, "step": 81800 }, { "epoch": 0.41, "learning_rate": 0.00023808870345238154, "loss": 0.0172, "step": 81810 }, { "epoch": 0.41, "learning_rate": 0.00023808113575936752, "loss": 0.0173, "step": 81820 }, { "epoch": 0.41, "learning_rate": 0.00023807356806635353, "loss": 0.0211, "step": 81830 }, { "epoch": 0.41, "learning_rate": 0.0002380660003733395, "loss": 0.0167, "step": 81840 }, { "epoch": 0.41, "learning_rate": 0.0002380584326803255, "loss": 0.0176, "step": 81850 }, { "epoch": 0.41, "learning_rate": 0.00023805086498731147, "loss": 0.0185, "step": 81860 }, { "epoch": 0.41, "learning_rate": 0.00023804329729429748, "loss": 0.0159, "step": 81870 }, { "epoch": 0.41, "learning_rate": 0.00023803572960128346, "loss": 0.0178, "step": 81880 }, { "epoch": 0.41, "learning_rate": 0.00023802816190826944, "loss": 0.0198, "step": 81890 }, { "epoch": 0.41, "learning_rate": 0.00023802059421525545, "loss": 0.0191, "step": 81900 }, { "epoch": 0.41, "learning_rate": 0.00023801302652224143, "loss": 0.0179, "step": 81910 }, { "epoch": 0.41, "learning_rate": 0.00023800545882922742, "loss": 0.0177, "step": 81920 }, { "epoch": 0.41, "learning_rate": 0.00023799789113621342, "loss": 0.0173, "step": 81930 }, { "epoch": 0.41, "learning_rate": 0.0002379903234431994, "loss": 0.0204, "step": 81940 }, { "epoch": 0.41, "learning_rate": 0.0002379827557501854, "loss": 0.0158, "step": 81950 }, { "epoch": 0.41, "learning_rate": 0.0002379751880571714, "loss": 0.015, "step": 81960 }, { "epoch": 0.41, "learning_rate": 0.00023796762036415738, "loss": 0.0147, "step": 81970 }, { "epoch": 0.41, "learning_rate": 0.00023796005267114336, "loss": 0.0162, "step": 81980 }, { "epoch": 0.41, "learning_rate": 0.00023795248497812937, "loss": 0.016, "step": 81990 }, { "epoch": 0.41, "learning_rate": 0.00023794491728511535, "loss": 0.0146, "step": 82000 }, { "epoch": 0.41, "eval_cer": 0.9144935454101719, "eval_loss": 0.012472189962863922, "eval_runtime": 116.6656, "eval_samples_per_second": 17.143, "eval_steps_per_second": 4.286, "step": 82000 }, { "epoch": 0.41, "learning_rate": 0.00023793734959210133, "loss": 0.0162, "step": 82010 }, { "epoch": 0.41, "learning_rate": 0.0002379297818990873, "loss": 0.0168, "step": 82020 }, { "epoch": 0.41, "learning_rate": 0.00023792221420607332, "loss": 0.0198, "step": 82030 }, { "epoch": 0.41, "learning_rate": 0.0002379146465130593, "loss": 0.0183, "step": 82040 }, { "epoch": 0.41, "learning_rate": 0.00023790707882004528, "loss": 0.0302, "step": 82050 }, { "epoch": 0.41, "learning_rate": 0.0002378995111270313, "loss": 0.0161, "step": 82060 }, { "epoch": 0.41, "learning_rate": 0.00023789194343401727, "loss": 0.018, "step": 82070 }, { "epoch": 0.41, "learning_rate": 0.00023788437574100325, "loss": 0.0202, "step": 82080 }, { "epoch": 0.41, "learning_rate": 0.00023787680804798926, "loss": 0.019, "step": 82090 }, { "epoch": 0.41, "learning_rate": 0.00023786924035497524, "loss": 0.023, "step": 82100 }, { "epoch": 0.41, "learning_rate": 0.00023786167266196123, "loss": 0.0193, "step": 82110 }, { "epoch": 0.41, "learning_rate": 0.00023785410496894723, "loss": 0.0151, "step": 82120 }, { "epoch": 0.41, "learning_rate": 0.00023784653727593322, "loss": 0.0216, "step": 82130 }, { "epoch": 0.41, "learning_rate": 0.0002378389695829192, "loss": 0.0253, "step": 82140 }, { "epoch": 0.41, "learning_rate": 0.0002378314018899052, "loss": 0.0196, "step": 82150 }, { "epoch": 0.41, "learning_rate": 0.0002378238341968912, "loss": 0.0166, "step": 82160 }, { "epoch": 0.41, "learning_rate": 0.00023781626650387717, "loss": 0.0154, "step": 82170 }, { "epoch": 0.41, "learning_rate": 0.00023780869881086315, "loss": 0.0148, "step": 82180 }, { "epoch": 0.41, "learning_rate": 0.00023780113111784916, "loss": 0.0206, "step": 82190 }, { "epoch": 0.41, "learning_rate": 0.00023779356342483514, "loss": 0.0171, "step": 82200 }, { "epoch": 0.41, "learning_rate": 0.00023778599573182112, "loss": 0.0161, "step": 82210 }, { "epoch": 0.41, "learning_rate": 0.00023777842803880713, "loss": 0.0177, "step": 82220 }, { "epoch": 0.41, "learning_rate": 0.0002377708603457931, "loss": 0.0166, "step": 82230 }, { "epoch": 0.41, "learning_rate": 0.0002377632926527791, "loss": 0.0183, "step": 82240 }, { "epoch": 0.41, "learning_rate": 0.0002377557249597651, "loss": 0.0222, "step": 82250 }, { "epoch": 0.42, "learning_rate": 0.00023774815726675108, "loss": 0.0154, "step": 82260 }, { "epoch": 0.42, "learning_rate": 0.00023774058957373706, "loss": 0.0174, "step": 82270 }, { "epoch": 0.42, "learning_rate": 0.00023773302188072307, "loss": 0.0222, "step": 82280 }, { "epoch": 0.42, "learning_rate": 0.00023772545418770905, "loss": 0.017, "step": 82290 }, { "epoch": 0.42, "learning_rate": 0.00023771788649469504, "loss": 0.0132, "step": 82300 }, { "epoch": 0.42, "learning_rate": 0.00023771031880168104, "loss": 0.0185, "step": 82310 }, { "epoch": 0.42, "learning_rate": 0.00023770275110866703, "loss": 0.0154, "step": 82320 }, { "epoch": 0.42, "learning_rate": 0.00023769518341565298, "loss": 0.0219, "step": 82330 }, { "epoch": 0.42, "learning_rate": 0.00023768761572263896, "loss": 0.0168, "step": 82340 }, { "epoch": 0.42, "learning_rate": 0.00023768004802962497, "loss": 0.0198, "step": 82350 }, { "epoch": 0.42, "learning_rate": 0.00023767248033661095, "loss": 0.0175, "step": 82360 }, { "epoch": 0.42, "learning_rate": 0.00023766491264359693, "loss": 0.0187, "step": 82370 }, { "epoch": 0.42, "learning_rate": 0.00023765734495058294, "loss": 0.0216, "step": 82380 }, { "epoch": 0.42, "learning_rate": 0.00023764977725756892, "loss": 0.0176, "step": 82390 }, { "epoch": 0.42, "learning_rate": 0.0002376422095645549, "loss": 0.0199, "step": 82400 }, { "epoch": 0.42, "learning_rate": 0.00023763464187154089, "loss": 0.0169, "step": 82410 }, { "epoch": 0.42, "learning_rate": 0.0002376270741785269, "loss": 0.017, "step": 82420 }, { "epoch": 0.42, "learning_rate": 0.00023761950648551288, "loss": 0.0212, "step": 82430 }, { "epoch": 0.42, "learning_rate": 0.00023761193879249886, "loss": 0.017, "step": 82440 }, { "epoch": 0.42, "learning_rate": 0.00023760437109948487, "loss": 0.0159, "step": 82450 }, { "epoch": 0.42, "learning_rate": 0.00023759680340647085, "loss": 0.0241, "step": 82460 }, { "epoch": 0.42, "learning_rate": 0.00023758923571345683, "loss": 0.0181, "step": 82470 }, { "epoch": 0.42, "learning_rate": 0.00023758166802044284, "loss": 0.0194, "step": 82480 }, { "epoch": 0.42, "learning_rate": 0.00023757410032742882, "loss": 0.0193, "step": 82490 }, { "epoch": 0.42, "learning_rate": 0.0002375665326344148, "loss": 0.0213, "step": 82500 }, { "epoch": 0.42, "learning_rate": 0.0002375589649414008, "loss": 0.02, "step": 82510 }, { "epoch": 0.42, "learning_rate": 0.0002375513972483868, "loss": 0.0183, "step": 82520 }, { "epoch": 0.42, "learning_rate": 0.00023754382955537277, "loss": 0.022, "step": 82530 }, { "epoch": 0.42, "learning_rate": 0.00023753626186235878, "loss": 0.0179, "step": 82540 }, { "epoch": 0.42, "learning_rate": 0.00023752869416934476, "loss": 0.0168, "step": 82550 }, { "epoch": 0.42, "learning_rate": 0.00023752112647633074, "loss": 0.0143, "step": 82560 }, { "epoch": 0.42, "learning_rate": 0.00023751355878331672, "loss": 0.0146, "step": 82570 }, { "epoch": 0.42, "learning_rate": 0.00023750599109030273, "loss": 0.0178, "step": 82580 }, { "epoch": 0.42, "learning_rate": 0.00023749842339728871, "loss": 0.0188, "step": 82590 }, { "epoch": 0.42, "learning_rate": 0.0002374908557042747, "loss": 0.0206, "step": 82600 }, { "epoch": 0.42, "learning_rate": 0.0002374832880112607, "loss": 0.0159, "step": 82610 }, { "epoch": 0.42, "learning_rate": 0.00023747572031824669, "loss": 0.014, "step": 82620 }, { "epoch": 0.42, "learning_rate": 0.00023746815262523267, "loss": 0.016, "step": 82630 }, { "epoch": 0.42, "learning_rate": 0.00023746058493221868, "loss": 0.0213, "step": 82640 }, { "epoch": 0.42, "learning_rate": 0.00023745301723920466, "loss": 0.0156, "step": 82650 }, { "epoch": 0.42, "learning_rate": 0.00023744544954619064, "loss": 0.0224, "step": 82660 }, { "epoch": 0.42, "learning_rate": 0.00023743788185317665, "loss": 0.0151, "step": 82670 }, { "epoch": 0.42, "learning_rate": 0.00023743031416016263, "loss": 0.0174, "step": 82680 }, { "epoch": 0.42, "learning_rate": 0.0002374227464671486, "loss": 0.0157, "step": 82690 }, { "epoch": 0.42, "learning_rate": 0.00023741517877413462, "loss": 0.0215, "step": 82700 }, { "epoch": 0.42, "learning_rate": 0.0002374076110811206, "loss": 0.0198, "step": 82710 }, { "epoch": 0.42, "learning_rate": 0.00023740004338810658, "loss": 0.0164, "step": 82720 }, { "epoch": 0.42, "learning_rate": 0.0002373924756950926, "loss": 0.0185, "step": 82730 }, { "epoch": 0.42, "learning_rate": 0.00023738490800207857, "loss": 0.0238, "step": 82740 }, { "epoch": 0.42, "learning_rate": 0.00023737734030906455, "loss": 0.018, "step": 82750 }, { "epoch": 0.42, "learning_rate": 0.00023736977261605053, "loss": 0.0216, "step": 82760 }, { "epoch": 0.42, "learning_rate": 0.00023736220492303654, "loss": 0.0214, "step": 82770 }, { "epoch": 0.42, "learning_rate": 0.00023735463723002252, "loss": 0.0169, "step": 82780 }, { "epoch": 0.42, "learning_rate": 0.0002373470695370085, "loss": 0.0182, "step": 82790 }, { "epoch": 0.42, "learning_rate": 0.00023733950184399451, "loss": 0.017, "step": 82800 }, { "epoch": 0.42, "learning_rate": 0.0002373319341509805, "loss": 0.0162, "step": 82810 }, { "epoch": 0.42, "learning_rate": 0.00023732436645796648, "loss": 0.0156, "step": 82820 }, { "epoch": 0.42, "learning_rate": 0.00023731679876495249, "loss": 0.0242, "step": 82830 }, { "epoch": 0.42, "learning_rate": 0.00023730923107193847, "loss": 0.0193, "step": 82840 }, { "epoch": 0.42, "learning_rate": 0.00023730166337892445, "loss": 0.0184, "step": 82850 }, { "epoch": 0.42, "learning_rate": 0.00023729409568591046, "loss": 0.019, "step": 82860 }, { "epoch": 0.42, "learning_rate": 0.00023728652799289644, "loss": 0.018, "step": 82870 }, { "epoch": 0.42, "learning_rate": 0.00023727896029988242, "loss": 0.0199, "step": 82880 }, { "epoch": 0.42, "learning_rate": 0.00023727139260686843, "loss": 0.0158, "step": 82890 }, { "epoch": 0.42, "learning_rate": 0.0002372638249138544, "loss": 0.0187, "step": 82900 }, { "epoch": 0.42, "learning_rate": 0.0002372562572208404, "loss": 0.0158, "step": 82910 }, { "epoch": 0.42, "learning_rate": 0.00023724868952782637, "loss": 0.0192, "step": 82920 }, { "epoch": 0.42, "learning_rate": 0.00023724112183481238, "loss": 0.0194, "step": 82930 }, { "epoch": 0.42, "learning_rate": 0.00023723355414179836, "loss": 0.0164, "step": 82940 }, { "epoch": 0.42, "learning_rate": 0.00023722598644878434, "loss": 0.0245, "step": 82950 }, { "epoch": 0.42, "learning_rate": 0.00023721841875577035, "loss": 0.0205, "step": 82960 }, { "epoch": 0.42, "learning_rate": 0.00023721085106275633, "loss": 0.0172, "step": 82970 }, { "epoch": 0.42, "learning_rate": 0.00023720328336974232, "loss": 0.0163, "step": 82980 }, { "epoch": 0.42, "learning_rate": 0.00023719571567672832, "loss": 0.0156, "step": 82990 }, { "epoch": 0.42, "learning_rate": 0.0002371881479837143, "loss": 0.0169, "step": 83000 }, { "epoch": 0.42, "eval_cer": 0.9144954862024227, "eval_loss": 0.012444199062883854, "eval_runtime": 116.798, "eval_samples_per_second": 17.124, "eval_steps_per_second": 4.281, "step": 83000 }, { "epoch": 0.42, "learning_rate": 0.0002371805802907003, "loss": 0.0181, "step": 83010 }, { "epoch": 0.42, "learning_rate": 0.0002371730125976863, "loss": 0.0159, "step": 83020 }, { "epoch": 0.42, "learning_rate": 0.00023716544490467228, "loss": 0.0158, "step": 83030 }, { "epoch": 0.42, "learning_rate": 0.00023715787721165826, "loss": 0.0195, "step": 83040 }, { "epoch": 0.42, "learning_rate": 0.00023715030951864427, "loss": 0.0186, "step": 83050 }, { "epoch": 0.42, "learning_rate": 0.00023714274182563025, "loss": 0.0142, "step": 83060 }, { "epoch": 0.42, "learning_rate": 0.00023713517413261623, "loss": 0.0178, "step": 83070 }, { "epoch": 0.42, "learning_rate": 0.0002371276064396022, "loss": 0.0168, "step": 83080 }, { "epoch": 0.42, "learning_rate": 0.00023712003874658822, "loss": 0.0164, "step": 83090 }, { "epoch": 0.42, "learning_rate": 0.0002371124710535742, "loss": 0.017, "step": 83100 }, { "epoch": 0.42, "learning_rate": 0.00023710490336056018, "loss": 0.0191, "step": 83110 }, { "epoch": 0.42, "learning_rate": 0.0002370973356675462, "loss": 0.02, "step": 83120 }, { "epoch": 0.42, "learning_rate": 0.00023708976797453217, "loss": 0.0158, "step": 83130 }, { "epoch": 0.42, "learning_rate": 0.00023708220028151815, "loss": 0.0154, "step": 83140 }, { "epoch": 0.42, "learning_rate": 0.00023707463258850416, "loss": 0.0183, "step": 83150 }, { "epoch": 0.42, "learning_rate": 0.00023706706489549014, "loss": 0.0162, "step": 83160 }, { "epoch": 0.42, "learning_rate": 0.00023705949720247613, "loss": 0.0193, "step": 83170 }, { "epoch": 0.42, "learning_rate": 0.00023705192950946213, "loss": 0.0179, "step": 83180 }, { "epoch": 0.42, "learning_rate": 0.00023704436181644812, "loss": 0.0192, "step": 83190 }, { "epoch": 0.42, "learning_rate": 0.0002370367941234341, "loss": 0.0184, "step": 83200 }, { "epoch": 0.42, "learning_rate": 0.0002370292264304201, "loss": 0.0184, "step": 83210 }, { "epoch": 0.42, "learning_rate": 0.0002370216587374061, "loss": 0.016, "step": 83220 }, { "epoch": 0.42, "learning_rate": 0.00023701409104439207, "loss": 0.0147, "step": 83230 }, { "epoch": 0.42, "learning_rate": 0.00023700652335137808, "loss": 0.0153, "step": 83240 }, { "epoch": 0.42, "learning_rate": 0.00023699895565836406, "loss": 0.016, "step": 83250 }, { "epoch": 0.42, "learning_rate": 0.00023699138796535004, "loss": 0.0157, "step": 83260 }, { "epoch": 0.42, "learning_rate": 0.00023698382027233602, "loss": 0.0171, "step": 83270 }, { "epoch": 0.42, "learning_rate": 0.00023697625257932203, "loss": 0.0229, "step": 83280 }, { "epoch": 0.42, "learning_rate": 0.000236968684886308, "loss": 0.0139, "step": 83290 }, { "epoch": 0.42, "learning_rate": 0.000236961117193294, "loss": 0.0156, "step": 83300 }, { "epoch": 0.42, "learning_rate": 0.00023695354950028, "loss": 0.0161, "step": 83310 }, { "epoch": 0.42, "learning_rate": 0.00023694598180726598, "loss": 0.0163, "step": 83320 }, { "epoch": 0.42, "learning_rate": 0.00023693841411425196, "loss": 0.016, "step": 83330 }, { "epoch": 0.42, "learning_rate": 0.00023693084642123797, "loss": 0.0206, "step": 83340 }, { "epoch": 0.42, "learning_rate": 0.00023692327872822395, "loss": 0.0136, "step": 83350 }, { "epoch": 0.42, "learning_rate": 0.00023691571103520994, "loss": 0.0184, "step": 83360 }, { "epoch": 0.42, "learning_rate": 0.00023690814334219594, "loss": 0.0152, "step": 83370 }, { "epoch": 0.42, "learning_rate": 0.00023690057564918193, "loss": 0.0183, "step": 83380 }, { "epoch": 0.42, "learning_rate": 0.0002368930079561679, "loss": 0.0157, "step": 83390 }, { "epoch": 0.42, "learning_rate": 0.00023688544026315392, "loss": 0.0207, "step": 83400 }, { "epoch": 0.42, "learning_rate": 0.0002368778725701399, "loss": 0.0177, "step": 83410 }, { "epoch": 0.42, "learning_rate": 0.00023687030487712588, "loss": 0.019, "step": 83420 }, { "epoch": 0.42, "learning_rate": 0.00023686273718411186, "loss": 0.0185, "step": 83430 }, { "epoch": 0.42, "learning_rate": 0.00023685516949109787, "loss": 0.0183, "step": 83440 }, { "epoch": 0.42, "learning_rate": 0.00023684760179808385, "loss": 0.0154, "step": 83450 }, { "epoch": 0.42, "learning_rate": 0.00023684003410506983, "loss": 0.0177, "step": 83460 }, { "epoch": 0.42, "learning_rate": 0.00023683246641205584, "loss": 0.0152, "step": 83470 }, { "epoch": 0.42, "learning_rate": 0.00023682489871904182, "loss": 0.0165, "step": 83480 }, { "epoch": 0.42, "learning_rate": 0.0002368173310260278, "loss": 0.0183, "step": 83490 }, { "epoch": 0.42, "learning_rate": 0.0002368097633330138, "loss": 0.0172, "step": 83500 }, { "epoch": 0.42, "learning_rate": 0.0002368021956399998, "loss": 0.0186, "step": 83510 }, { "epoch": 0.42, "learning_rate": 0.00023679462794698577, "loss": 0.0145, "step": 83520 }, { "epoch": 0.42, "learning_rate": 0.00023678706025397178, "loss": 0.0164, "step": 83530 }, { "epoch": 0.42, "learning_rate": 0.00023677949256095776, "loss": 0.0151, "step": 83540 }, { "epoch": 0.42, "learning_rate": 0.00023677192486794375, "loss": 0.0167, "step": 83550 }, { "epoch": 0.42, "learning_rate": 0.00023676435717492975, "loss": 0.0142, "step": 83560 }, { "epoch": 0.42, "learning_rate": 0.00023675678948191574, "loss": 0.0206, "step": 83570 }, { "epoch": 0.42, "learning_rate": 0.00023674922178890172, "loss": 0.022, "step": 83580 }, { "epoch": 0.42, "learning_rate": 0.00023674165409588767, "loss": 0.0183, "step": 83590 }, { "epoch": 0.42, "learning_rate": 0.00023673408640287368, "loss": 0.035, "step": 83600 }, { "epoch": 0.42, "learning_rate": 0.00023672651870985966, "loss": 0.0205, "step": 83610 }, { "epoch": 0.42, "learning_rate": 0.00023671895101684564, "loss": 0.0173, "step": 83620 }, { "epoch": 0.42, "learning_rate": 0.00023671138332383165, "loss": 0.018, "step": 83630 }, { "epoch": 0.42, "learning_rate": 0.00023670381563081763, "loss": 0.016, "step": 83640 }, { "epoch": 0.42, "learning_rate": 0.00023669624793780361, "loss": 0.0148, "step": 83650 }, { "epoch": 0.42, "learning_rate": 0.0002366886802447896, "loss": 0.0175, "step": 83660 }, { "epoch": 0.42, "learning_rate": 0.0002366811125517756, "loss": 0.0166, "step": 83670 }, { "epoch": 0.42, "learning_rate": 0.00023667354485876159, "loss": 0.0138, "step": 83680 }, { "epoch": 0.42, "learning_rate": 0.00023666597716574757, "loss": 0.0194, "step": 83690 }, { "epoch": 0.42, "learning_rate": 0.00023665840947273358, "loss": 0.016, "step": 83700 }, { "epoch": 0.42, "learning_rate": 0.00023665084177971956, "loss": 0.0191, "step": 83710 }, { "epoch": 0.42, "learning_rate": 0.00023664327408670554, "loss": 0.0181, "step": 83720 }, { "epoch": 0.42, "learning_rate": 0.00023663570639369155, "loss": 0.0185, "step": 83730 }, { "epoch": 0.42, "learning_rate": 0.00023662813870067753, "loss": 0.0172, "step": 83740 }, { "epoch": 0.42, "learning_rate": 0.0002366205710076635, "loss": 0.0171, "step": 83750 }, { "epoch": 0.42, "learning_rate": 0.00023661300331464952, "loss": 0.0184, "step": 83760 }, { "epoch": 0.42, "learning_rate": 0.0002366054356216355, "loss": 0.0223, "step": 83770 }, { "epoch": 0.42, "learning_rate": 0.00023659786792862148, "loss": 0.0146, "step": 83780 }, { "epoch": 0.42, "learning_rate": 0.0002365903002356075, "loss": 0.018, "step": 83790 }, { "epoch": 0.42, "learning_rate": 0.00023658273254259347, "loss": 0.0158, "step": 83800 }, { "epoch": 0.42, "learning_rate": 0.00023657516484957945, "loss": 0.0166, "step": 83810 }, { "epoch": 0.42, "learning_rate": 0.00023656759715656543, "loss": 0.0176, "step": 83820 }, { "epoch": 0.42, "learning_rate": 0.00023656002946355144, "loss": 0.0176, "step": 83830 }, { "epoch": 0.42, "learning_rate": 0.00023655246177053742, "loss": 0.0173, "step": 83840 }, { "epoch": 0.42, "learning_rate": 0.0002365448940775234, "loss": 0.0143, "step": 83850 }, { "epoch": 0.42, "learning_rate": 0.00023653732638450941, "loss": 0.0168, "step": 83860 }, { "epoch": 0.42, "learning_rate": 0.0002365297586914954, "loss": 0.0139, "step": 83870 }, { "epoch": 0.42, "learning_rate": 0.00023652219099848138, "loss": 0.0139, "step": 83880 }, { "epoch": 0.42, "learning_rate": 0.00023651462330546739, "loss": 0.019, "step": 83890 }, { "epoch": 0.42, "learning_rate": 0.00023650705561245337, "loss": 0.0175, "step": 83900 }, { "epoch": 0.42, "learning_rate": 0.00023649948791943935, "loss": 0.0185, "step": 83910 }, { "epoch": 0.42, "learning_rate": 0.00023649192022642536, "loss": 0.0187, "step": 83920 }, { "epoch": 0.42, "learning_rate": 0.00023648435253341134, "loss": 0.0206, "step": 83930 }, { "epoch": 0.42, "learning_rate": 0.00023647678484039732, "loss": 0.0166, "step": 83940 }, { "epoch": 0.42, "learning_rate": 0.00023646921714738333, "loss": 0.0219, "step": 83950 }, { "epoch": 0.42, "learning_rate": 0.0002364616494543693, "loss": 0.0189, "step": 83960 }, { "epoch": 0.42, "learning_rate": 0.0002364540817613553, "loss": 0.02, "step": 83970 }, { "epoch": 0.42, "learning_rate": 0.00023644651406834127, "loss": 0.02, "step": 83980 }, { "epoch": 0.42, "learning_rate": 0.00023643894637532728, "loss": 0.0191, "step": 83990 }, { "epoch": 0.42, "learning_rate": 0.00023643137868231326, "loss": 0.0162, "step": 84000 }, { "epoch": 0.42, "eval_cer": 0.9144935454101719, "eval_loss": 0.012893411330878735, "eval_runtime": 116.7828, "eval_samples_per_second": 17.126, "eval_steps_per_second": 4.281, "step": 84000 }, { "epoch": 0.42, "learning_rate": 0.00023642381098929924, "loss": 0.0194, "step": 84010 }, { "epoch": 0.42, "learning_rate": 0.00023641624329628525, "loss": 0.0205, "step": 84020 }, { "epoch": 0.42, "learning_rate": 0.00023640867560327123, "loss": 0.0171, "step": 84030 }, { "epoch": 0.42, "learning_rate": 0.00023640110791025722, "loss": 0.0153, "step": 84040 }, { "epoch": 0.42, "learning_rate": 0.00023639354021724322, "loss": 0.0116, "step": 84050 }, { "epoch": 0.42, "learning_rate": 0.0002363859725242292, "loss": 0.0176, "step": 84060 }, { "epoch": 0.42, "learning_rate": 0.0002363784048312152, "loss": 0.0144, "step": 84070 }, { "epoch": 0.42, "learning_rate": 0.0002363708371382012, "loss": 0.0176, "step": 84080 }, { "epoch": 0.42, "learning_rate": 0.00023636326944518718, "loss": 0.0194, "step": 84090 }, { "epoch": 0.42, "learning_rate": 0.00023635570175217316, "loss": 0.0176, "step": 84100 }, { "epoch": 0.42, "learning_rate": 0.00023634813405915917, "loss": 0.0159, "step": 84110 }, { "epoch": 0.42, "learning_rate": 0.00023634056636614515, "loss": 0.0232, "step": 84120 }, { "epoch": 0.42, "learning_rate": 0.00023633299867313113, "loss": 0.019, "step": 84130 }, { "epoch": 0.42, "learning_rate": 0.00023632543098011714, "loss": 0.0165, "step": 84140 }, { "epoch": 0.42, "learning_rate": 0.00023631786328710312, "loss": 0.0165, "step": 84150 }, { "epoch": 0.42, "learning_rate": 0.0002363102955940891, "loss": 0.0164, "step": 84160 }, { "epoch": 0.42, "learning_rate": 0.00023630272790107508, "loss": 0.0176, "step": 84170 }, { "epoch": 0.42, "learning_rate": 0.0002362951602080611, "loss": 0.0169, "step": 84180 }, { "epoch": 0.42, "learning_rate": 0.00023628759251504707, "loss": 0.015, "step": 84190 }, { "epoch": 0.42, "learning_rate": 0.00023628002482203305, "loss": 0.0201, "step": 84200 }, { "epoch": 0.42, "learning_rate": 0.00023627245712901906, "loss": 0.0176, "step": 84210 }, { "epoch": 0.42, "learning_rate": 0.00023626488943600504, "loss": 0.0152, "step": 84220 }, { "epoch": 0.42, "learning_rate": 0.00023625732174299103, "loss": 0.0144, "step": 84230 }, { "epoch": 0.42, "learning_rate": 0.00023624975404997703, "loss": 0.0189, "step": 84240 }, { "epoch": 0.43, "learning_rate": 0.00023624218635696302, "loss": 0.0212, "step": 84250 }, { "epoch": 0.43, "learning_rate": 0.000236234618663949, "loss": 0.0167, "step": 84260 }, { "epoch": 0.43, "learning_rate": 0.000236227050970935, "loss": 0.0186, "step": 84270 }, { "epoch": 0.43, "learning_rate": 0.000236219483277921, "loss": 0.016, "step": 84280 }, { "epoch": 0.43, "learning_rate": 0.00023621191558490697, "loss": 0.0168, "step": 84290 }, { "epoch": 0.43, "learning_rate": 0.00023620434789189298, "loss": 0.0152, "step": 84300 }, { "epoch": 0.43, "learning_rate": 0.00023619678019887896, "loss": 0.0189, "step": 84310 }, { "epoch": 0.43, "learning_rate": 0.00023618921250586494, "loss": 0.0158, "step": 84320 }, { "epoch": 0.43, "learning_rate": 0.00023618164481285092, "loss": 0.0188, "step": 84330 }, { "epoch": 0.43, "learning_rate": 0.00023617407711983693, "loss": 0.0146, "step": 84340 }, { "epoch": 0.43, "learning_rate": 0.0002361665094268229, "loss": 0.0139, "step": 84350 }, { "epoch": 0.43, "learning_rate": 0.0002361589417338089, "loss": 0.0151, "step": 84360 }, { "epoch": 0.43, "learning_rate": 0.0002361513740407949, "loss": 0.0148, "step": 84370 }, { "epoch": 0.43, "learning_rate": 0.00023614380634778088, "loss": 0.0184, "step": 84380 }, { "epoch": 0.43, "learning_rate": 0.00023613623865476686, "loss": 0.0186, "step": 84390 }, { "epoch": 0.43, "learning_rate": 0.00023612867096175287, "loss": 0.017, "step": 84400 }, { "epoch": 0.43, "learning_rate": 0.00023612110326873885, "loss": 0.0207, "step": 84410 }, { "epoch": 0.43, "learning_rate": 0.00023611353557572484, "loss": 0.018, "step": 84420 }, { "epoch": 0.43, "learning_rate": 0.00023610596788271084, "loss": 0.0179, "step": 84430 }, { "epoch": 0.43, "learning_rate": 0.00023609840018969683, "loss": 0.0189, "step": 84440 }, { "epoch": 0.43, "learning_rate": 0.0002360908324966828, "loss": 0.0164, "step": 84450 }, { "epoch": 0.43, "learning_rate": 0.00023608326480366882, "loss": 0.021, "step": 84460 }, { "epoch": 0.43, "learning_rate": 0.0002360756971106548, "loss": 0.0167, "step": 84470 }, { "epoch": 0.43, "learning_rate": 0.00023606812941764078, "loss": 0.0172, "step": 84480 }, { "epoch": 0.43, "learning_rate": 0.00023606056172462676, "loss": 0.0172, "step": 84490 }, { "epoch": 0.43, "learning_rate": 0.00023605299403161277, "loss": 0.0175, "step": 84500 }, { "epoch": 0.43, "learning_rate": 0.00023604542633859875, "loss": 0.0187, "step": 84510 }, { "epoch": 0.43, "learning_rate": 0.00023603785864558473, "loss": 0.015, "step": 84520 }, { "epoch": 0.43, "learning_rate": 0.00023603029095257074, "loss": 0.0154, "step": 84530 }, { "epoch": 0.43, "learning_rate": 0.00023602272325955672, "loss": 0.0154, "step": 84540 }, { "epoch": 0.43, "learning_rate": 0.0002360151555665427, "loss": 0.0156, "step": 84550 }, { "epoch": 0.43, "learning_rate": 0.0002360075878735287, "loss": 0.0186, "step": 84560 }, { "epoch": 0.43, "learning_rate": 0.0002360000201805147, "loss": 0.0154, "step": 84570 }, { "epoch": 0.43, "learning_rate": 0.00023599245248750067, "loss": 0.0162, "step": 84580 }, { "epoch": 0.43, "learning_rate": 0.00023598488479448668, "loss": 0.0142, "step": 84590 }, { "epoch": 0.43, "learning_rate": 0.00023597731710147266, "loss": 0.0206, "step": 84600 }, { "epoch": 0.43, "learning_rate": 0.00023596974940845865, "loss": 0.0174, "step": 84610 }, { "epoch": 0.43, "learning_rate": 0.00023596218171544465, "loss": 0.0177, "step": 84620 }, { "epoch": 0.43, "learning_rate": 0.00023595461402243064, "loss": 0.0167, "step": 84630 }, { "epoch": 0.43, "learning_rate": 0.00023594704632941662, "loss": 0.017, "step": 84640 }, { "epoch": 0.43, "learning_rate": 0.00023593947863640263, "loss": 0.0201, "step": 84650 }, { "epoch": 0.43, "learning_rate": 0.0002359319109433886, "loss": 0.0167, "step": 84660 }, { "epoch": 0.43, "learning_rate": 0.0002359243432503746, "loss": 0.018, "step": 84670 }, { "epoch": 0.43, "learning_rate": 0.00023591677555736057, "loss": 0.0173, "step": 84680 }, { "epoch": 0.43, "learning_rate": 0.00023590920786434658, "loss": 0.0158, "step": 84690 }, { "epoch": 0.43, "learning_rate": 0.00023590164017133256, "loss": 0.0185, "step": 84700 }, { "epoch": 0.43, "learning_rate": 0.00023589407247831854, "loss": 0.0172, "step": 84710 }, { "epoch": 0.43, "learning_rate": 0.00023588650478530455, "loss": 0.0194, "step": 84720 }, { "epoch": 0.43, "learning_rate": 0.00023587893709229053, "loss": 0.0151, "step": 84730 }, { "epoch": 0.43, "learning_rate": 0.0002358713693992765, "loss": 0.0136, "step": 84740 }, { "epoch": 0.43, "learning_rate": 0.00023586380170626252, "loss": 0.015, "step": 84750 }, { "epoch": 0.43, "learning_rate": 0.0002358562340132485, "loss": 0.0193, "step": 84760 }, { "epoch": 0.43, "learning_rate": 0.00023584866632023448, "loss": 0.0174, "step": 84770 }, { "epoch": 0.43, "learning_rate": 0.0002358410986272205, "loss": 0.0197, "step": 84780 }, { "epoch": 0.43, "learning_rate": 0.00023583353093420647, "loss": 0.0195, "step": 84790 }, { "epoch": 0.43, "learning_rate": 0.00023582596324119246, "loss": 0.0194, "step": 84800 }, { "epoch": 0.43, "learning_rate": 0.00023581839554817846, "loss": 0.0161, "step": 84810 }, { "epoch": 0.43, "learning_rate": 0.00023581082785516445, "loss": 0.0177, "step": 84820 }, { "epoch": 0.43, "learning_rate": 0.00023580326016215043, "loss": 0.0206, "step": 84830 }, { "epoch": 0.43, "learning_rate": 0.00023579569246913638, "loss": 0.0149, "step": 84840 }, { "epoch": 0.43, "learning_rate": 0.0002357881247761224, "loss": 0.0203, "step": 84850 }, { "epoch": 0.43, "learning_rate": 0.00023578055708310837, "loss": 0.018, "step": 84860 }, { "epoch": 0.43, "learning_rate": 0.00023577298939009435, "loss": 0.0154, "step": 84870 }, { "epoch": 0.43, "learning_rate": 0.00023576542169708033, "loss": 0.0179, "step": 84880 }, { "epoch": 0.43, "learning_rate": 0.00023575785400406634, "loss": 0.0173, "step": 84890 }, { "epoch": 0.43, "learning_rate": 0.00023575028631105232, "loss": 0.0165, "step": 84900 }, { "epoch": 0.43, "learning_rate": 0.0002357427186180383, "loss": 0.0219, "step": 84910 }, { "epoch": 0.43, "learning_rate": 0.00023573515092502431, "loss": 0.0202, "step": 84920 }, { "epoch": 0.43, "learning_rate": 0.0002357275832320103, "loss": 0.0185, "step": 84930 }, { "epoch": 0.43, "learning_rate": 0.00023572001553899628, "loss": 0.0187, "step": 84940 }, { "epoch": 0.43, "learning_rate": 0.00023571244784598229, "loss": 0.0163, "step": 84950 }, { "epoch": 0.43, "learning_rate": 0.00023570488015296827, "loss": 0.0191, "step": 84960 }, { "epoch": 0.43, "learning_rate": 0.00023569731245995425, "loss": 0.0154, "step": 84970 }, { "epoch": 0.43, "learning_rate": 0.00023568974476694026, "loss": 0.0209, "step": 84980 }, { "epoch": 0.43, "learning_rate": 0.00023568217707392624, "loss": 0.0169, "step": 84990 }, { "epoch": 0.43, "learning_rate": 0.00023567460938091222, "loss": 0.014, "step": 85000 }, { "epoch": 0.43, "eval_cer": 0.9145236276900593, "eval_loss": 0.01236006710678339, "eval_runtime": 116.6924, "eval_samples_per_second": 17.139, "eval_steps_per_second": 4.285, "step": 85000 }, { "epoch": 0.43, "learning_rate": 0.00023566704168789823, "loss": 0.0166, "step": 85010 }, { "epoch": 0.43, "learning_rate": 0.0002356594739948842, "loss": 0.0159, "step": 85020 }, { "epoch": 0.43, "learning_rate": 0.0002356519063018702, "loss": 0.0167, "step": 85030 }, { "epoch": 0.43, "learning_rate": 0.0002356443386088562, "loss": 0.0184, "step": 85040 }, { "epoch": 0.43, "learning_rate": 0.00023563677091584218, "loss": 0.0172, "step": 85050 }, { "epoch": 0.43, "learning_rate": 0.00023562920322282816, "loss": 0.0181, "step": 85060 }, { "epoch": 0.43, "learning_rate": 0.00023562163552981414, "loss": 0.0162, "step": 85070 }, { "epoch": 0.43, "learning_rate": 0.00023561406783680015, "loss": 0.0224, "step": 85080 }, { "epoch": 0.43, "learning_rate": 0.00023560650014378613, "loss": 0.0173, "step": 85090 }, { "epoch": 0.43, "learning_rate": 0.00023559893245077212, "loss": 0.0159, "step": 85100 }, { "epoch": 0.43, "learning_rate": 0.00023559136475775812, "loss": 0.017, "step": 85110 }, { "epoch": 0.43, "learning_rate": 0.0002355837970647441, "loss": 0.0232, "step": 85120 }, { "epoch": 0.43, "learning_rate": 0.0002355762293717301, "loss": 0.0168, "step": 85130 }, { "epoch": 0.43, "learning_rate": 0.0002355686616787161, "loss": 0.0187, "step": 85140 }, { "epoch": 0.43, "learning_rate": 0.00023556109398570208, "loss": 0.0213, "step": 85150 }, { "epoch": 0.43, "learning_rate": 0.00023555352629268806, "loss": 0.0174, "step": 85160 }, { "epoch": 0.43, "learning_rate": 0.00023554595859967407, "loss": 0.0183, "step": 85170 }, { "epoch": 0.43, "learning_rate": 0.00023553839090666005, "loss": 0.0219, "step": 85180 }, { "epoch": 0.43, "learning_rate": 0.00023553082321364603, "loss": 0.0171, "step": 85190 }, { "epoch": 0.43, "learning_rate": 0.00023552325552063204, "loss": 0.0119, "step": 85200 }, { "epoch": 0.43, "learning_rate": 0.00023551568782761802, "loss": 0.0162, "step": 85210 }, { "epoch": 0.43, "learning_rate": 0.000235508120134604, "loss": 0.0229, "step": 85220 }, { "epoch": 0.43, "learning_rate": 0.00023550055244158998, "loss": 0.0165, "step": 85230 }, { "epoch": 0.43, "learning_rate": 0.000235492984748576, "loss": 0.0147, "step": 85240 }, { "epoch": 0.43, "learning_rate": 0.00023548541705556197, "loss": 0.0177, "step": 85250 }, { "epoch": 0.43, "learning_rate": 0.00023547784936254795, "loss": 0.0179, "step": 85260 }, { "epoch": 0.43, "learning_rate": 0.00023547028166953396, "loss": 0.0185, "step": 85270 }, { "epoch": 0.43, "learning_rate": 0.00023546271397651994, "loss": 0.0192, "step": 85280 }, { "epoch": 0.43, "learning_rate": 0.00023545514628350593, "loss": 0.0205, "step": 85290 }, { "epoch": 0.43, "learning_rate": 0.00023544757859049193, "loss": 0.0212, "step": 85300 }, { "epoch": 0.43, "learning_rate": 0.00023544001089747792, "loss": 0.0166, "step": 85310 }, { "epoch": 0.43, "learning_rate": 0.0002354324432044639, "loss": 0.016, "step": 85320 }, { "epoch": 0.43, "learning_rate": 0.0002354248755114499, "loss": 0.0301, "step": 85330 }, { "epoch": 0.43, "learning_rate": 0.0002354173078184359, "loss": 0.0199, "step": 85340 }, { "epoch": 0.43, "learning_rate": 0.00023540974012542187, "loss": 0.0149, "step": 85350 }, { "epoch": 0.43, "learning_rate": 0.00023540217243240788, "loss": 0.0169, "step": 85360 }, { "epoch": 0.43, "learning_rate": 0.00023539460473939386, "loss": 0.0229, "step": 85370 }, { "epoch": 0.43, "learning_rate": 0.00023538703704637984, "loss": 0.0135, "step": 85380 }, { "epoch": 0.43, "learning_rate": 0.00023537946935336582, "loss": 0.0181, "step": 85390 }, { "epoch": 0.43, "learning_rate": 0.00023537190166035183, "loss": 0.0173, "step": 85400 }, { "epoch": 0.43, "learning_rate": 0.0002353643339673378, "loss": 0.0154, "step": 85410 }, { "epoch": 0.43, "learning_rate": 0.0002353567662743238, "loss": 0.0192, "step": 85420 }, { "epoch": 0.43, "learning_rate": 0.0002353491985813098, "loss": 0.0172, "step": 85430 }, { "epoch": 0.43, "learning_rate": 0.00023534163088829578, "loss": 0.0134, "step": 85440 }, { "epoch": 0.43, "learning_rate": 0.00023533406319528176, "loss": 0.0162, "step": 85450 }, { "epoch": 0.43, "learning_rate": 0.00023532649550226777, "loss": 0.0139, "step": 85460 }, { "epoch": 0.43, "learning_rate": 0.00023531892780925375, "loss": 0.0175, "step": 85470 }, { "epoch": 0.43, "learning_rate": 0.00023531136011623974, "loss": 0.0146, "step": 85480 }, { "epoch": 0.43, "learning_rate": 0.00023530379242322574, "loss": 0.0171, "step": 85490 }, { "epoch": 0.43, "learning_rate": 0.00023529622473021173, "loss": 0.0172, "step": 85500 }, { "epoch": 0.43, "learning_rate": 0.0002352886570371977, "loss": 0.0191, "step": 85510 }, { "epoch": 0.43, "learning_rate": 0.00023528108934418372, "loss": 0.0164, "step": 85520 }, { "epoch": 0.43, "learning_rate": 0.0002352735216511697, "loss": 0.0168, "step": 85530 }, { "epoch": 0.43, "learning_rate": 0.00023526595395815568, "loss": 0.0165, "step": 85540 }, { "epoch": 0.43, "learning_rate": 0.00023525838626514166, "loss": 0.0168, "step": 85550 }, { "epoch": 0.43, "learning_rate": 0.00023525081857212767, "loss": 0.0123, "step": 85560 }, { "epoch": 0.43, "learning_rate": 0.00023524325087911365, "loss": 0.0198, "step": 85570 }, { "epoch": 0.43, "learning_rate": 0.00023523568318609963, "loss": 0.0272, "step": 85580 }, { "epoch": 0.43, "learning_rate": 0.00023522811549308564, "loss": 0.0184, "step": 85590 }, { "epoch": 0.43, "learning_rate": 0.00023522054780007162, "loss": 0.0179, "step": 85600 }, { "epoch": 0.43, "learning_rate": 0.0002352129801070576, "loss": 0.0159, "step": 85610 }, { "epoch": 0.43, "learning_rate": 0.0002352054124140436, "loss": 0.0219, "step": 85620 }, { "epoch": 0.43, "learning_rate": 0.0002351978447210296, "loss": 0.0174, "step": 85630 }, { "epoch": 0.43, "learning_rate": 0.00023519027702801557, "loss": 0.0162, "step": 85640 }, { "epoch": 0.43, "learning_rate": 0.00023518270933500158, "loss": 0.0184, "step": 85650 }, { "epoch": 0.43, "learning_rate": 0.00023517514164198756, "loss": 0.0149, "step": 85660 }, { "epoch": 0.43, "learning_rate": 0.00023516757394897355, "loss": 0.0168, "step": 85670 }, { "epoch": 0.43, "learning_rate": 0.00023516000625595955, "loss": 0.0165, "step": 85680 }, { "epoch": 0.43, "learning_rate": 0.00023515243856294554, "loss": 0.0194, "step": 85690 }, { "epoch": 0.43, "learning_rate": 0.00023514487086993152, "loss": 0.0115, "step": 85700 }, { "epoch": 0.43, "learning_rate": 0.00023513730317691753, "loss": 0.0178, "step": 85710 }, { "epoch": 0.43, "learning_rate": 0.0002351297354839035, "loss": 0.0152, "step": 85720 }, { "epoch": 0.43, "learning_rate": 0.0002351221677908895, "loss": 0.016, "step": 85730 }, { "epoch": 0.43, "learning_rate": 0.00023511460009787547, "loss": 0.0182, "step": 85740 }, { "epoch": 0.43, "learning_rate": 0.00023510703240486148, "loss": 0.0233, "step": 85750 }, { "epoch": 0.43, "learning_rate": 0.00023509946471184746, "loss": 0.0231, "step": 85760 }, { "epoch": 0.43, "learning_rate": 0.00023509189701883344, "loss": 0.0201, "step": 85770 }, { "epoch": 0.43, "learning_rate": 0.00023508432932581945, "loss": 0.0201, "step": 85780 }, { "epoch": 0.43, "learning_rate": 0.00023507676163280543, "loss": 0.023, "step": 85790 }, { "epoch": 0.43, "learning_rate": 0.0002350691939397914, "loss": 0.0151, "step": 85800 }, { "epoch": 0.43, "learning_rate": 0.00023506162624677742, "loss": 0.023, "step": 85810 }, { "epoch": 0.43, "learning_rate": 0.0002350540585537634, "loss": 0.0161, "step": 85820 }, { "epoch": 0.43, "learning_rate": 0.00023504649086074938, "loss": 0.0202, "step": 85830 }, { "epoch": 0.43, "learning_rate": 0.0002350389231677354, "loss": 0.0151, "step": 85840 }, { "epoch": 0.43, "learning_rate": 0.00023503135547472137, "loss": 0.0163, "step": 85850 }, { "epoch": 0.43, "learning_rate": 0.00023502378778170736, "loss": 0.0139, "step": 85860 }, { "epoch": 0.43, "learning_rate": 0.00023501622008869336, "loss": 0.0157, "step": 85870 }, { "epoch": 0.43, "learning_rate": 0.00023500865239567935, "loss": 0.0173, "step": 85880 }, { "epoch": 0.43, "learning_rate": 0.00023500108470266533, "loss": 0.0174, "step": 85890 }, { "epoch": 0.43, "learning_rate": 0.0002349935170096513, "loss": 0.0166, "step": 85900 }, { "epoch": 0.43, "learning_rate": 0.00023498594931663732, "loss": 0.0237, "step": 85910 }, { "epoch": 0.43, "learning_rate": 0.0002349783816236233, "loss": 0.0184, "step": 85920 }, { "epoch": 0.43, "learning_rate": 0.00023497081393060928, "loss": 0.0186, "step": 85930 }, { "epoch": 0.43, "learning_rate": 0.0002349632462375953, "loss": 0.0175, "step": 85940 }, { "epoch": 0.43, "learning_rate": 0.00023495567854458127, "loss": 0.0183, "step": 85950 }, { "epoch": 0.43, "learning_rate": 0.00023494811085156725, "loss": 0.0169, "step": 85960 }, { "epoch": 0.43, "learning_rate": 0.00023494054315855326, "loss": 0.0143, "step": 85970 }, { "epoch": 0.43, "learning_rate": 0.00023493297546553924, "loss": 0.0171, "step": 85980 }, { "epoch": 0.43, "learning_rate": 0.00023492540777252522, "loss": 0.0171, "step": 85990 }, { "epoch": 0.43, "learning_rate": 0.00023491784007951123, "loss": 0.0186, "step": 86000 }, { "epoch": 0.43, "eval_cer": 0.9144702559031622, "eval_loss": 0.012443006969988346, "eval_runtime": 116.6618, "eval_samples_per_second": 17.144, "eval_steps_per_second": 4.286, "step": 86000 }, { "epoch": 0.43, "learning_rate": 0.0002349102723864972, "loss": 0.016, "step": 86010 }, { "epoch": 0.43, "learning_rate": 0.0002349027046934832, "loss": 0.0165, "step": 86020 }, { "epoch": 0.43, "learning_rate": 0.0002348951370004692, "loss": 0.0162, "step": 86030 }, { "epoch": 0.43, "learning_rate": 0.00023488756930745518, "loss": 0.0176, "step": 86040 }, { "epoch": 0.43, "learning_rate": 0.00023488000161444117, "loss": 0.017, "step": 86050 }, { "epoch": 0.43, "learning_rate": 0.00023487243392142715, "loss": 0.0163, "step": 86060 }, { "epoch": 0.43, "learning_rate": 0.00023486486622841316, "loss": 0.0178, "step": 86070 }, { "epoch": 0.43, "learning_rate": 0.00023485729853539914, "loss": 0.0188, "step": 86080 }, { "epoch": 0.43, "learning_rate": 0.00023484973084238512, "loss": 0.0184, "step": 86090 }, { "epoch": 0.43, "learning_rate": 0.0002348421631493711, "loss": 0.017, "step": 86100 }, { "epoch": 0.43, "learning_rate": 0.00023483459545635708, "loss": 0.0166, "step": 86110 }, { "epoch": 0.43, "learning_rate": 0.00023482702776334306, "loss": 0.0151, "step": 86120 }, { "epoch": 0.43, "learning_rate": 0.00023481946007032904, "loss": 0.0159, "step": 86130 }, { "epoch": 0.43, "learning_rate": 0.00023481189237731505, "loss": 0.0159, "step": 86140 }, { "epoch": 0.43, "learning_rate": 0.00023480432468430103, "loss": 0.021, "step": 86150 }, { "epoch": 0.43, "learning_rate": 0.00023479675699128702, "loss": 0.0153, "step": 86160 }, { "epoch": 0.43, "learning_rate": 0.00023478918929827302, "loss": 0.0155, "step": 86170 }, { "epoch": 0.43, "learning_rate": 0.000234781621605259, "loss": 0.016, "step": 86180 }, { "epoch": 0.43, "learning_rate": 0.000234774053912245, "loss": 0.0188, "step": 86190 }, { "epoch": 0.43, "learning_rate": 0.000234766486219231, "loss": 0.0251, "step": 86200 }, { "epoch": 0.43, "learning_rate": 0.00023475891852621698, "loss": 0.0162, "step": 86210 }, { "epoch": 0.43, "learning_rate": 0.00023475135083320296, "loss": 0.0194, "step": 86220 }, { "epoch": 0.44, "learning_rate": 0.00023474378314018897, "loss": 0.0236, "step": 86230 }, { "epoch": 0.44, "learning_rate": 0.00023473621544717495, "loss": 0.0163, "step": 86240 }, { "epoch": 0.44, "learning_rate": 0.00023472864775416093, "loss": 0.0151, "step": 86250 }, { "epoch": 0.44, "learning_rate": 0.00023472108006114694, "loss": 0.0137, "step": 86260 }, { "epoch": 0.44, "learning_rate": 0.00023471351236813292, "loss": 0.0157, "step": 86270 }, { "epoch": 0.44, "learning_rate": 0.0002347059446751189, "loss": 0.0172, "step": 86280 }, { "epoch": 0.44, "learning_rate": 0.00023469837698210488, "loss": 0.0181, "step": 86290 }, { "epoch": 0.44, "learning_rate": 0.0002346908092890909, "loss": 0.0163, "step": 86300 }, { "epoch": 0.44, "learning_rate": 0.00023468324159607687, "loss": 0.0136, "step": 86310 }, { "epoch": 0.44, "learning_rate": 0.00023467567390306285, "loss": 0.016, "step": 86320 }, { "epoch": 0.44, "learning_rate": 0.00023466810621004886, "loss": 0.0142, "step": 86330 }, { "epoch": 0.44, "learning_rate": 0.00023466053851703484, "loss": 0.0193, "step": 86340 }, { "epoch": 0.44, "learning_rate": 0.00023465297082402083, "loss": 0.0159, "step": 86350 }, { "epoch": 0.44, "learning_rate": 0.00023464540313100683, "loss": 0.0158, "step": 86360 }, { "epoch": 0.44, "learning_rate": 0.00023463783543799282, "loss": 0.0161, "step": 86370 }, { "epoch": 0.44, "learning_rate": 0.0002346302677449788, "loss": 0.014, "step": 86380 }, { "epoch": 0.44, "learning_rate": 0.0002346227000519648, "loss": 0.019, "step": 86390 }, { "epoch": 0.44, "learning_rate": 0.0002346151323589508, "loss": 0.019, "step": 86400 }, { "epoch": 0.44, "learning_rate": 0.00023460756466593677, "loss": 0.0165, "step": 86410 }, { "epoch": 0.44, "learning_rate": 0.00023459999697292278, "loss": 0.0169, "step": 86420 }, { "epoch": 0.44, "learning_rate": 0.00023459242927990876, "loss": 0.0149, "step": 86430 }, { "epoch": 0.44, "learning_rate": 0.00023458486158689474, "loss": 0.0163, "step": 86440 }, { "epoch": 0.44, "learning_rate": 0.00023457729389388072, "loss": 0.0152, "step": 86450 }, { "epoch": 0.44, "learning_rate": 0.00023456972620086673, "loss": 0.0161, "step": 86460 }, { "epoch": 0.44, "learning_rate": 0.0002345621585078527, "loss": 0.0149, "step": 86470 }, { "epoch": 0.44, "learning_rate": 0.0002345545908148387, "loss": 0.0228, "step": 86480 }, { "epoch": 0.44, "learning_rate": 0.0002345470231218247, "loss": 0.0214, "step": 86490 }, { "epoch": 0.44, "learning_rate": 0.00023453945542881068, "loss": 0.0142, "step": 86500 }, { "epoch": 0.44, "learning_rate": 0.00023453188773579667, "loss": 0.0158, "step": 86510 }, { "epoch": 0.44, "learning_rate": 0.00023452432004278267, "loss": 0.0293, "step": 86520 }, { "epoch": 0.44, "learning_rate": 0.00023451675234976865, "loss": 0.0173, "step": 86530 }, { "epoch": 0.44, "learning_rate": 0.00023450918465675464, "loss": 0.0191, "step": 86540 }, { "epoch": 0.44, "learning_rate": 0.00023450161696374064, "loss": 0.015, "step": 86550 }, { "epoch": 0.44, "learning_rate": 0.00023449404927072663, "loss": 0.02, "step": 86560 }, { "epoch": 0.44, "learning_rate": 0.0002344864815777126, "loss": 0.0195, "step": 86570 }, { "epoch": 0.44, "learning_rate": 0.00023447891388469862, "loss": 0.0164, "step": 86580 }, { "epoch": 0.44, "learning_rate": 0.0002344713461916846, "loss": 0.0173, "step": 86590 }, { "epoch": 0.44, "learning_rate": 0.00023446377849867058, "loss": 0.0151, "step": 86600 }, { "epoch": 0.44, "learning_rate": 0.0002344562108056566, "loss": 0.0161, "step": 86610 }, { "epoch": 0.44, "learning_rate": 0.00023444864311264257, "loss": 0.0179, "step": 86620 }, { "epoch": 0.44, "learning_rate": 0.00023444107541962855, "loss": 0.0188, "step": 86630 }, { "epoch": 0.44, "learning_rate": 0.00023443350772661453, "loss": 0.0166, "step": 86640 }, { "epoch": 0.44, "learning_rate": 0.00023442594003360054, "loss": 0.0145, "step": 86650 }, { "epoch": 0.44, "learning_rate": 0.00023441837234058652, "loss": 0.0177, "step": 86660 }, { "epoch": 0.44, "learning_rate": 0.0002344108046475725, "loss": 0.0158, "step": 86670 }, { "epoch": 0.44, "learning_rate": 0.0002344032369545585, "loss": 0.0177, "step": 86680 }, { "epoch": 0.44, "learning_rate": 0.0002343956692615445, "loss": 0.0147, "step": 86690 }, { "epoch": 0.44, "learning_rate": 0.00023438810156853048, "loss": 0.0143, "step": 86700 }, { "epoch": 0.44, "learning_rate": 0.00023438053387551648, "loss": 0.0138, "step": 86710 }, { "epoch": 0.44, "learning_rate": 0.00023437296618250247, "loss": 0.0211, "step": 86720 }, { "epoch": 0.44, "learning_rate": 0.00023436539848948845, "loss": 0.0192, "step": 86730 }, { "epoch": 0.44, "learning_rate": 0.00023435783079647446, "loss": 0.0151, "step": 86740 }, { "epoch": 0.44, "learning_rate": 0.00023435026310346044, "loss": 0.0171, "step": 86750 }, { "epoch": 0.44, "learning_rate": 0.00023434269541044642, "loss": 0.0155, "step": 86760 }, { "epoch": 0.44, "learning_rate": 0.00023433512771743243, "loss": 0.0193, "step": 86770 }, { "epoch": 0.44, "learning_rate": 0.0002343275600244184, "loss": 0.0165, "step": 86780 }, { "epoch": 0.44, "learning_rate": 0.0002343199923314044, "loss": 0.0176, "step": 86790 }, { "epoch": 0.44, "learning_rate": 0.00023431242463839037, "loss": 0.0166, "step": 86800 }, { "epoch": 0.44, "learning_rate": 0.00023430485694537638, "loss": 0.0178, "step": 86810 }, { "epoch": 0.44, "learning_rate": 0.00023429728925236236, "loss": 0.0171, "step": 86820 }, { "epoch": 0.44, "learning_rate": 0.00023428972155934834, "loss": 0.0147, "step": 86830 }, { "epoch": 0.44, "learning_rate": 0.00023428215386633435, "loss": 0.0191, "step": 86840 }, { "epoch": 0.44, "learning_rate": 0.00023427458617332033, "loss": 0.0196, "step": 86850 }, { "epoch": 0.44, "learning_rate": 0.00023426701848030631, "loss": 0.0203, "step": 86860 }, { "epoch": 0.44, "learning_rate": 0.00023425945078729232, "loss": 0.016, "step": 86870 }, { "epoch": 0.44, "learning_rate": 0.0002342518830942783, "loss": 0.015, "step": 86880 }, { "epoch": 0.44, "learning_rate": 0.00023424431540126429, "loss": 0.0169, "step": 86890 }, { "epoch": 0.44, "learning_rate": 0.0002342367477082503, "loss": 0.0175, "step": 86900 }, { "epoch": 0.44, "learning_rate": 0.00023422918001523628, "loss": 0.0187, "step": 86910 }, { "epoch": 0.44, "learning_rate": 0.00023422161232222226, "loss": 0.0185, "step": 86920 }, { "epoch": 0.44, "learning_rate": 0.00023421404462920827, "loss": 0.0194, "step": 86930 }, { "epoch": 0.44, "learning_rate": 0.00023420647693619425, "loss": 0.0167, "step": 86940 }, { "epoch": 0.44, "learning_rate": 0.00023419890924318023, "loss": 0.0196, "step": 86950 }, { "epoch": 0.44, "learning_rate": 0.0002341913415501662, "loss": 0.0191, "step": 86960 }, { "epoch": 0.44, "learning_rate": 0.00023418377385715222, "loss": 0.0243, "step": 86970 }, { "epoch": 0.44, "learning_rate": 0.0002341762061641382, "loss": 0.0139, "step": 86980 }, { "epoch": 0.44, "learning_rate": 0.00023416863847112418, "loss": 0.0147, "step": 86990 }, { "epoch": 0.44, "learning_rate": 0.0002341610707781102, "loss": 0.0172, "step": 87000 }, { "epoch": 0.44, "eval_cer": 0.9144848118450433, "eval_loss": 0.012073654681444168, "eval_runtime": 116.8061, "eval_samples_per_second": 17.122, "eval_steps_per_second": 4.281, "step": 87000 }, { "epoch": 0.44, "learning_rate": 0.00023415350308509617, "loss": 0.0192, "step": 87010 }, { "epoch": 0.44, "learning_rate": 0.00023414593539208215, "loss": 0.022, "step": 87020 }, { "epoch": 0.44, "learning_rate": 0.00023413836769906816, "loss": 0.0149, "step": 87030 }, { "epoch": 0.44, "learning_rate": 0.00023413080000605414, "loss": 0.0178, "step": 87040 }, { "epoch": 0.44, "learning_rate": 0.00023412323231304012, "loss": 0.0156, "step": 87050 }, { "epoch": 0.44, "learning_rate": 0.00023411566462002613, "loss": 0.0165, "step": 87060 }, { "epoch": 0.44, "learning_rate": 0.00023410809692701211, "loss": 0.0154, "step": 87070 }, { "epoch": 0.44, "learning_rate": 0.0002341005292339981, "loss": 0.0174, "step": 87080 }, { "epoch": 0.44, "learning_rate": 0.0002340929615409841, "loss": 0.0164, "step": 87090 }, { "epoch": 0.44, "learning_rate": 0.00023408539384797009, "loss": 0.024, "step": 87100 }, { "epoch": 0.44, "learning_rate": 0.00023407782615495607, "loss": 0.0189, "step": 87110 }, { "epoch": 0.44, "learning_rate": 0.00023407025846194208, "loss": 0.0173, "step": 87120 }, { "epoch": 0.44, "learning_rate": 0.00023406269076892806, "loss": 0.012, "step": 87130 }, { "epoch": 0.44, "learning_rate": 0.00023405512307591404, "loss": 0.0167, "step": 87140 }, { "epoch": 0.44, "learning_rate": 0.00023404755538290002, "loss": 0.0172, "step": 87150 }, { "epoch": 0.44, "learning_rate": 0.00023403998768988603, "loss": 0.0223, "step": 87160 }, { "epoch": 0.44, "learning_rate": 0.000234032419996872, "loss": 0.0191, "step": 87170 }, { "epoch": 0.44, "learning_rate": 0.000234024852303858, "loss": 0.0192, "step": 87180 }, { "epoch": 0.44, "learning_rate": 0.000234017284610844, "loss": 0.019, "step": 87190 }, { "epoch": 0.44, "learning_rate": 0.00023400971691782998, "loss": 0.0179, "step": 87200 }, { "epoch": 0.44, "learning_rate": 0.00023400214922481596, "loss": 0.0153, "step": 87210 }, { "epoch": 0.44, "learning_rate": 0.00023399458153180197, "loss": 0.02, "step": 87220 }, { "epoch": 0.44, "learning_rate": 0.00023398701383878795, "loss": 0.0151, "step": 87230 }, { "epoch": 0.44, "learning_rate": 0.00023397944614577393, "loss": 0.0207, "step": 87240 }, { "epoch": 0.44, "learning_rate": 0.00023397187845275994, "loss": 0.0176, "step": 87250 }, { "epoch": 0.44, "learning_rate": 0.00023396431075974592, "loss": 0.0173, "step": 87260 }, { "epoch": 0.44, "learning_rate": 0.0002339567430667319, "loss": 0.021, "step": 87270 }, { "epoch": 0.44, "learning_rate": 0.00023394917537371791, "loss": 0.0132, "step": 87280 }, { "epoch": 0.44, "learning_rate": 0.0002339416076807039, "loss": 0.0142, "step": 87290 }, { "epoch": 0.44, "learning_rate": 0.00023393403998768988, "loss": 0.015, "step": 87300 }, { "epoch": 0.44, "learning_rate": 0.00023392647229467586, "loss": 0.0171, "step": 87310 }, { "epoch": 0.44, "learning_rate": 0.00023391890460166187, "loss": 0.0159, "step": 87320 }, { "epoch": 0.44, "learning_rate": 0.00023391133690864785, "loss": 0.0182, "step": 87330 }, { "epoch": 0.44, "learning_rate": 0.00023390376921563383, "loss": 0.0198, "step": 87340 }, { "epoch": 0.44, "learning_rate": 0.00023389620152261984, "loss": 0.0191, "step": 87350 }, { "epoch": 0.44, "learning_rate": 0.0002338886338296058, "loss": 0.0222, "step": 87360 }, { "epoch": 0.44, "learning_rate": 0.00023388106613659177, "loss": 0.016, "step": 87370 }, { "epoch": 0.44, "learning_rate": 0.00023387349844357776, "loss": 0.0142, "step": 87380 }, { "epoch": 0.44, "learning_rate": 0.00023386593075056376, "loss": 0.0169, "step": 87390 }, { "epoch": 0.44, "learning_rate": 0.00023385836305754975, "loss": 0.0189, "step": 87400 }, { "epoch": 0.44, "learning_rate": 0.00023385079536453573, "loss": 0.016, "step": 87410 }, { "epoch": 0.44, "learning_rate": 0.00023384322767152174, "loss": 0.0152, "step": 87420 }, { "epoch": 0.44, "learning_rate": 0.00023383565997850772, "loss": 0.0168, "step": 87430 }, { "epoch": 0.44, "learning_rate": 0.0002338280922854937, "loss": 0.0142, "step": 87440 }, { "epoch": 0.44, "learning_rate": 0.0002338205245924797, "loss": 0.0186, "step": 87450 }, { "epoch": 0.44, "learning_rate": 0.0002338129568994657, "loss": 0.0179, "step": 87460 }, { "epoch": 0.44, "learning_rate": 0.00023380538920645167, "loss": 0.0174, "step": 87470 }, { "epoch": 0.44, "learning_rate": 0.00023379782151343768, "loss": 0.0149, "step": 87480 }, { "epoch": 0.44, "learning_rate": 0.00023379025382042366, "loss": 0.0194, "step": 87490 }, { "epoch": 0.44, "learning_rate": 0.00023378268612740964, "loss": 0.0167, "step": 87500 }, { "epoch": 0.44, "learning_rate": 0.00023377511843439565, "loss": 0.0138, "step": 87510 }, { "epoch": 0.44, "learning_rate": 0.00023376755074138163, "loss": 0.0171, "step": 87520 }, { "epoch": 0.44, "learning_rate": 0.0002337599830483676, "loss": 0.0178, "step": 87530 }, { "epoch": 0.44, "learning_rate": 0.0002337524153553536, "loss": 0.0156, "step": 87540 }, { "epoch": 0.44, "learning_rate": 0.0002337448476623396, "loss": 0.0217, "step": 87550 }, { "epoch": 0.44, "learning_rate": 0.00023373727996932558, "loss": 0.0163, "step": 87560 }, { "epoch": 0.44, "learning_rate": 0.00023372971227631157, "loss": 0.0169, "step": 87570 }, { "epoch": 0.44, "learning_rate": 0.00023372214458329757, "loss": 0.02, "step": 87580 }, { "epoch": 0.44, "learning_rate": 0.00023371457689028356, "loss": 0.0147, "step": 87590 }, { "epoch": 0.44, "learning_rate": 0.00023370700919726954, "loss": 0.0192, "step": 87600 }, { "epoch": 0.44, "learning_rate": 0.00023369944150425555, "loss": 0.0147, "step": 87610 }, { "epoch": 0.44, "learning_rate": 0.00023369187381124153, "loss": 0.0226, "step": 87620 }, { "epoch": 0.44, "learning_rate": 0.0002336843061182275, "loss": 0.0209, "step": 87630 }, { "epoch": 0.44, "learning_rate": 0.00023367673842521352, "loss": 0.0165, "step": 87640 }, { "epoch": 0.44, "learning_rate": 0.0002336691707321995, "loss": 0.0218, "step": 87650 }, { "epoch": 0.44, "learning_rate": 0.00023366160303918548, "loss": 0.0169, "step": 87660 }, { "epoch": 0.44, "learning_rate": 0.0002336540353461715, "loss": 0.0139, "step": 87670 }, { "epoch": 0.44, "learning_rate": 0.00023364646765315747, "loss": 0.0148, "step": 87680 }, { "epoch": 0.44, "learning_rate": 0.00023363889996014345, "loss": 0.0142, "step": 87690 }, { "epoch": 0.44, "learning_rate": 0.00023363133226712943, "loss": 0.0135, "step": 87700 }, { "epoch": 0.44, "learning_rate": 0.00023362376457411544, "loss": 0.0161, "step": 87710 }, { "epoch": 0.44, "learning_rate": 0.00023361619688110142, "loss": 0.0164, "step": 87720 }, { "epoch": 0.44, "learning_rate": 0.0002336086291880874, "loss": 0.0183, "step": 87730 }, { "epoch": 0.44, "learning_rate": 0.0002336010614950734, "loss": 0.0213, "step": 87740 }, { "epoch": 0.44, "learning_rate": 0.0002335934938020594, "loss": 0.0156, "step": 87750 }, { "epoch": 0.44, "learning_rate": 0.00023358592610904538, "loss": 0.0202, "step": 87760 }, { "epoch": 0.44, "learning_rate": 0.00023357835841603138, "loss": 0.0174, "step": 87770 }, { "epoch": 0.44, "learning_rate": 0.00023357079072301737, "loss": 0.0167, "step": 87780 }, { "epoch": 0.44, "learning_rate": 0.00023356322303000335, "loss": 0.0173, "step": 87790 }, { "epoch": 0.44, "learning_rate": 0.00023355565533698936, "loss": 0.0182, "step": 87800 }, { "epoch": 0.44, "learning_rate": 0.00023354808764397534, "loss": 0.0163, "step": 87810 }, { "epoch": 0.44, "learning_rate": 0.00023354051995096132, "loss": 0.017, "step": 87820 }, { "epoch": 0.44, "learning_rate": 0.00023353295225794733, "loss": 0.0153, "step": 87830 }, { "epoch": 0.44, "learning_rate": 0.0002335253845649333, "loss": 0.0165, "step": 87840 }, { "epoch": 0.44, "learning_rate": 0.0002335178168719193, "loss": 0.0151, "step": 87850 }, { "epoch": 0.44, "learning_rate": 0.00023351024917890527, "loss": 0.0186, "step": 87860 }, { "epoch": 0.44, "learning_rate": 0.00023350268148589128, "loss": 0.016, "step": 87870 }, { "epoch": 0.44, "learning_rate": 0.00023349511379287726, "loss": 0.016, "step": 87880 }, { "epoch": 0.44, "learning_rate": 0.00023348754609986324, "loss": 0.0159, "step": 87890 }, { "epoch": 0.44, "learning_rate": 0.00023347997840684925, "loss": 0.0171, "step": 87900 }, { "epoch": 0.44, "learning_rate": 0.00023347241071383523, "loss": 0.0177, "step": 87910 }, { "epoch": 0.44, "learning_rate": 0.00023346484302082121, "loss": 0.0154, "step": 87920 }, { "epoch": 0.44, "learning_rate": 0.00023345727532780722, "loss": 0.0172, "step": 87930 }, { "epoch": 0.44, "learning_rate": 0.0002334497076347932, "loss": 0.0172, "step": 87940 }, { "epoch": 0.44, "learning_rate": 0.00023344213994177919, "loss": 0.0157, "step": 87950 }, { "epoch": 0.44, "learning_rate": 0.0002334345722487652, "loss": 0.0148, "step": 87960 }, { "epoch": 0.44, "learning_rate": 0.00023342700455575118, "loss": 0.0168, "step": 87970 }, { "epoch": 0.44, "learning_rate": 0.00023341943686273716, "loss": 0.0173, "step": 87980 }, { "epoch": 0.44, "learning_rate": 0.00023341186916972317, "loss": 0.0205, "step": 87990 }, { "epoch": 0.44, "learning_rate": 0.00023340430147670915, "loss": 0.019, "step": 88000 }, { "epoch": 0.44, "eval_cer": 0.9145042197675514, "eval_loss": 0.011925076134502888, "eval_runtime": 116.6489, "eval_samples_per_second": 17.145, "eval_steps_per_second": 4.286, "step": 88000 }, { "epoch": 0.44, "learning_rate": 0.00023339673378369513, "loss": 0.0132, "step": 88010 }, { "epoch": 0.44, "learning_rate": 0.00023338916609068114, "loss": 0.0178, "step": 88020 }, { "epoch": 0.44, "learning_rate": 0.00023338159839766712, "loss": 0.0176, "step": 88030 }, { "epoch": 0.44, "learning_rate": 0.0002333740307046531, "loss": 0.0148, "step": 88040 }, { "epoch": 0.44, "learning_rate": 0.00023336646301163908, "loss": 0.0163, "step": 88050 }, { "epoch": 0.44, "learning_rate": 0.0002333588953186251, "loss": 0.0156, "step": 88060 }, { "epoch": 0.44, "learning_rate": 0.00023335132762561107, "loss": 0.0207, "step": 88070 }, { "epoch": 0.44, "learning_rate": 0.00023334375993259705, "loss": 0.0164, "step": 88080 }, { "epoch": 0.44, "learning_rate": 0.00023333619223958306, "loss": 0.0148, "step": 88090 }, { "epoch": 0.44, "learning_rate": 0.00023332862454656904, "loss": 0.0157, "step": 88100 }, { "epoch": 0.44, "learning_rate": 0.00023332105685355502, "loss": 0.0205, "step": 88110 }, { "epoch": 0.44, "learning_rate": 0.00023331348916054103, "loss": 0.0174, "step": 88120 }, { "epoch": 0.44, "learning_rate": 0.00023330592146752701, "loss": 0.0187, "step": 88130 }, { "epoch": 0.44, "learning_rate": 0.000233298353774513, "loss": 0.0189, "step": 88140 }, { "epoch": 0.44, "learning_rate": 0.000233290786081499, "loss": 0.0156, "step": 88150 }, { "epoch": 0.44, "learning_rate": 0.00023328321838848499, "loss": 0.0185, "step": 88160 }, { "epoch": 0.44, "learning_rate": 0.00023327565069547097, "loss": 0.0164, "step": 88170 }, { "epoch": 0.44, "learning_rate": 0.00023326808300245698, "loss": 0.0176, "step": 88180 }, { "epoch": 0.44, "learning_rate": 0.00023326051530944296, "loss": 0.0132, "step": 88190 }, { "epoch": 0.44, "learning_rate": 0.00023325294761642894, "loss": 0.016, "step": 88200 }, { "epoch": 0.45, "learning_rate": 0.00023324537992341492, "loss": 0.0175, "step": 88210 }, { "epoch": 0.45, "learning_rate": 0.00023323781223040093, "loss": 0.0136, "step": 88220 }, { "epoch": 0.45, "learning_rate": 0.0002332302445373869, "loss": 0.0161, "step": 88230 }, { "epoch": 0.45, "learning_rate": 0.0002332226768443729, "loss": 0.0184, "step": 88240 }, { "epoch": 0.45, "learning_rate": 0.0002332151091513589, "loss": 0.015, "step": 88250 }, { "epoch": 0.45, "learning_rate": 0.00023320754145834488, "loss": 0.0202, "step": 88260 }, { "epoch": 0.45, "learning_rate": 0.00023319997376533086, "loss": 0.0182, "step": 88270 }, { "epoch": 0.45, "learning_rate": 0.00023319240607231687, "loss": 0.0161, "step": 88280 }, { "epoch": 0.45, "learning_rate": 0.00023318483837930285, "loss": 0.0142, "step": 88290 }, { "epoch": 0.45, "learning_rate": 0.00023317727068628883, "loss": 0.0176, "step": 88300 }, { "epoch": 0.45, "learning_rate": 0.00023316970299327484, "loss": 0.0203, "step": 88310 }, { "epoch": 0.45, "learning_rate": 0.00023316213530026082, "loss": 0.0157, "step": 88320 }, { "epoch": 0.45, "learning_rate": 0.0002331545676072468, "loss": 0.0189, "step": 88330 }, { "epoch": 0.45, "learning_rate": 0.00023314699991423281, "loss": 0.0163, "step": 88340 }, { "epoch": 0.45, "learning_rate": 0.0002331394322212188, "loss": 0.0159, "step": 88350 }, { "epoch": 0.45, "learning_rate": 0.00023313186452820478, "loss": 0.0182, "step": 88360 }, { "epoch": 0.45, "learning_rate": 0.00023312429683519076, "loss": 0.0168, "step": 88370 }, { "epoch": 0.45, "learning_rate": 0.00023311672914217677, "loss": 0.016, "step": 88380 }, { "epoch": 0.45, "learning_rate": 0.00023310916144916275, "loss": 0.0198, "step": 88390 }, { "epoch": 0.45, "learning_rate": 0.00023310159375614873, "loss": 0.018, "step": 88400 }, { "epoch": 0.45, "learning_rate": 0.00023309402606313474, "loss": 0.0168, "step": 88410 }, { "epoch": 0.45, "learning_rate": 0.00023308645837012072, "loss": 0.019, "step": 88420 }, { "epoch": 0.45, "learning_rate": 0.0002330788906771067, "loss": 0.0175, "step": 88430 }, { "epoch": 0.45, "learning_rate": 0.0002330713229840927, "loss": 0.0205, "step": 88440 }, { "epoch": 0.45, "learning_rate": 0.0002330637552910787, "loss": 0.0187, "step": 88450 }, { "epoch": 0.45, "learning_rate": 0.00023305618759806467, "loss": 0.0158, "step": 88460 }, { "epoch": 0.45, "learning_rate": 0.00023304861990505068, "loss": 0.0181, "step": 88470 }, { "epoch": 0.45, "learning_rate": 0.00023304105221203666, "loss": 0.0167, "step": 88480 }, { "epoch": 0.45, "learning_rate": 0.00023303348451902264, "loss": 0.0165, "step": 88490 }, { "epoch": 0.45, "learning_rate": 0.00023302591682600865, "loss": 0.0164, "step": 88500 }, { "epoch": 0.45, "learning_rate": 0.00023301834913299463, "loss": 0.018, "step": 88510 }, { "epoch": 0.45, "learning_rate": 0.00023301078143998062, "loss": 0.0186, "step": 88520 }, { "epoch": 0.45, "learning_rate": 0.00023300321374696662, "loss": 0.0172, "step": 88530 }, { "epoch": 0.45, "learning_rate": 0.0002329956460539526, "loss": 0.0157, "step": 88540 }, { "epoch": 0.45, "learning_rate": 0.0002329880783609386, "loss": 0.0197, "step": 88550 }, { "epoch": 0.45, "learning_rate": 0.00023298051066792457, "loss": 0.017, "step": 88560 }, { "epoch": 0.45, "learning_rate": 0.00023297294297491058, "loss": 0.0136, "step": 88570 }, { "epoch": 0.45, "learning_rate": 0.00023296537528189656, "loss": 0.0144, "step": 88580 }, { "epoch": 0.45, "learning_rate": 0.00023295780758888254, "loss": 0.0136, "step": 88590 }, { "epoch": 0.45, "learning_rate": 0.00023295023989586855, "loss": 0.017, "step": 88600 }, { "epoch": 0.45, "learning_rate": 0.00023294267220285453, "loss": 0.0172, "step": 88610 }, { "epoch": 0.45, "learning_rate": 0.00023293510450984048, "loss": 0.0182, "step": 88620 }, { "epoch": 0.45, "learning_rate": 0.00023292753681682647, "loss": 0.0153, "step": 88630 }, { "epoch": 0.45, "learning_rate": 0.00023291996912381247, "loss": 0.0177, "step": 88640 }, { "epoch": 0.45, "learning_rate": 0.00023291240143079846, "loss": 0.0148, "step": 88650 }, { "epoch": 0.45, "learning_rate": 0.00023290483373778444, "loss": 0.0167, "step": 88660 }, { "epoch": 0.45, "learning_rate": 0.00023289726604477045, "loss": 0.0172, "step": 88670 }, { "epoch": 0.45, "learning_rate": 0.00023288969835175643, "loss": 0.014, "step": 88680 }, { "epoch": 0.45, "learning_rate": 0.0002328821306587424, "loss": 0.0171, "step": 88690 }, { "epoch": 0.45, "learning_rate": 0.00023287456296572842, "loss": 0.0229, "step": 88700 }, { "epoch": 0.45, "learning_rate": 0.0002328669952727144, "loss": 0.0173, "step": 88710 }, { "epoch": 0.45, "learning_rate": 0.00023285942757970038, "loss": 0.0181, "step": 88720 }, { "epoch": 0.45, "learning_rate": 0.0002328518598866864, "loss": 0.0206, "step": 88730 }, { "epoch": 0.45, "learning_rate": 0.00023284429219367237, "loss": 0.0186, "step": 88740 }, { "epoch": 0.45, "learning_rate": 0.00023283672450065835, "loss": 0.014, "step": 88750 }, { "epoch": 0.45, "learning_rate": 0.00023282915680764433, "loss": 0.0172, "step": 88760 }, { "epoch": 0.45, "learning_rate": 0.00023282158911463034, "loss": 0.0184, "step": 88770 }, { "epoch": 0.45, "learning_rate": 0.00023281402142161632, "loss": 0.0158, "step": 88780 }, { "epoch": 0.45, "learning_rate": 0.0002328064537286023, "loss": 0.0191, "step": 88790 }, { "epoch": 0.45, "learning_rate": 0.0002327988860355883, "loss": 0.0208, "step": 88800 }, { "epoch": 0.45, "learning_rate": 0.0002327913183425743, "loss": 0.0166, "step": 88810 }, { "epoch": 0.45, "learning_rate": 0.00023278375064956028, "loss": 0.0134, "step": 88820 }, { "epoch": 0.45, "learning_rate": 0.00023277618295654628, "loss": 0.0185, "step": 88830 }, { "epoch": 0.45, "learning_rate": 0.00023276861526353227, "loss": 0.0174, "step": 88840 }, { "epoch": 0.45, "learning_rate": 0.00023276104757051825, "loss": 0.0149, "step": 88850 }, { "epoch": 0.45, "learning_rate": 0.00023275347987750426, "loss": 0.0165, "step": 88860 }, { "epoch": 0.45, "learning_rate": 0.00023274591218449024, "loss": 0.0163, "step": 88870 }, { "epoch": 0.45, "learning_rate": 0.00023273834449147622, "loss": 0.0157, "step": 88880 }, { "epoch": 0.45, "learning_rate": 0.00023273077679846223, "loss": 0.0165, "step": 88890 }, { "epoch": 0.45, "learning_rate": 0.0002327232091054482, "loss": 0.0216, "step": 88900 }, { "epoch": 0.45, "learning_rate": 0.0002327156414124342, "loss": 0.0164, "step": 88910 }, { "epoch": 0.45, "learning_rate": 0.0002327080737194202, "loss": 0.0183, "step": 88920 }, { "epoch": 0.45, "learning_rate": 0.00023270050602640618, "loss": 0.0163, "step": 88930 }, { "epoch": 0.45, "learning_rate": 0.00023269293833339216, "loss": 0.0175, "step": 88940 }, { "epoch": 0.45, "learning_rate": 0.00023268537064037814, "loss": 0.023, "step": 88950 }, { "epoch": 0.45, "learning_rate": 0.00023267780294736415, "loss": 0.0185, "step": 88960 }, { "epoch": 0.45, "learning_rate": 0.00023267023525435013, "loss": 0.0168, "step": 88970 }, { "epoch": 0.45, "learning_rate": 0.00023266266756133611, "loss": 0.0144, "step": 88980 }, { "epoch": 0.45, "learning_rate": 0.00023265509986832212, "loss": 0.0162, "step": 88990 }, { "epoch": 0.45, "learning_rate": 0.0002326475321753081, "loss": 0.0146, "step": 89000 }, { "epoch": 0.45, "eval_cer": 0.9144906342217957, "eval_loss": 0.01203860528767109, "eval_runtime": 116.6624, "eval_samples_per_second": 17.143, "eval_steps_per_second": 4.286, "step": 89000 }, { "epoch": 0.45, "learning_rate": 0.00023263996448229409, "loss": 0.0206, "step": 89010 }, { "epoch": 0.45, "learning_rate": 0.0002326323967892801, "loss": 0.0151, "step": 89020 }, { "epoch": 0.45, "learning_rate": 0.00023262482909626608, "loss": 0.0156, "step": 89030 }, { "epoch": 0.45, "learning_rate": 0.00023261726140325206, "loss": 0.0193, "step": 89040 }, { "epoch": 0.45, "learning_rate": 0.00023260969371023807, "loss": 0.0177, "step": 89050 }, { "epoch": 0.45, "learning_rate": 0.00023260212601722405, "loss": 0.0126, "step": 89060 }, { "epoch": 0.45, "learning_rate": 0.00023259455832421003, "loss": 0.0178, "step": 89070 }, { "epoch": 0.45, "learning_rate": 0.00023258699063119604, "loss": 0.0148, "step": 89080 }, { "epoch": 0.45, "learning_rate": 0.00023257942293818202, "loss": 0.0187, "step": 89090 }, { "epoch": 0.45, "learning_rate": 0.000232571855245168, "loss": 0.0183, "step": 89100 }, { "epoch": 0.45, "learning_rate": 0.00023256428755215398, "loss": 0.0152, "step": 89110 }, { "epoch": 0.45, "learning_rate": 0.00023255671985914, "loss": 0.017, "step": 89120 }, { "epoch": 0.45, "learning_rate": 0.00023254915216612597, "loss": 0.0177, "step": 89130 }, { "epoch": 0.45, "learning_rate": 0.00023254158447311195, "loss": 0.0146, "step": 89140 }, { "epoch": 0.45, "learning_rate": 0.00023253401678009796, "loss": 0.0181, "step": 89150 }, { "epoch": 0.45, "learning_rate": 0.00023252644908708394, "loss": 0.0179, "step": 89160 }, { "epoch": 0.45, "learning_rate": 0.00023251888139406992, "loss": 0.0158, "step": 89170 }, { "epoch": 0.45, "learning_rate": 0.00023251131370105593, "loss": 0.0187, "step": 89180 }, { "epoch": 0.45, "learning_rate": 0.00023250374600804191, "loss": 0.0164, "step": 89190 }, { "epoch": 0.45, "learning_rate": 0.0002324961783150279, "loss": 0.0138, "step": 89200 }, { "epoch": 0.45, "learning_rate": 0.0002324886106220139, "loss": 0.0152, "step": 89210 }, { "epoch": 0.45, "learning_rate": 0.00023248104292899989, "loss": 0.0161, "step": 89220 }, { "epoch": 0.45, "learning_rate": 0.00023247347523598587, "loss": 0.0172, "step": 89230 }, { "epoch": 0.45, "learning_rate": 0.00023246590754297188, "loss": 0.0216, "step": 89240 }, { "epoch": 0.45, "learning_rate": 0.00023245833984995786, "loss": 0.0152, "step": 89250 }, { "epoch": 0.45, "learning_rate": 0.00023245077215694384, "loss": 0.0187, "step": 89260 }, { "epoch": 0.45, "learning_rate": 0.00023244320446392982, "loss": 0.0173, "step": 89270 }, { "epoch": 0.45, "learning_rate": 0.00023243563677091583, "loss": 0.0155, "step": 89280 }, { "epoch": 0.45, "learning_rate": 0.0002324280690779018, "loss": 0.0158, "step": 89290 }, { "epoch": 0.45, "learning_rate": 0.0002324205013848878, "loss": 0.0177, "step": 89300 }, { "epoch": 0.45, "learning_rate": 0.0002324129336918738, "loss": 0.0223, "step": 89310 }, { "epoch": 0.45, "learning_rate": 0.00023240536599885978, "loss": 0.0172, "step": 89320 }, { "epoch": 0.45, "learning_rate": 0.00023239779830584576, "loss": 0.0197, "step": 89330 }, { "epoch": 0.45, "learning_rate": 0.00023239023061283177, "loss": 0.0157, "step": 89340 }, { "epoch": 0.45, "learning_rate": 0.00023238266291981775, "loss": 0.0156, "step": 89350 }, { "epoch": 0.45, "learning_rate": 0.00023237509522680373, "loss": 0.0146, "step": 89360 }, { "epoch": 0.45, "learning_rate": 0.00023236752753378974, "loss": 0.0138, "step": 89370 }, { "epoch": 0.45, "learning_rate": 0.00023235995984077572, "loss": 0.0142, "step": 89380 }, { "epoch": 0.45, "learning_rate": 0.0002323523921477617, "loss": 0.0192, "step": 89390 }, { "epoch": 0.45, "learning_rate": 0.00023234482445474771, "loss": 0.0189, "step": 89400 }, { "epoch": 0.45, "learning_rate": 0.0002323372567617337, "loss": 0.0165, "step": 89410 }, { "epoch": 0.45, "learning_rate": 0.00023232968906871968, "loss": 0.016, "step": 89420 }, { "epoch": 0.45, "learning_rate": 0.00023232212137570566, "loss": 0.0171, "step": 89430 }, { "epoch": 0.45, "learning_rate": 0.00023231455368269167, "loss": 0.0133, "step": 89440 }, { "epoch": 0.45, "learning_rate": 0.00023230698598967765, "loss": 0.0127, "step": 89450 }, { "epoch": 0.45, "learning_rate": 0.00023229941829666363, "loss": 0.0155, "step": 89460 }, { "epoch": 0.45, "learning_rate": 0.00023229185060364964, "loss": 0.017, "step": 89470 }, { "epoch": 0.45, "learning_rate": 0.00023228428291063562, "loss": 0.0136, "step": 89480 }, { "epoch": 0.45, "learning_rate": 0.0002322767152176216, "loss": 0.018, "step": 89490 }, { "epoch": 0.45, "learning_rate": 0.0002322691475246076, "loss": 0.0151, "step": 89500 }, { "epoch": 0.45, "learning_rate": 0.0002322615798315936, "loss": 0.0158, "step": 89510 }, { "epoch": 0.45, "learning_rate": 0.00023225401213857957, "loss": 0.0214, "step": 89520 }, { "epoch": 0.45, "learning_rate": 0.00023224644444556558, "loss": 0.0207, "step": 89530 }, { "epoch": 0.45, "learning_rate": 0.00023223887675255156, "loss": 0.0157, "step": 89540 }, { "epoch": 0.45, "learning_rate": 0.00023223130905953754, "loss": 0.018, "step": 89550 }, { "epoch": 0.45, "learning_rate": 0.00023222374136652355, "loss": 0.0153, "step": 89560 }, { "epoch": 0.45, "learning_rate": 0.00023221617367350953, "loss": 0.0168, "step": 89570 }, { "epoch": 0.45, "learning_rate": 0.00023220860598049552, "loss": 0.0153, "step": 89580 }, { "epoch": 0.45, "learning_rate": 0.00023220103828748152, "loss": 0.0172, "step": 89590 }, { "epoch": 0.45, "learning_rate": 0.0002321934705944675, "loss": 0.0229, "step": 89600 }, { "epoch": 0.45, "learning_rate": 0.0002321859029014535, "loss": 0.0186, "step": 89610 }, { "epoch": 0.45, "learning_rate": 0.00023217833520843947, "loss": 0.0167, "step": 89620 }, { "epoch": 0.45, "learning_rate": 0.00023217076751542548, "loss": 0.0154, "step": 89630 }, { "epoch": 0.45, "learning_rate": 0.00023216319982241146, "loss": 0.0152, "step": 89640 }, { "epoch": 0.45, "learning_rate": 0.00023215563212939744, "loss": 0.0156, "step": 89650 }, { "epoch": 0.45, "learning_rate": 0.00023214806443638345, "loss": 0.0174, "step": 89660 }, { "epoch": 0.45, "learning_rate": 0.00023214049674336943, "loss": 0.0186, "step": 89670 }, { "epoch": 0.45, "learning_rate": 0.0002321329290503554, "loss": 0.0169, "step": 89680 }, { "epoch": 0.45, "learning_rate": 0.00023212536135734142, "loss": 0.0139, "step": 89690 }, { "epoch": 0.45, "learning_rate": 0.0002321177936643274, "loss": 0.0133, "step": 89700 }, { "epoch": 0.45, "learning_rate": 0.00023211022597131338, "loss": 0.0133, "step": 89710 }, { "epoch": 0.45, "learning_rate": 0.0002321026582782994, "loss": 0.0154, "step": 89720 }, { "epoch": 0.45, "learning_rate": 0.00023209509058528537, "loss": 0.0154, "step": 89730 }, { "epoch": 0.45, "learning_rate": 0.00023208752289227135, "loss": 0.0176, "step": 89740 }, { "epoch": 0.45, "learning_rate": 0.00023207995519925736, "loss": 0.0167, "step": 89750 }, { "epoch": 0.45, "learning_rate": 0.00023207238750624334, "loss": 0.0197, "step": 89760 }, { "epoch": 0.45, "learning_rate": 0.00023206481981322933, "loss": 0.0126, "step": 89770 }, { "epoch": 0.45, "learning_rate": 0.0002320572521202153, "loss": 0.0146, "step": 89780 }, { "epoch": 0.45, "learning_rate": 0.00023204968442720132, "loss": 0.0126, "step": 89790 }, { "epoch": 0.45, "learning_rate": 0.0002320421167341873, "loss": 0.0174, "step": 89800 }, { "epoch": 0.45, "learning_rate": 0.00023203454904117328, "loss": 0.0147, "step": 89810 }, { "epoch": 0.45, "learning_rate": 0.0002320269813481593, "loss": 0.0167, "step": 89820 }, { "epoch": 0.45, "learning_rate": 0.00023201941365514527, "loss": 0.0202, "step": 89830 }, { "epoch": 0.45, "learning_rate": 0.00023201184596213125, "loss": 0.0135, "step": 89840 }, { "epoch": 0.45, "learning_rate": 0.00023200427826911726, "loss": 0.0138, "step": 89850 }, { "epoch": 0.45, "learning_rate": 0.00023199671057610324, "loss": 0.0158, "step": 89860 }, { "epoch": 0.45, "learning_rate": 0.0002319891428830892, "loss": 0.015, "step": 89870 }, { "epoch": 0.45, "learning_rate": 0.00023198157519007518, "loss": 0.0149, "step": 89880 }, { "epoch": 0.45, "learning_rate": 0.00023197400749706118, "loss": 0.0162, "step": 89890 }, { "epoch": 0.45, "learning_rate": 0.00023196643980404717, "loss": 0.0156, "step": 89900 }, { "epoch": 0.45, "learning_rate": 0.00023195887211103315, "loss": 0.0146, "step": 89910 }, { "epoch": 0.45, "learning_rate": 0.00023195130441801916, "loss": 0.0142, "step": 89920 }, { "epoch": 0.45, "learning_rate": 0.00023194373672500514, "loss": 0.0144, "step": 89930 }, { "epoch": 0.45, "learning_rate": 0.00023193616903199112, "loss": 0.0159, "step": 89940 }, { "epoch": 0.45, "learning_rate": 0.00023192860133897713, "loss": 0.0333, "step": 89950 }, { "epoch": 0.45, "learning_rate": 0.0002319210336459631, "loss": 0.0643, "step": 89960 }, { "epoch": 0.45, "learning_rate": 0.0002319134659529491, "loss": 0.0249, "step": 89970 }, { "epoch": 0.45, "learning_rate": 0.0002319058982599351, "loss": 0.0134, "step": 89980 }, { "epoch": 0.45, "learning_rate": 0.00023189833056692108, "loss": 0.0211, "step": 89990 }, { "epoch": 0.45, "learning_rate": 0.00023189076287390706, "loss": 0.0173, "step": 90000 }, { "epoch": 0.45, "eval_cer": 0.9144983973907989, "eval_loss": 0.0122450590133667, "eval_runtime": 116.807, "eval_samples_per_second": 17.122, "eval_steps_per_second": 4.281, "step": 90000 }, { "epoch": 0.45, "learning_rate": 0.00023188319518089304, "loss": 0.0216, "step": 90010 }, { "epoch": 0.45, "learning_rate": 0.00023187562748787905, "loss": 0.0186, "step": 90020 }, { "epoch": 0.45, "learning_rate": 0.00023186805979486503, "loss": 0.0161, "step": 90030 }, { "epoch": 0.45, "learning_rate": 0.00023186049210185101, "loss": 0.0171, "step": 90040 }, { "epoch": 0.45, "learning_rate": 0.00023185292440883702, "loss": 0.0156, "step": 90050 }, { "epoch": 0.45, "learning_rate": 0.000231845356715823, "loss": 0.019, "step": 90060 }, { "epoch": 0.45, "learning_rate": 0.00023183778902280899, "loss": 0.0145, "step": 90070 }, { "epoch": 0.45, "learning_rate": 0.000231830221329795, "loss": 0.0184, "step": 90080 }, { "epoch": 0.45, "learning_rate": 0.00023182265363678098, "loss": 0.0175, "step": 90090 }, { "epoch": 0.45, "learning_rate": 0.00023181508594376696, "loss": 0.0194, "step": 90100 }, { "epoch": 0.45, "learning_rate": 0.00023180751825075297, "loss": 0.0152, "step": 90110 }, { "epoch": 0.45, "learning_rate": 0.00023179995055773895, "loss": 0.0167, "step": 90120 }, { "epoch": 0.45, "learning_rate": 0.00023179238286472493, "loss": 0.0178, "step": 90130 }, { "epoch": 0.45, "learning_rate": 0.00023178481517171094, "loss": 0.017, "step": 90140 }, { "epoch": 0.45, "learning_rate": 0.00023177724747869692, "loss": 0.0173, "step": 90150 }, { "epoch": 0.45, "learning_rate": 0.0002317696797856829, "loss": 0.0188, "step": 90160 }, { "epoch": 0.45, "learning_rate": 0.00023176211209266888, "loss": 0.0174, "step": 90170 }, { "epoch": 0.45, "learning_rate": 0.0002317545443996549, "loss": 0.0222, "step": 90180 }, { "epoch": 0.46, "learning_rate": 0.00023174697670664087, "loss": 0.0157, "step": 90190 }, { "epoch": 0.46, "learning_rate": 0.00023173940901362685, "loss": 0.018, "step": 90200 }, { "epoch": 0.46, "learning_rate": 0.00023173184132061286, "loss": 0.0191, "step": 90210 }, { "epoch": 0.46, "learning_rate": 0.00023172427362759884, "loss": 0.018, "step": 90220 }, { "epoch": 0.46, "learning_rate": 0.00023171670593458482, "loss": 0.0176, "step": 90230 }, { "epoch": 0.46, "learning_rate": 0.00023170913824157083, "loss": 0.0167, "step": 90240 }, { "epoch": 0.46, "learning_rate": 0.00023170157054855681, "loss": 0.0154, "step": 90250 }, { "epoch": 0.46, "learning_rate": 0.0002316940028555428, "loss": 0.0155, "step": 90260 }, { "epoch": 0.46, "learning_rate": 0.0002316864351625288, "loss": 0.0184, "step": 90270 }, { "epoch": 0.46, "learning_rate": 0.00023167886746951479, "loss": 0.019, "step": 90280 }, { "epoch": 0.46, "learning_rate": 0.00023167129977650077, "loss": 0.0158, "step": 90290 }, { "epoch": 0.46, "learning_rate": 0.00023166373208348678, "loss": 0.0136, "step": 90300 }, { "epoch": 0.46, "learning_rate": 0.00023165616439047276, "loss": 0.0182, "step": 90310 }, { "epoch": 0.46, "learning_rate": 0.00023164859669745874, "loss": 0.0154, "step": 90320 }, { "epoch": 0.46, "learning_rate": 0.00023164102900444472, "loss": 0.0161, "step": 90330 }, { "epoch": 0.46, "learning_rate": 0.00023163346131143073, "loss": 0.0169, "step": 90340 }, { "epoch": 0.46, "learning_rate": 0.0002316258936184167, "loss": 0.0159, "step": 90350 }, { "epoch": 0.46, "learning_rate": 0.0002316183259254027, "loss": 0.0181, "step": 90360 }, { "epoch": 0.46, "learning_rate": 0.0002316107582323887, "loss": 0.0152, "step": 90370 }, { "epoch": 0.46, "learning_rate": 0.00023160319053937468, "loss": 0.0189, "step": 90380 }, { "epoch": 0.46, "learning_rate": 0.00023159562284636066, "loss": 0.018, "step": 90390 }, { "epoch": 0.46, "learning_rate": 0.00023158805515334667, "loss": 0.0143, "step": 90400 }, { "epoch": 0.46, "learning_rate": 0.00023158048746033265, "loss": 0.0194, "step": 90410 }, { "epoch": 0.46, "learning_rate": 0.00023157291976731863, "loss": 0.0168, "step": 90420 }, { "epoch": 0.46, "learning_rate": 0.00023156535207430464, "loss": 0.0149, "step": 90430 }, { "epoch": 0.46, "learning_rate": 0.00023155778438129062, "loss": 0.0148, "step": 90440 }, { "epoch": 0.46, "learning_rate": 0.0002315502166882766, "loss": 0.0171, "step": 90450 }, { "epoch": 0.46, "learning_rate": 0.00023154264899526261, "loss": 0.0157, "step": 90460 }, { "epoch": 0.46, "learning_rate": 0.0002315350813022486, "loss": 0.0168, "step": 90470 }, { "epoch": 0.46, "learning_rate": 0.00023152751360923458, "loss": 0.0157, "step": 90480 }, { "epoch": 0.46, "learning_rate": 0.00023151994591622059, "loss": 0.0178, "step": 90490 }, { "epoch": 0.46, "learning_rate": 0.00023151237822320657, "loss": 0.013, "step": 90500 }, { "epoch": 0.46, "learning_rate": 0.00023150481053019255, "loss": 0.0145, "step": 90510 }, { "epoch": 0.46, "learning_rate": 0.00023149724283717853, "loss": 0.0141, "step": 90520 }, { "epoch": 0.46, "learning_rate": 0.00023148967514416454, "loss": 0.0154, "step": 90530 }, { "epoch": 0.46, "learning_rate": 0.00023148210745115052, "loss": 0.0154, "step": 90540 }, { "epoch": 0.46, "learning_rate": 0.0002314745397581365, "loss": 0.0155, "step": 90550 }, { "epoch": 0.46, "learning_rate": 0.0002314669720651225, "loss": 0.0163, "step": 90560 }, { "epoch": 0.46, "learning_rate": 0.0002314594043721085, "loss": 0.0189, "step": 90570 }, { "epoch": 0.46, "learning_rate": 0.00023145183667909447, "loss": 0.014, "step": 90580 }, { "epoch": 0.46, "learning_rate": 0.00023144426898608048, "loss": 0.0141, "step": 90590 }, { "epoch": 0.46, "learning_rate": 0.00023143670129306646, "loss": 0.0144, "step": 90600 }, { "epoch": 0.46, "learning_rate": 0.00023142913360005244, "loss": 0.0135, "step": 90610 }, { "epoch": 0.46, "learning_rate": 0.00023142156590703845, "loss": 0.0189, "step": 90620 }, { "epoch": 0.46, "learning_rate": 0.00023141399821402443, "loss": 0.0156, "step": 90630 }, { "epoch": 0.46, "learning_rate": 0.00023140643052101042, "loss": 0.0198, "step": 90640 }, { "epoch": 0.46, "learning_rate": 0.00023139886282799642, "loss": 0.015, "step": 90650 }, { "epoch": 0.46, "learning_rate": 0.0002313912951349824, "loss": 0.0173, "step": 90660 }, { "epoch": 0.46, "learning_rate": 0.0002313837274419684, "loss": 0.018, "step": 90670 }, { "epoch": 0.46, "learning_rate": 0.00023137615974895437, "loss": 0.0168, "step": 90680 }, { "epoch": 0.46, "learning_rate": 0.00023136859205594038, "loss": 0.0194, "step": 90690 }, { "epoch": 0.46, "learning_rate": 0.00023136102436292636, "loss": 0.018, "step": 90700 }, { "epoch": 0.46, "learning_rate": 0.00023135345666991234, "loss": 0.0119, "step": 90710 }, { "epoch": 0.46, "learning_rate": 0.00023134588897689835, "loss": 0.0158, "step": 90720 }, { "epoch": 0.46, "learning_rate": 0.00023133832128388433, "loss": 0.015, "step": 90730 }, { "epoch": 0.46, "learning_rate": 0.0002313307535908703, "loss": 0.0161, "step": 90740 }, { "epoch": 0.46, "learning_rate": 0.00023132318589785632, "loss": 0.0151, "step": 90750 }, { "epoch": 0.46, "learning_rate": 0.0002313156182048423, "loss": 0.0207, "step": 90760 }, { "epoch": 0.46, "learning_rate": 0.00023130805051182828, "loss": 0.0183, "step": 90770 }, { "epoch": 0.46, "learning_rate": 0.0002313004828188143, "loss": 0.0148, "step": 90780 }, { "epoch": 0.46, "learning_rate": 0.00023129291512580027, "loss": 0.0157, "step": 90790 }, { "epoch": 0.46, "learning_rate": 0.00023128534743278625, "loss": 0.0169, "step": 90800 }, { "epoch": 0.46, "learning_rate": 0.00023127777973977226, "loss": 0.0172, "step": 90810 }, { "epoch": 0.46, "learning_rate": 0.00023127021204675824, "loss": 0.0178, "step": 90820 }, { "epoch": 0.46, "learning_rate": 0.00023126264435374423, "loss": 0.0186, "step": 90830 }, { "epoch": 0.46, "learning_rate": 0.0002312550766607302, "loss": 0.0152, "step": 90840 }, { "epoch": 0.46, "learning_rate": 0.00023124750896771622, "loss": 0.0134, "step": 90850 }, { "epoch": 0.46, "learning_rate": 0.0002312399412747022, "loss": 0.0157, "step": 90860 }, { "epoch": 0.46, "learning_rate": 0.00023123237358168818, "loss": 0.0211, "step": 90870 }, { "epoch": 0.46, "learning_rate": 0.0002312248058886742, "loss": 0.0192, "step": 90880 }, { "epoch": 0.46, "learning_rate": 0.00023121723819566017, "loss": 0.0149, "step": 90890 }, { "epoch": 0.46, "learning_rate": 0.00023120967050264615, "loss": 0.0156, "step": 90900 }, { "epoch": 0.46, "learning_rate": 0.00023120210280963216, "loss": 0.015, "step": 90910 }, { "epoch": 0.46, "learning_rate": 0.00023119453511661814, "loss": 0.0175, "step": 90920 }, { "epoch": 0.46, "learning_rate": 0.00023118696742360412, "loss": 0.0149, "step": 90930 }, { "epoch": 0.46, "learning_rate": 0.00023117939973059013, "loss": 0.0145, "step": 90940 }, { "epoch": 0.46, "learning_rate": 0.0002311718320375761, "loss": 0.0163, "step": 90950 }, { "epoch": 0.46, "learning_rate": 0.0002311642643445621, "loss": 0.0163, "step": 90960 }, { "epoch": 0.46, "learning_rate": 0.0002311566966515481, "loss": 0.0162, "step": 90970 }, { "epoch": 0.46, "learning_rate": 0.00023114912895853408, "loss": 0.0172, "step": 90980 }, { "epoch": 0.46, "learning_rate": 0.00023114156126552006, "loss": 0.0177, "step": 90990 }, { "epoch": 0.46, "learning_rate": 0.00023113399357250607, "loss": 0.0168, "step": 91000 }, { "epoch": 0.46, "eval_cer": 0.9145022789753005, "eval_loss": 0.01197886560112238, "eval_runtime": 116.7595, "eval_samples_per_second": 17.129, "eval_steps_per_second": 4.282, "step": 91000 }, { "epoch": 0.46, "learning_rate": 0.00023112642587949205, "loss": 0.0226, "step": 91010 }, { "epoch": 0.46, "learning_rate": 0.00023111885818647804, "loss": 0.0155, "step": 91020 }, { "epoch": 0.46, "learning_rate": 0.00023111129049346402, "loss": 0.0138, "step": 91030 }, { "epoch": 0.46, "learning_rate": 0.00023110372280045003, "loss": 0.0222, "step": 91040 }, { "epoch": 0.46, "learning_rate": 0.000231096155107436, "loss": 0.0136, "step": 91050 }, { "epoch": 0.46, "learning_rate": 0.000231088587414422, "loss": 0.0187, "step": 91060 }, { "epoch": 0.46, "learning_rate": 0.000231081019721408, "loss": 0.0162, "step": 91070 }, { "epoch": 0.46, "learning_rate": 0.00023107345202839398, "loss": 0.0177, "step": 91080 }, { "epoch": 0.46, "learning_rate": 0.00023106588433537996, "loss": 0.0175, "step": 91090 }, { "epoch": 0.46, "learning_rate": 0.00023105831664236597, "loss": 0.0169, "step": 91100 }, { "epoch": 0.46, "learning_rate": 0.00023105074894935195, "loss": 0.0175, "step": 91110 }, { "epoch": 0.46, "learning_rate": 0.00023104318125633793, "loss": 0.0212, "step": 91120 }, { "epoch": 0.46, "learning_rate": 0.00023103561356332389, "loss": 0.0153, "step": 91130 }, { "epoch": 0.46, "learning_rate": 0.0002310280458703099, "loss": 0.0164, "step": 91140 }, { "epoch": 0.46, "learning_rate": 0.00023102047817729588, "loss": 0.0157, "step": 91150 }, { "epoch": 0.46, "learning_rate": 0.00023101291048428186, "loss": 0.014, "step": 91160 }, { "epoch": 0.46, "learning_rate": 0.00023100534279126787, "loss": 0.0172, "step": 91170 }, { "epoch": 0.46, "learning_rate": 0.00023099777509825385, "loss": 0.019, "step": 91180 }, { "epoch": 0.46, "learning_rate": 0.00023099020740523983, "loss": 0.0171, "step": 91190 }, { "epoch": 0.46, "learning_rate": 0.00023098263971222584, "loss": 0.0161, "step": 91200 }, { "epoch": 0.46, "learning_rate": 0.00023097507201921182, "loss": 0.0221, "step": 91210 }, { "epoch": 0.46, "learning_rate": 0.0002309675043261978, "loss": 0.0144, "step": 91220 }, { "epoch": 0.46, "learning_rate": 0.00023095993663318378, "loss": 0.0129, "step": 91230 }, { "epoch": 0.46, "learning_rate": 0.0002309523689401698, "loss": 0.0206, "step": 91240 }, { "epoch": 0.46, "learning_rate": 0.00023094480124715577, "loss": 0.0123, "step": 91250 }, { "epoch": 0.46, "learning_rate": 0.00023093723355414175, "loss": 0.0149, "step": 91260 }, { "epoch": 0.46, "learning_rate": 0.00023092966586112776, "loss": 0.0188, "step": 91270 }, { "epoch": 0.46, "learning_rate": 0.00023092209816811374, "loss": 0.0197, "step": 91280 }, { "epoch": 0.46, "learning_rate": 0.00023091453047509972, "loss": 0.0165, "step": 91290 }, { "epoch": 0.46, "learning_rate": 0.00023090696278208573, "loss": 0.0179, "step": 91300 }, { "epoch": 0.46, "learning_rate": 0.00023089939508907171, "loss": 0.0194, "step": 91310 }, { "epoch": 0.46, "learning_rate": 0.0002308918273960577, "loss": 0.022, "step": 91320 }, { "epoch": 0.46, "learning_rate": 0.0002308842597030437, "loss": 0.0215, "step": 91330 }, { "epoch": 0.46, "learning_rate": 0.00023087669201002969, "loss": 0.0174, "step": 91340 }, { "epoch": 0.46, "learning_rate": 0.00023086912431701567, "loss": 0.0195, "step": 91350 }, { "epoch": 0.46, "learning_rate": 0.00023086155662400168, "loss": 0.0159, "step": 91360 }, { "epoch": 0.46, "learning_rate": 0.00023085398893098766, "loss": 0.018, "step": 91370 }, { "epoch": 0.46, "learning_rate": 0.00023084642123797364, "loss": 0.0177, "step": 91380 }, { "epoch": 0.46, "learning_rate": 0.00023083885354495965, "loss": 0.0251, "step": 91390 }, { "epoch": 0.46, "learning_rate": 0.00023083128585194563, "loss": 0.0181, "step": 91400 }, { "epoch": 0.46, "learning_rate": 0.0002308237181589316, "loss": 0.022, "step": 91410 }, { "epoch": 0.46, "learning_rate": 0.0002308161504659176, "loss": 0.0176, "step": 91420 }, { "epoch": 0.46, "learning_rate": 0.0002308085827729036, "loss": 0.0198, "step": 91430 }, { "epoch": 0.46, "learning_rate": 0.00023080101507988958, "loss": 0.0189, "step": 91440 }, { "epoch": 0.46, "learning_rate": 0.00023079344738687556, "loss": 0.0196, "step": 91450 }, { "epoch": 0.46, "learning_rate": 0.00023078587969386157, "loss": 0.0166, "step": 91460 }, { "epoch": 0.46, "learning_rate": 0.00023077831200084755, "loss": 0.0208, "step": 91470 }, { "epoch": 0.46, "learning_rate": 0.00023077074430783353, "loss": 0.0145, "step": 91480 }, { "epoch": 0.46, "learning_rate": 0.00023076317661481954, "loss": 0.0164, "step": 91490 }, { "epoch": 0.46, "learning_rate": 0.00023075560892180552, "loss": 0.0163, "step": 91500 }, { "epoch": 0.46, "learning_rate": 0.0002307480412287915, "loss": 0.0186, "step": 91510 }, { "epoch": 0.46, "learning_rate": 0.00023074047353577751, "loss": 0.0174, "step": 91520 }, { "epoch": 0.46, "learning_rate": 0.0002307329058427635, "loss": 0.0138, "step": 91530 }, { "epoch": 0.46, "learning_rate": 0.00023072533814974948, "loss": 0.0204, "step": 91540 }, { "epoch": 0.46, "learning_rate": 0.00023071777045673549, "loss": 0.0159, "step": 91550 }, { "epoch": 0.46, "learning_rate": 0.00023071020276372147, "loss": 0.0135, "step": 91560 }, { "epoch": 0.46, "learning_rate": 0.00023070263507070745, "loss": 0.017, "step": 91570 }, { "epoch": 0.46, "learning_rate": 0.00023069506737769343, "loss": 0.0158, "step": 91580 }, { "epoch": 0.46, "learning_rate": 0.00023068749968467944, "loss": 0.0174, "step": 91590 }, { "epoch": 0.46, "learning_rate": 0.00023067993199166542, "loss": 0.0161, "step": 91600 }, { "epoch": 0.46, "learning_rate": 0.0002306723642986514, "loss": 0.0202, "step": 91610 }, { "epoch": 0.46, "learning_rate": 0.0002306647966056374, "loss": 0.0194, "step": 91620 }, { "epoch": 0.46, "learning_rate": 0.0002306572289126234, "loss": 0.0195, "step": 91630 }, { "epoch": 0.46, "learning_rate": 0.00023064966121960937, "loss": 0.0178, "step": 91640 }, { "epoch": 0.46, "learning_rate": 0.00023064209352659538, "loss": 0.0173, "step": 91650 }, { "epoch": 0.46, "learning_rate": 0.00023063452583358136, "loss": 0.015, "step": 91660 }, { "epoch": 0.46, "learning_rate": 0.00023062695814056734, "loss": 0.0153, "step": 91670 }, { "epoch": 0.46, "learning_rate": 0.00023061939044755335, "loss": 0.0176, "step": 91680 }, { "epoch": 0.46, "learning_rate": 0.00023061182275453933, "loss": 0.0178, "step": 91690 }, { "epoch": 0.46, "learning_rate": 0.00023060425506152532, "loss": 0.0181, "step": 91700 }, { "epoch": 0.46, "learning_rate": 0.00023059668736851132, "loss": 0.0195, "step": 91710 }, { "epoch": 0.46, "learning_rate": 0.0002305891196754973, "loss": 0.0171, "step": 91720 }, { "epoch": 0.46, "learning_rate": 0.0002305815519824833, "loss": 0.0165, "step": 91730 }, { "epoch": 0.46, "learning_rate": 0.00023057398428946927, "loss": 0.0174, "step": 91740 }, { "epoch": 0.46, "learning_rate": 0.00023056641659645528, "loss": 0.0175, "step": 91750 }, { "epoch": 0.46, "learning_rate": 0.00023055884890344126, "loss": 0.0185, "step": 91760 }, { "epoch": 0.46, "learning_rate": 0.00023055128121042724, "loss": 0.0184, "step": 91770 }, { "epoch": 0.46, "learning_rate": 0.00023054371351741325, "loss": 0.0161, "step": 91780 }, { "epoch": 0.46, "learning_rate": 0.00023053614582439923, "loss": 0.0184, "step": 91790 }, { "epoch": 0.46, "learning_rate": 0.0002305285781313852, "loss": 0.016, "step": 91800 }, { "epoch": 0.46, "learning_rate": 0.00023052101043837122, "loss": 0.0141, "step": 91810 }, { "epoch": 0.46, "learning_rate": 0.0002305134427453572, "loss": 0.02, "step": 91820 }, { "epoch": 0.46, "learning_rate": 0.00023050587505234318, "loss": 0.0146, "step": 91830 }, { "epoch": 0.46, "learning_rate": 0.0002304983073593292, "loss": 0.0144, "step": 91840 }, { "epoch": 0.46, "learning_rate": 0.00023049073966631517, "loss": 0.0144, "step": 91850 }, { "epoch": 0.46, "learning_rate": 0.00023048317197330115, "loss": 0.0142, "step": 91860 }, { "epoch": 0.46, "learning_rate": 0.00023047560428028716, "loss": 0.0161, "step": 91870 }, { "epoch": 0.46, "learning_rate": 0.00023046803658727314, "loss": 0.0133, "step": 91880 }, { "epoch": 0.46, "learning_rate": 0.00023046046889425913, "loss": 0.0168, "step": 91890 }, { "epoch": 0.46, "learning_rate": 0.00023045290120124513, "loss": 0.0171, "step": 91900 }, { "epoch": 0.46, "learning_rate": 0.00023044533350823112, "loss": 0.0262, "step": 91910 }, { "epoch": 0.46, "learning_rate": 0.0002304377658152171, "loss": 0.0167, "step": 91920 }, { "epoch": 0.46, "learning_rate": 0.00023043019812220308, "loss": 0.0148, "step": 91930 }, { "epoch": 0.46, "learning_rate": 0.0002304226304291891, "loss": 0.0152, "step": 91940 }, { "epoch": 0.46, "learning_rate": 0.00023041506273617507, "loss": 0.0187, "step": 91950 }, { "epoch": 0.46, "learning_rate": 0.00023040749504316105, "loss": 0.0157, "step": 91960 }, { "epoch": 0.46, "learning_rate": 0.00023039992735014706, "loss": 0.0129, "step": 91970 }, { "epoch": 0.46, "learning_rate": 0.00023039235965713304, "loss": 0.0174, "step": 91980 }, { "epoch": 0.46, "learning_rate": 0.00023038479196411902, "loss": 0.016, "step": 91990 }, { "epoch": 0.46, "learning_rate": 0.00023037722427110503, "loss": 0.017, "step": 92000 }, { "epoch": 0.46, "eval_cer": 0.9144974269946735, "eval_loss": 0.011690773069858551, "eval_runtime": 116.7969, "eval_samples_per_second": 17.124, "eval_steps_per_second": 4.281, "step": 92000 }, { "epoch": 0.46, "learning_rate": 0.000230369656578091, "loss": 0.0172, "step": 92010 }, { "epoch": 0.46, "learning_rate": 0.000230362088885077, "loss": 0.0176, "step": 92020 }, { "epoch": 0.46, "learning_rate": 0.000230354521192063, "loss": 0.0148, "step": 92030 }, { "epoch": 0.46, "learning_rate": 0.00023034695349904898, "loss": 0.0254, "step": 92040 }, { "epoch": 0.46, "learning_rate": 0.00023033938580603496, "loss": 0.0176, "step": 92050 }, { "epoch": 0.46, "learning_rate": 0.00023033181811302097, "loss": 0.0218, "step": 92060 }, { "epoch": 0.46, "learning_rate": 0.00023032425042000695, "loss": 0.0184, "step": 92070 }, { "epoch": 0.46, "learning_rate": 0.00023031668272699294, "loss": 0.0171, "step": 92080 }, { "epoch": 0.46, "learning_rate": 0.00023030911503397892, "loss": 0.0169, "step": 92090 }, { "epoch": 0.46, "learning_rate": 0.00023030154734096493, "loss": 0.0164, "step": 92100 }, { "epoch": 0.46, "learning_rate": 0.0002302939796479509, "loss": 0.0177, "step": 92110 }, { "epoch": 0.46, "learning_rate": 0.0002302864119549369, "loss": 0.0184, "step": 92120 }, { "epoch": 0.46, "learning_rate": 0.0002302788442619229, "loss": 0.019, "step": 92130 }, { "epoch": 0.46, "learning_rate": 0.00023027127656890888, "loss": 0.0174, "step": 92140 }, { "epoch": 0.46, "learning_rate": 0.00023026370887589486, "loss": 0.0162, "step": 92150 }, { "epoch": 0.46, "learning_rate": 0.00023025614118288087, "loss": 0.0189, "step": 92160 }, { "epoch": 0.47, "learning_rate": 0.00023024857348986685, "loss": 0.0166, "step": 92170 }, { "epoch": 0.47, "learning_rate": 0.00023024100579685283, "loss": 0.0175, "step": 92180 }, { "epoch": 0.47, "learning_rate": 0.00023023343810383884, "loss": 0.0141, "step": 92190 }, { "epoch": 0.47, "learning_rate": 0.00023022587041082482, "loss": 0.0188, "step": 92200 }, { "epoch": 0.47, "learning_rate": 0.0002302183027178108, "loss": 0.0153, "step": 92210 }, { "epoch": 0.47, "learning_rate": 0.0002302107350247968, "loss": 0.0183, "step": 92220 }, { "epoch": 0.47, "learning_rate": 0.0002302031673317828, "loss": 0.0149, "step": 92230 }, { "epoch": 0.47, "learning_rate": 0.00023019559963876877, "loss": 0.0169, "step": 92240 }, { "epoch": 0.47, "learning_rate": 0.00023018803194575476, "loss": 0.015, "step": 92250 }, { "epoch": 0.47, "learning_rate": 0.00023018046425274076, "loss": 0.0173, "step": 92260 }, { "epoch": 0.47, "learning_rate": 0.00023017289655972675, "loss": 0.0177, "step": 92270 }, { "epoch": 0.47, "learning_rate": 0.00023016532886671273, "loss": 0.0205, "step": 92280 }, { "epoch": 0.47, "learning_rate": 0.00023015776117369874, "loss": 0.0171, "step": 92290 }, { "epoch": 0.47, "learning_rate": 0.00023015019348068472, "loss": 0.0143, "step": 92300 }, { "epoch": 0.47, "learning_rate": 0.0002301426257876707, "loss": 0.0174, "step": 92310 }, { "epoch": 0.47, "learning_rate": 0.0002301350580946567, "loss": 0.0189, "step": 92320 }, { "epoch": 0.47, "learning_rate": 0.0002301274904016427, "loss": 0.015, "step": 92330 }, { "epoch": 0.47, "learning_rate": 0.00023011992270862867, "loss": 0.0153, "step": 92340 }, { "epoch": 0.47, "learning_rate": 0.00023011235501561468, "loss": 0.0169, "step": 92350 }, { "epoch": 0.47, "learning_rate": 0.00023010478732260066, "loss": 0.0132, "step": 92360 }, { "epoch": 0.47, "learning_rate": 0.00023009721962958664, "loss": 0.0149, "step": 92370 }, { "epoch": 0.47, "learning_rate": 0.00023008965193657265, "loss": 0.0155, "step": 92380 }, { "epoch": 0.47, "learning_rate": 0.0002300820842435586, "loss": 0.0161, "step": 92390 }, { "epoch": 0.47, "learning_rate": 0.0002300745165505446, "loss": 0.0195, "step": 92400 }, { "epoch": 0.47, "learning_rate": 0.00023006694885753057, "loss": 0.0183, "step": 92410 }, { "epoch": 0.47, "learning_rate": 0.00023005938116451658, "loss": 0.0182, "step": 92420 }, { "epoch": 0.47, "learning_rate": 0.00023005181347150256, "loss": 0.0189, "step": 92430 }, { "epoch": 0.47, "learning_rate": 0.00023004424577848854, "loss": 0.0171, "step": 92440 }, { "epoch": 0.47, "learning_rate": 0.00023003667808547455, "loss": 0.0221, "step": 92450 }, { "epoch": 0.47, "learning_rate": 0.00023002911039246053, "loss": 0.0119, "step": 92460 }, { "epoch": 0.47, "learning_rate": 0.0002300215426994465, "loss": 0.0139, "step": 92470 }, { "epoch": 0.47, "learning_rate": 0.0002300139750064325, "loss": 0.0143, "step": 92480 }, { "epoch": 0.47, "learning_rate": 0.0002300064073134185, "loss": 0.0151, "step": 92490 }, { "epoch": 0.47, "learning_rate": 0.00022999883962040448, "loss": 0.0174, "step": 92500 }, { "epoch": 0.47, "learning_rate": 0.00022999127192739046, "loss": 0.0144, "step": 92510 }, { "epoch": 0.47, "learning_rate": 0.00022998370423437647, "loss": 0.0209, "step": 92520 }, { "epoch": 0.47, "learning_rate": 0.00022997613654136245, "loss": 0.0164, "step": 92530 }, { "epoch": 0.47, "learning_rate": 0.00022996856884834844, "loss": 0.0165, "step": 92540 }, { "epoch": 0.47, "learning_rate": 0.00022996100115533444, "loss": 0.0144, "step": 92550 }, { "epoch": 0.47, "learning_rate": 0.00022995343346232043, "loss": 0.0168, "step": 92560 }, { "epoch": 0.47, "learning_rate": 0.0002299458657693064, "loss": 0.0142, "step": 92570 }, { "epoch": 0.47, "learning_rate": 0.00022993829807629242, "loss": 0.0194, "step": 92580 }, { "epoch": 0.47, "learning_rate": 0.0002299307303832784, "loss": 0.0141, "step": 92590 }, { "epoch": 0.47, "learning_rate": 0.00022992316269026438, "loss": 0.0159, "step": 92600 }, { "epoch": 0.47, "learning_rate": 0.0002299155949972504, "loss": 0.0163, "step": 92610 }, { "epoch": 0.47, "learning_rate": 0.00022990802730423637, "loss": 0.0131, "step": 92620 }, { "epoch": 0.47, "learning_rate": 0.00022990045961122235, "loss": 0.0157, "step": 92630 }, { "epoch": 0.47, "learning_rate": 0.00022989289191820833, "loss": 0.0124, "step": 92640 }, { "epoch": 0.47, "learning_rate": 0.00022988532422519434, "loss": 0.0141, "step": 92650 }, { "epoch": 0.47, "learning_rate": 0.00022987775653218032, "loss": 0.0173, "step": 92660 }, { "epoch": 0.47, "learning_rate": 0.0002298701888391663, "loss": 0.0133, "step": 92670 }, { "epoch": 0.47, "learning_rate": 0.0002298626211461523, "loss": 0.0157, "step": 92680 }, { "epoch": 0.47, "learning_rate": 0.0002298550534531383, "loss": 0.0207, "step": 92690 }, { "epoch": 0.47, "learning_rate": 0.00022984748576012427, "loss": 0.0155, "step": 92700 }, { "epoch": 0.47, "learning_rate": 0.00022983991806711028, "loss": 0.0129, "step": 92710 }, { "epoch": 0.47, "learning_rate": 0.00022983235037409626, "loss": 0.0137, "step": 92720 }, { "epoch": 0.47, "learning_rate": 0.00022982478268108225, "loss": 0.0151, "step": 92730 }, { "epoch": 0.47, "learning_rate": 0.00022981721498806825, "loss": 0.0135, "step": 92740 }, { "epoch": 0.47, "learning_rate": 0.00022980964729505424, "loss": 0.0148, "step": 92750 }, { "epoch": 0.47, "learning_rate": 0.00022980207960204022, "loss": 0.0153, "step": 92760 }, { "epoch": 0.47, "learning_rate": 0.00022979451190902623, "loss": 0.0157, "step": 92770 }, { "epoch": 0.47, "learning_rate": 0.0002297869442160122, "loss": 0.0168, "step": 92780 }, { "epoch": 0.47, "learning_rate": 0.0002297793765229982, "loss": 0.0166, "step": 92790 }, { "epoch": 0.47, "learning_rate": 0.0002297718088299842, "loss": 0.017, "step": 92800 }, { "epoch": 0.47, "learning_rate": 0.00022976424113697018, "loss": 0.0166, "step": 92810 }, { "epoch": 0.47, "learning_rate": 0.00022975667344395616, "loss": 0.0172, "step": 92820 }, { "epoch": 0.47, "learning_rate": 0.00022974910575094214, "loss": 0.0156, "step": 92830 }, { "epoch": 0.47, "learning_rate": 0.00022974153805792815, "loss": 0.0179, "step": 92840 }, { "epoch": 0.47, "learning_rate": 0.00022973397036491413, "loss": 0.0188, "step": 92850 }, { "epoch": 0.47, "learning_rate": 0.0002297264026719001, "loss": 0.0185, "step": 92860 }, { "epoch": 0.47, "learning_rate": 0.00022971883497888612, "loss": 0.0144, "step": 92870 }, { "epoch": 0.47, "learning_rate": 0.0002297112672858721, "loss": 0.0166, "step": 92880 }, { "epoch": 0.47, "learning_rate": 0.00022970369959285808, "loss": 0.0168, "step": 92890 }, { "epoch": 0.47, "learning_rate": 0.0002296961318998441, "loss": 0.0174, "step": 92900 }, { "epoch": 0.47, "learning_rate": 0.00022968856420683007, "loss": 0.0187, "step": 92910 }, { "epoch": 0.47, "learning_rate": 0.00022968099651381606, "loss": 0.0147, "step": 92920 }, { "epoch": 0.47, "learning_rate": 0.00022967342882080206, "loss": 0.0154, "step": 92930 }, { "epoch": 0.47, "learning_rate": 0.00022966586112778805, "loss": 0.0139, "step": 92940 }, { "epoch": 0.47, "learning_rate": 0.00022965829343477403, "loss": 0.0155, "step": 92950 }, { "epoch": 0.47, "learning_rate": 0.00022965072574176004, "loss": 0.0153, "step": 92960 }, { "epoch": 0.47, "learning_rate": 0.00022964315804874602, "loss": 0.0146, "step": 92970 }, { "epoch": 0.47, "learning_rate": 0.000229635590355732, "loss": 0.0187, "step": 92980 }, { "epoch": 0.47, "learning_rate": 0.00022962802266271798, "loss": 0.0197, "step": 92990 }, { "epoch": 0.47, "learning_rate": 0.000229620454969704, "loss": 0.0164, "step": 93000 }, { "epoch": 0.47, "eval_cer": 0.9144867526372941, "eval_loss": 0.0119341891258955, "eval_runtime": 116.7754, "eval_samples_per_second": 17.127, "eval_steps_per_second": 4.282, "step": 93000 }, { "epoch": 0.47, "learning_rate": 0.00022961288727668997, "loss": 0.0171, "step": 93010 }, { "epoch": 0.47, "learning_rate": 0.00022960531958367595, "loss": 0.0176, "step": 93020 }, { "epoch": 0.47, "learning_rate": 0.00022959775189066196, "loss": 0.0171, "step": 93030 }, { "epoch": 0.47, "learning_rate": 0.00022959018419764794, "loss": 0.0164, "step": 93040 }, { "epoch": 0.47, "learning_rate": 0.00022958261650463392, "loss": 0.0181, "step": 93050 }, { "epoch": 0.47, "learning_rate": 0.00022957504881161993, "loss": 0.0164, "step": 93060 }, { "epoch": 0.47, "learning_rate": 0.0002295674811186059, "loss": 0.0162, "step": 93070 }, { "epoch": 0.47, "learning_rate": 0.0002295599134255919, "loss": 0.0144, "step": 93080 }, { "epoch": 0.47, "learning_rate": 0.0002295523457325779, "loss": 0.0169, "step": 93090 }, { "epoch": 0.47, "learning_rate": 0.00022954477803956388, "loss": 0.0152, "step": 93100 }, { "epoch": 0.47, "learning_rate": 0.00022953721034654987, "loss": 0.013, "step": 93110 }, { "epoch": 0.47, "learning_rate": 0.00022952964265353587, "loss": 0.0171, "step": 93120 }, { "epoch": 0.47, "learning_rate": 0.00022952207496052186, "loss": 0.0178, "step": 93130 }, { "epoch": 0.47, "learning_rate": 0.00022951450726750784, "loss": 0.0179, "step": 93140 }, { "epoch": 0.47, "learning_rate": 0.00022950693957449382, "loss": 0.0142, "step": 93150 }, { "epoch": 0.47, "learning_rate": 0.00022949937188147983, "loss": 0.0143, "step": 93160 }, { "epoch": 0.47, "learning_rate": 0.0002294918041884658, "loss": 0.015, "step": 93170 }, { "epoch": 0.47, "learning_rate": 0.0002294842364954518, "loss": 0.0162, "step": 93180 }, { "epoch": 0.47, "learning_rate": 0.0002294766688024378, "loss": 0.0168, "step": 93190 }, { "epoch": 0.47, "learning_rate": 0.00022946910110942378, "loss": 0.0154, "step": 93200 }, { "epoch": 0.47, "learning_rate": 0.00022946153341640976, "loss": 0.0138, "step": 93210 }, { "epoch": 0.47, "learning_rate": 0.00022945396572339577, "loss": 0.0142, "step": 93220 }, { "epoch": 0.47, "learning_rate": 0.00022944639803038175, "loss": 0.0178, "step": 93230 }, { "epoch": 0.47, "learning_rate": 0.00022943883033736773, "loss": 0.0164, "step": 93240 }, { "epoch": 0.47, "learning_rate": 0.00022943126264435374, "loss": 0.0153, "step": 93250 }, { "epoch": 0.47, "learning_rate": 0.00022942369495133972, "loss": 0.0153, "step": 93260 }, { "epoch": 0.47, "learning_rate": 0.0002294161272583257, "loss": 0.02, "step": 93270 }, { "epoch": 0.47, "learning_rate": 0.0002294085595653117, "loss": 0.0168, "step": 93280 }, { "epoch": 0.47, "learning_rate": 0.0002294009918722977, "loss": 0.0161, "step": 93290 }, { "epoch": 0.47, "learning_rate": 0.00022939342417928368, "loss": 0.0146, "step": 93300 }, { "epoch": 0.47, "learning_rate": 0.00022938585648626966, "loss": 0.0162, "step": 93310 }, { "epoch": 0.47, "learning_rate": 0.00022937828879325567, "loss": 0.0158, "step": 93320 }, { "epoch": 0.47, "learning_rate": 0.00022937072110024165, "loss": 0.0166, "step": 93330 }, { "epoch": 0.47, "learning_rate": 0.00022936315340722763, "loss": 0.0159, "step": 93340 }, { "epoch": 0.47, "learning_rate": 0.00022935558571421364, "loss": 0.0178, "step": 93350 }, { "epoch": 0.47, "learning_rate": 0.00022934801802119962, "loss": 0.0145, "step": 93360 }, { "epoch": 0.47, "learning_rate": 0.0002293404503281856, "loss": 0.0168, "step": 93370 }, { "epoch": 0.47, "learning_rate": 0.0002293328826351716, "loss": 0.0142, "step": 93380 }, { "epoch": 0.47, "learning_rate": 0.0002293253149421576, "loss": 0.0172, "step": 93390 }, { "epoch": 0.47, "learning_rate": 0.00022931774724914357, "loss": 0.0138, "step": 93400 }, { "epoch": 0.47, "learning_rate": 0.00022931017955612958, "loss": 0.0148, "step": 93410 }, { "epoch": 0.47, "learning_rate": 0.00022930261186311556, "loss": 0.014, "step": 93420 }, { "epoch": 0.47, "learning_rate": 0.00022929504417010154, "loss": 0.015, "step": 93430 }, { "epoch": 0.47, "learning_rate": 0.00022928747647708755, "loss": 0.0141, "step": 93440 }, { "epoch": 0.47, "learning_rate": 0.00022927990878407353, "loss": 0.0186, "step": 93450 }, { "epoch": 0.47, "learning_rate": 0.00022927234109105951, "loss": 0.0208, "step": 93460 }, { "epoch": 0.47, "learning_rate": 0.00022926477339804552, "loss": 0.0142, "step": 93470 }, { "epoch": 0.47, "learning_rate": 0.0002292572057050315, "loss": 0.0183, "step": 93480 }, { "epoch": 0.47, "learning_rate": 0.00022924963801201749, "loss": 0.0149, "step": 93490 }, { "epoch": 0.47, "learning_rate": 0.00022924207031900347, "loss": 0.0197, "step": 93500 }, { "epoch": 0.47, "learning_rate": 0.00022923450262598948, "loss": 0.0162, "step": 93510 }, { "epoch": 0.47, "learning_rate": 0.00022922693493297546, "loss": 0.0183, "step": 93520 }, { "epoch": 0.47, "learning_rate": 0.00022921936723996144, "loss": 0.0166, "step": 93530 }, { "epoch": 0.47, "learning_rate": 0.00022921179954694745, "loss": 0.0161, "step": 93540 }, { "epoch": 0.47, "learning_rate": 0.00022920423185393343, "loss": 0.0185, "step": 93550 }, { "epoch": 0.47, "learning_rate": 0.0002291966641609194, "loss": 0.0173, "step": 93560 }, { "epoch": 0.47, "learning_rate": 0.00022918909646790542, "loss": 0.0161, "step": 93570 }, { "epoch": 0.47, "learning_rate": 0.0002291815287748914, "loss": 0.017, "step": 93580 }, { "epoch": 0.47, "learning_rate": 0.00022917396108187738, "loss": 0.016, "step": 93590 }, { "epoch": 0.47, "learning_rate": 0.0002291663933888634, "loss": 0.0143, "step": 93600 }, { "epoch": 0.47, "learning_rate": 0.00022915882569584937, "loss": 0.0143, "step": 93610 }, { "epoch": 0.47, "learning_rate": 0.00022915125800283535, "loss": 0.014, "step": 93620 }, { "epoch": 0.47, "learning_rate": 0.00022914369030982136, "loss": 0.0147, "step": 93630 }, { "epoch": 0.47, "learning_rate": 0.00022913612261680732, "loss": 0.0186, "step": 93640 }, { "epoch": 0.47, "learning_rate": 0.0002291285549237933, "loss": 0.0168, "step": 93650 }, { "epoch": 0.47, "learning_rate": 0.00022912098723077928, "loss": 0.0145, "step": 93660 }, { "epoch": 0.47, "learning_rate": 0.0002291134195377653, "loss": 0.0159, "step": 93670 }, { "epoch": 0.47, "learning_rate": 0.00022910585184475127, "loss": 0.0151, "step": 93680 }, { "epoch": 0.47, "learning_rate": 0.00022909828415173725, "loss": 0.0158, "step": 93690 }, { "epoch": 0.47, "learning_rate": 0.00022909071645872326, "loss": 0.0286, "step": 93700 }, { "epoch": 0.47, "learning_rate": 0.00022908314876570924, "loss": 0.0202, "step": 93710 }, { "epoch": 0.47, "learning_rate": 0.00022907558107269522, "loss": 0.0162, "step": 93720 }, { "epoch": 0.47, "learning_rate": 0.0002290680133796812, "loss": 0.0167, "step": 93730 }, { "epoch": 0.47, "learning_rate": 0.0002290604456866672, "loss": 0.0191, "step": 93740 }, { "epoch": 0.47, "learning_rate": 0.0002290528779936532, "loss": 0.0178, "step": 93750 }, { "epoch": 0.47, "learning_rate": 0.00022904531030063917, "loss": 0.0186, "step": 93760 }, { "epoch": 0.47, "learning_rate": 0.00022903774260762518, "loss": 0.0159, "step": 93770 }, { "epoch": 0.47, "learning_rate": 0.00022903017491461116, "loss": 0.0166, "step": 93780 }, { "epoch": 0.47, "learning_rate": 0.00022902260722159715, "loss": 0.0206, "step": 93790 }, { "epoch": 0.47, "learning_rate": 0.00022901503952858315, "loss": 0.0184, "step": 93800 }, { "epoch": 0.47, "learning_rate": 0.00022900747183556914, "loss": 0.0159, "step": 93810 }, { "epoch": 0.47, "learning_rate": 0.00022899990414255512, "loss": 0.0153, "step": 93820 }, { "epoch": 0.47, "learning_rate": 0.00022899233644954113, "loss": 0.018, "step": 93830 }, { "epoch": 0.47, "learning_rate": 0.0002289847687565271, "loss": 0.0178, "step": 93840 }, { "epoch": 0.47, "learning_rate": 0.0002289772010635131, "loss": 0.0171, "step": 93850 }, { "epoch": 0.47, "learning_rate": 0.0002289696333704991, "loss": 0.0188, "step": 93860 }, { "epoch": 0.47, "learning_rate": 0.00022896206567748508, "loss": 0.0165, "step": 93870 }, { "epoch": 0.47, "learning_rate": 0.00022895449798447106, "loss": 0.0183, "step": 93880 }, { "epoch": 0.47, "learning_rate": 0.00022894693029145704, "loss": 0.013, "step": 93890 }, { "epoch": 0.47, "learning_rate": 0.00022893936259844305, "loss": 0.0163, "step": 93900 }, { "epoch": 0.47, "learning_rate": 0.00022893179490542903, "loss": 0.0166, "step": 93910 }, { "epoch": 0.47, "learning_rate": 0.000228924227212415, "loss": 0.0152, "step": 93920 }, { "epoch": 0.47, "learning_rate": 0.00022891665951940102, "loss": 0.0181, "step": 93930 }, { "epoch": 0.47, "learning_rate": 0.000228909091826387, "loss": 0.0155, "step": 93940 }, { "epoch": 0.47, "learning_rate": 0.00022890152413337298, "loss": 0.012, "step": 93950 }, { "epoch": 0.47, "learning_rate": 0.000228893956440359, "loss": 0.0129, "step": 93960 }, { "epoch": 0.47, "learning_rate": 0.00022888638874734497, "loss": 0.0165, "step": 93970 }, { "epoch": 0.47, "learning_rate": 0.00022887882105433096, "loss": 0.0173, "step": 93980 }, { "epoch": 0.47, "learning_rate": 0.00022887125336131696, "loss": 0.0153, "step": 93990 }, { "epoch": 0.47, "learning_rate": 0.00022886368566830295, "loss": 0.0188, "step": 94000 }, { "epoch": 0.47, "eval_cer": 0.914481900656667, "eval_loss": 0.011606461368501186, "eval_runtime": 116.7314, "eval_samples_per_second": 17.133, "eval_steps_per_second": 4.283, "step": 94000 }, { "epoch": 0.47, "learning_rate": 0.00022885611797528893, "loss": 0.0187, "step": 94010 }, { "epoch": 0.47, "learning_rate": 0.00022884855028227494, "loss": 0.0155, "step": 94020 }, { "epoch": 0.47, "learning_rate": 0.00022884098258926092, "loss": 0.014, "step": 94030 }, { "epoch": 0.47, "learning_rate": 0.0002288334148962469, "loss": 0.0193, "step": 94040 }, { "epoch": 0.47, "learning_rate": 0.00022882584720323288, "loss": 0.0132, "step": 94050 }, { "epoch": 0.47, "learning_rate": 0.0002288182795102189, "loss": 0.0186, "step": 94060 }, { "epoch": 0.47, "learning_rate": 0.00022881071181720487, "loss": 0.0152, "step": 94070 }, { "epoch": 0.47, "learning_rate": 0.00022880314412419085, "loss": 0.0158, "step": 94080 }, { "epoch": 0.47, "learning_rate": 0.00022879557643117686, "loss": 0.0151, "step": 94090 }, { "epoch": 0.47, "learning_rate": 0.00022878800873816284, "loss": 0.0186, "step": 94100 }, { "epoch": 0.47, "learning_rate": 0.00022878044104514882, "loss": 0.0133, "step": 94110 }, { "epoch": 0.47, "learning_rate": 0.00022877287335213483, "loss": 0.0187, "step": 94120 }, { "epoch": 0.47, "learning_rate": 0.0002287653056591208, "loss": 0.0217, "step": 94130 }, { "epoch": 0.47, "learning_rate": 0.0002287577379661068, "loss": 0.0153, "step": 94140 }, { "epoch": 0.47, "learning_rate": 0.0002287501702730928, "loss": 0.0171, "step": 94150 }, { "epoch": 0.48, "learning_rate": 0.00022874260258007878, "loss": 0.0178, "step": 94160 }, { "epoch": 0.48, "learning_rate": 0.00022873503488706477, "loss": 0.0148, "step": 94170 }, { "epoch": 0.48, "learning_rate": 0.00022872746719405077, "loss": 0.0225, "step": 94180 }, { "epoch": 0.48, "learning_rate": 0.00022871989950103676, "loss": 0.0164, "step": 94190 }, { "epoch": 0.48, "learning_rate": 0.00022871233180802274, "loss": 0.0153, "step": 94200 }, { "epoch": 0.48, "learning_rate": 0.00022870476411500872, "loss": 0.014, "step": 94210 }, { "epoch": 0.48, "learning_rate": 0.00022869719642199473, "loss": 0.0184, "step": 94220 }, { "epoch": 0.48, "learning_rate": 0.0002286896287289807, "loss": 0.0149, "step": 94230 }, { "epoch": 0.48, "learning_rate": 0.0002286820610359667, "loss": 0.0145, "step": 94240 }, { "epoch": 0.48, "learning_rate": 0.0002286744933429527, "loss": 0.0138, "step": 94250 }, { "epoch": 0.48, "learning_rate": 0.00022866692564993868, "loss": 0.0158, "step": 94260 }, { "epoch": 0.48, "learning_rate": 0.00022865935795692466, "loss": 0.0149, "step": 94270 }, { "epoch": 0.48, "learning_rate": 0.00022865179026391067, "loss": 0.0147, "step": 94280 }, { "epoch": 0.48, "learning_rate": 0.00022864422257089665, "loss": 0.0195, "step": 94290 }, { "epoch": 0.48, "learning_rate": 0.00022863665487788263, "loss": 0.0234, "step": 94300 }, { "epoch": 0.48, "learning_rate": 0.00022862908718486864, "loss": 0.019, "step": 94310 }, { "epoch": 0.48, "learning_rate": 0.00022862151949185462, "loss": 0.0175, "step": 94320 }, { "epoch": 0.48, "learning_rate": 0.0002286139517988406, "loss": 0.0148, "step": 94330 }, { "epoch": 0.48, "learning_rate": 0.0002286063841058266, "loss": 0.017, "step": 94340 }, { "epoch": 0.48, "learning_rate": 0.0002285988164128126, "loss": 0.0187, "step": 94350 }, { "epoch": 0.48, "learning_rate": 0.00022859124871979858, "loss": 0.0143, "step": 94360 }, { "epoch": 0.48, "learning_rate": 0.00022858368102678458, "loss": 0.017, "step": 94370 }, { "epoch": 0.48, "learning_rate": 0.00022857611333377057, "loss": 0.0137, "step": 94380 }, { "epoch": 0.48, "learning_rate": 0.00022856854564075655, "loss": 0.015, "step": 94390 }, { "epoch": 0.48, "learning_rate": 0.00022856097794774253, "loss": 0.0181, "step": 94400 }, { "epoch": 0.48, "learning_rate": 0.00022855341025472854, "loss": 0.0182, "step": 94410 }, { "epoch": 0.48, "learning_rate": 0.00022854584256171452, "loss": 0.0202, "step": 94420 }, { "epoch": 0.48, "learning_rate": 0.0002285382748687005, "loss": 0.0156, "step": 94430 }, { "epoch": 0.48, "learning_rate": 0.0002285307071756865, "loss": 0.0179, "step": 94440 }, { "epoch": 0.48, "learning_rate": 0.0002285231394826725, "loss": 0.0136, "step": 94450 }, { "epoch": 0.48, "learning_rate": 0.00022851557178965847, "loss": 0.0125, "step": 94460 }, { "epoch": 0.48, "learning_rate": 0.00022850800409664448, "loss": 0.0137, "step": 94470 }, { "epoch": 0.48, "learning_rate": 0.00022850043640363046, "loss": 0.0142, "step": 94480 }, { "epoch": 0.48, "learning_rate": 0.00022849286871061644, "loss": 0.0159, "step": 94490 }, { "epoch": 0.48, "learning_rate": 0.00022848530101760245, "loss": 0.0142, "step": 94500 }, { "epoch": 0.48, "learning_rate": 0.00022847773332458843, "loss": 0.0142, "step": 94510 }, { "epoch": 0.48, "learning_rate": 0.00022847016563157441, "loss": 0.0151, "step": 94520 }, { "epoch": 0.48, "learning_rate": 0.00022846259793856042, "loss": 0.0179, "step": 94530 }, { "epoch": 0.48, "learning_rate": 0.0002284550302455464, "loss": 0.0167, "step": 94540 }, { "epoch": 0.48, "learning_rate": 0.00022844746255253239, "loss": 0.0168, "step": 94550 }, { "epoch": 0.48, "learning_rate": 0.00022843989485951837, "loss": 0.0119, "step": 94560 }, { "epoch": 0.48, "learning_rate": 0.00022843232716650438, "loss": 0.0192, "step": 94570 }, { "epoch": 0.48, "learning_rate": 0.00022842475947349036, "loss": 0.0196, "step": 94580 }, { "epoch": 0.48, "learning_rate": 0.00022841719178047634, "loss": 0.0153, "step": 94590 }, { "epoch": 0.48, "learning_rate": 0.00022840962408746235, "loss": 0.0139, "step": 94600 }, { "epoch": 0.48, "learning_rate": 0.00022840205639444833, "loss": 0.0147, "step": 94610 }, { "epoch": 0.48, "learning_rate": 0.0002283944887014343, "loss": 0.0126, "step": 94620 }, { "epoch": 0.48, "learning_rate": 0.00022838692100842032, "loss": 0.0158, "step": 94630 }, { "epoch": 0.48, "learning_rate": 0.0002283793533154063, "loss": 0.0156, "step": 94640 }, { "epoch": 0.48, "learning_rate": 0.00022837178562239228, "loss": 0.0156, "step": 94650 }, { "epoch": 0.48, "learning_rate": 0.0002283642179293783, "loss": 0.0148, "step": 94660 }, { "epoch": 0.48, "learning_rate": 0.00022835665023636427, "loss": 0.0146, "step": 94670 }, { "epoch": 0.48, "learning_rate": 0.00022834908254335025, "loss": 0.0193, "step": 94680 }, { "epoch": 0.48, "learning_rate": 0.00022834151485033626, "loss": 0.019, "step": 94690 }, { "epoch": 0.48, "learning_rate": 0.00022833394715732224, "loss": 0.0185, "step": 94700 }, { "epoch": 0.48, "learning_rate": 0.00022832637946430822, "loss": 0.0194, "step": 94710 }, { "epoch": 0.48, "learning_rate": 0.0002283188117712942, "loss": 0.0153, "step": 94720 }, { "epoch": 0.48, "learning_rate": 0.00022831124407828021, "loss": 0.0188, "step": 94730 }, { "epoch": 0.48, "learning_rate": 0.0002283036763852662, "loss": 0.0141, "step": 94740 }, { "epoch": 0.48, "learning_rate": 0.00022829610869225218, "loss": 0.0192, "step": 94750 }, { "epoch": 0.48, "learning_rate": 0.00022828854099923819, "loss": 0.0184, "step": 94760 }, { "epoch": 0.48, "learning_rate": 0.00022828097330622417, "loss": 0.0151, "step": 94770 }, { "epoch": 0.48, "learning_rate": 0.00022827340561321015, "loss": 0.015, "step": 94780 }, { "epoch": 0.48, "learning_rate": 0.00022826583792019616, "loss": 0.0161, "step": 94790 }, { "epoch": 0.48, "learning_rate": 0.00022825827022718214, "loss": 0.0218, "step": 94800 }, { "epoch": 0.48, "learning_rate": 0.00022825070253416812, "loss": 0.0139, "step": 94810 }, { "epoch": 0.48, "learning_rate": 0.00022824313484115413, "loss": 0.0153, "step": 94820 }, { "epoch": 0.48, "learning_rate": 0.0002282355671481401, "loss": 0.015, "step": 94830 }, { "epoch": 0.48, "learning_rate": 0.0002282279994551261, "loss": 0.0205, "step": 94840 }, { "epoch": 0.48, "learning_rate": 0.0002282204317621121, "loss": 0.012, "step": 94850 }, { "epoch": 0.48, "learning_rate": 0.00022821286406909808, "loss": 0.0166, "step": 94860 }, { "epoch": 0.48, "learning_rate": 0.00022820529637608406, "loss": 0.0121, "step": 94870 }, { "epoch": 0.48, "learning_rate": 0.00022819772868307007, "loss": 0.014, "step": 94880 }, { "epoch": 0.48, "learning_rate": 0.00022819016099005605, "loss": 0.0148, "step": 94890 }, { "epoch": 0.48, "learning_rate": 0.000228182593297042, "loss": 0.0174, "step": 94900 }, { "epoch": 0.48, "learning_rate": 0.000228175025604028, "loss": 0.0202, "step": 94910 }, { "epoch": 0.48, "learning_rate": 0.000228167457911014, "loss": 0.0141, "step": 94920 }, { "epoch": 0.48, "learning_rate": 0.00022815989021799998, "loss": 0.015, "step": 94930 }, { "epoch": 0.48, "learning_rate": 0.00022815232252498596, "loss": 0.0167, "step": 94940 }, { "epoch": 0.48, "learning_rate": 0.00022814475483197194, "loss": 0.0169, "step": 94950 }, { "epoch": 0.48, "learning_rate": 0.00022813718713895795, "loss": 0.0167, "step": 94960 }, { "epoch": 0.48, "learning_rate": 0.00022812961944594393, "loss": 0.0165, "step": 94970 }, { "epoch": 0.48, "learning_rate": 0.0002281220517529299, "loss": 0.0185, "step": 94980 }, { "epoch": 0.48, "learning_rate": 0.00022811448405991592, "loss": 0.0203, "step": 94990 }, { "epoch": 0.48, "learning_rate": 0.0002281069163669019, "loss": 0.0173, "step": 95000 }, { "epoch": 0.48, "eval_cer": 0.9144848118450433, "eval_loss": 0.012143060564994812, "eval_runtime": 116.8022, "eval_samples_per_second": 17.123, "eval_steps_per_second": 4.281, "step": 95000 }, { "epoch": 0.48, "learning_rate": 0.00022809934867388788, "loss": 0.0176, "step": 95010 }, { "epoch": 0.48, "learning_rate": 0.0002280917809808739, "loss": 0.014, "step": 95020 }, { "epoch": 0.48, "learning_rate": 0.00022808421328785987, "loss": 0.0155, "step": 95030 }, { "epoch": 0.48, "learning_rate": 0.00022807664559484586, "loss": 0.0143, "step": 95040 }, { "epoch": 0.48, "learning_rate": 0.00022806907790183186, "loss": 0.015, "step": 95050 }, { "epoch": 0.48, "learning_rate": 0.00022806151020881785, "loss": 0.0133, "step": 95060 }, { "epoch": 0.48, "learning_rate": 0.00022805394251580383, "loss": 0.0157, "step": 95070 }, { "epoch": 0.48, "learning_rate": 0.00022804637482278984, "loss": 0.0126, "step": 95080 }, { "epoch": 0.48, "learning_rate": 0.00022803880712977582, "loss": 0.0153, "step": 95090 }, { "epoch": 0.48, "learning_rate": 0.0002280312394367618, "loss": 0.0156, "step": 95100 }, { "epoch": 0.48, "learning_rate": 0.00022802367174374778, "loss": 0.0134, "step": 95110 }, { "epoch": 0.48, "learning_rate": 0.0002280161040507338, "loss": 0.0182, "step": 95120 }, { "epoch": 0.48, "learning_rate": 0.00022800853635771977, "loss": 0.0154, "step": 95130 }, { "epoch": 0.48, "learning_rate": 0.00022800096866470575, "loss": 0.0159, "step": 95140 }, { "epoch": 0.48, "learning_rate": 0.00022799340097169176, "loss": 0.0168, "step": 95150 }, { "epoch": 0.48, "learning_rate": 0.00022798583327867774, "loss": 0.015, "step": 95160 }, { "epoch": 0.48, "learning_rate": 0.00022797826558566372, "loss": 0.0139, "step": 95170 }, { "epoch": 0.48, "learning_rate": 0.00022797069789264973, "loss": 0.0164, "step": 95180 }, { "epoch": 0.48, "learning_rate": 0.0002279631301996357, "loss": 0.018, "step": 95190 }, { "epoch": 0.48, "learning_rate": 0.0002279555625066217, "loss": 0.0143, "step": 95200 }, { "epoch": 0.48, "learning_rate": 0.0002279479948136077, "loss": 0.0156, "step": 95210 }, { "epoch": 0.48, "learning_rate": 0.00022794042712059368, "loss": 0.0145, "step": 95220 }, { "epoch": 0.48, "learning_rate": 0.00022793285942757967, "loss": 0.0156, "step": 95230 }, { "epoch": 0.48, "learning_rate": 0.00022792529173456567, "loss": 0.0157, "step": 95240 }, { "epoch": 0.48, "learning_rate": 0.00022791772404155166, "loss": 0.0172, "step": 95250 }, { "epoch": 0.48, "learning_rate": 0.00022791015634853764, "loss": 0.0164, "step": 95260 }, { "epoch": 0.48, "learning_rate": 0.00022790258865552365, "loss": 0.0146, "step": 95270 }, { "epoch": 0.48, "learning_rate": 0.00022789502096250963, "loss": 0.0165, "step": 95280 }, { "epoch": 0.48, "learning_rate": 0.0002278874532694956, "loss": 0.0332, "step": 95290 }, { "epoch": 0.48, "learning_rate": 0.0002278798855764816, "loss": 0.0154, "step": 95300 }, { "epoch": 0.48, "learning_rate": 0.0002278723178834676, "loss": 0.0166, "step": 95310 }, { "epoch": 0.48, "learning_rate": 0.00022786475019045358, "loss": 0.0529, "step": 95320 }, { "epoch": 0.48, "learning_rate": 0.00022785718249743956, "loss": 0.0173, "step": 95330 }, { "epoch": 0.48, "learning_rate": 0.00022784961480442557, "loss": 0.0187, "step": 95340 }, { "epoch": 0.48, "learning_rate": 0.00022784204711141155, "loss": 0.0175, "step": 95350 }, { "epoch": 0.48, "learning_rate": 0.00022783447941839753, "loss": 0.0157, "step": 95360 }, { "epoch": 0.48, "learning_rate": 0.00022782691172538354, "loss": 0.0186, "step": 95370 }, { "epoch": 0.48, "learning_rate": 0.00022781934403236952, "loss": 0.0187, "step": 95380 }, { "epoch": 0.48, "learning_rate": 0.0002278117763393555, "loss": 0.0146, "step": 95390 }, { "epoch": 0.48, "learning_rate": 0.0002278042086463415, "loss": 0.017, "step": 95400 }, { "epoch": 0.48, "learning_rate": 0.0002277966409533275, "loss": 0.0155, "step": 95410 }, { "epoch": 0.48, "learning_rate": 0.00022778907326031348, "loss": 0.0159, "step": 95420 }, { "epoch": 0.48, "learning_rate": 0.00022778150556729948, "loss": 0.0171, "step": 95430 }, { "epoch": 0.48, "learning_rate": 0.00022777393787428547, "loss": 0.0189, "step": 95440 }, { "epoch": 0.48, "learning_rate": 0.00022776637018127145, "loss": 0.018, "step": 95450 }, { "epoch": 0.48, "learning_rate": 0.00022775880248825743, "loss": 0.0197, "step": 95460 }, { "epoch": 0.48, "learning_rate": 0.00022775123479524344, "loss": 0.0179, "step": 95470 }, { "epoch": 0.48, "learning_rate": 0.00022774366710222942, "loss": 0.0147, "step": 95480 }, { "epoch": 0.48, "learning_rate": 0.0002277360994092154, "loss": 0.0176, "step": 95490 }, { "epoch": 0.48, "learning_rate": 0.0002277285317162014, "loss": 0.0155, "step": 95500 }, { "epoch": 0.48, "learning_rate": 0.0002277209640231874, "loss": 0.014, "step": 95510 }, { "epoch": 0.48, "learning_rate": 0.00022771339633017337, "loss": 0.019, "step": 95520 }, { "epoch": 0.48, "learning_rate": 0.00022770582863715938, "loss": 0.0147, "step": 95530 }, { "epoch": 0.48, "learning_rate": 0.00022769826094414536, "loss": 0.0153, "step": 95540 }, { "epoch": 0.48, "learning_rate": 0.00022769069325113134, "loss": 0.0166, "step": 95550 }, { "epoch": 0.48, "learning_rate": 0.00022768312555811735, "loss": 0.0147, "step": 95560 }, { "epoch": 0.48, "learning_rate": 0.00022767555786510333, "loss": 0.0152, "step": 95570 }, { "epoch": 0.48, "learning_rate": 0.00022766799017208931, "loss": 0.017, "step": 95580 }, { "epoch": 0.48, "learning_rate": 0.00022766042247907532, "loss": 0.0192, "step": 95590 }, { "epoch": 0.48, "learning_rate": 0.0002276528547860613, "loss": 0.0194, "step": 95600 }, { "epoch": 0.48, "learning_rate": 0.00022764528709304729, "loss": 0.0181, "step": 95610 }, { "epoch": 0.48, "learning_rate": 0.00022763771940003327, "loss": 0.0169, "step": 95620 }, { "epoch": 0.48, "learning_rate": 0.00022763015170701928, "loss": 0.0168, "step": 95630 }, { "epoch": 0.48, "learning_rate": 0.00022762258401400526, "loss": 0.0175, "step": 95640 }, { "epoch": 0.48, "learning_rate": 0.00022761501632099124, "loss": 0.0158, "step": 95650 }, { "epoch": 0.48, "learning_rate": 0.00022760744862797725, "loss": 0.0144, "step": 95660 }, { "epoch": 0.48, "learning_rate": 0.00022759988093496323, "loss": 0.0214, "step": 95670 }, { "epoch": 0.48, "learning_rate": 0.0002275923132419492, "loss": 0.0203, "step": 95680 }, { "epoch": 0.48, "learning_rate": 0.00022758474554893522, "loss": 0.0149, "step": 95690 }, { "epoch": 0.48, "learning_rate": 0.0002275771778559212, "loss": 0.0146, "step": 95700 }, { "epoch": 0.48, "learning_rate": 0.00022756961016290718, "loss": 0.0123, "step": 95710 }, { "epoch": 0.48, "learning_rate": 0.0002275620424698932, "loss": 0.0182, "step": 95720 }, { "epoch": 0.48, "learning_rate": 0.00022755447477687917, "loss": 0.0166, "step": 95730 }, { "epoch": 0.48, "learning_rate": 0.00022754690708386515, "loss": 0.0231, "step": 95740 }, { "epoch": 0.48, "learning_rate": 0.00022753933939085116, "loss": 0.0151, "step": 95750 }, { "epoch": 0.48, "learning_rate": 0.00022753177169783714, "loss": 0.018, "step": 95760 }, { "epoch": 0.48, "learning_rate": 0.00022752420400482312, "loss": 0.0167, "step": 95770 }, { "epoch": 0.48, "learning_rate": 0.00022751663631180913, "loss": 0.017, "step": 95780 }, { "epoch": 0.48, "learning_rate": 0.00022750906861879511, "loss": 0.0186, "step": 95790 }, { "epoch": 0.48, "learning_rate": 0.0002275015009257811, "loss": 0.017, "step": 95800 }, { "epoch": 0.48, "learning_rate": 0.00022749393323276708, "loss": 0.0172, "step": 95810 }, { "epoch": 0.48, "learning_rate": 0.00022748636553975309, "loss": 0.0189, "step": 95820 }, { "epoch": 0.48, "learning_rate": 0.00022747879784673907, "loss": 0.018, "step": 95830 }, { "epoch": 0.48, "learning_rate": 0.00022747123015372505, "loss": 0.0173, "step": 95840 }, { "epoch": 0.48, "learning_rate": 0.00022746366246071106, "loss": 0.0138, "step": 95850 }, { "epoch": 0.48, "learning_rate": 0.00022745609476769704, "loss": 0.0167, "step": 95860 }, { "epoch": 0.48, "learning_rate": 0.00022744852707468302, "loss": 0.0192, "step": 95870 }, { "epoch": 0.48, "learning_rate": 0.00022744095938166903, "loss": 0.0165, "step": 95880 }, { "epoch": 0.48, "learning_rate": 0.000227433391688655, "loss": 0.0162, "step": 95890 }, { "epoch": 0.48, "learning_rate": 0.000227425823995641, "loss": 0.0163, "step": 95900 }, { "epoch": 0.48, "learning_rate": 0.000227418256302627, "loss": 0.0139, "step": 95910 }, { "epoch": 0.48, "learning_rate": 0.00022741068860961298, "loss": 0.0175, "step": 95920 }, { "epoch": 0.48, "learning_rate": 0.00022740312091659896, "loss": 0.0179, "step": 95930 }, { "epoch": 0.48, "learning_rate": 0.00022739555322358497, "loss": 0.0145, "step": 95940 }, { "epoch": 0.48, "learning_rate": 0.00022738798553057095, "loss": 0.0156, "step": 95950 }, { "epoch": 0.48, "learning_rate": 0.00022738041783755693, "loss": 0.0186, "step": 95960 }, { "epoch": 0.48, "learning_rate": 0.00022737285014454292, "loss": 0.0191, "step": 95970 }, { "epoch": 0.48, "learning_rate": 0.00022736528245152892, "loss": 0.0161, "step": 95980 }, { "epoch": 0.48, "learning_rate": 0.0002273577147585149, "loss": 0.0155, "step": 95990 }, { "epoch": 0.48, "learning_rate": 0.0002273501470655009, "loss": 0.0244, "step": 96000 }, { "epoch": 0.48, "eval_cer": 0.9144906342217957, "eval_loss": 0.011497566476464272, "eval_runtime": 116.7865, "eval_samples_per_second": 17.125, "eval_steps_per_second": 4.281, "step": 96000 }, { "epoch": 0.48, "learning_rate": 0.0002273425793724869, "loss": 0.0185, "step": 96010 }, { "epoch": 0.48, "learning_rate": 0.00022733501167947288, "loss": 0.0161, "step": 96020 }, { "epoch": 0.48, "learning_rate": 0.00022732744398645886, "loss": 0.0142, "step": 96030 }, { "epoch": 0.48, "learning_rate": 0.00022731987629344487, "loss": 0.0165, "step": 96040 }, { "epoch": 0.48, "learning_rate": 0.00022731230860043085, "loss": 0.0148, "step": 96050 }, { "epoch": 0.48, "learning_rate": 0.00022730474090741683, "loss": 0.0147, "step": 96060 }, { "epoch": 0.48, "learning_rate": 0.00022729717321440284, "loss": 0.0204, "step": 96070 }, { "epoch": 0.48, "learning_rate": 0.00022728960552138882, "loss": 0.0153, "step": 96080 }, { "epoch": 0.48, "learning_rate": 0.0002272820378283748, "loss": 0.0146, "step": 96090 }, { "epoch": 0.48, "learning_rate": 0.0002272744701353608, "loss": 0.0183, "step": 96100 }, { "epoch": 0.48, "learning_rate": 0.0002272669024423468, "loss": 0.0193, "step": 96110 }, { "epoch": 0.48, "learning_rate": 0.00022725933474933277, "loss": 0.0197, "step": 96120 }, { "epoch": 0.48, "learning_rate": 0.00022725176705631875, "loss": 0.0213, "step": 96130 }, { "epoch": 0.49, "learning_rate": 0.00022724419936330476, "loss": 0.015, "step": 96140 }, { "epoch": 0.49, "learning_rate": 0.00022723663167029074, "loss": 0.0164, "step": 96150 }, { "epoch": 0.49, "learning_rate": 0.0002272290639772767, "loss": 0.0148, "step": 96160 }, { "epoch": 0.49, "learning_rate": 0.0002272214962842627, "loss": 0.0158, "step": 96170 }, { "epoch": 0.49, "learning_rate": 0.0002272139285912487, "loss": 0.0164, "step": 96180 }, { "epoch": 0.49, "learning_rate": 0.00022720636089823467, "loss": 0.0181, "step": 96190 }, { "epoch": 0.49, "learning_rate": 0.00022719879320522065, "loss": 0.0146, "step": 96200 }, { "epoch": 0.49, "learning_rate": 0.00022719122551220666, "loss": 0.0146, "step": 96210 }, { "epoch": 0.49, "learning_rate": 0.00022718365781919264, "loss": 0.0197, "step": 96220 }, { "epoch": 0.49, "learning_rate": 0.00022717609012617862, "loss": 0.0201, "step": 96230 }, { "epoch": 0.49, "learning_rate": 0.00022716852243316463, "loss": 0.0176, "step": 96240 }, { "epoch": 0.49, "learning_rate": 0.0002271609547401506, "loss": 0.017, "step": 96250 }, { "epoch": 0.49, "learning_rate": 0.0002271533870471366, "loss": 0.0186, "step": 96260 }, { "epoch": 0.49, "learning_rate": 0.0002271458193541226, "loss": 0.0141, "step": 96270 }, { "epoch": 0.49, "learning_rate": 0.00022713825166110858, "loss": 0.0153, "step": 96280 }, { "epoch": 0.49, "learning_rate": 0.00022713068396809457, "loss": 0.0153, "step": 96290 }, { "epoch": 0.49, "learning_rate": 0.00022712311627508057, "loss": 0.013, "step": 96300 }, { "epoch": 0.49, "learning_rate": 0.00022711554858206656, "loss": 0.0132, "step": 96310 }, { "epoch": 0.49, "learning_rate": 0.00022710798088905254, "loss": 0.0177, "step": 96320 }, { "epoch": 0.49, "learning_rate": 0.00022710041319603855, "loss": 0.017, "step": 96330 }, { "epoch": 0.49, "learning_rate": 0.00022709284550302453, "loss": 0.0189, "step": 96340 }, { "epoch": 0.49, "learning_rate": 0.0002270852778100105, "loss": 0.0149, "step": 96350 }, { "epoch": 0.49, "learning_rate": 0.0002270777101169965, "loss": 0.0176, "step": 96360 }, { "epoch": 0.49, "learning_rate": 0.0002270701424239825, "loss": 0.0188, "step": 96370 }, { "epoch": 0.49, "learning_rate": 0.00022706257473096848, "loss": 0.0173, "step": 96380 }, { "epoch": 0.49, "learning_rate": 0.00022705500703795446, "loss": 0.016, "step": 96390 }, { "epoch": 0.49, "learning_rate": 0.00022704743934494047, "loss": 0.0153, "step": 96400 }, { "epoch": 0.49, "learning_rate": 0.00022703987165192645, "loss": 0.0158, "step": 96410 }, { "epoch": 0.49, "learning_rate": 0.00022703230395891243, "loss": 0.0153, "step": 96420 }, { "epoch": 0.49, "learning_rate": 0.00022702473626589844, "loss": 0.0166, "step": 96430 }, { "epoch": 0.49, "learning_rate": 0.00022701716857288442, "loss": 0.0172, "step": 96440 }, { "epoch": 0.49, "learning_rate": 0.0002270096008798704, "loss": 0.0163, "step": 96450 }, { "epoch": 0.49, "learning_rate": 0.0002270020331868564, "loss": 0.0169, "step": 96460 }, { "epoch": 0.49, "learning_rate": 0.0002269944654938424, "loss": 0.0123, "step": 96470 }, { "epoch": 0.49, "learning_rate": 0.00022698689780082838, "loss": 0.0148, "step": 96480 }, { "epoch": 0.49, "learning_rate": 0.00022697933010781438, "loss": 0.0138, "step": 96490 }, { "epoch": 0.49, "learning_rate": 0.00022697176241480037, "loss": 0.0142, "step": 96500 }, { "epoch": 0.49, "learning_rate": 0.00022696419472178635, "loss": 0.0183, "step": 96510 }, { "epoch": 0.49, "learning_rate": 0.00022695662702877233, "loss": 0.0156, "step": 96520 }, { "epoch": 0.49, "learning_rate": 0.00022694905933575834, "loss": 0.0164, "step": 96530 }, { "epoch": 0.49, "learning_rate": 0.00022694149164274432, "loss": 0.0202, "step": 96540 }, { "epoch": 0.49, "learning_rate": 0.0002269339239497303, "loss": 0.0155, "step": 96550 }, { "epoch": 0.49, "learning_rate": 0.0002269263562567163, "loss": 0.0146, "step": 96560 }, { "epoch": 0.49, "learning_rate": 0.0002269187885637023, "loss": 0.0142, "step": 96570 }, { "epoch": 0.49, "learning_rate": 0.00022691122087068827, "loss": 0.0137, "step": 96580 }, { "epoch": 0.49, "learning_rate": 0.00022690365317767428, "loss": 0.0171, "step": 96590 }, { "epoch": 0.49, "learning_rate": 0.00022689608548466026, "loss": 0.0173, "step": 96600 }, { "epoch": 0.49, "learning_rate": 0.00022688851779164624, "loss": 0.0161, "step": 96610 }, { "epoch": 0.49, "learning_rate": 0.00022688095009863225, "loss": 0.0156, "step": 96620 }, { "epoch": 0.49, "learning_rate": 0.00022687338240561823, "loss": 0.0162, "step": 96630 }, { "epoch": 0.49, "learning_rate": 0.00022686581471260421, "loss": 0.0169, "step": 96640 }, { "epoch": 0.49, "learning_rate": 0.00022685824701959022, "loss": 0.0116, "step": 96650 }, { "epoch": 0.49, "learning_rate": 0.0002268506793265762, "loss": 0.0159, "step": 96660 }, { "epoch": 0.49, "learning_rate": 0.00022684311163356219, "loss": 0.014, "step": 96670 }, { "epoch": 0.49, "learning_rate": 0.0002268355439405482, "loss": 0.0166, "step": 96680 }, { "epoch": 0.49, "learning_rate": 0.00022682797624753418, "loss": 0.0157, "step": 96690 }, { "epoch": 0.49, "learning_rate": 0.00022682040855452016, "loss": 0.0149, "step": 96700 }, { "epoch": 0.49, "learning_rate": 0.00022681284086150614, "loss": 0.0144, "step": 96710 }, { "epoch": 0.49, "learning_rate": 0.00022680527316849215, "loss": 0.0157, "step": 96720 }, { "epoch": 0.49, "learning_rate": 0.00022679770547547813, "loss": 0.0143, "step": 96730 }, { "epoch": 0.49, "learning_rate": 0.0002267901377824641, "loss": 0.0199, "step": 96740 }, { "epoch": 0.49, "learning_rate": 0.00022678257008945012, "loss": 0.0149, "step": 96750 }, { "epoch": 0.49, "learning_rate": 0.0002267750023964361, "loss": 0.0136, "step": 96760 }, { "epoch": 0.49, "learning_rate": 0.00022676743470342208, "loss": 0.0176, "step": 96770 }, { "epoch": 0.49, "learning_rate": 0.0002267598670104081, "loss": 0.0144, "step": 96780 }, { "epoch": 0.49, "learning_rate": 0.00022675229931739407, "loss": 0.0163, "step": 96790 }, { "epoch": 0.49, "learning_rate": 0.00022674473162438005, "loss": 0.0152, "step": 96800 }, { "epoch": 0.49, "learning_rate": 0.00022673716393136606, "loss": 0.0138, "step": 96810 }, { "epoch": 0.49, "learning_rate": 0.00022672959623835204, "loss": 0.0171, "step": 96820 }, { "epoch": 0.49, "learning_rate": 0.00022672202854533802, "loss": 0.0184, "step": 96830 }, { "epoch": 0.49, "learning_rate": 0.00022671446085232403, "loss": 0.0129, "step": 96840 }, { "epoch": 0.49, "learning_rate": 0.00022670689315931001, "loss": 0.0134, "step": 96850 }, { "epoch": 0.49, "learning_rate": 0.000226699325466296, "loss": 0.0167, "step": 96860 }, { "epoch": 0.49, "learning_rate": 0.00022669175777328198, "loss": 0.0128, "step": 96870 }, { "epoch": 0.49, "learning_rate": 0.00022668419008026799, "loss": 0.0195, "step": 96880 }, { "epoch": 0.49, "learning_rate": 0.00022667662238725397, "loss": 0.0161, "step": 96890 }, { "epoch": 0.49, "learning_rate": 0.00022666905469423995, "loss": 0.0183, "step": 96900 }, { "epoch": 0.49, "learning_rate": 0.00022666148700122596, "loss": 0.0137, "step": 96910 }, { "epoch": 0.49, "learning_rate": 0.00022665391930821194, "loss": 0.0152, "step": 96920 }, { "epoch": 0.49, "learning_rate": 0.00022664635161519792, "loss": 0.016, "step": 96930 }, { "epoch": 0.49, "learning_rate": 0.00022663878392218393, "loss": 0.015, "step": 96940 }, { "epoch": 0.49, "learning_rate": 0.0002266312162291699, "loss": 0.0149, "step": 96950 }, { "epoch": 0.49, "learning_rate": 0.0002266236485361559, "loss": 0.0227, "step": 96960 }, { "epoch": 0.49, "learning_rate": 0.0002266160808431419, "loss": 0.0148, "step": 96970 }, { "epoch": 0.49, "learning_rate": 0.00022660851315012788, "loss": 0.0175, "step": 96980 }, { "epoch": 0.49, "learning_rate": 0.00022660094545711386, "loss": 0.015, "step": 96990 }, { "epoch": 0.49, "learning_rate": 0.00022659337776409987, "loss": 0.0174, "step": 97000 }, { "epoch": 0.49, "eval_cer": 0.9144644335264098, "eval_loss": 0.011374830268323421, "eval_runtime": 116.7311, "eval_samples_per_second": 17.133, "eval_steps_per_second": 4.283, "step": 97000 }, { "epoch": 0.49, "learning_rate": 0.00022658581007108585, "loss": 0.015, "step": 97010 }, { "epoch": 0.49, "learning_rate": 0.00022657824237807183, "loss": 0.015, "step": 97020 }, { "epoch": 0.49, "learning_rate": 0.00022657067468505782, "loss": 0.0158, "step": 97030 }, { "epoch": 0.49, "learning_rate": 0.00022656310699204382, "loss": 0.0217, "step": 97040 }, { "epoch": 0.49, "learning_rate": 0.0002265555392990298, "loss": 0.0149, "step": 97050 }, { "epoch": 0.49, "learning_rate": 0.0002265479716060158, "loss": 0.0156, "step": 97060 }, { "epoch": 0.49, "learning_rate": 0.0002265404039130018, "loss": 0.0147, "step": 97070 }, { "epoch": 0.49, "learning_rate": 0.00022653283621998778, "loss": 0.0138, "step": 97080 }, { "epoch": 0.49, "learning_rate": 0.00022652526852697376, "loss": 0.0137, "step": 97090 }, { "epoch": 0.49, "learning_rate": 0.00022651770083395977, "loss": 0.0159, "step": 97100 }, { "epoch": 0.49, "learning_rate": 0.00022651013314094575, "loss": 0.0136, "step": 97110 }, { "epoch": 0.49, "learning_rate": 0.00022650256544793173, "loss": 0.0191, "step": 97120 }, { "epoch": 0.49, "learning_rate": 0.00022649499775491774, "loss": 0.0144, "step": 97130 }, { "epoch": 0.49, "learning_rate": 0.00022648743006190372, "loss": 0.0108, "step": 97140 }, { "epoch": 0.49, "learning_rate": 0.0002264798623688897, "loss": 0.0161, "step": 97150 }, { "epoch": 0.49, "learning_rate": 0.0002264722946758757, "loss": 0.0153, "step": 97160 }, { "epoch": 0.49, "learning_rate": 0.0002264647269828617, "loss": 0.0145, "step": 97170 }, { "epoch": 0.49, "learning_rate": 0.00022645715928984767, "loss": 0.0152, "step": 97180 }, { "epoch": 0.49, "learning_rate": 0.00022644959159683365, "loss": 0.0168, "step": 97190 }, { "epoch": 0.49, "learning_rate": 0.00022644202390381966, "loss": 0.0151, "step": 97200 }, { "epoch": 0.49, "learning_rate": 0.00022643445621080564, "loss": 0.014, "step": 97210 }, { "epoch": 0.49, "learning_rate": 0.00022642688851779163, "loss": 0.0143, "step": 97220 }, { "epoch": 0.49, "learning_rate": 0.00022641932082477763, "loss": 0.0146, "step": 97230 }, { "epoch": 0.49, "learning_rate": 0.00022641175313176362, "loss": 0.0161, "step": 97240 }, { "epoch": 0.49, "learning_rate": 0.0002264041854387496, "loss": 0.0166, "step": 97250 }, { "epoch": 0.49, "learning_rate": 0.0002263966177457356, "loss": 0.0162, "step": 97260 }, { "epoch": 0.49, "learning_rate": 0.0002263890500527216, "loss": 0.0173, "step": 97270 }, { "epoch": 0.49, "learning_rate": 0.00022638148235970757, "loss": 0.0171, "step": 97280 }, { "epoch": 0.49, "learning_rate": 0.00022637391466669358, "loss": 0.0161, "step": 97290 }, { "epoch": 0.49, "learning_rate": 0.00022636634697367956, "loss": 0.0176, "step": 97300 }, { "epoch": 0.49, "learning_rate": 0.00022635877928066554, "loss": 0.0161, "step": 97310 }, { "epoch": 0.49, "learning_rate": 0.00022635121158765155, "loss": 0.0192, "step": 97320 }, { "epoch": 0.49, "learning_rate": 0.00022634364389463753, "loss": 0.016, "step": 97330 }, { "epoch": 0.49, "learning_rate": 0.0002263360762016235, "loss": 0.0149, "step": 97340 }, { "epoch": 0.49, "learning_rate": 0.00022632850850860952, "loss": 0.0205, "step": 97350 }, { "epoch": 0.49, "learning_rate": 0.0002263209408155955, "loss": 0.0146, "step": 97360 }, { "epoch": 0.49, "learning_rate": 0.00022631337312258148, "loss": 0.0188, "step": 97370 }, { "epoch": 0.49, "learning_rate": 0.00022630580542956746, "loss": 0.0165, "step": 97380 }, { "epoch": 0.49, "learning_rate": 0.00022629823773655347, "loss": 0.0168, "step": 97390 }, { "epoch": 0.49, "learning_rate": 0.00022629067004353945, "loss": 0.0132, "step": 97400 }, { "epoch": 0.49, "learning_rate": 0.0002262831023505254, "loss": 0.0175, "step": 97410 }, { "epoch": 0.49, "learning_rate": 0.0002262755346575114, "loss": 0.0175, "step": 97420 }, { "epoch": 0.49, "learning_rate": 0.0002262679669644974, "loss": 0.0176, "step": 97430 }, { "epoch": 0.49, "learning_rate": 0.00022626039927148338, "loss": 0.0171, "step": 97440 }, { "epoch": 0.49, "learning_rate": 0.00022625283157846936, "loss": 0.0173, "step": 97450 }, { "epoch": 0.49, "learning_rate": 0.00022624526388545537, "loss": 0.0154, "step": 97460 }, { "epoch": 0.49, "learning_rate": 0.00022623769619244135, "loss": 0.0131, "step": 97470 }, { "epoch": 0.49, "learning_rate": 0.00022623012849942733, "loss": 0.0161, "step": 97480 }, { "epoch": 0.49, "learning_rate": 0.00022622256080641334, "loss": 0.0154, "step": 97490 }, { "epoch": 0.49, "learning_rate": 0.00022621499311339932, "loss": 0.0146, "step": 97500 }, { "epoch": 0.49, "learning_rate": 0.0002262074254203853, "loss": 0.0161, "step": 97510 }, { "epoch": 0.49, "learning_rate": 0.0002261998577273713, "loss": 0.0156, "step": 97520 }, { "epoch": 0.49, "learning_rate": 0.0002261922900343573, "loss": 0.0162, "step": 97530 }, { "epoch": 0.49, "learning_rate": 0.00022618472234134328, "loss": 0.0156, "step": 97540 }, { "epoch": 0.49, "learning_rate": 0.00022617715464832928, "loss": 0.0154, "step": 97550 }, { "epoch": 0.49, "learning_rate": 0.00022616958695531527, "loss": 0.0147, "step": 97560 }, { "epoch": 0.49, "learning_rate": 0.00022616201926230125, "loss": 0.0186, "step": 97570 }, { "epoch": 0.49, "learning_rate": 0.00022615445156928726, "loss": 0.0147, "step": 97580 }, { "epoch": 0.49, "learning_rate": 0.00022614688387627324, "loss": 0.0153, "step": 97590 }, { "epoch": 0.49, "learning_rate": 0.00022613931618325922, "loss": 0.0165, "step": 97600 }, { "epoch": 0.49, "learning_rate": 0.0002261317484902452, "loss": 0.0112, "step": 97610 }, { "epoch": 0.49, "learning_rate": 0.0002261241807972312, "loss": 0.014, "step": 97620 }, { "epoch": 0.49, "learning_rate": 0.0002261166131042172, "loss": 0.015, "step": 97630 }, { "epoch": 0.49, "learning_rate": 0.00022610904541120317, "loss": 0.0125, "step": 97640 }, { "epoch": 0.49, "learning_rate": 0.00022610147771818918, "loss": 0.0181, "step": 97650 }, { "epoch": 0.49, "learning_rate": 0.00022609391002517516, "loss": 0.0149, "step": 97660 }, { "epoch": 0.49, "learning_rate": 0.00022608634233216114, "loss": 0.0154, "step": 97670 }, { "epoch": 0.49, "learning_rate": 0.00022607877463914715, "loss": 0.0148, "step": 97680 }, { "epoch": 0.49, "learning_rate": 0.00022607120694613313, "loss": 0.0171, "step": 97690 }, { "epoch": 0.49, "learning_rate": 0.00022606363925311911, "loss": 0.0166, "step": 97700 }, { "epoch": 0.49, "learning_rate": 0.00022605607156010512, "loss": 0.0154, "step": 97710 }, { "epoch": 0.49, "learning_rate": 0.0002260485038670911, "loss": 0.0138, "step": 97720 }, { "epoch": 0.49, "learning_rate": 0.00022604093617407709, "loss": 0.0142, "step": 97730 }, { "epoch": 0.49, "learning_rate": 0.0002260333684810631, "loss": 0.0158, "step": 97740 }, { "epoch": 0.49, "learning_rate": 0.00022602580078804908, "loss": 0.0166, "step": 97750 }, { "epoch": 0.49, "learning_rate": 0.00022601823309503506, "loss": 0.0156, "step": 97760 }, { "epoch": 0.49, "learning_rate": 0.00022601066540202104, "loss": 0.0197, "step": 97770 }, { "epoch": 0.49, "learning_rate": 0.00022600309770900705, "loss": 0.0141, "step": 97780 }, { "epoch": 0.49, "learning_rate": 0.00022599553001599303, "loss": 0.0131, "step": 97790 }, { "epoch": 0.49, "learning_rate": 0.000225987962322979, "loss": 0.0169, "step": 97800 }, { "epoch": 0.49, "learning_rate": 0.00022598039462996502, "loss": 0.0127, "step": 97810 }, { "epoch": 0.49, "learning_rate": 0.000225972826936951, "loss": 0.0176, "step": 97820 }, { "epoch": 0.49, "learning_rate": 0.00022596525924393698, "loss": 0.0144, "step": 97830 }, { "epoch": 0.49, "learning_rate": 0.000225957691550923, "loss": 0.0178, "step": 97840 }, { "epoch": 0.49, "learning_rate": 0.00022595012385790897, "loss": 0.0165, "step": 97850 }, { "epoch": 0.49, "learning_rate": 0.00022594255616489495, "loss": 0.0182, "step": 97860 }, { "epoch": 0.49, "learning_rate": 0.00022593498847188096, "loss": 0.0152, "step": 97870 }, { "epoch": 0.49, "learning_rate": 0.00022592742077886694, "loss": 0.0165, "step": 97880 }, { "epoch": 0.49, "learning_rate": 0.00022591985308585292, "loss": 0.0179, "step": 97890 }, { "epoch": 0.49, "learning_rate": 0.00022591228539283893, "loss": 0.0192, "step": 97900 }, { "epoch": 0.49, "learning_rate": 0.00022590471769982491, "loss": 0.0176, "step": 97910 }, { "epoch": 0.49, "learning_rate": 0.0002258971500068109, "loss": 0.0158, "step": 97920 }, { "epoch": 0.49, "learning_rate": 0.00022588958231379688, "loss": 0.0187, "step": 97930 }, { "epoch": 0.49, "learning_rate": 0.00022588201462078289, "loss": 0.0178, "step": 97940 }, { "epoch": 0.49, "learning_rate": 0.00022587444692776887, "loss": 0.02, "step": 97950 }, { "epoch": 0.49, "learning_rate": 0.00022586687923475485, "loss": 0.0153, "step": 97960 }, { "epoch": 0.49, "learning_rate": 0.00022585931154174086, "loss": 0.0165, "step": 97970 }, { "epoch": 0.49, "learning_rate": 0.00022585174384872684, "loss": 0.0226, "step": 97980 }, { "epoch": 0.49, "learning_rate": 0.00022584417615571282, "loss": 0.016, "step": 97990 }, { "epoch": 0.49, "learning_rate": 0.00022583660846269883, "loss": 0.0241, "step": 98000 }, { "epoch": 0.49, "eval_cer": 0.9144799598644162, "eval_loss": 0.011652790941298008, "eval_runtime": 116.7303, "eval_samples_per_second": 17.134, "eval_steps_per_second": 4.283, "step": 98000 }, { "epoch": 0.49, "learning_rate": 0.0002258290407696848, "loss": 0.0164, "step": 98010 }, { "epoch": 0.49, "learning_rate": 0.0002258214730766708, "loss": 0.0178, "step": 98020 }, { "epoch": 0.49, "learning_rate": 0.0002258139053836568, "loss": 0.0155, "step": 98030 }, { "epoch": 0.49, "learning_rate": 0.00022580633769064278, "loss": 0.0136, "step": 98040 }, { "epoch": 0.49, "learning_rate": 0.00022579876999762876, "loss": 0.016, "step": 98050 }, { "epoch": 0.49, "learning_rate": 0.00022579120230461477, "loss": 0.0171, "step": 98060 }, { "epoch": 0.49, "learning_rate": 0.00022578363461160075, "loss": 0.0166, "step": 98070 }, { "epoch": 0.49, "learning_rate": 0.00022577606691858673, "loss": 0.0158, "step": 98080 }, { "epoch": 0.49, "learning_rate": 0.00022576849922557272, "loss": 0.0232, "step": 98090 }, { "epoch": 0.49, "learning_rate": 0.00022576093153255872, "loss": 0.0201, "step": 98100 }, { "epoch": 0.49, "learning_rate": 0.0002257533638395447, "loss": 0.0174, "step": 98110 }, { "epoch": 0.5, "learning_rate": 0.0002257457961465307, "loss": 0.0155, "step": 98120 }, { "epoch": 0.5, "learning_rate": 0.0002257382284535167, "loss": 0.0171, "step": 98130 }, { "epoch": 0.5, "learning_rate": 0.00022573066076050268, "loss": 0.0146, "step": 98140 }, { "epoch": 0.5, "learning_rate": 0.00022572309306748866, "loss": 0.019, "step": 98150 }, { "epoch": 0.5, "learning_rate": 0.00022571552537447467, "loss": 0.0157, "step": 98160 }, { "epoch": 0.5, "learning_rate": 0.00022570795768146065, "loss": 0.0203, "step": 98170 }, { "epoch": 0.5, "learning_rate": 0.00022570038998844663, "loss": 0.0153, "step": 98180 }, { "epoch": 0.5, "learning_rate": 0.00022569282229543264, "loss": 0.0159, "step": 98190 }, { "epoch": 0.5, "learning_rate": 0.00022568525460241862, "loss": 0.0148, "step": 98200 }, { "epoch": 0.5, "learning_rate": 0.0002256776869094046, "loss": 0.0161, "step": 98210 }, { "epoch": 0.5, "learning_rate": 0.0002256701192163906, "loss": 0.0164, "step": 98220 }, { "epoch": 0.5, "learning_rate": 0.0002256625515233766, "loss": 0.0165, "step": 98230 }, { "epoch": 0.5, "learning_rate": 0.00022565498383036257, "loss": 0.014, "step": 98240 }, { "epoch": 0.5, "learning_rate": 0.00022564741613734858, "loss": 0.0178, "step": 98250 }, { "epoch": 0.5, "learning_rate": 0.00022563984844433456, "loss": 0.0131, "step": 98260 }, { "epoch": 0.5, "learning_rate": 0.00022563228075132055, "loss": 0.0209, "step": 98270 }, { "epoch": 0.5, "learning_rate": 0.00022562471305830653, "loss": 0.0115, "step": 98280 }, { "epoch": 0.5, "learning_rate": 0.00022561714536529253, "loss": 0.0183, "step": 98290 }, { "epoch": 0.5, "learning_rate": 0.00022560957767227852, "loss": 0.0143, "step": 98300 }, { "epoch": 0.5, "learning_rate": 0.0002256020099792645, "loss": 0.015, "step": 98310 }, { "epoch": 0.5, "learning_rate": 0.0002255944422862505, "loss": 0.0122, "step": 98320 }, { "epoch": 0.5, "learning_rate": 0.0002255868745932365, "loss": 0.0149, "step": 98330 }, { "epoch": 0.5, "learning_rate": 0.00022557930690022247, "loss": 0.0157, "step": 98340 }, { "epoch": 0.5, "learning_rate": 0.00022557173920720848, "loss": 0.0168, "step": 98350 }, { "epoch": 0.5, "learning_rate": 0.00022556417151419446, "loss": 0.0139, "step": 98360 }, { "epoch": 0.5, "learning_rate": 0.00022555660382118044, "loss": 0.0133, "step": 98370 }, { "epoch": 0.5, "learning_rate": 0.00022554903612816645, "loss": 0.0243, "step": 98380 }, { "epoch": 0.5, "learning_rate": 0.00022554146843515243, "loss": 0.0139, "step": 98390 }, { "epoch": 0.5, "learning_rate": 0.0002255339007421384, "loss": 0.0148, "step": 98400 }, { "epoch": 0.5, "learning_rate": 0.00022552633304912442, "loss": 0.0178, "step": 98410 }, { "epoch": 0.5, "learning_rate": 0.0002255187653561104, "loss": 0.015, "step": 98420 }, { "epoch": 0.5, "learning_rate": 0.00022551119766309638, "loss": 0.0176, "step": 98430 }, { "epoch": 0.5, "learning_rate": 0.00022550362997008237, "loss": 0.0164, "step": 98440 }, { "epoch": 0.5, "learning_rate": 0.00022549606227706837, "loss": 0.0171, "step": 98450 }, { "epoch": 0.5, "learning_rate": 0.00022548849458405436, "loss": 0.013, "step": 98460 }, { "epoch": 0.5, "learning_rate": 0.00022548092689104034, "loss": 0.0157, "step": 98470 }, { "epoch": 0.5, "learning_rate": 0.00022547335919802635, "loss": 0.0169, "step": 98480 }, { "epoch": 0.5, "learning_rate": 0.00022546579150501233, "loss": 0.0159, "step": 98490 }, { "epoch": 0.5, "learning_rate": 0.0002254582238119983, "loss": 0.0276, "step": 98500 }, { "epoch": 0.5, "learning_rate": 0.00022545065611898432, "loss": 0.0217, "step": 98510 }, { "epoch": 0.5, "learning_rate": 0.0002254430884259703, "loss": 0.0157, "step": 98520 }, { "epoch": 0.5, "learning_rate": 0.00022543552073295628, "loss": 0.0147, "step": 98530 }, { "epoch": 0.5, "learning_rate": 0.0002254279530399423, "loss": 0.0137, "step": 98540 }, { "epoch": 0.5, "learning_rate": 0.00022542038534692827, "loss": 0.0151, "step": 98550 }, { "epoch": 0.5, "learning_rate": 0.00022541281765391425, "loss": 0.0161, "step": 98560 }, { "epoch": 0.5, "learning_rate": 0.00022540524996090026, "loss": 0.0158, "step": 98570 }, { "epoch": 0.5, "learning_rate": 0.00022539768226788624, "loss": 0.0195, "step": 98580 }, { "epoch": 0.5, "learning_rate": 0.00022539011457487222, "loss": 0.0179, "step": 98590 }, { "epoch": 0.5, "learning_rate": 0.0002253825468818582, "loss": 0.0153, "step": 98600 }, { "epoch": 0.5, "learning_rate": 0.0002253749791888442, "loss": 0.0187, "step": 98610 }, { "epoch": 0.5, "learning_rate": 0.0002253674114958302, "loss": 0.0156, "step": 98620 }, { "epoch": 0.5, "learning_rate": 0.00022535984380281618, "loss": 0.0126, "step": 98630 }, { "epoch": 0.5, "learning_rate": 0.00022535227610980218, "loss": 0.0159, "step": 98640 }, { "epoch": 0.5, "learning_rate": 0.00022534470841678817, "loss": 0.0154, "step": 98650 }, { "epoch": 0.5, "learning_rate": 0.00022533714072377415, "loss": 0.0157, "step": 98660 }, { "epoch": 0.5, "learning_rate": 0.0002253295730307601, "loss": 0.0134, "step": 98670 }, { "epoch": 0.5, "learning_rate": 0.0002253220053377461, "loss": 0.017, "step": 98680 }, { "epoch": 0.5, "learning_rate": 0.0002253144376447321, "loss": 0.014, "step": 98690 }, { "epoch": 0.5, "learning_rate": 0.00022530686995171807, "loss": 0.0188, "step": 98700 }, { "epoch": 0.5, "learning_rate": 0.00022529930225870408, "loss": 0.0153, "step": 98710 }, { "epoch": 0.5, "learning_rate": 0.00022529173456569006, "loss": 0.0156, "step": 98720 }, { "epoch": 0.5, "learning_rate": 0.00022528416687267604, "loss": 0.0142, "step": 98730 }, { "epoch": 0.5, "learning_rate": 0.00022527659917966205, "loss": 0.0156, "step": 98740 }, { "epoch": 0.5, "learning_rate": 0.00022526903148664803, "loss": 0.0203, "step": 98750 }, { "epoch": 0.5, "learning_rate": 0.00022526146379363402, "loss": 0.014, "step": 98760 }, { "epoch": 0.5, "learning_rate": 0.00022525389610062002, "loss": 0.0125, "step": 98770 }, { "epoch": 0.5, "learning_rate": 0.000225246328407606, "loss": 0.0155, "step": 98780 }, { "epoch": 0.5, "learning_rate": 0.000225238760714592, "loss": 0.0176, "step": 98790 }, { "epoch": 0.5, "learning_rate": 0.000225231193021578, "loss": 0.0164, "step": 98800 }, { "epoch": 0.5, "learning_rate": 0.00022522362532856398, "loss": 0.0132, "step": 98810 }, { "epoch": 0.5, "learning_rate": 0.00022521605763554996, "loss": 0.0171, "step": 98820 }, { "epoch": 0.5, "learning_rate": 0.00022520848994253594, "loss": 0.0187, "step": 98830 }, { "epoch": 0.5, "learning_rate": 0.00022520092224952195, "loss": 0.0168, "step": 98840 }, { "epoch": 0.5, "learning_rate": 0.00022519335455650793, "loss": 0.0166, "step": 98850 }, { "epoch": 0.5, "learning_rate": 0.0002251857868634939, "loss": 0.0135, "step": 98860 }, { "epoch": 0.5, "learning_rate": 0.00022517821917047992, "loss": 0.0213, "step": 98870 }, { "epoch": 0.5, "learning_rate": 0.0002251706514774659, "loss": 0.0151, "step": 98880 }, { "epoch": 0.5, "learning_rate": 0.00022516308378445188, "loss": 0.0165, "step": 98890 }, { "epoch": 0.5, "learning_rate": 0.0002251555160914379, "loss": 0.0156, "step": 98900 }, { "epoch": 0.5, "learning_rate": 0.00022514794839842387, "loss": 0.0125, "step": 98910 }, { "epoch": 0.5, "learning_rate": 0.00022514038070540985, "loss": 0.0159, "step": 98920 }, { "epoch": 0.5, "learning_rate": 0.00022513281301239586, "loss": 0.0143, "step": 98930 }, { "epoch": 0.5, "learning_rate": 0.00022512524531938184, "loss": 0.0142, "step": 98940 }, { "epoch": 0.5, "learning_rate": 0.00022511767762636783, "loss": 0.0143, "step": 98950 }, { "epoch": 0.5, "learning_rate": 0.00022511010993335383, "loss": 0.0153, "step": 98960 }, { "epoch": 0.5, "learning_rate": 0.00022510254224033982, "loss": 0.0134, "step": 98970 }, { "epoch": 0.5, "learning_rate": 0.0002250949745473258, "loss": 0.0167, "step": 98980 }, { "epoch": 0.5, "learning_rate": 0.00022508740685431178, "loss": 0.0195, "step": 98990 }, { "epoch": 0.5, "learning_rate": 0.0002250798391612978, "loss": 0.0132, "step": 99000 }, { "epoch": 0.5, "eval_cer": 0.9144857822411687, "eval_loss": 0.011587457731366158, "eval_runtime": 116.7415, "eval_samples_per_second": 17.132, "eval_steps_per_second": 4.283, "step": 99000 }, { "epoch": 0.5, "learning_rate": 0.00022507227146828377, "loss": 0.0159, "step": 99010 }, { "epoch": 0.5, "learning_rate": 0.00022506470377526975, "loss": 0.0158, "step": 99020 }, { "epoch": 0.5, "learning_rate": 0.00022505713608225576, "loss": 0.0154, "step": 99030 }, { "epoch": 0.5, "learning_rate": 0.00022504956838924174, "loss": 0.0127, "step": 99040 }, { "epoch": 0.5, "learning_rate": 0.00022504200069622772, "loss": 0.0199, "step": 99050 }, { "epoch": 0.5, "learning_rate": 0.00022503443300321373, "loss": 0.0172, "step": 99060 }, { "epoch": 0.5, "learning_rate": 0.0002250268653101997, "loss": 0.0162, "step": 99070 }, { "epoch": 0.5, "learning_rate": 0.0002250192976171857, "loss": 0.0187, "step": 99080 }, { "epoch": 0.5, "learning_rate": 0.0002250117299241717, "loss": 0.0157, "step": 99090 }, { "epoch": 0.5, "learning_rate": 0.00022500416223115768, "loss": 0.014, "step": 99100 }, { "epoch": 0.5, "learning_rate": 0.00022499659453814366, "loss": 0.0151, "step": 99110 }, { "epoch": 0.5, "learning_rate": 0.00022498902684512967, "loss": 0.013, "step": 99120 }, { "epoch": 0.5, "learning_rate": 0.00022498145915211565, "loss": 0.0151, "step": 99130 }, { "epoch": 0.5, "learning_rate": 0.00022497389145910164, "loss": 0.0135, "step": 99140 }, { "epoch": 0.5, "learning_rate": 0.00022496632376608764, "loss": 0.0234, "step": 99150 }, { "epoch": 0.5, "learning_rate": 0.00022495875607307363, "loss": 0.013, "step": 99160 }, { "epoch": 0.5, "learning_rate": 0.0002249511883800596, "loss": 0.0175, "step": 99170 }, { "epoch": 0.5, "learning_rate": 0.0002249436206870456, "loss": 0.0171, "step": 99180 }, { "epoch": 0.5, "learning_rate": 0.0002249360529940316, "loss": 0.0166, "step": 99190 }, { "epoch": 0.5, "learning_rate": 0.00022492848530101758, "loss": 0.0174, "step": 99200 }, { "epoch": 0.5, "learning_rate": 0.00022492091760800356, "loss": 0.0122, "step": 99210 }, { "epoch": 0.5, "learning_rate": 0.00022491334991498957, "loss": 0.0156, "step": 99220 }, { "epoch": 0.5, "learning_rate": 0.00022490578222197555, "loss": 0.0146, "step": 99230 }, { "epoch": 0.5, "learning_rate": 0.00022489821452896153, "loss": 0.0159, "step": 99240 }, { "epoch": 0.5, "learning_rate": 0.00022489064683594754, "loss": 0.0176, "step": 99250 }, { "epoch": 0.5, "learning_rate": 0.00022488307914293352, "loss": 0.0172, "step": 99260 }, { "epoch": 0.5, "learning_rate": 0.0002248755114499195, "loss": 0.0116, "step": 99270 }, { "epoch": 0.5, "learning_rate": 0.0002248679437569055, "loss": 0.0152, "step": 99280 }, { "epoch": 0.5, "learning_rate": 0.0002248603760638915, "loss": 0.0368, "step": 99290 }, { "epoch": 0.5, "learning_rate": 0.00022485280837087747, "loss": 0.0209, "step": 99300 }, { "epoch": 0.5, "learning_rate": 0.00022484524067786348, "loss": 0.0144, "step": 99310 }, { "epoch": 0.5, "learning_rate": 0.00022483767298484946, "loss": 0.019, "step": 99320 }, { "epoch": 0.5, "learning_rate": 0.00022483010529183545, "loss": 0.0153, "step": 99330 }, { "epoch": 0.5, "learning_rate": 0.00022482253759882143, "loss": 0.0179, "step": 99340 }, { "epoch": 0.5, "learning_rate": 0.00022481496990580744, "loss": 0.0215, "step": 99350 }, { "epoch": 0.5, "learning_rate": 0.00022480740221279342, "loss": 0.0174, "step": 99360 }, { "epoch": 0.5, "learning_rate": 0.0002247998345197794, "loss": 0.0178, "step": 99370 }, { "epoch": 0.5, "learning_rate": 0.0002247922668267654, "loss": 0.0148, "step": 99380 }, { "epoch": 0.5, "learning_rate": 0.0002247846991337514, "loss": 0.0166, "step": 99390 }, { "epoch": 0.5, "learning_rate": 0.00022477713144073737, "loss": 0.015, "step": 99400 }, { "epoch": 0.5, "learning_rate": 0.00022476956374772338, "loss": 0.0157, "step": 99410 }, { "epoch": 0.5, "learning_rate": 0.00022476199605470936, "loss": 0.0192, "step": 99420 }, { "epoch": 0.5, "learning_rate": 0.00022475442836169534, "loss": 0.0247, "step": 99430 }, { "epoch": 0.5, "learning_rate": 0.00022474686066868135, "loss": 0.0166, "step": 99440 }, { "epoch": 0.5, "learning_rate": 0.00022473929297566733, "loss": 0.0193, "step": 99450 }, { "epoch": 0.5, "learning_rate": 0.0002247317252826533, "loss": 0.0129, "step": 99460 }, { "epoch": 0.5, "learning_rate": 0.00022472415758963932, "loss": 0.0173, "step": 99470 }, { "epoch": 0.5, "learning_rate": 0.0002247165898966253, "loss": 0.015, "step": 99480 }, { "epoch": 0.5, "learning_rate": 0.00022470902220361128, "loss": 0.0155, "step": 99490 }, { "epoch": 0.5, "learning_rate": 0.00022470145451059727, "loss": 0.0151, "step": 99500 }, { "epoch": 0.5, "learning_rate": 0.00022469388681758327, "loss": 0.0148, "step": 99510 }, { "epoch": 0.5, "learning_rate": 0.00022468631912456926, "loss": 0.0152, "step": 99520 }, { "epoch": 0.5, "learning_rate": 0.00022467875143155524, "loss": 0.0137, "step": 99530 }, { "epoch": 0.5, "learning_rate": 0.00022467118373854125, "loss": 0.0168, "step": 99540 }, { "epoch": 0.5, "learning_rate": 0.00022466361604552723, "loss": 0.0198, "step": 99550 }, { "epoch": 0.5, "learning_rate": 0.0002246560483525132, "loss": 0.0177, "step": 99560 }, { "epoch": 0.5, "learning_rate": 0.00022464848065949922, "loss": 0.0186, "step": 99570 }, { "epoch": 0.5, "learning_rate": 0.0002246409129664852, "loss": 0.0164, "step": 99580 }, { "epoch": 0.5, "learning_rate": 0.00022463334527347118, "loss": 0.0136, "step": 99590 }, { "epoch": 0.5, "learning_rate": 0.0002246257775804572, "loss": 0.0159, "step": 99600 }, { "epoch": 0.5, "learning_rate": 0.00022461820988744317, "loss": 0.0155, "step": 99610 }, { "epoch": 0.5, "learning_rate": 0.00022461064219442915, "loss": 0.0147, "step": 99620 }, { "epoch": 0.5, "learning_rate": 0.00022460307450141516, "loss": 0.024, "step": 99630 }, { "epoch": 0.5, "learning_rate": 0.00022459550680840114, "loss": 0.0168, "step": 99640 }, { "epoch": 0.5, "learning_rate": 0.00022458793911538712, "loss": 0.0164, "step": 99650 }, { "epoch": 0.5, "learning_rate": 0.00022458037142237313, "loss": 0.0136, "step": 99660 }, { "epoch": 0.5, "learning_rate": 0.0002245728037293591, "loss": 0.0141, "step": 99670 }, { "epoch": 0.5, "learning_rate": 0.0002245652360363451, "loss": 0.0173, "step": 99680 }, { "epoch": 0.5, "learning_rate": 0.00022455766834333108, "loss": 0.0183, "step": 99690 }, { "epoch": 0.5, "learning_rate": 0.00022455010065031708, "loss": 0.0212, "step": 99700 }, { "epoch": 0.5, "learning_rate": 0.00022454253295730307, "loss": 0.0146, "step": 99710 }, { "epoch": 0.5, "learning_rate": 0.00022453496526428905, "loss": 0.0161, "step": 99720 }, { "epoch": 0.5, "learning_rate": 0.00022452739757127506, "loss": 0.0134, "step": 99730 }, { "epoch": 0.5, "learning_rate": 0.00022451982987826104, "loss": 0.0173, "step": 99740 }, { "epoch": 0.5, "learning_rate": 0.00022451226218524702, "loss": 0.0166, "step": 99750 }, { "epoch": 0.5, "learning_rate": 0.00022450469449223303, "loss": 0.0138, "step": 99760 }, { "epoch": 0.5, "learning_rate": 0.000224497126799219, "loss": 0.0198, "step": 99770 }, { "epoch": 0.5, "learning_rate": 0.000224489559106205, "loss": 0.0162, "step": 99780 }, { "epoch": 0.5, "learning_rate": 0.000224481991413191, "loss": 0.0143, "step": 99790 }, { "epoch": 0.5, "learning_rate": 0.00022447442372017698, "loss": 0.0166, "step": 99800 }, { "epoch": 0.5, "learning_rate": 0.00022446685602716296, "loss": 0.014, "step": 99810 }, { "epoch": 0.5, "learning_rate": 0.00022445928833414897, "loss": 0.0141, "step": 99820 }, { "epoch": 0.5, "learning_rate": 0.00022445172064113495, "loss": 0.0152, "step": 99830 }, { "epoch": 0.5, "learning_rate": 0.00022444415294812093, "loss": 0.0156, "step": 99840 }, { "epoch": 0.5, "learning_rate": 0.00022443658525510691, "loss": 0.0165, "step": 99850 }, { "epoch": 0.5, "learning_rate": 0.00022442901756209292, "loss": 0.0169, "step": 99860 }, { "epoch": 0.5, "learning_rate": 0.0002244214498690789, "loss": 0.0164, "step": 99870 }, { "epoch": 0.5, "learning_rate": 0.00022441388217606489, "loss": 0.0172, "step": 99880 }, { "epoch": 0.5, "learning_rate": 0.0002244063144830509, "loss": 0.0153, "step": 99890 }, { "epoch": 0.5, "learning_rate": 0.00022439874679003688, "loss": 0.018, "step": 99900 }, { "epoch": 0.5, "learning_rate": 0.00022439117909702286, "loss": 0.0136, "step": 99910 }, { "epoch": 0.5, "learning_rate": 0.00022438361140400887, "loss": 0.0163, "step": 99920 }, { "epoch": 0.5, "learning_rate": 0.00022437604371099482, "loss": 0.0155, "step": 99930 }, { "epoch": 0.5, "learning_rate": 0.0002243684760179808, "loss": 0.0164, "step": 99940 }, { "epoch": 0.5, "learning_rate": 0.00022436090832496678, "loss": 0.013, "step": 99950 }, { "epoch": 0.5, "learning_rate": 0.0002243533406319528, "loss": 0.0189, "step": 99960 }, { "epoch": 0.5, "learning_rate": 0.00022434577293893877, "loss": 0.0168, "step": 99970 }, { "epoch": 0.5, "learning_rate": 0.00022433820524592475, "loss": 0.0188, "step": 99980 }, { "epoch": 0.5, "learning_rate": 0.00022433063755291076, "loss": 0.0171, "step": 99990 }, { "epoch": 0.5, "learning_rate": 0.00022432306985989674, "loss": 0.0151, "step": 100000 }, { "epoch": 0.5, "eval_cer": 0.9145051901636767, "eval_loss": 0.011643487960100174, "eval_runtime": 116.6776, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 100000 }, { "epoch": 0.5, "learning_rate": 0.00022431550216688273, "loss": 0.0137, "step": 100010 }, { "epoch": 0.5, "learning_rate": 0.00022430793447386873, "loss": 0.0181, "step": 100020 }, { "epoch": 0.5, "learning_rate": 0.00022430036678085472, "loss": 0.0136, "step": 100030 }, { "epoch": 0.5, "learning_rate": 0.0002242927990878407, "loss": 0.0213, "step": 100040 }, { "epoch": 0.5, "learning_rate": 0.0002242852313948267, "loss": 0.0172, "step": 100050 }, { "epoch": 0.5, "learning_rate": 0.0002242776637018127, "loss": 0.0217, "step": 100060 }, { "epoch": 0.5, "learning_rate": 0.00022427009600879867, "loss": 0.0161, "step": 100070 }, { "epoch": 0.5, "learning_rate": 0.00022426252831578465, "loss": 0.0185, "step": 100080 }, { "epoch": 0.5, "learning_rate": 0.00022425496062277066, "loss": 0.0164, "step": 100090 }, { "epoch": 0.51, "learning_rate": 0.00022424739292975664, "loss": 0.0131, "step": 100100 }, { "epoch": 0.51, "learning_rate": 0.00022423982523674262, "loss": 0.0179, "step": 100110 }, { "epoch": 0.51, "learning_rate": 0.00022423225754372863, "loss": 0.0163, "step": 100120 }, { "epoch": 0.51, "learning_rate": 0.0002242246898507146, "loss": 0.0154, "step": 100130 }, { "epoch": 0.51, "learning_rate": 0.0002242171221577006, "loss": 0.0144, "step": 100140 }, { "epoch": 0.51, "learning_rate": 0.0002242095544646866, "loss": 0.0158, "step": 100150 }, { "epoch": 0.51, "learning_rate": 0.00022420198677167258, "loss": 0.0171, "step": 100160 }, { "epoch": 0.51, "learning_rate": 0.00022419441907865856, "loss": 0.0147, "step": 100170 }, { "epoch": 0.51, "learning_rate": 0.00022418685138564457, "loss": 0.0154, "step": 100180 }, { "epoch": 0.51, "learning_rate": 0.00022417928369263055, "loss": 0.017, "step": 100190 }, { "epoch": 0.51, "learning_rate": 0.00022417171599961654, "loss": 0.014, "step": 100200 }, { "epoch": 0.51, "learning_rate": 0.00022416414830660254, "loss": 0.0143, "step": 100210 }, { "epoch": 0.51, "learning_rate": 0.00022415658061358853, "loss": 0.0157, "step": 100220 }, { "epoch": 0.51, "learning_rate": 0.0002241490129205745, "loss": 0.0151, "step": 100230 }, { "epoch": 0.51, "learning_rate": 0.0002241414452275605, "loss": 0.016, "step": 100240 }, { "epoch": 0.51, "learning_rate": 0.0002241338775345465, "loss": 0.0186, "step": 100250 }, { "epoch": 0.51, "learning_rate": 0.00022412630984153248, "loss": 0.015, "step": 100260 }, { "epoch": 0.51, "learning_rate": 0.00022411874214851846, "loss": 0.0182, "step": 100270 }, { "epoch": 0.51, "learning_rate": 0.00022411117445550447, "loss": 0.0151, "step": 100280 }, { "epoch": 0.51, "learning_rate": 0.00022410360676249045, "loss": 0.0149, "step": 100290 }, { "epoch": 0.51, "learning_rate": 0.00022409603906947643, "loss": 0.0164, "step": 100300 }, { "epoch": 0.51, "learning_rate": 0.00022408847137646244, "loss": 0.0151, "step": 100310 }, { "epoch": 0.51, "learning_rate": 0.00022408090368344842, "loss": 0.0162, "step": 100320 }, { "epoch": 0.51, "learning_rate": 0.0002240733359904344, "loss": 0.0181, "step": 100330 }, { "epoch": 0.51, "learning_rate": 0.0002240657682974204, "loss": 0.0162, "step": 100340 }, { "epoch": 0.51, "learning_rate": 0.0002240582006044064, "loss": 0.0133, "step": 100350 }, { "epoch": 0.51, "learning_rate": 0.00022405063291139237, "loss": 0.0144, "step": 100360 }, { "epoch": 0.51, "learning_rate": 0.00022404306521837838, "loss": 0.0195, "step": 100370 }, { "epoch": 0.51, "learning_rate": 0.00022403549752536436, "loss": 0.0173, "step": 100380 }, { "epoch": 0.51, "learning_rate": 0.00022402792983235035, "loss": 0.0145, "step": 100390 }, { "epoch": 0.51, "learning_rate": 0.00022402036213933633, "loss": 0.0156, "step": 100400 }, { "epoch": 0.51, "learning_rate": 0.00022401279444632234, "loss": 0.0224, "step": 100410 }, { "epoch": 0.51, "learning_rate": 0.00022400522675330832, "loss": 0.019, "step": 100420 }, { "epoch": 0.51, "learning_rate": 0.0002239976590602943, "loss": 0.0199, "step": 100430 }, { "epoch": 0.51, "learning_rate": 0.0002239900913672803, "loss": 0.0168, "step": 100440 }, { "epoch": 0.51, "learning_rate": 0.0002239825236742663, "loss": 0.016, "step": 100450 }, { "epoch": 0.51, "learning_rate": 0.00022397495598125227, "loss": 0.0193, "step": 100460 }, { "epoch": 0.51, "learning_rate": 0.00022396738828823828, "loss": 0.0125, "step": 100470 }, { "epoch": 0.51, "learning_rate": 0.00022395982059522426, "loss": 0.0158, "step": 100480 }, { "epoch": 0.51, "learning_rate": 0.00022395225290221024, "loss": 0.016, "step": 100490 }, { "epoch": 0.51, "learning_rate": 0.00022394468520919625, "loss": 0.016, "step": 100500 }, { "epoch": 0.51, "learning_rate": 0.00022393711751618223, "loss": 0.0171, "step": 100510 }, { "epoch": 0.51, "learning_rate": 0.0002239295498231682, "loss": 0.016, "step": 100520 }, { "epoch": 0.51, "learning_rate": 0.00022392198213015422, "loss": 0.0196, "step": 100530 }, { "epoch": 0.51, "learning_rate": 0.0002239144144371402, "loss": 0.0155, "step": 100540 }, { "epoch": 0.51, "learning_rate": 0.00022390684674412618, "loss": 0.0164, "step": 100550 }, { "epoch": 0.51, "learning_rate": 0.0002238992790511122, "loss": 0.0164, "step": 100560 }, { "epoch": 0.51, "learning_rate": 0.00022389171135809817, "loss": 0.018, "step": 100570 }, { "epoch": 0.51, "learning_rate": 0.00022388414366508416, "loss": 0.0132, "step": 100580 }, { "epoch": 0.51, "learning_rate": 0.00022387657597207014, "loss": 0.0154, "step": 100590 }, { "epoch": 0.51, "learning_rate": 0.00022386900827905615, "loss": 0.0143, "step": 100600 }, { "epoch": 0.51, "learning_rate": 0.00022386144058604213, "loss": 0.0159, "step": 100610 }, { "epoch": 0.51, "learning_rate": 0.0002238538728930281, "loss": 0.0119, "step": 100620 }, { "epoch": 0.51, "learning_rate": 0.00022384630520001412, "loss": 0.0146, "step": 100630 }, { "epoch": 0.51, "learning_rate": 0.0002238387375070001, "loss": 0.0145, "step": 100640 }, { "epoch": 0.51, "learning_rate": 0.00022383116981398608, "loss": 0.0137, "step": 100650 }, { "epoch": 0.51, "learning_rate": 0.0002238236021209721, "loss": 0.016, "step": 100660 }, { "epoch": 0.51, "learning_rate": 0.00022381603442795807, "loss": 0.0168, "step": 100670 }, { "epoch": 0.51, "learning_rate": 0.00022380846673494405, "loss": 0.0135, "step": 100680 }, { "epoch": 0.51, "learning_rate": 0.00022380089904193006, "loss": 0.0151, "step": 100690 }, { "epoch": 0.51, "learning_rate": 0.00022379333134891604, "loss": 0.018, "step": 100700 }, { "epoch": 0.51, "learning_rate": 0.00022378576365590202, "loss": 0.018, "step": 100710 }, { "epoch": 0.51, "learning_rate": 0.00022377819596288803, "loss": 0.0127, "step": 100720 }, { "epoch": 0.51, "learning_rate": 0.000223770628269874, "loss": 0.0173, "step": 100730 }, { "epoch": 0.51, "learning_rate": 0.00022376306057686, "loss": 0.0169, "step": 100740 }, { "epoch": 0.51, "learning_rate": 0.00022375549288384598, "loss": 0.0149, "step": 100750 }, { "epoch": 0.51, "learning_rate": 0.00022374792519083198, "loss": 0.0138, "step": 100760 }, { "epoch": 0.51, "learning_rate": 0.00022374035749781797, "loss": 0.0162, "step": 100770 }, { "epoch": 0.51, "learning_rate": 0.00022373278980480395, "loss": 0.0126, "step": 100780 }, { "epoch": 0.51, "learning_rate": 0.00022372522211178996, "loss": 0.0143, "step": 100790 }, { "epoch": 0.51, "learning_rate": 0.00022371765441877594, "loss": 0.018, "step": 100800 }, { "epoch": 0.51, "learning_rate": 0.00022371008672576192, "loss": 0.0144, "step": 100810 }, { "epoch": 0.51, "learning_rate": 0.00022370251903274793, "loss": 0.0145, "step": 100820 }, { "epoch": 0.51, "learning_rate": 0.0002236949513397339, "loss": 0.0171, "step": 100830 }, { "epoch": 0.51, "learning_rate": 0.0002236873836467199, "loss": 0.0142, "step": 100840 }, { "epoch": 0.51, "learning_rate": 0.0002236798159537059, "loss": 0.0141, "step": 100850 }, { "epoch": 0.51, "learning_rate": 0.00022367224826069188, "loss": 0.0159, "step": 100860 }, { "epoch": 0.51, "learning_rate": 0.00022366468056767786, "loss": 0.0126, "step": 100870 }, { "epoch": 0.51, "learning_rate": 0.00022365711287466387, "loss": 0.0148, "step": 100880 }, { "epoch": 0.51, "learning_rate": 0.00022364954518164985, "loss": 0.0176, "step": 100890 }, { "epoch": 0.51, "learning_rate": 0.00022364197748863583, "loss": 0.0147, "step": 100900 }, { "epoch": 0.51, "learning_rate": 0.00022363440979562181, "loss": 0.0138, "step": 100910 }, { "epoch": 0.51, "learning_rate": 0.00022362684210260782, "loss": 0.013, "step": 100920 }, { "epoch": 0.51, "learning_rate": 0.0002236192744095938, "loss": 0.0135, "step": 100930 }, { "epoch": 0.51, "learning_rate": 0.00022361170671657979, "loss": 0.025, "step": 100940 }, { "epoch": 0.51, "learning_rate": 0.0002236041390235658, "loss": 0.0175, "step": 100950 }, { "epoch": 0.51, "learning_rate": 0.00022359657133055178, "loss": 0.0153, "step": 100960 }, { "epoch": 0.51, "learning_rate": 0.00022358900363753776, "loss": 0.0167, "step": 100970 }, { "epoch": 0.51, "learning_rate": 0.00022358143594452377, "loss": 0.0173, "step": 100980 }, { "epoch": 0.51, "learning_rate": 0.00022357386825150975, "loss": 0.016, "step": 100990 }, { "epoch": 0.51, "learning_rate": 0.00022356630055849573, "loss": 0.0195, "step": 101000 }, { "epoch": 0.51, "eval_cer": 0.9145022789753005, "eval_loss": 0.011683492921292782, "eval_runtime": 116.7876, "eval_samples_per_second": 17.125, "eval_steps_per_second": 4.281, "step": 101000 }, { "epoch": 0.51, "learning_rate": 0.00022355873286548174, "loss": 0.0174, "step": 101010 }, { "epoch": 0.51, "learning_rate": 0.00022355116517246772, "loss": 0.0147, "step": 101020 }, { "epoch": 0.51, "learning_rate": 0.0002235435974794537, "loss": 0.0156, "step": 101030 }, { "epoch": 0.51, "learning_rate": 0.0002235360297864397, "loss": 0.0193, "step": 101040 }, { "epoch": 0.51, "learning_rate": 0.0002235284620934257, "loss": 0.0137, "step": 101050 }, { "epoch": 0.51, "learning_rate": 0.00022352089440041167, "loss": 0.0148, "step": 101060 }, { "epoch": 0.51, "learning_rate": 0.00022351332670739765, "loss": 0.0113, "step": 101070 }, { "epoch": 0.51, "learning_rate": 0.00022350575901438366, "loss": 0.0157, "step": 101080 }, { "epoch": 0.51, "learning_rate": 0.00022349819132136964, "loss": 0.0162, "step": 101090 }, { "epoch": 0.51, "learning_rate": 0.00022349062362835562, "loss": 0.0157, "step": 101100 }, { "epoch": 0.51, "learning_rate": 0.00022348305593534163, "loss": 0.0161, "step": 101110 }, { "epoch": 0.51, "learning_rate": 0.00022347548824232761, "loss": 0.0133, "step": 101120 }, { "epoch": 0.51, "learning_rate": 0.0002234679205493136, "loss": 0.0164, "step": 101130 }, { "epoch": 0.51, "learning_rate": 0.0002234603528562996, "loss": 0.0149, "step": 101140 }, { "epoch": 0.51, "learning_rate": 0.00022345278516328559, "loss": 0.0146, "step": 101150 }, { "epoch": 0.51, "learning_rate": 0.00022344521747027157, "loss": 0.0147, "step": 101160 }, { "epoch": 0.51, "learning_rate": 0.00022343764977725758, "loss": 0.0145, "step": 101170 }, { "epoch": 0.51, "learning_rate": 0.00022343008208424353, "loss": 0.0172, "step": 101180 }, { "epoch": 0.51, "learning_rate": 0.0002234225143912295, "loss": 0.0138, "step": 101190 }, { "epoch": 0.51, "learning_rate": 0.0002234149466982155, "loss": 0.0153, "step": 101200 }, { "epoch": 0.51, "learning_rate": 0.0002234073790052015, "loss": 0.0155, "step": 101210 }, { "epoch": 0.51, "learning_rate": 0.00022339981131218748, "loss": 0.0124, "step": 101220 }, { "epoch": 0.51, "learning_rate": 0.00022339224361917346, "loss": 0.0125, "step": 101230 }, { "epoch": 0.51, "learning_rate": 0.00022338467592615947, "loss": 0.0152, "step": 101240 }, { "epoch": 0.51, "learning_rate": 0.00022337710823314545, "loss": 0.0146, "step": 101250 }, { "epoch": 0.51, "learning_rate": 0.00022336954054013144, "loss": 0.0158, "step": 101260 }, { "epoch": 0.51, "learning_rate": 0.00022336197284711744, "loss": 0.0157, "step": 101270 }, { "epoch": 0.51, "learning_rate": 0.00022335440515410343, "loss": 0.0123, "step": 101280 }, { "epoch": 0.51, "learning_rate": 0.0002233468374610894, "loss": 0.0158, "step": 101290 }, { "epoch": 0.51, "learning_rate": 0.0002233392697680754, "loss": 0.0153, "step": 101300 }, { "epoch": 0.51, "learning_rate": 0.0002233317020750614, "loss": 0.0169, "step": 101310 }, { "epoch": 0.51, "learning_rate": 0.00022332413438204738, "loss": 0.0219, "step": 101320 }, { "epoch": 0.51, "learning_rate": 0.00022331656668903336, "loss": 0.0145, "step": 101330 }, { "epoch": 0.51, "learning_rate": 0.00022330899899601937, "loss": 0.0162, "step": 101340 }, { "epoch": 0.51, "learning_rate": 0.00022330143130300535, "loss": 0.0124, "step": 101350 }, { "epoch": 0.51, "learning_rate": 0.00022329386360999133, "loss": 0.0125, "step": 101360 }, { "epoch": 0.51, "learning_rate": 0.00022328629591697734, "loss": 0.0153, "step": 101370 }, { "epoch": 0.51, "learning_rate": 0.00022327872822396332, "loss": 0.0144, "step": 101380 }, { "epoch": 0.51, "learning_rate": 0.0002232711605309493, "loss": 0.0207, "step": 101390 }, { "epoch": 0.51, "learning_rate": 0.0002232635928379353, "loss": 0.0154, "step": 101400 }, { "epoch": 0.51, "learning_rate": 0.0002232560251449213, "loss": 0.0133, "step": 101410 }, { "epoch": 0.51, "learning_rate": 0.00022324845745190727, "loss": 0.0153, "step": 101420 }, { "epoch": 0.51, "learning_rate": 0.00022324088975889328, "loss": 0.0181, "step": 101430 }, { "epoch": 0.51, "learning_rate": 0.00022323332206587926, "loss": 0.0198, "step": 101440 }, { "epoch": 0.51, "learning_rate": 0.00022322575437286525, "loss": 0.0147, "step": 101450 }, { "epoch": 0.51, "learning_rate": 0.00022321818667985125, "loss": 0.0171, "step": 101460 }, { "epoch": 0.51, "learning_rate": 0.00022321061898683724, "loss": 0.0182, "step": 101470 }, { "epoch": 0.51, "learning_rate": 0.00022320305129382322, "loss": 0.0147, "step": 101480 }, { "epoch": 0.51, "learning_rate": 0.0002231954836008092, "loss": 0.0152, "step": 101490 }, { "epoch": 0.51, "learning_rate": 0.0002231879159077952, "loss": 0.0168, "step": 101500 }, { "epoch": 0.51, "learning_rate": 0.0002231803482147812, "loss": 0.0165, "step": 101510 }, { "epoch": 0.51, "learning_rate": 0.00022317278052176717, "loss": 0.0142, "step": 101520 }, { "epoch": 0.51, "learning_rate": 0.00022316521282875318, "loss": 0.0134, "step": 101530 }, { "epoch": 0.51, "learning_rate": 0.00022315764513573916, "loss": 0.0169, "step": 101540 }, { "epoch": 0.51, "learning_rate": 0.00022315007744272514, "loss": 0.0154, "step": 101550 }, { "epoch": 0.51, "learning_rate": 0.00022314250974971115, "loss": 0.0188, "step": 101560 }, { "epoch": 0.51, "learning_rate": 0.00022313494205669713, "loss": 0.0159, "step": 101570 }, { "epoch": 0.51, "learning_rate": 0.0002231273743636831, "loss": 0.0193, "step": 101580 }, { "epoch": 0.51, "learning_rate": 0.00022311980667066912, "loss": 0.0147, "step": 101590 }, { "epoch": 0.51, "learning_rate": 0.0002231122389776551, "loss": 0.0205, "step": 101600 }, { "epoch": 0.51, "learning_rate": 0.00022310467128464108, "loss": 0.0143, "step": 101610 }, { "epoch": 0.51, "learning_rate": 0.0002230971035916271, "loss": 0.0144, "step": 101620 }, { "epoch": 0.51, "learning_rate": 0.00022308953589861307, "loss": 0.0148, "step": 101630 }, { "epoch": 0.51, "learning_rate": 0.00022308196820559906, "loss": 0.0162, "step": 101640 }, { "epoch": 0.51, "learning_rate": 0.00022307440051258504, "loss": 0.018, "step": 101650 }, { "epoch": 0.51, "learning_rate": 0.00022306683281957105, "loss": 0.0131, "step": 101660 }, { "epoch": 0.51, "learning_rate": 0.00022305926512655703, "loss": 0.0148, "step": 101670 }, { "epoch": 0.51, "learning_rate": 0.000223051697433543, "loss": 0.015, "step": 101680 }, { "epoch": 0.51, "learning_rate": 0.00022304412974052902, "loss": 0.0176, "step": 101690 }, { "epoch": 0.51, "learning_rate": 0.000223036562047515, "loss": 0.0174, "step": 101700 }, { "epoch": 0.51, "learning_rate": 0.00022302899435450098, "loss": 0.0174, "step": 101710 }, { "epoch": 0.51, "learning_rate": 0.000223021426661487, "loss": 0.0142, "step": 101720 }, { "epoch": 0.51, "learning_rate": 0.00022301385896847297, "loss": 0.0143, "step": 101730 }, { "epoch": 0.51, "learning_rate": 0.00022300629127545895, "loss": 0.0193, "step": 101740 }, { "epoch": 0.51, "learning_rate": 0.00022299872358244496, "loss": 0.0144, "step": 101750 }, { "epoch": 0.51, "learning_rate": 0.00022299115588943094, "loss": 0.016, "step": 101760 }, { "epoch": 0.51, "learning_rate": 0.00022298358819641692, "loss": 0.0147, "step": 101770 }, { "epoch": 0.51, "learning_rate": 0.00022297602050340293, "loss": 0.0142, "step": 101780 }, { "epoch": 0.51, "learning_rate": 0.0002229684528103889, "loss": 0.0119, "step": 101790 }, { "epoch": 0.51, "learning_rate": 0.0002229608851173749, "loss": 0.0143, "step": 101800 }, { "epoch": 0.51, "learning_rate": 0.00022295331742436088, "loss": 0.0134, "step": 101810 }, { "epoch": 0.51, "learning_rate": 0.00022294574973134688, "loss": 0.0136, "step": 101820 }, { "epoch": 0.51, "learning_rate": 0.00022293818203833287, "loss": 0.0145, "step": 101830 }, { "epoch": 0.51, "learning_rate": 0.00022293061434531885, "loss": 0.0158, "step": 101840 }, { "epoch": 0.51, "learning_rate": 0.00022292304665230486, "loss": 0.0152, "step": 101850 }, { "epoch": 0.51, "learning_rate": 0.00022291547895929084, "loss": 0.0188, "step": 101860 }, { "epoch": 0.51, "learning_rate": 0.00022290791126627682, "loss": 0.0135, "step": 101870 }, { "epoch": 0.51, "learning_rate": 0.00022290034357326283, "loss": 0.0136, "step": 101880 }, { "epoch": 0.51, "learning_rate": 0.0002228927758802488, "loss": 0.0166, "step": 101890 }, { "epoch": 0.51, "learning_rate": 0.0002228852081872348, "loss": 0.016, "step": 101900 }, { "epoch": 0.51, "learning_rate": 0.0002228776404942208, "loss": 0.0161, "step": 101910 }, { "epoch": 0.51, "learning_rate": 0.00022287007280120678, "loss": 0.0154, "step": 101920 }, { "epoch": 0.51, "learning_rate": 0.00022286250510819276, "loss": 0.0179, "step": 101930 }, { "epoch": 0.51, "learning_rate": 0.00022285493741517877, "loss": 0.0133, "step": 101940 }, { "epoch": 0.51, "learning_rate": 0.00022284736972216475, "loss": 0.0145, "step": 101950 }, { "epoch": 0.51, "learning_rate": 0.00022283980202915073, "loss": 0.0141, "step": 101960 }, { "epoch": 0.51, "learning_rate": 0.00022283223433613671, "loss": 0.0124, "step": 101970 }, { "epoch": 0.51, "learning_rate": 0.00022282466664312272, "loss": 0.0195, "step": 101980 }, { "epoch": 0.51, "learning_rate": 0.0002228170989501087, "loss": 0.0167, "step": 101990 }, { "epoch": 0.51, "learning_rate": 0.00022280953125709469, "loss": 0.0192, "step": 102000 }, { "epoch": 0.51, "eval_cer": 0.9145119829365546, "eval_loss": 0.01138813141733408, "eval_runtime": 116.604, "eval_samples_per_second": 17.152, "eval_steps_per_second": 4.288, "step": 102000 }, { "epoch": 0.51, "learning_rate": 0.0002228019635640807, "loss": 0.0137, "step": 102010 }, { "epoch": 0.51, "learning_rate": 0.00022279439587106668, "loss": 0.0162, "step": 102020 }, { "epoch": 0.51, "learning_rate": 0.00022278682817805266, "loss": 0.0133, "step": 102030 }, { "epoch": 0.51, "learning_rate": 0.00022277926048503867, "loss": 0.0145, "step": 102040 }, { "epoch": 0.51, "learning_rate": 0.00022277169279202465, "loss": 0.0159, "step": 102050 }, { "epoch": 0.51, "learning_rate": 0.00022276412509901063, "loss": 0.0133, "step": 102060 }, { "epoch": 0.51, "learning_rate": 0.00022275655740599664, "loss": 0.0162, "step": 102070 }, { "epoch": 0.52, "learning_rate": 0.00022274898971298262, "loss": 0.0128, "step": 102080 }, { "epoch": 0.52, "learning_rate": 0.0002227414220199686, "loss": 0.0179, "step": 102090 }, { "epoch": 0.52, "learning_rate": 0.0002227338543269546, "loss": 0.015, "step": 102100 }, { "epoch": 0.52, "learning_rate": 0.0002227262866339406, "loss": 0.0145, "step": 102110 }, { "epoch": 0.52, "learning_rate": 0.00022271871894092657, "loss": 0.0146, "step": 102120 }, { "epoch": 0.52, "learning_rate": 0.00022271115124791258, "loss": 0.0182, "step": 102130 }, { "epoch": 0.52, "learning_rate": 0.00022270358355489856, "loss": 0.0148, "step": 102140 }, { "epoch": 0.52, "learning_rate": 0.00022269601586188454, "loss": 0.0123, "step": 102150 }, { "epoch": 0.52, "learning_rate": 0.00022268844816887052, "loss": 0.0175, "step": 102160 }, { "epoch": 0.52, "learning_rate": 0.00022268088047585653, "loss": 0.0134, "step": 102170 }, { "epoch": 0.52, "learning_rate": 0.00022267331278284251, "loss": 0.016, "step": 102180 }, { "epoch": 0.52, "learning_rate": 0.0002226657450898285, "loss": 0.014, "step": 102190 }, { "epoch": 0.52, "learning_rate": 0.0002226581773968145, "loss": 0.0111, "step": 102200 }, { "epoch": 0.52, "learning_rate": 0.00022265060970380049, "loss": 0.0173, "step": 102210 }, { "epoch": 0.52, "learning_rate": 0.00022264304201078647, "loss": 0.017, "step": 102220 }, { "epoch": 0.52, "learning_rate": 0.00022263547431777248, "loss": 0.0149, "step": 102230 }, { "epoch": 0.52, "learning_rate": 0.00022262790662475846, "loss": 0.0152, "step": 102240 }, { "epoch": 0.52, "learning_rate": 0.00022262033893174444, "loss": 0.0172, "step": 102250 }, { "epoch": 0.52, "learning_rate": 0.00022261277123873045, "loss": 0.0135, "step": 102260 }, { "epoch": 0.52, "learning_rate": 0.00022260520354571643, "loss": 0.0133, "step": 102270 }, { "epoch": 0.52, "learning_rate": 0.0002225976358527024, "loss": 0.0167, "step": 102280 }, { "epoch": 0.52, "learning_rate": 0.00022259006815968842, "loss": 0.0186, "step": 102290 }, { "epoch": 0.52, "learning_rate": 0.0002225825004666744, "loss": 0.0169, "step": 102300 }, { "epoch": 0.52, "learning_rate": 0.00022257493277366038, "loss": 0.0156, "step": 102310 }, { "epoch": 0.52, "learning_rate": 0.00022256736508064636, "loss": 0.0163, "step": 102320 }, { "epoch": 0.52, "learning_rate": 0.00022255979738763237, "loss": 0.0146, "step": 102330 }, { "epoch": 0.52, "learning_rate": 0.00022255222969461835, "loss": 0.0174, "step": 102340 }, { "epoch": 0.52, "learning_rate": 0.00022254466200160433, "loss": 0.0162, "step": 102350 }, { "epoch": 0.52, "learning_rate": 0.00022253709430859034, "loss": 0.0138, "step": 102360 }, { "epoch": 0.52, "learning_rate": 0.00022252952661557632, "loss": 0.0161, "step": 102370 }, { "epoch": 0.52, "learning_rate": 0.0002225219589225623, "loss": 0.0181, "step": 102380 }, { "epoch": 0.52, "learning_rate": 0.00022251439122954831, "loss": 0.0213, "step": 102390 }, { "epoch": 0.52, "learning_rate": 0.0002225068235365343, "loss": 0.0141, "step": 102400 }, { "epoch": 0.52, "learning_rate": 0.00022249925584352028, "loss": 0.0218, "step": 102410 }, { "epoch": 0.52, "learning_rate": 0.00022249168815050629, "loss": 0.0169, "step": 102420 }, { "epoch": 0.52, "learning_rate": 0.00022248412045749227, "loss": 0.0152, "step": 102430 }, { "epoch": 0.52, "learning_rate": 0.00022247655276447822, "loss": 0.0142, "step": 102440 }, { "epoch": 0.52, "learning_rate": 0.0002224689850714642, "loss": 0.0187, "step": 102450 }, { "epoch": 0.52, "learning_rate": 0.0002224614173784502, "loss": 0.0159, "step": 102460 }, { "epoch": 0.52, "learning_rate": 0.0002224538496854362, "loss": 0.0148, "step": 102470 }, { "epoch": 0.52, "learning_rate": 0.00022244628199242217, "loss": 0.0145, "step": 102480 }, { "epoch": 0.52, "learning_rate": 0.00022243871429940818, "loss": 0.014, "step": 102490 }, { "epoch": 0.52, "learning_rate": 0.00022243114660639416, "loss": 0.0149, "step": 102500 }, { "epoch": 0.52, "learning_rate": 0.00022242357891338015, "loss": 0.0132, "step": 102510 }, { "epoch": 0.52, "learning_rate": 0.00022241601122036615, "loss": 0.0168, "step": 102520 }, { "epoch": 0.52, "learning_rate": 0.00022240844352735214, "loss": 0.0139, "step": 102530 }, { "epoch": 0.52, "learning_rate": 0.00022240087583433812, "loss": 0.0145, "step": 102540 }, { "epoch": 0.52, "learning_rate": 0.0002223933081413241, "loss": 0.0173, "step": 102550 }, { "epoch": 0.52, "learning_rate": 0.0002223857404483101, "loss": 0.0205, "step": 102560 }, { "epoch": 0.52, "learning_rate": 0.0002223781727552961, "loss": 0.0146, "step": 102570 }, { "epoch": 0.52, "learning_rate": 0.00022237060506228207, "loss": 0.0136, "step": 102580 }, { "epoch": 0.52, "learning_rate": 0.00022236303736926808, "loss": 0.0149, "step": 102590 }, { "epoch": 0.52, "learning_rate": 0.00022235546967625406, "loss": 0.0143, "step": 102600 }, { "epoch": 0.52, "learning_rate": 0.00022234790198324004, "loss": 0.0159, "step": 102610 }, { "epoch": 0.52, "learning_rate": 0.00022234033429022605, "loss": 0.0169, "step": 102620 }, { "epoch": 0.52, "learning_rate": 0.00022233276659721203, "loss": 0.0129, "step": 102630 }, { "epoch": 0.52, "learning_rate": 0.000222325198904198, "loss": 0.0146, "step": 102640 }, { "epoch": 0.52, "learning_rate": 0.00022231763121118402, "loss": 0.0179, "step": 102650 }, { "epoch": 0.52, "learning_rate": 0.00022231006351817, "loss": 0.0157, "step": 102660 }, { "epoch": 0.52, "learning_rate": 0.00022230249582515598, "loss": 0.0201, "step": 102670 }, { "epoch": 0.52, "learning_rate": 0.000222294928132142, "loss": 0.0174, "step": 102680 }, { "epoch": 0.52, "learning_rate": 0.00022228736043912797, "loss": 0.0153, "step": 102690 }, { "epoch": 0.52, "learning_rate": 0.00022227979274611396, "loss": 0.0131, "step": 102700 }, { "epoch": 0.52, "learning_rate": 0.00022227222505309994, "loss": 0.0157, "step": 102710 }, { "epoch": 0.52, "learning_rate": 0.00022226465736008595, "loss": 0.0172, "step": 102720 }, { "epoch": 0.52, "learning_rate": 0.00022225708966707193, "loss": 0.0176, "step": 102730 }, { "epoch": 0.52, "learning_rate": 0.0002222495219740579, "loss": 0.0145, "step": 102740 }, { "epoch": 0.52, "learning_rate": 0.00022224195428104392, "loss": 0.0181, "step": 102750 }, { "epoch": 0.52, "learning_rate": 0.0002222343865880299, "loss": 0.0167, "step": 102760 }, { "epoch": 0.52, "learning_rate": 0.00022222681889501588, "loss": 0.0166, "step": 102770 }, { "epoch": 0.52, "learning_rate": 0.0002222192512020019, "loss": 0.0138, "step": 102780 }, { "epoch": 0.52, "learning_rate": 0.00022221168350898787, "loss": 0.0157, "step": 102790 }, { "epoch": 0.52, "learning_rate": 0.00022220411581597385, "loss": 0.0216, "step": 102800 }, { "epoch": 0.52, "learning_rate": 0.00022219654812295986, "loss": 0.0148, "step": 102810 }, { "epoch": 0.52, "learning_rate": 0.00022218898042994584, "loss": 0.0175, "step": 102820 }, { "epoch": 0.52, "learning_rate": 0.00022218141273693182, "loss": 0.0178, "step": 102830 }, { "epoch": 0.52, "learning_rate": 0.00022217384504391783, "loss": 0.0176, "step": 102840 }, { "epoch": 0.52, "learning_rate": 0.0002221662773509038, "loss": 0.0142, "step": 102850 }, { "epoch": 0.52, "learning_rate": 0.0002221587096578898, "loss": 0.0157, "step": 102860 }, { "epoch": 0.52, "learning_rate": 0.00022215114196487578, "loss": 0.0124, "step": 102870 }, { "epoch": 0.52, "learning_rate": 0.00022214357427186178, "loss": 0.0156, "step": 102880 }, { "epoch": 0.52, "learning_rate": 0.00022213600657884777, "loss": 0.0133, "step": 102890 }, { "epoch": 0.52, "learning_rate": 0.00022212843888583375, "loss": 0.0142, "step": 102900 }, { "epoch": 0.52, "learning_rate": 0.00022212087119281976, "loss": 0.018, "step": 102910 }, { "epoch": 0.52, "learning_rate": 0.00022211330349980574, "loss": 0.016, "step": 102920 }, { "epoch": 0.52, "learning_rate": 0.00022210573580679172, "loss": 0.0134, "step": 102930 }, { "epoch": 0.52, "learning_rate": 0.00022209816811377773, "loss": 0.0178, "step": 102940 }, { "epoch": 0.52, "learning_rate": 0.0002220906004207637, "loss": 0.0167, "step": 102950 }, { "epoch": 0.52, "learning_rate": 0.0002220830327277497, "loss": 0.0121, "step": 102960 }, { "epoch": 0.52, "learning_rate": 0.0002220754650347357, "loss": 0.0166, "step": 102970 }, { "epoch": 0.52, "learning_rate": 0.00022206789734172168, "loss": 0.0175, "step": 102980 }, { "epoch": 0.52, "learning_rate": 0.00022206032964870766, "loss": 0.0172, "step": 102990 }, { "epoch": 0.52, "learning_rate": 0.00022205276195569367, "loss": 0.0146, "step": 103000 }, { "epoch": 0.52, "eval_cer": 0.9144828710527925, "eval_loss": 0.011572513729333878, "eval_runtime": 116.71, "eval_samples_per_second": 17.136, "eval_steps_per_second": 4.284, "step": 103000 }, { "epoch": 0.52, "learning_rate": 0.00022204519426267965, "loss": 0.0157, "step": 103010 }, { "epoch": 0.52, "learning_rate": 0.00022203762656966563, "loss": 0.0173, "step": 103020 }, { "epoch": 0.52, "learning_rate": 0.00022203005887665164, "loss": 0.0147, "step": 103030 }, { "epoch": 0.52, "learning_rate": 0.00022202249118363762, "loss": 0.0159, "step": 103040 }, { "epoch": 0.52, "learning_rate": 0.0002220149234906236, "loss": 0.0166, "step": 103050 }, { "epoch": 0.52, "learning_rate": 0.00022200735579760959, "loss": 0.0133, "step": 103060 }, { "epoch": 0.52, "learning_rate": 0.0002219997881045956, "loss": 0.019, "step": 103070 }, { "epoch": 0.52, "learning_rate": 0.00022199222041158158, "loss": 0.0156, "step": 103080 }, { "epoch": 0.52, "learning_rate": 0.00022198465271856756, "loss": 0.0138, "step": 103090 }, { "epoch": 0.52, "learning_rate": 0.00022197708502555357, "loss": 0.0165, "step": 103100 }, { "epoch": 0.52, "learning_rate": 0.00022196951733253955, "loss": 0.0155, "step": 103110 }, { "epoch": 0.52, "learning_rate": 0.00022196194963952553, "loss": 0.0132, "step": 103120 }, { "epoch": 0.52, "learning_rate": 0.00022195438194651154, "loss": 0.014, "step": 103130 }, { "epoch": 0.52, "learning_rate": 0.00022194681425349752, "loss": 0.0137, "step": 103140 }, { "epoch": 0.52, "learning_rate": 0.0002219392465604835, "loss": 0.0151, "step": 103150 }, { "epoch": 0.52, "learning_rate": 0.0002219316788674695, "loss": 0.0145, "step": 103160 }, { "epoch": 0.52, "learning_rate": 0.0002219241111744555, "loss": 0.0143, "step": 103170 }, { "epoch": 0.52, "learning_rate": 0.00022191654348144147, "loss": 0.0154, "step": 103180 }, { "epoch": 0.52, "learning_rate": 0.00022190897578842748, "loss": 0.0135, "step": 103190 }, { "epoch": 0.52, "learning_rate": 0.00022190140809541346, "loss": 0.0154, "step": 103200 }, { "epoch": 0.52, "learning_rate": 0.00022189384040239944, "loss": 0.0154, "step": 103210 }, { "epoch": 0.52, "learning_rate": 0.00022188627270938542, "loss": 0.0158, "step": 103220 }, { "epoch": 0.52, "learning_rate": 0.00022187870501637143, "loss": 0.0153, "step": 103230 }, { "epoch": 0.52, "learning_rate": 0.00022187113732335741, "loss": 0.0149, "step": 103240 }, { "epoch": 0.52, "learning_rate": 0.0002218635696303434, "loss": 0.0184, "step": 103250 }, { "epoch": 0.52, "learning_rate": 0.0002218560019373294, "loss": 0.0157, "step": 103260 }, { "epoch": 0.52, "learning_rate": 0.00022184843424431539, "loss": 0.016, "step": 103270 }, { "epoch": 0.52, "learning_rate": 0.00022184086655130137, "loss": 0.0157, "step": 103280 }, { "epoch": 0.52, "learning_rate": 0.00022183329885828738, "loss": 0.0153, "step": 103290 }, { "epoch": 0.52, "learning_rate": 0.00022182573116527336, "loss": 0.0168, "step": 103300 }, { "epoch": 0.52, "learning_rate": 0.00022181816347225934, "loss": 0.0129, "step": 103310 }, { "epoch": 0.52, "learning_rate": 0.00022181059577924535, "loss": 0.0168, "step": 103320 }, { "epoch": 0.52, "learning_rate": 0.00022180302808623133, "loss": 0.0216, "step": 103330 }, { "epoch": 0.52, "learning_rate": 0.0002217954603932173, "loss": 0.0155, "step": 103340 }, { "epoch": 0.52, "learning_rate": 0.00022178789270020332, "loss": 0.0165, "step": 103350 }, { "epoch": 0.52, "learning_rate": 0.0002217803250071893, "loss": 0.0133, "step": 103360 }, { "epoch": 0.52, "learning_rate": 0.00022177275731417528, "loss": 0.0164, "step": 103370 }, { "epoch": 0.52, "learning_rate": 0.00022176518962116126, "loss": 0.0176, "step": 103380 }, { "epoch": 0.52, "learning_rate": 0.00022175762192814727, "loss": 0.0157, "step": 103390 }, { "epoch": 0.52, "learning_rate": 0.00022175005423513325, "loss": 0.0166, "step": 103400 }, { "epoch": 0.52, "learning_rate": 0.00022174248654211923, "loss": 0.0134, "step": 103410 }, { "epoch": 0.52, "learning_rate": 0.00022173491884910524, "loss": 0.0163, "step": 103420 }, { "epoch": 0.52, "learning_rate": 0.00022172735115609122, "loss": 0.019, "step": 103430 }, { "epoch": 0.52, "learning_rate": 0.0002217197834630772, "loss": 0.0143, "step": 103440 }, { "epoch": 0.52, "learning_rate": 0.00022171221577006321, "loss": 0.0175, "step": 103450 }, { "epoch": 0.52, "learning_rate": 0.0002217046480770492, "loss": 0.03, "step": 103460 }, { "epoch": 0.52, "learning_rate": 0.00022169708038403518, "loss": 0.0142, "step": 103470 }, { "epoch": 0.52, "learning_rate": 0.00022168951269102119, "loss": 0.0197, "step": 103480 }, { "epoch": 0.52, "learning_rate": 0.00022168194499800717, "loss": 0.015, "step": 103490 }, { "epoch": 0.52, "learning_rate": 0.00022167437730499315, "loss": 0.0146, "step": 103500 }, { "epoch": 0.52, "learning_rate": 0.00022166680961197916, "loss": 0.0138, "step": 103510 }, { "epoch": 0.52, "learning_rate": 0.00022165924191896514, "loss": 0.0151, "step": 103520 }, { "epoch": 0.52, "learning_rate": 0.00022165167422595112, "loss": 0.018, "step": 103530 }, { "epoch": 0.52, "learning_rate": 0.00022164410653293713, "loss": 0.0167, "step": 103540 }, { "epoch": 0.52, "learning_rate": 0.0002216365388399231, "loss": 0.0158, "step": 103550 }, { "epoch": 0.52, "learning_rate": 0.0002216289711469091, "loss": 0.0211, "step": 103560 }, { "epoch": 0.52, "learning_rate": 0.00022162140345389507, "loss": 0.0145, "step": 103570 }, { "epoch": 0.52, "learning_rate": 0.00022161383576088108, "loss": 0.0159, "step": 103580 }, { "epoch": 0.52, "learning_rate": 0.00022160626806786706, "loss": 0.0139, "step": 103590 }, { "epoch": 0.52, "learning_rate": 0.00022159870037485304, "loss": 0.0145, "step": 103600 }, { "epoch": 0.52, "learning_rate": 0.00022159113268183905, "loss": 0.0156, "step": 103610 }, { "epoch": 0.52, "learning_rate": 0.00022158356498882503, "loss": 0.0138, "step": 103620 }, { "epoch": 0.52, "learning_rate": 0.00022157599729581102, "loss": 0.02, "step": 103630 }, { "epoch": 0.52, "learning_rate": 0.00022156842960279702, "loss": 0.0142, "step": 103640 }, { "epoch": 0.52, "learning_rate": 0.000221560861909783, "loss": 0.0153, "step": 103650 }, { "epoch": 0.52, "learning_rate": 0.000221553294216769, "loss": 0.0156, "step": 103660 }, { "epoch": 0.52, "learning_rate": 0.000221545726523755, "loss": 0.0158, "step": 103670 }, { "epoch": 0.52, "learning_rate": 0.00022153815883074098, "loss": 0.0144, "step": 103680 }, { "epoch": 0.52, "learning_rate": 0.00022153059113772696, "loss": 0.0126, "step": 103690 }, { "epoch": 0.52, "learning_rate": 0.0002215230234447129, "loss": 0.0229, "step": 103700 }, { "epoch": 0.52, "learning_rate": 0.00022151545575169892, "loss": 0.016, "step": 103710 }, { "epoch": 0.52, "learning_rate": 0.0002215078880586849, "loss": 0.0139, "step": 103720 }, { "epoch": 0.52, "learning_rate": 0.00022150032036567088, "loss": 0.0166, "step": 103730 }, { "epoch": 0.52, "learning_rate": 0.0002214927526726569, "loss": 0.0151, "step": 103740 }, { "epoch": 0.52, "learning_rate": 0.00022148518497964287, "loss": 0.0144, "step": 103750 }, { "epoch": 0.52, "learning_rate": 0.00022147761728662886, "loss": 0.0166, "step": 103760 }, { "epoch": 0.52, "learning_rate": 0.00022147004959361484, "loss": 0.0164, "step": 103770 }, { "epoch": 0.52, "learning_rate": 0.00022146248190060085, "loss": 0.0161, "step": 103780 }, { "epoch": 0.52, "learning_rate": 0.00022145491420758683, "loss": 0.0156, "step": 103790 }, { "epoch": 0.52, "learning_rate": 0.0002214473465145728, "loss": 0.0187, "step": 103800 }, { "epoch": 0.52, "learning_rate": 0.00022143977882155882, "loss": 0.0165, "step": 103810 }, { "epoch": 0.52, "learning_rate": 0.0002214322111285448, "loss": 0.0166, "step": 103820 }, { "epoch": 0.52, "learning_rate": 0.00022142464343553078, "loss": 0.015, "step": 103830 }, { "epoch": 0.52, "learning_rate": 0.0002214170757425168, "loss": 0.0156, "step": 103840 }, { "epoch": 0.52, "learning_rate": 0.00022140950804950277, "loss": 0.0167, "step": 103850 }, { "epoch": 0.52, "learning_rate": 0.00022140194035648875, "loss": 0.0155, "step": 103860 }, { "epoch": 0.52, "learning_rate": 0.00022139437266347476, "loss": 0.0147, "step": 103870 }, { "epoch": 0.52, "learning_rate": 0.00022138680497046074, "loss": 0.0185, "step": 103880 }, { "epoch": 0.52, "learning_rate": 0.00022137923727744672, "loss": 0.0142, "step": 103890 }, { "epoch": 0.52, "learning_rate": 0.00022137166958443273, "loss": 0.0156, "step": 103900 }, { "epoch": 0.52, "learning_rate": 0.0002213641018914187, "loss": 0.0155, "step": 103910 }, { "epoch": 0.52, "learning_rate": 0.0002213565341984047, "loss": 0.0129, "step": 103920 }, { "epoch": 0.52, "learning_rate": 0.0002213489665053907, "loss": 0.0154, "step": 103930 }, { "epoch": 0.52, "learning_rate": 0.00022134139881237668, "loss": 0.0125, "step": 103940 }, { "epoch": 0.52, "learning_rate": 0.00022133383111936267, "loss": 0.0165, "step": 103950 }, { "epoch": 0.52, "learning_rate": 0.00022132626342634865, "loss": 0.0142, "step": 103960 }, { "epoch": 0.52, "learning_rate": 0.00022131869573333466, "loss": 0.0153, "step": 103970 }, { "epoch": 0.52, "learning_rate": 0.00022131112804032064, "loss": 0.0166, "step": 103980 }, { "epoch": 0.52, "learning_rate": 0.00022130356034730662, "loss": 0.0114, "step": 103990 }, { "epoch": 0.52, "learning_rate": 0.00022129599265429263, "loss": 0.0178, "step": 104000 }, { "epoch": 0.52, "eval_cer": 0.9145071309559275, "eval_loss": 0.01152227446436882, "eval_runtime": 116.6853, "eval_samples_per_second": 17.14, "eval_steps_per_second": 4.285, "step": 104000 }, { "epoch": 0.52, "learning_rate": 0.0002212884249612786, "loss": 0.017, "step": 104010 }, { "epoch": 0.52, "learning_rate": 0.0002212808572682646, "loss": 0.0172, "step": 104020 }, { "epoch": 0.52, "learning_rate": 0.0002212732895752506, "loss": 0.017, "step": 104030 }, { "epoch": 0.52, "learning_rate": 0.00022126572188223658, "loss": 0.0133, "step": 104040 }, { "epoch": 0.52, "learning_rate": 0.00022125815418922256, "loss": 0.0159, "step": 104050 }, { "epoch": 0.52, "learning_rate": 0.00022125058649620857, "loss": 0.0134, "step": 104060 }, { "epoch": 0.53, "learning_rate": 0.00022124301880319455, "loss": 0.0152, "step": 104070 }, { "epoch": 0.53, "learning_rate": 0.00022123545111018053, "loss": 0.0161, "step": 104080 }, { "epoch": 0.53, "learning_rate": 0.00022122788341716654, "loss": 0.0185, "step": 104090 }, { "epoch": 0.53, "learning_rate": 0.00022122031572415252, "loss": 0.0135, "step": 104100 }, { "epoch": 0.53, "learning_rate": 0.0002212127480311385, "loss": 0.0162, "step": 104110 }, { "epoch": 0.53, "learning_rate": 0.0002212051803381245, "loss": 0.0162, "step": 104120 }, { "epoch": 0.53, "learning_rate": 0.0002211976126451105, "loss": 0.0143, "step": 104130 }, { "epoch": 0.53, "learning_rate": 0.00022119004495209648, "loss": 0.0179, "step": 104140 }, { "epoch": 0.53, "learning_rate": 0.00022118247725908246, "loss": 0.0159, "step": 104150 }, { "epoch": 0.53, "learning_rate": 0.00022117490956606847, "loss": 0.0132, "step": 104160 }, { "epoch": 0.53, "learning_rate": 0.00022116734187305445, "loss": 0.0149, "step": 104170 }, { "epoch": 0.53, "learning_rate": 0.00022115977418004043, "loss": 0.0153, "step": 104180 }, { "epoch": 0.53, "learning_rate": 0.00022115220648702644, "loss": 0.0149, "step": 104190 }, { "epoch": 0.53, "learning_rate": 0.00022114463879401242, "loss": 0.0133, "step": 104200 }, { "epoch": 0.53, "learning_rate": 0.0002211370711009984, "loss": 0.0234, "step": 104210 }, { "epoch": 0.53, "learning_rate": 0.0002211295034079844, "loss": 0.015, "step": 104220 }, { "epoch": 0.53, "learning_rate": 0.0002211219357149704, "loss": 0.019, "step": 104230 }, { "epoch": 0.53, "learning_rate": 0.00022111436802195637, "loss": 0.0151, "step": 104240 }, { "epoch": 0.53, "learning_rate": 0.00022110680032894238, "loss": 0.0173, "step": 104250 }, { "epoch": 0.53, "learning_rate": 0.00022109923263592836, "loss": 0.0144, "step": 104260 }, { "epoch": 0.53, "learning_rate": 0.00022109166494291434, "loss": 0.0125, "step": 104270 }, { "epoch": 0.53, "learning_rate": 0.00022108409724990033, "loss": 0.0159, "step": 104280 }, { "epoch": 0.53, "learning_rate": 0.00022107652955688633, "loss": 0.0124, "step": 104290 }, { "epoch": 0.53, "learning_rate": 0.00022106896186387232, "loss": 0.0134, "step": 104300 }, { "epoch": 0.53, "learning_rate": 0.0002210613941708583, "loss": 0.0159, "step": 104310 }, { "epoch": 0.53, "learning_rate": 0.0002210538264778443, "loss": 0.0167, "step": 104320 }, { "epoch": 0.53, "learning_rate": 0.0002210462587848303, "loss": 0.0154, "step": 104330 }, { "epoch": 0.53, "learning_rate": 0.00022103869109181627, "loss": 0.0148, "step": 104340 }, { "epoch": 0.53, "learning_rate": 0.00022103112339880228, "loss": 0.0202, "step": 104350 }, { "epoch": 0.53, "learning_rate": 0.00022102355570578826, "loss": 0.0176, "step": 104360 }, { "epoch": 0.53, "learning_rate": 0.00022101598801277424, "loss": 0.0138, "step": 104370 }, { "epoch": 0.53, "learning_rate": 0.00022100842031976025, "loss": 0.0135, "step": 104380 }, { "epoch": 0.53, "learning_rate": 0.00022100085262674623, "loss": 0.0159, "step": 104390 }, { "epoch": 0.53, "learning_rate": 0.0002209932849337322, "loss": 0.0148, "step": 104400 }, { "epoch": 0.53, "learning_rate": 0.00022098571724071822, "loss": 0.0152, "step": 104410 }, { "epoch": 0.53, "learning_rate": 0.0002209781495477042, "loss": 0.0187, "step": 104420 }, { "epoch": 0.53, "learning_rate": 0.00022097058185469018, "loss": 0.0153, "step": 104430 }, { "epoch": 0.53, "learning_rate": 0.0002209630141616762, "loss": 0.0169, "step": 104440 }, { "epoch": 0.53, "learning_rate": 0.00022095544646866217, "loss": 0.0155, "step": 104450 }, { "epoch": 0.53, "learning_rate": 0.00022094787877564815, "loss": 0.0154, "step": 104460 }, { "epoch": 0.53, "learning_rate": 0.00022094031108263414, "loss": 0.0214, "step": 104470 }, { "epoch": 0.53, "learning_rate": 0.00022093274338962014, "loss": 0.0166, "step": 104480 }, { "epoch": 0.53, "learning_rate": 0.00022092517569660613, "loss": 0.0166, "step": 104490 }, { "epoch": 0.53, "learning_rate": 0.0002209176080035921, "loss": 0.0129, "step": 104500 }, { "epoch": 0.53, "learning_rate": 0.00022091004031057812, "loss": 0.0147, "step": 104510 }, { "epoch": 0.53, "learning_rate": 0.0002209024726175641, "loss": 0.0187, "step": 104520 }, { "epoch": 0.53, "learning_rate": 0.00022089490492455008, "loss": 0.0137, "step": 104530 }, { "epoch": 0.53, "learning_rate": 0.0002208873372315361, "loss": 0.0161, "step": 104540 }, { "epoch": 0.53, "learning_rate": 0.00022087976953852207, "loss": 0.0167, "step": 104550 }, { "epoch": 0.53, "learning_rate": 0.00022087220184550805, "loss": 0.0148, "step": 104560 }, { "epoch": 0.53, "learning_rate": 0.00022086463415249406, "loss": 0.0161, "step": 104570 }, { "epoch": 0.53, "learning_rate": 0.00022085706645948004, "loss": 0.0145, "step": 104580 }, { "epoch": 0.53, "learning_rate": 0.00022084949876646602, "loss": 0.0169, "step": 104590 }, { "epoch": 0.53, "learning_rate": 0.00022084193107345203, "loss": 0.0157, "step": 104600 }, { "epoch": 0.53, "learning_rate": 0.000220834363380438, "loss": 0.015, "step": 104610 }, { "epoch": 0.53, "learning_rate": 0.000220826795687424, "loss": 0.0147, "step": 104620 }, { "epoch": 0.53, "learning_rate": 0.00022081922799440997, "loss": 0.0168, "step": 104630 }, { "epoch": 0.53, "learning_rate": 0.00022081166030139598, "loss": 0.0171, "step": 104640 }, { "epoch": 0.53, "learning_rate": 0.00022080409260838196, "loss": 0.0161, "step": 104650 }, { "epoch": 0.53, "learning_rate": 0.00022079652491536795, "loss": 0.0175, "step": 104660 }, { "epoch": 0.53, "learning_rate": 0.00022078895722235395, "loss": 0.0151, "step": 104670 }, { "epoch": 0.53, "learning_rate": 0.00022078138952933994, "loss": 0.0162, "step": 104680 }, { "epoch": 0.53, "learning_rate": 0.00022077382183632592, "loss": 0.0147, "step": 104690 }, { "epoch": 0.53, "learning_rate": 0.00022076625414331193, "loss": 0.0147, "step": 104700 }, { "epoch": 0.53, "learning_rate": 0.0002207586864502979, "loss": 0.0165, "step": 104710 }, { "epoch": 0.53, "learning_rate": 0.0002207511187572839, "loss": 0.0146, "step": 104720 }, { "epoch": 0.53, "learning_rate": 0.0002207435510642699, "loss": 0.019, "step": 104730 }, { "epoch": 0.53, "learning_rate": 0.00022073598337125588, "loss": 0.0171, "step": 104740 }, { "epoch": 0.53, "learning_rate": 0.00022072841567824186, "loss": 0.0163, "step": 104750 }, { "epoch": 0.53, "learning_rate": 0.00022072084798522787, "loss": 0.0176, "step": 104760 }, { "epoch": 0.53, "learning_rate": 0.00022071328029221385, "loss": 0.012, "step": 104770 }, { "epoch": 0.53, "learning_rate": 0.00022070571259919983, "loss": 0.013, "step": 104780 }, { "epoch": 0.53, "learning_rate": 0.0002206981449061858, "loss": 0.0134, "step": 104790 }, { "epoch": 0.53, "learning_rate": 0.00022069057721317182, "loss": 0.0151, "step": 104800 }, { "epoch": 0.53, "learning_rate": 0.0002206830095201578, "loss": 0.0211, "step": 104810 }, { "epoch": 0.53, "learning_rate": 0.00022067544182714378, "loss": 0.0153, "step": 104820 }, { "epoch": 0.53, "learning_rate": 0.0002206678741341298, "loss": 0.0186, "step": 104830 }, { "epoch": 0.53, "learning_rate": 0.00022066030644111577, "loss": 0.0161, "step": 104840 }, { "epoch": 0.53, "learning_rate": 0.00022065273874810176, "loss": 0.0184, "step": 104850 }, { "epoch": 0.53, "learning_rate": 0.00022064517105508776, "loss": 0.0146, "step": 104860 }, { "epoch": 0.53, "learning_rate": 0.00022063760336207375, "loss": 0.0152, "step": 104870 }, { "epoch": 0.53, "learning_rate": 0.00022063003566905973, "loss": 0.0127, "step": 104880 }, { "epoch": 0.53, "learning_rate": 0.00022062246797604574, "loss": 0.0163, "step": 104890 }, { "epoch": 0.53, "learning_rate": 0.00022061490028303172, "loss": 0.015, "step": 104900 }, { "epoch": 0.53, "learning_rate": 0.0002206073325900177, "loss": 0.0136, "step": 104910 }, { "epoch": 0.53, "learning_rate": 0.0002205997648970037, "loss": 0.0136, "step": 104920 }, { "epoch": 0.53, "learning_rate": 0.0002205921972039897, "loss": 0.0199, "step": 104930 }, { "epoch": 0.53, "learning_rate": 0.00022058462951097567, "loss": 0.0151, "step": 104940 }, { "epoch": 0.53, "learning_rate": 0.00022057706181796165, "loss": 0.0161, "step": 104950 }, { "epoch": 0.53, "learning_rate": 0.00022056949412494763, "loss": 0.0142, "step": 104960 }, { "epoch": 0.53, "learning_rate": 0.00022056192643193361, "loss": 0.013, "step": 104970 }, { "epoch": 0.53, "learning_rate": 0.0002205543587389196, "loss": 0.0197, "step": 104980 }, { "epoch": 0.53, "learning_rate": 0.0002205467910459056, "loss": 0.0173, "step": 104990 }, { "epoch": 0.53, "learning_rate": 0.00022053922335289159, "loss": 0.018, "step": 105000 }, { "epoch": 0.53, "eval_cer": 0.9144848118450433, "eval_loss": 0.011399283073842525, "eval_runtime": 116.6482, "eval_samples_per_second": 17.146, "eval_steps_per_second": 4.286, "step": 105000 }, { "epoch": 0.53, "learning_rate": 0.00022053165565987757, "loss": 0.0184, "step": 105010 }, { "epoch": 0.53, "learning_rate": 0.00022052408796686355, "loss": 0.0154, "step": 105020 }, { "epoch": 0.53, "learning_rate": 0.00022051652027384956, "loss": 0.015, "step": 105030 }, { "epoch": 0.53, "learning_rate": 0.00022050895258083554, "loss": 0.0146, "step": 105040 }, { "epoch": 0.53, "learning_rate": 0.00022050138488782152, "loss": 0.016, "step": 105050 }, { "epoch": 0.53, "learning_rate": 0.00022049381719480753, "loss": 0.0169, "step": 105060 }, { "epoch": 0.53, "learning_rate": 0.0002204862495017935, "loss": 0.0165, "step": 105070 }, { "epoch": 0.53, "learning_rate": 0.0002204786818087795, "loss": 0.0157, "step": 105080 }, { "epoch": 0.53, "learning_rate": 0.0002204711141157655, "loss": 0.0145, "step": 105090 }, { "epoch": 0.53, "learning_rate": 0.00022046354642275148, "loss": 0.0233, "step": 105100 }, { "epoch": 0.53, "learning_rate": 0.00022045597872973746, "loss": 0.0156, "step": 105110 }, { "epoch": 0.53, "learning_rate": 0.00022044841103672347, "loss": 0.0163, "step": 105120 }, { "epoch": 0.53, "learning_rate": 0.00022044084334370945, "loss": 0.0163, "step": 105130 }, { "epoch": 0.53, "learning_rate": 0.00022043327565069543, "loss": 0.0185, "step": 105140 }, { "epoch": 0.53, "learning_rate": 0.00022042570795768144, "loss": 0.0161, "step": 105150 }, { "epoch": 0.53, "learning_rate": 0.00022041814026466742, "loss": 0.0168, "step": 105160 }, { "epoch": 0.53, "learning_rate": 0.0002204105725716534, "loss": 0.0132, "step": 105170 }, { "epoch": 0.53, "learning_rate": 0.0002204030048786394, "loss": 0.0138, "step": 105180 }, { "epoch": 0.53, "learning_rate": 0.0002203954371856254, "loss": 0.016, "step": 105190 }, { "epoch": 0.53, "learning_rate": 0.00022038786949261138, "loss": 0.0129, "step": 105200 }, { "epoch": 0.53, "learning_rate": 0.00022038030179959736, "loss": 0.018, "step": 105210 }, { "epoch": 0.53, "learning_rate": 0.00022037273410658337, "loss": 0.0156, "step": 105220 }, { "epoch": 0.53, "learning_rate": 0.00022036516641356935, "loss": 0.0149, "step": 105230 }, { "epoch": 0.53, "learning_rate": 0.00022035759872055533, "loss": 0.0129, "step": 105240 }, { "epoch": 0.53, "learning_rate": 0.00022035003102754134, "loss": 0.0138, "step": 105250 }, { "epoch": 0.53, "learning_rate": 0.00022034246333452732, "loss": 0.0151, "step": 105260 }, { "epoch": 0.53, "learning_rate": 0.0002203348956415133, "loss": 0.0154, "step": 105270 }, { "epoch": 0.53, "learning_rate": 0.0002203273279484993, "loss": 0.0162, "step": 105280 }, { "epoch": 0.53, "learning_rate": 0.0002203197602554853, "loss": 0.0158, "step": 105290 }, { "epoch": 0.53, "learning_rate": 0.00022031219256247127, "loss": 0.0155, "step": 105300 }, { "epoch": 0.53, "learning_rate": 0.00022030462486945728, "loss": 0.0169, "step": 105310 }, { "epoch": 0.53, "learning_rate": 0.00022029705717644326, "loss": 0.0149, "step": 105320 }, { "epoch": 0.53, "learning_rate": 0.00022028948948342924, "loss": 0.017, "step": 105330 }, { "epoch": 0.53, "learning_rate": 0.00022028192179041525, "loss": 0.016, "step": 105340 }, { "epoch": 0.53, "learning_rate": 0.00022027435409740123, "loss": 0.0195, "step": 105350 }, { "epoch": 0.53, "learning_rate": 0.00022026678640438722, "loss": 0.0163, "step": 105360 }, { "epoch": 0.53, "learning_rate": 0.0002202592187113732, "loss": 0.0194, "step": 105370 }, { "epoch": 0.53, "learning_rate": 0.0002202516510183592, "loss": 0.0134, "step": 105380 }, { "epoch": 0.53, "learning_rate": 0.0002202440833253452, "loss": 0.0166, "step": 105390 }, { "epoch": 0.53, "learning_rate": 0.00022023651563233117, "loss": 0.0136, "step": 105400 }, { "epoch": 0.53, "learning_rate": 0.00022022894793931718, "loss": 0.0141, "step": 105410 }, { "epoch": 0.53, "learning_rate": 0.00022022138024630316, "loss": 0.0151, "step": 105420 }, { "epoch": 0.53, "learning_rate": 0.00022021381255328914, "loss": 0.0143, "step": 105430 }, { "epoch": 0.53, "learning_rate": 0.00022020624486027515, "loss": 0.0155, "step": 105440 }, { "epoch": 0.53, "learning_rate": 0.00022019867716726113, "loss": 0.0214, "step": 105450 }, { "epoch": 0.53, "learning_rate": 0.0002201911094742471, "loss": 0.015, "step": 105460 }, { "epoch": 0.53, "learning_rate": 0.00022018354178123312, "loss": 0.0156, "step": 105470 }, { "epoch": 0.53, "learning_rate": 0.0002201759740882191, "loss": 0.0166, "step": 105480 }, { "epoch": 0.53, "learning_rate": 0.00022016840639520508, "loss": 0.0133, "step": 105490 }, { "epoch": 0.53, "learning_rate": 0.0002201608387021911, "loss": 0.0131, "step": 105500 }, { "epoch": 0.53, "learning_rate": 0.00022015327100917707, "loss": 0.0165, "step": 105510 }, { "epoch": 0.53, "learning_rate": 0.00022014570331616305, "loss": 0.0157, "step": 105520 }, { "epoch": 0.53, "learning_rate": 0.00022013813562314904, "loss": 0.0125, "step": 105530 }, { "epoch": 0.53, "learning_rate": 0.00022013056793013504, "loss": 0.0153, "step": 105540 }, { "epoch": 0.53, "learning_rate": 0.00022012300023712103, "loss": 0.0188, "step": 105550 }, { "epoch": 0.53, "learning_rate": 0.000220115432544107, "loss": 0.0133, "step": 105560 }, { "epoch": 0.53, "learning_rate": 0.00022010786485109302, "loss": 0.0173, "step": 105570 }, { "epoch": 0.53, "learning_rate": 0.000220100297158079, "loss": 0.0149, "step": 105580 }, { "epoch": 0.53, "learning_rate": 0.00022009272946506498, "loss": 0.0133, "step": 105590 }, { "epoch": 0.53, "learning_rate": 0.000220085161772051, "loss": 0.0187, "step": 105600 }, { "epoch": 0.53, "learning_rate": 0.00022007759407903697, "loss": 0.0186, "step": 105610 }, { "epoch": 0.53, "learning_rate": 0.00022007002638602295, "loss": 0.0146, "step": 105620 }, { "epoch": 0.53, "learning_rate": 0.00022006245869300896, "loss": 0.0139, "step": 105630 }, { "epoch": 0.53, "learning_rate": 0.00022005489099999494, "loss": 0.0125, "step": 105640 }, { "epoch": 0.53, "learning_rate": 0.00022004732330698092, "loss": 0.0139, "step": 105650 }, { "epoch": 0.53, "learning_rate": 0.00022003975561396693, "loss": 0.0158, "step": 105660 }, { "epoch": 0.53, "learning_rate": 0.0002200321879209529, "loss": 0.0153, "step": 105670 }, { "epoch": 0.53, "learning_rate": 0.0002200246202279389, "loss": 0.0165, "step": 105680 }, { "epoch": 0.53, "learning_rate": 0.00022001705253492487, "loss": 0.0164, "step": 105690 }, { "epoch": 0.53, "learning_rate": 0.00022000948484191088, "loss": 0.0159, "step": 105700 }, { "epoch": 0.53, "learning_rate": 0.00022000191714889686, "loss": 0.0166, "step": 105710 }, { "epoch": 0.53, "learning_rate": 0.00021999434945588285, "loss": 0.0141, "step": 105720 }, { "epoch": 0.53, "learning_rate": 0.00021998678176286885, "loss": 0.0182, "step": 105730 }, { "epoch": 0.53, "learning_rate": 0.00021997921406985484, "loss": 0.0159, "step": 105740 }, { "epoch": 0.53, "learning_rate": 0.00021997164637684082, "loss": 0.0157, "step": 105750 }, { "epoch": 0.53, "learning_rate": 0.00021996407868382683, "loss": 0.0137, "step": 105760 }, { "epoch": 0.53, "learning_rate": 0.0002199565109908128, "loss": 0.0157, "step": 105770 }, { "epoch": 0.53, "learning_rate": 0.0002199489432977988, "loss": 0.0184, "step": 105780 }, { "epoch": 0.53, "learning_rate": 0.0002199413756047848, "loss": 0.015, "step": 105790 }, { "epoch": 0.53, "learning_rate": 0.00021993380791177078, "loss": 0.0133, "step": 105800 }, { "epoch": 0.53, "learning_rate": 0.00021992624021875676, "loss": 0.021, "step": 105810 }, { "epoch": 0.53, "learning_rate": 0.00021991867252574277, "loss": 0.0119, "step": 105820 }, { "epoch": 0.53, "learning_rate": 0.00021991110483272875, "loss": 0.013, "step": 105830 }, { "epoch": 0.53, "learning_rate": 0.00021990353713971473, "loss": 0.0163, "step": 105840 }, { "epoch": 0.53, "learning_rate": 0.0002198959694467007, "loss": 0.0225, "step": 105850 }, { "epoch": 0.53, "learning_rate": 0.00021988840175368672, "loss": 0.0149, "step": 105860 }, { "epoch": 0.53, "learning_rate": 0.0002198808340606727, "loss": 0.0129, "step": 105870 }, { "epoch": 0.53, "learning_rate": 0.00021987326636765868, "loss": 0.0191, "step": 105880 }, { "epoch": 0.53, "learning_rate": 0.0002198656986746447, "loss": 0.0123, "step": 105890 }, { "epoch": 0.53, "learning_rate": 0.00021985813098163067, "loss": 0.0126, "step": 105900 }, { "epoch": 0.53, "learning_rate": 0.00021985056328861666, "loss": 0.0144, "step": 105910 }, { "epoch": 0.53, "learning_rate": 0.00021984299559560266, "loss": 0.0123, "step": 105920 }, { "epoch": 0.53, "learning_rate": 0.00021983542790258865, "loss": 0.0156, "step": 105930 }, { "epoch": 0.53, "learning_rate": 0.00021982786020957463, "loss": 0.0114, "step": 105940 }, { "epoch": 0.53, "learning_rate": 0.00021982029251656064, "loss": 0.015, "step": 105950 }, { "epoch": 0.53, "learning_rate": 0.00021981272482354662, "loss": 0.0171, "step": 105960 }, { "epoch": 0.53, "learning_rate": 0.0002198051571305326, "loss": 0.0175, "step": 105970 }, { "epoch": 0.53, "learning_rate": 0.0002197975894375186, "loss": 0.0168, "step": 105980 }, { "epoch": 0.53, "learning_rate": 0.0002197900217445046, "loss": 0.0145, "step": 105990 }, { "epoch": 0.53, "learning_rate": 0.00021978245405149057, "loss": 0.02, "step": 106000 }, { "epoch": 0.53, "eval_cer": 0.9144886934295449, "eval_loss": 0.01085778046399355, "eval_runtime": 116.7271, "eval_samples_per_second": 17.134, "eval_steps_per_second": 4.283, "step": 106000 }, { "epoch": 0.53, "learning_rate": 0.00021977488635847658, "loss": 0.0155, "step": 106010 }, { "epoch": 0.53, "learning_rate": 0.00021976731866546256, "loss": 0.0119, "step": 106020 }, { "epoch": 0.53, "learning_rate": 0.00021975975097244854, "loss": 0.0178, "step": 106030 }, { "epoch": 0.53, "learning_rate": 0.00021975218327943452, "loss": 0.0181, "step": 106040 }, { "epoch": 0.54, "learning_rate": 0.00021974461558642053, "loss": 0.0155, "step": 106050 }, { "epoch": 0.54, "learning_rate": 0.0002197370478934065, "loss": 0.0122, "step": 106060 }, { "epoch": 0.54, "learning_rate": 0.0002197294802003925, "loss": 0.0148, "step": 106070 }, { "epoch": 0.54, "learning_rate": 0.0002197219125073785, "loss": 0.0172, "step": 106080 }, { "epoch": 0.54, "learning_rate": 0.00021971434481436448, "loss": 0.0152, "step": 106090 }, { "epoch": 0.54, "learning_rate": 0.00021970677712135047, "loss": 0.016, "step": 106100 }, { "epoch": 0.54, "learning_rate": 0.00021969920942833647, "loss": 0.0164, "step": 106110 }, { "epoch": 0.54, "learning_rate": 0.00021969164173532246, "loss": 0.0144, "step": 106120 }, { "epoch": 0.54, "learning_rate": 0.00021968407404230844, "loss": 0.0153, "step": 106130 }, { "epoch": 0.54, "learning_rate": 0.00021967650634929445, "loss": 0.0152, "step": 106140 }, { "epoch": 0.54, "learning_rate": 0.00021966893865628043, "loss": 0.0141, "step": 106150 }, { "epoch": 0.54, "learning_rate": 0.0002196613709632664, "loss": 0.0137, "step": 106160 }, { "epoch": 0.54, "learning_rate": 0.00021965380327025242, "loss": 0.0168, "step": 106170 }, { "epoch": 0.54, "learning_rate": 0.0002196462355772384, "loss": 0.0173, "step": 106180 }, { "epoch": 0.54, "learning_rate": 0.00021963866788422438, "loss": 0.0178, "step": 106190 }, { "epoch": 0.54, "learning_rate": 0.00021963110019121036, "loss": 0.0139, "step": 106200 }, { "epoch": 0.54, "learning_rate": 0.00021962353249819634, "loss": 0.0164, "step": 106210 }, { "epoch": 0.54, "learning_rate": 0.00021961596480518232, "loss": 0.0166, "step": 106220 }, { "epoch": 0.54, "learning_rate": 0.0002196083971121683, "loss": 0.0137, "step": 106230 }, { "epoch": 0.54, "learning_rate": 0.0002196008294191543, "loss": 0.0137, "step": 106240 }, { "epoch": 0.54, "learning_rate": 0.0002195932617261403, "loss": 0.0126, "step": 106250 }, { "epoch": 0.54, "learning_rate": 0.00021958569403312628, "loss": 0.019, "step": 106260 }, { "epoch": 0.54, "learning_rate": 0.00021957812634011226, "loss": 0.012, "step": 106270 }, { "epoch": 0.54, "learning_rate": 0.00021957055864709827, "loss": 0.0136, "step": 106280 }, { "epoch": 0.54, "learning_rate": 0.00021956299095408425, "loss": 0.0131, "step": 106290 }, { "epoch": 0.54, "learning_rate": 0.00021955542326107023, "loss": 0.0152, "step": 106300 }, { "epoch": 0.54, "learning_rate": 0.00021954785556805624, "loss": 0.0129, "step": 106310 }, { "epoch": 0.54, "learning_rate": 0.00021954028787504222, "loss": 0.012, "step": 106320 }, { "epoch": 0.54, "learning_rate": 0.0002195327201820282, "loss": 0.0136, "step": 106330 }, { "epoch": 0.54, "learning_rate": 0.0002195251524890142, "loss": 0.0148, "step": 106340 }, { "epoch": 0.54, "learning_rate": 0.0002195175847960002, "loss": 0.013, "step": 106350 }, { "epoch": 0.54, "learning_rate": 0.00021951001710298617, "loss": 0.015, "step": 106360 }, { "epoch": 0.54, "learning_rate": 0.00021950244940997218, "loss": 0.0159, "step": 106370 }, { "epoch": 0.54, "learning_rate": 0.00021949488171695816, "loss": 0.0124, "step": 106380 }, { "epoch": 0.54, "learning_rate": 0.00021948731402394414, "loss": 0.0131, "step": 106390 }, { "epoch": 0.54, "learning_rate": 0.00021947974633093015, "loss": 0.0172, "step": 106400 }, { "epoch": 0.54, "learning_rate": 0.00021947217863791613, "loss": 0.0129, "step": 106410 }, { "epoch": 0.54, "learning_rate": 0.00021946461094490212, "loss": 0.0194, "step": 106420 }, { "epoch": 0.54, "learning_rate": 0.0002194570432518881, "loss": 0.0149, "step": 106430 }, { "epoch": 0.54, "learning_rate": 0.0002194494755588741, "loss": 0.0191, "step": 106440 }, { "epoch": 0.54, "learning_rate": 0.0002194419078658601, "loss": 0.0136, "step": 106450 }, { "epoch": 0.54, "learning_rate": 0.00021943434017284607, "loss": 0.0142, "step": 106460 }, { "epoch": 0.54, "learning_rate": 0.00021942677247983208, "loss": 0.0128, "step": 106470 }, { "epoch": 0.54, "learning_rate": 0.00021941920478681806, "loss": 0.0176, "step": 106480 }, { "epoch": 0.54, "learning_rate": 0.00021941163709380404, "loss": 0.0141, "step": 106490 }, { "epoch": 0.54, "learning_rate": 0.00021940406940079005, "loss": 0.0146, "step": 106500 }, { "epoch": 0.54, "learning_rate": 0.00021939650170777603, "loss": 0.0145, "step": 106510 }, { "epoch": 0.54, "learning_rate": 0.000219388934014762, "loss": 0.0151, "step": 106520 }, { "epoch": 0.54, "learning_rate": 0.00021938136632174802, "loss": 0.0161, "step": 106530 }, { "epoch": 0.54, "learning_rate": 0.000219373798628734, "loss": 0.0169, "step": 106540 }, { "epoch": 0.54, "learning_rate": 0.00021936623093571998, "loss": 0.0133, "step": 106550 }, { "epoch": 0.54, "learning_rate": 0.000219358663242706, "loss": 0.0263, "step": 106560 }, { "epoch": 0.54, "learning_rate": 0.00021935109554969197, "loss": 0.0191, "step": 106570 }, { "epoch": 0.54, "learning_rate": 0.00021934352785667795, "loss": 0.0143, "step": 106580 }, { "epoch": 0.54, "learning_rate": 0.00021933596016366394, "loss": 0.0169, "step": 106590 }, { "epoch": 0.54, "learning_rate": 0.00021932839247064994, "loss": 0.0171, "step": 106600 }, { "epoch": 0.54, "learning_rate": 0.00021932082477763593, "loss": 0.0148, "step": 106610 }, { "epoch": 0.54, "learning_rate": 0.0002193132570846219, "loss": 0.015, "step": 106620 }, { "epoch": 0.54, "learning_rate": 0.00021930568939160792, "loss": 0.0174, "step": 106630 }, { "epoch": 0.54, "learning_rate": 0.0002192981216985939, "loss": 0.012, "step": 106640 }, { "epoch": 0.54, "learning_rate": 0.00021929055400557988, "loss": 0.0155, "step": 106650 }, { "epoch": 0.54, "learning_rate": 0.0002192829863125659, "loss": 0.0144, "step": 106660 }, { "epoch": 0.54, "learning_rate": 0.00021927541861955187, "loss": 0.0144, "step": 106670 }, { "epoch": 0.54, "learning_rate": 0.00021926785092653785, "loss": 0.0147, "step": 106680 }, { "epoch": 0.54, "learning_rate": 0.00021926028323352386, "loss": 0.0172, "step": 106690 }, { "epoch": 0.54, "learning_rate": 0.00021925271554050984, "loss": 0.0147, "step": 106700 }, { "epoch": 0.54, "learning_rate": 0.00021924514784749582, "loss": 0.0142, "step": 106710 }, { "epoch": 0.54, "learning_rate": 0.00021923758015448183, "loss": 0.0154, "step": 106720 }, { "epoch": 0.54, "learning_rate": 0.0002192300124614678, "loss": 0.0151, "step": 106730 }, { "epoch": 0.54, "learning_rate": 0.0002192224447684538, "loss": 0.016, "step": 106740 }, { "epoch": 0.54, "learning_rate": 0.00021921487707543977, "loss": 0.0135, "step": 106750 }, { "epoch": 0.54, "learning_rate": 0.00021920730938242578, "loss": 0.0155, "step": 106760 }, { "epoch": 0.54, "learning_rate": 0.00021919974168941176, "loss": 0.0147, "step": 106770 }, { "epoch": 0.54, "learning_rate": 0.00021919217399639775, "loss": 0.0216, "step": 106780 }, { "epoch": 0.54, "learning_rate": 0.00021918460630338375, "loss": 0.0156, "step": 106790 }, { "epoch": 0.54, "learning_rate": 0.00021917703861036974, "loss": 0.013, "step": 106800 }, { "epoch": 0.54, "learning_rate": 0.00021916947091735572, "loss": 0.0147, "step": 106810 }, { "epoch": 0.54, "learning_rate": 0.00021916190322434173, "loss": 0.0186, "step": 106820 }, { "epoch": 0.54, "learning_rate": 0.0002191543355313277, "loss": 0.0157, "step": 106830 }, { "epoch": 0.54, "learning_rate": 0.0002191467678383137, "loss": 0.0157, "step": 106840 }, { "epoch": 0.54, "learning_rate": 0.0002191392001452997, "loss": 0.0161, "step": 106850 }, { "epoch": 0.54, "learning_rate": 0.00021913163245228568, "loss": 0.0137, "step": 106860 }, { "epoch": 0.54, "learning_rate": 0.00021912406475927166, "loss": 0.0169, "step": 106870 }, { "epoch": 0.54, "learning_rate": 0.00021911649706625767, "loss": 0.0149, "step": 106880 }, { "epoch": 0.54, "learning_rate": 0.00021910892937324365, "loss": 0.019, "step": 106890 }, { "epoch": 0.54, "learning_rate": 0.00021910136168022963, "loss": 0.0167, "step": 106900 }, { "epoch": 0.54, "learning_rate": 0.00021909379398721564, "loss": 0.0152, "step": 106910 }, { "epoch": 0.54, "learning_rate": 0.00021908622629420162, "loss": 0.0167, "step": 106920 }, { "epoch": 0.54, "learning_rate": 0.0002190786586011876, "loss": 0.0173, "step": 106930 }, { "epoch": 0.54, "learning_rate": 0.00021907109090817358, "loss": 0.011, "step": 106940 }, { "epoch": 0.54, "learning_rate": 0.0002190635232151596, "loss": 0.0153, "step": 106950 }, { "epoch": 0.54, "learning_rate": 0.00021905595552214557, "loss": 0.0154, "step": 106960 }, { "epoch": 0.54, "learning_rate": 0.00021904838782913156, "loss": 0.0152, "step": 106970 }, { "epoch": 0.54, "learning_rate": 0.00021904082013611756, "loss": 0.0168, "step": 106980 }, { "epoch": 0.54, "learning_rate": 0.00021903325244310355, "loss": 0.0132, "step": 106990 }, { "epoch": 0.54, "learning_rate": 0.00021902568475008953, "loss": 0.0152, "step": 107000 }, { "epoch": 0.54, "eval_cer": 0.9144886934295449, "eval_loss": 0.010931231081485748, "eval_runtime": 116.6714, "eval_samples_per_second": 17.142, "eval_steps_per_second": 4.286, "step": 107000 }, { "epoch": 0.54, "learning_rate": 0.00021901811705707554, "loss": 0.0139, "step": 107010 }, { "epoch": 0.54, "learning_rate": 0.00021901054936406152, "loss": 0.0144, "step": 107020 }, { "epoch": 0.54, "learning_rate": 0.0002190029816710475, "loss": 0.0108, "step": 107030 }, { "epoch": 0.54, "learning_rate": 0.0002189954139780335, "loss": 0.0194, "step": 107040 }, { "epoch": 0.54, "learning_rate": 0.0002189878462850195, "loss": 0.0142, "step": 107050 }, { "epoch": 0.54, "learning_rate": 0.00021898027859200547, "loss": 0.0164, "step": 107060 }, { "epoch": 0.54, "learning_rate": 0.00021897271089899148, "loss": 0.0135, "step": 107070 }, { "epoch": 0.54, "learning_rate": 0.00021896514320597746, "loss": 0.016, "step": 107080 }, { "epoch": 0.54, "learning_rate": 0.00021895757551296344, "loss": 0.0143, "step": 107090 }, { "epoch": 0.54, "learning_rate": 0.00021895000781994942, "loss": 0.0282, "step": 107100 }, { "epoch": 0.54, "learning_rate": 0.00021894244012693543, "loss": 0.0153, "step": 107110 }, { "epoch": 0.54, "learning_rate": 0.0002189348724339214, "loss": 0.0144, "step": 107120 }, { "epoch": 0.54, "learning_rate": 0.0002189273047409074, "loss": 0.0135, "step": 107130 }, { "epoch": 0.54, "learning_rate": 0.0002189197370478934, "loss": 0.0165, "step": 107140 }, { "epoch": 0.54, "learning_rate": 0.00021891216935487938, "loss": 0.0173, "step": 107150 }, { "epoch": 0.54, "learning_rate": 0.00021890460166186537, "loss": 0.0209, "step": 107160 }, { "epoch": 0.54, "learning_rate": 0.00021889703396885137, "loss": 0.0149, "step": 107170 }, { "epoch": 0.54, "learning_rate": 0.00021888946627583736, "loss": 0.0118, "step": 107180 }, { "epoch": 0.54, "learning_rate": 0.00021888189858282334, "loss": 0.017, "step": 107190 }, { "epoch": 0.54, "learning_rate": 0.00021887433088980935, "loss": 0.0166, "step": 107200 }, { "epoch": 0.54, "learning_rate": 0.00021886676319679533, "loss": 0.0153, "step": 107210 }, { "epoch": 0.54, "learning_rate": 0.0002188591955037813, "loss": 0.0159, "step": 107220 }, { "epoch": 0.54, "learning_rate": 0.00021885162781076732, "loss": 0.0161, "step": 107230 }, { "epoch": 0.54, "learning_rate": 0.0002188440601177533, "loss": 0.0136, "step": 107240 }, { "epoch": 0.54, "learning_rate": 0.00021883649242473928, "loss": 0.0146, "step": 107250 }, { "epoch": 0.54, "learning_rate": 0.00021882892473172526, "loss": 0.0155, "step": 107260 }, { "epoch": 0.54, "learning_rate": 0.00021882135703871127, "loss": 0.013, "step": 107270 }, { "epoch": 0.54, "learning_rate": 0.00021881378934569725, "loss": 0.0149, "step": 107280 }, { "epoch": 0.54, "learning_rate": 0.00021880622165268323, "loss": 0.0144, "step": 107290 }, { "epoch": 0.54, "learning_rate": 0.00021879865395966924, "loss": 0.0143, "step": 107300 }, { "epoch": 0.54, "learning_rate": 0.00021879108626665522, "loss": 0.0117, "step": 107310 }, { "epoch": 0.54, "learning_rate": 0.0002187835185736412, "loss": 0.0171, "step": 107320 }, { "epoch": 0.54, "learning_rate": 0.0002187759508806272, "loss": 0.0158, "step": 107330 }, { "epoch": 0.54, "learning_rate": 0.0002187683831876132, "loss": 0.0203, "step": 107340 }, { "epoch": 0.54, "learning_rate": 0.00021876081549459918, "loss": 0.014, "step": 107350 }, { "epoch": 0.54, "learning_rate": 0.00021875324780158518, "loss": 0.0154, "step": 107360 }, { "epoch": 0.54, "learning_rate": 0.00021874568010857117, "loss": 0.0205, "step": 107370 }, { "epoch": 0.54, "learning_rate": 0.00021873811241555715, "loss": 0.0145, "step": 107380 }, { "epoch": 0.54, "learning_rate": 0.00021873054472254316, "loss": 0.0134, "step": 107390 }, { "epoch": 0.54, "learning_rate": 0.00021872297702952914, "loss": 0.0152, "step": 107400 }, { "epoch": 0.54, "learning_rate": 0.00021871540933651512, "loss": 0.0144, "step": 107410 }, { "epoch": 0.54, "learning_rate": 0.00021870784164350113, "loss": 0.0147, "step": 107420 }, { "epoch": 0.54, "learning_rate": 0.0002187002739504871, "loss": 0.0152, "step": 107430 }, { "epoch": 0.54, "learning_rate": 0.0002186927062574731, "loss": 0.0188, "step": 107440 }, { "epoch": 0.54, "learning_rate": 0.00021868513856445907, "loss": 0.0185, "step": 107450 }, { "epoch": 0.54, "learning_rate": 0.00021867757087144508, "loss": 0.0164, "step": 107460 }, { "epoch": 0.54, "learning_rate": 0.00021867000317843103, "loss": 0.0124, "step": 107470 }, { "epoch": 0.54, "learning_rate": 0.00021866243548541702, "loss": 0.0153, "step": 107480 }, { "epoch": 0.54, "learning_rate": 0.000218654867792403, "loss": 0.0181, "step": 107490 }, { "epoch": 0.54, "learning_rate": 0.000218647300099389, "loss": 0.016, "step": 107500 }, { "epoch": 0.54, "learning_rate": 0.000218639732406375, "loss": 0.0168, "step": 107510 }, { "epoch": 0.54, "learning_rate": 0.00021863216471336097, "loss": 0.0162, "step": 107520 }, { "epoch": 0.54, "learning_rate": 0.00021862459702034698, "loss": 0.0138, "step": 107530 }, { "epoch": 0.54, "learning_rate": 0.00021861702932733296, "loss": 0.0174, "step": 107540 }, { "epoch": 0.54, "learning_rate": 0.00021860946163431894, "loss": 0.0166, "step": 107550 }, { "epoch": 0.54, "learning_rate": 0.00021860189394130495, "loss": 0.0149, "step": 107560 }, { "epoch": 0.54, "learning_rate": 0.00021859432624829093, "loss": 0.0163, "step": 107570 }, { "epoch": 0.54, "learning_rate": 0.0002185867585552769, "loss": 0.0165, "step": 107580 }, { "epoch": 0.54, "learning_rate": 0.00021857919086226292, "loss": 0.0174, "step": 107590 }, { "epoch": 0.54, "learning_rate": 0.0002185716231692489, "loss": 0.0131, "step": 107600 }, { "epoch": 0.54, "learning_rate": 0.00021856405547623488, "loss": 0.0154, "step": 107610 }, { "epoch": 0.54, "learning_rate": 0.0002185564877832209, "loss": 0.0119, "step": 107620 }, { "epoch": 0.54, "learning_rate": 0.00021854892009020687, "loss": 0.0144, "step": 107630 }, { "epoch": 0.54, "learning_rate": 0.00021854135239719285, "loss": 0.0144, "step": 107640 }, { "epoch": 0.54, "learning_rate": 0.00021853378470417884, "loss": 0.0173, "step": 107650 }, { "epoch": 0.54, "learning_rate": 0.00021852621701116484, "loss": 0.0188, "step": 107660 }, { "epoch": 0.54, "learning_rate": 0.00021851864931815083, "loss": 0.0186, "step": 107670 }, { "epoch": 0.54, "learning_rate": 0.0002185110816251368, "loss": 0.0114, "step": 107680 }, { "epoch": 0.54, "learning_rate": 0.00021850351393212282, "loss": 0.0166, "step": 107690 }, { "epoch": 0.54, "learning_rate": 0.0002184959462391088, "loss": 0.0158, "step": 107700 }, { "epoch": 0.54, "learning_rate": 0.00021848837854609478, "loss": 0.0154, "step": 107710 }, { "epoch": 0.54, "learning_rate": 0.0002184808108530808, "loss": 0.0178, "step": 107720 }, { "epoch": 0.54, "learning_rate": 0.00021847324316006677, "loss": 0.016, "step": 107730 }, { "epoch": 0.54, "learning_rate": 0.00021846567546705275, "loss": 0.0134, "step": 107740 }, { "epoch": 0.54, "learning_rate": 0.00021845810777403876, "loss": 0.0142, "step": 107750 }, { "epoch": 0.54, "learning_rate": 0.00021845054008102474, "loss": 0.0135, "step": 107760 }, { "epoch": 0.54, "learning_rate": 0.00021844297238801072, "loss": 0.0173, "step": 107770 }, { "epoch": 0.54, "learning_rate": 0.00021843540469499673, "loss": 0.0131, "step": 107780 }, { "epoch": 0.54, "learning_rate": 0.0002184278370019827, "loss": 0.0145, "step": 107790 }, { "epoch": 0.54, "learning_rate": 0.0002184202693089687, "loss": 0.0142, "step": 107800 }, { "epoch": 0.54, "learning_rate": 0.0002184127016159547, "loss": 0.0166, "step": 107810 }, { "epoch": 0.54, "learning_rate": 0.00021840513392294068, "loss": 0.0137, "step": 107820 }, { "epoch": 0.54, "learning_rate": 0.00021839756622992666, "loss": 0.0165, "step": 107830 }, { "epoch": 0.54, "learning_rate": 0.00021838999853691265, "loss": 0.0128, "step": 107840 }, { "epoch": 0.54, "learning_rate": 0.00021838243084389865, "loss": 0.0143, "step": 107850 }, { "epoch": 0.54, "learning_rate": 0.00021837486315088464, "loss": 0.0123, "step": 107860 }, { "epoch": 0.54, "learning_rate": 0.00021836729545787062, "loss": 0.0162, "step": 107870 }, { "epoch": 0.54, "learning_rate": 0.00021835972776485663, "loss": 0.0173, "step": 107880 }, { "epoch": 0.54, "learning_rate": 0.0002183521600718426, "loss": 0.0154, "step": 107890 }, { "epoch": 0.54, "learning_rate": 0.0002183445923788286, "loss": 0.0174, "step": 107900 }, { "epoch": 0.54, "learning_rate": 0.0002183370246858146, "loss": 0.0143, "step": 107910 }, { "epoch": 0.54, "learning_rate": 0.00021832945699280058, "loss": 0.0183, "step": 107920 }, { "epoch": 0.54, "learning_rate": 0.00021832188929978656, "loss": 0.0166, "step": 107930 }, { "epoch": 0.54, "learning_rate": 0.00021831432160677257, "loss": 0.0179, "step": 107940 }, { "epoch": 0.54, "learning_rate": 0.00021830675391375855, "loss": 0.0156, "step": 107950 }, { "epoch": 0.54, "learning_rate": 0.00021829918622074453, "loss": 0.0146, "step": 107960 }, { "epoch": 0.54, "learning_rate": 0.00021829161852773054, "loss": 0.0139, "step": 107970 }, { "epoch": 0.54, "learning_rate": 0.00021828405083471652, "loss": 0.0175, "step": 107980 }, { "epoch": 0.54, "learning_rate": 0.0002182764831417025, "loss": 0.0176, "step": 107990 }, { "epoch": 0.54, "learning_rate": 0.00021826891544868848, "loss": 0.0146, "step": 108000 }, { "epoch": 0.54, "eval_cer": 0.9144886934295449, "eval_loss": 0.011288284324109554, "eval_runtime": 116.6804, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 108000 }, { "epoch": 0.54, "learning_rate": 0.0002182613477556745, "loss": 0.0146, "step": 108010 }, { "epoch": 0.54, "learning_rate": 0.00021825378006266047, "loss": 0.0141, "step": 108020 }, { "epoch": 0.55, "learning_rate": 0.00021824621236964646, "loss": 0.0117, "step": 108030 }, { "epoch": 0.55, "learning_rate": 0.00021823864467663246, "loss": 0.0141, "step": 108040 }, { "epoch": 0.55, "learning_rate": 0.00021823107698361845, "loss": 0.0155, "step": 108050 }, { "epoch": 0.55, "learning_rate": 0.00021822350929060443, "loss": 0.0161, "step": 108060 }, { "epoch": 0.55, "learning_rate": 0.00021821594159759044, "loss": 0.0161, "step": 108070 }, { "epoch": 0.55, "learning_rate": 0.00021820837390457642, "loss": 0.0119, "step": 108080 }, { "epoch": 0.55, "learning_rate": 0.0002182008062115624, "loss": 0.0153, "step": 108090 }, { "epoch": 0.55, "learning_rate": 0.0002181932385185484, "loss": 0.0184, "step": 108100 }, { "epoch": 0.55, "learning_rate": 0.0002181856708255344, "loss": 0.0135, "step": 108110 }, { "epoch": 0.55, "learning_rate": 0.00021817810313252037, "loss": 0.0131, "step": 108120 }, { "epoch": 0.55, "learning_rate": 0.00021817053543950638, "loss": 0.0136, "step": 108130 }, { "epoch": 0.55, "learning_rate": 0.00021816296774649236, "loss": 0.0147, "step": 108140 }, { "epoch": 0.55, "learning_rate": 0.00021815540005347834, "loss": 0.0152, "step": 108150 }, { "epoch": 0.55, "learning_rate": 0.00021814783236046432, "loss": 0.0159, "step": 108160 }, { "epoch": 0.55, "learning_rate": 0.00021814026466745033, "loss": 0.0132, "step": 108170 }, { "epoch": 0.55, "learning_rate": 0.0002181326969744363, "loss": 0.0161, "step": 108180 }, { "epoch": 0.55, "learning_rate": 0.0002181251292814223, "loss": 0.0189, "step": 108190 }, { "epoch": 0.55, "learning_rate": 0.0002181175615884083, "loss": 0.0147, "step": 108200 }, { "epoch": 0.55, "learning_rate": 0.00021810999389539428, "loss": 0.0148, "step": 108210 }, { "epoch": 0.55, "learning_rate": 0.00021810242620238027, "loss": 0.0171, "step": 108220 }, { "epoch": 0.55, "learning_rate": 0.00021809485850936627, "loss": 0.0148, "step": 108230 }, { "epoch": 0.55, "learning_rate": 0.00021808729081635226, "loss": 0.0146, "step": 108240 }, { "epoch": 0.55, "learning_rate": 0.00021807972312333824, "loss": 0.0192, "step": 108250 }, { "epoch": 0.55, "learning_rate": 0.00021807215543032425, "loss": 0.013, "step": 108260 }, { "epoch": 0.55, "learning_rate": 0.00021806458773731023, "loss": 0.0154, "step": 108270 }, { "epoch": 0.55, "learning_rate": 0.0002180570200442962, "loss": 0.016, "step": 108280 }, { "epoch": 0.55, "learning_rate": 0.00021804945235128222, "loss": 0.0175, "step": 108290 }, { "epoch": 0.55, "learning_rate": 0.0002180418846582682, "loss": 0.0148, "step": 108300 }, { "epoch": 0.55, "learning_rate": 0.00021803431696525418, "loss": 0.0147, "step": 108310 }, { "epoch": 0.55, "learning_rate": 0.0002180267492722402, "loss": 0.016, "step": 108320 }, { "epoch": 0.55, "learning_rate": 0.00021801918157922617, "loss": 0.0168, "step": 108330 }, { "epoch": 0.55, "learning_rate": 0.00021801161388621215, "loss": 0.0147, "step": 108340 }, { "epoch": 0.55, "learning_rate": 0.00021800404619319813, "loss": 0.0136, "step": 108350 }, { "epoch": 0.55, "learning_rate": 0.00021799647850018414, "loss": 0.0153, "step": 108360 }, { "epoch": 0.55, "learning_rate": 0.00021798891080717012, "loss": 0.0143, "step": 108370 }, { "epoch": 0.55, "learning_rate": 0.0002179813431141561, "loss": 0.0173, "step": 108380 }, { "epoch": 0.55, "learning_rate": 0.0002179737754211421, "loss": 0.0151, "step": 108390 }, { "epoch": 0.55, "learning_rate": 0.0002179662077281281, "loss": 0.0167, "step": 108400 }, { "epoch": 0.55, "learning_rate": 0.00021795864003511408, "loss": 0.0154, "step": 108410 }, { "epoch": 0.55, "learning_rate": 0.00021795107234210008, "loss": 0.0163, "step": 108420 }, { "epoch": 0.55, "learning_rate": 0.00021794350464908607, "loss": 0.0185, "step": 108430 }, { "epoch": 0.55, "learning_rate": 0.00021793593695607205, "loss": 0.0172, "step": 108440 }, { "epoch": 0.55, "learning_rate": 0.00021792836926305806, "loss": 0.0151, "step": 108450 }, { "epoch": 0.55, "learning_rate": 0.00021792080157004404, "loss": 0.016, "step": 108460 }, { "epoch": 0.55, "learning_rate": 0.00021791323387703002, "loss": 0.0127, "step": 108470 }, { "epoch": 0.55, "learning_rate": 0.00021790566618401603, "loss": 0.0163, "step": 108480 }, { "epoch": 0.55, "learning_rate": 0.000217898098491002, "loss": 0.0133, "step": 108490 }, { "epoch": 0.55, "learning_rate": 0.000217890530797988, "loss": 0.0174, "step": 108500 }, { "epoch": 0.55, "learning_rate": 0.00021788296310497397, "loss": 0.0156, "step": 108510 }, { "epoch": 0.55, "learning_rate": 0.00021787539541195998, "loss": 0.0122, "step": 108520 }, { "epoch": 0.55, "learning_rate": 0.00021786782771894596, "loss": 0.0138, "step": 108530 }, { "epoch": 0.55, "learning_rate": 0.00021786026002593194, "loss": 0.0144, "step": 108540 }, { "epoch": 0.55, "learning_rate": 0.00021785269233291795, "loss": 0.0116, "step": 108550 }, { "epoch": 0.55, "learning_rate": 0.00021784512463990393, "loss": 0.0165, "step": 108560 }, { "epoch": 0.55, "learning_rate": 0.00021783755694688991, "loss": 0.0151, "step": 108570 }, { "epoch": 0.55, "learning_rate": 0.00021782998925387592, "loss": 0.0148, "step": 108580 }, { "epoch": 0.55, "learning_rate": 0.0002178224215608619, "loss": 0.0196, "step": 108590 }, { "epoch": 0.55, "learning_rate": 0.00021781485386784789, "loss": 0.012, "step": 108600 }, { "epoch": 0.55, "learning_rate": 0.0002178072861748339, "loss": 0.0145, "step": 108610 }, { "epoch": 0.55, "learning_rate": 0.00021779971848181988, "loss": 0.0168, "step": 108620 }, { "epoch": 0.55, "learning_rate": 0.00021779215078880586, "loss": 0.0145, "step": 108630 }, { "epoch": 0.55, "learning_rate": 0.00021778458309579187, "loss": 0.014, "step": 108640 }, { "epoch": 0.55, "learning_rate": 0.00021777701540277785, "loss": 0.0138, "step": 108650 }, { "epoch": 0.55, "learning_rate": 0.00021776944770976383, "loss": 0.0156, "step": 108660 }, { "epoch": 0.55, "learning_rate": 0.0002177618800167498, "loss": 0.0135, "step": 108670 }, { "epoch": 0.55, "learning_rate": 0.00021775431232373582, "loss": 0.0162, "step": 108680 }, { "epoch": 0.55, "learning_rate": 0.0002177467446307218, "loss": 0.0203, "step": 108690 }, { "epoch": 0.55, "learning_rate": 0.00021773917693770778, "loss": 0.02, "step": 108700 }, { "epoch": 0.55, "learning_rate": 0.0002177316092446938, "loss": 0.0156, "step": 108710 }, { "epoch": 0.55, "learning_rate": 0.00021772404155167977, "loss": 0.0137, "step": 108720 }, { "epoch": 0.55, "learning_rate": 0.00021771647385866573, "loss": 0.015, "step": 108730 }, { "epoch": 0.55, "learning_rate": 0.0002177089061656517, "loss": 0.0159, "step": 108740 }, { "epoch": 0.55, "learning_rate": 0.00021770133847263772, "loss": 0.0164, "step": 108750 }, { "epoch": 0.55, "learning_rate": 0.0002176937707796237, "loss": 0.0166, "step": 108760 }, { "epoch": 0.55, "learning_rate": 0.00021768620308660968, "loss": 0.0131, "step": 108770 }, { "epoch": 0.55, "learning_rate": 0.0002176786353935957, "loss": 0.0144, "step": 108780 }, { "epoch": 0.55, "learning_rate": 0.00021767106770058167, "loss": 0.0163, "step": 108790 }, { "epoch": 0.55, "learning_rate": 0.00021766350000756765, "loss": 0.0138, "step": 108800 }, { "epoch": 0.55, "learning_rate": 0.00021765593231455366, "loss": 0.0149, "step": 108810 }, { "epoch": 0.55, "learning_rate": 0.00021764836462153964, "loss": 0.0181, "step": 108820 }, { "epoch": 0.55, "learning_rate": 0.00021764079692852562, "loss": 0.0157, "step": 108830 }, { "epoch": 0.55, "learning_rate": 0.00021763322923551163, "loss": 0.0157, "step": 108840 }, { "epoch": 0.55, "learning_rate": 0.0002176256615424976, "loss": 0.0162, "step": 108850 }, { "epoch": 0.55, "learning_rate": 0.0002176180938494836, "loss": 0.0153, "step": 108860 }, { "epoch": 0.55, "learning_rate": 0.0002176105261564696, "loss": 0.0141, "step": 108870 }, { "epoch": 0.55, "learning_rate": 0.00021760295846345558, "loss": 0.0152, "step": 108880 }, { "epoch": 0.55, "learning_rate": 0.00021759539077044156, "loss": 0.0146, "step": 108890 }, { "epoch": 0.55, "learning_rate": 0.00021758782307742755, "loss": 0.0162, "step": 108900 }, { "epoch": 0.55, "learning_rate": 0.00021758025538441355, "loss": 0.0141, "step": 108910 }, { "epoch": 0.55, "learning_rate": 0.00021757268769139954, "loss": 0.0153, "step": 108920 }, { "epoch": 0.55, "learning_rate": 0.00021756511999838552, "loss": 0.0144, "step": 108930 }, { "epoch": 0.55, "learning_rate": 0.00021755755230537153, "loss": 0.0137, "step": 108940 }, { "epoch": 0.55, "learning_rate": 0.0002175499846123575, "loss": 0.0129, "step": 108950 }, { "epoch": 0.55, "learning_rate": 0.0002175424169193435, "loss": 0.0133, "step": 108960 }, { "epoch": 0.55, "learning_rate": 0.0002175348492263295, "loss": 0.0119, "step": 108970 }, { "epoch": 0.55, "learning_rate": 0.00021752728153331548, "loss": 0.0169, "step": 108980 }, { "epoch": 0.55, "learning_rate": 0.00021751971384030146, "loss": 0.0128, "step": 108990 }, { "epoch": 0.55, "learning_rate": 0.00021751214614728747, "loss": 0.0128, "step": 109000 }, { "epoch": 0.55, "eval_cer": 0.9145003381830497, "eval_loss": 0.011132709681987762, "eval_runtime": 116.5842, "eval_samples_per_second": 17.155, "eval_steps_per_second": 4.289, "step": 109000 }, { "epoch": 0.55, "learning_rate": 0.00021750457845427345, "loss": 0.0133, "step": 109010 }, { "epoch": 0.55, "learning_rate": 0.00021749701076125943, "loss": 0.0148, "step": 109020 }, { "epoch": 0.55, "learning_rate": 0.00021748944306824544, "loss": 0.0132, "step": 109030 }, { "epoch": 0.55, "learning_rate": 0.00021748187537523142, "loss": 0.0138, "step": 109040 }, { "epoch": 0.55, "learning_rate": 0.0002174743076822174, "loss": 0.0147, "step": 109050 }, { "epoch": 0.55, "learning_rate": 0.00021746673998920338, "loss": 0.0134, "step": 109060 }, { "epoch": 0.55, "learning_rate": 0.0002174591722961894, "loss": 0.0126, "step": 109070 }, { "epoch": 0.55, "learning_rate": 0.00021745160460317537, "loss": 0.0146, "step": 109080 }, { "epoch": 0.55, "learning_rate": 0.00021744403691016136, "loss": 0.013, "step": 109090 }, { "epoch": 0.55, "learning_rate": 0.00021743646921714736, "loss": 0.0133, "step": 109100 }, { "epoch": 0.55, "learning_rate": 0.00021742890152413335, "loss": 0.0145, "step": 109110 }, { "epoch": 0.55, "learning_rate": 0.00021742133383111933, "loss": 0.0169, "step": 109120 }, { "epoch": 0.55, "learning_rate": 0.00021741376613810534, "loss": 0.0157, "step": 109130 }, { "epoch": 0.55, "learning_rate": 0.00021740619844509132, "loss": 0.0158, "step": 109140 }, { "epoch": 0.55, "learning_rate": 0.0002173986307520773, "loss": 0.017, "step": 109150 }, { "epoch": 0.55, "learning_rate": 0.0002173910630590633, "loss": 0.0136, "step": 109160 }, { "epoch": 0.55, "learning_rate": 0.0002173834953660493, "loss": 0.0227, "step": 109170 }, { "epoch": 0.55, "learning_rate": 0.00021737592767303527, "loss": 0.0156, "step": 109180 }, { "epoch": 0.55, "learning_rate": 0.00021736835998002128, "loss": 0.0136, "step": 109190 }, { "epoch": 0.55, "learning_rate": 0.00021736079228700726, "loss": 0.0174, "step": 109200 }, { "epoch": 0.55, "learning_rate": 0.00021735322459399324, "loss": 0.0162, "step": 109210 }, { "epoch": 0.55, "learning_rate": 0.00021734565690097925, "loss": 0.0196, "step": 109220 }, { "epoch": 0.55, "learning_rate": 0.00021733808920796523, "loss": 0.0146, "step": 109230 }, { "epoch": 0.55, "learning_rate": 0.0002173305215149512, "loss": 0.0141, "step": 109240 }, { "epoch": 0.55, "learning_rate": 0.0002173229538219372, "loss": 0.0138, "step": 109250 }, { "epoch": 0.55, "learning_rate": 0.0002173153861289232, "loss": 0.019, "step": 109260 }, { "epoch": 0.55, "learning_rate": 0.00021730781843590918, "loss": 0.0148, "step": 109270 }, { "epoch": 0.55, "learning_rate": 0.00021730025074289517, "loss": 0.0146, "step": 109280 }, { "epoch": 0.55, "learning_rate": 0.00021729268304988117, "loss": 0.0189, "step": 109290 }, { "epoch": 0.55, "learning_rate": 0.00021728511535686716, "loss": 0.0137, "step": 109300 }, { "epoch": 0.55, "learning_rate": 0.00021727754766385314, "loss": 0.0152, "step": 109310 }, { "epoch": 0.55, "learning_rate": 0.00021726997997083915, "loss": 0.0151, "step": 109320 }, { "epoch": 0.55, "learning_rate": 0.00021726241227782513, "loss": 0.0135, "step": 109330 }, { "epoch": 0.55, "learning_rate": 0.0002172548445848111, "loss": 0.0156, "step": 109340 }, { "epoch": 0.55, "learning_rate": 0.00021724727689179712, "loss": 0.0176, "step": 109350 }, { "epoch": 0.55, "learning_rate": 0.0002172397091987831, "loss": 0.0189, "step": 109360 }, { "epoch": 0.55, "learning_rate": 0.00021723214150576908, "loss": 0.0128, "step": 109370 }, { "epoch": 0.55, "learning_rate": 0.0002172245738127551, "loss": 0.0181, "step": 109380 }, { "epoch": 0.55, "learning_rate": 0.00021721700611974107, "loss": 0.017, "step": 109390 }, { "epoch": 0.55, "learning_rate": 0.00021720943842672705, "loss": 0.0163, "step": 109400 }, { "epoch": 0.55, "learning_rate": 0.00021720187073371303, "loss": 0.0133, "step": 109410 }, { "epoch": 0.55, "learning_rate": 0.00021719430304069904, "loss": 0.0169, "step": 109420 }, { "epoch": 0.55, "learning_rate": 0.00021718673534768502, "loss": 0.0212, "step": 109430 }, { "epoch": 0.55, "learning_rate": 0.000217179167654671, "loss": 0.0189, "step": 109440 }, { "epoch": 0.55, "learning_rate": 0.000217171599961657, "loss": 0.0172, "step": 109450 }, { "epoch": 0.55, "learning_rate": 0.000217164032268643, "loss": 0.0149, "step": 109460 }, { "epoch": 0.55, "learning_rate": 0.00021715646457562898, "loss": 0.0174, "step": 109470 }, { "epoch": 0.55, "learning_rate": 0.00021714889688261498, "loss": 0.0147, "step": 109480 }, { "epoch": 0.55, "learning_rate": 0.00021714132918960097, "loss": 0.0137, "step": 109490 }, { "epoch": 0.55, "learning_rate": 0.00021713376149658695, "loss": 0.0174, "step": 109500 }, { "epoch": 0.55, "learning_rate": 0.00021712619380357296, "loss": 0.0149, "step": 109510 }, { "epoch": 0.55, "learning_rate": 0.00021711862611055894, "loss": 0.0162, "step": 109520 }, { "epoch": 0.55, "learning_rate": 0.00021711105841754492, "loss": 0.0143, "step": 109530 }, { "epoch": 0.55, "learning_rate": 0.00021710349072453093, "loss": 0.0132, "step": 109540 }, { "epoch": 0.55, "learning_rate": 0.0002170959230315169, "loss": 0.0123, "step": 109550 }, { "epoch": 0.55, "learning_rate": 0.0002170883553385029, "loss": 0.0172, "step": 109560 }, { "epoch": 0.55, "learning_rate": 0.00021708078764548887, "loss": 0.0189, "step": 109570 }, { "epoch": 0.55, "learning_rate": 0.00021707321995247488, "loss": 0.0147, "step": 109580 }, { "epoch": 0.55, "learning_rate": 0.00021706565225946086, "loss": 0.0143, "step": 109590 }, { "epoch": 0.55, "learning_rate": 0.00021705808456644684, "loss": 0.0121, "step": 109600 }, { "epoch": 0.55, "learning_rate": 0.00021705051687343285, "loss": 0.015, "step": 109610 }, { "epoch": 0.55, "learning_rate": 0.00021704294918041883, "loss": 0.0157, "step": 109620 }, { "epoch": 0.55, "learning_rate": 0.00021703538148740481, "loss": 0.0152, "step": 109630 }, { "epoch": 0.55, "learning_rate": 0.00021702781379439082, "loss": 0.0142, "step": 109640 }, { "epoch": 0.55, "learning_rate": 0.0002170202461013768, "loss": 0.0134, "step": 109650 }, { "epoch": 0.55, "learning_rate": 0.00021701267840836279, "loss": 0.0163, "step": 109660 }, { "epoch": 0.55, "learning_rate": 0.0002170051107153488, "loss": 0.0142, "step": 109670 }, { "epoch": 0.55, "learning_rate": 0.00021699754302233478, "loss": 0.012, "step": 109680 }, { "epoch": 0.55, "learning_rate": 0.00021698997532932076, "loss": 0.0158, "step": 109690 }, { "epoch": 0.55, "learning_rate": 0.00021698240763630677, "loss": 0.0142, "step": 109700 }, { "epoch": 0.55, "learning_rate": 0.00021697483994329275, "loss": 0.0159, "step": 109710 }, { "epoch": 0.55, "learning_rate": 0.00021696727225027873, "loss": 0.0153, "step": 109720 }, { "epoch": 0.55, "learning_rate": 0.0002169597045572647, "loss": 0.0123, "step": 109730 }, { "epoch": 0.55, "learning_rate": 0.00021695213686425072, "loss": 0.0161, "step": 109740 }, { "epoch": 0.55, "learning_rate": 0.0002169445691712367, "loss": 0.0119, "step": 109750 }, { "epoch": 0.55, "learning_rate": 0.00021693700147822268, "loss": 0.0182, "step": 109760 }, { "epoch": 0.55, "learning_rate": 0.0002169294337852087, "loss": 0.019, "step": 109770 }, { "epoch": 0.55, "learning_rate": 0.00021692186609219467, "loss": 0.0133, "step": 109780 }, { "epoch": 0.55, "learning_rate": 0.00021691429839918065, "loss": 0.0151, "step": 109790 }, { "epoch": 0.55, "learning_rate": 0.00021690673070616666, "loss": 0.0133, "step": 109800 }, { "epoch": 0.55, "learning_rate": 0.00021689916301315264, "loss": 0.0112, "step": 109810 }, { "epoch": 0.55, "learning_rate": 0.00021689159532013862, "loss": 0.0145, "step": 109820 }, { "epoch": 0.55, "learning_rate": 0.00021688402762712463, "loss": 0.0114, "step": 109830 }, { "epoch": 0.55, "learning_rate": 0.00021687645993411061, "loss": 0.0134, "step": 109840 }, { "epoch": 0.55, "learning_rate": 0.0002168688922410966, "loss": 0.0146, "step": 109850 }, { "epoch": 0.55, "learning_rate": 0.0002168613245480826, "loss": 0.0147, "step": 109860 }, { "epoch": 0.55, "learning_rate": 0.00021685375685506859, "loss": 0.0115, "step": 109870 }, { "epoch": 0.55, "learning_rate": 0.00021684618916205457, "loss": 0.0162, "step": 109880 }, { "epoch": 0.55, "learning_rate": 0.00021683862146904058, "loss": 0.0133, "step": 109890 }, { "epoch": 0.55, "learning_rate": 0.00021683105377602656, "loss": 0.0174, "step": 109900 }, { "epoch": 0.55, "learning_rate": 0.00021682348608301254, "loss": 0.0163, "step": 109910 }, { "epoch": 0.55, "learning_rate": 0.00021681591838999852, "loss": 0.018, "step": 109920 }, { "epoch": 0.55, "learning_rate": 0.00021680835069698453, "loss": 0.0169, "step": 109930 }, { "epoch": 0.55, "learning_rate": 0.0002168007830039705, "loss": 0.0144, "step": 109940 }, { "epoch": 0.55, "learning_rate": 0.0002167932153109565, "loss": 0.0142, "step": 109950 }, { "epoch": 0.55, "learning_rate": 0.0002167856476179425, "loss": 0.0112, "step": 109960 }, { "epoch": 0.55, "learning_rate": 0.00021677807992492848, "loss": 0.0167, "step": 109970 }, { "epoch": 0.55, "learning_rate": 0.00021677051223191444, "loss": 0.0149, "step": 109980 }, { "epoch": 0.55, "learning_rate": 0.00021676294453890042, "loss": 0.0146, "step": 109990 }, { "epoch": 0.55, "learning_rate": 0.00021675537684588643, "loss": 0.0159, "step": 110000 }, { "epoch": 0.55, "eval_cer": 0.9144751078837893, "eval_loss": 0.010691503062844276, "eval_runtime": 116.7007, "eval_samples_per_second": 17.138, "eval_steps_per_second": 4.284, "step": 110000 }, { "epoch": 0.56, "learning_rate": 0.0002167478091528724, "loss": 0.015, "step": 110010 }, { "epoch": 0.56, "learning_rate": 0.0002167402414598584, "loss": 0.0209, "step": 110020 }, { "epoch": 0.56, "learning_rate": 0.0002167326737668444, "loss": 0.0157, "step": 110030 }, { "epoch": 0.56, "learning_rate": 0.00021672510607383038, "loss": 0.0184, "step": 110040 }, { "epoch": 0.56, "learning_rate": 0.00021671753838081636, "loss": 0.0169, "step": 110050 }, { "epoch": 0.56, "learning_rate": 0.00021670997068780237, "loss": 0.0206, "step": 110060 }, { "epoch": 0.56, "learning_rate": 0.00021670240299478835, "loss": 0.0151, "step": 110070 }, { "epoch": 0.56, "learning_rate": 0.00021669483530177433, "loss": 0.0166, "step": 110080 }, { "epoch": 0.56, "learning_rate": 0.00021668726760876034, "loss": 0.0171, "step": 110090 }, { "epoch": 0.56, "learning_rate": 0.00021667969991574632, "loss": 0.0128, "step": 110100 }, { "epoch": 0.56, "learning_rate": 0.0002166721322227323, "loss": 0.0141, "step": 110110 }, { "epoch": 0.56, "learning_rate": 0.00021666456452971829, "loss": 0.0174, "step": 110120 }, { "epoch": 0.56, "learning_rate": 0.0002166569968367043, "loss": 0.0129, "step": 110130 }, { "epoch": 0.56, "learning_rate": 0.00021664942914369028, "loss": 0.0202, "step": 110140 }, { "epoch": 0.56, "learning_rate": 0.00021664186145067626, "loss": 0.0145, "step": 110150 }, { "epoch": 0.56, "learning_rate": 0.00021663429375766227, "loss": 0.0186, "step": 110160 }, { "epoch": 0.56, "learning_rate": 0.00021662672606464825, "loss": 0.0183, "step": 110170 }, { "epoch": 0.56, "learning_rate": 0.00021661915837163423, "loss": 0.0143, "step": 110180 }, { "epoch": 0.56, "learning_rate": 0.00021661159067862024, "loss": 0.0127, "step": 110190 }, { "epoch": 0.56, "learning_rate": 0.00021660402298560622, "loss": 0.0195, "step": 110200 }, { "epoch": 0.56, "learning_rate": 0.0002165964552925922, "loss": 0.0149, "step": 110210 }, { "epoch": 0.56, "learning_rate": 0.0002165888875995782, "loss": 0.0144, "step": 110220 }, { "epoch": 0.56, "learning_rate": 0.0002165813199065642, "loss": 0.0134, "step": 110230 }, { "epoch": 0.56, "learning_rate": 0.00021657375221355017, "loss": 0.0139, "step": 110240 }, { "epoch": 0.56, "learning_rate": 0.00021656618452053618, "loss": 0.0156, "step": 110250 }, { "epoch": 0.56, "learning_rate": 0.00021655861682752216, "loss": 0.0141, "step": 110260 }, { "epoch": 0.56, "learning_rate": 0.00021655104913450814, "loss": 0.0146, "step": 110270 }, { "epoch": 0.56, "learning_rate": 0.00021654348144149415, "loss": 0.0167, "step": 110280 }, { "epoch": 0.56, "learning_rate": 0.00021653591374848013, "loss": 0.0131, "step": 110290 }, { "epoch": 0.56, "learning_rate": 0.00021652834605546611, "loss": 0.0151, "step": 110300 }, { "epoch": 0.56, "learning_rate": 0.0002165207783624521, "loss": 0.021, "step": 110310 }, { "epoch": 0.56, "learning_rate": 0.0002165132106694381, "loss": 0.0161, "step": 110320 }, { "epoch": 0.56, "learning_rate": 0.00021650564297642409, "loss": 0.0161, "step": 110330 }, { "epoch": 0.56, "learning_rate": 0.00021649807528341007, "loss": 0.0179, "step": 110340 }, { "epoch": 0.56, "learning_rate": 0.00021649050759039608, "loss": 0.0155, "step": 110350 }, { "epoch": 0.56, "learning_rate": 0.00021648293989738206, "loss": 0.0141, "step": 110360 }, { "epoch": 0.56, "learning_rate": 0.00021647537220436804, "loss": 0.0187, "step": 110370 }, { "epoch": 0.56, "learning_rate": 0.00021646780451135405, "loss": 0.0149, "step": 110380 }, { "epoch": 0.56, "learning_rate": 0.00021646023681834003, "loss": 0.0146, "step": 110390 }, { "epoch": 0.56, "learning_rate": 0.000216452669125326, "loss": 0.0131, "step": 110400 }, { "epoch": 0.56, "learning_rate": 0.00021644510143231202, "loss": 0.0139, "step": 110410 }, { "epoch": 0.56, "learning_rate": 0.000216437533739298, "loss": 0.0112, "step": 110420 }, { "epoch": 0.56, "learning_rate": 0.00021642996604628398, "loss": 0.0148, "step": 110430 }, { "epoch": 0.56, "learning_rate": 0.00021642239835327, "loss": 0.0128, "step": 110440 }, { "epoch": 0.56, "learning_rate": 0.00021641483066025597, "loss": 0.0147, "step": 110450 }, { "epoch": 0.56, "learning_rate": 0.00021640726296724195, "loss": 0.0164, "step": 110460 }, { "epoch": 0.56, "learning_rate": 0.00021639969527422793, "loss": 0.0181, "step": 110470 }, { "epoch": 0.56, "learning_rate": 0.00021639212758121394, "loss": 0.0146, "step": 110480 }, { "epoch": 0.56, "learning_rate": 0.00021638455988819992, "loss": 0.016, "step": 110490 }, { "epoch": 0.56, "learning_rate": 0.0002163769921951859, "loss": 0.0187, "step": 110500 }, { "epoch": 0.56, "learning_rate": 0.00021636942450217191, "loss": 0.014, "step": 110510 }, { "epoch": 0.56, "learning_rate": 0.0002163618568091579, "loss": 0.0164, "step": 110520 }, { "epoch": 0.56, "learning_rate": 0.00021635428911614388, "loss": 0.0137, "step": 110530 }, { "epoch": 0.56, "learning_rate": 0.00021634672142312989, "loss": 0.016, "step": 110540 }, { "epoch": 0.56, "learning_rate": 0.00021633915373011587, "loss": 0.0117, "step": 110550 }, { "epoch": 0.56, "learning_rate": 0.00021633158603710185, "loss": 0.0146, "step": 110560 }, { "epoch": 0.56, "learning_rate": 0.00021632401834408786, "loss": 0.0161, "step": 110570 }, { "epoch": 0.56, "learning_rate": 0.00021631645065107384, "loss": 0.0128, "step": 110580 }, { "epoch": 0.56, "learning_rate": 0.00021630888295805982, "loss": 0.0235, "step": 110590 }, { "epoch": 0.56, "learning_rate": 0.00021630131526504583, "loss": 0.0162, "step": 110600 }, { "epoch": 0.56, "learning_rate": 0.0002162937475720318, "loss": 0.0138, "step": 110610 }, { "epoch": 0.56, "learning_rate": 0.0002162861798790178, "loss": 0.0136, "step": 110620 }, { "epoch": 0.56, "learning_rate": 0.00021627861218600377, "loss": 0.0175, "step": 110630 }, { "epoch": 0.56, "learning_rate": 0.00021627104449298978, "loss": 0.0148, "step": 110640 }, { "epoch": 0.56, "learning_rate": 0.00021626347679997576, "loss": 0.0158, "step": 110650 }, { "epoch": 0.56, "learning_rate": 0.00021625590910696174, "loss": 0.0154, "step": 110660 }, { "epoch": 0.56, "learning_rate": 0.00021624834141394775, "loss": 0.0143, "step": 110670 }, { "epoch": 0.56, "learning_rate": 0.00021624077372093373, "loss": 0.0148, "step": 110680 }, { "epoch": 0.56, "learning_rate": 0.00021623320602791972, "loss": 0.0164, "step": 110690 }, { "epoch": 0.56, "learning_rate": 0.00021622563833490572, "loss": 0.0163, "step": 110700 }, { "epoch": 0.56, "learning_rate": 0.0002162180706418917, "loss": 0.015, "step": 110710 }, { "epoch": 0.56, "learning_rate": 0.0002162105029488777, "loss": 0.0141, "step": 110720 }, { "epoch": 0.56, "learning_rate": 0.0002162029352558637, "loss": 0.0157, "step": 110730 }, { "epoch": 0.56, "learning_rate": 0.00021619536756284968, "loss": 0.0123, "step": 110740 }, { "epoch": 0.56, "learning_rate": 0.00021618779986983566, "loss": 0.0141, "step": 110750 }, { "epoch": 0.56, "learning_rate": 0.00021618023217682167, "loss": 0.0146, "step": 110760 }, { "epoch": 0.56, "learning_rate": 0.00021617266448380765, "loss": 0.0148, "step": 110770 }, { "epoch": 0.56, "learning_rate": 0.00021616509679079363, "loss": 0.0186, "step": 110780 }, { "epoch": 0.56, "learning_rate": 0.00021615752909777964, "loss": 0.0168, "step": 110790 }, { "epoch": 0.56, "learning_rate": 0.00021614996140476562, "loss": 0.0136, "step": 110800 }, { "epoch": 0.56, "learning_rate": 0.0002161423937117516, "loss": 0.0126, "step": 110810 }, { "epoch": 0.56, "learning_rate": 0.00021613482601873758, "loss": 0.0173, "step": 110820 }, { "epoch": 0.56, "learning_rate": 0.0002161272583257236, "loss": 0.0129, "step": 110830 }, { "epoch": 0.56, "learning_rate": 0.00021611969063270957, "loss": 0.016, "step": 110840 }, { "epoch": 0.56, "learning_rate": 0.00021611212293969555, "loss": 0.0134, "step": 110850 }, { "epoch": 0.56, "learning_rate": 0.00021610455524668156, "loss": 0.019, "step": 110860 }, { "epoch": 0.56, "learning_rate": 0.00021609698755366754, "loss": 0.0157, "step": 110870 }, { "epoch": 0.56, "learning_rate": 0.00021608941986065353, "loss": 0.0173, "step": 110880 }, { "epoch": 0.56, "learning_rate": 0.00021608185216763953, "loss": 0.0149, "step": 110890 }, { "epoch": 0.56, "learning_rate": 0.00021607428447462552, "loss": 0.0156, "step": 110900 }, { "epoch": 0.56, "learning_rate": 0.0002160667167816115, "loss": 0.0137, "step": 110910 }, { "epoch": 0.56, "learning_rate": 0.0002160591490885975, "loss": 0.0135, "step": 110920 }, { "epoch": 0.56, "learning_rate": 0.0002160515813955835, "loss": 0.0158, "step": 110930 }, { "epoch": 0.56, "learning_rate": 0.00021604401370256947, "loss": 0.0155, "step": 110940 }, { "epoch": 0.56, "learning_rate": 0.00021603644600955548, "loss": 0.0147, "step": 110950 }, { "epoch": 0.56, "learning_rate": 0.00021602887831654146, "loss": 0.0134, "step": 110960 }, { "epoch": 0.56, "learning_rate": 0.00021602131062352744, "loss": 0.0138, "step": 110970 }, { "epoch": 0.56, "learning_rate": 0.00021601374293051342, "loss": 0.0126, "step": 110980 }, { "epoch": 0.56, "learning_rate": 0.00021600617523749943, "loss": 0.0159, "step": 110990 }, { "epoch": 0.56, "learning_rate": 0.0002159986075444854, "loss": 0.0134, "step": 111000 }, { "epoch": 0.56, "eval_cer": 0.914462492734159, "eval_loss": 0.010961051099002361, "eval_runtime": 116.7509, "eval_samples_per_second": 17.13, "eval_steps_per_second": 4.283, "step": 111000 }, { "epoch": 0.56, "learning_rate": 0.0002159910398514714, "loss": 0.0137, "step": 111010 }, { "epoch": 0.56, "learning_rate": 0.0002159834721584574, "loss": 0.0143, "step": 111020 }, { "epoch": 0.56, "learning_rate": 0.00021597590446544338, "loss": 0.0179, "step": 111030 }, { "epoch": 0.56, "learning_rate": 0.00021596833677242936, "loss": 0.0129, "step": 111040 }, { "epoch": 0.56, "learning_rate": 0.00021596076907941537, "loss": 0.0147, "step": 111050 }, { "epoch": 0.56, "learning_rate": 0.00021595320138640135, "loss": 0.0141, "step": 111060 }, { "epoch": 0.56, "learning_rate": 0.00021594563369338734, "loss": 0.011, "step": 111070 }, { "epoch": 0.56, "learning_rate": 0.00021593806600037334, "loss": 0.0134, "step": 111080 }, { "epoch": 0.56, "learning_rate": 0.00021593049830735933, "loss": 0.0135, "step": 111090 }, { "epoch": 0.56, "learning_rate": 0.0002159229306143453, "loss": 0.013, "step": 111100 }, { "epoch": 0.56, "learning_rate": 0.00021591536292133132, "loss": 0.0121, "step": 111110 }, { "epoch": 0.56, "learning_rate": 0.0002159077952283173, "loss": 0.0138, "step": 111120 }, { "epoch": 0.56, "learning_rate": 0.00021590022753530328, "loss": 0.0152, "step": 111130 }, { "epoch": 0.56, "learning_rate": 0.00021589265984228926, "loss": 0.0119, "step": 111140 }, { "epoch": 0.56, "learning_rate": 0.00021588509214927527, "loss": 0.0138, "step": 111150 }, { "epoch": 0.56, "learning_rate": 0.00021587752445626125, "loss": 0.0133, "step": 111160 }, { "epoch": 0.56, "learning_rate": 0.00021586995676324723, "loss": 0.016, "step": 111170 }, { "epoch": 0.56, "learning_rate": 0.00021586238907023324, "loss": 0.0151, "step": 111180 }, { "epoch": 0.56, "learning_rate": 0.00021585482137721922, "loss": 0.0139, "step": 111190 }, { "epoch": 0.56, "learning_rate": 0.0002158472536842052, "loss": 0.0184, "step": 111200 }, { "epoch": 0.56, "learning_rate": 0.0002158396859911912, "loss": 0.0145, "step": 111210 }, { "epoch": 0.56, "learning_rate": 0.0002158321182981772, "loss": 0.0189, "step": 111220 }, { "epoch": 0.56, "learning_rate": 0.00021582455060516317, "loss": 0.0204, "step": 111230 }, { "epoch": 0.56, "learning_rate": 0.00021581698291214913, "loss": 0.0139, "step": 111240 }, { "epoch": 0.56, "learning_rate": 0.00021580941521913514, "loss": 0.0145, "step": 111250 }, { "epoch": 0.56, "learning_rate": 0.00021580184752612112, "loss": 0.0141, "step": 111260 }, { "epoch": 0.56, "learning_rate": 0.0002157942798331071, "loss": 0.0161, "step": 111270 }, { "epoch": 0.56, "learning_rate": 0.0002157867121400931, "loss": 0.0121, "step": 111280 }, { "epoch": 0.56, "learning_rate": 0.0002157791444470791, "loss": 0.0169, "step": 111290 }, { "epoch": 0.56, "learning_rate": 0.00021577157675406507, "loss": 0.0119, "step": 111300 }, { "epoch": 0.56, "learning_rate": 0.00021576400906105108, "loss": 0.017, "step": 111310 }, { "epoch": 0.56, "learning_rate": 0.00021575644136803706, "loss": 0.0133, "step": 111320 }, { "epoch": 0.56, "learning_rate": 0.00021574887367502304, "loss": 0.0149, "step": 111330 }, { "epoch": 0.56, "learning_rate": 0.00021574130598200905, "loss": 0.014, "step": 111340 }, { "epoch": 0.56, "learning_rate": 0.00021573373828899503, "loss": 0.0133, "step": 111350 }, { "epoch": 0.56, "learning_rate": 0.00021572617059598101, "loss": 0.0144, "step": 111360 }, { "epoch": 0.56, "learning_rate": 0.000215718602902967, "loss": 0.0146, "step": 111370 }, { "epoch": 0.56, "learning_rate": 0.000215711035209953, "loss": 0.0159, "step": 111380 }, { "epoch": 0.56, "learning_rate": 0.00021570346751693899, "loss": 0.0174, "step": 111390 }, { "epoch": 0.56, "learning_rate": 0.00021569589982392497, "loss": 0.0138, "step": 111400 }, { "epoch": 0.56, "learning_rate": 0.00021568833213091098, "loss": 0.0134, "step": 111410 }, { "epoch": 0.56, "learning_rate": 0.00021568076443789696, "loss": 0.0156, "step": 111420 }, { "epoch": 0.56, "learning_rate": 0.00021567319674488294, "loss": 0.0156, "step": 111430 }, { "epoch": 0.56, "learning_rate": 0.00021566562905186895, "loss": 0.0161, "step": 111440 }, { "epoch": 0.56, "learning_rate": 0.00021565806135885493, "loss": 0.0157, "step": 111450 }, { "epoch": 0.56, "learning_rate": 0.0002156504936658409, "loss": 0.0136, "step": 111460 }, { "epoch": 0.56, "learning_rate": 0.00021564292597282692, "loss": 0.0164, "step": 111470 }, { "epoch": 0.56, "learning_rate": 0.0002156353582798129, "loss": 0.0124, "step": 111480 }, { "epoch": 0.56, "learning_rate": 0.00021562779058679888, "loss": 0.0155, "step": 111490 }, { "epoch": 0.56, "learning_rate": 0.0002156202228937849, "loss": 0.0125, "step": 111500 }, { "epoch": 0.56, "learning_rate": 0.00021561265520077087, "loss": 0.0154, "step": 111510 }, { "epoch": 0.56, "learning_rate": 0.00021560508750775685, "loss": 0.0203, "step": 111520 }, { "epoch": 0.56, "learning_rate": 0.00021559751981474283, "loss": 0.014, "step": 111530 }, { "epoch": 0.56, "learning_rate": 0.00021558995212172884, "loss": 0.0149, "step": 111540 }, { "epoch": 0.56, "learning_rate": 0.00021558238442871482, "loss": 0.0156, "step": 111550 }, { "epoch": 0.56, "learning_rate": 0.0002155748167357008, "loss": 0.0158, "step": 111560 }, { "epoch": 0.56, "learning_rate": 0.00021556724904268681, "loss": 0.0125, "step": 111570 }, { "epoch": 0.56, "learning_rate": 0.0002155596813496728, "loss": 0.0137, "step": 111580 }, { "epoch": 0.56, "learning_rate": 0.00021555211365665878, "loss": 0.0136, "step": 111590 }, { "epoch": 0.56, "learning_rate": 0.00021554454596364479, "loss": 0.0153, "step": 111600 }, { "epoch": 0.56, "learning_rate": 0.00021553697827063077, "loss": 0.0156, "step": 111610 }, { "epoch": 0.56, "learning_rate": 0.00021552941057761675, "loss": 0.0135, "step": 111620 }, { "epoch": 0.56, "learning_rate": 0.00021552184288460276, "loss": 0.0147, "step": 111630 }, { "epoch": 0.56, "learning_rate": 0.00021551427519158874, "loss": 0.0157, "step": 111640 }, { "epoch": 0.56, "learning_rate": 0.00021550670749857472, "loss": 0.0163, "step": 111650 }, { "epoch": 0.56, "learning_rate": 0.00021549913980556073, "loss": 0.0135, "step": 111660 }, { "epoch": 0.56, "learning_rate": 0.0002154915721125467, "loss": 0.0114, "step": 111670 }, { "epoch": 0.56, "learning_rate": 0.0002154840044195327, "loss": 0.0199, "step": 111680 }, { "epoch": 0.56, "learning_rate": 0.0002154764367265187, "loss": 0.0155, "step": 111690 }, { "epoch": 0.56, "learning_rate": 0.00021546886903350468, "loss": 0.017, "step": 111700 }, { "epoch": 0.56, "learning_rate": 0.00021546130134049066, "loss": 0.0176, "step": 111710 }, { "epoch": 0.56, "learning_rate": 0.00021545373364747664, "loss": 0.0138, "step": 111720 }, { "epoch": 0.56, "learning_rate": 0.00021544616595446265, "loss": 0.0155, "step": 111730 }, { "epoch": 0.56, "learning_rate": 0.00021543859826144863, "loss": 0.0142, "step": 111740 }, { "epoch": 0.56, "learning_rate": 0.00021543103056843462, "loss": 0.0168, "step": 111750 }, { "epoch": 0.56, "learning_rate": 0.00021542346287542062, "loss": 0.0152, "step": 111760 }, { "epoch": 0.56, "learning_rate": 0.0002154158951824066, "loss": 0.0178, "step": 111770 }, { "epoch": 0.56, "learning_rate": 0.0002154083274893926, "loss": 0.0135, "step": 111780 }, { "epoch": 0.56, "learning_rate": 0.0002154007597963786, "loss": 0.0133, "step": 111790 }, { "epoch": 0.56, "learning_rate": 0.00021539319210336458, "loss": 0.0188, "step": 111800 }, { "epoch": 0.56, "learning_rate": 0.00021538562441035056, "loss": 0.0127, "step": 111810 }, { "epoch": 0.56, "learning_rate": 0.00021537805671733657, "loss": 0.0127, "step": 111820 }, { "epoch": 0.56, "learning_rate": 0.00021537048902432255, "loss": 0.0147, "step": 111830 }, { "epoch": 0.56, "learning_rate": 0.00021536292133130853, "loss": 0.0136, "step": 111840 }, { "epoch": 0.56, "learning_rate": 0.00021535535363829454, "loss": 0.0131, "step": 111850 }, { "epoch": 0.56, "learning_rate": 0.00021534778594528052, "loss": 0.0123, "step": 111860 }, { "epoch": 0.56, "learning_rate": 0.0002153402182522665, "loss": 0.0157, "step": 111870 }, { "epoch": 0.56, "learning_rate": 0.00021533265055925248, "loss": 0.0141, "step": 111880 }, { "epoch": 0.56, "learning_rate": 0.0002153250828662385, "loss": 0.0141, "step": 111890 }, { "epoch": 0.56, "learning_rate": 0.00021531751517322447, "loss": 0.0133, "step": 111900 }, { "epoch": 0.56, "learning_rate": 0.00021530994748021045, "loss": 0.0154, "step": 111910 }, { "epoch": 0.56, "learning_rate": 0.00021530237978719646, "loss": 0.0134, "step": 111920 }, { "epoch": 0.56, "learning_rate": 0.00021529481209418244, "loss": 0.0162, "step": 111930 }, { "epoch": 0.56, "learning_rate": 0.00021528724440116843, "loss": 0.0168, "step": 111940 }, { "epoch": 0.56, "learning_rate": 0.00021527967670815443, "loss": 0.0145, "step": 111950 }, { "epoch": 0.56, "learning_rate": 0.00021527210901514042, "loss": 0.0118, "step": 111960 }, { "epoch": 0.56, "learning_rate": 0.0002152645413221264, "loss": 0.0131, "step": 111970 }, { "epoch": 0.56, "learning_rate": 0.0002152569736291124, "loss": 0.0128, "step": 111980 }, { "epoch": 0.57, "learning_rate": 0.0002152494059360984, "loss": 0.0134, "step": 111990 }, { "epoch": 0.57, "learning_rate": 0.00021524183824308437, "loss": 0.0167, "step": 112000 }, { "epoch": 0.57, "eval_cer": 0.9144595815457828, "eval_loss": 0.011023299768567085, "eval_runtime": 116.6938, "eval_samples_per_second": 17.139, "eval_steps_per_second": 4.285, "step": 112000 }, { "epoch": 0.57, "learning_rate": 0.00021523427055007038, "loss": 0.0195, "step": 112010 }, { "epoch": 0.57, "learning_rate": 0.00021522670285705636, "loss": 0.0127, "step": 112020 }, { "epoch": 0.57, "learning_rate": 0.00021521913516404234, "loss": 0.0153, "step": 112030 }, { "epoch": 0.57, "learning_rate": 0.00021521156747102832, "loss": 0.0166, "step": 112040 }, { "epoch": 0.57, "learning_rate": 0.00021520399977801433, "loss": 0.0152, "step": 112050 }, { "epoch": 0.57, "learning_rate": 0.0002151964320850003, "loss": 0.0159, "step": 112060 }, { "epoch": 0.57, "learning_rate": 0.0002151888643919863, "loss": 0.0152, "step": 112070 }, { "epoch": 0.57, "learning_rate": 0.0002151812966989723, "loss": 0.0179, "step": 112080 }, { "epoch": 0.57, "learning_rate": 0.00021517372900595828, "loss": 0.0182, "step": 112090 }, { "epoch": 0.57, "learning_rate": 0.00021516616131294426, "loss": 0.0182, "step": 112100 }, { "epoch": 0.57, "learning_rate": 0.00021515859361993027, "loss": 0.0156, "step": 112110 }, { "epoch": 0.57, "learning_rate": 0.00021515102592691625, "loss": 0.0191, "step": 112120 }, { "epoch": 0.57, "learning_rate": 0.00021514345823390224, "loss": 0.0153, "step": 112130 }, { "epoch": 0.57, "learning_rate": 0.00021513589054088824, "loss": 0.0165, "step": 112140 }, { "epoch": 0.57, "learning_rate": 0.00021512832284787423, "loss": 0.0143, "step": 112150 }, { "epoch": 0.57, "learning_rate": 0.0002151207551548602, "loss": 0.0154, "step": 112160 }, { "epoch": 0.57, "learning_rate": 0.00021511318746184622, "loss": 0.0149, "step": 112170 }, { "epoch": 0.57, "learning_rate": 0.0002151056197688322, "loss": 0.0132, "step": 112180 }, { "epoch": 0.57, "learning_rate": 0.00021509805207581818, "loss": 0.0111, "step": 112190 }, { "epoch": 0.57, "learning_rate": 0.0002150904843828042, "loss": 0.0147, "step": 112200 }, { "epoch": 0.57, "learning_rate": 0.00021508291668979017, "loss": 0.0165, "step": 112210 }, { "epoch": 0.57, "learning_rate": 0.00021507534899677615, "loss": 0.0142, "step": 112220 }, { "epoch": 0.57, "learning_rate": 0.00021506778130376213, "loss": 0.0134, "step": 112230 }, { "epoch": 0.57, "learning_rate": 0.00021506021361074814, "loss": 0.0141, "step": 112240 }, { "epoch": 0.57, "learning_rate": 0.00021505264591773412, "loss": 0.0153, "step": 112250 }, { "epoch": 0.57, "learning_rate": 0.0002150450782247201, "loss": 0.0162, "step": 112260 }, { "epoch": 0.57, "learning_rate": 0.0002150375105317061, "loss": 0.0133, "step": 112270 }, { "epoch": 0.57, "learning_rate": 0.0002150299428386921, "loss": 0.0153, "step": 112280 }, { "epoch": 0.57, "learning_rate": 0.00021502237514567807, "loss": 0.0169, "step": 112290 }, { "epoch": 0.57, "learning_rate": 0.00021501480745266408, "loss": 0.0133, "step": 112300 }, { "epoch": 0.57, "learning_rate": 0.00021500723975965006, "loss": 0.0134, "step": 112310 }, { "epoch": 0.57, "learning_rate": 0.00021499967206663605, "loss": 0.0123, "step": 112320 }, { "epoch": 0.57, "learning_rate": 0.00021499210437362205, "loss": 0.0195, "step": 112330 }, { "epoch": 0.57, "learning_rate": 0.00021498453668060804, "loss": 0.0159, "step": 112340 }, { "epoch": 0.57, "learning_rate": 0.00021497696898759402, "loss": 0.0147, "step": 112350 }, { "epoch": 0.57, "learning_rate": 0.00021496940129458003, "loss": 0.0153, "step": 112360 }, { "epoch": 0.57, "learning_rate": 0.000214961833601566, "loss": 0.0128, "step": 112370 }, { "epoch": 0.57, "learning_rate": 0.000214954265908552, "loss": 0.0178, "step": 112380 }, { "epoch": 0.57, "learning_rate": 0.00021494669821553797, "loss": 0.0147, "step": 112390 }, { "epoch": 0.57, "learning_rate": 0.00021493913052252398, "loss": 0.0145, "step": 112400 }, { "epoch": 0.57, "learning_rate": 0.00021493156282950996, "loss": 0.0131, "step": 112410 }, { "epoch": 0.57, "learning_rate": 0.00021492399513649594, "loss": 0.0176, "step": 112420 }, { "epoch": 0.57, "learning_rate": 0.00021491642744348195, "loss": 0.0153, "step": 112430 }, { "epoch": 0.57, "learning_rate": 0.00021490885975046793, "loss": 0.0136, "step": 112440 }, { "epoch": 0.57, "learning_rate": 0.0002149012920574539, "loss": 0.0145, "step": 112450 }, { "epoch": 0.57, "learning_rate": 0.00021489372436443992, "loss": 0.015, "step": 112460 }, { "epoch": 0.57, "learning_rate": 0.0002148861566714259, "loss": 0.0154, "step": 112470 }, { "epoch": 0.57, "learning_rate": 0.00021487858897841188, "loss": 0.0152, "step": 112480 }, { "epoch": 0.57, "learning_rate": 0.0002148710212853979, "loss": 0.0182, "step": 112490 }, { "epoch": 0.57, "learning_rate": 0.00021486345359238385, "loss": 0.0151, "step": 112500 }, { "epoch": 0.57, "learning_rate": 0.00021485588589936983, "loss": 0.0166, "step": 112510 }, { "epoch": 0.57, "learning_rate": 0.0002148483182063558, "loss": 0.0154, "step": 112520 }, { "epoch": 0.57, "learning_rate": 0.00021484075051334182, "loss": 0.0146, "step": 112530 }, { "epoch": 0.57, "learning_rate": 0.0002148331828203278, "loss": 0.018, "step": 112540 }, { "epoch": 0.57, "learning_rate": 0.00021482561512731378, "loss": 0.0169, "step": 112550 }, { "epoch": 0.57, "learning_rate": 0.0002148180474342998, "loss": 0.0161, "step": 112560 }, { "epoch": 0.57, "learning_rate": 0.00021481047974128577, "loss": 0.0176, "step": 112570 }, { "epoch": 0.57, "learning_rate": 0.00021480291204827175, "loss": 0.0145, "step": 112580 }, { "epoch": 0.57, "learning_rate": 0.00021479534435525776, "loss": 0.017, "step": 112590 }, { "epoch": 0.57, "learning_rate": 0.00021478777666224374, "loss": 0.0145, "step": 112600 }, { "epoch": 0.57, "learning_rate": 0.00021478020896922972, "loss": 0.0167, "step": 112610 }, { "epoch": 0.57, "learning_rate": 0.0002147726412762157, "loss": 0.0129, "step": 112620 }, { "epoch": 0.57, "learning_rate": 0.00021476507358320171, "loss": 0.016, "step": 112630 }, { "epoch": 0.57, "learning_rate": 0.0002147575058901877, "loss": 0.0161, "step": 112640 }, { "epoch": 0.57, "learning_rate": 0.00021474993819717368, "loss": 0.0152, "step": 112650 }, { "epoch": 0.57, "learning_rate": 0.00021474237050415969, "loss": 0.015, "step": 112660 }, { "epoch": 0.57, "learning_rate": 0.00021473480281114567, "loss": 0.0124, "step": 112670 }, { "epoch": 0.57, "learning_rate": 0.00021472723511813165, "loss": 0.0177, "step": 112680 }, { "epoch": 0.57, "learning_rate": 0.00021471966742511766, "loss": 0.0141, "step": 112690 }, { "epoch": 0.57, "learning_rate": 0.00021471209973210364, "loss": 0.0172, "step": 112700 }, { "epoch": 0.57, "learning_rate": 0.00021470453203908962, "loss": 0.0172, "step": 112710 }, { "epoch": 0.57, "learning_rate": 0.00021469696434607563, "loss": 0.0129, "step": 112720 }, { "epoch": 0.57, "learning_rate": 0.0002146893966530616, "loss": 0.0144, "step": 112730 }, { "epoch": 0.57, "learning_rate": 0.0002146818289600476, "loss": 0.0146, "step": 112740 }, { "epoch": 0.57, "learning_rate": 0.0002146742612670336, "loss": 0.0137, "step": 112750 }, { "epoch": 0.57, "learning_rate": 0.00021466669357401958, "loss": 0.0127, "step": 112760 }, { "epoch": 0.57, "learning_rate": 0.00021465912588100556, "loss": 0.0149, "step": 112770 }, { "epoch": 0.57, "learning_rate": 0.00021465155818799154, "loss": 0.0145, "step": 112780 }, { "epoch": 0.57, "learning_rate": 0.00021464399049497755, "loss": 0.0139, "step": 112790 }, { "epoch": 0.57, "learning_rate": 0.00021463642280196353, "loss": 0.0182, "step": 112800 }, { "epoch": 0.57, "learning_rate": 0.00021462885510894952, "loss": 0.0184, "step": 112810 }, { "epoch": 0.57, "learning_rate": 0.00021462128741593552, "loss": 0.0125, "step": 112820 }, { "epoch": 0.57, "learning_rate": 0.0002146137197229215, "loss": 0.0129, "step": 112830 }, { "epoch": 0.57, "learning_rate": 0.0002146061520299075, "loss": 0.0189, "step": 112840 }, { "epoch": 0.57, "learning_rate": 0.0002145985843368935, "loss": 0.0168, "step": 112850 }, { "epoch": 0.57, "learning_rate": 0.00021459101664387948, "loss": 0.0165, "step": 112860 }, { "epoch": 0.57, "learning_rate": 0.00021458344895086546, "loss": 0.0146, "step": 112870 }, { "epoch": 0.57, "learning_rate": 0.00021457588125785147, "loss": 0.0148, "step": 112880 }, { "epoch": 0.57, "learning_rate": 0.00021456831356483745, "loss": 0.0177, "step": 112890 }, { "epoch": 0.57, "learning_rate": 0.00021456074587182343, "loss": 0.0177, "step": 112900 }, { "epoch": 0.57, "learning_rate": 0.00021455317817880944, "loss": 0.0157, "step": 112910 }, { "epoch": 0.57, "learning_rate": 0.00021454561048579542, "loss": 0.0153, "step": 112920 }, { "epoch": 0.57, "learning_rate": 0.0002145380427927814, "loss": 0.0155, "step": 112930 }, { "epoch": 0.57, "learning_rate": 0.00021453047509976738, "loss": 0.0152, "step": 112940 }, { "epoch": 0.57, "learning_rate": 0.0002145229074067534, "loss": 0.013, "step": 112950 }, { "epoch": 0.57, "learning_rate": 0.00021451533971373937, "loss": 0.015, "step": 112960 }, { "epoch": 0.57, "learning_rate": 0.00021450777202072535, "loss": 0.0171, "step": 112970 }, { "epoch": 0.57, "learning_rate": 0.00021450020432771136, "loss": 0.016, "step": 112980 }, { "epoch": 0.57, "learning_rate": 0.00021449263663469734, "loss": 0.0162, "step": 112990 }, { "epoch": 0.57, "learning_rate": 0.00021448506894168333, "loss": 0.012, "step": 113000 }, { "epoch": 0.57, "eval_cer": 0.9144906342217957, "eval_loss": 0.01105137262493372, "eval_runtime": 116.8218, "eval_samples_per_second": 17.12, "eval_steps_per_second": 4.28, "step": 113000 }, { "epoch": 0.57, "learning_rate": 0.00021447750124866933, "loss": 0.0144, "step": 113010 }, { "epoch": 0.57, "learning_rate": 0.00021446993355565532, "loss": 0.0109, "step": 113020 }, { "epoch": 0.57, "learning_rate": 0.0002144623658626413, "loss": 0.0141, "step": 113030 }, { "epoch": 0.57, "learning_rate": 0.0002144547981696273, "loss": 0.0138, "step": 113040 }, { "epoch": 0.57, "learning_rate": 0.0002144472304766133, "loss": 0.0126, "step": 113050 }, { "epoch": 0.57, "learning_rate": 0.00021443966278359927, "loss": 0.015, "step": 113060 }, { "epoch": 0.57, "learning_rate": 0.00021443209509058528, "loss": 0.0164, "step": 113070 }, { "epoch": 0.57, "learning_rate": 0.00021442452739757126, "loss": 0.0143, "step": 113080 }, { "epoch": 0.57, "learning_rate": 0.00021441695970455724, "loss": 0.0136, "step": 113090 }, { "epoch": 0.57, "learning_rate": 0.00021440939201154325, "loss": 0.0155, "step": 113100 }, { "epoch": 0.57, "learning_rate": 0.00021440182431852923, "loss": 0.0133, "step": 113110 }, { "epoch": 0.57, "learning_rate": 0.0002143942566255152, "loss": 0.0129, "step": 113120 }, { "epoch": 0.57, "learning_rate": 0.0002143866889325012, "loss": 0.0142, "step": 113130 }, { "epoch": 0.57, "learning_rate": 0.0002143791212394872, "loss": 0.0134, "step": 113140 }, { "epoch": 0.57, "learning_rate": 0.00021437155354647318, "loss": 0.015, "step": 113150 }, { "epoch": 0.57, "learning_rate": 0.00021436398585345916, "loss": 0.0131, "step": 113160 }, { "epoch": 0.57, "learning_rate": 0.00021435641816044517, "loss": 0.0163, "step": 113170 }, { "epoch": 0.57, "learning_rate": 0.00021434885046743115, "loss": 0.0121, "step": 113180 }, { "epoch": 0.57, "learning_rate": 0.00021434128277441714, "loss": 0.0155, "step": 113190 }, { "epoch": 0.57, "learning_rate": 0.00021433371508140314, "loss": 0.0172, "step": 113200 }, { "epoch": 0.57, "learning_rate": 0.00021432614738838913, "loss": 0.0142, "step": 113210 }, { "epoch": 0.57, "learning_rate": 0.0002143185796953751, "loss": 0.0118, "step": 113220 }, { "epoch": 0.57, "learning_rate": 0.00021431101200236112, "loss": 0.0115, "step": 113230 }, { "epoch": 0.57, "learning_rate": 0.0002143034443093471, "loss": 0.0165, "step": 113240 }, { "epoch": 0.57, "learning_rate": 0.00021429587661633308, "loss": 0.013, "step": 113250 }, { "epoch": 0.57, "learning_rate": 0.0002142883089233191, "loss": 0.0122, "step": 113260 }, { "epoch": 0.57, "learning_rate": 0.00021428074123030507, "loss": 0.0128, "step": 113270 }, { "epoch": 0.57, "learning_rate": 0.00021427317353729105, "loss": 0.0123, "step": 113280 }, { "epoch": 0.57, "learning_rate": 0.00021426560584427703, "loss": 0.0125, "step": 113290 }, { "epoch": 0.57, "learning_rate": 0.00021425803815126304, "loss": 0.0142, "step": 113300 }, { "epoch": 0.57, "learning_rate": 0.00021425047045824902, "loss": 0.0155, "step": 113310 }, { "epoch": 0.57, "learning_rate": 0.000214242902765235, "loss": 0.0127, "step": 113320 }, { "epoch": 0.57, "learning_rate": 0.000214235335072221, "loss": 0.0177, "step": 113330 }, { "epoch": 0.57, "learning_rate": 0.000214227767379207, "loss": 0.0179, "step": 113340 }, { "epoch": 0.57, "learning_rate": 0.00021422019968619297, "loss": 0.0167, "step": 113350 }, { "epoch": 0.57, "learning_rate": 0.00021421263199317898, "loss": 0.0137, "step": 113360 }, { "epoch": 0.57, "learning_rate": 0.00021420506430016496, "loss": 0.0126, "step": 113370 }, { "epoch": 0.57, "learning_rate": 0.00021419749660715095, "loss": 0.0136, "step": 113380 }, { "epoch": 0.57, "learning_rate": 0.00021418992891413695, "loss": 0.0182, "step": 113390 }, { "epoch": 0.57, "learning_rate": 0.00021418236122112294, "loss": 0.0153, "step": 113400 }, { "epoch": 0.57, "learning_rate": 0.00021417479352810892, "loss": 0.0141, "step": 113410 }, { "epoch": 0.57, "learning_rate": 0.00021416722583509493, "loss": 0.0167, "step": 113420 }, { "epoch": 0.57, "learning_rate": 0.0002141596581420809, "loss": 0.0156, "step": 113430 }, { "epoch": 0.57, "learning_rate": 0.0002141520904490669, "loss": 0.0175, "step": 113440 }, { "epoch": 0.57, "learning_rate": 0.00021414452275605287, "loss": 0.017, "step": 113450 }, { "epoch": 0.57, "learning_rate": 0.00021413695506303888, "loss": 0.0131, "step": 113460 }, { "epoch": 0.57, "learning_rate": 0.00021412938737002486, "loss": 0.0128, "step": 113470 }, { "epoch": 0.57, "learning_rate": 0.00021412181967701084, "loss": 0.0122, "step": 113480 }, { "epoch": 0.57, "learning_rate": 0.00021411425198399685, "loss": 0.0181, "step": 113490 }, { "epoch": 0.57, "learning_rate": 0.00021410668429098283, "loss": 0.0139, "step": 113500 }, { "epoch": 0.57, "learning_rate": 0.0002140991165979688, "loss": 0.014, "step": 113510 }, { "epoch": 0.57, "learning_rate": 0.00021409154890495482, "loss": 0.0205, "step": 113520 }, { "epoch": 0.57, "learning_rate": 0.0002140839812119408, "loss": 0.0162, "step": 113530 }, { "epoch": 0.57, "learning_rate": 0.00021407641351892678, "loss": 0.0136, "step": 113540 }, { "epoch": 0.57, "learning_rate": 0.0002140688458259128, "loss": 0.0142, "step": 113550 }, { "epoch": 0.57, "learning_rate": 0.00021406127813289877, "loss": 0.0172, "step": 113560 }, { "epoch": 0.57, "learning_rate": 0.00021405371043988476, "loss": 0.013, "step": 113570 }, { "epoch": 0.57, "learning_rate": 0.00021404614274687076, "loss": 0.0134, "step": 113580 }, { "epoch": 0.57, "learning_rate": 0.00021403857505385675, "loss": 0.0112, "step": 113590 }, { "epoch": 0.57, "learning_rate": 0.00021403100736084273, "loss": 0.0147, "step": 113600 }, { "epoch": 0.57, "learning_rate": 0.0002140234396678287, "loss": 0.0163, "step": 113610 }, { "epoch": 0.57, "learning_rate": 0.00021401587197481472, "loss": 0.013, "step": 113620 }, { "epoch": 0.57, "learning_rate": 0.0002140083042818007, "loss": 0.0175, "step": 113630 }, { "epoch": 0.57, "learning_rate": 0.00021400073658878668, "loss": 0.0173, "step": 113640 }, { "epoch": 0.57, "learning_rate": 0.0002139931688957727, "loss": 0.0137, "step": 113650 }, { "epoch": 0.57, "learning_rate": 0.00021398560120275867, "loss": 0.013, "step": 113660 }, { "epoch": 0.57, "learning_rate": 0.00021397803350974465, "loss": 0.0123, "step": 113670 }, { "epoch": 0.57, "learning_rate": 0.00021397046581673066, "loss": 0.0183, "step": 113680 }, { "epoch": 0.57, "learning_rate": 0.00021396289812371664, "loss": 0.016, "step": 113690 }, { "epoch": 0.57, "learning_rate": 0.00021395533043070262, "loss": 0.0172, "step": 113700 }, { "epoch": 0.57, "learning_rate": 0.00021394776273768863, "loss": 0.0139, "step": 113710 }, { "epoch": 0.57, "learning_rate": 0.0002139401950446746, "loss": 0.0141, "step": 113720 }, { "epoch": 0.57, "learning_rate": 0.0002139326273516606, "loss": 0.0152, "step": 113730 }, { "epoch": 0.57, "learning_rate": 0.0002139250596586466, "loss": 0.0127, "step": 113740 }, { "epoch": 0.57, "learning_rate": 0.00021391749196563256, "loss": 0.0144, "step": 113750 }, { "epoch": 0.57, "learning_rate": 0.00021390992427261854, "loss": 0.0143, "step": 113760 }, { "epoch": 0.57, "learning_rate": 0.00021390235657960452, "loss": 0.0119, "step": 113770 }, { "epoch": 0.57, "learning_rate": 0.00021389478888659053, "loss": 0.0137, "step": 113780 }, { "epoch": 0.57, "learning_rate": 0.0002138872211935765, "loss": 0.0168, "step": 113790 }, { "epoch": 0.57, "learning_rate": 0.0002138796535005625, "loss": 0.014, "step": 113800 }, { "epoch": 0.57, "learning_rate": 0.0002138720858075485, "loss": 0.0155, "step": 113810 }, { "epoch": 0.57, "learning_rate": 0.00021386451811453448, "loss": 0.0164, "step": 113820 }, { "epoch": 0.57, "learning_rate": 0.00021385695042152046, "loss": 0.0149, "step": 113830 }, { "epoch": 0.57, "learning_rate": 0.00021384938272850644, "loss": 0.0165, "step": 113840 }, { "epoch": 0.57, "learning_rate": 0.00021384181503549245, "loss": 0.0137, "step": 113850 }, { "epoch": 0.57, "learning_rate": 0.00021383424734247843, "loss": 0.0124, "step": 113860 }, { "epoch": 0.57, "learning_rate": 0.00021382667964946442, "loss": 0.0167, "step": 113870 }, { "epoch": 0.57, "learning_rate": 0.00021381911195645042, "loss": 0.0139, "step": 113880 }, { "epoch": 0.57, "learning_rate": 0.0002138115442634364, "loss": 0.0131, "step": 113890 }, { "epoch": 0.57, "learning_rate": 0.0002138039765704224, "loss": 0.0157, "step": 113900 }, { "epoch": 0.57, "learning_rate": 0.0002137964088774084, "loss": 0.0146, "step": 113910 }, { "epoch": 0.57, "learning_rate": 0.00021378884118439438, "loss": 0.0136, "step": 113920 }, { "epoch": 0.57, "learning_rate": 0.00021378127349138036, "loss": 0.0117, "step": 113930 }, { "epoch": 0.57, "learning_rate": 0.00021377370579836637, "loss": 0.0126, "step": 113940 }, { "epoch": 0.57, "learning_rate": 0.00021376613810535235, "loss": 0.0138, "step": 113950 }, { "epoch": 0.57, "learning_rate": 0.00021375857041233833, "loss": 0.0143, "step": 113960 }, { "epoch": 0.57, "learning_rate": 0.00021375100271932434, "loss": 0.0129, "step": 113970 }, { "epoch": 0.58, "learning_rate": 0.00021374343502631032, "loss": 0.0132, "step": 113980 }, { "epoch": 0.58, "learning_rate": 0.0002137358673332963, "loss": 0.0198, "step": 113990 }, { "epoch": 0.58, "learning_rate": 0.00021372829964028228, "loss": 0.0163, "step": 114000 }, { "epoch": 0.58, "eval_cer": 0.9144751078837893, "eval_loss": 0.010899759829044342, "eval_runtime": 116.7433, "eval_samples_per_second": 17.132, "eval_steps_per_second": 4.283, "step": 114000 }, { "epoch": 0.58, "learning_rate": 0.0002137207319472683, "loss": 0.0124, "step": 114010 }, { "epoch": 0.58, "learning_rate": 0.00021371316425425427, "loss": 0.0174, "step": 114020 }, { "epoch": 0.58, "learning_rate": 0.00021370559656124025, "loss": 0.0158, "step": 114030 }, { "epoch": 0.58, "learning_rate": 0.00021369802886822626, "loss": 0.0166, "step": 114040 }, { "epoch": 0.58, "learning_rate": 0.00021369046117521224, "loss": 0.0124, "step": 114050 }, { "epoch": 0.58, "learning_rate": 0.00021368289348219823, "loss": 0.0182, "step": 114060 }, { "epoch": 0.58, "learning_rate": 0.00021367532578918423, "loss": 0.017, "step": 114070 }, { "epoch": 0.58, "learning_rate": 0.00021366775809617022, "loss": 0.0179, "step": 114080 }, { "epoch": 0.58, "learning_rate": 0.0002136601904031562, "loss": 0.0182, "step": 114090 }, { "epoch": 0.58, "learning_rate": 0.0002136526227101422, "loss": 0.0149, "step": 114100 }, { "epoch": 0.58, "learning_rate": 0.0002136450550171282, "loss": 0.019, "step": 114110 }, { "epoch": 0.58, "learning_rate": 0.00021363748732411417, "loss": 0.0156, "step": 114120 }, { "epoch": 0.58, "learning_rate": 0.00021362991963110018, "loss": 0.0116, "step": 114130 }, { "epoch": 0.58, "learning_rate": 0.00021362235193808616, "loss": 0.0136, "step": 114140 }, { "epoch": 0.58, "learning_rate": 0.00021361478424507214, "loss": 0.0135, "step": 114150 }, { "epoch": 0.58, "learning_rate": 0.00021360721655205815, "loss": 0.0153, "step": 114160 }, { "epoch": 0.58, "learning_rate": 0.00021359964885904413, "loss": 0.015, "step": 114170 }, { "epoch": 0.58, "learning_rate": 0.0002135920811660301, "loss": 0.0125, "step": 114180 }, { "epoch": 0.58, "learning_rate": 0.0002135845134730161, "loss": 0.0199, "step": 114190 }, { "epoch": 0.58, "learning_rate": 0.0002135769457800021, "loss": 0.013, "step": 114200 }, { "epoch": 0.58, "learning_rate": 0.00021356937808698808, "loss": 0.0131, "step": 114210 }, { "epoch": 0.58, "learning_rate": 0.00021356181039397406, "loss": 0.0158, "step": 114220 }, { "epoch": 0.58, "learning_rate": 0.00021355424270096007, "loss": 0.0137, "step": 114230 }, { "epoch": 0.58, "learning_rate": 0.00021354667500794605, "loss": 0.0186, "step": 114240 }, { "epoch": 0.58, "learning_rate": 0.00021353910731493204, "loss": 0.016, "step": 114250 }, { "epoch": 0.58, "learning_rate": 0.00021353153962191804, "loss": 0.0156, "step": 114260 }, { "epoch": 0.58, "learning_rate": 0.00021352397192890403, "loss": 0.0145, "step": 114270 }, { "epoch": 0.58, "learning_rate": 0.00021351640423589, "loss": 0.014, "step": 114280 }, { "epoch": 0.58, "learning_rate": 0.00021350883654287602, "loss": 0.0156, "step": 114290 }, { "epoch": 0.58, "learning_rate": 0.000213501268849862, "loss": 0.0177, "step": 114300 }, { "epoch": 0.58, "learning_rate": 0.00021349370115684798, "loss": 0.0136, "step": 114310 }, { "epoch": 0.58, "learning_rate": 0.000213486133463834, "loss": 0.0139, "step": 114320 }, { "epoch": 0.58, "learning_rate": 0.00021347856577081997, "loss": 0.0191, "step": 114330 }, { "epoch": 0.58, "learning_rate": 0.00021347099807780595, "loss": 0.0184, "step": 114340 }, { "epoch": 0.58, "learning_rate": 0.00021346343038479193, "loss": 0.018, "step": 114350 }, { "epoch": 0.58, "learning_rate": 0.00021345586269177794, "loss": 0.0148, "step": 114360 }, { "epoch": 0.58, "learning_rate": 0.00021344829499876392, "loss": 0.0157, "step": 114370 }, { "epoch": 0.58, "learning_rate": 0.0002134407273057499, "loss": 0.0136, "step": 114380 }, { "epoch": 0.58, "learning_rate": 0.0002134331596127359, "loss": 0.0158, "step": 114390 }, { "epoch": 0.58, "learning_rate": 0.0002134255919197219, "loss": 0.0144, "step": 114400 }, { "epoch": 0.58, "learning_rate": 0.00021341802422670787, "loss": 0.015, "step": 114410 }, { "epoch": 0.58, "learning_rate": 0.00021341045653369388, "loss": 0.013, "step": 114420 }, { "epoch": 0.58, "learning_rate": 0.00021340288884067986, "loss": 0.0137, "step": 114430 }, { "epoch": 0.58, "learning_rate": 0.00021339532114766585, "loss": 0.0161, "step": 114440 }, { "epoch": 0.58, "learning_rate": 0.00021338775345465185, "loss": 0.0173, "step": 114450 }, { "epoch": 0.58, "learning_rate": 0.00021338018576163784, "loss": 0.0167, "step": 114460 }, { "epoch": 0.58, "learning_rate": 0.00021337261806862382, "loss": 0.0128, "step": 114470 }, { "epoch": 0.58, "learning_rate": 0.00021336505037560983, "loss": 0.0147, "step": 114480 }, { "epoch": 0.58, "learning_rate": 0.0002133574826825958, "loss": 0.0143, "step": 114490 }, { "epoch": 0.58, "learning_rate": 0.0002133499149895818, "loss": 0.0149, "step": 114500 }, { "epoch": 0.58, "learning_rate": 0.00021334234729656777, "loss": 0.0123, "step": 114510 }, { "epoch": 0.58, "learning_rate": 0.00021333477960355378, "loss": 0.0166, "step": 114520 }, { "epoch": 0.58, "learning_rate": 0.00021332721191053976, "loss": 0.0144, "step": 114530 }, { "epoch": 0.58, "learning_rate": 0.00021331964421752574, "loss": 0.0137, "step": 114540 }, { "epoch": 0.58, "learning_rate": 0.00021331207652451175, "loss": 0.0149, "step": 114550 }, { "epoch": 0.58, "learning_rate": 0.00021330450883149773, "loss": 0.0172, "step": 114560 }, { "epoch": 0.58, "learning_rate": 0.0002132969411384837, "loss": 0.0155, "step": 114570 }, { "epoch": 0.58, "learning_rate": 0.00021328937344546972, "loss": 0.0166, "step": 114580 }, { "epoch": 0.58, "learning_rate": 0.0002132818057524557, "loss": 0.0122, "step": 114590 }, { "epoch": 0.58, "learning_rate": 0.00021327423805944168, "loss": 0.0126, "step": 114600 }, { "epoch": 0.58, "learning_rate": 0.0002132666703664277, "loss": 0.0165, "step": 114610 }, { "epoch": 0.58, "learning_rate": 0.00021325910267341367, "loss": 0.015, "step": 114620 }, { "epoch": 0.58, "learning_rate": 0.00021325153498039966, "loss": 0.0154, "step": 114630 }, { "epoch": 0.58, "learning_rate": 0.00021324396728738566, "loss": 0.0113, "step": 114640 }, { "epoch": 0.58, "learning_rate": 0.00021323639959437165, "loss": 0.016, "step": 114650 }, { "epoch": 0.58, "learning_rate": 0.00021322883190135763, "loss": 0.0173, "step": 114660 }, { "epoch": 0.58, "learning_rate": 0.00021322126420834364, "loss": 0.0144, "step": 114670 }, { "epoch": 0.58, "learning_rate": 0.00021321369651532962, "loss": 0.0172, "step": 114680 }, { "epoch": 0.58, "learning_rate": 0.0002132061288223156, "loss": 0.0195, "step": 114690 }, { "epoch": 0.58, "learning_rate": 0.00021319856112930158, "loss": 0.0155, "step": 114700 }, { "epoch": 0.58, "learning_rate": 0.0002131909934362876, "loss": 0.0172, "step": 114710 }, { "epoch": 0.58, "learning_rate": 0.00021318342574327357, "loss": 0.0176, "step": 114720 }, { "epoch": 0.58, "learning_rate": 0.00021317585805025955, "loss": 0.0133, "step": 114730 }, { "epoch": 0.58, "learning_rate": 0.00021316829035724556, "loss": 0.0148, "step": 114740 }, { "epoch": 0.58, "learning_rate": 0.00021316072266423154, "loss": 0.0113, "step": 114750 }, { "epoch": 0.58, "learning_rate": 0.00021315315497121752, "loss": 0.0164, "step": 114760 }, { "epoch": 0.58, "learning_rate": 0.00021314558727820353, "loss": 0.0172, "step": 114770 }, { "epoch": 0.58, "learning_rate": 0.0002131380195851895, "loss": 0.0137, "step": 114780 }, { "epoch": 0.58, "learning_rate": 0.0002131304518921755, "loss": 0.0176, "step": 114790 }, { "epoch": 0.58, "learning_rate": 0.0002131228841991615, "loss": 0.0144, "step": 114800 }, { "epoch": 0.58, "learning_rate": 0.00021311531650614748, "loss": 0.0164, "step": 114810 }, { "epoch": 0.58, "learning_rate": 0.00021310774881313347, "loss": 0.0147, "step": 114820 }, { "epoch": 0.58, "learning_rate": 0.00021310018112011947, "loss": 0.0126, "step": 114830 }, { "epoch": 0.58, "learning_rate": 0.00021309261342710546, "loss": 0.0139, "step": 114840 }, { "epoch": 0.58, "learning_rate": 0.00021308504573409144, "loss": 0.0145, "step": 114850 }, { "epoch": 0.58, "learning_rate": 0.00021307747804107742, "loss": 0.0157, "step": 114860 }, { "epoch": 0.58, "learning_rate": 0.00021306991034806343, "loss": 0.0135, "step": 114870 }, { "epoch": 0.58, "learning_rate": 0.0002130623426550494, "loss": 0.0161, "step": 114880 }, { "epoch": 0.58, "learning_rate": 0.0002130547749620354, "loss": 0.0139, "step": 114890 }, { "epoch": 0.58, "learning_rate": 0.0002130472072690214, "loss": 0.014, "step": 114900 }, { "epoch": 0.58, "learning_rate": 0.00021303963957600738, "loss": 0.016, "step": 114910 }, { "epoch": 0.58, "learning_rate": 0.00021303207188299336, "loss": 0.0133, "step": 114920 }, { "epoch": 0.58, "learning_rate": 0.00021302450418997937, "loss": 0.015, "step": 114930 }, { "epoch": 0.58, "learning_rate": 0.00021301693649696535, "loss": 0.0177, "step": 114940 }, { "epoch": 0.58, "learning_rate": 0.00021300936880395133, "loss": 0.0156, "step": 114950 }, { "epoch": 0.58, "learning_rate": 0.00021300180111093734, "loss": 0.0172, "step": 114960 }, { "epoch": 0.58, "learning_rate": 0.00021299423341792332, "loss": 0.0139, "step": 114970 }, { "epoch": 0.58, "learning_rate": 0.0002129866657249093, "loss": 0.0137, "step": 114980 }, { "epoch": 0.58, "learning_rate": 0.0002129790980318953, "loss": 0.0122, "step": 114990 }, { "epoch": 0.58, "learning_rate": 0.0002129715303388813, "loss": 0.0139, "step": 115000 }, { "epoch": 0.58, "eval_cer": 0.914481900656667, "eval_loss": 0.010673732496798038, "eval_runtime": 116.7514, "eval_samples_per_second": 17.13, "eval_steps_per_second": 4.283, "step": 115000 }, { "epoch": 0.58, "learning_rate": 0.00021296396264586725, "loss": 0.0189, "step": 115010 }, { "epoch": 0.58, "learning_rate": 0.00021295639495285323, "loss": 0.0179, "step": 115020 }, { "epoch": 0.58, "learning_rate": 0.00021294882725983924, "loss": 0.0161, "step": 115030 }, { "epoch": 0.58, "learning_rate": 0.00021294125956682522, "loss": 0.0156, "step": 115040 }, { "epoch": 0.58, "learning_rate": 0.0002129336918738112, "loss": 0.0132, "step": 115050 }, { "epoch": 0.58, "learning_rate": 0.0002129261241807972, "loss": 0.0175, "step": 115060 }, { "epoch": 0.58, "learning_rate": 0.0002129185564877832, "loss": 0.0137, "step": 115070 }, { "epoch": 0.58, "learning_rate": 0.00021291098879476917, "loss": 0.0133, "step": 115080 }, { "epoch": 0.58, "learning_rate": 0.00021290342110175515, "loss": 0.0138, "step": 115090 }, { "epoch": 0.58, "learning_rate": 0.00021289585340874116, "loss": 0.0155, "step": 115100 }, { "epoch": 0.58, "learning_rate": 0.00021288828571572714, "loss": 0.0138, "step": 115110 }, { "epoch": 0.58, "learning_rate": 0.00021288071802271313, "loss": 0.0133, "step": 115120 }, { "epoch": 0.58, "learning_rate": 0.00021287315032969913, "loss": 0.015, "step": 115130 }, { "epoch": 0.58, "learning_rate": 0.00021286558263668512, "loss": 0.0165, "step": 115140 }, { "epoch": 0.58, "learning_rate": 0.0002128580149436711, "loss": 0.0177, "step": 115150 }, { "epoch": 0.58, "learning_rate": 0.0002128504472506571, "loss": 0.0166, "step": 115160 }, { "epoch": 0.58, "learning_rate": 0.0002128428795576431, "loss": 0.0148, "step": 115170 }, { "epoch": 0.58, "learning_rate": 0.00021283531186462907, "loss": 0.015, "step": 115180 }, { "epoch": 0.58, "learning_rate": 0.00021282774417161508, "loss": 0.0151, "step": 115190 }, { "epoch": 0.58, "learning_rate": 0.00021282017647860106, "loss": 0.0125, "step": 115200 }, { "epoch": 0.58, "learning_rate": 0.00021281260878558704, "loss": 0.0148, "step": 115210 }, { "epoch": 0.58, "learning_rate": 0.00021280504109257305, "loss": 0.0161, "step": 115220 }, { "epoch": 0.58, "learning_rate": 0.00021279747339955903, "loss": 0.0156, "step": 115230 }, { "epoch": 0.58, "learning_rate": 0.000212789905706545, "loss": 0.0138, "step": 115240 }, { "epoch": 0.58, "learning_rate": 0.000212782338013531, "loss": 0.0171, "step": 115250 }, { "epoch": 0.58, "learning_rate": 0.000212774770320517, "loss": 0.0167, "step": 115260 }, { "epoch": 0.58, "learning_rate": 0.00021276720262750298, "loss": 0.0131, "step": 115270 }, { "epoch": 0.58, "learning_rate": 0.00021275963493448896, "loss": 0.014, "step": 115280 }, { "epoch": 0.58, "learning_rate": 0.00021275206724147497, "loss": 0.0129, "step": 115290 }, { "epoch": 0.58, "learning_rate": 0.00021274449954846095, "loss": 0.0186, "step": 115300 }, { "epoch": 0.58, "learning_rate": 0.00021273693185544694, "loss": 0.0129, "step": 115310 }, { "epoch": 0.58, "learning_rate": 0.00021272936416243294, "loss": 0.014, "step": 115320 }, { "epoch": 0.58, "learning_rate": 0.00021272179646941893, "loss": 0.017, "step": 115330 }, { "epoch": 0.58, "learning_rate": 0.0002127142287764049, "loss": 0.0142, "step": 115340 }, { "epoch": 0.58, "learning_rate": 0.00021270666108339092, "loss": 0.017, "step": 115350 }, { "epoch": 0.58, "learning_rate": 0.0002126990933903769, "loss": 0.0163, "step": 115360 }, { "epoch": 0.58, "learning_rate": 0.00021269152569736288, "loss": 0.0149, "step": 115370 }, { "epoch": 0.58, "learning_rate": 0.0002126839580043489, "loss": 0.0133, "step": 115380 }, { "epoch": 0.58, "learning_rate": 0.00021267639031133487, "loss": 0.0156, "step": 115390 }, { "epoch": 0.58, "learning_rate": 0.00021266882261832085, "loss": 0.0144, "step": 115400 }, { "epoch": 0.58, "learning_rate": 0.00021266125492530683, "loss": 0.0124, "step": 115410 }, { "epoch": 0.58, "learning_rate": 0.00021265368723229284, "loss": 0.0131, "step": 115420 }, { "epoch": 0.58, "learning_rate": 0.00021264611953927882, "loss": 0.0134, "step": 115430 }, { "epoch": 0.58, "learning_rate": 0.0002126385518462648, "loss": 0.0152, "step": 115440 }, { "epoch": 0.58, "learning_rate": 0.0002126309841532508, "loss": 0.013, "step": 115450 }, { "epoch": 0.58, "learning_rate": 0.0002126234164602368, "loss": 0.0147, "step": 115460 }, { "epoch": 0.58, "learning_rate": 0.00021261584876722277, "loss": 0.0212, "step": 115470 }, { "epoch": 0.58, "learning_rate": 0.00021260828107420878, "loss": 0.0134, "step": 115480 }, { "epoch": 0.58, "learning_rate": 0.00021260071338119476, "loss": 0.0186, "step": 115490 }, { "epoch": 0.58, "learning_rate": 0.00021259314568818075, "loss": 0.0145, "step": 115500 }, { "epoch": 0.58, "learning_rate": 0.00021258557799516675, "loss": 0.0126, "step": 115510 }, { "epoch": 0.58, "learning_rate": 0.00021257801030215274, "loss": 0.0182, "step": 115520 }, { "epoch": 0.58, "learning_rate": 0.00021257044260913872, "loss": 0.0148, "step": 115530 }, { "epoch": 0.58, "learning_rate": 0.00021256287491612473, "loss": 0.0169, "step": 115540 }, { "epoch": 0.58, "learning_rate": 0.0002125553072231107, "loss": 0.0121, "step": 115550 }, { "epoch": 0.58, "learning_rate": 0.0002125477395300967, "loss": 0.0132, "step": 115560 }, { "epoch": 0.58, "learning_rate": 0.0002125401718370827, "loss": 0.0173, "step": 115570 }, { "epoch": 0.58, "learning_rate": 0.00021253260414406868, "loss": 0.0155, "step": 115580 }, { "epoch": 0.58, "learning_rate": 0.00021252503645105466, "loss": 0.0125, "step": 115590 }, { "epoch": 0.58, "learning_rate": 0.00021251746875804064, "loss": 0.0122, "step": 115600 }, { "epoch": 0.58, "learning_rate": 0.00021250990106502665, "loss": 0.015, "step": 115610 }, { "epoch": 0.58, "learning_rate": 0.00021250233337201263, "loss": 0.0173, "step": 115620 }, { "epoch": 0.58, "learning_rate": 0.00021249476567899861, "loss": 0.0134, "step": 115630 }, { "epoch": 0.58, "learning_rate": 0.00021248719798598462, "loss": 0.0141, "step": 115640 }, { "epoch": 0.58, "learning_rate": 0.0002124796302929706, "loss": 0.0159, "step": 115650 }, { "epoch": 0.58, "learning_rate": 0.00021247206259995659, "loss": 0.0143, "step": 115660 }, { "epoch": 0.58, "learning_rate": 0.0002124644949069426, "loss": 0.0169, "step": 115670 }, { "epoch": 0.58, "learning_rate": 0.00021245692721392858, "loss": 0.0172, "step": 115680 }, { "epoch": 0.58, "learning_rate": 0.00021244935952091456, "loss": 0.0152, "step": 115690 }, { "epoch": 0.58, "learning_rate": 0.00021244179182790056, "loss": 0.0121, "step": 115700 }, { "epoch": 0.58, "learning_rate": 0.00021243422413488655, "loss": 0.0149, "step": 115710 }, { "epoch": 0.58, "learning_rate": 0.00021242665644187253, "loss": 0.0119, "step": 115720 }, { "epoch": 0.58, "learning_rate": 0.00021241908874885854, "loss": 0.0166, "step": 115730 }, { "epoch": 0.58, "learning_rate": 0.00021241152105584452, "loss": 0.0142, "step": 115740 }, { "epoch": 0.58, "learning_rate": 0.0002124039533628305, "loss": 0.0153, "step": 115750 }, { "epoch": 0.58, "learning_rate": 0.00021239638566981648, "loss": 0.012, "step": 115760 }, { "epoch": 0.58, "learning_rate": 0.0002123888179768025, "loss": 0.0147, "step": 115770 }, { "epoch": 0.58, "learning_rate": 0.00021238125028378847, "loss": 0.0127, "step": 115780 }, { "epoch": 0.58, "learning_rate": 0.00021237368259077445, "loss": 0.0133, "step": 115790 }, { "epoch": 0.58, "learning_rate": 0.00021236611489776046, "loss": 0.0144, "step": 115800 }, { "epoch": 0.58, "learning_rate": 0.00021235854720474644, "loss": 0.0151, "step": 115810 }, { "epoch": 0.58, "learning_rate": 0.00021235097951173242, "loss": 0.0127, "step": 115820 }, { "epoch": 0.58, "learning_rate": 0.00021234341181871843, "loss": 0.0137, "step": 115830 }, { "epoch": 0.58, "learning_rate": 0.00021233584412570441, "loss": 0.0156, "step": 115840 }, { "epoch": 0.58, "learning_rate": 0.0002123282764326904, "loss": 0.0145, "step": 115850 }, { "epoch": 0.58, "learning_rate": 0.0002123207087396764, "loss": 0.0158, "step": 115860 }, { "epoch": 0.58, "learning_rate": 0.00021231314104666239, "loss": 0.013, "step": 115870 }, { "epoch": 0.58, "learning_rate": 0.00021230557335364837, "loss": 0.0139, "step": 115880 }, { "epoch": 0.58, "learning_rate": 0.00021229800566063438, "loss": 0.0112, "step": 115890 }, { "epoch": 0.58, "learning_rate": 0.00021229043796762036, "loss": 0.0131, "step": 115900 }, { "epoch": 0.58, "learning_rate": 0.00021228287027460634, "loss": 0.0131, "step": 115910 }, { "epoch": 0.58, "learning_rate": 0.00021227530258159232, "loss": 0.0189, "step": 115920 }, { "epoch": 0.58, "learning_rate": 0.00021226773488857833, "loss": 0.0137, "step": 115930 }, { "epoch": 0.58, "learning_rate": 0.0002122601671955643, "loss": 0.0137, "step": 115940 }, { "epoch": 0.58, "learning_rate": 0.0002122525995025503, "loss": 0.0169, "step": 115950 }, { "epoch": 0.59, "learning_rate": 0.0002122450318095363, "loss": 0.0187, "step": 115960 }, { "epoch": 0.59, "learning_rate": 0.00021223746411652228, "loss": 0.021, "step": 115970 }, { "epoch": 0.59, "learning_rate": 0.00021222989642350826, "loss": 0.0137, "step": 115980 }, { "epoch": 0.59, "learning_rate": 0.00021222232873049427, "loss": 0.0138, "step": 115990 }, { "epoch": 0.59, "learning_rate": 0.00021221476103748025, "loss": 0.016, "step": 116000 }, { "epoch": 0.59, "eval_cer": 0.9144634631302844, "eval_loss": 0.01081350538879633, "eval_runtime": 116.7675, "eval_samples_per_second": 17.128, "eval_steps_per_second": 4.282, "step": 116000 }, { "epoch": 0.59, "learning_rate": 0.00021220719334446623, "loss": 0.013, "step": 116010 }, { "epoch": 0.59, "learning_rate": 0.00021219962565145224, "loss": 0.0133, "step": 116020 }, { "epoch": 0.59, "learning_rate": 0.00021219205795843822, "loss": 0.0153, "step": 116030 }, { "epoch": 0.59, "learning_rate": 0.0002121844902654242, "loss": 0.0156, "step": 116040 }, { "epoch": 0.59, "learning_rate": 0.00021217692257241021, "loss": 0.0145, "step": 116050 }, { "epoch": 0.59, "learning_rate": 0.0002121693548793962, "loss": 0.024, "step": 116060 }, { "epoch": 0.59, "learning_rate": 0.00021216178718638218, "loss": 0.0143, "step": 116070 }, { "epoch": 0.59, "learning_rate": 0.00021215421949336819, "loss": 0.0164, "step": 116080 }, { "epoch": 0.59, "learning_rate": 0.00021214665180035417, "loss": 0.0155, "step": 116090 }, { "epoch": 0.59, "learning_rate": 0.00021213908410734015, "loss": 0.0149, "step": 116100 }, { "epoch": 0.59, "learning_rate": 0.00021213151641432613, "loss": 0.0143, "step": 116110 }, { "epoch": 0.59, "learning_rate": 0.00021212394872131214, "loss": 0.0126, "step": 116120 }, { "epoch": 0.59, "learning_rate": 0.00021211638102829812, "loss": 0.0152, "step": 116130 }, { "epoch": 0.59, "learning_rate": 0.0002121088133352841, "loss": 0.0147, "step": 116140 }, { "epoch": 0.59, "learning_rate": 0.0002121012456422701, "loss": 0.0129, "step": 116150 }, { "epoch": 0.59, "learning_rate": 0.0002120936779492561, "loss": 0.0127, "step": 116160 }, { "epoch": 0.59, "learning_rate": 0.00021208611025624207, "loss": 0.015, "step": 116170 }, { "epoch": 0.59, "learning_rate": 0.00021207854256322808, "loss": 0.0169, "step": 116180 }, { "epoch": 0.59, "learning_rate": 0.00021207097487021406, "loss": 0.0161, "step": 116190 }, { "epoch": 0.59, "learning_rate": 0.00021206340717720004, "loss": 0.0145, "step": 116200 }, { "epoch": 0.59, "learning_rate": 0.00021205583948418605, "loss": 0.0162, "step": 116210 }, { "epoch": 0.59, "learning_rate": 0.00021204827179117203, "loss": 0.0171, "step": 116220 }, { "epoch": 0.59, "learning_rate": 0.00021204070409815802, "loss": 0.0155, "step": 116230 }, { "epoch": 0.59, "learning_rate": 0.00021203313640514402, "loss": 0.0171, "step": 116240 }, { "epoch": 0.59, "learning_rate": 0.00021202556871213, "loss": 0.0133, "step": 116250 }, { "epoch": 0.59, "learning_rate": 0.000212018001019116, "loss": 0.0139, "step": 116260 }, { "epoch": 0.59, "learning_rate": 0.00021201043332610194, "loss": 0.0144, "step": 116270 }, { "epoch": 0.59, "learning_rate": 0.00021200286563308795, "loss": 0.0149, "step": 116280 }, { "epoch": 0.59, "learning_rate": 0.00021199529794007393, "loss": 0.013, "step": 116290 }, { "epoch": 0.59, "learning_rate": 0.0002119877302470599, "loss": 0.0139, "step": 116300 }, { "epoch": 0.59, "learning_rate": 0.0002119801625540459, "loss": 0.0122, "step": 116310 }, { "epoch": 0.59, "learning_rate": 0.0002119725948610319, "loss": 0.0149, "step": 116320 }, { "epoch": 0.59, "learning_rate": 0.00021196502716801788, "loss": 0.015, "step": 116330 }, { "epoch": 0.59, "learning_rate": 0.00021195745947500387, "loss": 0.014, "step": 116340 }, { "epoch": 0.59, "learning_rate": 0.00021194989178198987, "loss": 0.0161, "step": 116350 }, { "epoch": 0.59, "learning_rate": 0.00021194232408897586, "loss": 0.0161, "step": 116360 }, { "epoch": 0.59, "learning_rate": 0.00021193475639596184, "loss": 0.0153, "step": 116370 }, { "epoch": 0.59, "learning_rate": 0.00021192718870294785, "loss": 0.0137, "step": 116380 }, { "epoch": 0.59, "learning_rate": 0.00021191962100993383, "loss": 0.0154, "step": 116390 }, { "epoch": 0.59, "learning_rate": 0.0002119120533169198, "loss": 0.0126, "step": 116400 }, { "epoch": 0.59, "learning_rate": 0.00021190448562390582, "loss": 0.014, "step": 116410 }, { "epoch": 0.59, "learning_rate": 0.0002118969179308918, "loss": 0.0166, "step": 116420 }, { "epoch": 0.59, "learning_rate": 0.00021188935023787778, "loss": 0.0128, "step": 116430 }, { "epoch": 0.59, "learning_rate": 0.0002118817825448638, "loss": 0.0144, "step": 116440 }, { "epoch": 0.59, "learning_rate": 0.00021187421485184977, "loss": 0.0169, "step": 116450 }, { "epoch": 0.59, "learning_rate": 0.00021186664715883575, "loss": 0.0134, "step": 116460 }, { "epoch": 0.59, "learning_rate": 0.00021185907946582176, "loss": 0.0123, "step": 116470 }, { "epoch": 0.59, "learning_rate": 0.00021185151177280774, "loss": 0.0149, "step": 116480 }, { "epoch": 0.59, "learning_rate": 0.00021184394407979372, "loss": 0.0131, "step": 116490 }, { "epoch": 0.59, "learning_rate": 0.0002118363763867797, "loss": 0.0142, "step": 116500 }, { "epoch": 0.59, "learning_rate": 0.0002118288086937657, "loss": 0.015, "step": 116510 }, { "epoch": 0.59, "learning_rate": 0.0002118212410007517, "loss": 0.0177, "step": 116520 }, { "epoch": 0.59, "learning_rate": 0.00021181367330773768, "loss": 0.0133, "step": 116530 }, { "epoch": 0.59, "learning_rate": 0.00021180610561472368, "loss": 0.0179, "step": 116540 }, { "epoch": 0.59, "learning_rate": 0.00021179853792170967, "loss": 0.0136, "step": 116550 }, { "epoch": 0.59, "learning_rate": 0.00021179097022869565, "loss": 0.0138, "step": 116560 }, { "epoch": 0.59, "learning_rate": 0.00021178340253568166, "loss": 0.0141, "step": 116570 }, { "epoch": 0.59, "learning_rate": 0.00021177583484266764, "loss": 0.0142, "step": 116580 }, { "epoch": 0.59, "learning_rate": 0.00021176826714965362, "loss": 0.013, "step": 116590 }, { "epoch": 0.59, "learning_rate": 0.00021176069945663963, "loss": 0.0142, "step": 116600 }, { "epoch": 0.59, "learning_rate": 0.0002117531317636256, "loss": 0.0128, "step": 116610 }, { "epoch": 0.59, "learning_rate": 0.0002117455640706116, "loss": 0.0121, "step": 116620 }, { "epoch": 0.59, "learning_rate": 0.0002117379963775976, "loss": 0.0155, "step": 116630 }, { "epoch": 0.59, "learning_rate": 0.00021173042868458358, "loss": 0.014, "step": 116640 }, { "epoch": 0.59, "learning_rate": 0.00021172286099156956, "loss": 0.0132, "step": 116650 }, { "epoch": 0.59, "learning_rate": 0.00021171529329855554, "loss": 0.0128, "step": 116660 }, { "epoch": 0.59, "learning_rate": 0.00021170772560554155, "loss": 0.0166, "step": 116670 }, { "epoch": 0.59, "learning_rate": 0.00021170015791252753, "loss": 0.0124, "step": 116680 }, { "epoch": 0.59, "learning_rate": 0.00021169259021951351, "loss": 0.0136, "step": 116690 }, { "epoch": 0.59, "learning_rate": 0.00021168502252649952, "loss": 0.012, "step": 116700 }, { "epoch": 0.59, "learning_rate": 0.0002116774548334855, "loss": 0.0143, "step": 116710 }, { "epoch": 0.59, "learning_rate": 0.00021166988714047149, "loss": 0.0139, "step": 116720 }, { "epoch": 0.59, "learning_rate": 0.0002116623194474575, "loss": 0.014, "step": 116730 }, { "epoch": 0.59, "learning_rate": 0.00021165475175444348, "loss": 0.0128, "step": 116740 }, { "epoch": 0.59, "learning_rate": 0.00021164718406142946, "loss": 0.0136, "step": 116750 }, { "epoch": 0.59, "learning_rate": 0.00021163961636841547, "loss": 0.0155, "step": 116760 }, { "epoch": 0.59, "learning_rate": 0.00021163204867540145, "loss": 0.0214, "step": 116770 }, { "epoch": 0.59, "learning_rate": 0.00021162448098238743, "loss": 0.013, "step": 116780 }, { "epoch": 0.59, "learning_rate": 0.00021161691328937344, "loss": 0.016, "step": 116790 }, { "epoch": 0.59, "learning_rate": 0.00021160934559635942, "loss": 0.0156, "step": 116800 }, { "epoch": 0.59, "learning_rate": 0.0002116017779033454, "loss": 0.0171, "step": 116810 }, { "epoch": 0.59, "learning_rate": 0.00021159421021033138, "loss": 0.0151, "step": 116820 }, { "epoch": 0.59, "learning_rate": 0.0002115866425173174, "loss": 0.013, "step": 116830 }, { "epoch": 0.59, "learning_rate": 0.00021157907482430337, "loss": 0.0132, "step": 116840 }, { "epoch": 0.59, "learning_rate": 0.00021157150713128935, "loss": 0.0106, "step": 116850 }, { "epoch": 0.59, "learning_rate": 0.00021156393943827536, "loss": 0.014, "step": 116860 }, { "epoch": 0.59, "learning_rate": 0.00021155637174526134, "loss": 0.0123, "step": 116870 }, { "epoch": 0.59, "learning_rate": 0.00021154880405224732, "loss": 0.0143, "step": 116880 }, { "epoch": 0.59, "learning_rate": 0.00021154123635923333, "loss": 0.0156, "step": 116890 }, { "epoch": 0.59, "learning_rate": 0.00021153366866621931, "loss": 0.0136, "step": 116900 }, { "epoch": 0.59, "learning_rate": 0.0002115261009732053, "loss": 0.0118, "step": 116910 }, { "epoch": 0.59, "learning_rate": 0.0002115185332801913, "loss": 0.0154, "step": 116920 }, { "epoch": 0.59, "learning_rate": 0.00021151096558717729, "loss": 0.0148, "step": 116930 }, { "epoch": 0.59, "learning_rate": 0.00021150339789416327, "loss": 0.0103, "step": 116940 }, { "epoch": 0.59, "learning_rate": 0.00021149583020114928, "loss": 0.0173, "step": 116950 }, { "epoch": 0.59, "learning_rate": 0.00021148826250813526, "loss": 0.0185, "step": 116960 }, { "epoch": 0.59, "learning_rate": 0.00021148069481512124, "loss": 0.0136, "step": 116970 }, { "epoch": 0.59, "learning_rate": 0.00021147312712210725, "loss": 0.017, "step": 116980 }, { "epoch": 0.59, "learning_rate": 0.00021146555942909323, "loss": 0.0213, "step": 116990 }, { "epoch": 0.59, "learning_rate": 0.0002114579917360792, "loss": 0.0164, "step": 117000 }, { "epoch": 0.59, "eval_cer": 0.9145207165016832, "eval_loss": 0.01061397697776556, "eval_runtime": 116.746, "eval_samples_per_second": 17.131, "eval_steps_per_second": 4.283, "step": 117000 }, { "epoch": 0.59, "learning_rate": 0.0002114504240430652, "loss": 0.0129, "step": 117010 }, { "epoch": 0.59, "learning_rate": 0.0002114428563500512, "loss": 0.0133, "step": 117020 }, { "epoch": 0.59, "learning_rate": 0.00021143528865703718, "loss": 0.0135, "step": 117030 }, { "epoch": 0.59, "learning_rate": 0.00021142772096402316, "loss": 0.0175, "step": 117040 }, { "epoch": 0.59, "learning_rate": 0.00021142015327100917, "loss": 0.0157, "step": 117050 }, { "epoch": 0.59, "learning_rate": 0.00021141258557799515, "loss": 0.0138, "step": 117060 }, { "epoch": 0.59, "learning_rate": 0.00021140501788498113, "loss": 0.0155, "step": 117070 }, { "epoch": 0.59, "learning_rate": 0.00021139745019196714, "loss": 0.0141, "step": 117080 }, { "epoch": 0.59, "learning_rate": 0.00021138988249895312, "loss": 0.0133, "step": 117090 }, { "epoch": 0.59, "learning_rate": 0.0002113823148059391, "loss": 0.0151, "step": 117100 }, { "epoch": 0.59, "learning_rate": 0.00021137474711292511, "loss": 0.0157, "step": 117110 }, { "epoch": 0.59, "learning_rate": 0.0002113671794199111, "loss": 0.0164, "step": 117120 }, { "epoch": 0.59, "learning_rate": 0.00021135961172689708, "loss": 0.016, "step": 117130 }, { "epoch": 0.59, "learning_rate": 0.00021135204403388309, "loss": 0.0148, "step": 117140 }, { "epoch": 0.59, "learning_rate": 0.00021134447634086907, "loss": 0.0135, "step": 117150 }, { "epoch": 0.59, "learning_rate": 0.00021133690864785505, "loss": 0.0131, "step": 117160 }, { "epoch": 0.59, "learning_rate": 0.00021132934095484103, "loss": 0.0162, "step": 117170 }, { "epoch": 0.59, "learning_rate": 0.00021132177326182704, "loss": 0.0168, "step": 117180 }, { "epoch": 0.59, "learning_rate": 0.00021131420556881302, "loss": 0.0176, "step": 117190 }, { "epoch": 0.59, "learning_rate": 0.000211306637875799, "loss": 0.0166, "step": 117200 }, { "epoch": 0.59, "learning_rate": 0.000211299070182785, "loss": 0.0153, "step": 117210 }, { "epoch": 0.59, "learning_rate": 0.000211291502489771, "loss": 0.0149, "step": 117220 }, { "epoch": 0.59, "learning_rate": 0.00021128393479675697, "loss": 0.0152, "step": 117230 }, { "epoch": 0.59, "learning_rate": 0.00021127636710374298, "loss": 0.0146, "step": 117240 }, { "epoch": 0.59, "learning_rate": 0.00021126879941072896, "loss": 0.0129, "step": 117250 }, { "epoch": 0.59, "learning_rate": 0.00021126123171771494, "loss": 0.0137, "step": 117260 }, { "epoch": 0.59, "learning_rate": 0.00021125366402470095, "loss": 0.013, "step": 117270 }, { "epoch": 0.59, "learning_rate": 0.00021124609633168693, "loss": 0.0134, "step": 117280 }, { "epoch": 0.59, "learning_rate": 0.00021123852863867292, "loss": 0.0115, "step": 117290 }, { "epoch": 0.59, "learning_rate": 0.00021123096094565892, "loss": 0.0174, "step": 117300 }, { "epoch": 0.59, "learning_rate": 0.0002112233932526449, "loss": 0.0155, "step": 117310 }, { "epoch": 0.59, "learning_rate": 0.0002112158255596309, "loss": 0.0114, "step": 117320 }, { "epoch": 0.59, "learning_rate": 0.00021120825786661687, "loss": 0.0146, "step": 117330 }, { "epoch": 0.59, "learning_rate": 0.00021120069017360288, "loss": 0.0154, "step": 117340 }, { "epoch": 0.59, "learning_rate": 0.00021119312248058886, "loss": 0.0151, "step": 117350 }, { "epoch": 0.59, "learning_rate": 0.00021118555478757484, "loss": 0.0113, "step": 117360 }, { "epoch": 0.59, "learning_rate": 0.00021117798709456085, "loss": 0.0131, "step": 117370 }, { "epoch": 0.59, "learning_rate": 0.00021117041940154683, "loss": 0.0129, "step": 117380 }, { "epoch": 0.59, "learning_rate": 0.0002111628517085328, "loss": 0.0139, "step": 117390 }, { "epoch": 0.59, "learning_rate": 0.00021115528401551882, "loss": 0.0163, "step": 117400 }, { "epoch": 0.59, "learning_rate": 0.0002111477163225048, "loss": 0.016, "step": 117410 }, { "epoch": 0.59, "learning_rate": 0.00021114014862949078, "loss": 0.018, "step": 117420 }, { "epoch": 0.59, "learning_rate": 0.0002111325809364768, "loss": 0.0146, "step": 117430 }, { "epoch": 0.59, "learning_rate": 0.00021112501324346277, "loss": 0.0153, "step": 117440 }, { "epoch": 0.59, "learning_rate": 0.00021111744555044875, "loss": 0.0147, "step": 117450 }, { "epoch": 0.59, "learning_rate": 0.00021110987785743476, "loss": 0.0149, "step": 117460 }, { "epoch": 0.59, "learning_rate": 0.00021110231016442074, "loss": 0.0228, "step": 117470 }, { "epoch": 0.59, "learning_rate": 0.00021109474247140673, "loss": 0.0154, "step": 117480 }, { "epoch": 0.59, "learning_rate": 0.0002110871747783927, "loss": 0.0123, "step": 117490 }, { "epoch": 0.59, "learning_rate": 0.00021107960708537872, "loss": 0.0124, "step": 117500 }, { "epoch": 0.59, "learning_rate": 0.0002110720393923647, "loss": 0.0125, "step": 117510 }, { "epoch": 0.59, "learning_rate": 0.00021106447169935065, "loss": 0.0151, "step": 117520 }, { "epoch": 0.59, "learning_rate": 0.00021105690400633666, "loss": 0.0168, "step": 117530 }, { "epoch": 0.59, "learning_rate": 0.00021104933631332264, "loss": 0.0157, "step": 117540 }, { "epoch": 0.59, "learning_rate": 0.00021104176862030862, "loss": 0.0147, "step": 117550 }, { "epoch": 0.59, "learning_rate": 0.0002110342009272946, "loss": 0.0121, "step": 117560 }, { "epoch": 0.59, "learning_rate": 0.0002110266332342806, "loss": 0.0139, "step": 117570 }, { "epoch": 0.59, "learning_rate": 0.0002110190655412666, "loss": 0.0167, "step": 117580 }, { "epoch": 0.59, "learning_rate": 0.00021101149784825258, "loss": 0.0138, "step": 117590 }, { "epoch": 0.59, "learning_rate": 0.00021100393015523858, "loss": 0.0147, "step": 117600 }, { "epoch": 0.59, "learning_rate": 0.00021099636246222457, "loss": 0.0164, "step": 117610 }, { "epoch": 0.59, "learning_rate": 0.00021098879476921055, "loss": 0.0148, "step": 117620 }, { "epoch": 0.59, "learning_rate": 0.00021098122707619656, "loss": 0.0139, "step": 117630 }, { "epoch": 0.59, "learning_rate": 0.00021097365938318254, "loss": 0.0129, "step": 117640 }, { "epoch": 0.59, "learning_rate": 0.00021096609169016852, "loss": 0.0179, "step": 117650 }, { "epoch": 0.59, "learning_rate": 0.00021095852399715453, "loss": 0.0141, "step": 117660 }, { "epoch": 0.59, "learning_rate": 0.0002109509563041405, "loss": 0.0157, "step": 117670 }, { "epoch": 0.59, "learning_rate": 0.0002109433886111265, "loss": 0.0187, "step": 117680 }, { "epoch": 0.59, "learning_rate": 0.0002109358209181125, "loss": 0.012, "step": 117690 }, { "epoch": 0.59, "learning_rate": 0.00021092825322509848, "loss": 0.0166, "step": 117700 }, { "epoch": 0.59, "learning_rate": 0.00021092068553208446, "loss": 0.0137, "step": 117710 }, { "epoch": 0.59, "learning_rate": 0.00021091311783907044, "loss": 0.0173, "step": 117720 }, { "epoch": 0.59, "learning_rate": 0.00021090555014605645, "loss": 0.0204, "step": 117730 }, { "epoch": 0.59, "learning_rate": 0.00021089798245304243, "loss": 0.0173, "step": 117740 }, { "epoch": 0.59, "learning_rate": 0.00021089041476002841, "loss": 0.0138, "step": 117750 }, { "epoch": 0.59, "learning_rate": 0.00021088284706701442, "loss": 0.0163, "step": 117760 }, { "epoch": 0.59, "learning_rate": 0.0002108752793740004, "loss": 0.0114, "step": 117770 }, { "epoch": 0.59, "learning_rate": 0.00021086771168098639, "loss": 0.0162, "step": 117780 }, { "epoch": 0.59, "learning_rate": 0.0002108601439879724, "loss": 0.0134, "step": 117790 }, { "epoch": 0.59, "learning_rate": 0.00021085257629495838, "loss": 0.0261, "step": 117800 }, { "epoch": 0.59, "learning_rate": 0.00021084500860194436, "loss": 0.0144, "step": 117810 }, { "epoch": 0.59, "learning_rate": 0.00021083744090893037, "loss": 0.0159, "step": 117820 }, { "epoch": 0.59, "learning_rate": 0.00021082987321591635, "loss": 0.0143, "step": 117830 }, { "epoch": 0.59, "learning_rate": 0.00021082230552290233, "loss": 0.0158, "step": 117840 }, { "epoch": 0.59, "learning_rate": 0.00021081473782988834, "loss": 0.018, "step": 117850 }, { "epoch": 0.59, "learning_rate": 0.00021080717013687432, "loss": 0.0162, "step": 117860 }, { "epoch": 0.59, "learning_rate": 0.0002107996024438603, "loss": 0.0135, "step": 117870 }, { "epoch": 0.59, "learning_rate": 0.00021079203475084628, "loss": 0.0147, "step": 117880 }, { "epoch": 0.59, "learning_rate": 0.0002107844670578323, "loss": 0.0208, "step": 117890 }, { "epoch": 0.59, "learning_rate": 0.00021077689936481827, "loss": 0.0149, "step": 117900 }, { "epoch": 0.59, "learning_rate": 0.00021076933167180425, "loss": 0.0127, "step": 117910 }, { "epoch": 0.59, "learning_rate": 0.00021076176397879026, "loss": 0.0122, "step": 117920 }, { "epoch": 0.59, "learning_rate": 0.00021075419628577624, "loss": 0.0154, "step": 117930 }, { "epoch": 0.6, "learning_rate": 0.00021074662859276222, "loss": 0.0141, "step": 117940 }, { "epoch": 0.6, "learning_rate": 0.00021073906089974823, "loss": 0.0142, "step": 117950 }, { "epoch": 0.6, "learning_rate": 0.00021073149320673421, "loss": 0.0141, "step": 117960 }, { "epoch": 0.6, "learning_rate": 0.0002107239255137202, "loss": 0.0135, "step": 117970 }, { "epoch": 0.6, "learning_rate": 0.0002107163578207062, "loss": 0.0156, "step": 117980 }, { "epoch": 0.6, "learning_rate": 0.00021070879012769219, "loss": 0.0186, "step": 117990 }, { "epoch": 0.6, "learning_rate": 0.00021070122243467817, "loss": 0.0162, "step": 118000 }, { "epoch": 0.6, "eval_cer": 0.9144702559031622, "eval_loss": 0.011005792766809464, "eval_runtime": 116.812, "eval_samples_per_second": 17.122, "eval_steps_per_second": 4.28, "step": 118000 }, { "epoch": 0.6, "learning_rate": 0.00021069365474166418, "loss": 0.0166, "step": 118010 }, { "epoch": 0.6, "learning_rate": 0.00021068608704865016, "loss": 0.018, "step": 118020 }, { "epoch": 0.6, "learning_rate": 0.00021067851935563614, "loss": 0.0176, "step": 118030 }, { "epoch": 0.6, "learning_rate": 0.00021067095166262215, "loss": 0.015, "step": 118040 }, { "epoch": 0.6, "learning_rate": 0.00021066338396960813, "loss": 0.0209, "step": 118050 }, { "epoch": 0.6, "learning_rate": 0.0002106558162765941, "loss": 0.0169, "step": 118060 }, { "epoch": 0.6, "learning_rate": 0.0002106482485835801, "loss": 0.0283, "step": 118070 }, { "epoch": 0.6, "learning_rate": 0.0002106406808905661, "loss": 0.0113, "step": 118080 }, { "epoch": 0.6, "learning_rate": 0.00021063311319755208, "loss": 0.0216, "step": 118090 }, { "epoch": 0.6, "learning_rate": 0.00021062554550453806, "loss": 0.0129, "step": 118100 }, { "epoch": 0.6, "learning_rate": 0.00021061797781152407, "loss": 0.0196, "step": 118110 }, { "epoch": 0.6, "learning_rate": 0.00021061041011851005, "loss": 0.0197, "step": 118120 }, { "epoch": 0.6, "learning_rate": 0.00021060284242549603, "loss": 0.0173, "step": 118130 }, { "epoch": 0.6, "learning_rate": 0.00021059527473248204, "loss": 0.015, "step": 118140 }, { "epoch": 0.6, "learning_rate": 0.00021058770703946802, "loss": 0.0151, "step": 118150 }, { "epoch": 0.6, "learning_rate": 0.000210580139346454, "loss": 0.0157, "step": 118160 }, { "epoch": 0.6, "learning_rate": 0.00021057257165344001, "loss": 0.0123, "step": 118170 }, { "epoch": 0.6, "learning_rate": 0.000210565003960426, "loss": 0.0149, "step": 118180 }, { "epoch": 0.6, "learning_rate": 0.00021055743626741198, "loss": 0.0152, "step": 118190 }, { "epoch": 0.6, "learning_rate": 0.00021054986857439799, "loss": 0.0126, "step": 118200 }, { "epoch": 0.6, "learning_rate": 0.00021054230088138397, "loss": 0.0138, "step": 118210 }, { "epoch": 0.6, "learning_rate": 0.00021053473318836995, "loss": 0.0186, "step": 118220 }, { "epoch": 0.6, "learning_rate": 0.00021052716549535593, "loss": 0.0178, "step": 118230 }, { "epoch": 0.6, "learning_rate": 0.00021051959780234194, "loss": 0.0149, "step": 118240 }, { "epoch": 0.6, "learning_rate": 0.00021051203010932792, "loss": 0.0153, "step": 118250 }, { "epoch": 0.6, "learning_rate": 0.0002105044624163139, "loss": 0.0157, "step": 118260 }, { "epoch": 0.6, "learning_rate": 0.0002104968947232999, "loss": 0.0161, "step": 118270 }, { "epoch": 0.6, "learning_rate": 0.0002104893270302859, "loss": 0.0169, "step": 118280 }, { "epoch": 0.6, "learning_rate": 0.00021048175933727187, "loss": 0.0169, "step": 118290 }, { "epoch": 0.6, "learning_rate": 0.00021047419164425788, "loss": 0.0122, "step": 118300 }, { "epoch": 0.6, "learning_rate": 0.00021046662395124386, "loss": 0.0108, "step": 118310 }, { "epoch": 0.6, "learning_rate": 0.00021045905625822984, "loss": 0.0183, "step": 118320 }, { "epoch": 0.6, "learning_rate": 0.00021045148856521585, "loss": 0.0128, "step": 118330 }, { "epoch": 0.6, "learning_rate": 0.00021044392087220183, "loss": 0.0144, "step": 118340 }, { "epoch": 0.6, "learning_rate": 0.00021043635317918782, "loss": 0.0143, "step": 118350 }, { "epoch": 0.6, "learning_rate": 0.00021042878548617382, "loss": 0.0145, "step": 118360 }, { "epoch": 0.6, "learning_rate": 0.0002104212177931598, "loss": 0.0146, "step": 118370 }, { "epoch": 0.6, "learning_rate": 0.0002104136501001458, "loss": 0.014, "step": 118380 }, { "epoch": 0.6, "learning_rate": 0.00021040608240713177, "loss": 0.0197, "step": 118390 }, { "epoch": 0.6, "learning_rate": 0.00021039851471411778, "loss": 0.014, "step": 118400 }, { "epoch": 0.6, "learning_rate": 0.00021039094702110376, "loss": 0.0142, "step": 118410 }, { "epoch": 0.6, "learning_rate": 0.00021038337932808974, "loss": 0.0147, "step": 118420 }, { "epoch": 0.6, "learning_rate": 0.00021037581163507575, "loss": 0.0132, "step": 118430 }, { "epoch": 0.6, "learning_rate": 0.00021036824394206173, "loss": 0.0125, "step": 118440 }, { "epoch": 0.6, "learning_rate": 0.0002103606762490477, "loss": 0.0166, "step": 118450 }, { "epoch": 0.6, "learning_rate": 0.00021035310855603372, "loss": 0.0163, "step": 118460 }, { "epoch": 0.6, "learning_rate": 0.0002103455408630197, "loss": 0.0156, "step": 118470 }, { "epoch": 0.6, "learning_rate": 0.00021033797317000568, "loss": 0.0151, "step": 118480 }, { "epoch": 0.6, "learning_rate": 0.0002103304054769917, "loss": 0.0129, "step": 118490 }, { "epoch": 0.6, "learning_rate": 0.00021032283778397767, "loss": 0.0152, "step": 118500 }, { "epoch": 0.6, "learning_rate": 0.00021031527009096365, "loss": 0.0148, "step": 118510 }, { "epoch": 0.6, "learning_rate": 0.00021030770239794966, "loss": 0.0142, "step": 118520 }, { "epoch": 0.6, "learning_rate": 0.00021030013470493564, "loss": 0.013, "step": 118530 }, { "epoch": 0.6, "learning_rate": 0.00021029256701192163, "loss": 0.018, "step": 118540 }, { "epoch": 0.6, "learning_rate": 0.00021028499931890763, "loss": 0.0146, "step": 118550 }, { "epoch": 0.6, "learning_rate": 0.00021027743162589362, "loss": 0.0125, "step": 118560 }, { "epoch": 0.6, "learning_rate": 0.0002102698639328796, "loss": 0.0145, "step": 118570 }, { "epoch": 0.6, "learning_rate": 0.00021026229623986558, "loss": 0.0133, "step": 118580 }, { "epoch": 0.6, "learning_rate": 0.0002102547285468516, "loss": 0.0145, "step": 118590 }, { "epoch": 0.6, "learning_rate": 0.00021024716085383757, "loss": 0.0142, "step": 118600 }, { "epoch": 0.6, "learning_rate": 0.00021023959316082355, "loss": 0.0131, "step": 118610 }, { "epoch": 0.6, "learning_rate": 0.00021023202546780956, "loss": 0.0132, "step": 118620 }, { "epoch": 0.6, "learning_rate": 0.00021022445777479554, "loss": 0.0149, "step": 118630 }, { "epoch": 0.6, "learning_rate": 0.00021021689008178152, "loss": 0.0152, "step": 118640 }, { "epoch": 0.6, "learning_rate": 0.00021020932238876753, "loss": 0.0163, "step": 118650 }, { "epoch": 0.6, "learning_rate": 0.0002102017546957535, "loss": 0.016, "step": 118660 }, { "epoch": 0.6, "learning_rate": 0.0002101941870027395, "loss": 0.016, "step": 118670 }, { "epoch": 0.6, "learning_rate": 0.0002101866193097255, "loss": 0.0181, "step": 118680 }, { "epoch": 0.6, "learning_rate": 0.00021017905161671148, "loss": 0.0159, "step": 118690 }, { "epoch": 0.6, "learning_rate": 0.00021017148392369746, "loss": 0.0128, "step": 118700 }, { "epoch": 0.6, "learning_rate": 0.00021016391623068347, "loss": 0.0137, "step": 118710 }, { "epoch": 0.6, "learning_rate": 0.00021015634853766945, "loss": 0.0132, "step": 118720 }, { "epoch": 0.6, "learning_rate": 0.00021014878084465544, "loss": 0.0165, "step": 118730 }, { "epoch": 0.6, "learning_rate": 0.00021014121315164142, "loss": 0.0123, "step": 118740 }, { "epoch": 0.6, "learning_rate": 0.00021013364545862743, "loss": 0.0131, "step": 118750 }, { "epoch": 0.6, "learning_rate": 0.0002101260777656134, "loss": 0.0165, "step": 118760 }, { "epoch": 0.6, "learning_rate": 0.0002101185100725994, "loss": 0.0175, "step": 118770 }, { "epoch": 0.6, "learning_rate": 0.00021011094237958534, "loss": 0.0118, "step": 118780 }, { "epoch": 0.6, "learning_rate": 0.00021010337468657135, "loss": 0.013, "step": 118790 }, { "epoch": 0.6, "learning_rate": 0.00021009580699355733, "loss": 0.0152, "step": 118800 }, { "epoch": 0.6, "learning_rate": 0.00021008823930054331, "loss": 0.0146, "step": 118810 }, { "epoch": 0.6, "learning_rate": 0.00021008067160752932, "loss": 0.0164, "step": 118820 }, { "epoch": 0.6, "learning_rate": 0.0002100731039145153, "loss": 0.0172, "step": 118830 }, { "epoch": 0.6, "learning_rate": 0.00021006553622150129, "loss": 0.0176, "step": 118840 }, { "epoch": 0.6, "learning_rate": 0.0002100579685284873, "loss": 0.0167, "step": 118850 }, { "epoch": 0.6, "learning_rate": 0.00021005040083547328, "loss": 0.0153, "step": 118860 }, { "epoch": 0.6, "learning_rate": 0.00021004283314245926, "loss": 0.0139, "step": 118870 }, { "epoch": 0.6, "learning_rate": 0.00021003526544944527, "loss": 0.0144, "step": 118880 }, { "epoch": 0.6, "learning_rate": 0.00021002769775643125, "loss": 0.0157, "step": 118890 }, { "epoch": 0.6, "learning_rate": 0.00021002013006341723, "loss": 0.0137, "step": 118900 }, { "epoch": 0.6, "learning_rate": 0.00021001256237040324, "loss": 0.0106, "step": 118910 }, { "epoch": 0.6, "learning_rate": 0.00021000499467738922, "loss": 0.0191, "step": 118920 }, { "epoch": 0.6, "learning_rate": 0.0002099974269843752, "loss": 0.0199, "step": 118930 }, { "epoch": 0.6, "learning_rate": 0.0002099898592913612, "loss": 0.0165, "step": 118940 }, { "epoch": 0.6, "learning_rate": 0.0002099822915983472, "loss": 0.017, "step": 118950 }, { "epoch": 0.6, "learning_rate": 0.00020997472390533317, "loss": 0.0181, "step": 118960 }, { "epoch": 0.6, "learning_rate": 0.00020996715621231915, "loss": 0.016, "step": 118970 }, { "epoch": 0.6, "learning_rate": 0.00020995958851930516, "loss": 0.0137, "step": 118980 }, { "epoch": 0.6, "learning_rate": 0.00020995202082629114, "loss": 0.0158, "step": 118990 }, { "epoch": 0.6, "learning_rate": 0.00020994445313327712, "loss": 0.0123, "step": 119000 }, { "epoch": 0.6, "eval_cer": 0.9144935454101719, "eval_loss": 0.010422189719974995, "eval_runtime": 116.7072, "eval_samples_per_second": 17.137, "eval_steps_per_second": 4.284, "step": 119000 }, { "epoch": 0.6, "learning_rate": 0.00020993688544026313, "loss": 0.0139, "step": 119010 }, { "epoch": 0.6, "learning_rate": 0.00020992931774724911, "loss": 0.0162, "step": 119020 }, { "epoch": 0.6, "learning_rate": 0.0002099217500542351, "loss": 0.016, "step": 119030 }, { "epoch": 0.6, "learning_rate": 0.0002099141823612211, "loss": 0.0134, "step": 119040 }, { "epoch": 0.6, "learning_rate": 0.00020990661466820709, "loss": 0.0138, "step": 119050 }, { "epoch": 0.6, "learning_rate": 0.00020989904697519307, "loss": 0.0166, "step": 119060 }, { "epoch": 0.6, "learning_rate": 0.00020989147928217908, "loss": 0.0143, "step": 119070 }, { "epoch": 0.6, "learning_rate": 0.00020988391158916506, "loss": 0.0137, "step": 119080 }, { "epoch": 0.6, "learning_rate": 0.00020987634389615104, "loss": 0.0136, "step": 119090 }, { "epoch": 0.6, "learning_rate": 0.00020986877620313705, "loss": 0.015, "step": 119100 }, { "epoch": 0.6, "learning_rate": 0.00020986120851012303, "loss": 0.012, "step": 119110 }, { "epoch": 0.6, "learning_rate": 0.000209853640817109, "loss": 0.0143, "step": 119120 }, { "epoch": 0.6, "learning_rate": 0.000209846073124095, "loss": 0.0157, "step": 119130 }, { "epoch": 0.6, "learning_rate": 0.000209838505431081, "loss": 0.0152, "step": 119140 }, { "epoch": 0.6, "learning_rate": 0.00020983093773806698, "loss": 0.0142, "step": 119150 }, { "epoch": 0.6, "learning_rate": 0.00020982337004505296, "loss": 0.0145, "step": 119160 }, { "epoch": 0.6, "learning_rate": 0.00020981580235203897, "loss": 0.0181, "step": 119170 }, { "epoch": 0.6, "learning_rate": 0.00020980823465902495, "loss": 0.0142, "step": 119180 }, { "epoch": 0.6, "learning_rate": 0.00020980066696601093, "loss": 0.014, "step": 119190 }, { "epoch": 0.6, "learning_rate": 0.00020979309927299694, "loss": 0.0137, "step": 119200 }, { "epoch": 0.6, "learning_rate": 0.00020978553157998292, "loss": 0.0153, "step": 119210 }, { "epoch": 0.6, "learning_rate": 0.0002097779638869689, "loss": 0.0161, "step": 119220 }, { "epoch": 0.6, "learning_rate": 0.00020977039619395491, "loss": 0.0139, "step": 119230 }, { "epoch": 0.6, "learning_rate": 0.0002097628285009409, "loss": 0.0143, "step": 119240 }, { "epoch": 0.6, "learning_rate": 0.00020975526080792688, "loss": 0.0138, "step": 119250 }, { "epoch": 0.6, "learning_rate": 0.00020974769311491289, "loss": 0.0141, "step": 119260 }, { "epoch": 0.6, "learning_rate": 0.00020974012542189887, "loss": 0.0148, "step": 119270 }, { "epoch": 0.6, "learning_rate": 0.00020973255772888485, "loss": 0.013, "step": 119280 }, { "epoch": 0.6, "learning_rate": 0.00020972499003587083, "loss": 0.0177, "step": 119290 }, { "epoch": 0.6, "learning_rate": 0.00020971742234285684, "loss": 0.015, "step": 119300 }, { "epoch": 0.6, "learning_rate": 0.00020970985464984282, "loss": 0.0168, "step": 119310 }, { "epoch": 0.6, "learning_rate": 0.0002097022869568288, "loss": 0.0153, "step": 119320 }, { "epoch": 0.6, "learning_rate": 0.0002096947192638148, "loss": 0.0144, "step": 119330 }, { "epoch": 0.6, "learning_rate": 0.0002096871515708008, "loss": 0.0113, "step": 119340 }, { "epoch": 0.6, "learning_rate": 0.00020967958387778677, "loss": 0.0135, "step": 119350 }, { "epoch": 0.6, "learning_rate": 0.00020967201618477278, "loss": 0.0132, "step": 119360 }, { "epoch": 0.6, "learning_rate": 0.00020966444849175876, "loss": 0.0178, "step": 119370 }, { "epoch": 0.6, "learning_rate": 0.00020965688079874474, "loss": 0.0146, "step": 119380 }, { "epoch": 0.6, "learning_rate": 0.00020964931310573075, "loss": 0.0147, "step": 119390 }, { "epoch": 0.6, "learning_rate": 0.00020964174541271673, "loss": 0.0146, "step": 119400 }, { "epoch": 0.6, "learning_rate": 0.00020963417771970272, "loss": 0.013, "step": 119410 }, { "epoch": 0.6, "learning_rate": 0.00020962661002668872, "loss": 0.0134, "step": 119420 }, { "epoch": 0.6, "learning_rate": 0.0002096190423336747, "loss": 0.0145, "step": 119430 }, { "epoch": 0.6, "learning_rate": 0.0002096114746406607, "loss": 0.0144, "step": 119440 }, { "epoch": 0.6, "learning_rate": 0.0002096039069476467, "loss": 0.0127, "step": 119450 }, { "epoch": 0.6, "learning_rate": 0.00020959633925463268, "loss": 0.0136, "step": 119460 }, { "epoch": 0.6, "learning_rate": 0.00020958877156161866, "loss": 0.0143, "step": 119470 }, { "epoch": 0.6, "learning_rate": 0.00020958120386860464, "loss": 0.0137, "step": 119480 }, { "epoch": 0.6, "learning_rate": 0.00020957363617559065, "loss": 0.0142, "step": 119490 }, { "epoch": 0.6, "learning_rate": 0.00020956606848257663, "loss": 0.0145, "step": 119500 }, { "epoch": 0.6, "learning_rate": 0.0002095585007895626, "loss": 0.0122, "step": 119510 }, { "epoch": 0.6, "learning_rate": 0.00020955093309654862, "loss": 0.011, "step": 119520 }, { "epoch": 0.6, "learning_rate": 0.0002095433654035346, "loss": 0.0145, "step": 119530 }, { "epoch": 0.6, "learning_rate": 0.00020953579771052058, "loss": 0.0115, "step": 119540 }, { "epoch": 0.6, "learning_rate": 0.0002095282300175066, "loss": 0.0141, "step": 119550 }, { "epoch": 0.6, "learning_rate": 0.00020952066232449257, "loss": 0.013, "step": 119560 }, { "epoch": 0.6, "learning_rate": 0.00020951309463147855, "loss": 0.0167, "step": 119570 }, { "epoch": 0.6, "learning_rate": 0.00020950552693846456, "loss": 0.014, "step": 119580 }, { "epoch": 0.6, "learning_rate": 0.00020949795924545054, "loss": 0.0142, "step": 119590 }, { "epoch": 0.6, "learning_rate": 0.00020949039155243653, "loss": 0.0164, "step": 119600 }, { "epoch": 0.6, "learning_rate": 0.00020948282385942253, "loss": 0.0139, "step": 119610 }, { "epoch": 0.6, "learning_rate": 0.00020947525616640852, "loss": 0.0117, "step": 119620 }, { "epoch": 0.6, "learning_rate": 0.0002094676884733945, "loss": 0.013, "step": 119630 }, { "epoch": 0.6, "learning_rate": 0.00020946012078038048, "loss": 0.0174, "step": 119640 }, { "epoch": 0.6, "learning_rate": 0.0002094525530873665, "loss": 0.016, "step": 119650 }, { "epoch": 0.6, "learning_rate": 0.00020944498539435247, "loss": 0.0191, "step": 119660 }, { "epoch": 0.6, "learning_rate": 0.00020943741770133845, "loss": 0.0144, "step": 119670 }, { "epoch": 0.6, "learning_rate": 0.00020942985000832446, "loss": 0.0164, "step": 119680 }, { "epoch": 0.6, "learning_rate": 0.00020942228231531044, "loss": 0.0128, "step": 119690 }, { "epoch": 0.6, "learning_rate": 0.00020941471462229642, "loss": 0.0169, "step": 119700 }, { "epoch": 0.6, "learning_rate": 0.00020940714692928243, "loss": 0.0163, "step": 119710 }, { "epoch": 0.6, "learning_rate": 0.0002093995792362684, "loss": 0.021, "step": 119720 }, { "epoch": 0.6, "learning_rate": 0.0002093920115432544, "loss": 0.0151, "step": 119730 }, { "epoch": 0.6, "learning_rate": 0.0002093844438502404, "loss": 0.017, "step": 119740 }, { "epoch": 0.6, "learning_rate": 0.00020937687615722638, "loss": 0.0143, "step": 119750 }, { "epoch": 0.6, "learning_rate": 0.00020936930846421236, "loss": 0.0155, "step": 119760 }, { "epoch": 0.6, "learning_rate": 0.00020936174077119837, "loss": 0.0139, "step": 119770 }, { "epoch": 0.6, "learning_rate": 0.00020935417307818435, "loss": 0.0162, "step": 119780 }, { "epoch": 0.6, "learning_rate": 0.00020934660538517034, "loss": 0.0112, "step": 119790 }, { "epoch": 0.6, "learning_rate": 0.00020933903769215632, "loss": 0.0147, "step": 119800 }, { "epoch": 0.6, "learning_rate": 0.00020933146999914233, "loss": 0.0165, "step": 119810 }, { "epoch": 0.6, "learning_rate": 0.0002093239023061283, "loss": 0.0204, "step": 119820 }, { "epoch": 0.6, "learning_rate": 0.0002093163346131143, "loss": 0.0165, "step": 119830 }, { "epoch": 0.6, "learning_rate": 0.0002093087669201003, "loss": 0.0146, "step": 119840 }, { "epoch": 0.6, "learning_rate": 0.00020930119922708628, "loss": 0.0148, "step": 119850 }, { "epoch": 0.6, "learning_rate": 0.00020929363153407226, "loss": 0.0122, "step": 119860 }, { "epoch": 0.6, "learning_rate": 0.00020928606384105827, "loss": 0.0138, "step": 119870 }, { "epoch": 0.6, "learning_rate": 0.00020927849614804425, "loss": 0.0156, "step": 119880 }, { "epoch": 0.6, "learning_rate": 0.00020927092845503023, "loss": 0.0138, "step": 119890 }, { "epoch": 0.6, "learning_rate": 0.00020926336076201624, "loss": 0.0159, "step": 119900 }, { "epoch": 0.6, "learning_rate": 0.00020925579306900222, "loss": 0.0143, "step": 119910 }, { "epoch": 0.61, "learning_rate": 0.0002092482253759882, "loss": 0.0155, "step": 119920 }, { "epoch": 0.61, "learning_rate": 0.0002092406576829742, "loss": 0.0276, "step": 119930 }, { "epoch": 0.61, "learning_rate": 0.0002092330899899602, "loss": 0.0167, "step": 119940 }, { "epoch": 0.61, "learning_rate": 0.00020922552229694617, "loss": 0.019, "step": 119950 }, { "epoch": 0.61, "learning_rate": 0.00020921795460393218, "loss": 0.0149, "step": 119960 }, { "epoch": 0.61, "learning_rate": 0.00020921038691091816, "loss": 0.0166, "step": 119970 }, { "epoch": 0.61, "learning_rate": 0.00020920281921790415, "loss": 0.0147, "step": 119980 }, { "epoch": 0.61, "learning_rate": 0.00020919525152489013, "loss": 0.013, "step": 119990 }, { "epoch": 0.61, "learning_rate": 0.00020918768383187614, "loss": 0.0134, "step": 120000 }, { "epoch": 0.61, "eval_cer": 0.9144925750140465, "eval_loss": 0.0107016796246171, "eval_runtime": 116.8152, "eval_samples_per_second": 17.121, "eval_steps_per_second": 4.28, "step": 120000 }, { "epoch": 0.61, "learning_rate": 0.00020918011613886212, "loss": 0.0128, "step": 120010 }, { "epoch": 0.61, "learning_rate": 0.0002091725484458481, "loss": 0.0138, "step": 120020 }, { "epoch": 0.61, "learning_rate": 0.0002091649807528341, "loss": 0.0138, "step": 120030 }, { "epoch": 0.61, "learning_rate": 0.00020915741305982006, "loss": 0.0128, "step": 120040 }, { "epoch": 0.61, "learning_rate": 0.00020914984536680604, "loss": 0.0164, "step": 120050 }, { "epoch": 0.61, "learning_rate": 0.00020914227767379202, "loss": 0.0129, "step": 120060 }, { "epoch": 0.61, "learning_rate": 0.00020913470998077803, "loss": 0.0156, "step": 120070 }, { "epoch": 0.61, "learning_rate": 0.00020912714228776401, "loss": 0.0199, "step": 120080 }, { "epoch": 0.61, "learning_rate": 0.00020911957459475, "loss": 0.0168, "step": 120090 }, { "epoch": 0.61, "learning_rate": 0.000209112006901736, "loss": 0.0181, "step": 120100 }, { "epoch": 0.61, "learning_rate": 0.00020910443920872199, "loss": 0.0154, "step": 120110 }, { "epoch": 0.61, "learning_rate": 0.00020909687151570797, "loss": 0.0125, "step": 120120 }, { "epoch": 0.61, "learning_rate": 0.00020908930382269398, "loss": 0.0178, "step": 120130 }, { "epoch": 0.61, "learning_rate": 0.00020908173612967996, "loss": 0.0169, "step": 120140 }, { "epoch": 0.61, "learning_rate": 0.00020907416843666594, "loss": 0.0147, "step": 120150 }, { "epoch": 0.61, "learning_rate": 0.00020906660074365195, "loss": 0.0131, "step": 120160 }, { "epoch": 0.61, "learning_rate": 0.00020905903305063793, "loss": 0.0128, "step": 120170 }, { "epoch": 0.61, "learning_rate": 0.0002090514653576239, "loss": 0.0131, "step": 120180 }, { "epoch": 0.61, "learning_rate": 0.0002090438976646099, "loss": 0.0158, "step": 120190 }, { "epoch": 0.61, "learning_rate": 0.0002090363299715959, "loss": 0.0133, "step": 120200 }, { "epoch": 0.61, "learning_rate": 0.00020902876227858188, "loss": 0.0129, "step": 120210 }, { "epoch": 0.61, "learning_rate": 0.00020902119458556786, "loss": 0.0143, "step": 120220 }, { "epoch": 0.61, "learning_rate": 0.00020901362689255387, "loss": 0.0149, "step": 120230 }, { "epoch": 0.61, "learning_rate": 0.00020900605919953985, "loss": 0.0151, "step": 120240 }, { "epoch": 0.61, "learning_rate": 0.00020899849150652583, "loss": 0.0167, "step": 120250 }, { "epoch": 0.61, "learning_rate": 0.00020899092381351184, "loss": 0.0139, "step": 120260 }, { "epoch": 0.61, "learning_rate": 0.00020898335612049782, "loss": 0.0131, "step": 120270 }, { "epoch": 0.61, "learning_rate": 0.0002089757884274838, "loss": 0.0173, "step": 120280 }, { "epoch": 0.61, "learning_rate": 0.00020896822073446981, "loss": 0.0135, "step": 120290 }, { "epoch": 0.61, "learning_rate": 0.0002089606530414558, "loss": 0.0149, "step": 120300 }, { "epoch": 0.61, "learning_rate": 0.00020895308534844178, "loss": 0.0184, "step": 120310 }, { "epoch": 0.61, "learning_rate": 0.00020894551765542779, "loss": 0.0142, "step": 120320 }, { "epoch": 0.61, "learning_rate": 0.00020893794996241377, "loss": 0.0196, "step": 120330 }, { "epoch": 0.61, "learning_rate": 0.00020893038226939975, "loss": 0.0188, "step": 120340 }, { "epoch": 0.61, "learning_rate": 0.00020892281457638576, "loss": 0.0132, "step": 120350 }, { "epoch": 0.61, "learning_rate": 0.00020891524688337174, "loss": 0.0193, "step": 120360 }, { "epoch": 0.61, "learning_rate": 0.00020890767919035772, "loss": 0.0121, "step": 120370 }, { "epoch": 0.61, "learning_rate": 0.0002089001114973437, "loss": 0.0174, "step": 120380 }, { "epoch": 0.61, "learning_rate": 0.0002088925438043297, "loss": 0.0142, "step": 120390 }, { "epoch": 0.61, "learning_rate": 0.0002088849761113157, "loss": 0.0119, "step": 120400 }, { "epoch": 0.61, "learning_rate": 0.00020887740841830167, "loss": 0.0116, "step": 120410 }, { "epoch": 0.61, "learning_rate": 0.00020886984072528768, "loss": 0.0146, "step": 120420 }, { "epoch": 0.61, "learning_rate": 0.00020886227303227366, "loss": 0.0198, "step": 120430 }, { "epoch": 0.61, "learning_rate": 0.00020885470533925964, "loss": 0.0147, "step": 120440 }, { "epoch": 0.61, "learning_rate": 0.00020884713764624565, "loss": 0.0152, "step": 120450 }, { "epoch": 0.61, "learning_rate": 0.00020883956995323163, "loss": 0.015, "step": 120460 }, { "epoch": 0.61, "learning_rate": 0.00020883200226021762, "loss": 0.0122, "step": 120470 }, { "epoch": 0.61, "learning_rate": 0.00020882443456720362, "loss": 0.0163, "step": 120480 }, { "epoch": 0.61, "learning_rate": 0.0002088168668741896, "loss": 0.0124, "step": 120490 }, { "epoch": 0.61, "learning_rate": 0.0002088092991811756, "loss": 0.0133, "step": 120500 }, { "epoch": 0.61, "learning_rate": 0.0002088017314881616, "loss": 0.0107, "step": 120510 }, { "epoch": 0.61, "learning_rate": 0.00020879416379514758, "loss": 0.0141, "step": 120520 }, { "epoch": 0.61, "learning_rate": 0.00020878659610213356, "loss": 0.0142, "step": 120530 }, { "epoch": 0.61, "learning_rate": 0.00020877902840911954, "loss": 0.0169, "step": 120540 }, { "epoch": 0.61, "learning_rate": 0.00020877146071610555, "loss": 0.016, "step": 120550 }, { "epoch": 0.61, "learning_rate": 0.00020876389302309153, "loss": 0.0174, "step": 120560 }, { "epoch": 0.61, "learning_rate": 0.0002087563253300775, "loss": 0.0186, "step": 120570 }, { "epoch": 0.61, "learning_rate": 0.00020874875763706352, "loss": 0.0281, "step": 120580 }, { "epoch": 0.61, "learning_rate": 0.0002087411899440495, "loss": 0.014, "step": 120590 }, { "epoch": 0.61, "learning_rate": 0.00020873362225103548, "loss": 0.0112, "step": 120600 }, { "epoch": 0.61, "learning_rate": 0.0002087260545580215, "loss": 0.018, "step": 120610 }, { "epoch": 0.61, "learning_rate": 0.00020871848686500747, "loss": 0.0143, "step": 120620 }, { "epoch": 0.61, "learning_rate": 0.00020871091917199345, "loss": 0.0158, "step": 120630 }, { "epoch": 0.61, "learning_rate": 0.00020870335147897946, "loss": 0.0145, "step": 120640 }, { "epoch": 0.61, "learning_rate": 0.00020869578378596544, "loss": 0.0171, "step": 120650 }, { "epoch": 0.61, "learning_rate": 0.00020868821609295143, "loss": 0.0136, "step": 120660 }, { "epoch": 0.61, "learning_rate": 0.00020868064839993743, "loss": 0.0166, "step": 120670 }, { "epoch": 0.61, "learning_rate": 0.00020867308070692342, "loss": 0.0151, "step": 120680 }, { "epoch": 0.61, "learning_rate": 0.0002086655130139094, "loss": 0.0136, "step": 120690 }, { "epoch": 0.61, "learning_rate": 0.00020865794532089538, "loss": 0.0127, "step": 120700 }, { "epoch": 0.61, "learning_rate": 0.0002086503776278814, "loss": 0.0199, "step": 120710 }, { "epoch": 0.61, "learning_rate": 0.00020864280993486737, "loss": 0.0166, "step": 120720 }, { "epoch": 0.61, "learning_rate": 0.00020863524224185335, "loss": 0.0137, "step": 120730 }, { "epoch": 0.61, "learning_rate": 0.00020862767454883936, "loss": 0.0138, "step": 120740 }, { "epoch": 0.61, "learning_rate": 0.00020862010685582534, "loss": 0.015, "step": 120750 }, { "epoch": 0.61, "learning_rate": 0.00020861253916281132, "loss": 0.0144, "step": 120760 }, { "epoch": 0.61, "learning_rate": 0.00020860497146979733, "loss": 0.0176, "step": 120770 }, { "epoch": 0.61, "learning_rate": 0.0002085974037767833, "loss": 0.0132, "step": 120780 }, { "epoch": 0.61, "learning_rate": 0.0002085898360837693, "loss": 0.0153, "step": 120790 }, { "epoch": 0.61, "learning_rate": 0.0002085822683907553, "loss": 0.0152, "step": 120800 }, { "epoch": 0.61, "learning_rate": 0.00020857470069774128, "loss": 0.0111, "step": 120810 }, { "epoch": 0.61, "learning_rate": 0.00020856713300472726, "loss": 0.014, "step": 120820 }, { "epoch": 0.61, "learning_rate": 0.00020855956531171327, "loss": 0.014, "step": 120830 }, { "epoch": 0.61, "learning_rate": 0.00020855199761869925, "loss": 0.0146, "step": 120840 }, { "epoch": 0.61, "learning_rate": 0.00020854442992568524, "loss": 0.0185, "step": 120850 }, { "epoch": 0.61, "learning_rate": 0.00020853686223267124, "loss": 0.0151, "step": 120860 }, { "epoch": 0.61, "learning_rate": 0.00020852929453965723, "loss": 0.0157, "step": 120870 }, { "epoch": 0.61, "learning_rate": 0.0002085217268466432, "loss": 0.0119, "step": 120880 }, { "epoch": 0.61, "learning_rate": 0.0002085141591536292, "loss": 0.0171, "step": 120890 }, { "epoch": 0.61, "learning_rate": 0.0002085065914606152, "loss": 0.017, "step": 120900 }, { "epoch": 0.61, "learning_rate": 0.00020849902376760118, "loss": 0.0143, "step": 120910 }, { "epoch": 0.61, "learning_rate": 0.00020849145607458716, "loss": 0.013, "step": 120920 }, { "epoch": 0.61, "learning_rate": 0.00020848388838157317, "loss": 0.0156, "step": 120930 }, { "epoch": 0.61, "learning_rate": 0.00020847632068855915, "loss": 0.0149, "step": 120940 }, { "epoch": 0.61, "learning_rate": 0.00020846875299554513, "loss": 0.015, "step": 120950 }, { "epoch": 0.61, "learning_rate": 0.00020846118530253114, "loss": 0.0135, "step": 120960 }, { "epoch": 0.61, "learning_rate": 0.00020845361760951712, "loss": 0.0167, "step": 120970 }, { "epoch": 0.61, "learning_rate": 0.0002084460499165031, "loss": 0.0149, "step": 120980 }, { "epoch": 0.61, "learning_rate": 0.0002084384822234891, "loss": 0.0136, "step": 120990 }, { "epoch": 0.61, "learning_rate": 0.0002084309145304751, "loss": 0.0164, "step": 121000 }, { "epoch": 0.61, "eval_cer": 0.9144799598644162, "eval_loss": 0.010320211760699749, "eval_runtime": 116.7947, "eval_samples_per_second": 17.124, "eval_steps_per_second": 4.281, "step": 121000 }, { "epoch": 0.61, "learning_rate": 0.00020842334683746107, "loss": 0.0171, "step": 121010 }, { "epoch": 0.61, "learning_rate": 0.00020841577914444708, "loss": 0.0128, "step": 121020 }, { "epoch": 0.61, "learning_rate": 0.00020840821145143306, "loss": 0.0111, "step": 121030 }, { "epoch": 0.61, "learning_rate": 0.00020840064375841905, "loss": 0.0125, "step": 121040 }, { "epoch": 0.61, "learning_rate": 0.00020839307606540503, "loss": 0.0127, "step": 121050 }, { "epoch": 0.61, "learning_rate": 0.00020838550837239104, "loss": 0.0125, "step": 121060 }, { "epoch": 0.61, "learning_rate": 0.00020837794067937702, "loss": 0.0152, "step": 121070 }, { "epoch": 0.61, "learning_rate": 0.000208370372986363, "loss": 0.0127, "step": 121080 }, { "epoch": 0.61, "learning_rate": 0.000208362805293349, "loss": 0.015, "step": 121090 }, { "epoch": 0.61, "learning_rate": 0.000208355237600335, "loss": 0.0185, "step": 121100 }, { "epoch": 0.61, "learning_rate": 0.00020834766990732097, "loss": 0.013, "step": 121110 }, { "epoch": 0.61, "learning_rate": 0.00020834010221430698, "loss": 0.0158, "step": 121120 }, { "epoch": 0.61, "learning_rate": 0.00020833253452129296, "loss": 0.013, "step": 121130 }, { "epoch": 0.61, "learning_rate": 0.00020832496682827894, "loss": 0.0131, "step": 121140 }, { "epoch": 0.61, "learning_rate": 0.00020831739913526495, "loss": 0.0155, "step": 121150 }, { "epoch": 0.61, "learning_rate": 0.00020830983144225093, "loss": 0.0147, "step": 121160 }, { "epoch": 0.61, "learning_rate": 0.0002083022637492369, "loss": 0.0139, "step": 121170 }, { "epoch": 0.61, "learning_rate": 0.00020829469605622292, "loss": 0.0123, "step": 121180 }, { "epoch": 0.61, "learning_rate": 0.0002082871283632089, "loss": 0.0152, "step": 121190 }, { "epoch": 0.61, "learning_rate": 0.00020827956067019488, "loss": 0.0135, "step": 121200 }, { "epoch": 0.61, "learning_rate": 0.00020827199297718087, "loss": 0.014, "step": 121210 }, { "epoch": 0.61, "learning_rate": 0.00020826442528416687, "loss": 0.0158, "step": 121220 }, { "epoch": 0.61, "learning_rate": 0.00020825685759115286, "loss": 0.0178, "step": 121230 }, { "epoch": 0.61, "learning_rate": 0.00020824928989813884, "loss": 0.013, "step": 121240 }, { "epoch": 0.61, "learning_rate": 0.00020824172220512485, "loss": 0.012, "step": 121250 }, { "epoch": 0.61, "learning_rate": 0.00020823415451211083, "loss": 0.0182, "step": 121260 }, { "epoch": 0.61, "learning_rate": 0.0002082265868190968, "loss": 0.0134, "step": 121270 }, { "epoch": 0.61, "learning_rate": 0.00020821901912608282, "loss": 0.0131, "step": 121280 }, { "epoch": 0.61, "learning_rate": 0.00020821145143306877, "loss": 0.0132, "step": 121290 }, { "epoch": 0.61, "learning_rate": 0.00020820388374005475, "loss": 0.0175, "step": 121300 }, { "epoch": 0.61, "learning_rate": 0.00020819631604704073, "loss": 0.014, "step": 121310 }, { "epoch": 0.61, "learning_rate": 0.00020818874835402674, "loss": 0.0147, "step": 121320 }, { "epoch": 0.61, "learning_rate": 0.00020818118066101272, "loss": 0.0177, "step": 121330 }, { "epoch": 0.61, "learning_rate": 0.0002081736129679987, "loss": 0.0204, "step": 121340 }, { "epoch": 0.61, "learning_rate": 0.00020816604527498471, "loss": 0.0134, "step": 121350 }, { "epoch": 0.61, "learning_rate": 0.0002081584775819707, "loss": 0.0176, "step": 121360 }, { "epoch": 0.61, "learning_rate": 0.00020815090988895668, "loss": 0.0171, "step": 121370 }, { "epoch": 0.61, "learning_rate": 0.00020814334219594269, "loss": 0.0166, "step": 121380 }, { "epoch": 0.61, "learning_rate": 0.00020813577450292867, "loss": 0.0158, "step": 121390 }, { "epoch": 0.61, "learning_rate": 0.00020812820680991465, "loss": 0.0142, "step": 121400 }, { "epoch": 0.61, "learning_rate": 0.00020812063911690066, "loss": 0.0157, "step": 121410 }, { "epoch": 0.61, "learning_rate": 0.00020811307142388664, "loss": 0.0127, "step": 121420 }, { "epoch": 0.61, "learning_rate": 0.00020810550373087262, "loss": 0.0142, "step": 121430 }, { "epoch": 0.61, "learning_rate": 0.0002080979360378586, "loss": 0.0117, "step": 121440 }, { "epoch": 0.61, "learning_rate": 0.0002080903683448446, "loss": 0.0126, "step": 121450 }, { "epoch": 0.61, "learning_rate": 0.0002080828006518306, "loss": 0.0128, "step": 121460 }, { "epoch": 0.61, "learning_rate": 0.00020807523295881657, "loss": 0.0128, "step": 121470 }, { "epoch": 0.61, "learning_rate": 0.00020806766526580258, "loss": 0.0146, "step": 121480 }, { "epoch": 0.61, "learning_rate": 0.00020806009757278856, "loss": 0.0152, "step": 121490 }, { "epoch": 0.61, "learning_rate": 0.00020805252987977455, "loss": 0.0143, "step": 121500 }, { "epoch": 0.61, "learning_rate": 0.00020804496218676055, "loss": 0.0154, "step": 121510 }, { "epoch": 0.61, "learning_rate": 0.00020803739449374654, "loss": 0.0153, "step": 121520 }, { "epoch": 0.61, "learning_rate": 0.00020802982680073252, "loss": 0.0131, "step": 121530 }, { "epoch": 0.61, "learning_rate": 0.00020802225910771853, "loss": 0.0113, "step": 121540 }, { "epoch": 0.61, "learning_rate": 0.0002080146914147045, "loss": 0.0138, "step": 121550 }, { "epoch": 0.61, "learning_rate": 0.0002080071237216905, "loss": 0.015, "step": 121560 }, { "epoch": 0.61, "learning_rate": 0.0002079995560286765, "loss": 0.0168, "step": 121570 }, { "epoch": 0.61, "learning_rate": 0.00020799198833566248, "loss": 0.0139, "step": 121580 }, { "epoch": 0.61, "learning_rate": 0.00020798442064264846, "loss": 0.0132, "step": 121590 }, { "epoch": 0.61, "learning_rate": 0.00020797685294963444, "loss": 0.0164, "step": 121600 }, { "epoch": 0.61, "learning_rate": 0.00020796928525662045, "loss": 0.0167, "step": 121610 }, { "epoch": 0.61, "learning_rate": 0.00020796171756360643, "loss": 0.0149, "step": 121620 }, { "epoch": 0.61, "learning_rate": 0.0002079541498705924, "loss": 0.0126, "step": 121630 }, { "epoch": 0.61, "learning_rate": 0.00020794658217757842, "loss": 0.0148, "step": 121640 }, { "epoch": 0.61, "learning_rate": 0.0002079390144845644, "loss": 0.0133, "step": 121650 }, { "epoch": 0.61, "learning_rate": 0.00020793144679155038, "loss": 0.0149, "step": 121660 }, { "epoch": 0.61, "learning_rate": 0.0002079238790985364, "loss": 0.015, "step": 121670 }, { "epoch": 0.61, "learning_rate": 0.00020791631140552237, "loss": 0.0141, "step": 121680 }, { "epoch": 0.61, "learning_rate": 0.00020790874371250836, "loss": 0.0146, "step": 121690 }, { "epoch": 0.61, "learning_rate": 0.00020790117601949436, "loss": 0.0159, "step": 121700 }, { "epoch": 0.61, "learning_rate": 0.00020789360832648035, "loss": 0.0128, "step": 121710 }, { "epoch": 0.61, "learning_rate": 0.00020788604063346633, "loss": 0.012, "step": 121720 }, { "epoch": 0.61, "learning_rate": 0.00020787847294045234, "loss": 0.0172, "step": 121730 }, { "epoch": 0.61, "learning_rate": 0.00020787090524743832, "loss": 0.0151, "step": 121740 }, { "epoch": 0.61, "learning_rate": 0.0002078633375544243, "loss": 0.0109, "step": 121750 }, { "epoch": 0.61, "learning_rate": 0.00020785576986141028, "loss": 0.0139, "step": 121760 }, { "epoch": 0.61, "learning_rate": 0.0002078482021683963, "loss": 0.0149, "step": 121770 }, { "epoch": 0.61, "learning_rate": 0.00020784063447538227, "loss": 0.0122, "step": 121780 }, { "epoch": 0.61, "learning_rate": 0.00020783306678236825, "loss": 0.012, "step": 121790 }, { "epoch": 0.61, "learning_rate": 0.00020782549908935426, "loss": 0.0131, "step": 121800 }, { "epoch": 0.61, "learning_rate": 0.00020781793139634024, "loss": 0.0137, "step": 121810 }, { "epoch": 0.61, "learning_rate": 0.00020781036370332622, "loss": 0.0151, "step": 121820 }, { "epoch": 0.61, "learning_rate": 0.00020780279601031223, "loss": 0.015, "step": 121830 }, { "epoch": 0.61, "learning_rate": 0.0002077952283172982, "loss": 0.0129, "step": 121840 }, { "epoch": 0.61, "learning_rate": 0.0002077876606242842, "loss": 0.0156, "step": 121850 }, { "epoch": 0.61, "learning_rate": 0.0002077800929312702, "loss": 0.0112, "step": 121860 }, { "epoch": 0.61, "learning_rate": 0.00020777252523825618, "loss": 0.0146, "step": 121870 }, { "epoch": 0.61, "learning_rate": 0.00020776495754524217, "loss": 0.0176, "step": 121880 }, { "epoch": 0.61, "learning_rate": 0.00020775738985222817, "loss": 0.0188, "step": 121890 }, { "epoch": 0.61, "learning_rate": 0.00020774982215921416, "loss": 0.0149, "step": 121900 }, { "epoch": 0.62, "learning_rate": 0.00020774225446620014, "loss": 0.0143, "step": 121910 }, { "epoch": 0.62, "learning_rate": 0.00020773468677318615, "loss": 0.0137, "step": 121920 }, { "epoch": 0.62, "learning_rate": 0.00020772711908017213, "loss": 0.0125, "step": 121930 }, { "epoch": 0.62, "learning_rate": 0.0002077195513871581, "loss": 0.0152, "step": 121940 }, { "epoch": 0.62, "learning_rate": 0.0002077119836941441, "loss": 0.0134, "step": 121950 }, { "epoch": 0.62, "learning_rate": 0.0002077044160011301, "loss": 0.0138, "step": 121960 }, { "epoch": 0.62, "learning_rate": 0.00020769684830811608, "loss": 0.0137, "step": 121970 }, { "epoch": 0.62, "learning_rate": 0.00020768928061510206, "loss": 0.0126, "step": 121980 }, { "epoch": 0.62, "learning_rate": 0.00020768171292208807, "loss": 0.0138, "step": 121990 }, { "epoch": 0.62, "learning_rate": 0.00020767414522907405, "loss": 0.0116, "step": 122000 }, { "epoch": 0.62, "eval_cer": 0.9145071309559275, "eval_loss": 0.010251490399241447, "eval_runtime": 116.7533, "eval_samples_per_second": 17.13, "eval_steps_per_second": 4.283, "step": 122000 }, { "epoch": 0.62, "learning_rate": 0.00020766657753606003, "loss": 0.0127, "step": 122010 }, { "epoch": 0.62, "learning_rate": 0.00020765900984304604, "loss": 0.0129, "step": 122020 }, { "epoch": 0.62, "learning_rate": 0.00020765144215003202, "loss": 0.0125, "step": 122030 }, { "epoch": 0.62, "learning_rate": 0.000207643874457018, "loss": 0.0144, "step": 122040 }, { "epoch": 0.62, "learning_rate": 0.000207636306764004, "loss": 0.0132, "step": 122050 }, { "epoch": 0.62, "learning_rate": 0.00020762873907099, "loss": 0.0163, "step": 122060 }, { "epoch": 0.62, "learning_rate": 0.00020762117137797598, "loss": 0.0123, "step": 122070 }, { "epoch": 0.62, "learning_rate": 0.00020761360368496198, "loss": 0.0163, "step": 122080 }, { "epoch": 0.62, "learning_rate": 0.00020760603599194797, "loss": 0.0137, "step": 122090 }, { "epoch": 0.62, "learning_rate": 0.00020759846829893395, "loss": 0.0135, "step": 122100 }, { "epoch": 0.62, "learning_rate": 0.00020759090060591993, "loss": 0.0141, "step": 122110 }, { "epoch": 0.62, "learning_rate": 0.00020758333291290594, "loss": 0.0157, "step": 122120 }, { "epoch": 0.62, "learning_rate": 0.00020757576521989192, "loss": 0.0123, "step": 122130 }, { "epoch": 0.62, "learning_rate": 0.0002075681975268779, "loss": 0.0138, "step": 122140 }, { "epoch": 0.62, "learning_rate": 0.0002075606298338639, "loss": 0.0136, "step": 122150 }, { "epoch": 0.62, "learning_rate": 0.0002075530621408499, "loss": 0.0135, "step": 122160 }, { "epoch": 0.62, "learning_rate": 0.00020754549444783587, "loss": 0.0155, "step": 122170 }, { "epoch": 0.62, "learning_rate": 0.00020753792675482188, "loss": 0.0187, "step": 122180 }, { "epoch": 0.62, "learning_rate": 0.00020753035906180786, "loss": 0.0157, "step": 122190 }, { "epoch": 0.62, "learning_rate": 0.00020752279136879384, "loss": 0.0145, "step": 122200 }, { "epoch": 0.62, "learning_rate": 0.00020751522367577985, "loss": 0.0169, "step": 122210 }, { "epoch": 0.62, "learning_rate": 0.00020750765598276583, "loss": 0.0125, "step": 122220 }, { "epoch": 0.62, "learning_rate": 0.00020750008828975181, "loss": 0.0133, "step": 122230 }, { "epoch": 0.62, "learning_rate": 0.00020749252059673782, "loss": 0.0157, "step": 122240 }, { "epoch": 0.62, "learning_rate": 0.0002074849529037238, "loss": 0.0152, "step": 122250 }, { "epoch": 0.62, "learning_rate": 0.00020747738521070979, "loss": 0.0164, "step": 122260 }, { "epoch": 0.62, "learning_rate": 0.00020746981751769577, "loss": 0.014, "step": 122270 }, { "epoch": 0.62, "learning_rate": 0.00020746224982468178, "loss": 0.0145, "step": 122280 }, { "epoch": 0.62, "learning_rate": 0.00020745468213166776, "loss": 0.0139, "step": 122290 }, { "epoch": 0.62, "learning_rate": 0.00020744711443865374, "loss": 0.0148, "step": 122300 }, { "epoch": 0.62, "learning_rate": 0.00020743954674563975, "loss": 0.0156, "step": 122310 }, { "epoch": 0.62, "learning_rate": 0.00020743197905262573, "loss": 0.0123, "step": 122320 }, { "epoch": 0.62, "learning_rate": 0.0002074244113596117, "loss": 0.0146, "step": 122330 }, { "epoch": 0.62, "learning_rate": 0.00020741684366659772, "loss": 0.011, "step": 122340 }, { "epoch": 0.62, "learning_rate": 0.0002074092759735837, "loss": 0.012, "step": 122350 }, { "epoch": 0.62, "learning_rate": 0.00020740170828056968, "loss": 0.0123, "step": 122360 }, { "epoch": 0.62, "learning_rate": 0.0002073941405875557, "loss": 0.0145, "step": 122370 }, { "epoch": 0.62, "learning_rate": 0.00020738657289454167, "loss": 0.0435, "step": 122380 }, { "epoch": 0.62, "learning_rate": 0.00020737900520152765, "loss": 0.0144, "step": 122390 }, { "epoch": 0.62, "learning_rate": 0.00020737143750851366, "loss": 0.015, "step": 122400 }, { "epoch": 0.62, "learning_rate": 0.00020736386981549964, "loss": 0.0163, "step": 122410 }, { "epoch": 0.62, "learning_rate": 0.00020735630212248562, "loss": 0.0156, "step": 122420 }, { "epoch": 0.62, "learning_rate": 0.00020734873442947163, "loss": 0.0174, "step": 122430 }, { "epoch": 0.62, "learning_rate": 0.00020734116673645761, "loss": 0.0168, "step": 122440 }, { "epoch": 0.62, "learning_rate": 0.0002073335990434436, "loss": 0.0173, "step": 122450 }, { "epoch": 0.62, "learning_rate": 0.00020732603135042958, "loss": 0.0157, "step": 122460 }, { "epoch": 0.62, "learning_rate": 0.00020731846365741559, "loss": 0.013, "step": 122470 }, { "epoch": 0.62, "learning_rate": 0.00020731089596440157, "loss": 0.0131, "step": 122480 }, { "epoch": 0.62, "learning_rate": 0.00020730332827138755, "loss": 0.0142, "step": 122490 }, { "epoch": 0.62, "learning_rate": 0.00020729576057837356, "loss": 0.0159, "step": 122500 }, { "epoch": 0.62, "learning_rate": 0.00020728819288535954, "loss": 0.0119, "step": 122510 }, { "epoch": 0.62, "learning_rate": 0.00020728062519234552, "loss": 0.0148, "step": 122520 }, { "epoch": 0.62, "learning_rate": 0.00020727305749933153, "loss": 0.0173, "step": 122530 }, { "epoch": 0.62, "learning_rate": 0.0002072654898063175, "loss": 0.0134, "step": 122540 }, { "epoch": 0.62, "learning_rate": 0.00020725792211330346, "loss": 0.0196, "step": 122550 }, { "epoch": 0.62, "learning_rate": 0.00020725035442028945, "loss": 0.0138, "step": 122560 }, { "epoch": 0.62, "learning_rate": 0.00020724278672727545, "loss": 0.014, "step": 122570 }, { "epoch": 0.62, "learning_rate": 0.00020723521903426144, "loss": 0.0147, "step": 122580 }, { "epoch": 0.62, "learning_rate": 0.00020722765134124742, "loss": 0.0126, "step": 122590 }, { "epoch": 0.62, "learning_rate": 0.00020722008364823343, "loss": 0.013, "step": 122600 }, { "epoch": 0.62, "learning_rate": 0.0002072125159552194, "loss": 0.0132, "step": 122610 }, { "epoch": 0.62, "learning_rate": 0.0002072049482622054, "loss": 0.0158, "step": 122620 }, { "epoch": 0.62, "learning_rate": 0.0002071973805691914, "loss": 0.0161, "step": 122630 }, { "epoch": 0.62, "learning_rate": 0.00020718981287617738, "loss": 0.0117, "step": 122640 }, { "epoch": 0.62, "learning_rate": 0.00020718224518316336, "loss": 0.0157, "step": 122650 }, { "epoch": 0.62, "learning_rate": 0.00020717467749014934, "loss": 0.0152, "step": 122660 }, { "epoch": 0.62, "learning_rate": 0.00020716710979713535, "loss": 0.0143, "step": 122670 }, { "epoch": 0.62, "learning_rate": 0.00020715954210412133, "loss": 0.0175, "step": 122680 }, { "epoch": 0.62, "learning_rate": 0.0002071519744111073, "loss": 0.0141, "step": 122690 }, { "epoch": 0.62, "learning_rate": 0.00020714440671809332, "loss": 0.0143, "step": 122700 }, { "epoch": 0.62, "learning_rate": 0.0002071368390250793, "loss": 0.0162, "step": 122710 }, { "epoch": 0.62, "learning_rate": 0.00020712927133206528, "loss": 0.018, "step": 122720 }, { "epoch": 0.62, "learning_rate": 0.0002071217036390513, "loss": 0.013, "step": 122730 }, { "epoch": 0.62, "learning_rate": 0.00020711413594603727, "loss": 0.017, "step": 122740 }, { "epoch": 0.62, "learning_rate": 0.00020710656825302326, "loss": 0.0204, "step": 122750 }, { "epoch": 0.62, "learning_rate": 0.00020709900056000926, "loss": 0.0187, "step": 122760 }, { "epoch": 0.62, "learning_rate": 0.00020709143286699525, "loss": 0.0143, "step": 122770 }, { "epoch": 0.62, "learning_rate": 0.00020708386517398123, "loss": 0.0157, "step": 122780 }, { "epoch": 0.62, "learning_rate": 0.00020707629748096724, "loss": 0.014, "step": 122790 }, { "epoch": 0.62, "learning_rate": 0.00020706872978795322, "loss": 0.0141, "step": 122800 }, { "epoch": 0.62, "learning_rate": 0.0002070611620949392, "loss": 0.0142, "step": 122810 }, { "epoch": 0.62, "learning_rate": 0.0002070535944019252, "loss": 0.0147, "step": 122820 }, { "epoch": 0.62, "learning_rate": 0.0002070460267089112, "loss": 0.0161, "step": 122830 }, { "epoch": 0.62, "learning_rate": 0.00020703845901589717, "loss": 0.0122, "step": 122840 }, { "epoch": 0.62, "learning_rate": 0.00020703089132288315, "loss": 0.0147, "step": 122850 }, { "epoch": 0.62, "learning_rate": 0.00020702332362986916, "loss": 0.0143, "step": 122860 }, { "epoch": 0.62, "learning_rate": 0.00020701575593685514, "loss": 0.0124, "step": 122870 }, { "epoch": 0.62, "learning_rate": 0.00020700818824384112, "loss": 0.0143, "step": 122880 }, { "epoch": 0.62, "learning_rate": 0.00020700062055082713, "loss": 0.0104, "step": 122890 }, { "epoch": 0.62, "learning_rate": 0.0002069930528578131, "loss": 0.014, "step": 122900 }, { "epoch": 0.62, "learning_rate": 0.0002069854851647991, "loss": 0.0162, "step": 122910 }, { "epoch": 0.62, "learning_rate": 0.0002069779174717851, "loss": 0.017, "step": 122920 }, { "epoch": 0.62, "learning_rate": 0.00020697034977877108, "loss": 0.0131, "step": 122930 }, { "epoch": 0.62, "learning_rate": 0.00020696278208575707, "loss": 0.0142, "step": 122940 }, { "epoch": 0.62, "learning_rate": 0.00020695521439274307, "loss": 0.0143, "step": 122950 }, { "epoch": 0.62, "learning_rate": 0.00020694764669972906, "loss": 0.0151, "step": 122960 }, { "epoch": 0.62, "learning_rate": 0.00020694007900671504, "loss": 0.0127, "step": 122970 }, { "epoch": 0.62, "learning_rate": 0.00020693251131370105, "loss": 0.0159, "step": 122980 }, { "epoch": 0.62, "learning_rate": 0.00020692494362068703, "loss": 0.0124, "step": 122990 }, { "epoch": 0.62, "learning_rate": 0.000206917375927673, "loss": 0.0134, "step": 123000 }, { "epoch": 0.62, "eval_cer": 0.9144566703574066, "eval_loss": 0.010365525260567665, "eval_runtime": 116.8218, "eval_samples_per_second": 17.12, "eval_steps_per_second": 4.28, "step": 123000 }, { "epoch": 0.62, "learning_rate": 0.000206909808234659, "loss": 0.0145, "step": 123010 }, { "epoch": 0.62, "learning_rate": 0.000206902240541645, "loss": 0.0131, "step": 123020 }, { "epoch": 0.62, "learning_rate": 0.00020689467284863098, "loss": 0.0168, "step": 123030 }, { "epoch": 0.62, "learning_rate": 0.00020688710515561696, "loss": 0.016, "step": 123040 }, { "epoch": 0.62, "learning_rate": 0.00020687953746260297, "loss": 0.0169, "step": 123050 }, { "epoch": 0.62, "learning_rate": 0.00020687196976958895, "loss": 0.0119, "step": 123060 }, { "epoch": 0.62, "learning_rate": 0.00020686440207657493, "loss": 0.0143, "step": 123070 }, { "epoch": 0.62, "learning_rate": 0.00020685683438356094, "loss": 0.0136, "step": 123080 }, { "epoch": 0.62, "learning_rate": 0.00020684926669054692, "loss": 0.0125, "step": 123090 }, { "epoch": 0.62, "learning_rate": 0.0002068416989975329, "loss": 0.0148, "step": 123100 }, { "epoch": 0.62, "learning_rate": 0.0002068341313045189, "loss": 0.0182, "step": 123110 }, { "epoch": 0.62, "learning_rate": 0.0002068265636115049, "loss": 0.0126, "step": 123120 }, { "epoch": 0.62, "learning_rate": 0.00020681899591849088, "loss": 0.0186, "step": 123130 }, { "epoch": 0.62, "learning_rate": 0.00020681142822547688, "loss": 0.015, "step": 123140 }, { "epoch": 0.62, "learning_rate": 0.00020680386053246287, "loss": 0.0183, "step": 123150 }, { "epoch": 0.62, "learning_rate": 0.00020679629283944885, "loss": 0.0152, "step": 123160 }, { "epoch": 0.62, "learning_rate": 0.00020678872514643483, "loss": 0.0167, "step": 123170 }, { "epoch": 0.62, "learning_rate": 0.00020678115745342084, "loss": 0.0172, "step": 123180 }, { "epoch": 0.62, "learning_rate": 0.00020677358976040682, "loss": 0.0158, "step": 123190 }, { "epoch": 0.62, "learning_rate": 0.0002067660220673928, "loss": 0.0166, "step": 123200 }, { "epoch": 0.62, "learning_rate": 0.0002067584543743788, "loss": 0.0189, "step": 123210 }, { "epoch": 0.62, "learning_rate": 0.0002067508866813648, "loss": 0.0145, "step": 123220 }, { "epoch": 0.62, "learning_rate": 0.00020674331898835077, "loss": 0.0174, "step": 123230 }, { "epoch": 0.62, "learning_rate": 0.00020673575129533678, "loss": 0.0134, "step": 123240 }, { "epoch": 0.62, "learning_rate": 0.00020672818360232276, "loss": 0.0143, "step": 123250 }, { "epoch": 0.62, "learning_rate": 0.00020672061590930874, "loss": 0.0149, "step": 123260 }, { "epoch": 0.62, "learning_rate": 0.00020671304821629475, "loss": 0.0132, "step": 123270 }, { "epoch": 0.62, "learning_rate": 0.00020670548052328073, "loss": 0.0122, "step": 123280 }, { "epoch": 0.62, "learning_rate": 0.00020669791283026671, "loss": 0.0134, "step": 123290 }, { "epoch": 0.62, "learning_rate": 0.00020669034513725272, "loss": 0.0132, "step": 123300 }, { "epoch": 0.62, "learning_rate": 0.0002066827774442387, "loss": 0.0129, "step": 123310 }, { "epoch": 0.62, "learning_rate": 0.00020667520975122469, "loss": 0.0147, "step": 123320 }, { "epoch": 0.62, "learning_rate": 0.0002066676420582107, "loss": 0.0126, "step": 123330 }, { "epoch": 0.62, "learning_rate": 0.00020666007436519668, "loss": 0.0118, "step": 123340 }, { "epoch": 0.62, "learning_rate": 0.00020665250667218266, "loss": 0.0151, "step": 123350 }, { "epoch": 0.62, "learning_rate": 0.00020664493897916864, "loss": 0.0155, "step": 123360 }, { "epoch": 0.62, "learning_rate": 0.00020663737128615465, "loss": 0.0147, "step": 123370 }, { "epoch": 0.62, "learning_rate": 0.00020662980359314063, "loss": 0.0131, "step": 123380 }, { "epoch": 0.62, "learning_rate": 0.0002066222359001266, "loss": 0.0148, "step": 123390 }, { "epoch": 0.62, "learning_rate": 0.00020661466820711262, "loss": 0.0121, "step": 123400 }, { "epoch": 0.62, "learning_rate": 0.0002066071005140986, "loss": 0.0143, "step": 123410 }, { "epoch": 0.62, "learning_rate": 0.00020659953282108458, "loss": 0.0121, "step": 123420 }, { "epoch": 0.62, "learning_rate": 0.0002065919651280706, "loss": 0.0118, "step": 123430 }, { "epoch": 0.62, "learning_rate": 0.00020658439743505657, "loss": 0.0133, "step": 123440 }, { "epoch": 0.62, "learning_rate": 0.00020657682974204255, "loss": 0.011, "step": 123450 }, { "epoch": 0.62, "learning_rate": 0.00020656926204902856, "loss": 0.014, "step": 123460 }, { "epoch": 0.62, "learning_rate": 0.00020656169435601454, "loss": 0.0164, "step": 123470 }, { "epoch": 0.62, "learning_rate": 0.00020655412666300052, "loss": 0.0161, "step": 123480 }, { "epoch": 0.62, "learning_rate": 0.00020654655896998653, "loss": 0.015, "step": 123490 }, { "epoch": 0.62, "learning_rate": 0.00020653899127697251, "loss": 0.0125, "step": 123500 }, { "epoch": 0.62, "learning_rate": 0.0002065314235839585, "loss": 0.0124, "step": 123510 }, { "epoch": 0.62, "learning_rate": 0.00020652385589094448, "loss": 0.014, "step": 123520 }, { "epoch": 0.62, "learning_rate": 0.00020651628819793049, "loss": 0.0137, "step": 123530 }, { "epoch": 0.62, "learning_rate": 0.00020650872050491647, "loss": 0.0161, "step": 123540 }, { "epoch": 0.62, "learning_rate": 0.00020650115281190245, "loss": 0.0128, "step": 123550 }, { "epoch": 0.62, "learning_rate": 0.00020649358511888846, "loss": 0.0125, "step": 123560 }, { "epoch": 0.62, "learning_rate": 0.00020648601742587444, "loss": 0.0125, "step": 123570 }, { "epoch": 0.62, "learning_rate": 0.00020647844973286042, "loss": 0.0165, "step": 123580 }, { "epoch": 0.62, "learning_rate": 0.00020647088203984643, "loss": 0.0129, "step": 123590 }, { "epoch": 0.62, "learning_rate": 0.0002064633143468324, "loss": 0.0127, "step": 123600 }, { "epoch": 0.62, "learning_rate": 0.0002064557466538184, "loss": 0.0133, "step": 123610 }, { "epoch": 0.62, "learning_rate": 0.0002064481789608044, "loss": 0.0152, "step": 123620 }, { "epoch": 0.62, "learning_rate": 0.00020644061126779038, "loss": 0.0143, "step": 123630 }, { "epoch": 0.62, "learning_rate": 0.00020643304357477636, "loss": 0.0128, "step": 123640 }, { "epoch": 0.62, "learning_rate": 0.00020642547588176237, "loss": 0.0133, "step": 123650 }, { "epoch": 0.62, "learning_rate": 0.00020641790818874835, "loss": 0.0152, "step": 123660 }, { "epoch": 0.62, "learning_rate": 0.00020641034049573433, "loss": 0.0143, "step": 123670 }, { "epoch": 0.62, "learning_rate": 0.00020640277280272032, "loss": 0.014, "step": 123680 }, { "epoch": 0.62, "learning_rate": 0.00020639520510970632, "loss": 0.0123, "step": 123690 }, { "epoch": 0.62, "learning_rate": 0.0002063876374166923, "loss": 0.0147, "step": 123700 }, { "epoch": 0.62, "learning_rate": 0.0002063800697236783, "loss": 0.016, "step": 123710 }, { "epoch": 0.62, "learning_rate": 0.0002063725020306643, "loss": 0.0119, "step": 123720 }, { "epoch": 0.62, "learning_rate": 0.00020636493433765028, "loss": 0.015, "step": 123730 }, { "epoch": 0.62, "learning_rate": 0.00020635736664463626, "loss": 0.0141, "step": 123740 }, { "epoch": 0.62, "learning_rate": 0.00020634979895162227, "loss": 0.0183, "step": 123750 }, { "epoch": 0.62, "learning_rate": 0.00020634223125860825, "loss": 0.0192, "step": 123760 }, { "epoch": 0.62, "learning_rate": 0.00020633466356559423, "loss": 0.0139, "step": 123770 }, { "epoch": 0.62, "learning_rate": 0.00020632709587258024, "loss": 0.0143, "step": 123780 }, { "epoch": 0.62, "learning_rate": 0.00020631952817956622, "loss": 0.0165, "step": 123790 }, { "epoch": 0.62, "learning_rate": 0.0002063119604865522, "loss": 0.0146, "step": 123800 }, { "epoch": 0.62, "learning_rate": 0.00020630439279353816, "loss": 0.0111, "step": 123810 }, { "epoch": 0.62, "learning_rate": 0.00020629682510052416, "loss": 0.0121, "step": 123820 }, { "epoch": 0.62, "learning_rate": 0.00020628925740751015, "loss": 0.0158, "step": 123830 }, { "epoch": 0.62, "learning_rate": 0.00020628168971449613, "loss": 0.0139, "step": 123840 }, { "epoch": 0.62, "learning_rate": 0.00020627412202148214, "loss": 0.0149, "step": 123850 }, { "epoch": 0.62, "learning_rate": 0.00020626655432846812, "loss": 0.0138, "step": 123860 }, { "epoch": 0.62, "learning_rate": 0.0002062589866354541, "loss": 0.0158, "step": 123870 }, { "epoch": 0.62, "learning_rate": 0.0002062514189424401, "loss": 0.0114, "step": 123880 }, { "epoch": 0.63, "learning_rate": 0.0002062438512494261, "loss": 0.0118, "step": 123890 }, { "epoch": 0.63, "learning_rate": 0.00020623628355641207, "loss": 0.0163, "step": 123900 }, { "epoch": 0.63, "learning_rate": 0.00020622871586339805, "loss": 0.0161, "step": 123910 }, { "epoch": 0.63, "learning_rate": 0.00020622114817038406, "loss": 0.0138, "step": 123920 }, { "epoch": 0.63, "learning_rate": 0.00020621358047737004, "loss": 0.0166, "step": 123930 }, { "epoch": 0.63, "learning_rate": 0.00020620601278435602, "loss": 0.0141, "step": 123940 }, { "epoch": 0.63, "learning_rate": 0.00020619844509134203, "loss": 0.0147, "step": 123950 }, { "epoch": 0.63, "learning_rate": 0.000206190877398328, "loss": 0.0161, "step": 123960 }, { "epoch": 0.63, "learning_rate": 0.000206183309705314, "loss": 0.0162, "step": 123970 }, { "epoch": 0.63, "learning_rate": 0.0002061757420123, "loss": 0.0101, "step": 123980 }, { "epoch": 0.63, "learning_rate": 0.00020616817431928598, "loss": 0.0125, "step": 123990 }, { "epoch": 0.63, "learning_rate": 0.00020616060662627197, "loss": 0.0134, "step": 124000 }, { "epoch": 0.63, "eval_cer": 0.9144877230334195, "eval_loss": 0.010582580231130123, "eval_runtime": 116.7375, "eval_samples_per_second": 17.132, "eval_steps_per_second": 4.283, "step": 124000 }, { "epoch": 0.63, "learning_rate": 0.00020615303893325797, "loss": 0.0157, "step": 124010 }, { "epoch": 0.63, "learning_rate": 0.00020614547124024396, "loss": 0.0124, "step": 124020 }, { "epoch": 0.63, "learning_rate": 0.00020613790354722994, "loss": 0.0161, "step": 124030 }, { "epoch": 0.63, "learning_rate": 0.00020613033585421595, "loss": 0.0163, "step": 124040 }, { "epoch": 0.63, "learning_rate": 0.00020612276816120193, "loss": 0.0119, "step": 124050 }, { "epoch": 0.63, "learning_rate": 0.0002061152004681879, "loss": 0.0167, "step": 124060 }, { "epoch": 0.63, "learning_rate": 0.0002061076327751739, "loss": 0.0129, "step": 124070 }, { "epoch": 0.63, "learning_rate": 0.0002061000650821599, "loss": 0.0137, "step": 124080 }, { "epoch": 0.63, "learning_rate": 0.00020609249738914588, "loss": 0.0138, "step": 124090 }, { "epoch": 0.63, "learning_rate": 0.00020608492969613186, "loss": 0.0148, "step": 124100 }, { "epoch": 0.63, "learning_rate": 0.00020607736200311787, "loss": 0.0134, "step": 124110 }, { "epoch": 0.63, "learning_rate": 0.00020606979431010385, "loss": 0.0143, "step": 124120 }, { "epoch": 0.63, "learning_rate": 0.00020606222661708983, "loss": 0.0169, "step": 124130 }, { "epoch": 0.63, "learning_rate": 0.00020605465892407584, "loss": 0.0122, "step": 124140 }, { "epoch": 0.63, "learning_rate": 0.00020604709123106182, "loss": 0.0155, "step": 124150 }, { "epoch": 0.63, "learning_rate": 0.0002060395235380478, "loss": 0.0132, "step": 124160 }, { "epoch": 0.63, "learning_rate": 0.0002060319558450338, "loss": 0.0157, "step": 124170 }, { "epoch": 0.63, "learning_rate": 0.0002060243881520198, "loss": 0.0148, "step": 124180 }, { "epoch": 0.63, "learning_rate": 0.00020601682045900578, "loss": 0.0143, "step": 124190 }, { "epoch": 0.63, "learning_rate": 0.00020600925276599178, "loss": 0.0121, "step": 124200 }, { "epoch": 0.63, "learning_rate": 0.00020600168507297777, "loss": 0.0146, "step": 124210 }, { "epoch": 0.63, "learning_rate": 0.00020599411737996375, "loss": 0.0146, "step": 124220 }, { "epoch": 0.63, "learning_rate": 0.00020598654968694976, "loss": 0.014, "step": 124230 }, { "epoch": 0.63, "learning_rate": 0.00020597898199393574, "loss": 0.0173, "step": 124240 }, { "epoch": 0.63, "learning_rate": 0.00020597141430092172, "loss": 0.0149, "step": 124250 }, { "epoch": 0.63, "learning_rate": 0.0002059638466079077, "loss": 0.0125, "step": 124260 }, { "epoch": 0.63, "learning_rate": 0.0002059562789148937, "loss": 0.0131, "step": 124270 }, { "epoch": 0.63, "learning_rate": 0.0002059487112218797, "loss": 0.0132, "step": 124280 }, { "epoch": 0.63, "learning_rate": 0.00020594114352886567, "loss": 0.0145, "step": 124290 }, { "epoch": 0.63, "learning_rate": 0.00020593357583585168, "loss": 0.0133, "step": 124300 }, { "epoch": 0.63, "learning_rate": 0.00020592600814283766, "loss": 0.0132, "step": 124310 }, { "epoch": 0.63, "learning_rate": 0.00020591844044982364, "loss": 0.0158, "step": 124320 }, { "epoch": 0.63, "learning_rate": 0.00020591087275680965, "loss": 0.0158, "step": 124330 }, { "epoch": 0.63, "learning_rate": 0.00020590330506379563, "loss": 0.0154, "step": 124340 }, { "epoch": 0.63, "learning_rate": 0.00020589573737078161, "loss": 0.0133, "step": 124350 }, { "epoch": 0.63, "learning_rate": 0.00020588816967776762, "loss": 0.0126, "step": 124360 }, { "epoch": 0.63, "learning_rate": 0.0002058806019847536, "loss": 0.016, "step": 124370 }, { "epoch": 0.63, "learning_rate": 0.00020587303429173959, "loss": 0.0133, "step": 124380 }, { "epoch": 0.63, "learning_rate": 0.0002058654665987256, "loss": 0.0157, "step": 124390 }, { "epoch": 0.63, "learning_rate": 0.00020585789890571158, "loss": 0.0272, "step": 124400 }, { "epoch": 0.63, "learning_rate": 0.00020585033121269756, "loss": 0.0157, "step": 124410 }, { "epoch": 0.63, "learning_rate": 0.00020584276351968354, "loss": 0.0145, "step": 124420 }, { "epoch": 0.63, "learning_rate": 0.00020583519582666955, "loss": 0.0132, "step": 124430 }, { "epoch": 0.63, "learning_rate": 0.00020582762813365553, "loss": 0.0104, "step": 124440 }, { "epoch": 0.63, "learning_rate": 0.0002058200604406415, "loss": 0.0154, "step": 124450 }, { "epoch": 0.63, "learning_rate": 0.00020581249274762752, "loss": 0.0152, "step": 124460 }, { "epoch": 0.63, "learning_rate": 0.0002058049250546135, "loss": 0.0136, "step": 124470 }, { "epoch": 0.63, "learning_rate": 0.00020579735736159948, "loss": 0.013, "step": 124480 }, { "epoch": 0.63, "learning_rate": 0.0002057897896685855, "loss": 0.0133, "step": 124490 }, { "epoch": 0.63, "learning_rate": 0.00020578222197557147, "loss": 0.0135, "step": 124500 }, { "epoch": 0.63, "learning_rate": 0.00020577465428255745, "loss": 0.014, "step": 124510 }, { "epoch": 0.63, "learning_rate": 0.00020576708658954346, "loss": 0.0176, "step": 124520 }, { "epoch": 0.63, "learning_rate": 0.00020575951889652944, "loss": 0.0134, "step": 124530 }, { "epoch": 0.63, "learning_rate": 0.00020575195120351542, "loss": 0.0143, "step": 124540 }, { "epoch": 0.63, "learning_rate": 0.00020574438351050143, "loss": 0.017, "step": 124550 }, { "epoch": 0.63, "learning_rate": 0.00020573681581748741, "loss": 0.0151, "step": 124560 }, { "epoch": 0.63, "learning_rate": 0.0002057292481244734, "loss": 0.0118, "step": 124570 }, { "epoch": 0.63, "learning_rate": 0.00020572168043145938, "loss": 0.014, "step": 124580 }, { "epoch": 0.63, "learning_rate": 0.00020571411273844539, "loss": 0.0118, "step": 124590 }, { "epoch": 0.63, "learning_rate": 0.00020570654504543137, "loss": 0.0144, "step": 124600 }, { "epoch": 0.63, "learning_rate": 0.00020569897735241735, "loss": 0.0149, "step": 124610 }, { "epoch": 0.63, "learning_rate": 0.00020569140965940336, "loss": 0.0164, "step": 124620 }, { "epoch": 0.63, "learning_rate": 0.00020568384196638934, "loss": 0.0174, "step": 124630 }, { "epoch": 0.63, "learning_rate": 0.00020567627427337532, "loss": 0.0131, "step": 124640 }, { "epoch": 0.63, "learning_rate": 0.00020566870658036133, "loss": 0.0133, "step": 124650 }, { "epoch": 0.63, "learning_rate": 0.0002056611388873473, "loss": 0.0157, "step": 124660 }, { "epoch": 0.63, "learning_rate": 0.0002056535711943333, "loss": 0.0131, "step": 124670 }, { "epoch": 0.63, "learning_rate": 0.0002056460035013193, "loss": 0.0143, "step": 124680 }, { "epoch": 0.63, "learning_rate": 0.00020563843580830528, "loss": 0.0127, "step": 124690 }, { "epoch": 0.63, "learning_rate": 0.00020563086811529126, "loss": 0.0128, "step": 124700 }, { "epoch": 0.63, "learning_rate": 0.00020562330042227727, "loss": 0.0173, "step": 124710 }, { "epoch": 0.63, "learning_rate": 0.00020561573272926325, "loss": 0.0166, "step": 124720 }, { "epoch": 0.63, "learning_rate": 0.00020560816503624923, "loss": 0.0147, "step": 124730 }, { "epoch": 0.63, "learning_rate": 0.00020560059734323524, "loss": 0.0121, "step": 124740 }, { "epoch": 0.63, "learning_rate": 0.00020559302965022122, "loss": 0.0116, "step": 124750 }, { "epoch": 0.63, "learning_rate": 0.0002055854619572072, "loss": 0.0155, "step": 124760 }, { "epoch": 0.63, "learning_rate": 0.0002055778942641932, "loss": 0.0136, "step": 124770 }, { "epoch": 0.63, "learning_rate": 0.0002055703265711792, "loss": 0.013, "step": 124780 }, { "epoch": 0.63, "learning_rate": 0.00020556275887816518, "loss": 0.0167, "step": 124790 }, { "epoch": 0.63, "learning_rate": 0.00020555519118515116, "loss": 0.0149, "step": 124800 }, { "epoch": 0.63, "learning_rate": 0.00020554762349213717, "loss": 0.0176, "step": 124810 }, { "epoch": 0.63, "learning_rate": 0.00020554005579912315, "loss": 0.0127, "step": 124820 }, { "epoch": 0.63, "learning_rate": 0.00020553248810610913, "loss": 0.0127, "step": 124830 }, { "epoch": 0.63, "learning_rate": 0.00020552492041309514, "loss": 0.0134, "step": 124840 }, { "epoch": 0.63, "learning_rate": 0.00020551735272008112, "loss": 0.0144, "step": 124850 }, { "epoch": 0.63, "learning_rate": 0.0002055097850270671, "loss": 0.0129, "step": 124860 }, { "epoch": 0.63, "learning_rate": 0.0002055022173340531, "loss": 0.0165, "step": 124870 }, { "epoch": 0.63, "learning_rate": 0.0002054946496410391, "loss": 0.0154, "step": 124880 }, { "epoch": 0.63, "learning_rate": 0.00020548708194802507, "loss": 0.0165, "step": 124890 }, { "epoch": 0.63, "learning_rate": 0.00020547951425501108, "loss": 0.0141, "step": 124900 }, { "epoch": 0.63, "learning_rate": 0.00020547194656199706, "loss": 0.0107, "step": 124910 }, { "epoch": 0.63, "learning_rate": 0.00020546437886898304, "loss": 0.0128, "step": 124920 }, { "epoch": 0.63, "learning_rate": 0.00020545681117596903, "loss": 0.0165, "step": 124930 }, { "epoch": 0.63, "learning_rate": 0.00020544924348295503, "loss": 0.0152, "step": 124940 }, { "epoch": 0.63, "learning_rate": 0.00020544167578994102, "loss": 0.0172, "step": 124950 }, { "epoch": 0.63, "learning_rate": 0.000205434108096927, "loss": 0.0126, "step": 124960 }, { "epoch": 0.63, "learning_rate": 0.000205426540403913, "loss": 0.0121, "step": 124970 }, { "epoch": 0.63, "learning_rate": 0.000205418972710899, "loss": 0.0107, "step": 124980 }, { "epoch": 0.63, "learning_rate": 0.00020541140501788497, "loss": 0.0136, "step": 124990 }, { "epoch": 0.63, "learning_rate": 0.00020540383732487098, "loss": 0.0122, "step": 125000 }, { "epoch": 0.63, "eval_cer": 0.9144945158062973, "eval_loss": 0.010605525225400925, "eval_runtime": 116.7031, "eval_samples_per_second": 17.138, "eval_steps_per_second": 4.284, "step": 125000 }, { "epoch": 0.63, "learning_rate": 0.00020539626963185696, "loss": 0.0155, "step": 125010 }, { "epoch": 0.63, "learning_rate": 0.00020538870193884294, "loss": 0.0101, "step": 125020 }, { "epoch": 0.63, "learning_rate": 0.00020538113424582895, "loss": 0.0155, "step": 125030 }, { "epoch": 0.63, "learning_rate": 0.00020537356655281493, "loss": 0.0162, "step": 125040 }, { "epoch": 0.63, "learning_rate": 0.0002053659988598009, "loss": 0.0154, "step": 125050 }, { "epoch": 0.63, "learning_rate": 0.00020535843116678692, "loss": 0.013, "step": 125060 }, { "epoch": 0.63, "learning_rate": 0.00020535086347377287, "loss": 0.0175, "step": 125070 }, { "epoch": 0.63, "learning_rate": 0.00020534329578075886, "loss": 0.0138, "step": 125080 }, { "epoch": 0.63, "learning_rate": 0.00020533572808774484, "loss": 0.0142, "step": 125090 }, { "epoch": 0.63, "learning_rate": 0.00020532816039473085, "loss": 0.0121, "step": 125100 }, { "epoch": 0.63, "learning_rate": 0.00020532059270171683, "loss": 0.0125, "step": 125110 }, { "epoch": 0.63, "learning_rate": 0.0002053130250087028, "loss": 0.0135, "step": 125120 }, { "epoch": 0.63, "learning_rate": 0.00020530545731568882, "loss": 0.0145, "step": 125130 }, { "epoch": 0.63, "learning_rate": 0.0002052978896226748, "loss": 0.0122, "step": 125140 }, { "epoch": 0.63, "learning_rate": 0.00020529032192966078, "loss": 0.0107, "step": 125150 }, { "epoch": 0.63, "learning_rate": 0.00020528275423664676, "loss": 0.0136, "step": 125160 }, { "epoch": 0.63, "learning_rate": 0.00020527518654363277, "loss": 0.0103, "step": 125170 }, { "epoch": 0.63, "learning_rate": 0.00020526761885061875, "loss": 0.0146, "step": 125180 }, { "epoch": 0.63, "learning_rate": 0.00020526005115760473, "loss": 0.0118, "step": 125190 }, { "epoch": 0.63, "learning_rate": 0.00020525248346459074, "loss": 0.0113, "step": 125200 }, { "epoch": 0.63, "learning_rate": 0.00020524491577157672, "loss": 0.0166, "step": 125210 }, { "epoch": 0.63, "learning_rate": 0.0002052373480785627, "loss": 0.0146, "step": 125220 }, { "epoch": 0.63, "learning_rate": 0.0002052297803855487, "loss": 0.016, "step": 125230 }, { "epoch": 0.63, "learning_rate": 0.0002052222126925347, "loss": 0.0173, "step": 125240 }, { "epoch": 0.63, "learning_rate": 0.00020521464499952068, "loss": 0.0163, "step": 125250 }, { "epoch": 0.63, "learning_rate": 0.00020520707730650668, "loss": 0.0192, "step": 125260 }, { "epoch": 0.63, "learning_rate": 0.00020519950961349267, "loss": 0.0153, "step": 125270 }, { "epoch": 0.63, "learning_rate": 0.00020519194192047865, "loss": 0.0139, "step": 125280 }, { "epoch": 0.63, "learning_rate": 0.00020518437422746466, "loss": 0.0154, "step": 125290 }, { "epoch": 0.63, "learning_rate": 0.00020517680653445064, "loss": 0.0135, "step": 125300 }, { "epoch": 0.63, "learning_rate": 0.00020516923884143662, "loss": 0.0164, "step": 125310 }, { "epoch": 0.63, "learning_rate": 0.0002051616711484226, "loss": 0.0139, "step": 125320 }, { "epoch": 0.63, "learning_rate": 0.0002051541034554086, "loss": 0.0178, "step": 125330 }, { "epoch": 0.63, "learning_rate": 0.0002051465357623946, "loss": 0.0122, "step": 125340 }, { "epoch": 0.63, "learning_rate": 0.00020513896806938057, "loss": 0.0152, "step": 125350 }, { "epoch": 0.63, "learning_rate": 0.00020513140037636658, "loss": 0.0173, "step": 125360 }, { "epoch": 0.63, "learning_rate": 0.00020512383268335256, "loss": 0.0151, "step": 125370 }, { "epoch": 0.63, "learning_rate": 0.00020511626499033854, "loss": 0.0117, "step": 125380 }, { "epoch": 0.63, "learning_rate": 0.00020510869729732455, "loss": 0.0149, "step": 125390 }, { "epoch": 0.63, "learning_rate": 0.00020510112960431053, "loss": 0.0164, "step": 125400 }, { "epoch": 0.63, "learning_rate": 0.00020509356191129651, "loss": 0.015, "step": 125410 }, { "epoch": 0.63, "learning_rate": 0.00020508599421828252, "loss": 0.0124, "step": 125420 }, { "epoch": 0.63, "learning_rate": 0.0002050784265252685, "loss": 0.0146, "step": 125430 }, { "epoch": 0.63, "learning_rate": 0.00020507085883225449, "loss": 0.0131, "step": 125440 }, { "epoch": 0.63, "learning_rate": 0.0002050632911392405, "loss": 0.0147, "step": 125450 }, { "epoch": 0.63, "learning_rate": 0.00020505572344622648, "loss": 0.0165, "step": 125460 }, { "epoch": 0.63, "learning_rate": 0.00020504815575321246, "loss": 0.0154, "step": 125470 }, { "epoch": 0.63, "learning_rate": 0.00020504058806019844, "loss": 0.0142, "step": 125480 }, { "epoch": 0.63, "learning_rate": 0.00020503302036718445, "loss": 0.0135, "step": 125490 }, { "epoch": 0.63, "learning_rate": 0.00020502545267417043, "loss": 0.0154, "step": 125500 }, { "epoch": 0.63, "learning_rate": 0.0002050178849811564, "loss": 0.0153, "step": 125510 }, { "epoch": 0.63, "learning_rate": 0.00020501031728814242, "loss": 0.0153, "step": 125520 }, { "epoch": 0.63, "learning_rate": 0.0002050027495951284, "loss": 0.012, "step": 125530 }, { "epoch": 0.63, "learning_rate": 0.00020499518190211438, "loss": 0.0141, "step": 125540 }, { "epoch": 0.63, "learning_rate": 0.0002049876142091004, "loss": 0.0155, "step": 125550 }, { "epoch": 0.63, "learning_rate": 0.00020498004651608637, "loss": 0.0136, "step": 125560 }, { "epoch": 0.63, "learning_rate": 0.00020497247882307235, "loss": 0.0139, "step": 125570 }, { "epoch": 0.63, "learning_rate": 0.00020496491113005836, "loss": 0.0128, "step": 125580 }, { "epoch": 0.63, "learning_rate": 0.00020495734343704434, "loss": 0.0139, "step": 125590 }, { "epoch": 0.63, "learning_rate": 0.00020494977574403032, "loss": 0.0159, "step": 125600 }, { "epoch": 0.63, "learning_rate": 0.00020494220805101633, "loss": 0.0131, "step": 125610 }, { "epoch": 0.63, "learning_rate": 0.00020493464035800231, "loss": 0.0133, "step": 125620 }, { "epoch": 0.63, "learning_rate": 0.0002049270726649883, "loss": 0.0143, "step": 125630 }, { "epoch": 0.63, "learning_rate": 0.00020491950497197428, "loss": 0.0164, "step": 125640 }, { "epoch": 0.63, "learning_rate": 0.00020491193727896029, "loss": 0.0103, "step": 125650 }, { "epoch": 0.63, "learning_rate": 0.00020490436958594627, "loss": 0.0116, "step": 125660 }, { "epoch": 0.63, "learning_rate": 0.00020489680189293225, "loss": 0.0149, "step": 125670 }, { "epoch": 0.63, "learning_rate": 0.00020488923419991826, "loss": 0.0128, "step": 125680 }, { "epoch": 0.63, "learning_rate": 0.00020488166650690424, "loss": 0.0188, "step": 125690 }, { "epoch": 0.63, "learning_rate": 0.00020487409881389022, "loss": 0.014, "step": 125700 }, { "epoch": 0.63, "learning_rate": 0.00020486653112087623, "loss": 0.0131, "step": 125710 }, { "epoch": 0.63, "learning_rate": 0.0002048589634278622, "loss": 0.0123, "step": 125720 }, { "epoch": 0.63, "learning_rate": 0.0002048513957348482, "loss": 0.0125, "step": 125730 }, { "epoch": 0.63, "learning_rate": 0.0002048438280418342, "loss": 0.0127, "step": 125740 }, { "epoch": 0.63, "learning_rate": 0.00020483626034882018, "loss": 0.019, "step": 125750 }, { "epoch": 0.63, "learning_rate": 0.00020482869265580616, "loss": 0.0151, "step": 125760 }, { "epoch": 0.63, "learning_rate": 0.00020482112496279217, "loss": 0.0157, "step": 125770 }, { "epoch": 0.63, "learning_rate": 0.00020481355726977815, "loss": 0.0133, "step": 125780 }, { "epoch": 0.63, "learning_rate": 0.00020480598957676413, "loss": 0.0143, "step": 125790 }, { "epoch": 0.63, "learning_rate": 0.00020479842188375014, "loss": 0.0131, "step": 125800 }, { "epoch": 0.63, "learning_rate": 0.00020479085419073612, "loss": 0.0138, "step": 125810 }, { "epoch": 0.63, "learning_rate": 0.0002047832864977221, "loss": 0.013, "step": 125820 }, { "epoch": 0.63, "learning_rate": 0.0002047757188047081, "loss": 0.0137, "step": 125830 }, { "epoch": 0.63, "learning_rate": 0.0002047681511116941, "loss": 0.0138, "step": 125840 }, { "epoch": 0.63, "learning_rate": 0.00020476058341868008, "loss": 0.0178, "step": 125850 }, { "epoch": 0.63, "learning_rate": 0.00020475301572566606, "loss": 0.013, "step": 125860 }, { "epoch": 0.64, "learning_rate": 0.00020474544803265207, "loss": 0.017, "step": 125870 }, { "epoch": 0.64, "learning_rate": 0.00020473788033963805, "loss": 0.0139, "step": 125880 }, { "epoch": 0.64, "learning_rate": 0.00020473031264662403, "loss": 0.0129, "step": 125890 }, { "epoch": 0.64, "learning_rate": 0.00020472274495361004, "loss": 0.0113, "step": 125900 }, { "epoch": 0.64, "learning_rate": 0.00020471517726059602, "loss": 0.0142, "step": 125910 }, { "epoch": 0.64, "learning_rate": 0.000204707609567582, "loss": 0.0166, "step": 125920 }, { "epoch": 0.64, "learning_rate": 0.000204700041874568, "loss": 0.0154, "step": 125930 }, { "epoch": 0.64, "learning_rate": 0.000204692474181554, "loss": 0.0121, "step": 125940 }, { "epoch": 0.64, "learning_rate": 0.00020468490648853997, "loss": 0.0149, "step": 125950 }, { "epoch": 0.64, "learning_rate": 0.00020467733879552598, "loss": 0.0165, "step": 125960 }, { "epoch": 0.64, "learning_rate": 0.00020466977110251196, "loss": 0.0161, "step": 125970 }, { "epoch": 0.64, "learning_rate": 0.00020466220340949794, "loss": 0.0138, "step": 125980 }, { "epoch": 0.64, "learning_rate": 0.00020465463571648393, "loss": 0.0133, "step": 125990 }, { "epoch": 0.64, "learning_rate": 0.00020464706802346993, "loss": 0.015, "step": 126000 }, { "epoch": 0.64, "eval_cer": 0.9145129533326799, "eval_loss": 0.010170434601604939, "eval_runtime": 116.6449, "eval_samples_per_second": 17.146, "eval_steps_per_second": 4.287, "step": 126000 }, { "epoch": 0.64, "learning_rate": 0.00020463950033045592, "loss": 0.0141, "step": 126010 }, { "epoch": 0.64, "learning_rate": 0.0002046319326374419, "loss": 0.0159, "step": 126020 }, { "epoch": 0.64, "learning_rate": 0.0002046243649444279, "loss": 0.0171, "step": 126030 }, { "epoch": 0.64, "learning_rate": 0.0002046167972514139, "loss": 0.014, "step": 126040 }, { "epoch": 0.64, "learning_rate": 0.00020460922955839987, "loss": 0.0152, "step": 126050 }, { "epoch": 0.64, "learning_rate": 0.00020460166186538588, "loss": 0.0184, "step": 126060 }, { "epoch": 0.64, "learning_rate": 0.00020459409417237186, "loss": 0.0149, "step": 126070 }, { "epoch": 0.64, "learning_rate": 0.00020458652647935784, "loss": 0.0139, "step": 126080 }, { "epoch": 0.64, "learning_rate": 0.00020457895878634385, "loss": 0.0134, "step": 126090 }, { "epoch": 0.64, "learning_rate": 0.00020457139109332983, "loss": 0.0206, "step": 126100 }, { "epoch": 0.64, "learning_rate": 0.0002045638234003158, "loss": 0.0154, "step": 126110 }, { "epoch": 0.64, "learning_rate": 0.00020455625570730182, "loss": 0.0186, "step": 126120 }, { "epoch": 0.64, "learning_rate": 0.0002045486880142878, "loss": 0.0124, "step": 126130 }, { "epoch": 0.64, "learning_rate": 0.00020454112032127378, "loss": 0.0152, "step": 126140 }, { "epoch": 0.64, "learning_rate": 0.00020453355262825976, "loss": 0.0171, "step": 126150 }, { "epoch": 0.64, "learning_rate": 0.00020452598493524577, "loss": 0.0144, "step": 126160 }, { "epoch": 0.64, "learning_rate": 0.00020451841724223175, "loss": 0.013, "step": 126170 }, { "epoch": 0.64, "learning_rate": 0.00020451084954921774, "loss": 0.0151, "step": 126180 }, { "epoch": 0.64, "learning_rate": 0.00020450328185620374, "loss": 0.0122, "step": 126190 }, { "epoch": 0.64, "learning_rate": 0.00020449571416318973, "loss": 0.0144, "step": 126200 }, { "epoch": 0.64, "learning_rate": 0.0002044881464701757, "loss": 0.014, "step": 126210 }, { "epoch": 0.64, "learning_rate": 0.00020448057877716172, "loss": 0.0135, "step": 126220 }, { "epoch": 0.64, "learning_rate": 0.0002044730110841477, "loss": 0.0141, "step": 126230 }, { "epoch": 0.64, "learning_rate": 0.00020446544339113368, "loss": 0.015, "step": 126240 }, { "epoch": 0.64, "learning_rate": 0.0002044578756981197, "loss": 0.0137, "step": 126250 }, { "epoch": 0.64, "learning_rate": 0.00020445030800510567, "loss": 0.0139, "step": 126260 }, { "epoch": 0.64, "learning_rate": 0.00020444274031209165, "loss": 0.0187, "step": 126270 }, { "epoch": 0.64, "learning_rate": 0.00020443517261907766, "loss": 0.0163, "step": 126280 }, { "epoch": 0.64, "learning_rate": 0.00020442760492606364, "loss": 0.0122, "step": 126290 }, { "epoch": 0.64, "learning_rate": 0.00020442003723304962, "loss": 0.0123, "step": 126300 }, { "epoch": 0.64, "learning_rate": 0.00020441246954003563, "loss": 0.0142, "step": 126310 }, { "epoch": 0.64, "learning_rate": 0.00020440490184702158, "loss": 0.0132, "step": 126320 }, { "epoch": 0.64, "learning_rate": 0.00020439733415400757, "loss": 0.0179, "step": 126330 }, { "epoch": 0.64, "learning_rate": 0.00020438976646099355, "loss": 0.0159, "step": 126340 }, { "epoch": 0.64, "learning_rate": 0.00020438219876797956, "loss": 0.0154, "step": 126350 }, { "epoch": 0.64, "learning_rate": 0.00020437463107496554, "loss": 0.0138, "step": 126360 }, { "epoch": 0.64, "learning_rate": 0.00020436706338195152, "loss": 0.0133, "step": 126370 }, { "epoch": 0.64, "learning_rate": 0.0002043594956889375, "loss": 0.0143, "step": 126380 }, { "epoch": 0.64, "learning_rate": 0.0002043519279959235, "loss": 0.0127, "step": 126390 }, { "epoch": 0.64, "learning_rate": 0.0002043443603029095, "loss": 0.0161, "step": 126400 }, { "epoch": 0.64, "learning_rate": 0.00020433679260989547, "loss": 0.0146, "step": 126410 }, { "epoch": 0.64, "learning_rate": 0.00020432922491688148, "loss": 0.0124, "step": 126420 }, { "epoch": 0.64, "learning_rate": 0.00020432165722386746, "loss": 0.0115, "step": 126430 }, { "epoch": 0.64, "learning_rate": 0.00020431408953085344, "loss": 0.0145, "step": 126440 }, { "epoch": 0.64, "learning_rate": 0.00020430652183783945, "loss": 0.0143, "step": 126450 }, { "epoch": 0.64, "learning_rate": 0.00020429895414482543, "loss": 0.0117, "step": 126460 }, { "epoch": 0.64, "learning_rate": 0.00020429138645181141, "loss": 0.0154, "step": 126470 }, { "epoch": 0.64, "learning_rate": 0.00020428381875879742, "loss": 0.0141, "step": 126480 }, { "epoch": 0.64, "learning_rate": 0.0002042762510657834, "loss": 0.0148, "step": 126490 }, { "epoch": 0.64, "learning_rate": 0.00020426868337276939, "loss": 0.0143, "step": 126500 }, { "epoch": 0.64, "learning_rate": 0.0002042611156797554, "loss": 0.0168, "step": 126510 }, { "epoch": 0.64, "learning_rate": 0.00020425354798674138, "loss": 0.0119, "step": 126520 }, { "epoch": 0.64, "learning_rate": 0.00020424598029372736, "loss": 0.0133, "step": 126530 }, { "epoch": 0.64, "learning_rate": 0.00020423841260071334, "loss": 0.0125, "step": 126540 }, { "epoch": 0.64, "learning_rate": 0.00020423084490769935, "loss": 0.0125, "step": 126550 }, { "epoch": 0.64, "learning_rate": 0.00020422327721468533, "loss": 0.0168, "step": 126560 }, { "epoch": 0.64, "learning_rate": 0.0002042157095216713, "loss": 0.0127, "step": 126570 }, { "epoch": 0.64, "learning_rate": 0.00020420814182865732, "loss": 0.0128, "step": 126580 }, { "epoch": 0.64, "learning_rate": 0.0002042005741356433, "loss": 0.0142, "step": 126590 }, { "epoch": 0.64, "learning_rate": 0.00020419300644262928, "loss": 0.0161, "step": 126600 }, { "epoch": 0.64, "learning_rate": 0.0002041854387496153, "loss": 0.0128, "step": 126610 }, { "epoch": 0.64, "learning_rate": 0.00020417787105660127, "loss": 0.015, "step": 126620 }, { "epoch": 0.64, "learning_rate": 0.00020417030336358725, "loss": 0.0137, "step": 126630 }, { "epoch": 0.64, "learning_rate": 0.00020416273567057326, "loss": 0.0127, "step": 126640 }, { "epoch": 0.64, "learning_rate": 0.00020415516797755924, "loss": 0.0119, "step": 126650 }, { "epoch": 0.64, "learning_rate": 0.00020414760028454522, "loss": 0.0109, "step": 126660 }, { "epoch": 0.64, "learning_rate": 0.00020414003259153123, "loss": 0.0129, "step": 126670 }, { "epoch": 0.64, "learning_rate": 0.00020413246489851721, "loss": 0.014, "step": 126680 }, { "epoch": 0.64, "learning_rate": 0.0002041248972055032, "loss": 0.0144, "step": 126690 }, { "epoch": 0.64, "learning_rate": 0.0002041173295124892, "loss": 0.0172, "step": 126700 }, { "epoch": 0.64, "learning_rate": 0.00020410976181947519, "loss": 0.0159, "step": 126710 }, { "epoch": 0.64, "learning_rate": 0.00020410219412646117, "loss": 0.0163, "step": 126720 }, { "epoch": 0.64, "learning_rate": 0.00020409462643344715, "loss": 0.0143, "step": 126730 }, { "epoch": 0.64, "learning_rate": 0.00020408705874043316, "loss": 0.0148, "step": 126740 }, { "epoch": 0.64, "learning_rate": 0.00020407949104741914, "loss": 0.0125, "step": 126750 }, { "epoch": 0.64, "learning_rate": 0.00020407192335440512, "loss": 0.0148, "step": 126760 }, { "epoch": 0.64, "learning_rate": 0.00020406435566139113, "loss": 0.0166, "step": 126770 }, { "epoch": 0.64, "learning_rate": 0.0002040567879683771, "loss": 0.0163, "step": 126780 }, { "epoch": 0.64, "learning_rate": 0.0002040492202753631, "loss": 0.0127, "step": 126790 }, { "epoch": 0.64, "learning_rate": 0.0002040416525823491, "loss": 0.0124, "step": 126800 }, { "epoch": 0.64, "learning_rate": 0.00020403408488933508, "loss": 0.0161, "step": 126810 }, { "epoch": 0.64, "learning_rate": 0.00020402651719632106, "loss": 0.0161, "step": 126820 }, { "epoch": 0.64, "learning_rate": 0.00020401894950330707, "loss": 0.0134, "step": 126830 }, { "epoch": 0.64, "learning_rate": 0.00020401138181029305, "loss": 0.0134, "step": 126840 }, { "epoch": 0.64, "learning_rate": 0.00020400381411727903, "loss": 0.0131, "step": 126850 }, { "epoch": 0.64, "learning_rate": 0.00020399624642426504, "loss": 0.0145, "step": 126860 }, { "epoch": 0.64, "learning_rate": 0.00020398867873125102, "loss": 0.0111, "step": 126870 }, { "epoch": 0.64, "learning_rate": 0.000203981111038237, "loss": 0.0137, "step": 126880 }, { "epoch": 0.64, "learning_rate": 0.000203973543345223, "loss": 0.0146, "step": 126890 }, { "epoch": 0.64, "learning_rate": 0.000203965975652209, "loss": 0.0117, "step": 126900 }, { "epoch": 0.64, "learning_rate": 0.00020395840795919498, "loss": 0.0152, "step": 126910 }, { "epoch": 0.64, "learning_rate": 0.00020395084026618096, "loss": 0.0147, "step": 126920 }, { "epoch": 0.64, "learning_rate": 0.00020394327257316697, "loss": 0.0108, "step": 126930 }, { "epoch": 0.64, "learning_rate": 0.00020393570488015295, "loss": 0.0163, "step": 126940 }, { "epoch": 0.64, "learning_rate": 0.00020392813718713893, "loss": 0.0122, "step": 126950 }, { "epoch": 0.64, "learning_rate": 0.00020392056949412494, "loss": 0.019, "step": 126960 }, { "epoch": 0.64, "learning_rate": 0.00020391300180111092, "loss": 0.0196, "step": 126970 }, { "epoch": 0.64, "learning_rate": 0.0002039054341080969, "loss": 0.0141, "step": 126980 }, { "epoch": 0.64, "learning_rate": 0.0002038978664150829, "loss": 0.012, "step": 126990 }, { "epoch": 0.64, "learning_rate": 0.0002038902987220689, "loss": 0.0183, "step": 127000 }, { "epoch": 0.64, "eval_cer": 0.9145129533326799, "eval_loss": 0.010238048620522022, "eval_runtime": 116.573, "eval_samples_per_second": 17.157, "eval_steps_per_second": 4.289, "step": 127000 }, { "epoch": 0.64, "learning_rate": 0.00020388273102905487, "loss": 0.0118, "step": 127010 }, { "epoch": 0.64, "learning_rate": 0.00020387516333604088, "loss": 0.0171, "step": 127020 }, { "epoch": 0.64, "learning_rate": 0.00020386759564302686, "loss": 0.0134, "step": 127030 }, { "epoch": 0.64, "learning_rate": 0.00020386002795001284, "loss": 0.0142, "step": 127040 }, { "epoch": 0.64, "learning_rate": 0.00020385246025699883, "loss": 0.0163, "step": 127050 }, { "epoch": 0.64, "learning_rate": 0.00020384489256398483, "loss": 0.0146, "step": 127060 }, { "epoch": 0.64, "learning_rate": 0.00020383732487097082, "loss": 0.0149, "step": 127070 }, { "epoch": 0.64, "learning_rate": 0.0002038297571779568, "loss": 0.0122, "step": 127080 }, { "epoch": 0.64, "learning_rate": 0.0002038221894849428, "loss": 0.0158, "step": 127090 }, { "epoch": 0.64, "learning_rate": 0.0002038146217919288, "loss": 0.0139, "step": 127100 }, { "epoch": 0.64, "learning_rate": 0.00020380705409891477, "loss": 0.0133, "step": 127110 }, { "epoch": 0.64, "learning_rate": 0.00020379948640590078, "loss": 0.0113, "step": 127120 }, { "epoch": 0.64, "learning_rate": 0.00020379191871288676, "loss": 0.0169, "step": 127130 }, { "epoch": 0.64, "learning_rate": 0.00020378435101987274, "loss": 0.0146, "step": 127140 }, { "epoch": 0.64, "learning_rate": 0.00020377678332685875, "loss": 0.0159, "step": 127150 }, { "epoch": 0.64, "learning_rate": 0.00020376921563384473, "loss": 0.0127, "step": 127160 }, { "epoch": 0.64, "learning_rate": 0.0002037616479408307, "loss": 0.0113, "step": 127170 }, { "epoch": 0.64, "learning_rate": 0.00020375408024781672, "loss": 0.0157, "step": 127180 }, { "epoch": 0.64, "learning_rate": 0.0002037465125548027, "loss": 0.0146, "step": 127190 }, { "epoch": 0.64, "learning_rate": 0.00020373894486178868, "loss": 0.0126, "step": 127200 }, { "epoch": 0.64, "learning_rate": 0.0002037313771687747, "loss": 0.0143, "step": 127210 }, { "epoch": 0.64, "learning_rate": 0.00020372380947576067, "loss": 0.0108, "step": 127220 }, { "epoch": 0.64, "learning_rate": 0.00020371624178274665, "loss": 0.0135, "step": 127230 }, { "epoch": 0.64, "learning_rate": 0.00020370867408973264, "loss": 0.0126, "step": 127240 }, { "epoch": 0.64, "learning_rate": 0.00020370110639671864, "loss": 0.0116, "step": 127250 }, { "epoch": 0.64, "learning_rate": 0.00020369353870370463, "loss": 0.0129, "step": 127260 }, { "epoch": 0.64, "learning_rate": 0.0002036859710106906, "loss": 0.0125, "step": 127270 }, { "epoch": 0.64, "learning_rate": 0.00020367840331767662, "loss": 0.0186, "step": 127280 }, { "epoch": 0.64, "learning_rate": 0.0002036708356246626, "loss": 0.012, "step": 127290 }, { "epoch": 0.64, "learning_rate": 0.00020366326793164858, "loss": 0.0162, "step": 127300 }, { "epoch": 0.64, "learning_rate": 0.0002036557002386346, "loss": 0.0141, "step": 127310 }, { "epoch": 0.64, "learning_rate": 0.00020364813254562057, "loss": 0.0152, "step": 127320 }, { "epoch": 0.64, "learning_rate": 0.00020364056485260655, "loss": 0.0136, "step": 127330 }, { "epoch": 0.64, "learning_rate": 0.00020363299715959256, "loss": 0.0158, "step": 127340 }, { "epoch": 0.64, "learning_rate": 0.00020362542946657854, "loss": 0.0128, "step": 127350 }, { "epoch": 0.64, "learning_rate": 0.00020361786177356452, "loss": 0.0141, "step": 127360 }, { "epoch": 0.64, "learning_rate": 0.00020361029408055053, "loss": 0.0118, "step": 127370 }, { "epoch": 0.64, "learning_rate": 0.0002036027263875365, "loss": 0.0121, "step": 127380 }, { "epoch": 0.64, "learning_rate": 0.0002035951586945225, "loss": 0.0129, "step": 127390 }, { "epoch": 0.64, "learning_rate": 0.00020358759100150848, "loss": 0.0127, "step": 127400 }, { "epoch": 0.64, "learning_rate": 0.00020358002330849448, "loss": 0.0146, "step": 127410 }, { "epoch": 0.64, "learning_rate": 0.00020357245561548047, "loss": 0.0154, "step": 127420 }, { "epoch": 0.64, "learning_rate": 0.00020356488792246645, "loss": 0.0091, "step": 127430 }, { "epoch": 0.64, "learning_rate": 0.00020355732022945246, "loss": 0.0132, "step": 127440 }, { "epoch": 0.64, "learning_rate": 0.00020354975253643844, "loss": 0.0116, "step": 127450 }, { "epoch": 0.64, "learning_rate": 0.00020354218484342442, "loss": 0.0136, "step": 127460 }, { "epoch": 0.64, "learning_rate": 0.00020353461715041043, "loss": 0.0141, "step": 127470 }, { "epoch": 0.64, "learning_rate": 0.0002035270494573964, "loss": 0.0129, "step": 127480 }, { "epoch": 0.64, "learning_rate": 0.0002035194817643824, "loss": 0.016, "step": 127490 }, { "epoch": 0.64, "learning_rate": 0.0002035119140713684, "loss": 0.0121, "step": 127500 }, { "epoch": 0.64, "learning_rate": 0.00020350434637835438, "loss": 0.0146, "step": 127510 }, { "epoch": 0.64, "learning_rate": 0.00020349677868534036, "loss": 0.0117, "step": 127520 }, { "epoch": 0.64, "learning_rate": 0.00020348921099232637, "loss": 0.0141, "step": 127530 }, { "epoch": 0.64, "learning_rate": 0.00020348164329931235, "loss": 0.0107, "step": 127540 }, { "epoch": 0.64, "learning_rate": 0.00020347407560629833, "loss": 0.0138, "step": 127550 }, { "epoch": 0.64, "learning_rate": 0.00020346650791328431, "loss": 0.0116, "step": 127560 }, { "epoch": 0.64, "learning_rate": 0.00020345894022027032, "loss": 0.0131, "step": 127570 }, { "epoch": 0.64, "learning_rate": 0.00020345137252725628, "loss": 0.0171, "step": 127580 }, { "epoch": 0.64, "learning_rate": 0.00020344380483424226, "loss": 0.0128, "step": 127590 }, { "epoch": 0.64, "learning_rate": 0.00020343623714122827, "loss": 0.0127, "step": 127600 }, { "epoch": 0.64, "learning_rate": 0.00020342866944821425, "loss": 0.0133, "step": 127610 }, { "epoch": 0.64, "learning_rate": 0.00020342110175520023, "loss": 0.0124, "step": 127620 }, { "epoch": 0.64, "learning_rate": 0.0002034135340621862, "loss": 0.0123, "step": 127630 }, { "epoch": 0.64, "learning_rate": 0.00020340596636917222, "loss": 0.0148, "step": 127640 }, { "epoch": 0.64, "learning_rate": 0.0002033983986761582, "loss": 0.0109, "step": 127650 }, { "epoch": 0.64, "learning_rate": 0.00020339083098314418, "loss": 0.013, "step": 127660 }, { "epoch": 0.64, "learning_rate": 0.0002033832632901302, "loss": 0.0124, "step": 127670 }, { "epoch": 0.64, "learning_rate": 0.00020337569559711617, "loss": 0.0161, "step": 127680 }, { "epoch": 0.64, "learning_rate": 0.00020336812790410215, "loss": 0.0146, "step": 127690 }, { "epoch": 0.64, "learning_rate": 0.00020336056021108816, "loss": 0.0156, "step": 127700 }, { "epoch": 0.64, "learning_rate": 0.00020335299251807414, "loss": 0.0141, "step": 127710 }, { "epoch": 0.64, "learning_rate": 0.00020334542482506013, "loss": 0.0164, "step": 127720 }, { "epoch": 0.64, "learning_rate": 0.00020333785713204613, "loss": 0.0194, "step": 127730 }, { "epoch": 0.64, "learning_rate": 0.00020333028943903212, "loss": 0.0193, "step": 127740 }, { "epoch": 0.64, "learning_rate": 0.0002033227217460181, "loss": 0.0237, "step": 127750 }, { "epoch": 0.64, "learning_rate": 0.0002033151540530041, "loss": 0.0147, "step": 127760 }, { "epoch": 0.64, "learning_rate": 0.0002033075863599901, "loss": 0.0134, "step": 127770 }, { "epoch": 0.64, "learning_rate": 0.00020330001866697607, "loss": 0.0156, "step": 127780 }, { "epoch": 0.64, "learning_rate": 0.00020329245097396205, "loss": 0.0145, "step": 127790 }, { "epoch": 0.64, "learning_rate": 0.00020328488328094806, "loss": 0.015, "step": 127800 }, { "epoch": 0.64, "learning_rate": 0.00020327731558793404, "loss": 0.0155, "step": 127810 }, { "epoch": 0.64, "learning_rate": 0.00020326974789492002, "loss": 0.0139, "step": 127820 }, { "epoch": 0.64, "learning_rate": 0.00020326218020190603, "loss": 0.015, "step": 127830 }, { "epoch": 0.64, "learning_rate": 0.000203254612508892, "loss": 0.0138, "step": 127840 }, { "epoch": 0.65, "learning_rate": 0.000203247044815878, "loss": 0.0129, "step": 127850 }, { "epoch": 0.65, "learning_rate": 0.000203239477122864, "loss": 0.0147, "step": 127860 }, { "epoch": 0.65, "learning_rate": 0.00020323190942984998, "loss": 0.0156, "step": 127870 }, { "epoch": 0.65, "learning_rate": 0.00020322434173683596, "loss": 0.0125, "step": 127880 }, { "epoch": 0.65, "learning_rate": 0.00020321677404382197, "loss": 0.0148, "step": 127890 }, { "epoch": 0.65, "learning_rate": 0.00020320920635080795, "loss": 0.0119, "step": 127900 }, { "epoch": 0.65, "learning_rate": 0.00020320163865779394, "loss": 0.0138, "step": 127910 }, { "epoch": 0.65, "learning_rate": 0.00020319407096477994, "loss": 0.0157, "step": 127920 }, { "epoch": 0.65, "learning_rate": 0.00020318650327176593, "loss": 0.0142, "step": 127930 }, { "epoch": 0.65, "learning_rate": 0.0002031789355787519, "loss": 0.0132, "step": 127940 }, { "epoch": 0.65, "learning_rate": 0.0002031713678857379, "loss": 0.0162, "step": 127950 }, { "epoch": 0.65, "learning_rate": 0.0002031638001927239, "loss": 0.0149, "step": 127960 }, { "epoch": 0.65, "learning_rate": 0.00020315623249970988, "loss": 0.0151, "step": 127970 }, { "epoch": 0.65, "learning_rate": 0.00020314866480669586, "loss": 0.0128, "step": 127980 }, { "epoch": 0.65, "learning_rate": 0.00020314109711368187, "loss": 0.0151, "step": 127990 }, { "epoch": 0.65, "learning_rate": 0.00020313352942066785, "loss": 0.0139, "step": 128000 }, { "epoch": 0.65, "eval_cer": 0.914481900656667, "eval_loss": 0.01020896527916193, "eval_runtime": 116.605, "eval_samples_per_second": 17.152, "eval_steps_per_second": 4.288, "step": 128000 }, { "epoch": 0.65, "learning_rate": 0.00020312596172765383, "loss": 0.0147, "step": 128010 }, { "epoch": 0.65, "learning_rate": 0.00020311839403463984, "loss": 0.0158, "step": 128020 }, { "epoch": 0.65, "learning_rate": 0.00020311082634162582, "loss": 0.0148, "step": 128030 }, { "epoch": 0.65, "learning_rate": 0.0002031032586486118, "loss": 0.0171, "step": 128040 }, { "epoch": 0.65, "learning_rate": 0.0002030956909555978, "loss": 0.0156, "step": 128050 }, { "epoch": 0.65, "learning_rate": 0.0002030881232625838, "loss": 0.0135, "step": 128060 }, { "epoch": 0.65, "learning_rate": 0.00020308055556956977, "loss": 0.0196, "step": 128070 }, { "epoch": 0.65, "learning_rate": 0.00020307298787655578, "loss": 0.0173, "step": 128080 }, { "epoch": 0.65, "learning_rate": 0.00020306542018354176, "loss": 0.018, "step": 128090 }, { "epoch": 0.65, "learning_rate": 0.00020305785249052775, "loss": 0.0159, "step": 128100 }, { "epoch": 0.65, "learning_rate": 0.00020305028479751375, "loss": 0.0195, "step": 128110 }, { "epoch": 0.65, "learning_rate": 0.00020304271710449974, "loss": 0.0158, "step": 128120 }, { "epoch": 0.65, "learning_rate": 0.00020303514941148572, "loss": 0.0177, "step": 128130 }, { "epoch": 0.65, "learning_rate": 0.0002030275817184717, "loss": 0.0116, "step": 128140 }, { "epoch": 0.65, "learning_rate": 0.0002030200140254577, "loss": 0.0167, "step": 128150 }, { "epoch": 0.65, "learning_rate": 0.0002030124463324437, "loss": 0.0141, "step": 128160 }, { "epoch": 0.65, "learning_rate": 0.00020300487863942967, "loss": 0.0144, "step": 128170 }, { "epoch": 0.65, "learning_rate": 0.00020299731094641568, "loss": 0.0141, "step": 128180 }, { "epoch": 0.65, "learning_rate": 0.00020298974325340166, "loss": 0.013, "step": 128190 }, { "epoch": 0.65, "learning_rate": 0.00020298217556038764, "loss": 0.0141, "step": 128200 }, { "epoch": 0.65, "learning_rate": 0.00020297460786737365, "loss": 0.0165, "step": 128210 }, { "epoch": 0.65, "learning_rate": 0.00020296704017435963, "loss": 0.015, "step": 128220 }, { "epoch": 0.65, "learning_rate": 0.0002029594724813456, "loss": 0.0138, "step": 128230 }, { "epoch": 0.65, "learning_rate": 0.00020295190478833162, "loss": 0.014, "step": 128240 }, { "epoch": 0.65, "learning_rate": 0.0002029443370953176, "loss": 0.0146, "step": 128250 }, { "epoch": 0.65, "learning_rate": 0.00020293676940230358, "loss": 0.0154, "step": 128260 }, { "epoch": 0.65, "learning_rate": 0.0002029292017092896, "loss": 0.0186, "step": 128270 }, { "epoch": 0.65, "learning_rate": 0.00020292163401627557, "loss": 0.0147, "step": 128280 }, { "epoch": 0.65, "learning_rate": 0.00020291406632326156, "loss": 0.0123, "step": 128290 }, { "epoch": 0.65, "learning_rate": 0.00020290649863024754, "loss": 0.0133, "step": 128300 }, { "epoch": 0.65, "learning_rate": 0.00020289893093723355, "loss": 0.0132, "step": 128310 }, { "epoch": 0.65, "learning_rate": 0.00020289136324421953, "loss": 0.0137, "step": 128320 }, { "epoch": 0.65, "learning_rate": 0.0002028837955512055, "loss": 0.0127, "step": 128330 }, { "epoch": 0.65, "learning_rate": 0.00020287622785819152, "loss": 0.0156, "step": 128340 }, { "epoch": 0.65, "learning_rate": 0.0002028686601651775, "loss": 0.0131, "step": 128350 }, { "epoch": 0.65, "learning_rate": 0.00020286109247216348, "loss": 0.0191, "step": 128360 }, { "epoch": 0.65, "learning_rate": 0.0002028535247791495, "loss": 0.0147, "step": 128370 }, { "epoch": 0.65, "learning_rate": 0.00020284595708613547, "loss": 0.0142, "step": 128380 }, { "epoch": 0.65, "learning_rate": 0.00020283838939312145, "loss": 0.0148, "step": 128390 }, { "epoch": 0.65, "learning_rate": 0.00020283082170010746, "loss": 0.0162, "step": 128400 }, { "epoch": 0.65, "learning_rate": 0.00020282325400709344, "loss": 0.01, "step": 128410 }, { "epoch": 0.65, "learning_rate": 0.00020281568631407942, "loss": 0.0144, "step": 128420 }, { "epoch": 0.65, "learning_rate": 0.00020280811862106543, "loss": 0.0126, "step": 128430 }, { "epoch": 0.65, "learning_rate": 0.0002028005509280514, "loss": 0.0132, "step": 128440 }, { "epoch": 0.65, "learning_rate": 0.0002027929832350374, "loss": 0.0175, "step": 128450 }, { "epoch": 0.65, "learning_rate": 0.00020278541554202338, "loss": 0.0135, "step": 128460 }, { "epoch": 0.65, "learning_rate": 0.00020277784784900938, "loss": 0.0134, "step": 128470 }, { "epoch": 0.65, "learning_rate": 0.00020277028015599537, "loss": 0.0134, "step": 128480 }, { "epoch": 0.65, "learning_rate": 0.00020276271246298135, "loss": 0.0131, "step": 128490 }, { "epoch": 0.65, "learning_rate": 0.00020275514476996736, "loss": 0.0153, "step": 128500 }, { "epoch": 0.65, "learning_rate": 0.00020274757707695334, "loss": 0.015, "step": 128510 }, { "epoch": 0.65, "learning_rate": 0.00020274000938393932, "loss": 0.0134, "step": 128520 }, { "epoch": 0.65, "learning_rate": 0.00020273244169092533, "loss": 0.0214, "step": 128530 }, { "epoch": 0.65, "learning_rate": 0.0002027248739979113, "loss": 0.0165, "step": 128540 }, { "epoch": 0.65, "learning_rate": 0.0002027173063048973, "loss": 0.0131, "step": 128550 }, { "epoch": 0.65, "learning_rate": 0.0002027097386118833, "loss": 0.0133, "step": 128560 }, { "epoch": 0.65, "learning_rate": 0.00020270217091886928, "loss": 0.0182, "step": 128570 }, { "epoch": 0.65, "learning_rate": 0.00020269460322585526, "loss": 0.0145, "step": 128580 }, { "epoch": 0.65, "learning_rate": 0.00020268703553284127, "loss": 0.0129, "step": 128590 }, { "epoch": 0.65, "learning_rate": 0.00020267946783982725, "loss": 0.0129, "step": 128600 }, { "epoch": 0.65, "learning_rate": 0.00020267190014681323, "loss": 0.0142, "step": 128610 }, { "epoch": 0.65, "learning_rate": 0.00020266433245379924, "loss": 0.0161, "step": 128620 }, { "epoch": 0.65, "learning_rate": 0.00020265676476078522, "loss": 0.0127, "step": 128630 }, { "epoch": 0.65, "learning_rate": 0.0002026491970677712, "loss": 0.0149, "step": 128640 }, { "epoch": 0.65, "learning_rate": 0.00020264162937475719, "loss": 0.0121, "step": 128650 }, { "epoch": 0.65, "learning_rate": 0.0002026340616817432, "loss": 0.0127, "step": 128660 }, { "epoch": 0.65, "learning_rate": 0.00020262649398872918, "loss": 0.0126, "step": 128670 }, { "epoch": 0.65, "learning_rate": 0.00020261892629571516, "loss": 0.0126, "step": 128680 }, { "epoch": 0.65, "learning_rate": 0.00020261135860270117, "loss": 0.0142, "step": 128690 }, { "epoch": 0.65, "learning_rate": 0.00020260379090968715, "loss": 0.0122, "step": 128700 }, { "epoch": 0.65, "learning_rate": 0.00020259622321667313, "loss": 0.0133, "step": 128710 }, { "epoch": 0.65, "learning_rate": 0.00020258865552365914, "loss": 0.0155, "step": 128720 }, { "epoch": 0.65, "learning_rate": 0.00020258108783064512, "loss": 0.0134, "step": 128730 }, { "epoch": 0.65, "learning_rate": 0.0002025735201376311, "loss": 0.0125, "step": 128740 }, { "epoch": 0.65, "learning_rate": 0.0002025659524446171, "loss": 0.0118, "step": 128750 }, { "epoch": 0.65, "learning_rate": 0.0002025583847516031, "loss": 0.0157, "step": 128760 }, { "epoch": 0.65, "learning_rate": 0.00020255081705858907, "loss": 0.0127, "step": 128770 }, { "epoch": 0.65, "learning_rate": 0.00020254324936557508, "loss": 0.0152, "step": 128780 }, { "epoch": 0.65, "learning_rate": 0.00020253568167256106, "loss": 0.0172, "step": 128790 }, { "epoch": 0.65, "learning_rate": 0.00020252811397954704, "loss": 0.0157, "step": 128800 }, { "epoch": 0.65, "learning_rate": 0.00020252054628653302, "loss": 0.0136, "step": 128810 }, { "epoch": 0.65, "learning_rate": 0.00020251297859351903, "loss": 0.0129, "step": 128820 }, { "epoch": 0.65, "learning_rate": 0.00020250541090050501, "loss": 0.0151, "step": 128830 }, { "epoch": 0.65, "learning_rate": 0.00020249784320749097, "loss": 0.0163, "step": 128840 }, { "epoch": 0.65, "learning_rate": 0.00020249027551447695, "loss": 0.0118, "step": 128850 }, { "epoch": 0.65, "learning_rate": 0.00020248270782146296, "loss": 0.0117, "step": 128860 }, { "epoch": 0.65, "learning_rate": 0.00020247514012844894, "loss": 0.0146, "step": 128870 }, { "epoch": 0.65, "learning_rate": 0.00020246757243543492, "loss": 0.015, "step": 128880 }, { "epoch": 0.65, "learning_rate": 0.00020246000474242093, "loss": 0.0144, "step": 128890 }, { "epoch": 0.65, "learning_rate": 0.0002024524370494069, "loss": 0.016, "step": 128900 }, { "epoch": 0.65, "learning_rate": 0.0002024448693563929, "loss": 0.0163, "step": 128910 }, { "epoch": 0.65, "learning_rate": 0.0002024373016633789, "loss": 0.0116, "step": 128920 }, { "epoch": 0.65, "learning_rate": 0.00020242973397036488, "loss": 0.0106, "step": 128930 }, { "epoch": 0.65, "learning_rate": 0.00020242216627735086, "loss": 0.0153, "step": 128940 }, { "epoch": 0.65, "learning_rate": 0.00020241459858433687, "loss": 0.0124, "step": 128950 }, { "epoch": 0.65, "learning_rate": 0.00020240703089132285, "loss": 0.0128, "step": 128960 }, { "epoch": 0.65, "learning_rate": 0.00020239946319830884, "loss": 0.0117, "step": 128970 }, { "epoch": 0.65, "learning_rate": 0.00020239189550529484, "loss": 0.0112, "step": 128980 }, { "epoch": 0.65, "learning_rate": 0.00020238432781228083, "loss": 0.0128, "step": 128990 }, { "epoch": 0.65, "learning_rate": 0.0002023767601192668, "loss": 0.0141, "step": 129000 }, { "epoch": 0.65, "eval_cer": 0.9144857822411687, "eval_loss": 0.009670346975326538, "eval_runtime": 116.6611, "eval_samples_per_second": 17.144, "eval_steps_per_second": 4.286, "step": 129000 }, { "epoch": 0.65, "learning_rate": 0.00020236919242625282, "loss": 0.0127, "step": 129010 }, { "epoch": 0.65, "learning_rate": 0.0002023616247332388, "loss": 0.0134, "step": 129020 }, { "epoch": 0.65, "learning_rate": 0.00020235405704022478, "loss": 0.0115, "step": 129030 }, { "epoch": 0.65, "learning_rate": 0.00020234648934721076, "loss": 0.0146, "step": 129040 }, { "epoch": 0.65, "learning_rate": 0.00020233892165419677, "loss": 0.0119, "step": 129050 }, { "epoch": 0.65, "learning_rate": 0.00020233135396118275, "loss": 0.0129, "step": 129060 }, { "epoch": 0.65, "learning_rate": 0.00020232378626816873, "loss": 0.0137, "step": 129070 }, { "epoch": 0.65, "learning_rate": 0.00020231621857515474, "loss": 0.0115, "step": 129080 }, { "epoch": 0.65, "learning_rate": 0.00020230865088214072, "loss": 0.0122, "step": 129090 }, { "epoch": 0.65, "learning_rate": 0.0002023010831891267, "loss": 0.0133, "step": 129100 }, { "epoch": 0.65, "learning_rate": 0.0002022935154961127, "loss": 0.0194, "step": 129110 }, { "epoch": 0.65, "learning_rate": 0.0002022859478030987, "loss": 0.0124, "step": 129120 }, { "epoch": 0.65, "learning_rate": 0.00020227838011008467, "loss": 0.0149, "step": 129130 }, { "epoch": 0.65, "learning_rate": 0.00020227081241707068, "loss": 0.0134, "step": 129140 }, { "epoch": 0.65, "learning_rate": 0.00020226324472405666, "loss": 0.0127, "step": 129150 }, { "epoch": 0.65, "learning_rate": 0.00020225567703104265, "loss": 0.0111, "step": 129160 }, { "epoch": 0.65, "learning_rate": 0.00020224810933802865, "loss": 0.0187, "step": 129170 }, { "epoch": 0.65, "learning_rate": 0.00020224054164501464, "loss": 0.0127, "step": 129180 }, { "epoch": 0.65, "learning_rate": 0.00020223297395200062, "loss": 0.0135, "step": 129190 }, { "epoch": 0.65, "learning_rate": 0.0002022254062589866, "loss": 0.0155, "step": 129200 }, { "epoch": 0.65, "learning_rate": 0.0002022178385659726, "loss": 0.0159, "step": 129210 }, { "epoch": 0.65, "learning_rate": 0.0002022102708729586, "loss": 0.0148, "step": 129220 }, { "epoch": 0.65, "learning_rate": 0.00020220270317994457, "loss": 0.0113, "step": 129230 }, { "epoch": 0.65, "learning_rate": 0.00020219513548693058, "loss": 0.0144, "step": 129240 }, { "epoch": 0.65, "learning_rate": 0.00020218756779391656, "loss": 0.015, "step": 129250 }, { "epoch": 0.65, "learning_rate": 0.00020218000010090254, "loss": 0.014, "step": 129260 }, { "epoch": 0.65, "learning_rate": 0.00020217243240788855, "loss": 0.0117, "step": 129270 }, { "epoch": 0.65, "learning_rate": 0.00020216486471487453, "loss": 0.0101, "step": 129280 }, { "epoch": 0.65, "learning_rate": 0.0002021572970218605, "loss": 0.0203, "step": 129290 }, { "epoch": 0.65, "learning_rate": 0.00020214972932884652, "loss": 0.0156, "step": 129300 }, { "epoch": 0.65, "learning_rate": 0.0002021421616358325, "loss": 0.0155, "step": 129310 }, { "epoch": 0.65, "learning_rate": 0.00020213459394281848, "loss": 0.0165, "step": 129320 }, { "epoch": 0.65, "learning_rate": 0.0002021270262498045, "loss": 0.0142, "step": 129330 }, { "epoch": 0.65, "learning_rate": 0.00020211945855679047, "loss": 0.0157, "step": 129340 }, { "epoch": 0.65, "learning_rate": 0.00020211189086377646, "loss": 0.0149, "step": 129350 }, { "epoch": 0.65, "learning_rate": 0.00020210432317076244, "loss": 0.0159, "step": 129360 }, { "epoch": 0.65, "learning_rate": 0.00020209675547774845, "loss": 0.013, "step": 129370 }, { "epoch": 0.65, "learning_rate": 0.00020208918778473443, "loss": 0.0159, "step": 129380 }, { "epoch": 0.65, "learning_rate": 0.0002020816200917204, "loss": 0.0134, "step": 129390 }, { "epoch": 0.65, "learning_rate": 0.00020207405239870642, "loss": 0.0152, "step": 129400 }, { "epoch": 0.65, "learning_rate": 0.0002020664847056924, "loss": 0.0137, "step": 129410 }, { "epoch": 0.65, "learning_rate": 0.00020205891701267838, "loss": 0.0123, "step": 129420 }, { "epoch": 0.65, "learning_rate": 0.0002020513493196644, "loss": 0.0144, "step": 129430 }, { "epoch": 0.65, "learning_rate": 0.00020204378162665037, "loss": 0.0143, "step": 129440 }, { "epoch": 0.65, "learning_rate": 0.00020203621393363635, "loss": 0.0182, "step": 129450 }, { "epoch": 0.65, "learning_rate": 0.00020202864624062236, "loss": 0.0125, "step": 129460 }, { "epoch": 0.65, "learning_rate": 0.00020202107854760834, "loss": 0.0149, "step": 129470 }, { "epoch": 0.65, "learning_rate": 0.00020201351085459432, "loss": 0.014, "step": 129480 }, { "epoch": 0.65, "learning_rate": 0.00020200594316158033, "loss": 0.0154, "step": 129490 }, { "epoch": 0.65, "learning_rate": 0.0002019983754685663, "loss": 0.0112, "step": 129500 }, { "epoch": 0.65, "learning_rate": 0.0002019908077755523, "loss": 0.0152, "step": 129510 }, { "epoch": 0.65, "learning_rate": 0.00020198324008253828, "loss": 0.0138, "step": 129520 }, { "epoch": 0.65, "learning_rate": 0.00020197567238952428, "loss": 0.0143, "step": 129530 }, { "epoch": 0.65, "learning_rate": 0.00020196810469651027, "loss": 0.0149, "step": 129540 }, { "epoch": 0.65, "learning_rate": 0.00020196053700349625, "loss": 0.0143, "step": 129550 }, { "epoch": 0.65, "learning_rate": 0.00020195296931048226, "loss": 0.0143, "step": 129560 }, { "epoch": 0.65, "learning_rate": 0.00020194540161746824, "loss": 0.0117, "step": 129570 }, { "epoch": 0.65, "learning_rate": 0.00020193783392445422, "loss": 0.0162, "step": 129580 }, { "epoch": 0.65, "learning_rate": 0.00020193026623144023, "loss": 0.0157, "step": 129590 }, { "epoch": 0.65, "learning_rate": 0.0002019226985384262, "loss": 0.0126, "step": 129600 }, { "epoch": 0.65, "learning_rate": 0.0002019151308454122, "loss": 0.0129, "step": 129610 }, { "epoch": 0.65, "learning_rate": 0.0002019075631523982, "loss": 0.0119, "step": 129620 }, { "epoch": 0.65, "learning_rate": 0.00020189999545938418, "loss": 0.0114, "step": 129630 }, { "epoch": 0.65, "learning_rate": 0.00020189242776637016, "loss": 0.013, "step": 129640 }, { "epoch": 0.65, "learning_rate": 0.00020188486007335617, "loss": 0.013, "step": 129650 }, { "epoch": 0.65, "learning_rate": 0.00020187729238034215, "loss": 0.0171, "step": 129660 }, { "epoch": 0.65, "learning_rate": 0.00020186972468732813, "loss": 0.0131, "step": 129670 }, { "epoch": 0.65, "learning_rate": 0.00020186215699431414, "loss": 0.0148, "step": 129680 }, { "epoch": 0.65, "learning_rate": 0.00020185458930130012, "loss": 0.0105, "step": 129690 }, { "epoch": 0.65, "learning_rate": 0.0002018470216082861, "loss": 0.0118, "step": 129700 }, { "epoch": 0.65, "learning_rate": 0.00020183945391527209, "loss": 0.0148, "step": 129710 }, { "epoch": 0.65, "learning_rate": 0.0002018318862222581, "loss": 0.0144, "step": 129720 }, { "epoch": 0.65, "learning_rate": 0.00020182431852924408, "loss": 0.0129, "step": 129730 }, { "epoch": 0.65, "learning_rate": 0.00020181675083623006, "loss": 0.0102, "step": 129740 }, { "epoch": 0.65, "learning_rate": 0.00020180918314321607, "loss": 0.0126, "step": 129750 }, { "epoch": 0.65, "learning_rate": 0.00020180161545020205, "loss": 0.0114, "step": 129760 }, { "epoch": 0.65, "learning_rate": 0.00020179404775718803, "loss": 0.0135, "step": 129770 }, { "epoch": 0.65, "learning_rate": 0.00020178648006417404, "loss": 0.0139, "step": 129780 }, { "epoch": 0.65, "learning_rate": 0.00020177891237116002, "loss": 0.0132, "step": 129790 }, { "epoch": 0.65, "learning_rate": 0.000201771344678146, "loss": 0.0142, "step": 129800 }, { "epoch": 0.65, "learning_rate": 0.000201763776985132, "loss": 0.0156, "step": 129810 }, { "epoch": 0.65, "learning_rate": 0.000201756209292118, "loss": 0.0145, "step": 129820 }, { "epoch": 0.66, "learning_rate": 0.00020174864159910397, "loss": 0.0146, "step": 129830 }, { "epoch": 0.66, "learning_rate": 0.00020174107390608998, "loss": 0.0128, "step": 129840 }, { "epoch": 0.66, "learning_rate": 0.00020173350621307596, "loss": 0.0139, "step": 129850 }, { "epoch": 0.66, "learning_rate": 0.00020172593852006194, "loss": 0.0145, "step": 129860 }, { "epoch": 0.66, "learning_rate": 0.00020171837082704792, "loss": 0.0142, "step": 129870 }, { "epoch": 0.66, "learning_rate": 0.00020171080313403393, "loss": 0.0132, "step": 129880 }, { "epoch": 0.66, "learning_rate": 0.00020170323544101991, "loss": 0.0127, "step": 129890 }, { "epoch": 0.66, "learning_rate": 0.0002016956677480059, "loss": 0.0136, "step": 129900 }, { "epoch": 0.66, "learning_rate": 0.0002016881000549919, "loss": 0.0135, "step": 129910 }, { "epoch": 0.66, "learning_rate": 0.00020168053236197789, "loss": 0.0127, "step": 129920 }, { "epoch": 0.66, "learning_rate": 0.00020167296466896387, "loss": 0.0122, "step": 129930 }, { "epoch": 0.66, "learning_rate": 0.00020166539697594988, "loss": 0.0163, "step": 129940 }, { "epoch": 0.66, "learning_rate": 0.00020165782928293586, "loss": 0.0134, "step": 129950 }, { "epoch": 0.66, "learning_rate": 0.00020165026158992184, "loss": 0.0132, "step": 129960 }, { "epoch": 0.66, "learning_rate": 0.00020164269389690785, "loss": 0.0164, "step": 129970 }, { "epoch": 0.66, "learning_rate": 0.00020163512620389383, "loss": 0.0125, "step": 129980 }, { "epoch": 0.66, "learning_rate": 0.0002016275585108798, "loss": 0.0152, "step": 129990 }, { "epoch": 0.66, "learning_rate": 0.00020161999081786582, "loss": 0.0161, "step": 130000 }, { "epoch": 0.66, "eval_cer": 0.9144828710527925, "eval_loss": 0.009702015668153763, "eval_runtime": 116.6027, "eval_samples_per_second": 17.152, "eval_steps_per_second": 4.288, "step": 130000 }, { "epoch": 0.66, "learning_rate": 0.0002016124231248518, "loss": 0.0188, "step": 130010 }, { "epoch": 0.66, "learning_rate": 0.00020160485543183778, "loss": 0.0146, "step": 130020 }, { "epoch": 0.66, "learning_rate": 0.00020159728773882376, "loss": 0.0123, "step": 130030 }, { "epoch": 0.66, "learning_rate": 0.00020158972004580977, "loss": 0.013, "step": 130040 }, { "epoch": 0.66, "learning_rate": 0.00020158215235279575, "loss": 0.0145, "step": 130050 }, { "epoch": 0.66, "learning_rate": 0.00020157458465978173, "loss": 0.0136, "step": 130060 }, { "epoch": 0.66, "learning_rate": 0.00020156701696676774, "loss": 0.0117, "step": 130070 }, { "epoch": 0.66, "learning_rate": 0.00020155944927375372, "loss": 0.0131, "step": 130080 }, { "epoch": 0.66, "learning_rate": 0.00020155188158073968, "loss": 0.0142, "step": 130090 }, { "epoch": 0.66, "learning_rate": 0.00020154431388772566, "loss": 0.0159, "step": 130100 }, { "epoch": 0.66, "learning_rate": 0.00020153674619471167, "loss": 0.0168, "step": 130110 }, { "epoch": 0.66, "learning_rate": 0.00020152917850169765, "loss": 0.0158, "step": 130120 }, { "epoch": 0.66, "learning_rate": 0.00020152161080868363, "loss": 0.0163, "step": 130130 }, { "epoch": 0.66, "learning_rate": 0.00020151404311566964, "loss": 0.0116, "step": 130140 }, { "epoch": 0.66, "learning_rate": 0.00020150647542265562, "loss": 0.0121, "step": 130150 }, { "epoch": 0.66, "learning_rate": 0.0002014989077296416, "loss": 0.012, "step": 130160 }, { "epoch": 0.66, "learning_rate": 0.0002014913400366276, "loss": 0.0146, "step": 130170 }, { "epoch": 0.66, "learning_rate": 0.0002014837723436136, "loss": 0.012, "step": 130180 }, { "epoch": 0.66, "learning_rate": 0.00020147620465059957, "loss": 0.0134, "step": 130190 }, { "epoch": 0.66, "learning_rate": 0.00020146863695758558, "loss": 0.0143, "step": 130200 }, { "epoch": 0.66, "learning_rate": 0.00020146106926457156, "loss": 0.0201, "step": 130210 }, { "epoch": 0.66, "learning_rate": 0.00020145350157155755, "loss": 0.0137, "step": 130220 }, { "epoch": 0.66, "learning_rate": 0.00020144593387854355, "loss": 0.0121, "step": 130230 }, { "epoch": 0.66, "learning_rate": 0.00020143836618552954, "loss": 0.0109, "step": 130240 }, { "epoch": 0.66, "learning_rate": 0.00020143079849251552, "loss": 0.0135, "step": 130250 }, { "epoch": 0.66, "learning_rate": 0.0002014232307995015, "loss": 0.0118, "step": 130260 }, { "epoch": 0.66, "learning_rate": 0.0002014156631064875, "loss": 0.0164, "step": 130270 }, { "epoch": 0.66, "learning_rate": 0.0002014080954134735, "loss": 0.0132, "step": 130280 }, { "epoch": 0.66, "learning_rate": 0.00020140052772045947, "loss": 0.014, "step": 130290 }, { "epoch": 0.66, "learning_rate": 0.00020139296002744548, "loss": 0.0133, "step": 130300 }, { "epoch": 0.66, "learning_rate": 0.00020138539233443146, "loss": 0.0155, "step": 130310 }, { "epoch": 0.66, "learning_rate": 0.00020137782464141744, "loss": 0.017, "step": 130320 }, { "epoch": 0.66, "learning_rate": 0.00020137025694840345, "loss": 0.0145, "step": 130330 }, { "epoch": 0.66, "learning_rate": 0.00020136268925538943, "loss": 0.0138, "step": 130340 }, { "epoch": 0.66, "learning_rate": 0.0002013551215623754, "loss": 0.0117, "step": 130350 }, { "epoch": 0.66, "learning_rate": 0.00020134755386936142, "loss": 0.0131, "step": 130360 }, { "epoch": 0.66, "learning_rate": 0.0002013399861763474, "loss": 0.0135, "step": 130370 }, { "epoch": 0.66, "learning_rate": 0.00020133241848333338, "loss": 0.0123, "step": 130380 }, { "epoch": 0.66, "learning_rate": 0.0002013248507903194, "loss": 0.0159, "step": 130390 }, { "epoch": 0.66, "learning_rate": 0.00020131728309730537, "loss": 0.018, "step": 130400 }, { "epoch": 0.66, "learning_rate": 0.00020130971540429136, "loss": 0.0128, "step": 130410 }, { "epoch": 0.66, "learning_rate": 0.00020130214771127734, "loss": 0.0131, "step": 130420 }, { "epoch": 0.66, "learning_rate": 0.00020129458001826335, "loss": 0.0135, "step": 130430 }, { "epoch": 0.66, "learning_rate": 0.00020128701232524933, "loss": 0.0147, "step": 130440 }, { "epoch": 0.66, "learning_rate": 0.0002012794446322353, "loss": 0.0171, "step": 130450 }, { "epoch": 0.66, "learning_rate": 0.00020127187693922132, "loss": 0.0132, "step": 130460 }, { "epoch": 0.66, "learning_rate": 0.0002012643092462073, "loss": 0.0136, "step": 130470 }, { "epoch": 0.66, "learning_rate": 0.00020125674155319328, "loss": 0.0139, "step": 130480 }, { "epoch": 0.66, "learning_rate": 0.0002012491738601793, "loss": 0.0135, "step": 130490 }, { "epoch": 0.66, "learning_rate": 0.00020124160616716527, "loss": 0.0121, "step": 130500 }, { "epoch": 0.66, "learning_rate": 0.00020123403847415125, "loss": 0.0146, "step": 130510 }, { "epoch": 0.66, "learning_rate": 0.00020122647078113726, "loss": 0.0149, "step": 130520 }, { "epoch": 0.66, "learning_rate": 0.00020121890308812324, "loss": 0.0157, "step": 130530 }, { "epoch": 0.66, "learning_rate": 0.00020121133539510922, "loss": 0.0126, "step": 130540 }, { "epoch": 0.66, "learning_rate": 0.00020120376770209523, "loss": 0.0113, "step": 130550 }, { "epoch": 0.66, "learning_rate": 0.0002011962000090812, "loss": 0.0197, "step": 130560 }, { "epoch": 0.66, "learning_rate": 0.0002011886323160672, "loss": 0.0133, "step": 130570 }, { "epoch": 0.66, "learning_rate": 0.0002011810646230532, "loss": 0.0151, "step": 130580 }, { "epoch": 0.66, "learning_rate": 0.00020117349693003918, "loss": 0.0155, "step": 130590 }, { "epoch": 0.66, "learning_rate": 0.00020116592923702517, "loss": 0.0148, "step": 130600 }, { "epoch": 0.66, "learning_rate": 0.00020115836154401115, "loss": 0.0139, "step": 130610 }, { "epoch": 0.66, "learning_rate": 0.00020115079385099716, "loss": 0.0117, "step": 130620 }, { "epoch": 0.66, "learning_rate": 0.00020114322615798314, "loss": 0.0157, "step": 130630 }, { "epoch": 0.66, "learning_rate": 0.00020113565846496912, "loss": 0.0122, "step": 130640 }, { "epoch": 0.66, "learning_rate": 0.00020112809077195513, "loss": 0.0144, "step": 130650 }, { "epoch": 0.66, "learning_rate": 0.0002011205230789411, "loss": 0.0109, "step": 130660 }, { "epoch": 0.66, "learning_rate": 0.0002011129553859271, "loss": 0.016, "step": 130670 }, { "epoch": 0.66, "learning_rate": 0.0002011053876929131, "loss": 0.0129, "step": 130680 }, { "epoch": 0.66, "learning_rate": 0.00020109781999989908, "loss": 0.0159, "step": 130690 }, { "epoch": 0.66, "learning_rate": 0.00020109025230688506, "loss": 0.0155, "step": 130700 }, { "epoch": 0.66, "learning_rate": 0.00020108268461387107, "loss": 0.0149, "step": 130710 }, { "epoch": 0.66, "learning_rate": 0.00020107511692085705, "loss": 0.0126, "step": 130720 }, { "epoch": 0.66, "learning_rate": 0.00020106754922784303, "loss": 0.012, "step": 130730 }, { "epoch": 0.66, "learning_rate": 0.00020105998153482904, "loss": 0.0123, "step": 130740 }, { "epoch": 0.66, "learning_rate": 0.00020105241384181502, "loss": 0.0133, "step": 130750 }, { "epoch": 0.66, "learning_rate": 0.000201044846148801, "loss": 0.0175, "step": 130760 }, { "epoch": 0.66, "learning_rate": 0.00020103727845578699, "loss": 0.0149, "step": 130770 }, { "epoch": 0.66, "learning_rate": 0.000201029710762773, "loss": 0.015, "step": 130780 }, { "epoch": 0.66, "learning_rate": 0.00020102214306975898, "loss": 0.0116, "step": 130790 }, { "epoch": 0.66, "learning_rate": 0.00020101457537674496, "loss": 0.0112, "step": 130800 }, { "epoch": 0.66, "learning_rate": 0.00020100700768373097, "loss": 0.0121, "step": 130810 }, { "epoch": 0.66, "learning_rate": 0.00020099943999071695, "loss": 0.0189, "step": 130820 }, { "epoch": 0.66, "learning_rate": 0.00020099187229770293, "loss": 0.0152, "step": 130830 }, { "epoch": 0.66, "learning_rate": 0.00020098430460468894, "loss": 0.0132, "step": 130840 }, { "epoch": 0.66, "learning_rate": 0.00020097673691167492, "loss": 0.0127, "step": 130850 }, { "epoch": 0.66, "learning_rate": 0.0002009691692186609, "loss": 0.0109, "step": 130860 }, { "epoch": 0.66, "learning_rate": 0.0002009616015256469, "loss": 0.0161, "step": 130870 }, { "epoch": 0.66, "learning_rate": 0.0002009540338326329, "loss": 0.015, "step": 130880 }, { "epoch": 0.66, "learning_rate": 0.00020094646613961887, "loss": 0.0112, "step": 130890 }, { "epoch": 0.66, "learning_rate": 0.00020093889844660488, "loss": 0.0136, "step": 130900 }, { "epoch": 0.66, "learning_rate": 0.00020093133075359086, "loss": 0.0122, "step": 130910 }, { "epoch": 0.66, "learning_rate": 0.00020092376306057684, "loss": 0.0134, "step": 130920 }, { "epoch": 0.66, "learning_rate": 0.00020091619536756282, "loss": 0.0165, "step": 130930 }, { "epoch": 0.66, "learning_rate": 0.00020090862767454883, "loss": 0.0144, "step": 130940 }, { "epoch": 0.66, "learning_rate": 0.00020090105998153481, "loss": 0.0148, "step": 130950 }, { "epoch": 0.66, "learning_rate": 0.0002008934922885208, "loss": 0.0157, "step": 130960 }, { "epoch": 0.66, "learning_rate": 0.0002008859245955068, "loss": 0.0184, "step": 130970 }, { "epoch": 0.66, "learning_rate": 0.00020087835690249279, "loss": 0.0131, "step": 130980 }, { "epoch": 0.66, "learning_rate": 0.00020087078920947877, "loss": 0.0125, "step": 130990 }, { "epoch": 0.66, "learning_rate": 0.00020086322151646478, "loss": 0.0129, "step": 131000 }, { "epoch": 0.66, "eval_cer": 0.9145090717481783, "eval_loss": 0.009523593820631504, "eval_runtime": 116.9784, "eval_samples_per_second": 17.097, "eval_steps_per_second": 4.274, "step": 131000 }, { "epoch": 0.66, "learning_rate": 0.00020085565382345076, "loss": 0.0139, "step": 131010 }, { "epoch": 0.66, "learning_rate": 0.00020084808613043674, "loss": 0.0161, "step": 131020 }, { "epoch": 0.66, "learning_rate": 0.00020084051843742275, "loss": 0.0112, "step": 131030 }, { "epoch": 0.66, "learning_rate": 0.00020083295074440873, "loss": 0.0114, "step": 131040 }, { "epoch": 0.66, "learning_rate": 0.0002008253830513947, "loss": 0.0119, "step": 131050 }, { "epoch": 0.66, "learning_rate": 0.00020081781535838072, "loss": 0.0165, "step": 131060 }, { "epoch": 0.66, "learning_rate": 0.0002008102476653667, "loss": 0.0111, "step": 131070 }, { "epoch": 0.66, "learning_rate": 0.00020080267997235268, "loss": 0.0125, "step": 131080 }, { "epoch": 0.66, "learning_rate": 0.0002007951122793387, "loss": 0.0126, "step": 131090 }, { "epoch": 0.66, "learning_rate": 0.00020078754458632467, "loss": 0.0132, "step": 131100 }, { "epoch": 0.66, "learning_rate": 0.00020077997689331065, "loss": 0.0137, "step": 131110 }, { "epoch": 0.66, "learning_rate": 0.00020077240920029663, "loss": 0.0126, "step": 131120 }, { "epoch": 0.66, "learning_rate": 0.00020076484150728264, "loss": 0.0139, "step": 131130 }, { "epoch": 0.66, "learning_rate": 0.00020075727381426862, "loss": 0.0147, "step": 131140 }, { "epoch": 0.66, "learning_rate": 0.0002007497061212546, "loss": 0.0149, "step": 131150 }, { "epoch": 0.66, "learning_rate": 0.00020074213842824061, "loss": 0.0187, "step": 131160 }, { "epoch": 0.66, "learning_rate": 0.0002007345707352266, "loss": 0.0143, "step": 131170 }, { "epoch": 0.66, "learning_rate": 0.00020072700304221258, "loss": 0.0157, "step": 131180 }, { "epoch": 0.66, "learning_rate": 0.00020071943534919859, "loss": 0.0176, "step": 131190 }, { "epoch": 0.66, "learning_rate": 0.00020071186765618457, "loss": 0.0137, "step": 131200 }, { "epoch": 0.66, "learning_rate": 0.00020070429996317055, "loss": 0.0128, "step": 131210 }, { "epoch": 0.66, "learning_rate": 0.00020069673227015656, "loss": 0.0139, "step": 131220 }, { "epoch": 0.66, "learning_rate": 0.00020068916457714254, "loss": 0.014, "step": 131230 }, { "epoch": 0.66, "learning_rate": 0.00020068159688412852, "loss": 0.0117, "step": 131240 }, { "epoch": 0.66, "learning_rate": 0.00020067402919111453, "loss": 0.0152, "step": 131250 }, { "epoch": 0.66, "learning_rate": 0.0002006664614981005, "loss": 0.0124, "step": 131260 }, { "epoch": 0.66, "learning_rate": 0.0002006588938050865, "loss": 0.0135, "step": 131270 }, { "epoch": 0.66, "learning_rate": 0.00020065132611207247, "loss": 0.0143, "step": 131280 }, { "epoch": 0.66, "learning_rate": 0.00020064375841905848, "loss": 0.0141, "step": 131290 }, { "epoch": 0.66, "learning_rate": 0.00020063619072604446, "loss": 0.0137, "step": 131300 }, { "epoch": 0.66, "learning_rate": 0.00020062862303303044, "loss": 0.0125, "step": 131310 }, { "epoch": 0.66, "learning_rate": 0.00020062105534001645, "loss": 0.0113, "step": 131320 }, { "epoch": 0.66, "learning_rate": 0.00020061348764700243, "loss": 0.0145, "step": 131330 }, { "epoch": 0.66, "learning_rate": 0.00020060591995398842, "loss": 0.0164, "step": 131340 }, { "epoch": 0.66, "learning_rate": 0.00020059835226097437, "loss": 0.015, "step": 131350 }, { "epoch": 0.66, "learning_rate": 0.00020059078456796038, "loss": 0.014, "step": 131360 }, { "epoch": 0.66, "learning_rate": 0.00020058321687494636, "loss": 0.0136, "step": 131370 }, { "epoch": 0.66, "learning_rate": 0.00020057564918193234, "loss": 0.0184, "step": 131380 }, { "epoch": 0.66, "learning_rate": 0.00020056808148891835, "loss": 0.0122, "step": 131390 }, { "epoch": 0.66, "learning_rate": 0.00020056051379590433, "loss": 0.0152, "step": 131400 }, { "epoch": 0.66, "learning_rate": 0.0002005529461028903, "loss": 0.0142, "step": 131410 }, { "epoch": 0.66, "learning_rate": 0.00020054537840987632, "loss": 0.0145, "step": 131420 }, { "epoch": 0.66, "learning_rate": 0.0002005378107168623, "loss": 0.0137, "step": 131430 }, { "epoch": 0.66, "learning_rate": 0.00020053024302384828, "loss": 0.0124, "step": 131440 }, { "epoch": 0.66, "learning_rate": 0.0002005226753308343, "loss": 0.0152, "step": 131450 }, { "epoch": 0.66, "learning_rate": 0.00020051510763782027, "loss": 0.0126, "step": 131460 }, { "epoch": 0.66, "learning_rate": 0.00020050753994480626, "loss": 0.0145, "step": 131470 }, { "epoch": 0.66, "learning_rate": 0.00020049997225179226, "loss": 0.0155, "step": 131480 }, { "epoch": 0.66, "learning_rate": 0.00020049240455877825, "loss": 0.0133, "step": 131490 }, { "epoch": 0.66, "learning_rate": 0.00020048483686576423, "loss": 0.0112, "step": 131500 }, { "epoch": 0.66, "learning_rate": 0.0002004772691727502, "loss": 0.0174, "step": 131510 }, { "epoch": 0.66, "learning_rate": 0.00020046970147973622, "loss": 0.0156, "step": 131520 }, { "epoch": 0.66, "learning_rate": 0.0002004621337867222, "loss": 0.0137, "step": 131530 }, { "epoch": 0.66, "learning_rate": 0.00020045456609370818, "loss": 0.0124, "step": 131540 }, { "epoch": 0.66, "learning_rate": 0.0002004469984006942, "loss": 0.0122, "step": 131550 }, { "epoch": 0.66, "learning_rate": 0.00020043943070768017, "loss": 0.0114, "step": 131560 }, { "epoch": 0.66, "learning_rate": 0.00020043186301466615, "loss": 0.01, "step": 131570 }, { "epoch": 0.66, "learning_rate": 0.00020042429532165216, "loss": 0.0125, "step": 131580 }, { "epoch": 0.66, "learning_rate": 0.00020041672762863814, "loss": 0.0138, "step": 131590 }, { "epoch": 0.66, "learning_rate": 0.00020040915993562412, "loss": 0.0148, "step": 131600 }, { "epoch": 0.66, "learning_rate": 0.00020040159224261013, "loss": 0.0111, "step": 131610 }, { "epoch": 0.66, "learning_rate": 0.0002003940245495961, "loss": 0.0117, "step": 131620 }, { "epoch": 0.66, "learning_rate": 0.0002003864568565821, "loss": 0.0124, "step": 131630 }, { "epoch": 0.66, "learning_rate": 0.0002003788891635681, "loss": 0.0105, "step": 131640 }, { "epoch": 0.66, "learning_rate": 0.00020037132147055408, "loss": 0.0123, "step": 131650 }, { "epoch": 0.66, "learning_rate": 0.00020036375377754007, "loss": 0.0117, "step": 131660 }, { "epoch": 0.66, "learning_rate": 0.00020035618608452605, "loss": 0.0142, "step": 131670 }, { "epoch": 0.66, "learning_rate": 0.00020034861839151206, "loss": 0.0134, "step": 131680 }, { "epoch": 0.66, "learning_rate": 0.00020034105069849804, "loss": 0.0137, "step": 131690 }, { "epoch": 0.66, "learning_rate": 0.00020033348300548402, "loss": 0.0121, "step": 131700 }, { "epoch": 0.66, "learning_rate": 0.00020032591531247003, "loss": 0.0112, "step": 131710 }, { "epoch": 0.66, "learning_rate": 0.000200318347619456, "loss": 0.0125, "step": 131720 }, { "epoch": 0.66, "learning_rate": 0.000200310779926442, "loss": 0.0124, "step": 131730 }, { "epoch": 0.66, "learning_rate": 0.000200303212233428, "loss": 0.0193, "step": 131740 }, { "epoch": 0.66, "learning_rate": 0.00020029564454041398, "loss": 0.0135, "step": 131750 }, { "epoch": 0.66, "learning_rate": 0.00020028807684739996, "loss": 0.0144, "step": 131760 }, { "epoch": 0.66, "learning_rate": 0.00020028050915438597, "loss": 0.014, "step": 131770 }, { "epoch": 0.66, "learning_rate": 0.00020027294146137195, "loss": 0.0099, "step": 131780 }, { "epoch": 0.66, "learning_rate": 0.00020026537376835793, "loss": 0.0153, "step": 131790 }, { "epoch": 0.66, "learning_rate": 0.00020025780607534394, "loss": 0.0137, "step": 131800 }, { "epoch": 0.66, "learning_rate": 0.00020025023838232992, "loss": 0.0179, "step": 131810 }, { "epoch": 0.67, "learning_rate": 0.0002002426706893159, "loss": 0.0137, "step": 131820 }, { "epoch": 0.67, "learning_rate": 0.00020023510299630189, "loss": 0.0191, "step": 131830 }, { "epoch": 0.67, "learning_rate": 0.0002002275353032879, "loss": 0.0138, "step": 131840 }, { "epoch": 0.67, "learning_rate": 0.00020021996761027388, "loss": 0.0135, "step": 131850 }, { "epoch": 0.67, "learning_rate": 0.00020021239991725986, "loss": 0.0122, "step": 131860 }, { "epoch": 0.67, "learning_rate": 0.00020020483222424587, "loss": 0.0146, "step": 131870 }, { "epoch": 0.67, "learning_rate": 0.00020019726453123185, "loss": 0.0136, "step": 131880 }, { "epoch": 0.67, "learning_rate": 0.00020018969683821783, "loss": 0.013, "step": 131890 }, { "epoch": 0.67, "learning_rate": 0.00020018212914520384, "loss": 0.0137, "step": 131900 }, { "epoch": 0.67, "learning_rate": 0.00020017456145218982, "loss": 0.0128, "step": 131910 }, { "epoch": 0.67, "learning_rate": 0.0002001669937591758, "loss": 0.013, "step": 131920 }, { "epoch": 0.67, "learning_rate": 0.0002001594260661618, "loss": 0.0138, "step": 131930 }, { "epoch": 0.67, "learning_rate": 0.0002001518583731478, "loss": 0.0117, "step": 131940 }, { "epoch": 0.67, "learning_rate": 0.00020014429068013377, "loss": 0.015, "step": 131950 }, { "epoch": 0.67, "learning_rate": 0.00020013672298711978, "loss": 0.0124, "step": 131960 }, { "epoch": 0.67, "learning_rate": 0.00020012915529410576, "loss": 0.0153, "step": 131970 }, { "epoch": 0.67, "learning_rate": 0.00020012158760109174, "loss": 0.0134, "step": 131980 }, { "epoch": 0.67, "learning_rate": 0.00020011401990807775, "loss": 0.0133, "step": 131990 }, { "epoch": 0.67, "learning_rate": 0.00020010645221506373, "loss": 0.0141, "step": 132000 }, { "epoch": 0.67, "eval_cer": 0.9144430848116509, "eval_loss": 0.009661003015935421, "eval_runtime": 116.7282, "eval_samples_per_second": 17.134, "eval_steps_per_second": 4.283, "step": 132000 }, { "epoch": 0.67, "learning_rate": 0.00020009888452204971, "loss": 0.0143, "step": 132010 }, { "epoch": 0.67, "learning_rate": 0.0002000913168290357, "loss": 0.0144, "step": 132020 }, { "epoch": 0.67, "learning_rate": 0.0002000837491360217, "loss": 0.0149, "step": 132030 }, { "epoch": 0.67, "learning_rate": 0.00020007618144300769, "loss": 0.0115, "step": 132040 }, { "epoch": 0.67, "learning_rate": 0.00020006861374999367, "loss": 0.0116, "step": 132050 }, { "epoch": 0.67, "learning_rate": 0.00020006104605697968, "loss": 0.0161, "step": 132060 }, { "epoch": 0.67, "learning_rate": 0.00020005347836396566, "loss": 0.0162, "step": 132070 }, { "epoch": 0.67, "learning_rate": 0.00020004591067095164, "loss": 0.0132, "step": 132080 }, { "epoch": 0.67, "learning_rate": 0.00020003834297793765, "loss": 0.0195, "step": 132090 }, { "epoch": 0.67, "learning_rate": 0.00020003077528492363, "loss": 0.0137, "step": 132100 }, { "epoch": 0.67, "learning_rate": 0.0002000232075919096, "loss": 0.0134, "step": 132110 }, { "epoch": 0.67, "learning_rate": 0.00020001563989889562, "loss": 0.0159, "step": 132120 }, { "epoch": 0.67, "learning_rate": 0.0002000080722058816, "loss": 0.0092, "step": 132130 }, { "epoch": 0.67, "learning_rate": 0.00020000050451286758, "loss": 0.0113, "step": 132140 }, { "epoch": 0.67, "learning_rate": 0.0001999929368198536, "loss": 0.0126, "step": 132150 }, { "epoch": 0.67, "learning_rate": 0.00019998536912683957, "loss": 0.014, "step": 132160 }, { "epoch": 0.67, "learning_rate": 0.00019997780143382555, "loss": 0.0112, "step": 132170 }, { "epoch": 0.67, "learning_rate": 0.00019997023374081153, "loss": 0.0116, "step": 132180 }, { "epoch": 0.67, "learning_rate": 0.00019996266604779754, "loss": 0.0139, "step": 132190 }, { "epoch": 0.67, "learning_rate": 0.00019995509835478352, "loss": 0.0143, "step": 132200 }, { "epoch": 0.67, "learning_rate": 0.0001999475306617695, "loss": 0.0152, "step": 132210 }, { "epoch": 0.67, "learning_rate": 0.00019993996296875551, "loss": 0.0129, "step": 132220 }, { "epoch": 0.67, "learning_rate": 0.0001999323952757415, "loss": 0.0126, "step": 132230 }, { "epoch": 0.67, "learning_rate": 0.00019992482758272748, "loss": 0.0154, "step": 132240 }, { "epoch": 0.67, "learning_rate": 0.00019991725988971349, "loss": 0.0118, "step": 132250 }, { "epoch": 0.67, "learning_rate": 0.00019990969219669947, "loss": 0.0154, "step": 132260 }, { "epoch": 0.67, "learning_rate": 0.00019990212450368545, "loss": 0.0166, "step": 132270 }, { "epoch": 0.67, "learning_rate": 0.00019989455681067146, "loss": 0.0145, "step": 132280 }, { "epoch": 0.67, "learning_rate": 0.00019988698911765744, "loss": 0.011, "step": 132290 }, { "epoch": 0.67, "learning_rate": 0.00019987942142464342, "loss": 0.0157, "step": 132300 }, { "epoch": 0.67, "learning_rate": 0.00019987185373162943, "loss": 0.015, "step": 132310 }, { "epoch": 0.67, "learning_rate": 0.0001998642860386154, "loss": 0.0122, "step": 132320 }, { "epoch": 0.67, "learning_rate": 0.0001998567183456014, "loss": 0.0153, "step": 132330 }, { "epoch": 0.67, "learning_rate": 0.00019984915065258737, "loss": 0.0142, "step": 132340 }, { "epoch": 0.67, "learning_rate": 0.00019984158295957338, "loss": 0.0143, "step": 132350 }, { "epoch": 0.67, "learning_rate": 0.00019983401526655936, "loss": 0.0134, "step": 132360 }, { "epoch": 0.67, "learning_rate": 0.00019982644757354534, "loss": 0.0192, "step": 132370 }, { "epoch": 0.67, "learning_rate": 0.00019981887988053135, "loss": 0.0155, "step": 132380 }, { "epoch": 0.67, "learning_rate": 0.00019981131218751733, "loss": 0.0139, "step": 132390 }, { "epoch": 0.67, "learning_rate": 0.00019980374449450332, "loss": 0.0122, "step": 132400 }, { "epoch": 0.67, "learning_rate": 0.00019979617680148932, "loss": 0.0141, "step": 132410 }, { "epoch": 0.67, "learning_rate": 0.0001997886091084753, "loss": 0.0137, "step": 132420 }, { "epoch": 0.67, "learning_rate": 0.0001997810414154613, "loss": 0.0144, "step": 132430 }, { "epoch": 0.67, "learning_rate": 0.0001997734737224473, "loss": 0.0115, "step": 132440 }, { "epoch": 0.67, "learning_rate": 0.00019976590602943328, "loss": 0.0166, "step": 132450 }, { "epoch": 0.67, "learning_rate": 0.00019975833833641926, "loss": 0.0139, "step": 132460 }, { "epoch": 0.67, "learning_rate": 0.00019975077064340527, "loss": 0.0301, "step": 132470 }, { "epoch": 0.67, "learning_rate": 0.00019974320295039125, "loss": 0.0163, "step": 132480 }, { "epoch": 0.67, "learning_rate": 0.00019973563525737723, "loss": 0.0141, "step": 132490 }, { "epoch": 0.67, "learning_rate": 0.00019972806756436324, "loss": 0.0141, "step": 132500 }, { "epoch": 0.67, "learning_rate": 0.00019972049987134922, "loss": 0.0141, "step": 132510 }, { "epoch": 0.67, "learning_rate": 0.0001997129321783352, "loss": 0.0153, "step": 132520 }, { "epoch": 0.67, "learning_rate": 0.00019970536448532118, "loss": 0.012, "step": 132530 }, { "epoch": 0.67, "learning_rate": 0.0001996977967923072, "loss": 0.0157, "step": 132540 }, { "epoch": 0.67, "learning_rate": 0.00019969022909929317, "loss": 0.0149, "step": 132550 }, { "epoch": 0.67, "learning_rate": 0.00019968266140627915, "loss": 0.0137, "step": 132560 }, { "epoch": 0.67, "learning_rate": 0.00019967509371326516, "loss": 0.0116, "step": 132570 }, { "epoch": 0.67, "learning_rate": 0.00019966752602025114, "loss": 0.0141, "step": 132580 }, { "epoch": 0.67, "learning_rate": 0.00019965995832723713, "loss": 0.0176, "step": 132590 }, { "epoch": 0.67, "learning_rate": 0.00019965239063422313, "loss": 0.0151, "step": 132600 }, { "epoch": 0.67, "learning_rate": 0.0001996448229412091, "loss": 0.014, "step": 132610 }, { "epoch": 0.67, "learning_rate": 0.00019963725524819507, "loss": 0.025, "step": 132620 }, { "epoch": 0.67, "learning_rate": 0.00019962968755518105, "loss": 0.0155, "step": 132630 }, { "epoch": 0.67, "learning_rate": 0.00019962211986216706, "loss": 0.0168, "step": 132640 }, { "epoch": 0.67, "learning_rate": 0.00019961455216915304, "loss": 0.0151, "step": 132650 }, { "epoch": 0.67, "learning_rate": 0.00019960698447613902, "loss": 0.0133, "step": 132660 }, { "epoch": 0.67, "learning_rate": 0.00019959941678312503, "loss": 0.0117, "step": 132670 }, { "epoch": 0.67, "learning_rate": 0.000199591849090111, "loss": 0.0165, "step": 132680 }, { "epoch": 0.67, "learning_rate": 0.000199584281397097, "loss": 0.0162, "step": 132690 }, { "epoch": 0.67, "learning_rate": 0.000199576713704083, "loss": 0.011, "step": 132700 }, { "epoch": 0.67, "learning_rate": 0.00019956914601106898, "loss": 0.0129, "step": 132710 }, { "epoch": 0.67, "learning_rate": 0.00019956157831805497, "loss": 0.0153, "step": 132720 }, { "epoch": 0.67, "learning_rate": 0.00019955401062504095, "loss": 0.0128, "step": 132730 }, { "epoch": 0.67, "learning_rate": 0.00019954644293202696, "loss": 0.012, "step": 132740 }, { "epoch": 0.67, "learning_rate": 0.00019953887523901294, "loss": 0.0143, "step": 132750 }, { "epoch": 0.67, "learning_rate": 0.00019953130754599892, "loss": 0.0132, "step": 132760 }, { "epoch": 0.67, "learning_rate": 0.00019952373985298493, "loss": 0.0135, "step": 132770 }, { "epoch": 0.67, "learning_rate": 0.0001995161721599709, "loss": 0.0138, "step": 132780 }, { "epoch": 0.67, "learning_rate": 0.0001995086044669569, "loss": 0.0139, "step": 132790 }, { "epoch": 0.67, "learning_rate": 0.0001995010367739429, "loss": 0.0161, "step": 132800 }, { "epoch": 0.67, "learning_rate": 0.00019949346908092888, "loss": 0.0145, "step": 132810 }, { "epoch": 0.67, "learning_rate": 0.00019948590138791486, "loss": 0.0119, "step": 132820 }, { "epoch": 0.67, "learning_rate": 0.00019947833369490087, "loss": 0.017, "step": 132830 }, { "epoch": 0.67, "learning_rate": 0.00019947076600188685, "loss": 0.0116, "step": 132840 }, { "epoch": 0.67, "learning_rate": 0.00019946319830887283, "loss": 0.0134, "step": 132850 }, { "epoch": 0.67, "learning_rate": 0.00019945563061585884, "loss": 0.0169, "step": 132860 }, { "epoch": 0.67, "learning_rate": 0.00019944806292284482, "loss": 0.0109, "step": 132870 }, { "epoch": 0.67, "learning_rate": 0.0001994404952298308, "loss": 0.0142, "step": 132880 }, { "epoch": 0.67, "learning_rate": 0.0001994329275368168, "loss": 0.0132, "step": 132890 }, { "epoch": 0.67, "learning_rate": 0.0001994253598438028, "loss": 0.0153, "step": 132900 }, { "epoch": 0.67, "learning_rate": 0.00019941779215078878, "loss": 0.0141, "step": 132910 }, { "epoch": 0.67, "learning_rate": 0.00019941022445777476, "loss": 0.0148, "step": 132920 }, { "epoch": 0.67, "learning_rate": 0.00019940265676476077, "loss": 0.014, "step": 132930 }, { "epoch": 0.67, "learning_rate": 0.00019939508907174675, "loss": 0.0136, "step": 132940 }, { "epoch": 0.67, "learning_rate": 0.00019938752137873273, "loss": 0.0159, "step": 132950 }, { "epoch": 0.67, "learning_rate": 0.00019937995368571874, "loss": 0.0128, "step": 132960 }, { "epoch": 0.67, "learning_rate": 0.00019937238599270472, "loss": 0.0162, "step": 132970 }, { "epoch": 0.67, "learning_rate": 0.0001993648182996907, "loss": 0.0122, "step": 132980 }, { "epoch": 0.67, "learning_rate": 0.0001993572506066767, "loss": 0.0117, "step": 132990 }, { "epoch": 0.67, "learning_rate": 0.0001993496829136627, "loss": 0.0126, "step": 133000 }, { "epoch": 0.67, "eval_cer": 0.9144964565985481, "eval_loss": 0.009822376072406769, "eval_runtime": 116.6404, "eval_samples_per_second": 17.147, "eval_steps_per_second": 4.287, "step": 133000 }, { "epoch": 0.67, "learning_rate": 0.00019934211522064867, "loss": 0.0111, "step": 133010 }, { "epoch": 0.67, "learning_rate": 0.00019933454752763468, "loss": 0.0119, "step": 133020 }, { "epoch": 0.67, "learning_rate": 0.00019932697983462066, "loss": 0.0162, "step": 133030 }, { "epoch": 0.67, "learning_rate": 0.00019931941214160664, "loss": 0.0136, "step": 133040 }, { "epoch": 0.67, "learning_rate": 0.00019931184444859265, "loss": 0.0115, "step": 133050 }, { "epoch": 0.67, "learning_rate": 0.00019930427675557863, "loss": 0.0158, "step": 133060 }, { "epoch": 0.67, "learning_rate": 0.00019929670906256462, "loss": 0.014, "step": 133070 }, { "epoch": 0.67, "learning_rate": 0.0001992891413695506, "loss": 0.0145, "step": 133080 }, { "epoch": 0.67, "learning_rate": 0.0001992815736765366, "loss": 0.0151, "step": 133090 }, { "epoch": 0.67, "learning_rate": 0.00019927400598352259, "loss": 0.0139, "step": 133100 }, { "epoch": 0.67, "learning_rate": 0.00019926643829050857, "loss": 0.0117, "step": 133110 }, { "epoch": 0.67, "learning_rate": 0.00019925887059749458, "loss": 0.0152, "step": 133120 }, { "epoch": 0.67, "learning_rate": 0.00019925130290448056, "loss": 0.0139, "step": 133130 }, { "epoch": 0.67, "learning_rate": 0.00019924373521146654, "loss": 0.0135, "step": 133140 }, { "epoch": 0.67, "learning_rate": 0.00019923616751845255, "loss": 0.0137, "step": 133150 }, { "epoch": 0.67, "learning_rate": 0.00019922859982543853, "loss": 0.0132, "step": 133160 }, { "epoch": 0.67, "learning_rate": 0.0001992210321324245, "loss": 0.0126, "step": 133170 }, { "epoch": 0.67, "learning_rate": 0.00019921346443941052, "loss": 0.0132, "step": 133180 }, { "epoch": 0.67, "learning_rate": 0.0001992058967463965, "loss": 0.0142, "step": 133190 }, { "epoch": 0.67, "learning_rate": 0.00019919832905338248, "loss": 0.0135, "step": 133200 }, { "epoch": 0.67, "learning_rate": 0.0001991907613603685, "loss": 0.012, "step": 133210 }, { "epoch": 0.67, "learning_rate": 0.00019918319366735447, "loss": 0.0154, "step": 133220 }, { "epoch": 0.67, "learning_rate": 0.00019917562597434045, "loss": 0.0119, "step": 133230 }, { "epoch": 0.67, "learning_rate": 0.00019916805828132644, "loss": 0.0132, "step": 133240 }, { "epoch": 0.67, "learning_rate": 0.00019916049058831244, "loss": 0.0139, "step": 133250 }, { "epoch": 0.67, "learning_rate": 0.00019915292289529843, "loss": 0.016, "step": 133260 }, { "epoch": 0.67, "learning_rate": 0.0001991453552022844, "loss": 0.0159, "step": 133270 }, { "epoch": 0.67, "learning_rate": 0.00019913778750927042, "loss": 0.017, "step": 133280 }, { "epoch": 0.67, "learning_rate": 0.0001991302198162564, "loss": 0.0142, "step": 133290 }, { "epoch": 0.67, "learning_rate": 0.00019912265212324238, "loss": 0.0113, "step": 133300 }, { "epoch": 0.67, "learning_rate": 0.0001991150844302284, "loss": 0.0138, "step": 133310 }, { "epoch": 0.67, "learning_rate": 0.00019910751673721437, "loss": 0.0151, "step": 133320 }, { "epoch": 0.67, "learning_rate": 0.00019909994904420035, "loss": 0.0111, "step": 133330 }, { "epoch": 0.67, "learning_rate": 0.00019909238135118636, "loss": 0.0135, "step": 133340 }, { "epoch": 0.67, "learning_rate": 0.00019908481365817234, "loss": 0.0143, "step": 133350 }, { "epoch": 0.67, "learning_rate": 0.00019907724596515832, "loss": 0.0141, "step": 133360 }, { "epoch": 0.67, "learning_rate": 0.00019906967827214433, "loss": 0.0137, "step": 133370 }, { "epoch": 0.67, "learning_rate": 0.0001990621105791303, "loss": 0.0222, "step": 133380 }, { "epoch": 0.67, "learning_rate": 0.0001990545428861163, "loss": 0.0161, "step": 133390 }, { "epoch": 0.67, "learning_rate": 0.00019904697519310227, "loss": 0.0142, "step": 133400 }, { "epoch": 0.67, "learning_rate": 0.00019903940750008828, "loss": 0.0174, "step": 133410 }, { "epoch": 0.67, "learning_rate": 0.00019903183980707426, "loss": 0.0133, "step": 133420 }, { "epoch": 0.67, "learning_rate": 0.00019902427211406025, "loss": 0.0131, "step": 133430 }, { "epoch": 0.67, "learning_rate": 0.00019901670442104625, "loss": 0.0162, "step": 133440 }, { "epoch": 0.67, "learning_rate": 0.00019900913672803224, "loss": 0.0132, "step": 133450 }, { "epoch": 0.67, "learning_rate": 0.00019900156903501822, "loss": 0.014, "step": 133460 }, { "epoch": 0.67, "learning_rate": 0.00019899400134200423, "loss": 0.0126, "step": 133470 }, { "epoch": 0.67, "learning_rate": 0.0001989864336489902, "loss": 0.0117, "step": 133480 }, { "epoch": 0.67, "learning_rate": 0.0001989788659559762, "loss": 0.0151, "step": 133490 }, { "epoch": 0.67, "learning_rate": 0.0001989712982629622, "loss": 0.0167, "step": 133500 }, { "epoch": 0.67, "learning_rate": 0.00019896373056994818, "loss": 0.0134, "step": 133510 }, { "epoch": 0.67, "learning_rate": 0.00019895616287693416, "loss": 0.0131, "step": 133520 }, { "epoch": 0.67, "learning_rate": 0.00019894859518392017, "loss": 0.0181, "step": 133530 }, { "epoch": 0.67, "learning_rate": 0.00019894102749090615, "loss": 0.0124, "step": 133540 }, { "epoch": 0.67, "learning_rate": 0.00019893345979789213, "loss": 0.0133, "step": 133550 }, { "epoch": 0.67, "learning_rate": 0.00019892589210487814, "loss": 0.0145, "step": 133560 }, { "epoch": 0.67, "learning_rate": 0.00019891832441186412, "loss": 0.0111, "step": 133570 }, { "epoch": 0.67, "learning_rate": 0.0001989107567188501, "loss": 0.0136, "step": 133580 }, { "epoch": 0.67, "learning_rate": 0.00019890318902583608, "loss": 0.0133, "step": 133590 }, { "epoch": 0.67, "learning_rate": 0.0001988956213328221, "loss": 0.0127, "step": 133600 }, { "epoch": 0.67, "learning_rate": 0.00019888805363980807, "loss": 0.0153, "step": 133610 }, { "epoch": 0.67, "learning_rate": 0.00019888048594679406, "loss": 0.0156, "step": 133620 }, { "epoch": 0.67, "learning_rate": 0.00019887291825378006, "loss": 0.0149, "step": 133630 }, { "epoch": 0.67, "learning_rate": 0.00019886535056076605, "loss": 0.0124, "step": 133640 }, { "epoch": 0.67, "learning_rate": 0.00019885778286775203, "loss": 0.0134, "step": 133650 }, { "epoch": 0.67, "learning_rate": 0.00019885021517473804, "loss": 0.0127, "step": 133660 }, { "epoch": 0.67, "learning_rate": 0.00019884264748172402, "loss": 0.0143, "step": 133670 }, { "epoch": 0.67, "learning_rate": 0.00019883507978871, "loss": 0.0136, "step": 133680 }, { "epoch": 0.67, "learning_rate": 0.000198827512095696, "loss": 0.017, "step": 133690 }, { "epoch": 0.67, "learning_rate": 0.000198819944402682, "loss": 0.0152, "step": 133700 }, { "epoch": 0.67, "learning_rate": 0.00019881237670966797, "loss": 0.0143, "step": 133710 }, { "epoch": 0.67, "learning_rate": 0.00019880480901665398, "loss": 0.0131, "step": 133720 }, { "epoch": 0.67, "learning_rate": 0.00019879724132363996, "loss": 0.0134, "step": 133730 }, { "epoch": 0.67, "learning_rate": 0.00019878967363062594, "loss": 0.0125, "step": 133740 }, { "epoch": 0.67, "learning_rate": 0.00019878210593761192, "loss": 0.0173, "step": 133750 }, { "epoch": 0.67, "learning_rate": 0.00019877453824459793, "loss": 0.0147, "step": 133760 }, { "epoch": 0.67, "learning_rate": 0.0001987669705515839, "loss": 0.0143, "step": 133770 }, { "epoch": 0.67, "learning_rate": 0.0001987594028585699, "loss": 0.0199, "step": 133780 }, { "epoch": 0.67, "learning_rate": 0.0001987518351655559, "loss": 0.0149, "step": 133790 }, { "epoch": 0.68, "learning_rate": 0.00019874426747254188, "loss": 0.0138, "step": 133800 }, { "epoch": 0.68, "learning_rate": 0.00019873669977952787, "loss": 0.0168, "step": 133810 }, { "epoch": 0.68, "learning_rate": 0.00019872913208651387, "loss": 0.0164, "step": 133820 }, { "epoch": 0.68, "learning_rate": 0.00019872156439349986, "loss": 0.0147, "step": 133830 }, { "epoch": 0.68, "learning_rate": 0.00019871399670048584, "loss": 0.0139, "step": 133840 }, { "epoch": 0.68, "learning_rate": 0.00019870642900747185, "loss": 0.0138, "step": 133850 }, { "epoch": 0.68, "learning_rate": 0.0001986988613144578, "loss": 0.0147, "step": 133860 }, { "epoch": 0.68, "learning_rate": 0.00019869129362144378, "loss": 0.0134, "step": 133870 }, { "epoch": 0.68, "learning_rate": 0.00019868372592842976, "loss": 0.0165, "step": 133880 }, { "epoch": 0.68, "learning_rate": 0.00019867615823541577, "loss": 0.0134, "step": 133890 }, { "epoch": 0.68, "learning_rate": 0.00019866859054240175, "loss": 0.0158, "step": 133900 }, { "epoch": 0.68, "learning_rate": 0.00019866102284938773, "loss": 0.0148, "step": 133910 }, { "epoch": 0.68, "learning_rate": 0.00019865345515637374, "loss": 0.0147, "step": 133920 }, { "epoch": 0.68, "learning_rate": 0.00019864588746335972, "loss": 0.0124, "step": 133930 }, { "epoch": 0.68, "learning_rate": 0.0001986383197703457, "loss": 0.014, "step": 133940 }, { "epoch": 0.68, "learning_rate": 0.00019863075207733171, "loss": 0.0327, "step": 133950 }, { "epoch": 0.68, "learning_rate": 0.0001986231843843177, "loss": 0.0124, "step": 133960 }, { "epoch": 0.68, "learning_rate": 0.00019861561669130368, "loss": 0.0166, "step": 133970 }, { "epoch": 0.68, "learning_rate": 0.00019860804899828966, "loss": 0.0152, "step": 133980 }, { "epoch": 0.68, "learning_rate": 0.00019860048130527567, "loss": 0.0125, "step": 133990 }, { "epoch": 0.68, "learning_rate": 0.00019859291361226165, "loss": 0.0116, "step": 134000 }, { "epoch": 0.68, "eval_cer": 0.9144634631302844, "eval_loss": 0.009661918506026268, "eval_runtime": 116.6673, "eval_samples_per_second": 17.143, "eval_steps_per_second": 4.286, "step": 134000 }, { "epoch": 0.68, "learning_rate": 0.00019858534591924763, "loss": 0.0112, "step": 134010 }, { "epoch": 0.68, "learning_rate": 0.00019857777822623364, "loss": 0.0165, "step": 134020 }, { "epoch": 0.68, "learning_rate": 0.00019857021053321962, "loss": 0.0158, "step": 134030 }, { "epoch": 0.68, "learning_rate": 0.0001985626428402056, "loss": 0.014, "step": 134040 }, { "epoch": 0.68, "learning_rate": 0.0001985550751471916, "loss": 0.0279, "step": 134050 }, { "epoch": 0.68, "learning_rate": 0.0001985475074541776, "loss": 0.0158, "step": 134060 }, { "epoch": 0.68, "learning_rate": 0.00019853993976116357, "loss": 0.0154, "step": 134070 }, { "epoch": 0.68, "learning_rate": 0.00019853237206814958, "loss": 0.0199, "step": 134080 }, { "epoch": 0.68, "learning_rate": 0.00019852480437513556, "loss": 0.014, "step": 134090 }, { "epoch": 0.68, "learning_rate": 0.00019851723668212154, "loss": 0.0144, "step": 134100 }, { "epoch": 0.68, "learning_rate": 0.00019850966898910755, "loss": 0.0148, "step": 134110 }, { "epoch": 0.68, "learning_rate": 0.00019850210129609353, "loss": 0.0191, "step": 134120 }, { "epoch": 0.68, "learning_rate": 0.00019849453360307952, "loss": 0.0129, "step": 134130 }, { "epoch": 0.68, "learning_rate": 0.0001984869659100655, "loss": 0.0112, "step": 134140 }, { "epoch": 0.68, "learning_rate": 0.0001984793982170515, "loss": 0.0142, "step": 134150 }, { "epoch": 0.68, "learning_rate": 0.0001984718305240375, "loss": 0.0197, "step": 134160 }, { "epoch": 0.68, "learning_rate": 0.00019846426283102347, "loss": 0.0161, "step": 134170 }, { "epoch": 0.68, "learning_rate": 0.00019845669513800948, "loss": 0.0147, "step": 134180 }, { "epoch": 0.68, "learning_rate": 0.00019844912744499546, "loss": 0.0188, "step": 134190 }, { "epoch": 0.68, "learning_rate": 0.00019844155975198144, "loss": 0.014, "step": 134200 }, { "epoch": 0.68, "learning_rate": 0.00019843399205896745, "loss": 0.0116, "step": 134210 }, { "epoch": 0.68, "learning_rate": 0.00019842642436595343, "loss": 0.0155, "step": 134220 }, { "epoch": 0.68, "learning_rate": 0.0001984188566729394, "loss": 0.0154, "step": 134230 }, { "epoch": 0.68, "learning_rate": 0.00019841128897992542, "loss": 0.0153, "step": 134240 }, { "epoch": 0.68, "learning_rate": 0.0001984037212869114, "loss": 0.0159, "step": 134250 }, { "epoch": 0.68, "learning_rate": 0.00019839615359389738, "loss": 0.0147, "step": 134260 }, { "epoch": 0.68, "learning_rate": 0.0001983885859008834, "loss": 0.0141, "step": 134270 }, { "epoch": 0.68, "learning_rate": 0.00019838101820786937, "loss": 0.0137, "step": 134280 }, { "epoch": 0.68, "learning_rate": 0.00019837345051485535, "loss": 0.014, "step": 134290 }, { "epoch": 0.68, "learning_rate": 0.00019836588282184134, "loss": 0.0135, "step": 134300 }, { "epoch": 0.68, "learning_rate": 0.00019835831512882734, "loss": 0.0129, "step": 134310 }, { "epoch": 0.68, "learning_rate": 0.00019835074743581333, "loss": 0.016, "step": 134320 }, { "epoch": 0.68, "learning_rate": 0.0001983431797427993, "loss": 0.0169, "step": 134330 }, { "epoch": 0.68, "learning_rate": 0.00019833561204978532, "loss": 0.0161, "step": 134340 }, { "epoch": 0.68, "learning_rate": 0.0001983280443567713, "loss": 0.0122, "step": 134350 }, { "epoch": 0.68, "learning_rate": 0.00019832047666375728, "loss": 0.0151, "step": 134360 }, { "epoch": 0.68, "learning_rate": 0.0001983129089707433, "loss": 0.0157, "step": 134370 }, { "epoch": 0.68, "learning_rate": 0.00019830534127772927, "loss": 0.0123, "step": 134380 }, { "epoch": 0.68, "learning_rate": 0.00019829777358471525, "loss": 0.0123, "step": 134390 }, { "epoch": 0.68, "learning_rate": 0.00019829020589170126, "loss": 0.0128, "step": 134400 }, { "epoch": 0.68, "learning_rate": 0.00019828263819868724, "loss": 0.015, "step": 134410 }, { "epoch": 0.68, "learning_rate": 0.00019827507050567322, "loss": 0.0152, "step": 134420 }, { "epoch": 0.68, "learning_rate": 0.00019826750281265923, "loss": 0.0142, "step": 134430 }, { "epoch": 0.68, "learning_rate": 0.0001982599351196452, "loss": 0.0155, "step": 134440 }, { "epoch": 0.68, "learning_rate": 0.0001982523674266312, "loss": 0.0137, "step": 134450 }, { "epoch": 0.68, "learning_rate": 0.0001982447997336172, "loss": 0.0117, "step": 134460 }, { "epoch": 0.68, "learning_rate": 0.00019823723204060318, "loss": 0.0139, "step": 134470 }, { "epoch": 0.68, "learning_rate": 0.00019822966434758916, "loss": 0.0139, "step": 134480 }, { "epoch": 0.68, "learning_rate": 0.00019822209665457515, "loss": 0.0126, "step": 134490 }, { "epoch": 0.68, "learning_rate": 0.00019821452896156115, "loss": 0.0156, "step": 134500 }, { "epoch": 0.68, "learning_rate": 0.00019820696126854714, "loss": 0.0141, "step": 134510 }, { "epoch": 0.68, "learning_rate": 0.00019819939357553312, "loss": 0.0152, "step": 134520 }, { "epoch": 0.68, "learning_rate": 0.00019819182588251913, "loss": 0.0165, "step": 134530 }, { "epoch": 0.68, "learning_rate": 0.0001981842581895051, "loss": 0.0133, "step": 134540 }, { "epoch": 0.68, "learning_rate": 0.0001981766904964911, "loss": 0.0151, "step": 134550 }, { "epoch": 0.68, "learning_rate": 0.0001981691228034771, "loss": 0.0169, "step": 134560 }, { "epoch": 0.68, "learning_rate": 0.00019816155511046308, "loss": 0.014, "step": 134570 }, { "epoch": 0.68, "learning_rate": 0.00019815398741744906, "loss": 0.0189, "step": 134580 }, { "epoch": 0.68, "learning_rate": 0.00019814641972443507, "loss": 0.0148, "step": 134590 }, { "epoch": 0.68, "learning_rate": 0.00019813885203142105, "loss": 0.0132, "step": 134600 }, { "epoch": 0.68, "learning_rate": 0.00019813128433840703, "loss": 0.0138, "step": 134610 }, { "epoch": 0.68, "learning_rate": 0.00019812371664539304, "loss": 0.0141, "step": 134620 }, { "epoch": 0.68, "learning_rate": 0.00019811614895237902, "loss": 0.0151, "step": 134630 }, { "epoch": 0.68, "learning_rate": 0.000198108581259365, "loss": 0.0166, "step": 134640 }, { "epoch": 0.68, "learning_rate": 0.00019810101356635098, "loss": 0.0142, "step": 134650 }, { "epoch": 0.68, "learning_rate": 0.000198093445873337, "loss": 0.0141, "step": 134660 }, { "epoch": 0.68, "learning_rate": 0.00019808587818032297, "loss": 0.0137, "step": 134670 }, { "epoch": 0.68, "learning_rate": 0.00019807831048730896, "loss": 0.0123, "step": 134680 }, { "epoch": 0.68, "learning_rate": 0.00019807074279429496, "loss": 0.0149, "step": 134690 }, { "epoch": 0.68, "learning_rate": 0.00019806317510128095, "loss": 0.0125, "step": 134700 }, { "epoch": 0.68, "learning_rate": 0.00019805560740826693, "loss": 0.0145, "step": 134710 }, { "epoch": 0.68, "learning_rate": 0.00019804803971525294, "loss": 0.0112, "step": 134720 }, { "epoch": 0.68, "learning_rate": 0.00019804047202223892, "loss": 0.014, "step": 134730 }, { "epoch": 0.68, "learning_rate": 0.0001980329043292249, "loss": 0.0117, "step": 134740 }, { "epoch": 0.68, "learning_rate": 0.0001980253366362109, "loss": 0.0125, "step": 134750 }, { "epoch": 0.68, "learning_rate": 0.0001980177689431969, "loss": 0.0136, "step": 134760 }, { "epoch": 0.68, "learning_rate": 0.00019801020125018287, "loss": 0.0134, "step": 134770 }, { "epoch": 0.68, "learning_rate": 0.00019800263355716888, "loss": 0.013, "step": 134780 }, { "epoch": 0.68, "learning_rate": 0.00019799506586415486, "loss": 0.0126, "step": 134790 }, { "epoch": 0.68, "learning_rate": 0.00019798749817114084, "loss": 0.0148, "step": 134800 }, { "epoch": 0.68, "learning_rate": 0.00019797993047812682, "loss": 0.014, "step": 134810 }, { "epoch": 0.68, "learning_rate": 0.00019797236278511283, "loss": 0.0144, "step": 134820 }, { "epoch": 0.68, "learning_rate": 0.0001979647950920988, "loss": 0.0155, "step": 134830 }, { "epoch": 0.68, "learning_rate": 0.0001979572273990848, "loss": 0.0149, "step": 134840 }, { "epoch": 0.68, "learning_rate": 0.0001979496597060708, "loss": 0.0176, "step": 134850 }, { "epoch": 0.68, "learning_rate": 0.00019794209201305678, "loss": 0.0131, "step": 134860 }, { "epoch": 0.68, "learning_rate": 0.00019793452432004277, "loss": 0.0146, "step": 134870 }, { "epoch": 0.68, "learning_rate": 0.00019792695662702877, "loss": 0.0134, "step": 134880 }, { "epoch": 0.68, "learning_rate": 0.00019791938893401476, "loss": 0.0142, "step": 134890 }, { "epoch": 0.68, "learning_rate": 0.00019791182124100074, "loss": 0.0109, "step": 134900 }, { "epoch": 0.68, "learning_rate": 0.00019790425354798675, "loss": 0.013, "step": 134910 }, { "epoch": 0.68, "learning_rate": 0.00019789668585497273, "loss": 0.0203, "step": 134920 }, { "epoch": 0.68, "learning_rate": 0.0001978891181619587, "loss": 0.0123, "step": 134930 }, { "epoch": 0.68, "learning_rate": 0.00019788155046894472, "loss": 0.0158, "step": 134940 }, { "epoch": 0.68, "learning_rate": 0.0001978739827759307, "loss": 0.0146, "step": 134950 }, { "epoch": 0.68, "learning_rate": 0.00019786641508291668, "loss": 0.0126, "step": 134960 }, { "epoch": 0.68, "learning_rate": 0.0001978588473899027, "loss": 0.0152, "step": 134970 }, { "epoch": 0.68, "learning_rate": 0.00019785127969688867, "loss": 0.0125, "step": 134980 }, { "epoch": 0.68, "learning_rate": 0.00019784371200387465, "loss": 0.0143, "step": 134990 }, { "epoch": 0.68, "learning_rate": 0.00019783614431086063, "loss": 0.0117, "step": 135000 }, { "epoch": 0.68, "eval_cer": 0.9144663743186606, "eval_loss": 0.00933473464101553, "eval_runtime": 116.6822, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 135000 }, { "epoch": 0.68, "learning_rate": 0.00019782857661784664, "loss": 0.0122, "step": 135010 }, { "epoch": 0.68, "learning_rate": 0.00019782100892483262, "loss": 0.0107, "step": 135020 }, { "epoch": 0.68, "learning_rate": 0.0001978134412318186, "loss": 0.015, "step": 135030 }, { "epoch": 0.68, "learning_rate": 0.0001978058735388046, "loss": 0.014, "step": 135040 }, { "epoch": 0.68, "learning_rate": 0.0001977983058457906, "loss": 0.019, "step": 135050 }, { "epoch": 0.68, "learning_rate": 0.00019779073815277658, "loss": 0.0179, "step": 135060 }, { "epoch": 0.68, "learning_rate": 0.00019778317045976258, "loss": 0.0143, "step": 135070 }, { "epoch": 0.68, "learning_rate": 0.00019777560276674857, "loss": 0.0168, "step": 135080 }, { "epoch": 0.68, "learning_rate": 0.00019776803507373455, "loss": 0.0132, "step": 135090 }, { "epoch": 0.68, "learning_rate": 0.00019776046738072056, "loss": 0.0127, "step": 135100 }, { "epoch": 0.68, "learning_rate": 0.00019775289968770654, "loss": 0.0127, "step": 135110 }, { "epoch": 0.68, "learning_rate": 0.0001977453319946925, "loss": 0.0143, "step": 135120 }, { "epoch": 0.68, "learning_rate": 0.00019773776430167847, "loss": 0.0116, "step": 135130 }, { "epoch": 0.68, "learning_rate": 0.00019773019660866448, "loss": 0.0169, "step": 135140 }, { "epoch": 0.68, "learning_rate": 0.00019772262891565046, "loss": 0.0111, "step": 135150 }, { "epoch": 0.68, "learning_rate": 0.00019771506122263644, "loss": 0.0118, "step": 135160 }, { "epoch": 0.68, "learning_rate": 0.00019770749352962245, "loss": 0.0142, "step": 135170 }, { "epoch": 0.68, "learning_rate": 0.00019769992583660843, "loss": 0.0148, "step": 135180 }, { "epoch": 0.68, "learning_rate": 0.00019769235814359442, "loss": 0.0119, "step": 135190 }, { "epoch": 0.68, "learning_rate": 0.0001976847904505804, "loss": 0.0158, "step": 135200 }, { "epoch": 0.68, "learning_rate": 0.0001976772227575664, "loss": 0.0143, "step": 135210 }, { "epoch": 0.68, "learning_rate": 0.0001976696550645524, "loss": 0.0149, "step": 135220 }, { "epoch": 0.68, "learning_rate": 0.00019766208737153837, "loss": 0.0147, "step": 135230 }, { "epoch": 0.68, "learning_rate": 0.00019765451967852438, "loss": 0.0117, "step": 135240 }, { "epoch": 0.68, "learning_rate": 0.00019764695198551036, "loss": 0.0128, "step": 135250 }, { "epoch": 0.68, "learning_rate": 0.00019763938429249634, "loss": 0.0205, "step": 135260 }, { "epoch": 0.68, "learning_rate": 0.00019763181659948235, "loss": 0.011, "step": 135270 }, { "epoch": 0.68, "learning_rate": 0.00019762424890646833, "loss": 0.0122, "step": 135280 }, { "epoch": 0.68, "learning_rate": 0.0001976166812134543, "loss": 0.0129, "step": 135290 }, { "epoch": 0.68, "learning_rate": 0.00019760911352044032, "loss": 0.0136, "step": 135300 }, { "epoch": 0.68, "learning_rate": 0.0001976015458274263, "loss": 0.0141, "step": 135310 }, { "epoch": 0.68, "learning_rate": 0.00019759397813441228, "loss": 0.0129, "step": 135320 }, { "epoch": 0.68, "learning_rate": 0.0001975864104413983, "loss": 0.0111, "step": 135330 }, { "epoch": 0.68, "learning_rate": 0.00019757884274838427, "loss": 0.0113, "step": 135340 }, { "epoch": 0.68, "learning_rate": 0.00019757127505537025, "loss": 0.0137, "step": 135350 }, { "epoch": 0.68, "learning_rate": 0.00019756370736235626, "loss": 0.0151, "step": 135360 }, { "epoch": 0.68, "learning_rate": 0.00019755613966934224, "loss": 0.0134, "step": 135370 }, { "epoch": 0.68, "learning_rate": 0.00019754857197632823, "loss": 0.0149, "step": 135380 }, { "epoch": 0.68, "learning_rate": 0.0001975410042833142, "loss": 0.0132, "step": 135390 }, { "epoch": 0.68, "learning_rate": 0.00019753343659030022, "loss": 0.014, "step": 135400 }, { "epoch": 0.68, "learning_rate": 0.0001975258688972862, "loss": 0.0124, "step": 135410 }, { "epoch": 0.68, "learning_rate": 0.00019751830120427218, "loss": 0.0117, "step": 135420 }, { "epoch": 0.68, "learning_rate": 0.0001975107335112582, "loss": 0.0134, "step": 135430 }, { "epoch": 0.68, "learning_rate": 0.00019750316581824417, "loss": 0.0148, "step": 135440 }, { "epoch": 0.68, "learning_rate": 0.00019749559812523015, "loss": 0.0132, "step": 135450 }, { "epoch": 0.68, "learning_rate": 0.00019748803043221616, "loss": 0.013, "step": 135460 }, { "epoch": 0.68, "learning_rate": 0.00019748046273920214, "loss": 0.0108, "step": 135470 }, { "epoch": 0.68, "learning_rate": 0.00019747289504618812, "loss": 0.0133, "step": 135480 }, { "epoch": 0.68, "learning_rate": 0.00019746532735317413, "loss": 0.0164, "step": 135490 }, { "epoch": 0.68, "learning_rate": 0.0001974577596601601, "loss": 0.0146, "step": 135500 }, { "epoch": 0.68, "learning_rate": 0.0001974501919671461, "loss": 0.0148, "step": 135510 }, { "epoch": 0.68, "learning_rate": 0.0001974426242741321, "loss": 0.0177, "step": 135520 }, { "epoch": 0.68, "learning_rate": 0.00019743505658111808, "loss": 0.0128, "step": 135530 }, { "epoch": 0.68, "learning_rate": 0.00019742748888810406, "loss": 0.0183, "step": 135540 }, { "epoch": 0.68, "learning_rate": 0.00019741992119509005, "loss": 0.0151, "step": 135550 }, { "epoch": 0.68, "learning_rate": 0.00019741235350207605, "loss": 0.0183, "step": 135560 }, { "epoch": 0.68, "learning_rate": 0.00019740478580906204, "loss": 0.0148, "step": 135570 }, { "epoch": 0.68, "learning_rate": 0.00019739721811604802, "loss": 0.0146, "step": 135580 }, { "epoch": 0.68, "learning_rate": 0.00019738965042303403, "loss": 0.0162, "step": 135590 }, { "epoch": 0.68, "learning_rate": 0.00019738208273002, "loss": 0.0134, "step": 135600 }, { "epoch": 0.68, "learning_rate": 0.000197374515037006, "loss": 0.0136, "step": 135610 }, { "epoch": 0.68, "learning_rate": 0.000197366947343992, "loss": 0.0145, "step": 135620 }, { "epoch": 0.68, "learning_rate": 0.00019735937965097798, "loss": 0.0105, "step": 135630 }, { "epoch": 0.68, "learning_rate": 0.00019735181195796396, "loss": 0.0102, "step": 135640 }, { "epoch": 0.68, "learning_rate": 0.00019734424426494997, "loss": 0.013, "step": 135650 }, { "epoch": 0.68, "learning_rate": 0.00019733667657193595, "loss": 0.0098, "step": 135660 }, { "epoch": 0.68, "learning_rate": 0.00019732910887892193, "loss": 0.0126, "step": 135670 }, { "epoch": 0.68, "learning_rate": 0.00019732154118590794, "loss": 0.0154, "step": 135680 }, { "epoch": 0.68, "learning_rate": 0.00019731397349289392, "loss": 0.0128, "step": 135690 }, { "epoch": 0.68, "learning_rate": 0.0001973064057998799, "loss": 0.0131, "step": 135700 }, { "epoch": 0.68, "learning_rate": 0.00019729883810686588, "loss": 0.0124, "step": 135710 }, { "epoch": 0.68, "learning_rate": 0.0001972912704138519, "loss": 0.0122, "step": 135720 }, { "epoch": 0.68, "learning_rate": 0.00019728370272083787, "loss": 0.0134, "step": 135730 }, { "epoch": 0.68, "learning_rate": 0.00019727613502782386, "loss": 0.0138, "step": 135740 }, { "epoch": 0.68, "learning_rate": 0.00019726856733480986, "loss": 0.0124, "step": 135750 }, { "epoch": 0.68, "learning_rate": 0.00019726099964179585, "loss": 0.0137, "step": 135760 }, { "epoch": 0.68, "learning_rate": 0.00019725343194878183, "loss": 0.0131, "step": 135770 }, { "epoch": 0.69, "learning_rate": 0.00019724586425576784, "loss": 0.0148, "step": 135780 }, { "epoch": 0.69, "learning_rate": 0.00019723829656275382, "loss": 0.0161, "step": 135790 }, { "epoch": 0.69, "learning_rate": 0.0001972307288697398, "loss": 0.0136, "step": 135800 }, { "epoch": 0.69, "learning_rate": 0.0001972231611767258, "loss": 0.0111, "step": 135810 }, { "epoch": 0.69, "learning_rate": 0.0001972155934837118, "loss": 0.0104, "step": 135820 }, { "epoch": 0.69, "learning_rate": 0.00019720802579069777, "loss": 0.0129, "step": 135830 }, { "epoch": 0.69, "learning_rate": 0.00019720045809768378, "loss": 0.0123, "step": 135840 }, { "epoch": 0.69, "learning_rate": 0.00019719289040466976, "loss": 0.0154, "step": 135850 }, { "epoch": 0.69, "learning_rate": 0.00019718532271165574, "loss": 0.0106, "step": 135860 }, { "epoch": 0.69, "learning_rate": 0.00019717775501864175, "loss": 0.0124, "step": 135870 }, { "epoch": 0.69, "learning_rate": 0.00019717018732562773, "loss": 0.0121, "step": 135880 }, { "epoch": 0.69, "learning_rate": 0.0001971626196326137, "loss": 0.0112, "step": 135890 }, { "epoch": 0.69, "learning_rate": 0.0001971550519395997, "loss": 0.0111, "step": 135900 }, { "epoch": 0.69, "learning_rate": 0.0001971474842465857, "loss": 0.0161, "step": 135910 }, { "epoch": 0.69, "learning_rate": 0.00019713991655357168, "loss": 0.0132, "step": 135920 }, { "epoch": 0.69, "learning_rate": 0.00019713234886055767, "loss": 0.0151, "step": 135930 }, { "epoch": 0.69, "learning_rate": 0.00019712478116754367, "loss": 0.0137, "step": 135940 }, { "epoch": 0.69, "learning_rate": 0.00019711721347452966, "loss": 0.0143, "step": 135950 }, { "epoch": 0.69, "learning_rate": 0.00019710964578151564, "loss": 0.0124, "step": 135960 }, { "epoch": 0.69, "learning_rate": 0.00019710207808850165, "loss": 0.0159, "step": 135970 }, { "epoch": 0.69, "learning_rate": 0.00019709451039548763, "loss": 0.0162, "step": 135980 }, { "epoch": 0.69, "learning_rate": 0.0001970869427024736, "loss": 0.0157, "step": 135990 }, { "epoch": 0.69, "learning_rate": 0.00019707937500945962, "loss": 0.0106, "step": 136000 }, { "epoch": 0.69, "eval_cer": 0.9144586111496574, "eval_loss": 0.009702920913696289, "eval_runtime": 116.6777, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 136000 }, { "epoch": 0.69, "learning_rate": 0.0001970718073164456, "loss": 0.0132, "step": 136010 }, { "epoch": 0.69, "learning_rate": 0.00019706423962343158, "loss": 0.011, "step": 136020 }, { "epoch": 0.69, "learning_rate": 0.0001970566719304176, "loss": 0.0127, "step": 136030 }, { "epoch": 0.69, "learning_rate": 0.00019704910423740357, "loss": 0.017, "step": 136040 }, { "epoch": 0.69, "learning_rate": 0.00019704153654438955, "loss": 0.0134, "step": 136050 }, { "epoch": 0.69, "learning_rate": 0.00019703396885137553, "loss": 0.0156, "step": 136060 }, { "epoch": 0.69, "learning_rate": 0.00019702640115836154, "loss": 0.0128, "step": 136070 }, { "epoch": 0.69, "learning_rate": 0.00019701883346534752, "loss": 0.0122, "step": 136080 }, { "epoch": 0.69, "learning_rate": 0.0001970112657723335, "loss": 0.0161, "step": 136090 }, { "epoch": 0.69, "learning_rate": 0.0001970036980793195, "loss": 0.0111, "step": 136100 }, { "epoch": 0.69, "learning_rate": 0.0001969961303863055, "loss": 0.0135, "step": 136110 }, { "epoch": 0.69, "learning_rate": 0.00019698856269329148, "loss": 0.0146, "step": 136120 }, { "epoch": 0.69, "learning_rate": 0.00019698099500027748, "loss": 0.0135, "step": 136130 }, { "epoch": 0.69, "learning_rate": 0.00019697342730726347, "loss": 0.0135, "step": 136140 }, { "epoch": 0.69, "learning_rate": 0.00019696585961424945, "loss": 0.0127, "step": 136150 }, { "epoch": 0.69, "learning_rate": 0.00019695829192123546, "loss": 0.0135, "step": 136160 }, { "epoch": 0.69, "learning_rate": 0.00019695072422822144, "loss": 0.0124, "step": 136170 }, { "epoch": 0.69, "learning_rate": 0.00019694315653520742, "loss": 0.0131, "step": 136180 }, { "epoch": 0.69, "learning_rate": 0.00019693558884219343, "loss": 0.0183, "step": 136190 }, { "epoch": 0.69, "learning_rate": 0.0001969280211491794, "loss": 0.0163, "step": 136200 }, { "epoch": 0.69, "learning_rate": 0.0001969204534561654, "loss": 0.0133, "step": 136210 }, { "epoch": 0.69, "learning_rate": 0.00019691288576315137, "loss": 0.0157, "step": 136220 }, { "epoch": 0.69, "learning_rate": 0.00019690531807013738, "loss": 0.0134, "step": 136230 }, { "epoch": 0.69, "learning_rate": 0.00019689775037712336, "loss": 0.014, "step": 136240 }, { "epoch": 0.69, "learning_rate": 0.00019689018268410934, "loss": 0.0109, "step": 136250 }, { "epoch": 0.69, "learning_rate": 0.00019688261499109535, "loss": 0.0135, "step": 136260 }, { "epoch": 0.69, "learning_rate": 0.00019687504729808133, "loss": 0.0123, "step": 136270 }, { "epoch": 0.69, "learning_rate": 0.00019686747960506731, "loss": 0.0179, "step": 136280 }, { "epoch": 0.69, "learning_rate": 0.00019685991191205332, "loss": 0.0127, "step": 136290 }, { "epoch": 0.69, "learning_rate": 0.0001968523442190393, "loss": 0.0116, "step": 136300 }, { "epoch": 0.69, "learning_rate": 0.00019684477652602529, "loss": 0.0128, "step": 136310 }, { "epoch": 0.69, "learning_rate": 0.0001968372088330113, "loss": 0.0176, "step": 136320 }, { "epoch": 0.69, "learning_rate": 0.00019682964113999728, "loss": 0.0134, "step": 136330 }, { "epoch": 0.69, "learning_rate": 0.00019682207344698326, "loss": 0.0114, "step": 136340 }, { "epoch": 0.69, "learning_rate": 0.00019681450575396927, "loss": 0.014, "step": 136350 }, { "epoch": 0.69, "learning_rate": 0.00019680693806095525, "loss": 0.0137, "step": 136360 }, { "epoch": 0.69, "learning_rate": 0.00019679937036794123, "loss": 0.0153, "step": 136370 }, { "epoch": 0.69, "learning_rate": 0.00019679180267492718, "loss": 0.0135, "step": 136380 }, { "epoch": 0.69, "learning_rate": 0.0001967842349819132, "loss": 0.011, "step": 136390 }, { "epoch": 0.69, "learning_rate": 0.00019677666728889917, "loss": 0.0117, "step": 136400 }, { "epoch": 0.69, "learning_rate": 0.00019676909959588515, "loss": 0.0144, "step": 136410 }, { "epoch": 0.69, "learning_rate": 0.00019676153190287116, "loss": 0.0189, "step": 136420 }, { "epoch": 0.69, "learning_rate": 0.00019675396420985714, "loss": 0.0138, "step": 136430 }, { "epoch": 0.69, "learning_rate": 0.00019674639651684313, "loss": 0.0149, "step": 136440 }, { "epoch": 0.69, "learning_rate": 0.0001967388288238291, "loss": 0.0118, "step": 136450 }, { "epoch": 0.69, "learning_rate": 0.00019673126113081512, "loss": 0.0119, "step": 136460 }, { "epoch": 0.69, "learning_rate": 0.0001967236934378011, "loss": 0.0147, "step": 136470 }, { "epoch": 0.69, "learning_rate": 0.00019671612574478708, "loss": 0.0142, "step": 136480 }, { "epoch": 0.69, "learning_rate": 0.0001967085580517731, "loss": 0.012, "step": 136490 }, { "epoch": 0.69, "learning_rate": 0.00019670099035875907, "loss": 0.0116, "step": 136500 }, { "epoch": 0.69, "learning_rate": 0.00019669342266574505, "loss": 0.0124, "step": 136510 }, { "epoch": 0.69, "learning_rate": 0.00019668585497273106, "loss": 0.0137, "step": 136520 }, { "epoch": 0.69, "learning_rate": 0.00019667828727971704, "loss": 0.0134, "step": 136530 }, { "epoch": 0.69, "learning_rate": 0.00019667071958670302, "loss": 0.0137, "step": 136540 }, { "epoch": 0.69, "learning_rate": 0.00019666315189368903, "loss": 0.013, "step": 136550 }, { "epoch": 0.69, "learning_rate": 0.000196655584200675, "loss": 0.0112, "step": 136560 }, { "epoch": 0.69, "learning_rate": 0.000196648016507661, "loss": 0.0183, "step": 136570 }, { "epoch": 0.69, "learning_rate": 0.000196640448814647, "loss": 0.0112, "step": 136580 }, { "epoch": 0.69, "learning_rate": 0.00019663288112163298, "loss": 0.0123, "step": 136590 }, { "epoch": 0.69, "learning_rate": 0.00019662531342861896, "loss": 0.013, "step": 136600 }, { "epoch": 0.69, "learning_rate": 0.00019661774573560495, "loss": 0.0127, "step": 136610 }, { "epoch": 0.69, "learning_rate": 0.00019661017804259095, "loss": 0.01, "step": 136620 }, { "epoch": 0.69, "learning_rate": 0.00019660261034957694, "loss": 0.0118, "step": 136630 }, { "epoch": 0.69, "learning_rate": 0.00019659504265656292, "loss": 0.0179, "step": 136640 }, { "epoch": 0.69, "learning_rate": 0.00019658747496354893, "loss": 0.0138, "step": 136650 }, { "epoch": 0.69, "learning_rate": 0.0001965799072705349, "loss": 0.0122, "step": 136660 }, { "epoch": 0.69, "learning_rate": 0.0001965723395775209, "loss": 0.0123, "step": 136670 }, { "epoch": 0.69, "learning_rate": 0.0001965647718845069, "loss": 0.0153, "step": 136680 }, { "epoch": 0.69, "learning_rate": 0.00019655720419149288, "loss": 0.0126, "step": 136690 }, { "epoch": 0.69, "learning_rate": 0.00019654963649847886, "loss": 0.0124, "step": 136700 }, { "epoch": 0.69, "learning_rate": 0.00019654206880546487, "loss": 0.015, "step": 136710 }, { "epoch": 0.69, "learning_rate": 0.00019653450111245085, "loss": 0.0141, "step": 136720 }, { "epoch": 0.69, "learning_rate": 0.00019652693341943683, "loss": 0.0182, "step": 136730 }, { "epoch": 0.69, "learning_rate": 0.00019651936572642284, "loss": 0.0153, "step": 136740 }, { "epoch": 0.69, "learning_rate": 0.00019651179803340882, "loss": 0.0119, "step": 136750 }, { "epoch": 0.69, "learning_rate": 0.0001965042303403948, "loss": 0.0148, "step": 136760 }, { "epoch": 0.69, "learning_rate": 0.0001964966626473808, "loss": 0.0092, "step": 136770 }, { "epoch": 0.69, "learning_rate": 0.0001964890949543668, "loss": 0.0151, "step": 136780 }, { "epoch": 0.69, "learning_rate": 0.00019648152726135277, "loss": 0.013, "step": 136790 }, { "epoch": 0.69, "learning_rate": 0.00019647395956833876, "loss": 0.0186, "step": 136800 }, { "epoch": 0.69, "learning_rate": 0.00019646639187532476, "loss": 0.015, "step": 136810 }, { "epoch": 0.69, "learning_rate": 0.00019645882418231075, "loss": 0.0149, "step": 136820 }, { "epoch": 0.69, "learning_rate": 0.00019645125648929673, "loss": 0.013, "step": 136830 }, { "epoch": 0.69, "learning_rate": 0.00019644368879628274, "loss": 0.0142, "step": 136840 }, { "epoch": 0.69, "learning_rate": 0.00019643612110326872, "loss": 0.0135, "step": 136850 }, { "epoch": 0.69, "learning_rate": 0.0001964285534102547, "loss": 0.0171, "step": 136860 }, { "epoch": 0.69, "learning_rate": 0.0001964209857172407, "loss": 0.0136, "step": 136870 }, { "epoch": 0.69, "learning_rate": 0.0001964134180242267, "loss": 0.0126, "step": 136880 }, { "epoch": 0.69, "learning_rate": 0.00019640585033121267, "loss": 0.0149, "step": 136890 }, { "epoch": 0.69, "learning_rate": 0.00019639828263819868, "loss": 0.0149, "step": 136900 }, { "epoch": 0.69, "learning_rate": 0.00019639071494518466, "loss": 0.0183, "step": 136910 }, { "epoch": 0.69, "learning_rate": 0.00019638314725217064, "loss": 0.0138, "step": 136920 }, { "epoch": 0.69, "learning_rate": 0.00019637557955915665, "loss": 0.0111, "step": 136930 }, { "epoch": 0.69, "learning_rate": 0.00019636801186614263, "loss": 0.0111, "step": 136940 }, { "epoch": 0.69, "learning_rate": 0.0001963604441731286, "loss": 0.0159, "step": 136950 }, { "epoch": 0.69, "learning_rate": 0.0001963528764801146, "loss": 0.0109, "step": 136960 }, { "epoch": 0.69, "learning_rate": 0.0001963453087871006, "loss": 0.0137, "step": 136970 }, { "epoch": 0.69, "learning_rate": 0.00019633774109408658, "loss": 0.0116, "step": 136980 }, { "epoch": 0.69, "learning_rate": 0.00019633017340107257, "loss": 0.011, "step": 136990 }, { "epoch": 0.69, "learning_rate": 0.00019632260570805857, "loss": 0.0151, "step": 137000 }, { "epoch": 0.69, "eval_cer": 0.914462492734159, "eval_loss": 0.009697197005152702, "eval_runtime": 116.8588, "eval_samples_per_second": 17.115, "eval_steps_per_second": 4.279, "step": 137000 }, { "epoch": 0.69, "learning_rate": 0.00019631503801504456, "loss": 0.0125, "step": 137010 }, { "epoch": 0.69, "learning_rate": 0.00019630747032203054, "loss": 0.0121, "step": 137020 }, { "epoch": 0.69, "learning_rate": 0.00019629990262901655, "loss": 0.0134, "step": 137030 }, { "epoch": 0.69, "learning_rate": 0.00019629233493600253, "loss": 0.0124, "step": 137040 }, { "epoch": 0.69, "learning_rate": 0.0001962847672429885, "loss": 0.0112, "step": 137050 }, { "epoch": 0.69, "learning_rate": 0.00019627719954997452, "loss": 0.0138, "step": 137060 }, { "epoch": 0.69, "learning_rate": 0.0001962696318569605, "loss": 0.0137, "step": 137070 }, { "epoch": 0.69, "learning_rate": 0.00019626206416394648, "loss": 0.0146, "step": 137080 }, { "epoch": 0.69, "learning_rate": 0.0001962544964709325, "loss": 0.0131, "step": 137090 }, { "epoch": 0.69, "learning_rate": 0.00019624692877791847, "loss": 0.014, "step": 137100 }, { "epoch": 0.69, "learning_rate": 0.00019623936108490445, "loss": 0.0163, "step": 137110 }, { "epoch": 0.69, "learning_rate": 0.00019623179339189043, "loss": 0.0127, "step": 137120 }, { "epoch": 0.69, "learning_rate": 0.00019622422569887644, "loss": 0.0135, "step": 137130 }, { "epoch": 0.69, "learning_rate": 0.00019621665800586242, "loss": 0.0147, "step": 137140 }, { "epoch": 0.69, "learning_rate": 0.0001962090903128484, "loss": 0.0138, "step": 137150 }, { "epoch": 0.69, "learning_rate": 0.0001962015226198344, "loss": 0.0134, "step": 137160 }, { "epoch": 0.69, "learning_rate": 0.0001961939549268204, "loss": 0.0146, "step": 137170 }, { "epoch": 0.69, "learning_rate": 0.00019618638723380638, "loss": 0.0127, "step": 137180 }, { "epoch": 0.69, "learning_rate": 0.00019617881954079238, "loss": 0.015, "step": 137190 }, { "epoch": 0.69, "learning_rate": 0.00019617125184777837, "loss": 0.0133, "step": 137200 }, { "epoch": 0.69, "learning_rate": 0.00019616368415476435, "loss": 0.0132, "step": 137210 }, { "epoch": 0.69, "learning_rate": 0.00019615611646175036, "loss": 0.0115, "step": 137220 }, { "epoch": 0.69, "learning_rate": 0.00019614854876873634, "loss": 0.0117, "step": 137230 }, { "epoch": 0.69, "learning_rate": 0.00019614098107572232, "loss": 0.0124, "step": 137240 }, { "epoch": 0.69, "learning_rate": 0.00019613341338270833, "loss": 0.0129, "step": 137250 }, { "epoch": 0.69, "learning_rate": 0.0001961258456896943, "loss": 0.0119, "step": 137260 }, { "epoch": 0.69, "learning_rate": 0.0001961182779966803, "loss": 0.0138, "step": 137270 }, { "epoch": 0.69, "learning_rate": 0.00019611071030366627, "loss": 0.0175, "step": 137280 }, { "epoch": 0.69, "learning_rate": 0.00019610314261065228, "loss": 0.016, "step": 137290 }, { "epoch": 0.69, "learning_rate": 0.00019609557491763826, "loss": 0.0146, "step": 137300 }, { "epoch": 0.69, "learning_rate": 0.00019608800722462424, "loss": 0.0115, "step": 137310 }, { "epoch": 0.69, "learning_rate": 0.00019608043953161025, "loss": 0.0112, "step": 137320 }, { "epoch": 0.69, "learning_rate": 0.00019607287183859623, "loss": 0.0111, "step": 137330 }, { "epoch": 0.69, "learning_rate": 0.00019606530414558221, "loss": 0.0155, "step": 137340 }, { "epoch": 0.69, "learning_rate": 0.00019605773645256822, "loss": 0.0134, "step": 137350 }, { "epoch": 0.69, "learning_rate": 0.0001960501687595542, "loss": 0.0138, "step": 137360 }, { "epoch": 0.69, "learning_rate": 0.00019604260106654019, "loss": 0.011, "step": 137370 }, { "epoch": 0.69, "learning_rate": 0.0001960350333735262, "loss": 0.0125, "step": 137380 }, { "epoch": 0.69, "learning_rate": 0.00019602746568051218, "loss": 0.0132, "step": 137390 }, { "epoch": 0.69, "learning_rate": 0.00019601989798749816, "loss": 0.012, "step": 137400 }, { "epoch": 0.69, "learning_rate": 0.00019601233029448417, "loss": 0.0142, "step": 137410 }, { "epoch": 0.69, "learning_rate": 0.00019600476260147015, "loss": 0.0114, "step": 137420 }, { "epoch": 0.69, "learning_rate": 0.00019599719490845613, "loss": 0.0148, "step": 137430 }, { "epoch": 0.69, "learning_rate": 0.00019598962721544214, "loss": 0.0163, "step": 137440 }, { "epoch": 0.69, "learning_rate": 0.00019598205952242812, "loss": 0.0148, "step": 137450 }, { "epoch": 0.69, "learning_rate": 0.0001959744918294141, "loss": 0.0126, "step": 137460 }, { "epoch": 0.69, "learning_rate": 0.00019596692413640008, "loss": 0.0134, "step": 137470 }, { "epoch": 0.69, "learning_rate": 0.0001959593564433861, "loss": 0.0143, "step": 137480 }, { "epoch": 0.69, "learning_rate": 0.00019595178875037207, "loss": 0.0114, "step": 137490 }, { "epoch": 0.69, "learning_rate": 0.00019594422105735805, "loss": 0.0161, "step": 137500 }, { "epoch": 0.69, "learning_rate": 0.00019593665336434406, "loss": 0.0121, "step": 137510 }, { "epoch": 0.69, "learning_rate": 0.00019592908567133004, "loss": 0.0138, "step": 137520 }, { "epoch": 0.69, "learning_rate": 0.00019592151797831602, "loss": 0.0116, "step": 137530 }, { "epoch": 0.69, "learning_rate": 0.00019591395028530203, "loss": 0.0099, "step": 137540 }, { "epoch": 0.69, "learning_rate": 0.00019590638259228801, "loss": 0.0118, "step": 137550 }, { "epoch": 0.69, "learning_rate": 0.000195898814899274, "loss": 0.0136, "step": 137560 }, { "epoch": 0.69, "learning_rate": 0.00019589124720626, "loss": 0.0131, "step": 137570 }, { "epoch": 0.69, "learning_rate": 0.00019588367951324599, "loss": 0.012, "step": 137580 }, { "epoch": 0.69, "learning_rate": 0.00019587611182023197, "loss": 0.0135, "step": 137590 }, { "epoch": 0.69, "learning_rate": 0.00019586854412721798, "loss": 0.0123, "step": 137600 }, { "epoch": 0.69, "learning_rate": 0.00019586097643420396, "loss": 0.0142, "step": 137610 }, { "epoch": 0.69, "learning_rate": 0.00019585340874118994, "loss": 0.0162, "step": 137620 }, { "epoch": 0.69, "learning_rate": 0.0001958458410481759, "loss": 0.0137, "step": 137630 }, { "epoch": 0.69, "learning_rate": 0.0001958382733551619, "loss": 0.0122, "step": 137640 }, { "epoch": 0.69, "learning_rate": 0.00019583070566214788, "loss": 0.0111, "step": 137650 }, { "epoch": 0.69, "learning_rate": 0.00019582313796913386, "loss": 0.0133, "step": 137660 }, { "epoch": 0.69, "learning_rate": 0.00019581557027611985, "loss": 0.0147, "step": 137670 }, { "epoch": 0.69, "learning_rate": 0.00019580800258310585, "loss": 0.0147, "step": 137680 }, { "epoch": 0.69, "learning_rate": 0.00019580043489009184, "loss": 0.0167, "step": 137690 }, { "epoch": 0.69, "learning_rate": 0.00019579286719707782, "loss": 0.0125, "step": 137700 }, { "epoch": 0.69, "learning_rate": 0.00019578529950406383, "loss": 0.0128, "step": 137710 }, { "epoch": 0.69, "learning_rate": 0.0001957777318110498, "loss": 0.0137, "step": 137720 }, { "epoch": 0.69, "learning_rate": 0.0001957701641180358, "loss": 0.0108, "step": 137730 }, { "epoch": 0.69, "learning_rate": 0.0001957625964250218, "loss": 0.0136, "step": 137740 }, { "epoch": 0.69, "learning_rate": 0.00019575502873200778, "loss": 0.0122, "step": 137750 }, { "epoch": 0.7, "learning_rate": 0.00019574746103899376, "loss": 0.013, "step": 137760 }, { "epoch": 0.7, "learning_rate": 0.00019573989334597977, "loss": 0.0126, "step": 137770 }, { "epoch": 0.7, "learning_rate": 0.00019573232565296575, "loss": 0.0156, "step": 137780 }, { "epoch": 0.7, "learning_rate": 0.00019572475795995173, "loss": 0.0121, "step": 137790 }, { "epoch": 0.7, "learning_rate": 0.00019571719026693774, "loss": 0.0118, "step": 137800 }, { "epoch": 0.7, "learning_rate": 0.00019570962257392372, "loss": 0.0113, "step": 137810 }, { "epoch": 0.7, "learning_rate": 0.0001957020548809097, "loss": 0.0131, "step": 137820 }, { "epoch": 0.7, "learning_rate": 0.0001956944871878957, "loss": 0.0132, "step": 137830 }, { "epoch": 0.7, "learning_rate": 0.0001956869194948817, "loss": 0.0109, "step": 137840 }, { "epoch": 0.7, "learning_rate": 0.00019567935180186767, "loss": 0.0143, "step": 137850 }, { "epoch": 0.7, "learning_rate": 0.00019567178410885366, "loss": 0.0111, "step": 137860 }, { "epoch": 0.7, "learning_rate": 0.00019566421641583966, "loss": 0.0131, "step": 137870 }, { "epoch": 0.7, "learning_rate": 0.00019565664872282565, "loss": 0.0167, "step": 137880 }, { "epoch": 0.7, "learning_rate": 0.00019564908102981163, "loss": 0.015, "step": 137890 }, { "epoch": 0.7, "learning_rate": 0.00019564151333679764, "loss": 0.0151, "step": 137900 }, { "epoch": 0.7, "learning_rate": 0.00019563394564378362, "loss": 0.0129, "step": 137910 }, { "epoch": 0.7, "learning_rate": 0.0001956263779507696, "loss": 0.0131, "step": 137920 }, { "epoch": 0.7, "learning_rate": 0.0001956188102577556, "loss": 0.0124, "step": 137930 }, { "epoch": 0.7, "learning_rate": 0.0001956112425647416, "loss": 0.0113, "step": 137940 }, { "epoch": 0.7, "learning_rate": 0.00019560367487172757, "loss": 0.0141, "step": 137950 }, { "epoch": 0.7, "learning_rate": 0.00019559610717871358, "loss": 0.0157, "step": 137960 }, { "epoch": 0.7, "learning_rate": 0.00019558853948569956, "loss": 0.0125, "step": 137970 }, { "epoch": 0.7, "learning_rate": 0.00019558097179268554, "loss": 0.0117, "step": 137980 }, { "epoch": 0.7, "learning_rate": 0.00019557340409967155, "loss": 0.0138, "step": 137990 }, { "epoch": 0.7, "learning_rate": 0.00019556583640665753, "loss": 0.0116, "step": 138000 }, { "epoch": 0.7, "eval_cer": 0.9144770486760401, "eval_loss": 0.009700953029096127, "eval_runtime": 116.67, "eval_samples_per_second": 17.142, "eval_steps_per_second": 4.286, "step": 138000 }, { "epoch": 0.7, "learning_rate": 0.0001955582687136435, "loss": 0.0138, "step": 138010 }, { "epoch": 0.7, "learning_rate": 0.0001955507010206295, "loss": 0.0124, "step": 138020 }, { "epoch": 0.7, "learning_rate": 0.0001955431333276155, "loss": 0.0145, "step": 138030 }, { "epoch": 0.7, "learning_rate": 0.00019553556563460148, "loss": 0.0182, "step": 138040 }, { "epoch": 0.7, "learning_rate": 0.00019552799794158747, "loss": 0.0142, "step": 138050 }, { "epoch": 0.7, "learning_rate": 0.00019552043024857347, "loss": 0.0124, "step": 138060 }, { "epoch": 0.7, "learning_rate": 0.00019551286255555946, "loss": 0.0141, "step": 138070 }, { "epoch": 0.7, "learning_rate": 0.00019550529486254544, "loss": 0.0134, "step": 138080 }, { "epoch": 0.7, "learning_rate": 0.00019549772716953145, "loss": 0.0149, "step": 138090 }, { "epoch": 0.7, "learning_rate": 0.00019549015947651743, "loss": 0.0114, "step": 138100 }, { "epoch": 0.7, "learning_rate": 0.0001954825917835034, "loss": 0.0134, "step": 138110 }, { "epoch": 0.7, "learning_rate": 0.00019547502409048942, "loss": 0.0108, "step": 138120 }, { "epoch": 0.7, "learning_rate": 0.0001954674563974754, "loss": 0.0123, "step": 138130 }, { "epoch": 0.7, "learning_rate": 0.00019545988870446138, "loss": 0.0118, "step": 138140 }, { "epoch": 0.7, "learning_rate": 0.0001954523210114474, "loss": 0.0122, "step": 138150 }, { "epoch": 0.7, "learning_rate": 0.00019544475331843337, "loss": 0.0127, "step": 138160 }, { "epoch": 0.7, "learning_rate": 0.00019543718562541935, "loss": 0.0163, "step": 138170 }, { "epoch": 0.7, "learning_rate": 0.00019542961793240533, "loss": 0.013, "step": 138180 }, { "epoch": 0.7, "learning_rate": 0.00019542205023939134, "loss": 0.014, "step": 138190 }, { "epoch": 0.7, "learning_rate": 0.00019541448254637732, "loss": 0.0125, "step": 138200 }, { "epoch": 0.7, "learning_rate": 0.0001954069148533633, "loss": 0.013, "step": 138210 }, { "epoch": 0.7, "learning_rate": 0.0001953993471603493, "loss": 0.0118, "step": 138220 }, { "epoch": 0.7, "learning_rate": 0.0001953917794673353, "loss": 0.0124, "step": 138230 }, { "epoch": 0.7, "learning_rate": 0.00019538421177432128, "loss": 0.012, "step": 138240 }, { "epoch": 0.7, "learning_rate": 0.00019537664408130728, "loss": 0.0177, "step": 138250 }, { "epoch": 0.7, "learning_rate": 0.00019536907638829327, "loss": 0.0122, "step": 138260 }, { "epoch": 0.7, "learning_rate": 0.00019536150869527925, "loss": 0.0106, "step": 138270 }, { "epoch": 0.7, "learning_rate": 0.00019535394100226526, "loss": 0.0116, "step": 138280 }, { "epoch": 0.7, "learning_rate": 0.00019534637330925124, "loss": 0.0129, "step": 138290 }, { "epoch": 0.7, "learning_rate": 0.00019533880561623722, "loss": 0.015, "step": 138300 }, { "epoch": 0.7, "learning_rate": 0.00019533123792322323, "loss": 0.0163, "step": 138310 }, { "epoch": 0.7, "learning_rate": 0.0001953236702302092, "loss": 0.0154, "step": 138320 }, { "epoch": 0.7, "learning_rate": 0.0001953161025371952, "loss": 0.0121, "step": 138330 }, { "epoch": 0.7, "learning_rate": 0.0001953085348441812, "loss": 0.0129, "step": 138340 }, { "epoch": 0.7, "learning_rate": 0.00019530096715116718, "loss": 0.0129, "step": 138350 }, { "epoch": 0.7, "learning_rate": 0.00019529339945815316, "loss": 0.0116, "step": 138360 }, { "epoch": 0.7, "learning_rate": 0.00019528583176513914, "loss": 0.0105, "step": 138370 }, { "epoch": 0.7, "learning_rate": 0.00019527826407212515, "loss": 0.0136, "step": 138380 }, { "epoch": 0.7, "learning_rate": 0.00019527069637911113, "loss": 0.0123, "step": 138390 }, { "epoch": 0.7, "learning_rate": 0.00019526312868609711, "loss": 0.0154, "step": 138400 }, { "epoch": 0.7, "learning_rate": 0.00019525556099308312, "loss": 0.0113, "step": 138410 }, { "epoch": 0.7, "learning_rate": 0.0001952479933000691, "loss": 0.0135, "step": 138420 }, { "epoch": 0.7, "learning_rate": 0.00019524042560705509, "loss": 0.0124, "step": 138430 }, { "epoch": 0.7, "learning_rate": 0.0001952328579140411, "loss": 0.0094, "step": 138440 }, { "epoch": 0.7, "learning_rate": 0.00019522529022102708, "loss": 0.0118, "step": 138450 }, { "epoch": 0.7, "learning_rate": 0.00019521772252801306, "loss": 0.0121, "step": 138460 }, { "epoch": 0.7, "learning_rate": 0.00019521015483499907, "loss": 0.0124, "step": 138470 }, { "epoch": 0.7, "learning_rate": 0.00019520258714198505, "loss": 0.0146, "step": 138480 }, { "epoch": 0.7, "learning_rate": 0.00019519501944897103, "loss": 0.0141, "step": 138490 }, { "epoch": 0.7, "learning_rate": 0.00019518745175595704, "loss": 0.0126, "step": 138500 }, { "epoch": 0.7, "learning_rate": 0.00019517988406294302, "loss": 0.0128, "step": 138510 }, { "epoch": 0.7, "learning_rate": 0.000195172316369929, "loss": 0.011, "step": 138520 }, { "epoch": 0.7, "learning_rate": 0.00019516474867691498, "loss": 0.0153, "step": 138530 }, { "epoch": 0.7, "learning_rate": 0.000195157180983901, "loss": 0.0141, "step": 138540 }, { "epoch": 0.7, "learning_rate": 0.00019514961329088697, "loss": 0.0116, "step": 138550 }, { "epoch": 0.7, "learning_rate": 0.00019514204559787295, "loss": 0.0118, "step": 138560 }, { "epoch": 0.7, "learning_rate": 0.00019513447790485896, "loss": 0.0142, "step": 138570 }, { "epoch": 0.7, "learning_rate": 0.00019512691021184494, "loss": 0.0147, "step": 138580 }, { "epoch": 0.7, "learning_rate": 0.00019511934251883092, "loss": 0.0183, "step": 138590 }, { "epoch": 0.7, "learning_rate": 0.00019511177482581693, "loss": 0.0133, "step": 138600 }, { "epoch": 0.7, "learning_rate": 0.00019510420713280291, "loss": 0.013, "step": 138610 }, { "epoch": 0.7, "learning_rate": 0.0001950966394397889, "loss": 0.012, "step": 138620 }, { "epoch": 0.7, "learning_rate": 0.0001950890717467749, "loss": 0.0123, "step": 138630 }, { "epoch": 0.7, "learning_rate": 0.00019508150405376089, "loss": 0.0172, "step": 138640 }, { "epoch": 0.7, "learning_rate": 0.00019507393636074687, "loss": 0.018, "step": 138650 }, { "epoch": 0.7, "learning_rate": 0.00019506636866773288, "loss": 0.0112, "step": 138660 }, { "epoch": 0.7, "learning_rate": 0.00019505880097471886, "loss": 0.0169, "step": 138670 }, { "epoch": 0.7, "learning_rate": 0.00019505123328170484, "loss": 0.0119, "step": 138680 }, { "epoch": 0.7, "learning_rate": 0.00019504366558869082, "loss": 0.0108, "step": 138690 }, { "epoch": 0.7, "learning_rate": 0.00019503609789567683, "loss": 0.0136, "step": 138700 }, { "epoch": 0.7, "learning_rate": 0.0001950285302026628, "loss": 0.0145, "step": 138710 }, { "epoch": 0.7, "learning_rate": 0.0001950209625096488, "loss": 0.0104, "step": 138720 }, { "epoch": 0.7, "learning_rate": 0.0001950133948166348, "loss": 0.0128, "step": 138730 }, { "epoch": 0.7, "learning_rate": 0.00019500582712362078, "loss": 0.0139, "step": 138740 }, { "epoch": 0.7, "learning_rate": 0.00019499825943060676, "loss": 0.0109, "step": 138750 }, { "epoch": 0.7, "learning_rate": 0.00019499069173759277, "loss": 0.0145, "step": 138760 }, { "epoch": 0.7, "learning_rate": 0.00019498312404457875, "loss": 0.0118, "step": 138770 }, { "epoch": 0.7, "learning_rate": 0.00019497555635156473, "loss": 0.013, "step": 138780 }, { "epoch": 0.7, "learning_rate": 0.00019496798865855074, "loss": 0.0149, "step": 138790 }, { "epoch": 0.7, "learning_rate": 0.00019496042096553672, "loss": 0.012, "step": 138800 }, { "epoch": 0.7, "learning_rate": 0.0001949528532725227, "loss": 0.0134, "step": 138810 }, { "epoch": 0.7, "learning_rate": 0.00019494528557950871, "loss": 0.0138, "step": 138820 }, { "epoch": 0.7, "learning_rate": 0.0001949377178864947, "loss": 0.0132, "step": 138830 }, { "epoch": 0.7, "learning_rate": 0.00019493015019348068, "loss": 0.0143, "step": 138840 }, { "epoch": 0.7, "learning_rate": 0.00019492258250046669, "loss": 0.0177, "step": 138850 }, { "epoch": 0.7, "learning_rate": 0.00019491501480745267, "loss": 0.0126, "step": 138860 }, { "epoch": 0.7, "learning_rate": 0.00019490744711443865, "loss": 0.0197, "step": 138870 }, { "epoch": 0.7, "learning_rate": 0.00019489987942142463, "loss": 0.016, "step": 138880 }, { "epoch": 0.7, "learning_rate": 0.0001948923117284106, "loss": 0.013, "step": 138890 }, { "epoch": 0.7, "learning_rate": 0.0001948847440353966, "loss": 0.0131, "step": 138900 }, { "epoch": 0.7, "learning_rate": 0.00019487717634238258, "loss": 0.0136, "step": 138910 }, { "epoch": 0.7, "learning_rate": 0.00019486960864936856, "loss": 0.0137, "step": 138920 }, { "epoch": 0.7, "learning_rate": 0.00019486204095635457, "loss": 0.0124, "step": 138930 }, { "epoch": 0.7, "learning_rate": 0.00019485447326334055, "loss": 0.0102, "step": 138940 }, { "epoch": 0.7, "learning_rate": 0.00019484690557032653, "loss": 0.0145, "step": 138950 }, { "epoch": 0.7, "learning_rate": 0.00019483933787731254, "loss": 0.0114, "step": 138960 }, { "epoch": 0.7, "learning_rate": 0.00019483177018429852, "loss": 0.0136, "step": 138970 }, { "epoch": 0.7, "learning_rate": 0.0001948242024912845, "loss": 0.0131, "step": 138980 }, { "epoch": 0.7, "learning_rate": 0.0001948166347982705, "loss": 0.0174, "step": 138990 }, { "epoch": 0.7, "learning_rate": 0.0001948090671052565, "loss": 0.0138, "step": 139000 }, { "epoch": 0.7, "eval_cer": 0.9144751078837893, "eval_loss": 0.009447253309190273, "eval_runtime": 116.7733, "eval_samples_per_second": 17.127, "eval_steps_per_second": 4.282, "step": 139000 }, { "epoch": 0.7, "learning_rate": 0.00019480149941224247, "loss": 0.0125, "step": 139010 }, { "epoch": 0.7, "learning_rate": 0.00019479393171922848, "loss": 0.0135, "step": 139020 }, { "epoch": 0.7, "learning_rate": 0.00019478636402621446, "loss": 0.0139, "step": 139030 }, { "epoch": 0.7, "learning_rate": 0.00019477879633320044, "loss": 0.0116, "step": 139040 }, { "epoch": 0.7, "learning_rate": 0.00019477122864018645, "loss": 0.0139, "step": 139050 }, { "epoch": 0.7, "learning_rate": 0.00019476366094717243, "loss": 0.0141, "step": 139060 }, { "epoch": 0.7, "learning_rate": 0.00019475609325415841, "loss": 0.0104, "step": 139070 }, { "epoch": 0.7, "learning_rate": 0.0001947485255611444, "loss": 0.0156, "step": 139080 }, { "epoch": 0.7, "learning_rate": 0.0001947409578681304, "loss": 0.0188, "step": 139090 }, { "epoch": 0.7, "learning_rate": 0.00019473339017511639, "loss": 0.014, "step": 139100 }, { "epoch": 0.7, "learning_rate": 0.00019472582248210237, "loss": 0.0193, "step": 139110 }, { "epoch": 0.7, "learning_rate": 0.00019471825478908838, "loss": 0.0167, "step": 139120 }, { "epoch": 0.7, "learning_rate": 0.00019471068709607436, "loss": 0.0139, "step": 139130 }, { "epoch": 0.7, "learning_rate": 0.00019470311940306034, "loss": 0.0127, "step": 139140 }, { "epoch": 0.7, "learning_rate": 0.00019469555171004635, "loss": 0.0144, "step": 139150 }, { "epoch": 0.7, "learning_rate": 0.00019468798401703233, "loss": 0.0127, "step": 139160 }, { "epoch": 0.7, "learning_rate": 0.0001946804163240183, "loss": 0.0117, "step": 139170 }, { "epoch": 0.7, "learning_rate": 0.00019467284863100432, "loss": 0.0132, "step": 139180 }, { "epoch": 0.7, "learning_rate": 0.0001946652809379903, "loss": 0.0188, "step": 139190 }, { "epoch": 0.7, "learning_rate": 0.00019465771324497628, "loss": 0.0143, "step": 139200 }, { "epoch": 0.7, "learning_rate": 0.0001946501455519623, "loss": 0.0135, "step": 139210 }, { "epoch": 0.7, "learning_rate": 0.00019464257785894827, "loss": 0.0121, "step": 139220 }, { "epoch": 0.7, "learning_rate": 0.00019463501016593425, "loss": 0.013, "step": 139230 }, { "epoch": 0.7, "learning_rate": 0.00019462744247292026, "loss": 0.0142, "step": 139240 }, { "epoch": 0.7, "learning_rate": 0.00019461987477990624, "loss": 0.016, "step": 139250 }, { "epoch": 0.7, "learning_rate": 0.00019461230708689222, "loss": 0.0141, "step": 139260 }, { "epoch": 0.7, "learning_rate": 0.0001946047393938782, "loss": 0.0132, "step": 139270 }, { "epoch": 0.7, "learning_rate": 0.00019459717170086421, "loss": 0.0141, "step": 139280 }, { "epoch": 0.7, "learning_rate": 0.0001945896040078502, "loss": 0.0149, "step": 139290 }, { "epoch": 0.7, "learning_rate": 0.00019458203631483618, "loss": 0.0111, "step": 139300 }, { "epoch": 0.7, "learning_rate": 0.00019457446862182219, "loss": 0.015, "step": 139310 }, { "epoch": 0.7, "learning_rate": 0.00019456690092880817, "loss": 0.0106, "step": 139320 }, { "epoch": 0.7, "learning_rate": 0.00019455933323579415, "loss": 0.0135, "step": 139330 }, { "epoch": 0.7, "learning_rate": 0.00019455176554278016, "loss": 0.0112, "step": 139340 }, { "epoch": 0.7, "learning_rate": 0.00019454419784976614, "loss": 0.0135, "step": 139350 }, { "epoch": 0.7, "learning_rate": 0.00019453663015675212, "loss": 0.0117, "step": 139360 }, { "epoch": 0.7, "learning_rate": 0.00019452906246373813, "loss": 0.0133, "step": 139370 }, { "epoch": 0.7, "learning_rate": 0.0001945214947707241, "loss": 0.0123, "step": 139380 }, { "epoch": 0.7, "learning_rate": 0.0001945139270777101, "loss": 0.0128, "step": 139390 }, { "epoch": 0.7, "learning_rate": 0.0001945063593846961, "loss": 0.0141, "step": 139400 }, { "epoch": 0.7, "learning_rate": 0.00019449879169168208, "loss": 0.016, "step": 139410 }, { "epoch": 0.7, "learning_rate": 0.00019449122399866806, "loss": 0.0145, "step": 139420 }, { "epoch": 0.7, "learning_rate": 0.00019448365630565404, "loss": 0.0158, "step": 139430 }, { "epoch": 0.7, "learning_rate": 0.00019447608861264005, "loss": 0.0159, "step": 139440 }, { "epoch": 0.7, "learning_rate": 0.00019446852091962603, "loss": 0.0126, "step": 139450 }, { "epoch": 0.7, "learning_rate": 0.00019446095322661202, "loss": 0.0143, "step": 139460 }, { "epoch": 0.7, "learning_rate": 0.00019445338553359802, "loss": 0.0136, "step": 139470 }, { "epoch": 0.7, "learning_rate": 0.000194445817840584, "loss": 0.0168, "step": 139480 }, { "epoch": 0.7, "learning_rate": 0.00019443825014757, "loss": 0.0159, "step": 139490 }, { "epoch": 0.7, "learning_rate": 0.000194430682454556, "loss": 0.0118, "step": 139500 }, { "epoch": 0.7, "learning_rate": 0.00019442311476154198, "loss": 0.015, "step": 139510 }, { "epoch": 0.7, "learning_rate": 0.00019441554706852796, "loss": 0.0125, "step": 139520 }, { "epoch": 0.7, "learning_rate": 0.00019440797937551397, "loss": 0.0141, "step": 139530 }, { "epoch": 0.7, "learning_rate": 0.00019440041168249995, "loss": 0.0133, "step": 139540 }, { "epoch": 0.7, "learning_rate": 0.00019439284398948593, "loss": 0.0126, "step": 139550 }, { "epoch": 0.7, "learning_rate": 0.00019438527629647194, "loss": 0.0125, "step": 139560 }, { "epoch": 0.7, "learning_rate": 0.00019437770860345792, "loss": 0.013, "step": 139570 }, { "epoch": 0.7, "learning_rate": 0.0001943701409104439, "loss": 0.013, "step": 139580 }, { "epoch": 0.7, "learning_rate": 0.00019436257321742988, "loss": 0.0138, "step": 139590 }, { "epoch": 0.7, "learning_rate": 0.0001943550055244159, "loss": 0.0157, "step": 139600 }, { "epoch": 0.7, "learning_rate": 0.00019434743783140187, "loss": 0.0139, "step": 139610 }, { "epoch": 0.7, "learning_rate": 0.00019433987013838785, "loss": 0.0128, "step": 139620 }, { "epoch": 0.7, "learning_rate": 0.00019433230244537386, "loss": 0.0127, "step": 139630 }, { "epoch": 0.7, "learning_rate": 0.00019432473475235984, "loss": 0.0131, "step": 139640 }, { "epoch": 0.7, "learning_rate": 0.00019431716705934583, "loss": 0.0135, "step": 139650 }, { "epoch": 0.7, "learning_rate": 0.00019430959936633183, "loss": 0.0118, "step": 139660 }, { "epoch": 0.7, "learning_rate": 0.00019430203167331782, "loss": 0.0101, "step": 139670 }, { "epoch": 0.7, "learning_rate": 0.0001942944639803038, "loss": 0.0125, "step": 139680 }, { "epoch": 0.7, "learning_rate": 0.0001942868962872898, "loss": 0.0119, "step": 139690 }, { "epoch": 0.7, "learning_rate": 0.0001942793285942758, "loss": 0.0151, "step": 139700 }, { "epoch": 0.7, "learning_rate": 0.00019427176090126177, "loss": 0.0141, "step": 139710 }, { "epoch": 0.7, "learning_rate": 0.00019426419320824778, "loss": 0.0115, "step": 139720 }, { "epoch": 0.7, "learning_rate": 0.00019425662551523376, "loss": 0.0163, "step": 139730 }, { "epoch": 0.71, "learning_rate": 0.00019424905782221974, "loss": 0.0122, "step": 139740 }, { "epoch": 0.71, "learning_rate": 0.00019424149012920575, "loss": 0.0147, "step": 139750 }, { "epoch": 0.71, "learning_rate": 0.00019423392243619173, "loss": 0.0118, "step": 139760 }, { "epoch": 0.71, "learning_rate": 0.0001942263547431777, "loss": 0.017, "step": 139770 }, { "epoch": 0.71, "learning_rate": 0.0001942187870501637, "loss": 0.0108, "step": 139780 }, { "epoch": 0.71, "learning_rate": 0.0001942112193571497, "loss": 0.0151, "step": 139790 }, { "epoch": 0.71, "learning_rate": 0.00019420365166413568, "loss": 0.0142, "step": 139800 }, { "epoch": 0.71, "learning_rate": 0.00019419608397112166, "loss": 0.0132, "step": 139810 }, { "epoch": 0.71, "learning_rate": 0.00019418851627810767, "loss": 0.0099, "step": 139820 }, { "epoch": 0.71, "learning_rate": 0.00019418094858509365, "loss": 0.0114, "step": 139830 }, { "epoch": 0.71, "learning_rate": 0.00019417338089207964, "loss": 0.0124, "step": 139840 }, { "epoch": 0.71, "learning_rate": 0.00019416581319906564, "loss": 0.0111, "step": 139850 }, { "epoch": 0.71, "learning_rate": 0.00019415824550605163, "loss": 0.0131, "step": 139860 }, { "epoch": 0.71, "learning_rate": 0.0001941506778130376, "loss": 0.0137, "step": 139870 }, { "epoch": 0.71, "learning_rate": 0.00019414311012002362, "loss": 0.0105, "step": 139880 }, { "epoch": 0.71, "learning_rate": 0.0001941355424270096, "loss": 0.0149, "step": 139890 }, { "epoch": 0.71, "learning_rate": 0.00019412797473399558, "loss": 0.0131, "step": 139900 }, { "epoch": 0.71, "learning_rate": 0.0001941204070409816, "loss": 0.0176, "step": 139910 }, { "epoch": 0.71, "learning_rate": 0.00019411283934796757, "loss": 0.0124, "step": 139920 }, { "epoch": 0.71, "learning_rate": 0.00019410527165495355, "loss": 0.0143, "step": 139930 }, { "epoch": 0.71, "learning_rate": 0.00019409770396193953, "loss": 0.0131, "step": 139940 }, { "epoch": 0.71, "learning_rate": 0.00019409013626892554, "loss": 0.0117, "step": 139950 }, { "epoch": 0.71, "learning_rate": 0.00019408256857591152, "loss": 0.0114, "step": 139960 }, { "epoch": 0.71, "learning_rate": 0.0001940750008828975, "loss": 0.0117, "step": 139970 }, { "epoch": 0.71, "learning_rate": 0.0001940674331898835, "loss": 0.0121, "step": 139980 }, { "epoch": 0.71, "learning_rate": 0.0001940598654968695, "loss": 0.0126, "step": 139990 }, { "epoch": 0.71, "learning_rate": 0.00019405229780385547, "loss": 0.0152, "step": 140000 }, { "epoch": 0.71, "eval_cer": 0.9144741374876638, "eval_loss": 0.009188586845993996, "eval_runtime": 116.7594, "eval_samples_per_second": 17.129, "eval_steps_per_second": 4.282, "step": 140000 }, { "epoch": 0.71, "learning_rate": 0.00019404473011084148, "loss": 0.015, "step": 140010 }, { "epoch": 0.71, "learning_rate": 0.00019403716241782746, "loss": 0.0123, "step": 140020 }, { "epoch": 0.71, "learning_rate": 0.00019402959472481345, "loss": 0.0155, "step": 140030 }, { "epoch": 0.71, "learning_rate": 0.00019402202703179945, "loss": 0.0138, "step": 140040 }, { "epoch": 0.71, "learning_rate": 0.00019401445933878544, "loss": 0.0173, "step": 140050 }, { "epoch": 0.71, "learning_rate": 0.00019400689164577142, "loss": 0.0135, "step": 140060 }, { "epoch": 0.71, "learning_rate": 0.00019399932395275743, "loss": 0.0115, "step": 140070 }, { "epoch": 0.71, "learning_rate": 0.0001939917562597434, "loss": 0.0169, "step": 140080 }, { "epoch": 0.71, "learning_rate": 0.0001939841885667294, "loss": 0.0127, "step": 140090 }, { "epoch": 0.71, "learning_rate": 0.00019397662087371537, "loss": 0.0138, "step": 140100 }, { "epoch": 0.71, "learning_rate": 0.00019396905318070138, "loss": 0.0135, "step": 140110 }, { "epoch": 0.71, "learning_rate": 0.00019396148548768736, "loss": 0.0114, "step": 140120 }, { "epoch": 0.71, "learning_rate": 0.00019395391779467334, "loss": 0.015, "step": 140130 }, { "epoch": 0.71, "learning_rate": 0.00019394635010165935, "loss": 0.0135, "step": 140140 }, { "epoch": 0.71, "learning_rate": 0.0001939387824086453, "loss": 0.0129, "step": 140150 }, { "epoch": 0.71, "learning_rate": 0.00019393121471563129, "loss": 0.0104, "step": 140160 }, { "epoch": 0.71, "learning_rate": 0.00019392364702261727, "loss": 0.0169, "step": 140170 }, { "epoch": 0.71, "learning_rate": 0.00019391607932960328, "loss": 0.0121, "step": 140180 }, { "epoch": 0.71, "learning_rate": 0.00019390851163658926, "loss": 0.0145, "step": 140190 }, { "epoch": 0.71, "learning_rate": 0.00019390094394357524, "loss": 0.011, "step": 140200 }, { "epoch": 0.71, "learning_rate": 0.00019389337625056125, "loss": 0.014, "step": 140210 }, { "epoch": 0.71, "learning_rate": 0.00019388580855754723, "loss": 0.0134, "step": 140220 }, { "epoch": 0.71, "learning_rate": 0.0001938782408645332, "loss": 0.0139, "step": 140230 }, { "epoch": 0.71, "learning_rate": 0.00019387067317151922, "loss": 0.0191, "step": 140240 }, { "epoch": 0.71, "learning_rate": 0.0001938631054785052, "loss": 0.0126, "step": 140250 }, { "epoch": 0.71, "learning_rate": 0.00019385553778549118, "loss": 0.0164, "step": 140260 }, { "epoch": 0.71, "learning_rate": 0.0001938479700924772, "loss": 0.0151, "step": 140270 }, { "epoch": 0.71, "learning_rate": 0.00019384040239946317, "loss": 0.0122, "step": 140280 }, { "epoch": 0.71, "learning_rate": 0.00019383283470644915, "loss": 0.014, "step": 140290 }, { "epoch": 0.71, "learning_rate": 0.00019382526701343516, "loss": 0.0121, "step": 140300 }, { "epoch": 0.71, "learning_rate": 0.00019381769932042114, "loss": 0.012, "step": 140310 }, { "epoch": 0.71, "learning_rate": 0.00019381013162740712, "loss": 0.0141, "step": 140320 }, { "epoch": 0.71, "learning_rate": 0.0001938025639343931, "loss": 0.0135, "step": 140330 }, { "epoch": 0.71, "learning_rate": 0.00019379499624137911, "loss": 0.0094, "step": 140340 }, { "epoch": 0.71, "learning_rate": 0.0001937874285483651, "loss": 0.0128, "step": 140350 }, { "epoch": 0.71, "learning_rate": 0.00019377986085535108, "loss": 0.0149, "step": 140360 }, { "epoch": 0.71, "learning_rate": 0.00019377229316233709, "loss": 0.0177, "step": 140370 }, { "epoch": 0.71, "learning_rate": 0.00019376472546932307, "loss": 0.0164, "step": 140380 }, { "epoch": 0.71, "learning_rate": 0.00019375715777630905, "loss": 0.0127, "step": 140390 }, { "epoch": 0.71, "learning_rate": 0.00019374959008329506, "loss": 0.0131, "step": 140400 }, { "epoch": 0.71, "learning_rate": 0.00019374202239028104, "loss": 0.013, "step": 140410 }, { "epoch": 0.71, "learning_rate": 0.00019373445469726702, "loss": 0.0133, "step": 140420 }, { "epoch": 0.71, "learning_rate": 0.00019372688700425303, "loss": 0.014, "step": 140430 }, { "epoch": 0.71, "learning_rate": 0.000193719319311239, "loss": 0.013, "step": 140440 }, { "epoch": 0.71, "learning_rate": 0.000193711751618225, "loss": 0.0145, "step": 140450 }, { "epoch": 0.71, "learning_rate": 0.000193704183925211, "loss": 0.0134, "step": 140460 }, { "epoch": 0.71, "learning_rate": 0.00019369661623219698, "loss": 0.0139, "step": 140470 }, { "epoch": 0.71, "learning_rate": 0.00019368904853918296, "loss": 0.0159, "step": 140480 }, { "epoch": 0.71, "learning_rate": 0.00019368148084616894, "loss": 0.0162, "step": 140490 }, { "epoch": 0.71, "learning_rate": 0.00019367391315315495, "loss": 0.0142, "step": 140500 }, { "epoch": 0.71, "learning_rate": 0.00019366634546014093, "loss": 0.0115, "step": 140510 }, { "epoch": 0.71, "learning_rate": 0.00019365877776712692, "loss": 0.0145, "step": 140520 }, { "epoch": 0.71, "learning_rate": 0.00019365121007411292, "loss": 0.0145, "step": 140530 }, { "epoch": 0.71, "learning_rate": 0.0001936436423810989, "loss": 0.0166, "step": 140540 }, { "epoch": 0.71, "learning_rate": 0.0001936360746880849, "loss": 0.0129, "step": 140550 }, { "epoch": 0.71, "learning_rate": 0.0001936285069950709, "loss": 0.0117, "step": 140560 }, { "epoch": 0.71, "learning_rate": 0.00019362093930205688, "loss": 0.0149, "step": 140570 }, { "epoch": 0.71, "learning_rate": 0.00019361337160904286, "loss": 0.0128, "step": 140580 }, { "epoch": 0.71, "learning_rate": 0.00019360580391602887, "loss": 0.0128, "step": 140590 }, { "epoch": 0.71, "learning_rate": 0.00019359823622301485, "loss": 0.0126, "step": 140600 }, { "epoch": 0.71, "learning_rate": 0.00019359066853000083, "loss": 0.0108, "step": 140610 }, { "epoch": 0.71, "learning_rate": 0.00019358310083698684, "loss": 0.0111, "step": 140620 }, { "epoch": 0.71, "learning_rate": 0.00019357553314397282, "loss": 0.0137, "step": 140630 }, { "epoch": 0.71, "learning_rate": 0.0001935679654509588, "loss": 0.0139, "step": 140640 }, { "epoch": 0.71, "learning_rate": 0.0001935603977579448, "loss": 0.0156, "step": 140650 }, { "epoch": 0.71, "learning_rate": 0.0001935528300649308, "loss": 0.0108, "step": 140660 }, { "epoch": 0.71, "learning_rate": 0.00019354526237191677, "loss": 0.0127, "step": 140670 }, { "epoch": 0.71, "learning_rate": 0.00019353769467890275, "loss": 0.0103, "step": 140680 }, { "epoch": 0.71, "learning_rate": 0.00019353012698588876, "loss": 0.0114, "step": 140690 }, { "epoch": 0.71, "learning_rate": 0.00019352255929287474, "loss": 0.0127, "step": 140700 }, { "epoch": 0.71, "learning_rate": 0.00019351499159986073, "loss": 0.0139, "step": 140710 }, { "epoch": 0.71, "learning_rate": 0.00019350742390684673, "loss": 0.015, "step": 140720 }, { "epoch": 0.71, "learning_rate": 0.00019349985621383272, "loss": 0.0135, "step": 140730 }, { "epoch": 0.71, "learning_rate": 0.0001934922885208187, "loss": 0.0119, "step": 140740 }, { "epoch": 0.71, "learning_rate": 0.0001934847208278047, "loss": 0.0116, "step": 140750 }, { "epoch": 0.71, "learning_rate": 0.0001934771531347907, "loss": 0.0139, "step": 140760 }, { "epoch": 0.71, "learning_rate": 0.00019346958544177667, "loss": 0.0136, "step": 140770 }, { "epoch": 0.71, "learning_rate": 0.00019346201774876268, "loss": 0.011, "step": 140780 }, { "epoch": 0.71, "learning_rate": 0.00019345445005574866, "loss": 0.0107, "step": 140790 }, { "epoch": 0.71, "learning_rate": 0.00019344688236273464, "loss": 0.0098, "step": 140800 }, { "epoch": 0.71, "learning_rate": 0.00019343931466972065, "loss": 0.0113, "step": 140810 }, { "epoch": 0.71, "learning_rate": 0.00019343174697670663, "loss": 0.0161, "step": 140820 }, { "epoch": 0.71, "learning_rate": 0.0001934241792836926, "loss": 0.0159, "step": 140830 }, { "epoch": 0.71, "learning_rate": 0.0001934166115906786, "loss": 0.013, "step": 140840 }, { "epoch": 0.71, "learning_rate": 0.0001934090438976646, "loss": 0.0135, "step": 140850 }, { "epoch": 0.71, "learning_rate": 0.00019340147620465058, "loss": 0.0126, "step": 140860 }, { "epoch": 0.71, "learning_rate": 0.00019339390851163656, "loss": 0.0128, "step": 140870 }, { "epoch": 0.71, "learning_rate": 0.00019338634081862257, "loss": 0.0126, "step": 140880 }, { "epoch": 0.71, "learning_rate": 0.00019337877312560855, "loss": 0.0095, "step": 140890 }, { "epoch": 0.71, "learning_rate": 0.00019337120543259454, "loss": 0.014, "step": 140900 }, { "epoch": 0.71, "learning_rate": 0.00019336363773958054, "loss": 0.0139, "step": 140910 }, { "epoch": 0.71, "learning_rate": 0.00019335607004656653, "loss": 0.0146, "step": 140920 }, { "epoch": 0.71, "learning_rate": 0.0001933485023535525, "loss": 0.0119, "step": 140930 }, { "epoch": 0.71, "learning_rate": 0.00019334093466053852, "loss": 0.0132, "step": 140940 }, { "epoch": 0.71, "learning_rate": 0.0001933333669675245, "loss": 0.0131, "step": 140950 }, { "epoch": 0.71, "learning_rate": 0.00019332579927451048, "loss": 0.0132, "step": 140960 }, { "epoch": 0.71, "learning_rate": 0.0001933182315814965, "loss": 0.0111, "step": 140970 }, { "epoch": 0.71, "learning_rate": 0.00019331066388848247, "loss": 0.0155, "step": 140980 }, { "epoch": 0.71, "learning_rate": 0.00019330309619546845, "loss": 0.0134, "step": 140990 }, { "epoch": 0.71, "learning_rate": 0.00019329552850245443, "loss": 0.0156, "step": 141000 }, { "epoch": 0.71, "eval_cer": 0.9144789894682909, "eval_loss": 0.009155085310339928, "eval_runtime": 116.8383, "eval_samples_per_second": 17.118, "eval_steps_per_second": 4.279, "step": 141000 }, { "epoch": 0.71, "learning_rate": 0.00019328796080944044, "loss": 0.0143, "step": 141010 }, { "epoch": 0.71, "learning_rate": 0.00019328039311642642, "loss": 0.0152, "step": 141020 }, { "epoch": 0.71, "learning_rate": 0.0001932728254234124, "loss": 0.0157, "step": 141030 }, { "epoch": 0.71, "learning_rate": 0.0001932652577303984, "loss": 0.0117, "step": 141040 }, { "epoch": 0.71, "learning_rate": 0.0001932576900373844, "loss": 0.0128, "step": 141050 }, { "epoch": 0.71, "learning_rate": 0.00019325012234437037, "loss": 0.0142, "step": 141060 }, { "epoch": 0.71, "learning_rate": 0.00019324255465135638, "loss": 0.0126, "step": 141070 }, { "epoch": 0.71, "learning_rate": 0.00019323498695834236, "loss": 0.0138, "step": 141080 }, { "epoch": 0.71, "learning_rate": 0.00019322741926532835, "loss": 0.0145, "step": 141090 }, { "epoch": 0.71, "learning_rate": 0.00019321985157231435, "loss": 0.0108, "step": 141100 }, { "epoch": 0.71, "learning_rate": 0.00019321228387930034, "loss": 0.0143, "step": 141110 }, { "epoch": 0.71, "learning_rate": 0.00019320471618628632, "loss": 0.012, "step": 141120 }, { "epoch": 0.71, "learning_rate": 0.00019319714849327233, "loss": 0.0135, "step": 141130 }, { "epoch": 0.71, "learning_rate": 0.0001931895808002583, "loss": 0.0145, "step": 141140 }, { "epoch": 0.71, "learning_rate": 0.0001931820131072443, "loss": 0.0112, "step": 141150 }, { "epoch": 0.71, "learning_rate": 0.00019317444541423027, "loss": 0.0124, "step": 141160 }, { "epoch": 0.71, "learning_rate": 0.00019316687772121628, "loss": 0.0108, "step": 141170 }, { "epoch": 0.71, "learning_rate": 0.00019315931002820226, "loss": 0.0124, "step": 141180 }, { "epoch": 0.71, "learning_rate": 0.00019315174233518824, "loss": 0.0145, "step": 141190 }, { "epoch": 0.71, "learning_rate": 0.00019314417464217425, "loss": 0.0142, "step": 141200 }, { "epoch": 0.71, "learning_rate": 0.00019313660694916023, "loss": 0.0146, "step": 141210 }, { "epoch": 0.71, "learning_rate": 0.0001931290392561462, "loss": 0.0126, "step": 141220 }, { "epoch": 0.71, "learning_rate": 0.00019312147156313222, "loss": 0.0134, "step": 141230 }, { "epoch": 0.71, "learning_rate": 0.0001931139038701182, "loss": 0.0142, "step": 141240 }, { "epoch": 0.71, "learning_rate": 0.00019310633617710418, "loss": 0.0144, "step": 141250 }, { "epoch": 0.71, "learning_rate": 0.0001930987684840902, "loss": 0.0141, "step": 141260 }, { "epoch": 0.71, "learning_rate": 0.00019309120079107617, "loss": 0.0141, "step": 141270 }, { "epoch": 0.71, "learning_rate": 0.00019308363309806216, "loss": 0.0135, "step": 141280 }, { "epoch": 0.71, "learning_rate": 0.00019307606540504816, "loss": 0.0129, "step": 141290 }, { "epoch": 0.71, "learning_rate": 0.00019306849771203415, "loss": 0.0113, "step": 141300 }, { "epoch": 0.71, "learning_rate": 0.00019306093001902013, "loss": 0.0134, "step": 141310 }, { "epoch": 0.71, "learning_rate": 0.00019305336232600614, "loss": 0.0137, "step": 141320 }, { "epoch": 0.71, "learning_rate": 0.00019304579463299212, "loss": 0.0137, "step": 141330 }, { "epoch": 0.71, "learning_rate": 0.0001930382269399781, "loss": 0.0123, "step": 141340 }, { "epoch": 0.71, "learning_rate": 0.00019303065924696408, "loss": 0.0129, "step": 141350 }, { "epoch": 0.71, "learning_rate": 0.0001930230915539501, "loss": 0.0136, "step": 141360 }, { "epoch": 0.71, "learning_rate": 0.00019301552386093607, "loss": 0.0127, "step": 141370 }, { "epoch": 0.71, "learning_rate": 0.00019300795616792205, "loss": 0.0119, "step": 141380 }, { "epoch": 0.71, "learning_rate": 0.00019300038847490806, "loss": 0.0146, "step": 141390 }, { "epoch": 0.71, "learning_rate": 0.00019299282078189401, "loss": 0.0123, "step": 141400 }, { "epoch": 0.71, "learning_rate": 0.00019298525308888, "loss": 0.0107, "step": 141410 }, { "epoch": 0.71, "learning_rate": 0.00019297768539586598, "loss": 0.0132, "step": 141420 }, { "epoch": 0.71, "learning_rate": 0.00019297011770285199, "loss": 0.0157, "step": 141430 }, { "epoch": 0.71, "learning_rate": 0.00019296255000983797, "loss": 0.0114, "step": 141440 }, { "epoch": 0.71, "learning_rate": 0.00019295498231682395, "loss": 0.0147, "step": 141450 }, { "epoch": 0.71, "learning_rate": 0.00019294741462380996, "loss": 0.0173, "step": 141460 }, { "epoch": 0.71, "learning_rate": 0.00019293984693079594, "loss": 0.0122, "step": 141470 }, { "epoch": 0.71, "learning_rate": 0.00019293227923778192, "loss": 0.0114, "step": 141480 }, { "epoch": 0.71, "learning_rate": 0.00019292471154476793, "loss": 0.0129, "step": 141490 }, { "epoch": 0.71, "learning_rate": 0.0001929171438517539, "loss": 0.0169, "step": 141500 }, { "epoch": 0.71, "learning_rate": 0.0001929095761587399, "loss": 0.0118, "step": 141510 }, { "epoch": 0.71, "learning_rate": 0.0001929020084657259, "loss": 0.014, "step": 141520 }, { "epoch": 0.71, "learning_rate": 0.00019289444077271188, "loss": 0.0137, "step": 141530 }, { "epoch": 0.71, "learning_rate": 0.00019288687307969786, "loss": 0.0142, "step": 141540 }, { "epoch": 0.71, "learning_rate": 0.00019287930538668384, "loss": 0.0145, "step": 141550 }, { "epoch": 0.71, "learning_rate": 0.00019287173769366985, "loss": 0.0126, "step": 141560 }, { "epoch": 0.71, "learning_rate": 0.00019286417000065583, "loss": 0.0119, "step": 141570 }, { "epoch": 0.71, "learning_rate": 0.00019285660230764182, "loss": 0.0123, "step": 141580 }, { "epoch": 0.71, "learning_rate": 0.00019284903461462782, "loss": 0.013, "step": 141590 }, { "epoch": 0.71, "learning_rate": 0.0001928414669216138, "loss": 0.0117, "step": 141600 }, { "epoch": 0.71, "learning_rate": 0.0001928338992285998, "loss": 0.0123, "step": 141610 }, { "epoch": 0.71, "learning_rate": 0.0001928263315355858, "loss": 0.0122, "step": 141620 }, { "epoch": 0.71, "learning_rate": 0.00019281876384257178, "loss": 0.0144, "step": 141630 }, { "epoch": 0.71, "learning_rate": 0.00019281119614955776, "loss": 0.0118, "step": 141640 }, { "epoch": 0.71, "learning_rate": 0.00019280362845654377, "loss": 0.0139, "step": 141650 }, { "epoch": 0.71, "learning_rate": 0.00019279606076352975, "loss": 0.0135, "step": 141660 }, { "epoch": 0.71, "learning_rate": 0.00019278849307051573, "loss": 0.0124, "step": 141670 }, { "epoch": 0.71, "learning_rate": 0.00019278092537750174, "loss": 0.0122, "step": 141680 }, { "epoch": 0.71, "learning_rate": 0.00019277335768448772, "loss": 0.0108, "step": 141690 }, { "epoch": 0.71, "learning_rate": 0.0001927657899914737, "loss": 0.0142, "step": 141700 }, { "epoch": 0.71, "learning_rate": 0.0001927582222984597, "loss": 0.0109, "step": 141710 }, { "epoch": 0.71, "learning_rate": 0.0001927506546054457, "loss": 0.0122, "step": 141720 }, { "epoch": 0.72, "learning_rate": 0.00019274308691243167, "loss": 0.0158, "step": 141730 }, { "epoch": 0.72, "learning_rate": 0.00019273551921941765, "loss": 0.0124, "step": 141740 }, { "epoch": 0.72, "learning_rate": 0.00019272795152640366, "loss": 0.0136, "step": 141750 }, { "epoch": 0.72, "learning_rate": 0.00019272038383338964, "loss": 0.0113, "step": 141760 }, { "epoch": 0.72, "learning_rate": 0.00019271281614037563, "loss": 0.0123, "step": 141770 }, { "epoch": 0.72, "learning_rate": 0.00019270524844736163, "loss": 0.0123, "step": 141780 }, { "epoch": 0.72, "learning_rate": 0.00019269768075434762, "loss": 0.0114, "step": 141790 }, { "epoch": 0.72, "learning_rate": 0.0001926901130613336, "loss": 0.0109, "step": 141800 }, { "epoch": 0.72, "learning_rate": 0.0001926825453683196, "loss": 0.0136, "step": 141810 }, { "epoch": 0.72, "learning_rate": 0.0001926749776753056, "loss": 0.0123, "step": 141820 }, { "epoch": 0.72, "learning_rate": 0.00019266740998229157, "loss": 0.0145, "step": 141830 }, { "epoch": 0.72, "learning_rate": 0.00019265984228927758, "loss": 0.0155, "step": 141840 }, { "epoch": 0.72, "learning_rate": 0.00019265227459626356, "loss": 0.0221, "step": 141850 }, { "epoch": 0.72, "learning_rate": 0.00019264470690324954, "loss": 0.0091, "step": 141860 }, { "epoch": 0.72, "learning_rate": 0.00019263713921023555, "loss": 0.014, "step": 141870 }, { "epoch": 0.72, "learning_rate": 0.00019262957151722153, "loss": 0.0132, "step": 141880 }, { "epoch": 0.72, "learning_rate": 0.0001926220038242075, "loss": 0.0193, "step": 141890 }, { "epoch": 0.72, "learning_rate": 0.0001926144361311935, "loss": 0.0147, "step": 141900 }, { "epoch": 0.72, "learning_rate": 0.0001926068684381795, "loss": 0.0123, "step": 141910 }, { "epoch": 0.72, "learning_rate": 0.00019259930074516548, "loss": 0.0165, "step": 141920 }, { "epoch": 0.72, "learning_rate": 0.00019259173305215146, "loss": 0.0159, "step": 141930 }, { "epoch": 0.72, "learning_rate": 0.00019258416535913747, "loss": 0.0135, "step": 141940 }, { "epoch": 0.72, "learning_rate": 0.00019257659766612345, "loss": 0.0166, "step": 141950 }, { "epoch": 0.72, "learning_rate": 0.00019256902997310944, "loss": 0.0119, "step": 141960 }, { "epoch": 0.72, "learning_rate": 0.00019256146228009544, "loss": 0.0129, "step": 141970 }, { "epoch": 0.72, "learning_rate": 0.00019255389458708143, "loss": 0.0146, "step": 141980 }, { "epoch": 0.72, "learning_rate": 0.0001925463268940674, "loss": 0.015, "step": 141990 }, { "epoch": 0.72, "learning_rate": 0.00019253875920105342, "loss": 0.0109, "step": 142000 }, { "epoch": 0.72, "eval_cer": 0.9144751078837893, "eval_loss": 0.009451182559132576, "eval_runtime": 116.6955, "eval_samples_per_second": 17.139, "eval_steps_per_second": 4.285, "step": 142000 }, { "epoch": 0.72, "learning_rate": 0.0001925311915080394, "loss": 0.0138, "step": 142010 }, { "epoch": 0.72, "learning_rate": 0.00019252362381502538, "loss": 0.014, "step": 142020 }, { "epoch": 0.72, "learning_rate": 0.0001925160561220114, "loss": 0.0146, "step": 142030 }, { "epoch": 0.72, "learning_rate": 0.00019250848842899737, "loss": 0.0153, "step": 142040 }, { "epoch": 0.72, "learning_rate": 0.00019250092073598335, "loss": 0.0132, "step": 142050 }, { "epoch": 0.72, "learning_rate": 0.00019249335304296933, "loss": 0.0153, "step": 142060 }, { "epoch": 0.72, "learning_rate": 0.00019248578534995534, "loss": 0.0151, "step": 142070 }, { "epoch": 0.72, "learning_rate": 0.00019247821765694132, "loss": 0.0142, "step": 142080 }, { "epoch": 0.72, "learning_rate": 0.0001924706499639273, "loss": 0.0145, "step": 142090 }, { "epoch": 0.72, "learning_rate": 0.0001924630822709133, "loss": 0.0106, "step": 142100 }, { "epoch": 0.72, "learning_rate": 0.0001924555145778993, "loss": 0.0153, "step": 142110 }, { "epoch": 0.72, "learning_rate": 0.00019244794688488527, "loss": 0.0152, "step": 142120 }, { "epoch": 0.72, "learning_rate": 0.00019244037919187128, "loss": 0.0128, "step": 142130 }, { "epoch": 0.72, "learning_rate": 0.00019243281149885726, "loss": 0.014, "step": 142140 }, { "epoch": 0.72, "learning_rate": 0.00019242524380584325, "loss": 0.0126, "step": 142150 }, { "epoch": 0.72, "learning_rate": 0.00019241767611282925, "loss": 0.0171, "step": 142160 }, { "epoch": 0.72, "learning_rate": 0.00019241010841981524, "loss": 0.0135, "step": 142170 }, { "epoch": 0.72, "learning_rate": 0.00019240254072680122, "loss": 0.0184, "step": 142180 }, { "epoch": 0.72, "learning_rate": 0.00019239497303378723, "loss": 0.013, "step": 142190 }, { "epoch": 0.72, "learning_rate": 0.0001923874053407732, "loss": 0.0143, "step": 142200 }, { "epoch": 0.72, "learning_rate": 0.0001923798376477592, "loss": 0.018, "step": 142210 }, { "epoch": 0.72, "learning_rate": 0.0001923722699547452, "loss": 0.014, "step": 142220 }, { "epoch": 0.72, "learning_rate": 0.00019236470226173118, "loss": 0.0103, "step": 142230 }, { "epoch": 0.72, "learning_rate": 0.00019235713456871716, "loss": 0.0136, "step": 142240 }, { "epoch": 0.72, "learning_rate": 0.00019234956687570314, "loss": 0.0144, "step": 142250 }, { "epoch": 0.72, "learning_rate": 0.00019234199918268915, "loss": 0.0158, "step": 142260 }, { "epoch": 0.72, "learning_rate": 0.00019233443148967513, "loss": 0.0122, "step": 142270 }, { "epoch": 0.72, "learning_rate": 0.0001923268637966611, "loss": 0.0139, "step": 142280 }, { "epoch": 0.72, "learning_rate": 0.00019231929610364712, "loss": 0.0112, "step": 142290 }, { "epoch": 0.72, "learning_rate": 0.0001923117284106331, "loss": 0.0123, "step": 142300 }, { "epoch": 0.72, "learning_rate": 0.00019230416071761908, "loss": 0.0143, "step": 142310 }, { "epoch": 0.72, "learning_rate": 0.0001922965930246051, "loss": 0.0179, "step": 142320 }, { "epoch": 0.72, "learning_rate": 0.00019228902533159107, "loss": 0.0118, "step": 142330 }, { "epoch": 0.72, "learning_rate": 0.00019228145763857706, "loss": 0.013, "step": 142340 }, { "epoch": 0.72, "learning_rate": 0.00019227388994556306, "loss": 0.0128, "step": 142350 }, { "epoch": 0.72, "learning_rate": 0.00019226632225254905, "loss": 0.011, "step": 142360 }, { "epoch": 0.72, "learning_rate": 0.00019225875455953503, "loss": 0.0148, "step": 142370 }, { "epoch": 0.72, "learning_rate": 0.00019225118686652104, "loss": 0.0181, "step": 142380 }, { "epoch": 0.72, "learning_rate": 0.00019224361917350702, "loss": 0.0131, "step": 142390 }, { "epoch": 0.72, "learning_rate": 0.000192236051480493, "loss": 0.0149, "step": 142400 }, { "epoch": 0.72, "learning_rate": 0.00019222848378747898, "loss": 0.0153, "step": 142410 }, { "epoch": 0.72, "learning_rate": 0.000192220916094465, "loss": 0.0126, "step": 142420 }, { "epoch": 0.72, "learning_rate": 0.00019221334840145097, "loss": 0.0121, "step": 142430 }, { "epoch": 0.72, "learning_rate": 0.00019220578070843695, "loss": 0.011, "step": 142440 }, { "epoch": 0.72, "learning_rate": 0.00019219821301542296, "loss": 0.0117, "step": 142450 }, { "epoch": 0.72, "learning_rate": 0.00019219064532240894, "loss": 0.0129, "step": 142460 }, { "epoch": 0.72, "learning_rate": 0.00019218307762939492, "loss": 0.0139, "step": 142470 }, { "epoch": 0.72, "learning_rate": 0.00019217550993638093, "loss": 0.0126, "step": 142480 }, { "epoch": 0.72, "learning_rate": 0.0001921679422433669, "loss": 0.0118, "step": 142490 }, { "epoch": 0.72, "learning_rate": 0.0001921603745503529, "loss": 0.0116, "step": 142500 }, { "epoch": 0.72, "learning_rate": 0.0001921528068573389, "loss": 0.0144, "step": 142510 }, { "epoch": 0.72, "learning_rate": 0.00019214523916432488, "loss": 0.014, "step": 142520 }, { "epoch": 0.72, "learning_rate": 0.00019213767147131087, "loss": 0.0122, "step": 142530 }, { "epoch": 0.72, "learning_rate": 0.00019213010377829687, "loss": 0.016, "step": 142540 }, { "epoch": 0.72, "learning_rate": 0.00019212253608528286, "loss": 0.0103, "step": 142550 }, { "epoch": 0.72, "learning_rate": 0.00019211496839226884, "loss": 0.0127, "step": 142560 }, { "epoch": 0.72, "learning_rate": 0.00019210740069925482, "loss": 0.0114, "step": 142570 }, { "epoch": 0.72, "learning_rate": 0.00019209983300624083, "loss": 0.0091, "step": 142580 }, { "epoch": 0.72, "learning_rate": 0.0001920922653132268, "loss": 0.014, "step": 142590 }, { "epoch": 0.72, "learning_rate": 0.0001920846976202128, "loss": 0.0124, "step": 142600 }, { "epoch": 0.72, "learning_rate": 0.0001920771299271988, "loss": 0.013, "step": 142610 }, { "epoch": 0.72, "learning_rate": 0.00019206956223418478, "loss": 0.01, "step": 142620 }, { "epoch": 0.72, "learning_rate": 0.00019206199454117076, "loss": 0.0132, "step": 142630 }, { "epoch": 0.72, "learning_rate": 0.00019205442684815677, "loss": 0.0143, "step": 142640 }, { "epoch": 0.72, "learning_rate": 0.00019204685915514275, "loss": 0.0164, "step": 142650 }, { "epoch": 0.72, "learning_rate": 0.0001920392914621287, "loss": 0.0102, "step": 142660 }, { "epoch": 0.72, "learning_rate": 0.0001920317237691147, "loss": 0.0154, "step": 142670 }, { "epoch": 0.72, "learning_rate": 0.0001920241560761007, "loss": 0.0115, "step": 142680 }, { "epoch": 0.72, "learning_rate": 0.00019201658838308668, "loss": 0.0125, "step": 142690 }, { "epoch": 0.72, "learning_rate": 0.00019200902069007266, "loss": 0.0144, "step": 142700 }, { "epoch": 0.72, "learning_rate": 0.00019200145299705867, "loss": 0.0121, "step": 142710 }, { "epoch": 0.72, "learning_rate": 0.00019199388530404465, "loss": 0.0112, "step": 142720 }, { "epoch": 0.72, "learning_rate": 0.00019198631761103063, "loss": 0.0116, "step": 142730 }, { "epoch": 0.72, "learning_rate": 0.00019197874991801664, "loss": 0.0134, "step": 142740 }, { "epoch": 0.72, "learning_rate": 0.00019197118222500262, "loss": 0.0114, "step": 142750 }, { "epoch": 0.72, "learning_rate": 0.0001919636145319886, "loss": 0.012, "step": 142760 }, { "epoch": 0.72, "learning_rate": 0.0001919560468389746, "loss": 0.0119, "step": 142770 }, { "epoch": 0.72, "learning_rate": 0.0001919484791459606, "loss": 0.0134, "step": 142780 }, { "epoch": 0.72, "learning_rate": 0.00019194091145294657, "loss": 0.0118, "step": 142790 }, { "epoch": 0.72, "learning_rate": 0.00019193334375993255, "loss": 0.0128, "step": 142800 }, { "epoch": 0.72, "learning_rate": 0.00019192577606691856, "loss": 0.0123, "step": 142810 }, { "epoch": 0.72, "learning_rate": 0.00019191820837390454, "loss": 0.0112, "step": 142820 }, { "epoch": 0.72, "learning_rate": 0.00019191064068089053, "loss": 0.0137, "step": 142830 }, { "epoch": 0.72, "learning_rate": 0.00019190307298787653, "loss": 0.0129, "step": 142840 }, { "epoch": 0.72, "learning_rate": 0.00019189550529486252, "loss": 0.0115, "step": 142850 }, { "epoch": 0.72, "learning_rate": 0.0001918879376018485, "loss": 0.0116, "step": 142860 }, { "epoch": 0.72, "learning_rate": 0.0001918803699088345, "loss": 0.0101, "step": 142870 }, { "epoch": 0.72, "learning_rate": 0.0001918728022158205, "loss": 0.0141, "step": 142880 }, { "epoch": 0.72, "learning_rate": 0.00019186523452280647, "loss": 0.0137, "step": 142890 }, { "epoch": 0.72, "learning_rate": 0.00019185766682979248, "loss": 0.0127, "step": 142900 }, { "epoch": 0.72, "learning_rate": 0.00019185009913677846, "loss": 0.0171, "step": 142910 }, { "epoch": 0.72, "learning_rate": 0.00019184253144376444, "loss": 0.0109, "step": 142920 }, { "epoch": 0.72, "learning_rate": 0.00019183496375075045, "loss": 0.0139, "step": 142930 }, { "epoch": 0.72, "learning_rate": 0.00019182739605773643, "loss": 0.0149, "step": 142940 }, { "epoch": 0.72, "learning_rate": 0.0001918198283647224, "loss": 0.0144, "step": 142950 }, { "epoch": 0.72, "learning_rate": 0.0001918122606717084, "loss": 0.012, "step": 142960 }, { "epoch": 0.72, "learning_rate": 0.0001918046929786944, "loss": 0.0132, "step": 142970 }, { "epoch": 0.72, "learning_rate": 0.00019179712528568038, "loss": 0.0132, "step": 142980 }, { "epoch": 0.72, "learning_rate": 0.00019178955759266636, "loss": 0.0131, "step": 142990 }, { "epoch": 0.72, "learning_rate": 0.00019178198989965237, "loss": 0.0133, "step": 143000 }, { "epoch": 0.72, "eval_cer": 0.9144770486760401, "eval_loss": 0.00942008476704359, "eval_runtime": 116.7292, "eval_samples_per_second": 17.134, "eval_steps_per_second": 4.283, "step": 143000 }, { "epoch": 0.72, "learning_rate": 0.00019177442220663835, "loss": 0.0117, "step": 143010 }, { "epoch": 0.72, "learning_rate": 0.00019176685451362434, "loss": 0.0151, "step": 143020 }, { "epoch": 0.72, "learning_rate": 0.00019175928682061034, "loss": 0.0119, "step": 143030 }, { "epoch": 0.72, "learning_rate": 0.00019175171912759633, "loss": 0.0118, "step": 143040 }, { "epoch": 0.72, "learning_rate": 0.0001917441514345823, "loss": 0.0126, "step": 143050 }, { "epoch": 0.72, "learning_rate": 0.00019173658374156832, "loss": 0.0122, "step": 143060 }, { "epoch": 0.72, "learning_rate": 0.0001917290160485543, "loss": 0.014, "step": 143070 }, { "epoch": 0.72, "learning_rate": 0.00019172144835554028, "loss": 0.0141, "step": 143080 }, { "epoch": 0.72, "learning_rate": 0.0001917138806625263, "loss": 0.0156, "step": 143090 }, { "epoch": 0.72, "learning_rate": 0.00019170631296951227, "loss": 0.0138, "step": 143100 }, { "epoch": 0.72, "learning_rate": 0.00019169874527649825, "loss": 0.0142, "step": 143110 }, { "epoch": 0.72, "learning_rate": 0.00019169117758348426, "loss": 0.0129, "step": 143120 }, { "epoch": 0.72, "learning_rate": 0.00019168360989047024, "loss": 0.0148, "step": 143130 }, { "epoch": 0.72, "learning_rate": 0.00019167604219745622, "loss": 0.0118, "step": 143140 }, { "epoch": 0.72, "learning_rate": 0.0001916684745044422, "loss": 0.0114, "step": 143150 }, { "epoch": 0.72, "learning_rate": 0.0001916609068114282, "loss": 0.0154, "step": 143160 }, { "epoch": 0.72, "learning_rate": 0.0001916533391184142, "loss": 0.0101, "step": 143170 }, { "epoch": 0.72, "learning_rate": 0.00019164577142540017, "loss": 0.0117, "step": 143180 }, { "epoch": 0.72, "learning_rate": 0.00019163820373238618, "loss": 0.013, "step": 143190 }, { "epoch": 0.72, "learning_rate": 0.00019163063603937216, "loss": 0.0107, "step": 143200 }, { "epoch": 0.72, "learning_rate": 0.00019162306834635815, "loss": 0.0127, "step": 143210 }, { "epoch": 0.72, "learning_rate": 0.00019161550065334415, "loss": 0.0124, "step": 143220 }, { "epoch": 0.72, "learning_rate": 0.00019160793296033014, "loss": 0.0114, "step": 143230 }, { "epoch": 0.72, "learning_rate": 0.00019160036526731612, "loss": 0.0146, "step": 143240 }, { "epoch": 0.72, "learning_rate": 0.00019159279757430213, "loss": 0.0129, "step": 143250 }, { "epoch": 0.72, "learning_rate": 0.0001915852298812881, "loss": 0.0117, "step": 143260 }, { "epoch": 0.72, "learning_rate": 0.0001915776621882741, "loss": 0.0119, "step": 143270 }, { "epoch": 0.72, "learning_rate": 0.0001915700944952601, "loss": 0.014, "step": 143280 }, { "epoch": 0.72, "learning_rate": 0.00019156252680224608, "loss": 0.0117, "step": 143290 }, { "epoch": 0.72, "learning_rate": 0.00019155495910923206, "loss": 0.0136, "step": 143300 }, { "epoch": 0.72, "learning_rate": 0.00019154739141621804, "loss": 0.0107, "step": 143310 }, { "epoch": 0.72, "learning_rate": 0.00019153982372320405, "loss": 0.0184, "step": 143320 }, { "epoch": 0.72, "learning_rate": 0.00019153225603019003, "loss": 0.013, "step": 143330 }, { "epoch": 0.72, "learning_rate": 0.000191524688337176, "loss": 0.0119, "step": 143340 }, { "epoch": 0.72, "learning_rate": 0.00019151712064416202, "loss": 0.0107, "step": 143350 }, { "epoch": 0.72, "learning_rate": 0.000191509552951148, "loss": 0.0104, "step": 143360 }, { "epoch": 0.72, "learning_rate": 0.00019150198525813398, "loss": 0.0135, "step": 143370 }, { "epoch": 0.72, "learning_rate": 0.00019149441756512, "loss": 0.0128, "step": 143380 }, { "epoch": 0.72, "learning_rate": 0.00019148684987210597, "loss": 0.0124, "step": 143390 }, { "epoch": 0.72, "learning_rate": 0.00019147928217909196, "loss": 0.0147, "step": 143400 }, { "epoch": 0.72, "learning_rate": 0.00019147171448607796, "loss": 0.0101, "step": 143410 }, { "epoch": 0.72, "learning_rate": 0.00019146414679306395, "loss": 0.0112, "step": 143420 }, { "epoch": 0.72, "learning_rate": 0.00019145657910004993, "loss": 0.0129, "step": 143430 }, { "epoch": 0.72, "learning_rate": 0.00019144901140703594, "loss": 0.0153, "step": 143440 }, { "epoch": 0.72, "learning_rate": 0.00019144144371402192, "loss": 0.0125, "step": 143450 }, { "epoch": 0.72, "learning_rate": 0.0001914338760210079, "loss": 0.0118, "step": 143460 }, { "epoch": 0.72, "learning_rate": 0.00019142630832799388, "loss": 0.0151, "step": 143470 }, { "epoch": 0.72, "learning_rate": 0.0001914187406349799, "loss": 0.0118, "step": 143480 }, { "epoch": 0.72, "learning_rate": 0.00019141117294196587, "loss": 0.0106, "step": 143490 }, { "epoch": 0.72, "learning_rate": 0.00019140360524895185, "loss": 0.0139, "step": 143500 }, { "epoch": 0.72, "learning_rate": 0.00019139603755593786, "loss": 0.0128, "step": 143510 }, { "epoch": 0.72, "learning_rate": 0.00019138846986292384, "loss": 0.0123, "step": 143520 }, { "epoch": 0.72, "learning_rate": 0.00019138090216990982, "loss": 0.0137, "step": 143530 }, { "epoch": 0.72, "learning_rate": 0.00019137333447689583, "loss": 0.0155, "step": 143540 }, { "epoch": 0.72, "learning_rate": 0.0001913657667838818, "loss": 0.0148, "step": 143550 }, { "epoch": 0.72, "learning_rate": 0.0001913581990908678, "loss": 0.0126, "step": 143560 }, { "epoch": 0.72, "learning_rate": 0.0001913506313978538, "loss": 0.0119, "step": 143570 }, { "epoch": 0.72, "learning_rate": 0.00019134306370483978, "loss": 0.0104, "step": 143580 }, { "epoch": 0.72, "learning_rate": 0.00019133549601182577, "loss": 0.0147, "step": 143590 }, { "epoch": 0.72, "learning_rate": 0.00019132792831881177, "loss": 0.0133, "step": 143600 }, { "epoch": 0.72, "learning_rate": 0.00019132036062579776, "loss": 0.0133, "step": 143610 }, { "epoch": 0.72, "learning_rate": 0.00019131279293278374, "loss": 0.0137, "step": 143620 }, { "epoch": 0.72, "learning_rate": 0.00019130522523976975, "loss": 0.0189, "step": 143630 }, { "epoch": 0.72, "learning_rate": 0.00019129765754675573, "loss": 0.0178, "step": 143640 }, { "epoch": 0.72, "learning_rate": 0.0001912900898537417, "loss": 0.0132, "step": 143650 }, { "epoch": 0.72, "learning_rate": 0.0001912825221607277, "loss": 0.0116, "step": 143660 }, { "epoch": 0.72, "learning_rate": 0.0001912749544677137, "loss": 0.0155, "step": 143670 }, { "epoch": 0.72, "learning_rate": 0.00019126738677469968, "loss": 0.0131, "step": 143680 }, { "epoch": 0.72, "learning_rate": 0.00019125981908168566, "loss": 0.0139, "step": 143690 }, { "epoch": 0.72, "learning_rate": 0.00019125225138867167, "loss": 0.0125, "step": 143700 }, { "epoch": 0.73, "learning_rate": 0.00019124468369565765, "loss": 0.0117, "step": 143710 }, { "epoch": 0.73, "learning_rate": 0.00019123711600264363, "loss": 0.0148, "step": 143720 }, { "epoch": 0.73, "learning_rate": 0.00019122954830962964, "loss": 0.0123, "step": 143730 }, { "epoch": 0.73, "learning_rate": 0.00019122198061661562, "loss": 0.0124, "step": 143740 }, { "epoch": 0.73, "learning_rate": 0.0001912144129236016, "loss": 0.0141, "step": 143750 }, { "epoch": 0.73, "learning_rate": 0.0001912068452305876, "loss": 0.0107, "step": 143760 }, { "epoch": 0.73, "learning_rate": 0.0001911992775375736, "loss": 0.0144, "step": 143770 }, { "epoch": 0.73, "learning_rate": 0.00019119170984455958, "loss": 0.0149, "step": 143780 }, { "epoch": 0.73, "learning_rate": 0.00019118414215154558, "loss": 0.0112, "step": 143790 }, { "epoch": 0.73, "learning_rate": 0.00019117657445853157, "loss": 0.0141, "step": 143800 }, { "epoch": 0.73, "learning_rate": 0.00019116900676551755, "loss": 0.0118, "step": 143810 }, { "epoch": 0.73, "learning_rate": 0.00019116143907250353, "loss": 0.012, "step": 143820 }, { "epoch": 0.73, "learning_rate": 0.00019115387137948954, "loss": 0.0146, "step": 143830 }, { "epoch": 0.73, "learning_rate": 0.00019114630368647552, "loss": 0.011, "step": 143840 }, { "epoch": 0.73, "learning_rate": 0.0001911387359934615, "loss": 0.0112, "step": 143850 }, { "epoch": 0.73, "learning_rate": 0.0001911311683004475, "loss": 0.0162, "step": 143860 }, { "epoch": 0.73, "learning_rate": 0.0001911236006074335, "loss": 0.0139, "step": 143870 }, { "epoch": 0.73, "learning_rate": 0.00019111603291441947, "loss": 0.0144, "step": 143880 }, { "epoch": 0.73, "learning_rate": 0.00019110846522140548, "loss": 0.0134, "step": 143890 }, { "epoch": 0.73, "learning_rate": 0.00019110089752839146, "loss": 0.0126, "step": 143900 }, { "epoch": 0.73, "learning_rate": 0.00019109332983537744, "loss": 0.0127, "step": 143910 }, { "epoch": 0.73, "learning_rate": 0.0001910857621423634, "loss": 0.0119, "step": 143920 }, { "epoch": 0.73, "learning_rate": 0.0001910781944493494, "loss": 0.016, "step": 143930 }, { "epoch": 0.73, "learning_rate": 0.0001910706267563354, "loss": 0.0108, "step": 143940 }, { "epoch": 0.73, "learning_rate": 0.00019106305906332137, "loss": 0.0166, "step": 143950 }, { "epoch": 0.73, "learning_rate": 0.00019105549137030738, "loss": 0.0135, "step": 143960 }, { "epoch": 0.73, "learning_rate": 0.00019104792367729336, "loss": 0.0133, "step": 143970 }, { "epoch": 0.73, "learning_rate": 0.00019104035598427934, "loss": 0.0134, "step": 143980 }, { "epoch": 0.73, "learning_rate": 0.00019103278829126535, "loss": 0.0121, "step": 143990 }, { "epoch": 0.73, "learning_rate": 0.00019102522059825133, "loss": 0.0111, "step": 144000 }, { "epoch": 0.73, "eval_cer": 0.914481900656667, "eval_loss": 0.009388601407408714, "eval_runtime": 116.6959, "eval_samples_per_second": 17.139, "eval_steps_per_second": 4.285, "step": 144000 }, { "epoch": 0.73, "learning_rate": 0.0001910176529052373, "loss": 0.01, "step": 144010 }, { "epoch": 0.73, "learning_rate": 0.00019101008521222332, "loss": 0.0112, "step": 144020 }, { "epoch": 0.73, "learning_rate": 0.0001910025175192093, "loss": 0.012, "step": 144030 }, { "epoch": 0.73, "learning_rate": 0.00019099494982619528, "loss": 0.0141, "step": 144040 }, { "epoch": 0.73, "learning_rate": 0.00019098738213318126, "loss": 0.0147, "step": 144050 }, { "epoch": 0.73, "learning_rate": 0.00019097981444016727, "loss": 0.0136, "step": 144060 }, { "epoch": 0.73, "learning_rate": 0.00019097224674715325, "loss": 0.011, "step": 144070 }, { "epoch": 0.73, "learning_rate": 0.00019096467905413924, "loss": 0.0129, "step": 144080 }, { "epoch": 0.73, "learning_rate": 0.00019095711136112524, "loss": 0.012, "step": 144090 }, { "epoch": 0.73, "learning_rate": 0.00019094954366811123, "loss": 0.0137, "step": 144100 }, { "epoch": 0.73, "learning_rate": 0.0001909419759750972, "loss": 0.0132, "step": 144110 }, { "epoch": 0.73, "learning_rate": 0.00019093440828208322, "loss": 0.0133, "step": 144120 }, { "epoch": 0.73, "learning_rate": 0.0001909268405890692, "loss": 0.0107, "step": 144130 }, { "epoch": 0.73, "learning_rate": 0.00019091927289605518, "loss": 0.0116, "step": 144140 }, { "epoch": 0.73, "learning_rate": 0.0001909117052030412, "loss": 0.0114, "step": 144150 }, { "epoch": 0.73, "learning_rate": 0.00019090413751002717, "loss": 0.0115, "step": 144160 }, { "epoch": 0.73, "learning_rate": 0.00019089656981701315, "loss": 0.0125, "step": 144170 }, { "epoch": 0.73, "learning_rate": 0.00019088900212399916, "loss": 0.0101, "step": 144180 }, { "epoch": 0.73, "learning_rate": 0.00019088143443098514, "loss": 0.016, "step": 144190 }, { "epoch": 0.73, "learning_rate": 0.00019087386673797112, "loss": 0.0162, "step": 144200 }, { "epoch": 0.73, "learning_rate": 0.0001908662990449571, "loss": 0.0118, "step": 144210 }, { "epoch": 0.73, "learning_rate": 0.0001908587313519431, "loss": 0.0122, "step": 144220 }, { "epoch": 0.73, "learning_rate": 0.0001908511636589291, "loss": 0.0149, "step": 144230 }, { "epoch": 0.73, "learning_rate": 0.00019084359596591507, "loss": 0.012, "step": 144240 }, { "epoch": 0.73, "learning_rate": 0.00019083602827290108, "loss": 0.0141, "step": 144250 }, { "epoch": 0.73, "learning_rate": 0.00019082846057988706, "loss": 0.0098, "step": 144260 }, { "epoch": 0.73, "learning_rate": 0.00019082089288687305, "loss": 0.0121, "step": 144270 }, { "epoch": 0.73, "learning_rate": 0.00019081332519385905, "loss": 0.0129, "step": 144280 }, { "epoch": 0.73, "learning_rate": 0.00019080575750084504, "loss": 0.0143, "step": 144290 }, { "epoch": 0.73, "learning_rate": 0.00019079818980783102, "loss": 0.012, "step": 144300 }, { "epoch": 0.73, "learning_rate": 0.00019079062211481703, "loss": 0.0132, "step": 144310 }, { "epoch": 0.73, "learning_rate": 0.000190783054421803, "loss": 0.0128, "step": 144320 }, { "epoch": 0.73, "learning_rate": 0.000190775486728789, "loss": 0.0153, "step": 144330 }, { "epoch": 0.73, "learning_rate": 0.000190767919035775, "loss": 0.014, "step": 144340 }, { "epoch": 0.73, "learning_rate": 0.00019076035134276098, "loss": 0.0125, "step": 144350 }, { "epoch": 0.73, "learning_rate": 0.00019075278364974696, "loss": 0.0138, "step": 144360 }, { "epoch": 0.73, "learning_rate": 0.00019074521595673294, "loss": 0.0145, "step": 144370 }, { "epoch": 0.73, "learning_rate": 0.00019073764826371895, "loss": 0.0121, "step": 144380 }, { "epoch": 0.73, "learning_rate": 0.00019073008057070493, "loss": 0.0144, "step": 144390 }, { "epoch": 0.73, "learning_rate": 0.0001907225128776909, "loss": 0.0141, "step": 144400 }, { "epoch": 0.73, "learning_rate": 0.00019071494518467692, "loss": 0.0119, "step": 144410 }, { "epoch": 0.73, "learning_rate": 0.0001907073774916629, "loss": 0.0145, "step": 144420 }, { "epoch": 0.73, "learning_rate": 0.00019069980979864888, "loss": 0.0189, "step": 144430 }, { "epoch": 0.73, "learning_rate": 0.0001906922421056349, "loss": 0.0111, "step": 144440 }, { "epoch": 0.73, "learning_rate": 0.00019068467441262087, "loss": 0.0135, "step": 144450 }, { "epoch": 0.73, "learning_rate": 0.00019067710671960686, "loss": 0.0128, "step": 144460 }, { "epoch": 0.73, "learning_rate": 0.00019066953902659286, "loss": 0.0092, "step": 144470 }, { "epoch": 0.73, "learning_rate": 0.00019066197133357885, "loss": 0.0114, "step": 144480 }, { "epoch": 0.73, "learning_rate": 0.00019065440364056483, "loss": 0.0122, "step": 144490 }, { "epoch": 0.73, "learning_rate": 0.00019064683594755084, "loss": 0.0118, "step": 144500 }, { "epoch": 0.73, "learning_rate": 0.00019063926825453682, "loss": 0.0137, "step": 144510 }, { "epoch": 0.73, "learning_rate": 0.0001906317005615228, "loss": 0.0118, "step": 144520 }, { "epoch": 0.73, "learning_rate": 0.0001906241328685088, "loss": 0.0152, "step": 144530 }, { "epoch": 0.73, "learning_rate": 0.0001906165651754948, "loss": 0.0183, "step": 144540 }, { "epoch": 0.73, "learning_rate": 0.00019060899748248077, "loss": 0.0167, "step": 144550 }, { "epoch": 0.73, "learning_rate": 0.00019060142978946675, "loss": 0.0118, "step": 144560 }, { "epoch": 0.73, "learning_rate": 0.00019059386209645276, "loss": 0.0128, "step": 144570 }, { "epoch": 0.73, "learning_rate": 0.00019058629440343874, "loss": 0.0116, "step": 144580 }, { "epoch": 0.73, "learning_rate": 0.00019057872671042472, "loss": 0.0121, "step": 144590 }, { "epoch": 0.73, "learning_rate": 0.00019057115901741073, "loss": 0.0132, "step": 144600 }, { "epoch": 0.73, "learning_rate": 0.0001905635913243967, "loss": 0.0143, "step": 144610 }, { "epoch": 0.73, "learning_rate": 0.0001905560236313827, "loss": 0.0125, "step": 144620 }, { "epoch": 0.73, "learning_rate": 0.0001905484559383687, "loss": 0.0147, "step": 144630 }, { "epoch": 0.73, "learning_rate": 0.00019054088824535468, "loss": 0.0128, "step": 144640 }, { "epoch": 0.73, "learning_rate": 0.00019053332055234067, "loss": 0.0147, "step": 144650 }, { "epoch": 0.73, "learning_rate": 0.00019052575285932667, "loss": 0.0123, "step": 144660 }, { "epoch": 0.73, "learning_rate": 0.00019051818516631266, "loss": 0.0182, "step": 144670 }, { "epoch": 0.73, "learning_rate": 0.00019051061747329864, "loss": 0.0139, "step": 144680 }, { "epoch": 0.73, "learning_rate": 0.00019050304978028465, "loss": 0.0118, "step": 144690 }, { "epoch": 0.73, "learning_rate": 0.00019049548208727063, "loss": 0.0149, "step": 144700 }, { "epoch": 0.73, "learning_rate": 0.0001904879143942566, "loss": 0.0144, "step": 144710 }, { "epoch": 0.73, "learning_rate": 0.0001904803467012426, "loss": 0.0136, "step": 144720 }, { "epoch": 0.73, "learning_rate": 0.0001904727790082286, "loss": 0.0174, "step": 144730 }, { "epoch": 0.73, "learning_rate": 0.00019046521131521458, "loss": 0.0144, "step": 144740 }, { "epoch": 0.73, "learning_rate": 0.00019045764362220056, "loss": 0.0121, "step": 144750 }, { "epoch": 0.73, "learning_rate": 0.00019045007592918657, "loss": 0.0161, "step": 144760 }, { "epoch": 0.73, "learning_rate": 0.00019044250823617255, "loss": 0.0108, "step": 144770 }, { "epoch": 0.73, "learning_rate": 0.00019043494054315853, "loss": 0.0159, "step": 144780 }, { "epoch": 0.73, "learning_rate": 0.00019042737285014454, "loss": 0.0115, "step": 144790 }, { "epoch": 0.73, "learning_rate": 0.00019041980515713052, "loss": 0.0113, "step": 144800 }, { "epoch": 0.73, "learning_rate": 0.0001904122374641165, "loss": 0.0127, "step": 144810 }, { "epoch": 0.73, "learning_rate": 0.00019040466977110251, "loss": 0.0158, "step": 144820 }, { "epoch": 0.73, "learning_rate": 0.0001903971020780885, "loss": 0.0134, "step": 144830 }, { "epoch": 0.73, "learning_rate": 0.00019038953438507448, "loss": 0.0149, "step": 144840 }, { "epoch": 0.73, "learning_rate": 0.00019038196669206049, "loss": 0.0154, "step": 144850 }, { "epoch": 0.73, "learning_rate": 0.00019037439899904647, "loss": 0.0132, "step": 144860 }, { "epoch": 0.73, "learning_rate": 0.00019036683130603245, "loss": 0.0134, "step": 144870 }, { "epoch": 0.73, "learning_rate": 0.00019035926361301843, "loss": 0.014, "step": 144880 }, { "epoch": 0.73, "learning_rate": 0.00019035169592000444, "loss": 0.0122, "step": 144890 }, { "epoch": 0.73, "learning_rate": 0.00019034412822699042, "loss": 0.0125, "step": 144900 }, { "epoch": 0.73, "learning_rate": 0.0001903365605339764, "loss": 0.0123, "step": 144910 }, { "epoch": 0.73, "learning_rate": 0.0001903289928409624, "loss": 0.0155, "step": 144920 }, { "epoch": 0.73, "learning_rate": 0.0001903214251479484, "loss": 0.0157, "step": 144930 }, { "epoch": 0.73, "learning_rate": 0.00019031385745493437, "loss": 0.0114, "step": 144940 }, { "epoch": 0.73, "learning_rate": 0.00019030628976192038, "loss": 0.0132, "step": 144950 }, { "epoch": 0.73, "learning_rate": 0.00019029872206890636, "loss": 0.0115, "step": 144960 }, { "epoch": 0.73, "learning_rate": 0.00019029115437589234, "loss": 0.011, "step": 144970 }, { "epoch": 0.73, "learning_rate": 0.00019028358668287835, "loss": 0.0123, "step": 144980 }, { "epoch": 0.73, "learning_rate": 0.00019027601898986433, "loss": 0.0121, "step": 144990 }, { "epoch": 0.73, "learning_rate": 0.00019026845129685032, "loss": 0.0122, "step": 145000 }, { "epoch": 0.73, "eval_cer": 0.9144566703574066, "eval_loss": 0.00918771605938673, "eval_runtime": 116.6602, "eval_samples_per_second": 17.144, "eval_steps_per_second": 4.286, "step": 145000 }, { "epoch": 0.73, "learning_rate": 0.00019026088360383632, "loss": 0.0124, "step": 145010 }, { "epoch": 0.73, "learning_rate": 0.0001902533159108223, "loss": 0.0144, "step": 145020 }, { "epoch": 0.73, "learning_rate": 0.0001902457482178083, "loss": 0.0127, "step": 145030 }, { "epoch": 0.73, "learning_rate": 0.00019023818052479427, "loss": 0.0136, "step": 145040 }, { "epoch": 0.73, "learning_rate": 0.00019023061283178028, "loss": 0.011, "step": 145050 }, { "epoch": 0.73, "learning_rate": 0.00019022304513876626, "loss": 0.0146, "step": 145060 }, { "epoch": 0.73, "learning_rate": 0.00019021547744575224, "loss": 0.0122, "step": 145070 }, { "epoch": 0.73, "learning_rate": 0.00019020790975273825, "loss": 0.0126, "step": 145080 }, { "epoch": 0.73, "learning_rate": 0.00019020034205972423, "loss": 0.0142, "step": 145090 }, { "epoch": 0.73, "learning_rate": 0.0001901927743667102, "loss": 0.0154, "step": 145100 }, { "epoch": 0.73, "learning_rate": 0.00019018520667369622, "loss": 0.0162, "step": 145110 }, { "epoch": 0.73, "learning_rate": 0.0001901776389806822, "loss": 0.0114, "step": 145120 }, { "epoch": 0.73, "learning_rate": 0.00019017007128766818, "loss": 0.0099, "step": 145130 }, { "epoch": 0.73, "learning_rate": 0.0001901625035946542, "loss": 0.0117, "step": 145140 }, { "epoch": 0.73, "learning_rate": 0.00019015493590164017, "loss": 0.0137, "step": 145150 }, { "epoch": 0.73, "learning_rate": 0.00019014736820862615, "loss": 0.0133, "step": 145160 }, { "epoch": 0.73, "learning_rate": 0.00019013980051561216, "loss": 0.0083, "step": 145170 }, { "epoch": 0.73, "learning_rate": 0.00019013223282259812, "loss": 0.0161, "step": 145180 }, { "epoch": 0.73, "learning_rate": 0.0001901246651295841, "loss": 0.0127, "step": 145190 }, { "epoch": 0.73, "learning_rate": 0.00019011709743657008, "loss": 0.0132, "step": 145200 }, { "epoch": 0.73, "learning_rate": 0.0001901095297435561, "loss": 0.0121, "step": 145210 }, { "epoch": 0.73, "learning_rate": 0.00019010196205054207, "loss": 0.0138, "step": 145220 }, { "epoch": 0.73, "learning_rate": 0.00019009439435752805, "loss": 0.0111, "step": 145230 }, { "epoch": 0.73, "learning_rate": 0.00019008682666451406, "loss": 0.0104, "step": 145240 }, { "epoch": 0.73, "learning_rate": 0.00019007925897150004, "loss": 0.0138, "step": 145250 }, { "epoch": 0.73, "learning_rate": 0.00019007169127848602, "loss": 0.0134, "step": 145260 }, { "epoch": 0.73, "learning_rate": 0.000190064123585472, "loss": 0.0118, "step": 145270 }, { "epoch": 0.73, "learning_rate": 0.000190056555892458, "loss": 0.0102, "step": 145280 }, { "epoch": 0.73, "learning_rate": 0.000190048988199444, "loss": 0.0148, "step": 145290 }, { "epoch": 0.73, "learning_rate": 0.00019004142050642998, "loss": 0.0117, "step": 145300 }, { "epoch": 0.73, "learning_rate": 0.00019003385281341598, "loss": 0.0125, "step": 145310 }, { "epoch": 0.73, "learning_rate": 0.00019002628512040197, "loss": 0.0093, "step": 145320 }, { "epoch": 0.73, "learning_rate": 0.00019001871742738795, "loss": 0.0128, "step": 145330 }, { "epoch": 0.73, "learning_rate": 0.00019001114973437396, "loss": 0.0137, "step": 145340 }, { "epoch": 0.73, "learning_rate": 0.00019000358204135994, "loss": 0.0143, "step": 145350 }, { "epoch": 0.73, "learning_rate": 0.00018999601434834592, "loss": 0.0134, "step": 145360 }, { "epoch": 0.73, "learning_rate": 0.00018998844665533193, "loss": 0.0143, "step": 145370 }, { "epoch": 0.73, "learning_rate": 0.0001899808789623179, "loss": 0.0155, "step": 145380 }, { "epoch": 0.73, "learning_rate": 0.0001899733112693039, "loss": 0.0134, "step": 145390 }, { "epoch": 0.73, "learning_rate": 0.0001899657435762899, "loss": 0.0108, "step": 145400 }, { "epoch": 0.73, "learning_rate": 0.00018995817588327588, "loss": 0.0098, "step": 145410 }, { "epoch": 0.73, "learning_rate": 0.00018995060819026186, "loss": 0.0128, "step": 145420 }, { "epoch": 0.73, "learning_rate": 0.00018994304049724784, "loss": 0.0108, "step": 145430 }, { "epoch": 0.73, "learning_rate": 0.00018993547280423385, "loss": 0.0138, "step": 145440 }, { "epoch": 0.73, "learning_rate": 0.00018992790511121983, "loss": 0.0129, "step": 145450 }, { "epoch": 0.73, "learning_rate": 0.00018992033741820581, "loss": 0.0134, "step": 145460 }, { "epoch": 0.73, "learning_rate": 0.00018991276972519182, "loss": 0.0147, "step": 145470 }, { "epoch": 0.73, "learning_rate": 0.0001899052020321778, "loss": 0.011, "step": 145480 }, { "epoch": 0.73, "learning_rate": 0.00018989763433916379, "loss": 0.0132, "step": 145490 }, { "epoch": 0.73, "learning_rate": 0.0001898900666461498, "loss": 0.0127, "step": 145500 }, { "epoch": 0.73, "learning_rate": 0.00018988249895313578, "loss": 0.0114, "step": 145510 }, { "epoch": 0.73, "learning_rate": 0.00018987493126012176, "loss": 0.0111, "step": 145520 }, { "epoch": 0.73, "learning_rate": 0.00018986736356710777, "loss": 0.0169, "step": 145530 }, { "epoch": 0.73, "learning_rate": 0.00018985979587409375, "loss": 0.0125, "step": 145540 }, { "epoch": 0.73, "learning_rate": 0.00018985222818107973, "loss": 0.0183, "step": 145550 }, { "epoch": 0.73, "learning_rate": 0.00018984466048806574, "loss": 0.0129, "step": 145560 }, { "epoch": 0.73, "learning_rate": 0.00018983709279505172, "loss": 0.0134, "step": 145570 }, { "epoch": 0.73, "learning_rate": 0.0001898295251020377, "loss": 0.0119, "step": 145580 }, { "epoch": 0.73, "learning_rate": 0.0001898219574090237, "loss": 0.014, "step": 145590 }, { "epoch": 0.73, "learning_rate": 0.0001898143897160097, "loss": 0.0116, "step": 145600 }, { "epoch": 0.73, "learning_rate": 0.00018980682202299567, "loss": 0.013, "step": 145610 }, { "epoch": 0.73, "learning_rate": 0.00018979925432998165, "loss": 0.0135, "step": 145620 }, { "epoch": 0.73, "learning_rate": 0.00018979168663696766, "loss": 0.0126, "step": 145630 }, { "epoch": 0.73, "learning_rate": 0.00018978411894395364, "loss": 0.0169, "step": 145640 }, { "epoch": 0.73, "learning_rate": 0.00018977655125093962, "loss": 0.0104, "step": 145650 }, { "epoch": 0.73, "learning_rate": 0.00018976898355792563, "loss": 0.0143, "step": 145660 }, { "epoch": 0.73, "learning_rate": 0.00018976141586491161, "loss": 0.0128, "step": 145670 }, { "epoch": 0.73, "learning_rate": 0.0001897538481718976, "loss": 0.0149, "step": 145680 }, { "epoch": 0.74, "learning_rate": 0.0001897462804788836, "loss": 0.0128, "step": 145690 }, { "epoch": 0.74, "learning_rate": 0.00018973871278586959, "loss": 0.0147, "step": 145700 }, { "epoch": 0.74, "learning_rate": 0.00018973114509285557, "loss": 0.0128, "step": 145710 }, { "epoch": 0.74, "learning_rate": 0.00018972357739984158, "loss": 0.0137, "step": 145720 }, { "epoch": 0.74, "learning_rate": 0.00018971600970682756, "loss": 0.0156, "step": 145730 }, { "epoch": 0.74, "learning_rate": 0.00018970844201381354, "loss": 0.0128, "step": 145740 }, { "epoch": 0.74, "learning_rate": 0.00018970087432079955, "loss": 0.0138, "step": 145750 }, { "epoch": 0.74, "learning_rate": 0.00018969330662778553, "loss": 0.0172, "step": 145760 }, { "epoch": 0.74, "learning_rate": 0.0001896857389347715, "loss": 0.0127, "step": 145770 }, { "epoch": 0.74, "learning_rate": 0.0001896781712417575, "loss": 0.0116, "step": 145780 }, { "epoch": 0.74, "learning_rate": 0.0001896706035487435, "loss": 0.0107, "step": 145790 }, { "epoch": 0.74, "learning_rate": 0.00018966303585572948, "loss": 0.0138, "step": 145800 }, { "epoch": 0.74, "learning_rate": 0.00018965546816271546, "loss": 0.0175, "step": 145810 }, { "epoch": 0.74, "learning_rate": 0.00018964790046970147, "loss": 0.0105, "step": 145820 }, { "epoch": 0.74, "learning_rate": 0.00018964033277668745, "loss": 0.0113, "step": 145830 }, { "epoch": 0.74, "learning_rate": 0.00018963276508367343, "loss": 0.0144, "step": 145840 }, { "epoch": 0.74, "learning_rate": 0.00018962519739065944, "loss": 0.0151, "step": 145850 }, { "epoch": 0.74, "learning_rate": 0.00018961762969764542, "loss": 0.0126, "step": 145860 }, { "epoch": 0.74, "learning_rate": 0.0001896100620046314, "loss": 0.0119, "step": 145870 }, { "epoch": 0.74, "learning_rate": 0.00018960249431161741, "loss": 0.0121, "step": 145880 }, { "epoch": 0.74, "learning_rate": 0.0001895949266186034, "loss": 0.0137, "step": 145890 }, { "epoch": 0.74, "learning_rate": 0.00018958735892558938, "loss": 0.0108, "step": 145900 }, { "epoch": 0.74, "learning_rate": 0.00018957979123257539, "loss": 0.0146, "step": 145910 }, { "epoch": 0.74, "learning_rate": 0.00018957222353956137, "loss": 0.0137, "step": 145920 }, { "epoch": 0.74, "learning_rate": 0.00018956465584654735, "loss": 0.013, "step": 145930 }, { "epoch": 0.74, "learning_rate": 0.00018955708815353333, "loss": 0.013, "step": 145940 }, { "epoch": 0.74, "learning_rate": 0.00018954952046051934, "loss": 0.0113, "step": 145950 }, { "epoch": 0.74, "learning_rate": 0.00018954195276750532, "loss": 0.0143, "step": 145960 }, { "epoch": 0.74, "learning_rate": 0.0001895343850744913, "loss": 0.0102, "step": 145970 }, { "epoch": 0.74, "learning_rate": 0.0001895268173814773, "loss": 0.0118, "step": 145980 }, { "epoch": 0.74, "learning_rate": 0.0001895192496884633, "loss": 0.0121, "step": 145990 }, { "epoch": 0.74, "learning_rate": 0.00018951168199544927, "loss": 0.0157, "step": 146000 }, { "epoch": 0.74, "eval_cer": 0.9144770486760401, "eval_loss": 0.009305712766945362, "eval_runtime": 116.6484, "eval_samples_per_second": 17.146, "eval_steps_per_second": 4.286, "step": 146000 }, { "epoch": 0.74, "learning_rate": 0.00018950411430243528, "loss": 0.0103, "step": 146010 }, { "epoch": 0.74, "learning_rate": 0.00018949654660942126, "loss": 0.0162, "step": 146020 }, { "epoch": 0.74, "learning_rate": 0.00018948897891640724, "loss": 0.01, "step": 146030 }, { "epoch": 0.74, "learning_rate": 0.00018948141122339325, "loss": 0.0143, "step": 146040 }, { "epoch": 0.74, "learning_rate": 0.00018947384353037923, "loss": 0.014, "step": 146050 }, { "epoch": 0.74, "learning_rate": 0.00018946627583736522, "loss": 0.0128, "step": 146060 }, { "epoch": 0.74, "learning_rate": 0.00018945870814435122, "loss": 0.0133, "step": 146070 }, { "epoch": 0.74, "learning_rate": 0.0001894511404513372, "loss": 0.0132, "step": 146080 }, { "epoch": 0.74, "learning_rate": 0.0001894435727583232, "loss": 0.0133, "step": 146090 }, { "epoch": 0.74, "learning_rate": 0.0001894360050653092, "loss": 0.0127, "step": 146100 }, { "epoch": 0.74, "learning_rate": 0.00018942843737229518, "loss": 0.0104, "step": 146110 }, { "epoch": 0.74, "learning_rate": 0.00018942086967928116, "loss": 0.0102, "step": 146120 }, { "epoch": 0.74, "learning_rate": 0.00018941330198626714, "loss": 0.0129, "step": 146130 }, { "epoch": 0.74, "learning_rate": 0.00018940573429325315, "loss": 0.0128, "step": 146140 }, { "epoch": 0.74, "learning_rate": 0.00018939816660023913, "loss": 0.0118, "step": 146150 }, { "epoch": 0.74, "learning_rate": 0.0001893905989072251, "loss": 0.0127, "step": 146160 }, { "epoch": 0.74, "learning_rate": 0.00018938303121421112, "loss": 0.0113, "step": 146170 }, { "epoch": 0.74, "learning_rate": 0.0001893754635211971, "loss": 0.0113, "step": 146180 }, { "epoch": 0.74, "learning_rate": 0.00018936789582818308, "loss": 0.0154, "step": 146190 }, { "epoch": 0.74, "learning_rate": 0.0001893603281351691, "loss": 0.0127, "step": 146200 }, { "epoch": 0.74, "learning_rate": 0.00018935276044215507, "loss": 0.0134, "step": 146210 }, { "epoch": 0.74, "learning_rate": 0.00018934519274914105, "loss": 0.0145, "step": 146220 }, { "epoch": 0.74, "learning_rate": 0.00018933762505612706, "loss": 0.0145, "step": 146230 }, { "epoch": 0.74, "learning_rate": 0.00018933005736311304, "loss": 0.0116, "step": 146240 }, { "epoch": 0.74, "learning_rate": 0.00018932248967009903, "loss": 0.0126, "step": 146250 }, { "epoch": 0.74, "learning_rate": 0.00018931492197708503, "loss": 0.0094, "step": 146260 }, { "epoch": 0.74, "learning_rate": 0.00018930735428407102, "loss": 0.0142, "step": 146270 }, { "epoch": 0.74, "learning_rate": 0.000189299786591057, "loss": 0.0114, "step": 146280 }, { "epoch": 0.74, "learning_rate": 0.00018929221889804298, "loss": 0.0165, "step": 146290 }, { "epoch": 0.74, "learning_rate": 0.000189284651205029, "loss": 0.0119, "step": 146300 }, { "epoch": 0.74, "learning_rate": 0.00018927708351201497, "loss": 0.0185, "step": 146310 }, { "epoch": 0.74, "learning_rate": 0.00018926951581900095, "loss": 0.0133, "step": 146320 }, { "epoch": 0.74, "learning_rate": 0.00018926194812598696, "loss": 0.0124, "step": 146330 }, { "epoch": 0.74, "learning_rate": 0.00018925438043297294, "loss": 0.01, "step": 146340 }, { "epoch": 0.74, "learning_rate": 0.00018924681273995892, "loss": 0.0126, "step": 146350 }, { "epoch": 0.74, "learning_rate": 0.00018923924504694493, "loss": 0.0106, "step": 146360 }, { "epoch": 0.74, "learning_rate": 0.0001892316773539309, "loss": 0.0127, "step": 146370 }, { "epoch": 0.74, "learning_rate": 0.0001892241096609169, "loss": 0.0116, "step": 146380 }, { "epoch": 0.74, "learning_rate": 0.0001892165419679029, "loss": 0.0138, "step": 146390 }, { "epoch": 0.74, "learning_rate": 0.00018920897427488888, "loss": 0.015, "step": 146400 }, { "epoch": 0.74, "learning_rate": 0.00018920140658187486, "loss": 0.0128, "step": 146410 }, { "epoch": 0.74, "learning_rate": 0.00018919383888886087, "loss": 0.0128, "step": 146420 }, { "epoch": 0.74, "learning_rate": 0.00018918627119584683, "loss": 0.0137, "step": 146430 }, { "epoch": 0.74, "learning_rate": 0.0001891787035028328, "loss": 0.0099, "step": 146440 }, { "epoch": 0.74, "learning_rate": 0.0001891711358098188, "loss": 0.0089, "step": 146450 }, { "epoch": 0.74, "learning_rate": 0.0001891635681168048, "loss": 0.0142, "step": 146460 }, { "epoch": 0.74, "learning_rate": 0.00018915600042379078, "loss": 0.0104, "step": 146470 }, { "epoch": 0.74, "learning_rate": 0.00018914843273077676, "loss": 0.0111, "step": 146480 }, { "epoch": 0.74, "learning_rate": 0.00018914086503776277, "loss": 0.0136, "step": 146490 }, { "epoch": 0.74, "learning_rate": 0.00018913329734474875, "loss": 0.0143, "step": 146500 }, { "epoch": 0.74, "learning_rate": 0.00018912572965173473, "loss": 0.012, "step": 146510 }, { "epoch": 0.74, "learning_rate": 0.00018911816195872071, "loss": 0.0107, "step": 146520 }, { "epoch": 0.74, "learning_rate": 0.00018911059426570672, "loss": 0.0107, "step": 146530 }, { "epoch": 0.74, "learning_rate": 0.0001891030265726927, "loss": 0.0127, "step": 146540 }, { "epoch": 0.74, "learning_rate": 0.00018909545887967869, "loss": 0.013, "step": 146550 }, { "epoch": 0.74, "learning_rate": 0.0001890878911866647, "loss": 0.0143, "step": 146560 }, { "epoch": 0.74, "learning_rate": 0.00018908032349365068, "loss": 0.0135, "step": 146570 }, { "epoch": 0.74, "learning_rate": 0.00018907275580063666, "loss": 0.0128, "step": 146580 }, { "epoch": 0.74, "learning_rate": 0.00018906518810762267, "loss": 0.0124, "step": 146590 }, { "epoch": 0.74, "learning_rate": 0.00018905762041460865, "loss": 0.0144, "step": 146600 }, { "epoch": 0.74, "learning_rate": 0.00018905005272159463, "loss": 0.0141, "step": 146610 }, { "epoch": 0.74, "learning_rate": 0.00018904248502858064, "loss": 0.0121, "step": 146620 }, { "epoch": 0.74, "learning_rate": 0.00018903491733556662, "loss": 0.0158, "step": 146630 }, { "epoch": 0.74, "learning_rate": 0.0001890273496425526, "loss": 0.0117, "step": 146640 }, { "epoch": 0.74, "learning_rate": 0.0001890197819495386, "loss": 0.0097, "step": 146650 }, { "epoch": 0.74, "learning_rate": 0.0001890122142565246, "loss": 0.0161, "step": 146660 }, { "epoch": 0.74, "learning_rate": 0.00018900464656351057, "loss": 0.0094, "step": 146670 }, { "epoch": 0.74, "learning_rate": 0.00018899707887049655, "loss": 0.013, "step": 146680 }, { "epoch": 0.74, "learning_rate": 0.00018898951117748256, "loss": 0.015, "step": 146690 }, { "epoch": 0.74, "learning_rate": 0.00018898194348446854, "loss": 0.0135, "step": 146700 }, { "epoch": 0.74, "learning_rate": 0.00018897437579145452, "loss": 0.0152, "step": 146710 }, { "epoch": 0.74, "learning_rate": 0.00018896680809844053, "loss": 0.0142, "step": 146720 }, { "epoch": 0.74, "learning_rate": 0.00018895924040542651, "loss": 0.014, "step": 146730 }, { "epoch": 0.74, "learning_rate": 0.0001889516727124125, "loss": 0.0123, "step": 146740 }, { "epoch": 0.74, "learning_rate": 0.0001889441050193985, "loss": 0.0142, "step": 146750 }, { "epoch": 0.74, "learning_rate": 0.00018893653732638449, "loss": 0.0121, "step": 146760 }, { "epoch": 0.74, "learning_rate": 0.00018892896963337047, "loss": 0.0116, "step": 146770 }, { "epoch": 0.74, "learning_rate": 0.00018892140194035648, "loss": 0.0117, "step": 146780 }, { "epoch": 0.74, "learning_rate": 0.00018891383424734246, "loss": 0.0113, "step": 146790 }, { "epoch": 0.74, "learning_rate": 0.00018890626655432844, "loss": 0.0107, "step": 146800 }, { "epoch": 0.74, "learning_rate": 0.00018889869886131445, "loss": 0.0138, "step": 146810 }, { "epoch": 0.74, "learning_rate": 0.00018889113116830043, "loss": 0.013, "step": 146820 }, { "epoch": 0.74, "learning_rate": 0.0001888835634752864, "loss": 0.0139, "step": 146830 }, { "epoch": 0.74, "learning_rate": 0.0001888759957822724, "loss": 0.0129, "step": 146840 }, { "epoch": 0.74, "learning_rate": 0.0001888684280892584, "loss": 0.0121, "step": 146850 }, { "epoch": 0.74, "learning_rate": 0.00018886086039624438, "loss": 0.0145, "step": 146860 }, { "epoch": 0.74, "learning_rate": 0.00018885329270323036, "loss": 0.0144, "step": 146870 }, { "epoch": 0.74, "learning_rate": 0.00018884572501021637, "loss": 0.0156, "step": 146880 }, { "epoch": 0.74, "learning_rate": 0.00018883815731720235, "loss": 0.0133, "step": 146890 }, { "epoch": 0.74, "learning_rate": 0.00018883058962418833, "loss": 0.0132, "step": 146900 }, { "epoch": 0.74, "learning_rate": 0.00018882302193117434, "loss": 0.0141, "step": 146910 }, { "epoch": 0.74, "learning_rate": 0.00018881545423816032, "loss": 0.0138, "step": 146920 }, { "epoch": 0.74, "learning_rate": 0.0001888078865451463, "loss": 0.0111, "step": 146930 }, { "epoch": 0.74, "learning_rate": 0.00018880031885213231, "loss": 0.0111, "step": 146940 }, { "epoch": 0.74, "learning_rate": 0.0001887927511591183, "loss": 0.0135, "step": 146950 }, { "epoch": 0.74, "learning_rate": 0.00018878518346610428, "loss": 0.0141, "step": 146960 }, { "epoch": 0.74, "learning_rate": 0.00018877761577309029, "loss": 0.0126, "step": 146970 }, { "epoch": 0.74, "learning_rate": 0.00018877004808007627, "loss": 0.0121, "step": 146980 }, { "epoch": 0.74, "learning_rate": 0.00018876248038706225, "loss": 0.0122, "step": 146990 }, { "epoch": 0.74, "learning_rate": 0.00018875491269404826, "loss": 0.0125, "step": 147000 }, { "epoch": 0.74, "eval_cer": 0.914457640753532, "eval_loss": 0.009390231221914291, "eval_runtime": 115.7292, "eval_samples_per_second": 17.282, "eval_steps_per_second": 4.32, "step": 147000 }, { "epoch": 0.74, "learning_rate": 0.00018874734500103424, "loss": 0.0168, "step": 147010 }, { "epoch": 0.74, "learning_rate": 0.00018873977730802022, "loss": 0.0153, "step": 147020 }, { "epoch": 0.74, "learning_rate": 0.0001887322096150062, "loss": 0.0142, "step": 147030 }, { "epoch": 0.74, "learning_rate": 0.0001887246419219922, "loss": 0.0138, "step": 147040 }, { "epoch": 0.74, "learning_rate": 0.0001887170742289782, "loss": 0.0144, "step": 147050 }, { "epoch": 0.74, "learning_rate": 0.00018870950653596417, "loss": 0.0118, "step": 147060 }, { "epoch": 0.74, "learning_rate": 0.00018870193884295018, "loss": 0.0128, "step": 147070 }, { "epoch": 0.74, "learning_rate": 0.00018869437114993616, "loss": 0.0133, "step": 147080 }, { "epoch": 0.74, "learning_rate": 0.00018868680345692214, "loss": 0.0148, "step": 147090 }, { "epoch": 0.74, "learning_rate": 0.00018867923576390815, "loss": 0.013, "step": 147100 }, { "epoch": 0.74, "learning_rate": 0.00018867166807089413, "loss": 0.0122, "step": 147110 }, { "epoch": 0.74, "learning_rate": 0.00018866410037788012, "loss": 0.0137, "step": 147120 }, { "epoch": 0.74, "learning_rate": 0.00018865653268486612, "loss": 0.0127, "step": 147130 }, { "epoch": 0.74, "learning_rate": 0.0001886489649918521, "loss": 0.0151, "step": 147140 }, { "epoch": 0.74, "learning_rate": 0.0001886413972988381, "loss": 0.0145, "step": 147150 }, { "epoch": 0.74, "learning_rate": 0.0001886338296058241, "loss": 0.0142, "step": 147160 }, { "epoch": 0.74, "learning_rate": 0.00018862626191281008, "loss": 0.0187, "step": 147170 }, { "epoch": 0.74, "learning_rate": 0.00018861869421979606, "loss": 0.0136, "step": 147180 }, { "epoch": 0.74, "learning_rate": 0.00018861112652678204, "loss": 0.0119, "step": 147190 }, { "epoch": 0.74, "learning_rate": 0.00018860355883376805, "loss": 0.0126, "step": 147200 }, { "epoch": 0.74, "learning_rate": 0.00018859599114075403, "loss": 0.0126, "step": 147210 }, { "epoch": 0.74, "learning_rate": 0.00018858842344774, "loss": 0.0144, "step": 147220 }, { "epoch": 0.74, "learning_rate": 0.00018858085575472602, "loss": 0.0143, "step": 147230 }, { "epoch": 0.74, "learning_rate": 0.000188573288061712, "loss": 0.0139, "step": 147240 }, { "epoch": 0.74, "learning_rate": 0.00018856572036869798, "loss": 0.0123, "step": 147250 }, { "epoch": 0.74, "learning_rate": 0.000188558152675684, "loss": 0.0161, "step": 147260 }, { "epoch": 0.74, "learning_rate": 0.00018855058498266997, "loss": 0.0156, "step": 147270 }, { "epoch": 0.74, "learning_rate": 0.00018854301728965595, "loss": 0.0119, "step": 147280 }, { "epoch": 0.74, "learning_rate": 0.00018853544959664196, "loss": 0.0136, "step": 147290 }, { "epoch": 0.74, "learning_rate": 0.00018852788190362794, "loss": 0.0152, "step": 147300 }, { "epoch": 0.74, "learning_rate": 0.00018852031421061393, "loss": 0.0135, "step": 147310 }, { "epoch": 0.74, "learning_rate": 0.00018851274651759993, "loss": 0.0117, "step": 147320 }, { "epoch": 0.74, "learning_rate": 0.00018850517882458592, "loss": 0.0136, "step": 147330 }, { "epoch": 0.74, "learning_rate": 0.0001884976111315719, "loss": 0.0143, "step": 147340 }, { "epoch": 0.74, "learning_rate": 0.00018849004343855788, "loss": 0.0097, "step": 147350 }, { "epoch": 0.74, "learning_rate": 0.0001884824757455439, "loss": 0.0157, "step": 147360 }, { "epoch": 0.74, "learning_rate": 0.00018847490805252987, "loss": 0.0125, "step": 147370 }, { "epoch": 0.74, "learning_rate": 0.00018846734035951585, "loss": 0.0113, "step": 147380 }, { "epoch": 0.74, "learning_rate": 0.00018845977266650186, "loss": 0.0133, "step": 147390 }, { "epoch": 0.74, "learning_rate": 0.00018845220497348784, "loss": 0.0119, "step": 147400 }, { "epoch": 0.74, "learning_rate": 0.00018844463728047382, "loss": 0.0108, "step": 147410 }, { "epoch": 0.74, "learning_rate": 0.00018843706958745983, "loss": 0.0169, "step": 147420 }, { "epoch": 0.74, "learning_rate": 0.0001884295018944458, "loss": 0.0117, "step": 147430 }, { "epoch": 0.74, "learning_rate": 0.0001884219342014318, "loss": 0.0177, "step": 147440 }, { "epoch": 0.74, "learning_rate": 0.0001884143665084178, "loss": 0.0168, "step": 147450 }, { "epoch": 0.74, "learning_rate": 0.00018840679881540378, "loss": 0.0136, "step": 147460 }, { "epoch": 0.74, "learning_rate": 0.00018839923112238976, "loss": 0.0131, "step": 147470 }, { "epoch": 0.74, "learning_rate": 0.00018839166342937577, "loss": 0.0133, "step": 147480 }, { "epoch": 0.74, "learning_rate": 0.00018838409573636175, "loss": 0.0148, "step": 147490 }, { "epoch": 0.74, "learning_rate": 0.00018837652804334774, "loss": 0.0119, "step": 147500 }, { "epoch": 0.74, "learning_rate": 0.00018836896035033374, "loss": 0.0116, "step": 147510 }, { "epoch": 0.74, "learning_rate": 0.00018836139265731973, "loss": 0.011, "step": 147520 }, { "epoch": 0.74, "learning_rate": 0.0001883538249643057, "loss": 0.0143, "step": 147530 }, { "epoch": 0.74, "learning_rate": 0.0001883462572712917, "loss": 0.0133, "step": 147540 }, { "epoch": 0.74, "learning_rate": 0.0001883386895782777, "loss": 0.0136, "step": 147550 }, { "epoch": 0.74, "learning_rate": 0.00018833112188526368, "loss": 0.0161, "step": 147560 }, { "epoch": 0.74, "learning_rate": 0.00018832355419224966, "loss": 0.0123, "step": 147570 }, { "epoch": 0.74, "learning_rate": 0.00018831598649923567, "loss": 0.0163, "step": 147580 }, { "epoch": 0.74, "learning_rate": 0.00018830841880622165, "loss": 0.0165, "step": 147590 }, { "epoch": 0.74, "learning_rate": 0.00018830085111320763, "loss": 0.0138, "step": 147600 }, { "epoch": 0.74, "learning_rate": 0.00018829328342019364, "loss": 0.0126, "step": 147610 }, { "epoch": 0.74, "learning_rate": 0.00018828571572717962, "loss": 0.0133, "step": 147620 }, { "epoch": 0.74, "learning_rate": 0.0001882781480341656, "loss": 0.0129, "step": 147630 }, { "epoch": 0.74, "learning_rate": 0.0001882705803411516, "loss": 0.014, "step": 147640 }, { "epoch": 0.74, "learning_rate": 0.0001882630126481376, "loss": 0.0203, "step": 147650 }, { "epoch": 0.74, "learning_rate": 0.00018825544495512357, "loss": 0.0125, "step": 147660 }, { "epoch": 0.75, "learning_rate": 0.00018824787726210958, "loss": 0.0102, "step": 147670 }, { "epoch": 0.75, "learning_rate": 0.00018824030956909556, "loss": 0.0194, "step": 147680 }, { "epoch": 0.75, "learning_rate": 0.00018823274187608152, "loss": 0.0132, "step": 147690 }, { "epoch": 0.75, "learning_rate": 0.0001882251741830675, "loss": 0.0143, "step": 147700 }, { "epoch": 0.75, "learning_rate": 0.0001882176064900535, "loss": 0.0124, "step": 147710 }, { "epoch": 0.75, "learning_rate": 0.0001882100387970395, "loss": 0.0128, "step": 147720 }, { "epoch": 0.75, "learning_rate": 0.00018820247110402547, "loss": 0.0116, "step": 147730 }, { "epoch": 0.75, "learning_rate": 0.00018819490341101145, "loss": 0.0126, "step": 147740 }, { "epoch": 0.75, "learning_rate": 0.00018818733571799746, "loss": 0.0118, "step": 147750 }, { "epoch": 0.75, "learning_rate": 0.00018817976802498344, "loss": 0.0131, "step": 147760 }, { "epoch": 0.75, "learning_rate": 0.00018817220033196942, "loss": 0.0151, "step": 147770 }, { "epoch": 0.75, "learning_rate": 0.00018816463263895543, "loss": 0.0143, "step": 147780 }, { "epoch": 0.75, "learning_rate": 0.00018815706494594141, "loss": 0.0139, "step": 147790 }, { "epoch": 0.75, "learning_rate": 0.0001881494972529274, "loss": 0.0103, "step": 147800 }, { "epoch": 0.75, "learning_rate": 0.0001881419295599134, "loss": 0.0167, "step": 147810 }, { "epoch": 0.75, "learning_rate": 0.00018813436186689939, "loss": 0.0122, "step": 147820 }, { "epoch": 0.75, "learning_rate": 0.00018812679417388537, "loss": 0.011, "step": 147830 }, { "epoch": 0.75, "learning_rate": 0.00018811922648087138, "loss": 0.0152, "step": 147840 }, { "epoch": 0.75, "learning_rate": 0.00018811165878785736, "loss": 0.0138, "step": 147850 }, { "epoch": 0.75, "learning_rate": 0.00018810409109484334, "loss": 0.0142, "step": 147860 }, { "epoch": 0.75, "learning_rate": 0.00018809652340182935, "loss": 0.0131, "step": 147870 }, { "epoch": 0.75, "learning_rate": 0.00018808895570881533, "loss": 0.0126, "step": 147880 }, { "epoch": 0.75, "learning_rate": 0.0001880813880158013, "loss": 0.0138, "step": 147890 }, { "epoch": 0.75, "learning_rate": 0.00018807382032278732, "loss": 0.0108, "step": 147900 }, { "epoch": 0.75, "learning_rate": 0.0001880662526297733, "loss": 0.0136, "step": 147910 }, { "epoch": 0.75, "learning_rate": 0.00018805868493675928, "loss": 0.0121, "step": 147920 }, { "epoch": 0.75, "learning_rate": 0.00018805111724374526, "loss": 0.0116, "step": 147930 }, { "epoch": 0.75, "learning_rate": 0.00018804354955073127, "loss": 0.0122, "step": 147940 }, { "epoch": 0.75, "learning_rate": 0.00018803598185771725, "loss": 0.0095, "step": 147950 }, { "epoch": 0.75, "learning_rate": 0.00018802841416470323, "loss": 0.0169, "step": 147960 }, { "epoch": 0.75, "learning_rate": 0.00018802084647168924, "loss": 0.0119, "step": 147970 }, { "epoch": 0.75, "learning_rate": 0.00018801327877867522, "loss": 0.0121, "step": 147980 }, { "epoch": 0.75, "learning_rate": 0.0001880057110856612, "loss": 0.0152, "step": 147990 }, { "epoch": 0.75, "learning_rate": 0.00018799814339264721, "loss": 0.0136, "step": 148000 }, { "epoch": 0.75, "eval_cer": 0.9144741374876638, "eval_loss": 0.009097721427679062, "eval_runtime": 116.6762, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 148000 }, { "epoch": 0.75, "learning_rate": 0.0001879905756996332, "loss": 0.016, "step": 148010 }, { "epoch": 0.75, "learning_rate": 0.00018798300800661918, "loss": 0.0138, "step": 148020 }, { "epoch": 0.75, "learning_rate": 0.00018797544031360519, "loss": 0.0145, "step": 148030 }, { "epoch": 0.75, "learning_rate": 0.00018796787262059117, "loss": 0.0128, "step": 148040 }, { "epoch": 0.75, "learning_rate": 0.00018796030492757715, "loss": 0.0167, "step": 148050 }, { "epoch": 0.75, "learning_rate": 0.00018795273723456316, "loss": 0.0175, "step": 148060 }, { "epoch": 0.75, "learning_rate": 0.00018794516954154914, "loss": 0.0136, "step": 148070 }, { "epoch": 0.75, "learning_rate": 0.00018793760184853512, "loss": 0.0129, "step": 148080 }, { "epoch": 0.75, "learning_rate": 0.0001879300341555211, "loss": 0.0146, "step": 148090 }, { "epoch": 0.75, "learning_rate": 0.0001879224664625071, "loss": 0.0162, "step": 148100 }, { "epoch": 0.75, "learning_rate": 0.0001879148987694931, "loss": 0.0122, "step": 148110 }, { "epoch": 0.75, "learning_rate": 0.00018790733107647907, "loss": 0.0128, "step": 148120 }, { "epoch": 0.75, "learning_rate": 0.00018789976338346508, "loss": 0.0124, "step": 148130 }, { "epoch": 0.75, "learning_rate": 0.00018789219569045106, "loss": 0.0112, "step": 148140 }, { "epoch": 0.75, "learning_rate": 0.00018788462799743704, "loss": 0.0116, "step": 148150 }, { "epoch": 0.75, "learning_rate": 0.00018787706030442305, "loss": 0.0113, "step": 148160 }, { "epoch": 0.75, "learning_rate": 0.00018786949261140903, "loss": 0.0106, "step": 148170 }, { "epoch": 0.75, "learning_rate": 0.00018786192491839502, "loss": 0.012, "step": 148180 }, { "epoch": 0.75, "learning_rate": 0.00018785435722538102, "loss": 0.013, "step": 148190 }, { "epoch": 0.75, "learning_rate": 0.000187846789532367, "loss": 0.0164, "step": 148200 }, { "epoch": 0.75, "learning_rate": 0.000187839221839353, "loss": 0.011, "step": 148210 }, { "epoch": 0.75, "learning_rate": 0.000187831654146339, "loss": 0.017, "step": 148220 }, { "epoch": 0.75, "learning_rate": 0.00018782408645332498, "loss": 0.015, "step": 148230 }, { "epoch": 0.75, "learning_rate": 0.00018781651876031096, "loss": 0.0115, "step": 148240 }, { "epoch": 0.75, "learning_rate": 0.00018780895106729694, "loss": 0.0114, "step": 148250 }, { "epoch": 0.75, "learning_rate": 0.00018780138337428295, "loss": 0.0139, "step": 148260 }, { "epoch": 0.75, "learning_rate": 0.00018779381568126893, "loss": 0.0115, "step": 148270 }, { "epoch": 0.75, "learning_rate": 0.0001877862479882549, "loss": 0.0128, "step": 148280 }, { "epoch": 0.75, "learning_rate": 0.00018777868029524092, "loss": 0.0121, "step": 148290 }, { "epoch": 0.75, "learning_rate": 0.0001877711126022269, "loss": 0.0134, "step": 148300 }, { "epoch": 0.75, "learning_rate": 0.00018776354490921288, "loss": 0.0091, "step": 148310 }, { "epoch": 0.75, "learning_rate": 0.0001877559772161989, "loss": 0.0105, "step": 148320 }, { "epoch": 0.75, "learning_rate": 0.00018774840952318487, "loss": 0.0131, "step": 148330 }, { "epoch": 0.75, "learning_rate": 0.00018774084183017085, "loss": 0.0114, "step": 148340 }, { "epoch": 0.75, "learning_rate": 0.00018773327413715686, "loss": 0.0142, "step": 148350 }, { "epoch": 0.75, "learning_rate": 0.00018772570644414284, "loss": 0.012, "step": 148360 }, { "epoch": 0.75, "learning_rate": 0.00018771813875112883, "loss": 0.0122, "step": 148370 }, { "epoch": 0.75, "learning_rate": 0.00018771057105811483, "loss": 0.0123, "step": 148380 }, { "epoch": 0.75, "learning_rate": 0.00018770300336510082, "loss": 0.0134, "step": 148390 }, { "epoch": 0.75, "learning_rate": 0.0001876954356720868, "loss": 0.0158, "step": 148400 }, { "epoch": 0.75, "learning_rate": 0.0001876878679790728, "loss": 0.0137, "step": 148410 }, { "epoch": 0.75, "learning_rate": 0.0001876803002860588, "loss": 0.0114, "step": 148420 }, { "epoch": 0.75, "learning_rate": 0.00018767273259304477, "loss": 0.0125, "step": 148430 }, { "epoch": 0.75, "learning_rate": 0.00018766516490003075, "loss": 0.0134, "step": 148440 }, { "epoch": 0.75, "learning_rate": 0.00018765759720701676, "loss": 0.0123, "step": 148450 }, { "epoch": 0.75, "learning_rate": 0.00018765002951400274, "loss": 0.0112, "step": 148460 }, { "epoch": 0.75, "learning_rate": 0.00018764246182098872, "loss": 0.0111, "step": 148470 }, { "epoch": 0.75, "learning_rate": 0.00018763489412797473, "loss": 0.012, "step": 148480 }, { "epoch": 0.75, "learning_rate": 0.0001876273264349607, "loss": 0.0116, "step": 148490 }, { "epoch": 0.75, "learning_rate": 0.0001876197587419467, "loss": 0.0145, "step": 148500 }, { "epoch": 0.75, "learning_rate": 0.0001876121910489327, "loss": 0.0133, "step": 148510 }, { "epoch": 0.75, "learning_rate": 0.00018760462335591868, "loss": 0.011, "step": 148520 }, { "epoch": 0.75, "learning_rate": 0.00018759705566290466, "loss": 0.0161, "step": 148530 }, { "epoch": 0.75, "learning_rate": 0.00018758948796989067, "loss": 0.0134, "step": 148540 }, { "epoch": 0.75, "learning_rate": 0.00018758192027687665, "loss": 0.0102, "step": 148550 }, { "epoch": 0.75, "learning_rate": 0.00018757435258386264, "loss": 0.0115, "step": 148560 }, { "epoch": 0.75, "learning_rate": 0.00018756678489084864, "loss": 0.0123, "step": 148570 }, { "epoch": 0.75, "learning_rate": 0.00018755921719783463, "loss": 0.0123, "step": 148580 }, { "epoch": 0.75, "learning_rate": 0.0001875516495048206, "loss": 0.0108, "step": 148590 }, { "epoch": 0.75, "learning_rate": 0.0001875440818118066, "loss": 0.0125, "step": 148600 }, { "epoch": 0.75, "learning_rate": 0.0001875365141187926, "loss": 0.0115, "step": 148610 }, { "epoch": 0.75, "learning_rate": 0.00018752894642577858, "loss": 0.0128, "step": 148620 }, { "epoch": 0.75, "learning_rate": 0.00018752137873276456, "loss": 0.0118, "step": 148630 }, { "epoch": 0.75, "learning_rate": 0.00018751381103975057, "loss": 0.0169, "step": 148640 }, { "epoch": 0.75, "learning_rate": 0.00018750624334673655, "loss": 0.014, "step": 148650 }, { "epoch": 0.75, "learning_rate": 0.00018749867565372253, "loss": 0.0177, "step": 148660 }, { "epoch": 0.75, "learning_rate": 0.00018749110796070854, "loss": 0.0156, "step": 148670 }, { "epoch": 0.75, "learning_rate": 0.00018748354026769452, "loss": 0.015, "step": 148680 }, { "epoch": 0.75, "learning_rate": 0.0001874759725746805, "loss": 0.0136, "step": 148690 }, { "epoch": 0.75, "learning_rate": 0.0001874684048816665, "loss": 0.0124, "step": 148700 }, { "epoch": 0.75, "learning_rate": 0.0001874608371886525, "loss": 0.0119, "step": 148710 }, { "epoch": 0.75, "learning_rate": 0.00018745326949563847, "loss": 0.0102, "step": 148720 }, { "epoch": 0.75, "learning_rate": 0.00018744570180262448, "loss": 0.0105, "step": 148730 }, { "epoch": 0.75, "learning_rate": 0.00018743813410961046, "loss": 0.0094, "step": 148740 }, { "epoch": 0.75, "learning_rate": 0.00018743056641659645, "loss": 0.0146, "step": 148750 }, { "epoch": 0.75, "learning_rate": 0.00018742299872358243, "loss": 0.011, "step": 148760 }, { "epoch": 0.75, "learning_rate": 0.00018741543103056844, "loss": 0.0125, "step": 148770 }, { "epoch": 0.75, "learning_rate": 0.00018740786333755442, "loss": 0.0189, "step": 148780 }, { "epoch": 0.75, "learning_rate": 0.0001874002956445404, "loss": 0.0137, "step": 148790 }, { "epoch": 0.75, "learning_rate": 0.0001873927279515264, "loss": 0.0113, "step": 148800 }, { "epoch": 0.75, "learning_rate": 0.0001873851602585124, "loss": 0.013, "step": 148810 }, { "epoch": 0.75, "learning_rate": 0.00018737759256549837, "loss": 0.0116, "step": 148820 }, { "epoch": 0.75, "learning_rate": 0.00018737002487248438, "loss": 0.0098, "step": 148830 }, { "epoch": 0.75, "learning_rate": 0.00018736245717947036, "loss": 0.0136, "step": 148840 }, { "epoch": 0.75, "learning_rate": 0.00018735488948645634, "loss": 0.0115, "step": 148850 }, { "epoch": 0.75, "learning_rate": 0.00018734732179344235, "loss": 0.012, "step": 148860 }, { "epoch": 0.75, "learning_rate": 0.00018733975410042833, "loss": 0.0108, "step": 148870 }, { "epoch": 0.75, "learning_rate": 0.0001873321864074143, "loss": 0.0124, "step": 148880 }, { "epoch": 0.75, "learning_rate": 0.00018732461871440032, "loss": 0.012, "step": 148890 }, { "epoch": 0.75, "learning_rate": 0.0001873170510213863, "loss": 0.0123, "step": 148900 }, { "epoch": 0.75, "learning_rate": 0.00018730948332837228, "loss": 0.0141, "step": 148910 }, { "epoch": 0.75, "learning_rate": 0.00018730191563535827, "loss": 0.0228, "step": 148920 }, { "epoch": 0.75, "learning_rate": 0.00018729434794234427, "loss": 0.0132, "step": 148930 }, { "epoch": 0.75, "learning_rate": 0.00018728678024933026, "loss": 0.0147, "step": 148940 }, { "epoch": 0.75, "learning_rate": 0.0001872792125563162, "loss": 0.0122, "step": 148950 }, { "epoch": 0.75, "learning_rate": 0.00018727164486330222, "loss": 0.0163, "step": 148960 }, { "epoch": 0.75, "learning_rate": 0.0001872640771702882, "loss": 0.0108, "step": 148970 }, { "epoch": 0.75, "learning_rate": 0.00018725650947727418, "loss": 0.0169, "step": 148980 }, { "epoch": 0.75, "learning_rate": 0.00018724894178426016, "loss": 0.0163, "step": 148990 }, { "epoch": 0.75, "learning_rate": 0.00018724137409124617, "loss": 0.019, "step": 149000 }, { "epoch": 0.75, "eval_cer": 0.9144751078837893, "eval_loss": 0.009037774056196213, "eval_runtime": 116.6835, "eval_samples_per_second": 17.14, "eval_steps_per_second": 4.285, "step": 149000 }, { "epoch": 0.75, "learning_rate": 0.00018723380639823215, "loss": 0.0123, "step": 149010 }, { "epoch": 0.75, "learning_rate": 0.00018722623870521813, "loss": 0.013, "step": 149020 }, { "epoch": 0.75, "learning_rate": 0.00018721867101220414, "loss": 0.0146, "step": 149030 }, { "epoch": 0.75, "learning_rate": 0.00018721110331919012, "loss": 0.0126, "step": 149040 }, { "epoch": 0.75, "learning_rate": 0.0001872035356261761, "loss": 0.0105, "step": 149050 }, { "epoch": 0.75, "learning_rate": 0.00018719596793316211, "loss": 0.0149, "step": 149060 }, { "epoch": 0.75, "learning_rate": 0.0001871884002401481, "loss": 0.0138, "step": 149070 }, { "epoch": 0.75, "learning_rate": 0.00018718083254713408, "loss": 0.0135, "step": 149080 }, { "epoch": 0.75, "learning_rate": 0.00018717326485412009, "loss": 0.0127, "step": 149090 }, { "epoch": 0.75, "learning_rate": 0.00018716569716110607, "loss": 0.0153, "step": 149100 }, { "epoch": 0.75, "learning_rate": 0.00018715812946809205, "loss": 0.0154, "step": 149110 }, { "epoch": 0.75, "learning_rate": 0.00018715056177507806, "loss": 0.0151, "step": 149120 }, { "epoch": 0.75, "learning_rate": 0.00018714299408206404, "loss": 0.0149, "step": 149130 }, { "epoch": 0.75, "learning_rate": 0.00018713542638905002, "loss": 0.0113, "step": 149140 }, { "epoch": 0.75, "learning_rate": 0.000187127858696036, "loss": 0.0185, "step": 149150 }, { "epoch": 0.75, "learning_rate": 0.000187120291003022, "loss": 0.0144, "step": 149160 }, { "epoch": 0.75, "learning_rate": 0.000187112723310008, "loss": 0.0124, "step": 149170 }, { "epoch": 0.75, "learning_rate": 0.00018710515561699397, "loss": 0.0121, "step": 149180 }, { "epoch": 0.75, "learning_rate": 0.00018709758792397998, "loss": 0.0129, "step": 149190 }, { "epoch": 0.75, "learning_rate": 0.00018709002023096596, "loss": 0.0101, "step": 149200 }, { "epoch": 0.75, "learning_rate": 0.00018708245253795194, "loss": 0.0137, "step": 149210 }, { "epoch": 0.75, "learning_rate": 0.00018707488484493795, "loss": 0.0132, "step": 149220 }, { "epoch": 0.75, "learning_rate": 0.00018706731715192393, "loss": 0.0107, "step": 149230 }, { "epoch": 0.75, "learning_rate": 0.00018705974945890992, "loss": 0.0129, "step": 149240 }, { "epoch": 0.75, "learning_rate": 0.00018705218176589592, "loss": 0.0107, "step": 149250 }, { "epoch": 0.75, "learning_rate": 0.0001870446140728819, "loss": 0.0149, "step": 149260 }, { "epoch": 0.75, "learning_rate": 0.0001870370463798679, "loss": 0.011, "step": 149270 }, { "epoch": 0.75, "learning_rate": 0.0001870294786868539, "loss": 0.012, "step": 149280 }, { "epoch": 0.75, "learning_rate": 0.00018702191099383988, "loss": 0.0133, "step": 149290 }, { "epoch": 0.75, "learning_rate": 0.00018701434330082586, "loss": 0.0115, "step": 149300 }, { "epoch": 0.75, "learning_rate": 0.00018700677560781184, "loss": 0.0155, "step": 149310 }, { "epoch": 0.75, "learning_rate": 0.00018699920791479785, "loss": 0.0124, "step": 149320 }, { "epoch": 0.75, "learning_rate": 0.00018699164022178383, "loss": 0.0129, "step": 149330 }, { "epoch": 0.75, "learning_rate": 0.0001869840725287698, "loss": 0.012, "step": 149340 }, { "epoch": 0.75, "learning_rate": 0.00018697650483575582, "loss": 0.0114, "step": 149350 }, { "epoch": 0.75, "learning_rate": 0.0001869689371427418, "loss": 0.0147, "step": 149360 }, { "epoch": 0.75, "learning_rate": 0.00018696136944972778, "loss": 0.0151, "step": 149370 }, { "epoch": 0.75, "learning_rate": 0.0001869538017567138, "loss": 0.015, "step": 149380 }, { "epoch": 0.75, "learning_rate": 0.00018694623406369977, "loss": 0.0155, "step": 149390 }, { "epoch": 0.75, "learning_rate": 0.00018693866637068575, "loss": 0.0161, "step": 149400 }, { "epoch": 0.75, "learning_rate": 0.00018693109867767176, "loss": 0.0122, "step": 149410 }, { "epoch": 0.75, "learning_rate": 0.00018692353098465774, "loss": 0.0132, "step": 149420 }, { "epoch": 0.75, "learning_rate": 0.00018691596329164373, "loss": 0.0129, "step": 149430 }, { "epoch": 0.75, "learning_rate": 0.00018690839559862973, "loss": 0.018, "step": 149440 }, { "epoch": 0.75, "learning_rate": 0.00018690082790561572, "loss": 0.0137, "step": 149450 }, { "epoch": 0.75, "learning_rate": 0.0001868932602126017, "loss": 0.0142, "step": 149460 }, { "epoch": 0.75, "learning_rate": 0.0001868856925195877, "loss": 0.0145, "step": 149470 }, { "epoch": 0.75, "learning_rate": 0.0001868781248265737, "loss": 0.0095, "step": 149480 }, { "epoch": 0.75, "learning_rate": 0.00018687055713355967, "loss": 0.0127, "step": 149490 }, { "epoch": 0.75, "learning_rate": 0.00018686298944054565, "loss": 0.0162, "step": 149500 }, { "epoch": 0.75, "learning_rate": 0.00018685542174753166, "loss": 0.0174, "step": 149510 }, { "epoch": 0.75, "learning_rate": 0.00018684785405451764, "loss": 0.0115, "step": 149520 }, { "epoch": 0.75, "learning_rate": 0.00018684028636150362, "loss": 0.0126, "step": 149530 }, { "epoch": 0.75, "learning_rate": 0.00018683271866848963, "loss": 0.0129, "step": 149540 }, { "epoch": 0.75, "learning_rate": 0.0001868251509754756, "loss": 0.0121, "step": 149550 }, { "epoch": 0.75, "learning_rate": 0.0001868175832824616, "loss": 0.0121, "step": 149560 }, { "epoch": 0.75, "learning_rate": 0.0001868100155894476, "loss": 0.0166, "step": 149570 }, { "epoch": 0.75, "learning_rate": 0.00018680244789643358, "loss": 0.0095, "step": 149580 }, { "epoch": 0.75, "learning_rate": 0.00018679488020341956, "loss": 0.0134, "step": 149590 }, { "epoch": 0.75, "learning_rate": 0.00018678731251040557, "loss": 0.0108, "step": 149600 }, { "epoch": 0.75, "learning_rate": 0.00018677974481739155, "loss": 0.0167, "step": 149610 }, { "epoch": 0.75, "learning_rate": 0.00018677217712437754, "loss": 0.0141, "step": 149620 }, { "epoch": 0.75, "learning_rate": 0.00018676460943136354, "loss": 0.0117, "step": 149630 }, { "epoch": 0.75, "learning_rate": 0.00018675704173834953, "loss": 0.0113, "step": 149640 }, { "epoch": 0.76, "learning_rate": 0.0001867494740453355, "loss": 0.0172, "step": 149650 }, { "epoch": 0.76, "learning_rate": 0.0001867419063523215, "loss": 0.0099, "step": 149660 }, { "epoch": 0.76, "learning_rate": 0.0001867343386593075, "loss": 0.0109, "step": 149670 }, { "epoch": 0.76, "learning_rate": 0.00018672677096629348, "loss": 0.0152, "step": 149680 }, { "epoch": 0.76, "learning_rate": 0.00018671920327327946, "loss": 0.0152, "step": 149690 }, { "epoch": 0.76, "learning_rate": 0.00018671163558026547, "loss": 0.0116, "step": 149700 }, { "epoch": 0.76, "learning_rate": 0.00018670406788725145, "loss": 0.0138, "step": 149710 }, { "epoch": 0.76, "learning_rate": 0.00018669650019423743, "loss": 0.0166, "step": 149720 }, { "epoch": 0.76, "learning_rate": 0.00018668893250122344, "loss": 0.0128, "step": 149730 }, { "epoch": 0.76, "learning_rate": 0.00018668136480820942, "loss": 0.0136, "step": 149740 }, { "epoch": 0.76, "learning_rate": 0.0001866737971151954, "loss": 0.0126, "step": 149750 }, { "epoch": 0.76, "learning_rate": 0.0001866662294221814, "loss": 0.0147, "step": 149760 }, { "epoch": 0.76, "learning_rate": 0.0001866586617291674, "loss": 0.0118, "step": 149770 }, { "epoch": 0.76, "learning_rate": 0.00018665109403615337, "loss": 0.0116, "step": 149780 }, { "epoch": 0.76, "learning_rate": 0.00018664352634313938, "loss": 0.0117, "step": 149790 }, { "epoch": 0.76, "learning_rate": 0.00018663595865012536, "loss": 0.0152, "step": 149800 }, { "epoch": 0.76, "learning_rate": 0.00018662839095711135, "loss": 0.0135, "step": 149810 }, { "epoch": 0.76, "learning_rate": 0.00018662082326409733, "loss": 0.0131, "step": 149820 }, { "epoch": 0.76, "learning_rate": 0.00018661325557108334, "loss": 0.0165, "step": 149830 }, { "epoch": 0.76, "learning_rate": 0.00018660568787806932, "loss": 0.0147, "step": 149840 }, { "epoch": 0.76, "learning_rate": 0.0001865981201850553, "loss": 0.0125, "step": 149850 }, { "epoch": 0.76, "learning_rate": 0.0001865905524920413, "loss": 0.0152, "step": 149860 }, { "epoch": 0.76, "learning_rate": 0.0001865829847990273, "loss": 0.0146, "step": 149870 }, { "epoch": 0.76, "learning_rate": 0.00018657541710601327, "loss": 0.0148, "step": 149880 }, { "epoch": 0.76, "learning_rate": 0.00018656784941299928, "loss": 0.0123, "step": 149890 }, { "epoch": 0.76, "learning_rate": 0.00018656028171998526, "loss": 0.0121, "step": 149900 }, { "epoch": 0.76, "learning_rate": 0.00018655271402697124, "loss": 0.0144, "step": 149910 }, { "epoch": 0.76, "learning_rate": 0.00018654514633395725, "loss": 0.0161, "step": 149920 }, { "epoch": 0.76, "learning_rate": 0.00018653757864094323, "loss": 0.0126, "step": 149930 }, { "epoch": 0.76, "learning_rate": 0.0001865300109479292, "loss": 0.0218, "step": 149940 }, { "epoch": 0.76, "learning_rate": 0.00018652244325491522, "loss": 0.0143, "step": 149950 }, { "epoch": 0.76, "learning_rate": 0.0001865148755619012, "loss": 0.0144, "step": 149960 }, { "epoch": 0.76, "learning_rate": 0.00018650730786888718, "loss": 0.0104, "step": 149970 }, { "epoch": 0.76, "learning_rate": 0.0001864997401758732, "loss": 0.0141, "step": 149980 }, { "epoch": 0.76, "learning_rate": 0.00018649217248285917, "loss": 0.014, "step": 149990 }, { "epoch": 0.76, "learning_rate": 0.00018648460478984516, "loss": 0.012, "step": 150000 }, { "epoch": 0.76, "eval_cer": 0.9144857822411687, "eval_loss": 0.008926572278141975, "eval_runtime": 116.0551, "eval_samples_per_second": 17.233, "eval_steps_per_second": 4.308, "step": 150000 }, { "epoch": 0.76, "learning_rate": 0.00018647703709683114, "loss": 0.0139, "step": 150010 }, { "epoch": 0.76, "learning_rate": 0.00018646946940381715, "loss": 0.0121, "step": 150020 }, { "epoch": 0.76, "learning_rate": 0.00018646190171080313, "loss": 0.0115, "step": 150030 }, { "epoch": 0.76, "learning_rate": 0.0001864543340177891, "loss": 0.0109, "step": 150040 }, { "epoch": 0.76, "learning_rate": 0.00018644676632477512, "loss": 0.0137, "step": 150050 }, { "epoch": 0.76, "learning_rate": 0.0001864391986317611, "loss": 0.0137, "step": 150060 }, { "epoch": 0.76, "learning_rate": 0.00018643163093874708, "loss": 0.015, "step": 150070 }, { "epoch": 0.76, "learning_rate": 0.0001864240632457331, "loss": 0.0114, "step": 150080 }, { "epoch": 0.76, "learning_rate": 0.00018641649555271907, "loss": 0.0102, "step": 150090 }, { "epoch": 0.76, "learning_rate": 0.00018640892785970505, "loss": 0.0133, "step": 150100 }, { "epoch": 0.76, "learning_rate": 0.00018640136016669106, "loss": 0.0132, "step": 150110 }, { "epoch": 0.76, "learning_rate": 0.00018639379247367704, "loss": 0.012, "step": 150120 }, { "epoch": 0.76, "learning_rate": 0.00018638622478066302, "loss": 0.0124, "step": 150130 }, { "epoch": 0.76, "learning_rate": 0.00018637865708764903, "loss": 0.0113, "step": 150140 }, { "epoch": 0.76, "learning_rate": 0.000186371089394635, "loss": 0.0131, "step": 150150 }, { "epoch": 0.76, "learning_rate": 0.000186363521701621, "loss": 0.0122, "step": 150160 }, { "epoch": 0.76, "learning_rate": 0.00018635595400860698, "loss": 0.0127, "step": 150170 }, { "epoch": 0.76, "learning_rate": 0.00018634838631559298, "loss": 0.0116, "step": 150180 }, { "epoch": 0.76, "learning_rate": 0.00018634081862257897, "loss": 0.0137, "step": 150190 }, { "epoch": 0.76, "learning_rate": 0.00018633325092956492, "loss": 0.0133, "step": 150200 }, { "epoch": 0.76, "learning_rate": 0.0001863256832365509, "loss": 0.0131, "step": 150210 }, { "epoch": 0.76, "learning_rate": 0.0001863181155435369, "loss": 0.0157, "step": 150220 }, { "epoch": 0.76, "learning_rate": 0.0001863105478505229, "loss": 0.0153, "step": 150230 }, { "epoch": 0.76, "learning_rate": 0.00018630298015750887, "loss": 0.0136, "step": 150240 }, { "epoch": 0.76, "learning_rate": 0.00018629541246449488, "loss": 0.0134, "step": 150250 }, { "epoch": 0.76, "learning_rate": 0.00018628784477148086, "loss": 0.0107, "step": 150260 }, { "epoch": 0.76, "learning_rate": 0.00018628027707846684, "loss": 0.0121, "step": 150270 }, { "epoch": 0.76, "learning_rate": 0.00018627270938545285, "loss": 0.0164, "step": 150280 }, { "epoch": 0.76, "learning_rate": 0.00018626514169243883, "loss": 0.0144, "step": 150290 }, { "epoch": 0.76, "learning_rate": 0.00018625757399942482, "loss": 0.0094, "step": 150300 }, { "epoch": 0.76, "learning_rate": 0.00018625000630641082, "loss": 0.014, "step": 150310 }, { "epoch": 0.76, "learning_rate": 0.0001862424386133968, "loss": 0.0117, "step": 150320 }, { "epoch": 0.76, "learning_rate": 0.0001862348709203828, "loss": 0.0151, "step": 150330 }, { "epoch": 0.76, "learning_rate": 0.0001862273032273688, "loss": 0.0137, "step": 150340 }, { "epoch": 0.76, "learning_rate": 0.00018621973553435478, "loss": 0.0163, "step": 150350 }, { "epoch": 0.76, "learning_rate": 0.00018621216784134076, "loss": 0.0098, "step": 150360 }, { "epoch": 0.76, "learning_rate": 0.00018620460014832677, "loss": 0.0141, "step": 150370 }, { "epoch": 0.76, "learning_rate": 0.00018619703245531275, "loss": 0.0116, "step": 150380 }, { "epoch": 0.76, "learning_rate": 0.00018618946476229873, "loss": 0.0127, "step": 150390 }, { "epoch": 0.76, "learning_rate": 0.0001861818970692847, "loss": 0.0108, "step": 150400 }, { "epoch": 0.76, "learning_rate": 0.00018617432937627072, "loss": 0.0158, "step": 150410 }, { "epoch": 0.76, "learning_rate": 0.0001861667616832567, "loss": 0.0146, "step": 150420 }, { "epoch": 0.76, "learning_rate": 0.00018615919399024268, "loss": 0.0151, "step": 150430 }, { "epoch": 0.76, "learning_rate": 0.0001861516262972287, "loss": 0.0123, "step": 150440 }, { "epoch": 0.76, "learning_rate": 0.00018614405860421467, "loss": 0.0136, "step": 150450 }, { "epoch": 0.76, "learning_rate": 0.00018613649091120066, "loss": 0.0167, "step": 150460 }, { "epoch": 0.76, "learning_rate": 0.00018612892321818666, "loss": 0.0133, "step": 150470 }, { "epoch": 0.76, "learning_rate": 0.00018612135552517264, "loss": 0.0115, "step": 150480 }, { "epoch": 0.76, "learning_rate": 0.00018611378783215863, "loss": 0.0131, "step": 150490 }, { "epoch": 0.76, "learning_rate": 0.00018610622013914463, "loss": 0.0169, "step": 150500 }, { "epoch": 0.76, "learning_rate": 0.00018609865244613062, "loss": 0.014, "step": 150510 }, { "epoch": 0.76, "learning_rate": 0.0001860910847531166, "loss": 0.0155, "step": 150520 }, { "epoch": 0.76, "learning_rate": 0.0001860835170601026, "loss": 0.0136, "step": 150530 }, { "epoch": 0.76, "learning_rate": 0.0001860759493670886, "loss": 0.0115, "step": 150540 }, { "epoch": 0.76, "learning_rate": 0.00018606838167407457, "loss": 0.0092, "step": 150550 }, { "epoch": 0.76, "learning_rate": 0.00018606081398106055, "loss": 0.0118, "step": 150560 }, { "epoch": 0.76, "learning_rate": 0.00018605324628804656, "loss": 0.0131, "step": 150570 }, { "epoch": 0.76, "learning_rate": 0.00018604567859503254, "loss": 0.0131, "step": 150580 }, { "epoch": 0.76, "learning_rate": 0.00018603811090201852, "loss": 0.0128, "step": 150590 }, { "epoch": 0.76, "learning_rate": 0.00018603054320900453, "loss": 0.0138, "step": 150600 }, { "epoch": 0.76, "learning_rate": 0.0001860229755159905, "loss": 0.0117, "step": 150610 }, { "epoch": 0.76, "learning_rate": 0.0001860154078229765, "loss": 0.0149, "step": 150620 }, { "epoch": 0.76, "learning_rate": 0.0001860078401299625, "loss": 0.0148, "step": 150630 }, { "epoch": 0.76, "learning_rate": 0.00018600027243694848, "loss": 0.0143, "step": 150640 }, { "epoch": 0.76, "learning_rate": 0.00018599270474393447, "loss": 0.0151, "step": 150650 }, { "epoch": 0.76, "learning_rate": 0.00018598513705092047, "loss": 0.0116, "step": 150660 }, { "epoch": 0.76, "learning_rate": 0.00018597756935790646, "loss": 0.0146, "step": 150670 }, { "epoch": 0.76, "learning_rate": 0.00018597000166489244, "loss": 0.0112, "step": 150680 }, { "epoch": 0.76, "learning_rate": 0.00018596243397187845, "loss": 0.0105, "step": 150690 }, { "epoch": 0.76, "learning_rate": 0.00018595486627886443, "loss": 0.0139, "step": 150700 }, { "epoch": 0.76, "learning_rate": 0.0001859472985858504, "loss": 0.0105, "step": 150710 }, { "epoch": 0.76, "learning_rate": 0.0001859397308928364, "loss": 0.0125, "step": 150720 }, { "epoch": 0.76, "learning_rate": 0.0001859321631998224, "loss": 0.012, "step": 150730 }, { "epoch": 0.76, "learning_rate": 0.00018592459550680838, "loss": 0.0114, "step": 150740 }, { "epoch": 0.76, "learning_rate": 0.00018591702781379436, "loss": 0.0129, "step": 150750 }, { "epoch": 0.76, "learning_rate": 0.00018590946012078037, "loss": 0.0112, "step": 150760 }, { "epoch": 0.76, "learning_rate": 0.00018590189242776635, "loss": 0.0135, "step": 150770 }, { "epoch": 0.76, "learning_rate": 0.00018589432473475233, "loss": 0.0138, "step": 150780 }, { "epoch": 0.76, "learning_rate": 0.00018588675704173834, "loss": 0.0158, "step": 150790 }, { "epoch": 0.76, "learning_rate": 0.00018587918934872432, "loss": 0.0143, "step": 150800 }, { "epoch": 0.76, "learning_rate": 0.0001858716216557103, "loss": 0.0139, "step": 150810 }, { "epoch": 0.76, "learning_rate": 0.0001858640539626963, "loss": 0.0118, "step": 150820 }, { "epoch": 0.76, "learning_rate": 0.0001858564862696823, "loss": 0.0112, "step": 150830 }, { "epoch": 0.76, "learning_rate": 0.00018584891857666828, "loss": 0.0104, "step": 150840 }, { "epoch": 0.76, "learning_rate": 0.00018584135088365428, "loss": 0.0118, "step": 150850 }, { "epoch": 0.76, "learning_rate": 0.00018583378319064027, "loss": 0.0122, "step": 150860 }, { "epoch": 0.76, "learning_rate": 0.00018582621549762625, "loss": 0.0142, "step": 150870 }, { "epoch": 0.76, "learning_rate": 0.00018581864780461226, "loss": 0.0119, "step": 150880 }, { "epoch": 0.76, "learning_rate": 0.00018581108011159824, "loss": 0.0122, "step": 150890 }, { "epoch": 0.76, "learning_rate": 0.00018580351241858422, "loss": 0.0147, "step": 150900 }, { "epoch": 0.76, "learning_rate": 0.0001857959447255702, "loss": 0.0147, "step": 150910 }, { "epoch": 0.76, "learning_rate": 0.0001857883770325562, "loss": 0.0139, "step": 150920 }, { "epoch": 0.76, "learning_rate": 0.0001857808093395422, "loss": 0.0158, "step": 150930 }, { "epoch": 0.76, "learning_rate": 0.00018577324164652817, "loss": 0.0113, "step": 150940 }, { "epoch": 0.76, "learning_rate": 0.00018576567395351418, "loss": 0.0117, "step": 150950 }, { "epoch": 0.76, "learning_rate": 0.00018575810626050016, "loss": 0.0124, "step": 150960 }, { "epoch": 0.76, "learning_rate": 0.00018575053856748614, "loss": 0.0141, "step": 150970 }, { "epoch": 0.76, "learning_rate": 0.00018574297087447215, "loss": 0.0149, "step": 150980 }, { "epoch": 0.76, "learning_rate": 0.00018573540318145813, "loss": 0.0116, "step": 150990 }, { "epoch": 0.76, "learning_rate": 0.00018572783548844411, "loss": 0.0146, "step": 151000 }, { "epoch": 0.76, "eval_cer": 0.9144760782799146, "eval_loss": 0.00918071623891592, "eval_runtime": 116.7205, "eval_samples_per_second": 17.135, "eval_steps_per_second": 4.284, "step": 151000 }, { "epoch": 0.76, "learning_rate": 0.00018572026779543012, "loss": 0.0125, "step": 151010 }, { "epoch": 0.76, "learning_rate": 0.0001857127001024161, "loss": 0.0133, "step": 151020 }, { "epoch": 0.76, "learning_rate": 0.00018570513240940209, "loss": 0.0129, "step": 151030 }, { "epoch": 0.76, "learning_rate": 0.0001856975647163881, "loss": 0.0122, "step": 151040 }, { "epoch": 0.76, "learning_rate": 0.00018568999702337408, "loss": 0.0135, "step": 151050 }, { "epoch": 0.76, "learning_rate": 0.00018568242933036006, "loss": 0.0141, "step": 151060 }, { "epoch": 0.76, "learning_rate": 0.00018567486163734604, "loss": 0.0118, "step": 151070 }, { "epoch": 0.76, "learning_rate": 0.00018566729394433205, "loss": 0.0113, "step": 151080 }, { "epoch": 0.76, "learning_rate": 0.00018565972625131803, "loss": 0.015, "step": 151090 }, { "epoch": 0.76, "learning_rate": 0.000185652158558304, "loss": 0.0135, "step": 151100 }, { "epoch": 0.76, "learning_rate": 0.00018564459086529002, "loss": 0.0149, "step": 151110 }, { "epoch": 0.76, "learning_rate": 0.000185637023172276, "loss": 0.0118, "step": 151120 }, { "epoch": 0.76, "learning_rate": 0.00018562945547926198, "loss": 0.013, "step": 151130 }, { "epoch": 0.76, "learning_rate": 0.000185621887786248, "loss": 0.0111, "step": 151140 }, { "epoch": 0.76, "learning_rate": 0.00018561432009323397, "loss": 0.0139, "step": 151150 }, { "epoch": 0.76, "learning_rate": 0.00018560675240021995, "loss": 0.0121, "step": 151160 }, { "epoch": 0.76, "learning_rate": 0.00018559918470720596, "loss": 0.0114, "step": 151170 }, { "epoch": 0.76, "learning_rate": 0.00018559161701419194, "loss": 0.0111, "step": 151180 }, { "epoch": 0.76, "learning_rate": 0.00018558404932117792, "loss": 0.0192, "step": 151190 }, { "epoch": 0.76, "learning_rate": 0.00018557648162816393, "loss": 0.0119, "step": 151200 }, { "epoch": 0.76, "learning_rate": 0.00018556891393514991, "loss": 0.0108, "step": 151210 }, { "epoch": 0.76, "learning_rate": 0.0001855613462421359, "loss": 0.0114, "step": 151220 }, { "epoch": 0.76, "learning_rate": 0.00018555377854912188, "loss": 0.0104, "step": 151230 }, { "epoch": 0.76, "learning_rate": 0.00018554621085610789, "loss": 0.0143, "step": 151240 }, { "epoch": 0.76, "learning_rate": 0.00018553864316309387, "loss": 0.0122, "step": 151250 }, { "epoch": 0.76, "learning_rate": 0.00018553107547007985, "loss": 0.0103, "step": 151260 }, { "epoch": 0.76, "learning_rate": 0.00018552350777706586, "loss": 0.0133, "step": 151270 }, { "epoch": 0.76, "learning_rate": 0.00018551594008405184, "loss": 0.0112, "step": 151280 }, { "epoch": 0.76, "learning_rate": 0.00018550837239103782, "loss": 0.0123, "step": 151290 }, { "epoch": 0.76, "learning_rate": 0.00018550080469802383, "loss": 0.0121, "step": 151300 }, { "epoch": 0.76, "learning_rate": 0.0001854932370050098, "loss": 0.0125, "step": 151310 }, { "epoch": 0.76, "learning_rate": 0.0001854856693119958, "loss": 0.0135, "step": 151320 }, { "epoch": 0.76, "learning_rate": 0.0001854781016189818, "loss": 0.0115, "step": 151330 }, { "epoch": 0.76, "learning_rate": 0.00018547053392596778, "loss": 0.0086, "step": 151340 }, { "epoch": 0.76, "learning_rate": 0.00018546296623295376, "loss": 0.0119, "step": 151350 }, { "epoch": 0.76, "learning_rate": 0.00018545539853993977, "loss": 0.0117, "step": 151360 }, { "epoch": 0.76, "learning_rate": 0.00018544783084692575, "loss": 0.0129, "step": 151370 }, { "epoch": 0.76, "learning_rate": 0.00018544026315391173, "loss": 0.0141, "step": 151380 }, { "epoch": 0.76, "learning_rate": 0.00018543269546089774, "loss": 0.0139, "step": 151390 }, { "epoch": 0.76, "learning_rate": 0.00018542512776788372, "loss": 0.0141, "step": 151400 }, { "epoch": 0.76, "learning_rate": 0.0001854175600748697, "loss": 0.0112, "step": 151410 }, { "epoch": 0.76, "learning_rate": 0.0001854099923818557, "loss": 0.014, "step": 151420 }, { "epoch": 0.76, "learning_rate": 0.0001854024246888417, "loss": 0.0133, "step": 151430 }, { "epoch": 0.76, "learning_rate": 0.00018539485699582768, "loss": 0.0128, "step": 151440 }, { "epoch": 0.76, "learning_rate": 0.00018538728930281366, "loss": 0.0111, "step": 151450 }, { "epoch": 0.76, "learning_rate": 0.0001853797216097996, "loss": 0.0141, "step": 151460 }, { "epoch": 0.76, "learning_rate": 0.00018537215391678562, "loss": 0.0125, "step": 151470 }, { "epoch": 0.76, "learning_rate": 0.0001853645862237716, "loss": 0.0131, "step": 151480 }, { "epoch": 0.76, "learning_rate": 0.00018535701853075758, "loss": 0.0144, "step": 151490 }, { "epoch": 0.76, "learning_rate": 0.0001853494508377436, "loss": 0.0118, "step": 151500 }, { "epoch": 0.76, "learning_rate": 0.00018534188314472957, "loss": 0.0126, "step": 151510 }, { "epoch": 0.76, "learning_rate": 0.00018533431545171556, "loss": 0.0117, "step": 151520 }, { "epoch": 0.76, "learning_rate": 0.00018532674775870156, "loss": 0.0142, "step": 151530 }, { "epoch": 0.76, "learning_rate": 0.00018531918006568755, "loss": 0.0144, "step": 151540 }, { "epoch": 0.76, "learning_rate": 0.00018531161237267353, "loss": 0.0117, "step": 151550 }, { "epoch": 0.76, "learning_rate": 0.00018530404467965954, "loss": 0.0178, "step": 151560 }, { "epoch": 0.76, "learning_rate": 0.00018529647698664552, "loss": 0.0133, "step": 151570 }, { "epoch": 0.76, "learning_rate": 0.0001852889092936315, "loss": 0.0144, "step": 151580 }, { "epoch": 0.76, "learning_rate": 0.0001852813416006175, "loss": 0.0131, "step": 151590 }, { "epoch": 0.76, "learning_rate": 0.0001852737739076035, "loss": 0.0136, "step": 151600 }, { "epoch": 0.76, "learning_rate": 0.00018526620621458947, "loss": 0.0125, "step": 151610 }, { "epoch": 0.76, "learning_rate": 0.00018525863852157545, "loss": 0.0122, "step": 151620 }, { "epoch": 0.76, "learning_rate": 0.00018525107082856146, "loss": 0.0166, "step": 151630 }, { "epoch": 0.77, "learning_rate": 0.00018524350313554744, "loss": 0.0127, "step": 151640 }, { "epoch": 0.77, "learning_rate": 0.00018523593544253342, "loss": 0.012, "step": 151650 }, { "epoch": 0.77, "learning_rate": 0.00018522836774951943, "loss": 0.0187, "step": 151660 }, { "epoch": 0.77, "learning_rate": 0.0001852208000565054, "loss": 0.0119, "step": 151670 }, { "epoch": 0.77, "learning_rate": 0.0001852132323634914, "loss": 0.0146, "step": 151680 }, { "epoch": 0.77, "learning_rate": 0.0001852056646704774, "loss": 0.0126, "step": 151690 }, { "epoch": 0.77, "learning_rate": 0.00018519809697746338, "loss": 0.0128, "step": 151700 }, { "epoch": 0.77, "learning_rate": 0.00018519052928444937, "loss": 0.0125, "step": 151710 }, { "epoch": 0.77, "learning_rate": 0.00018518296159143537, "loss": 0.0139, "step": 151720 }, { "epoch": 0.77, "learning_rate": 0.00018517539389842136, "loss": 0.0112, "step": 151730 }, { "epoch": 0.77, "learning_rate": 0.00018516782620540734, "loss": 0.0099, "step": 151740 }, { "epoch": 0.77, "learning_rate": 0.00018516025851239335, "loss": 0.0105, "step": 151750 }, { "epoch": 0.77, "learning_rate": 0.00018515269081937933, "loss": 0.0139, "step": 151760 }, { "epoch": 0.77, "learning_rate": 0.0001851451231263653, "loss": 0.0109, "step": 151770 }, { "epoch": 0.77, "learning_rate": 0.00018513755543335132, "loss": 0.0135, "step": 151780 }, { "epoch": 0.77, "learning_rate": 0.0001851299877403373, "loss": 0.0145, "step": 151790 }, { "epoch": 0.77, "learning_rate": 0.00018512242004732328, "loss": 0.0136, "step": 151800 }, { "epoch": 0.77, "learning_rate": 0.00018511485235430926, "loss": 0.018, "step": 151810 }, { "epoch": 0.77, "learning_rate": 0.00018510728466129527, "loss": 0.0134, "step": 151820 }, { "epoch": 0.77, "learning_rate": 0.00018509971696828125, "loss": 0.0104, "step": 151830 }, { "epoch": 0.77, "learning_rate": 0.00018509214927526723, "loss": 0.0141, "step": 151840 }, { "epoch": 0.77, "learning_rate": 0.00018508458158225324, "loss": 0.0125, "step": 151850 }, { "epoch": 0.77, "learning_rate": 0.00018507701388923922, "loss": 0.0154, "step": 151860 }, { "epoch": 0.77, "learning_rate": 0.0001850694461962252, "loss": 0.0109, "step": 151870 }, { "epoch": 0.77, "learning_rate": 0.0001850618785032112, "loss": 0.0108, "step": 151880 }, { "epoch": 0.77, "learning_rate": 0.0001850543108101972, "loss": 0.0131, "step": 151890 }, { "epoch": 0.77, "learning_rate": 0.00018504674311718318, "loss": 0.0095, "step": 151900 }, { "epoch": 0.77, "learning_rate": 0.00018503917542416918, "loss": 0.0151, "step": 151910 }, { "epoch": 0.77, "learning_rate": 0.00018503160773115517, "loss": 0.0112, "step": 151920 }, { "epoch": 0.77, "learning_rate": 0.00018502404003814115, "loss": 0.0126, "step": 151930 }, { "epoch": 0.77, "learning_rate": 0.00018501647234512716, "loss": 0.0124, "step": 151940 }, { "epoch": 0.77, "learning_rate": 0.00018500890465211314, "loss": 0.0118, "step": 151950 }, { "epoch": 0.77, "learning_rate": 0.00018500133695909912, "loss": 0.0133, "step": 151960 }, { "epoch": 0.77, "learning_rate": 0.0001849937692660851, "loss": 0.0117, "step": 151970 }, { "epoch": 0.77, "learning_rate": 0.0001849862015730711, "loss": 0.0124, "step": 151980 }, { "epoch": 0.77, "learning_rate": 0.0001849786338800571, "loss": 0.0122, "step": 151990 }, { "epoch": 0.77, "learning_rate": 0.00018497106618704307, "loss": 0.0119, "step": 152000 }, { "epoch": 0.77, "eval_cer": 0.914467344714786, "eval_loss": 0.00894253607839346, "eval_runtime": 116.687, "eval_samples_per_second": 17.14, "eval_steps_per_second": 4.285, "step": 152000 }, { "epoch": 0.77, "learning_rate": 0.00018496349849402908, "loss": 0.0124, "step": 152010 }, { "epoch": 0.77, "learning_rate": 0.00018495593080101506, "loss": 0.0146, "step": 152020 }, { "epoch": 0.77, "learning_rate": 0.00018494836310800104, "loss": 0.0107, "step": 152030 }, { "epoch": 0.77, "learning_rate": 0.00018494079541498705, "loss": 0.014, "step": 152040 }, { "epoch": 0.77, "learning_rate": 0.00018493322772197303, "loss": 0.0096, "step": 152050 }, { "epoch": 0.77, "learning_rate": 0.00018492566002895901, "loss": 0.0149, "step": 152060 }, { "epoch": 0.77, "learning_rate": 0.00018491809233594502, "loss": 0.0156, "step": 152070 }, { "epoch": 0.77, "learning_rate": 0.000184910524642931, "loss": 0.0122, "step": 152080 }, { "epoch": 0.77, "learning_rate": 0.00018490295694991699, "loss": 0.0115, "step": 152090 }, { "epoch": 0.77, "learning_rate": 0.000184895389256903, "loss": 0.0144, "step": 152100 }, { "epoch": 0.77, "learning_rate": 0.00018488782156388898, "loss": 0.0134, "step": 152110 }, { "epoch": 0.77, "learning_rate": 0.00018488025387087496, "loss": 0.0129, "step": 152120 }, { "epoch": 0.77, "learning_rate": 0.00018487268617786094, "loss": 0.0152, "step": 152130 }, { "epoch": 0.77, "learning_rate": 0.00018486511848484695, "loss": 0.0098, "step": 152140 }, { "epoch": 0.77, "learning_rate": 0.00018485755079183293, "loss": 0.0128, "step": 152150 }, { "epoch": 0.77, "learning_rate": 0.0001848499830988189, "loss": 0.0131, "step": 152160 }, { "epoch": 0.77, "learning_rate": 0.00018484241540580492, "loss": 0.0136, "step": 152170 }, { "epoch": 0.77, "learning_rate": 0.0001848348477127909, "loss": 0.0114, "step": 152180 }, { "epoch": 0.77, "learning_rate": 0.00018482728001977688, "loss": 0.0113, "step": 152190 }, { "epoch": 0.77, "learning_rate": 0.0001848197123267629, "loss": 0.0161, "step": 152200 }, { "epoch": 0.77, "learning_rate": 0.00018481214463374887, "loss": 0.0161, "step": 152210 }, { "epoch": 0.77, "learning_rate": 0.00018480457694073485, "loss": 0.0136, "step": 152220 }, { "epoch": 0.77, "learning_rate": 0.00018479700924772086, "loss": 0.0108, "step": 152230 }, { "epoch": 0.77, "learning_rate": 0.00018478944155470684, "loss": 0.0123, "step": 152240 }, { "epoch": 0.77, "learning_rate": 0.00018478187386169282, "loss": 0.0108, "step": 152250 }, { "epoch": 0.77, "learning_rate": 0.00018477430616867883, "loss": 0.0125, "step": 152260 }, { "epoch": 0.77, "learning_rate": 0.00018476673847566481, "loss": 0.012, "step": 152270 }, { "epoch": 0.77, "learning_rate": 0.0001847591707826508, "loss": 0.0111, "step": 152280 }, { "epoch": 0.77, "learning_rate": 0.0001847516030896368, "loss": 0.0152, "step": 152290 }, { "epoch": 0.77, "learning_rate": 0.00018474403539662279, "loss": 0.0117, "step": 152300 }, { "epoch": 0.77, "learning_rate": 0.00018473646770360877, "loss": 0.0133, "step": 152310 }, { "epoch": 0.77, "learning_rate": 0.00018472890001059475, "loss": 0.0144, "step": 152320 }, { "epoch": 0.77, "learning_rate": 0.00018472133231758076, "loss": 0.0119, "step": 152330 }, { "epoch": 0.77, "learning_rate": 0.00018471376462456674, "loss": 0.0142, "step": 152340 }, { "epoch": 0.77, "learning_rate": 0.00018470619693155272, "loss": 0.0156, "step": 152350 }, { "epoch": 0.77, "learning_rate": 0.00018469862923853873, "loss": 0.0131, "step": 152360 }, { "epoch": 0.77, "learning_rate": 0.0001846910615455247, "loss": 0.0107, "step": 152370 }, { "epoch": 0.77, "learning_rate": 0.0001846834938525107, "loss": 0.0103, "step": 152380 }, { "epoch": 0.77, "learning_rate": 0.0001846759261594967, "loss": 0.0149, "step": 152390 }, { "epoch": 0.77, "learning_rate": 0.00018466835846648268, "loss": 0.0123, "step": 152400 }, { "epoch": 0.77, "learning_rate": 0.00018466079077346866, "loss": 0.0113, "step": 152410 }, { "epoch": 0.77, "learning_rate": 0.00018465322308045467, "loss": 0.0129, "step": 152420 }, { "epoch": 0.77, "learning_rate": 0.00018464565538744065, "loss": 0.0164, "step": 152430 }, { "epoch": 0.77, "learning_rate": 0.00018463808769442663, "loss": 0.0129, "step": 152440 }, { "epoch": 0.77, "learning_rate": 0.00018463052000141264, "loss": 0.014, "step": 152450 }, { "epoch": 0.77, "learning_rate": 0.00018462295230839862, "loss": 0.0125, "step": 152460 }, { "epoch": 0.77, "learning_rate": 0.0001846153846153846, "loss": 0.0141, "step": 152470 }, { "epoch": 0.77, "learning_rate": 0.0001846078169223706, "loss": 0.0139, "step": 152480 }, { "epoch": 0.77, "learning_rate": 0.0001846002492293566, "loss": 0.0225, "step": 152490 }, { "epoch": 0.77, "learning_rate": 0.00018459268153634258, "loss": 0.0156, "step": 152500 }, { "epoch": 0.77, "learning_rate": 0.00018458511384332856, "loss": 0.0118, "step": 152510 }, { "epoch": 0.77, "learning_rate": 0.00018457754615031457, "loss": 0.0132, "step": 152520 }, { "epoch": 0.77, "learning_rate": 0.00018456997845730055, "loss": 0.0178, "step": 152530 }, { "epoch": 0.77, "learning_rate": 0.00018456241076428653, "loss": 0.0088, "step": 152540 }, { "epoch": 0.77, "learning_rate": 0.00018455484307127254, "loss": 0.0104, "step": 152550 }, { "epoch": 0.77, "learning_rate": 0.00018454727537825852, "loss": 0.0112, "step": 152560 }, { "epoch": 0.77, "learning_rate": 0.0001845397076852445, "loss": 0.0143, "step": 152570 }, { "epoch": 0.77, "learning_rate": 0.0001845321399922305, "loss": 0.0126, "step": 152580 }, { "epoch": 0.77, "learning_rate": 0.0001845245722992165, "loss": 0.0107, "step": 152590 }, { "epoch": 0.77, "learning_rate": 0.00018451700460620247, "loss": 0.0125, "step": 152600 }, { "epoch": 0.77, "learning_rate": 0.00018450943691318848, "loss": 0.0116, "step": 152610 }, { "epoch": 0.77, "learning_rate": 0.00018450186922017446, "loss": 0.0143, "step": 152620 }, { "epoch": 0.77, "learning_rate": 0.00018449430152716044, "loss": 0.0144, "step": 152630 }, { "epoch": 0.77, "learning_rate": 0.00018448673383414643, "loss": 0.0101, "step": 152640 }, { "epoch": 0.77, "learning_rate": 0.00018447916614113243, "loss": 0.0143, "step": 152650 }, { "epoch": 0.77, "learning_rate": 0.00018447159844811842, "loss": 0.0116, "step": 152660 }, { "epoch": 0.77, "learning_rate": 0.0001844640307551044, "loss": 0.0124, "step": 152670 }, { "epoch": 0.77, "learning_rate": 0.0001844564630620904, "loss": 0.0126, "step": 152680 }, { "epoch": 0.77, "learning_rate": 0.0001844488953690764, "loss": 0.0152, "step": 152690 }, { "epoch": 0.77, "learning_rate": 0.00018444132767606237, "loss": 0.0134, "step": 152700 }, { "epoch": 0.77, "learning_rate": 0.00018443375998304838, "loss": 0.01, "step": 152710 }, { "epoch": 0.77, "learning_rate": 0.00018442619229003433, "loss": 0.0135, "step": 152720 }, { "epoch": 0.77, "learning_rate": 0.0001844186245970203, "loss": 0.0117, "step": 152730 }, { "epoch": 0.77, "learning_rate": 0.0001844110569040063, "loss": 0.0171, "step": 152740 }, { "epoch": 0.77, "learning_rate": 0.0001844034892109923, "loss": 0.012, "step": 152750 }, { "epoch": 0.77, "learning_rate": 0.00018439592151797828, "loss": 0.0111, "step": 152760 }, { "epoch": 0.77, "learning_rate": 0.00018438835382496427, "loss": 0.0111, "step": 152770 }, { "epoch": 0.77, "learning_rate": 0.00018438078613195027, "loss": 0.0114, "step": 152780 }, { "epoch": 0.77, "learning_rate": 0.00018437321843893626, "loss": 0.0123, "step": 152790 }, { "epoch": 0.77, "learning_rate": 0.00018436565074592224, "loss": 0.0127, "step": 152800 }, { "epoch": 0.77, "learning_rate": 0.00018435808305290825, "loss": 0.0121, "step": 152810 }, { "epoch": 0.77, "learning_rate": 0.00018435051535989423, "loss": 0.0137, "step": 152820 }, { "epoch": 0.77, "learning_rate": 0.0001843429476668802, "loss": 0.0105, "step": 152830 }, { "epoch": 0.77, "learning_rate": 0.00018433537997386622, "loss": 0.0113, "step": 152840 }, { "epoch": 0.77, "learning_rate": 0.0001843278122808522, "loss": 0.0186, "step": 152850 }, { "epoch": 0.77, "learning_rate": 0.00018432024458783818, "loss": 0.0117, "step": 152860 }, { "epoch": 0.77, "learning_rate": 0.00018431267689482416, "loss": 0.0124, "step": 152870 }, { "epoch": 0.77, "learning_rate": 0.00018430510920181017, "loss": 0.0127, "step": 152880 }, { "epoch": 0.77, "learning_rate": 0.00018429754150879615, "loss": 0.0141, "step": 152890 }, { "epoch": 0.77, "learning_rate": 0.00018428997381578213, "loss": 0.0143, "step": 152900 }, { "epoch": 0.77, "learning_rate": 0.00018428240612276814, "loss": 0.0147, "step": 152910 }, { "epoch": 0.77, "learning_rate": 0.00018427483842975412, "loss": 0.0119, "step": 152920 }, { "epoch": 0.77, "learning_rate": 0.0001842672707367401, "loss": 0.0155, "step": 152930 }, { "epoch": 0.77, "learning_rate": 0.0001842597030437261, "loss": 0.0131, "step": 152940 }, { "epoch": 0.77, "learning_rate": 0.0001842521353507121, "loss": 0.0135, "step": 152950 }, { "epoch": 0.77, "learning_rate": 0.00018424456765769808, "loss": 0.011, "step": 152960 }, { "epoch": 0.77, "learning_rate": 0.00018423699996468408, "loss": 0.0125, "step": 152970 }, { "epoch": 0.77, "learning_rate": 0.00018422943227167007, "loss": 0.0144, "step": 152980 }, { "epoch": 0.77, "learning_rate": 0.00018422186457865605, "loss": 0.0123, "step": 152990 }, { "epoch": 0.77, "learning_rate": 0.00018421429688564206, "loss": 0.0142, "step": 153000 }, { "epoch": 0.77, "eval_cer": 0.9144702559031622, "eval_loss": 0.008783689700067043, "eval_runtime": 116.6617, "eval_samples_per_second": 17.144, "eval_steps_per_second": 4.286, "step": 153000 }, { "epoch": 0.77, "learning_rate": 0.00018420672919262804, "loss": 0.0109, "step": 153010 }, { "epoch": 0.77, "learning_rate": 0.00018419916149961402, "loss": 0.0154, "step": 153020 }, { "epoch": 0.77, "learning_rate": 0.0001841915938066, "loss": 0.0121, "step": 153030 }, { "epoch": 0.77, "learning_rate": 0.000184184026113586, "loss": 0.0115, "step": 153040 }, { "epoch": 0.77, "learning_rate": 0.000184176458420572, "loss": 0.0118, "step": 153050 }, { "epoch": 0.77, "learning_rate": 0.00018416889072755797, "loss": 0.0121, "step": 153060 }, { "epoch": 0.77, "learning_rate": 0.00018416132303454398, "loss": 0.0127, "step": 153070 }, { "epoch": 0.77, "learning_rate": 0.00018415375534152996, "loss": 0.0151, "step": 153080 }, { "epoch": 0.77, "learning_rate": 0.00018414618764851594, "loss": 0.0142, "step": 153090 }, { "epoch": 0.77, "learning_rate": 0.00018413861995550195, "loss": 0.0153, "step": 153100 }, { "epoch": 0.77, "learning_rate": 0.00018413105226248793, "loss": 0.0132, "step": 153110 }, { "epoch": 0.77, "learning_rate": 0.00018412348456947391, "loss": 0.012, "step": 153120 }, { "epoch": 0.77, "learning_rate": 0.00018411591687645992, "loss": 0.0117, "step": 153130 }, { "epoch": 0.77, "learning_rate": 0.0001841083491834459, "loss": 0.0112, "step": 153140 }, { "epoch": 0.77, "learning_rate": 0.00018410078149043189, "loss": 0.0183, "step": 153150 }, { "epoch": 0.77, "learning_rate": 0.0001840932137974179, "loss": 0.0155, "step": 153160 }, { "epoch": 0.77, "learning_rate": 0.00018408564610440388, "loss": 0.016, "step": 153170 }, { "epoch": 0.77, "learning_rate": 0.00018407807841138986, "loss": 0.0132, "step": 153180 }, { "epoch": 0.77, "learning_rate": 0.00018407051071837584, "loss": 0.0181, "step": 153190 }, { "epoch": 0.77, "learning_rate": 0.00018406294302536185, "loss": 0.0173, "step": 153200 }, { "epoch": 0.77, "learning_rate": 0.00018405537533234783, "loss": 0.018, "step": 153210 }, { "epoch": 0.77, "learning_rate": 0.0001840478076393338, "loss": 0.0161, "step": 153220 }, { "epoch": 0.77, "learning_rate": 0.00018404023994631982, "loss": 0.0144, "step": 153230 }, { "epoch": 0.77, "learning_rate": 0.0001840326722533058, "loss": 0.015, "step": 153240 }, { "epoch": 0.77, "learning_rate": 0.00018402510456029178, "loss": 0.0151, "step": 153250 }, { "epoch": 0.77, "learning_rate": 0.0001840175368672778, "loss": 0.0126, "step": 153260 }, { "epoch": 0.77, "learning_rate": 0.00018400996917426377, "loss": 0.0133, "step": 153270 }, { "epoch": 0.77, "learning_rate": 0.00018400240148124975, "loss": 0.0149, "step": 153280 }, { "epoch": 0.77, "learning_rate": 0.00018399483378823576, "loss": 0.0156, "step": 153290 }, { "epoch": 0.77, "learning_rate": 0.00018398726609522174, "loss": 0.0117, "step": 153300 }, { "epoch": 0.77, "learning_rate": 0.00018397969840220772, "loss": 0.0125, "step": 153310 }, { "epoch": 0.77, "learning_rate": 0.00018397213070919373, "loss": 0.0121, "step": 153320 }, { "epoch": 0.77, "learning_rate": 0.00018396456301617971, "loss": 0.0136, "step": 153330 }, { "epoch": 0.77, "learning_rate": 0.0001839569953231657, "loss": 0.0131, "step": 153340 }, { "epoch": 0.77, "learning_rate": 0.0001839494276301517, "loss": 0.012, "step": 153350 }, { "epoch": 0.77, "learning_rate": 0.00018394185993713769, "loss": 0.0146, "step": 153360 }, { "epoch": 0.77, "learning_rate": 0.00018393429224412367, "loss": 0.0115, "step": 153370 }, { "epoch": 0.77, "learning_rate": 0.00018392672455110965, "loss": 0.0106, "step": 153380 }, { "epoch": 0.77, "learning_rate": 0.00018391915685809566, "loss": 0.0102, "step": 153390 }, { "epoch": 0.77, "learning_rate": 0.00018391158916508164, "loss": 0.0142, "step": 153400 }, { "epoch": 0.77, "learning_rate": 0.00018390402147206762, "loss": 0.0135, "step": 153410 }, { "epoch": 0.77, "learning_rate": 0.00018389645377905363, "loss": 0.0128, "step": 153420 }, { "epoch": 0.77, "learning_rate": 0.0001838888860860396, "loss": 0.0129, "step": 153430 }, { "epoch": 0.77, "learning_rate": 0.0001838813183930256, "loss": 0.0138, "step": 153440 }, { "epoch": 0.77, "learning_rate": 0.0001838737507000116, "loss": 0.0145, "step": 153450 }, { "epoch": 0.77, "learning_rate": 0.00018386618300699758, "loss": 0.0112, "step": 153460 }, { "epoch": 0.77, "learning_rate": 0.00018385861531398356, "loss": 0.0088, "step": 153470 }, { "epoch": 0.77, "learning_rate": 0.00018385104762096957, "loss": 0.0178, "step": 153480 }, { "epoch": 0.77, "learning_rate": 0.00018384347992795555, "loss": 0.017, "step": 153490 }, { "epoch": 0.77, "learning_rate": 0.00018383591223494153, "loss": 0.012, "step": 153500 }, { "epoch": 0.77, "learning_rate": 0.00018382834454192754, "loss": 0.0136, "step": 153510 }, { "epoch": 0.77, "learning_rate": 0.00018382077684891352, "loss": 0.0135, "step": 153520 }, { "epoch": 0.77, "learning_rate": 0.0001838132091558995, "loss": 0.0123, "step": 153530 }, { "epoch": 0.77, "learning_rate": 0.0001838056414628855, "loss": 0.0118, "step": 153540 }, { "epoch": 0.77, "learning_rate": 0.0001837980737698715, "loss": 0.0128, "step": 153550 }, { "epoch": 0.77, "learning_rate": 0.00018379050607685748, "loss": 0.0107, "step": 153560 }, { "epoch": 0.77, "learning_rate": 0.00018378293838384346, "loss": 0.0158, "step": 153570 }, { "epoch": 0.77, "learning_rate": 0.00018377537069082947, "loss": 0.0121, "step": 153580 }, { "epoch": 0.77, "learning_rate": 0.00018376780299781545, "loss": 0.0098, "step": 153590 }, { "epoch": 0.77, "learning_rate": 0.00018376023530480143, "loss": 0.0156, "step": 153600 }, { "epoch": 0.77, "learning_rate": 0.00018375266761178744, "loss": 0.0129, "step": 153610 }, { "epoch": 0.78, "learning_rate": 0.00018374509991877342, "loss": 0.0095, "step": 153620 }, { "epoch": 0.78, "learning_rate": 0.0001837375322257594, "loss": 0.0139, "step": 153630 }, { "epoch": 0.78, "learning_rate": 0.0001837299645327454, "loss": 0.0128, "step": 153640 }, { "epoch": 0.78, "learning_rate": 0.0001837223968397314, "loss": 0.0146, "step": 153650 }, { "epoch": 0.78, "learning_rate": 0.00018371482914671737, "loss": 0.0122, "step": 153660 }, { "epoch": 0.78, "learning_rate": 0.00018370726145370338, "loss": 0.0142, "step": 153670 }, { "epoch": 0.78, "learning_rate": 0.00018369969376068936, "loss": 0.0119, "step": 153680 }, { "epoch": 0.78, "learning_rate": 0.00018369212606767534, "loss": 0.0089, "step": 153690 }, { "epoch": 0.78, "learning_rate": 0.00018368455837466133, "loss": 0.011, "step": 153700 }, { "epoch": 0.78, "learning_rate": 0.00018367699068164733, "loss": 0.0145, "step": 153710 }, { "epoch": 0.78, "learning_rate": 0.00018366942298863332, "loss": 0.0122, "step": 153720 }, { "epoch": 0.78, "learning_rate": 0.0001836618552956193, "loss": 0.0124, "step": 153730 }, { "epoch": 0.78, "learning_rate": 0.0001836542876026053, "loss": 0.0126, "step": 153740 }, { "epoch": 0.78, "learning_rate": 0.0001836467199095913, "loss": 0.0112, "step": 153750 }, { "epoch": 0.78, "learning_rate": 0.00018363915221657727, "loss": 0.0137, "step": 153760 }, { "epoch": 0.78, "learning_rate": 0.00018363158452356328, "loss": 0.011, "step": 153770 }, { "epoch": 0.78, "learning_rate": 0.00018362401683054926, "loss": 0.0143, "step": 153780 }, { "epoch": 0.78, "learning_rate": 0.00018361644913753524, "loss": 0.0137, "step": 153790 }, { "epoch": 0.78, "learning_rate": 0.00018360888144452125, "loss": 0.0131, "step": 153800 }, { "epoch": 0.78, "learning_rate": 0.00018360131375150723, "loss": 0.0101, "step": 153810 }, { "epoch": 0.78, "learning_rate": 0.0001835937460584932, "loss": 0.0145, "step": 153820 }, { "epoch": 0.78, "learning_rate": 0.00018358617836547922, "loss": 0.0116, "step": 153830 }, { "epoch": 0.78, "learning_rate": 0.0001835786106724652, "loss": 0.0104, "step": 153840 }, { "epoch": 0.78, "learning_rate": 0.00018357104297945118, "loss": 0.0114, "step": 153850 }, { "epoch": 0.78, "learning_rate": 0.0001835634752864372, "loss": 0.0122, "step": 153860 }, { "epoch": 0.78, "learning_rate": 0.00018355590759342317, "loss": 0.0109, "step": 153870 }, { "epoch": 0.78, "learning_rate": 0.00018354833990040915, "loss": 0.0132, "step": 153880 }, { "epoch": 0.78, "learning_rate": 0.00018354077220739514, "loss": 0.0143, "step": 153890 }, { "epoch": 0.78, "learning_rate": 0.00018353320451438114, "loss": 0.0126, "step": 153900 }, { "epoch": 0.78, "learning_rate": 0.00018352563682136713, "loss": 0.0112, "step": 153910 }, { "epoch": 0.78, "learning_rate": 0.0001835180691283531, "loss": 0.01, "step": 153920 }, { "epoch": 0.78, "learning_rate": 0.00018351050143533912, "loss": 0.0111, "step": 153930 }, { "epoch": 0.78, "learning_rate": 0.0001835029337423251, "loss": 0.0125, "step": 153940 }, { "epoch": 0.78, "learning_rate": 0.00018349536604931108, "loss": 0.0126, "step": 153950 }, { "epoch": 0.78, "learning_rate": 0.0001834877983562971, "loss": 0.0158, "step": 153960 }, { "epoch": 0.78, "learning_rate": 0.00018348023066328304, "loss": 0.0129, "step": 153970 }, { "epoch": 0.78, "learning_rate": 0.00018347266297026902, "loss": 0.0126, "step": 153980 }, { "epoch": 0.78, "learning_rate": 0.000183465095277255, "loss": 0.0096, "step": 153990 }, { "epoch": 0.78, "learning_rate": 0.000183457527584241, "loss": 0.0128, "step": 154000 }, { "epoch": 0.78, "eval_cer": 0.9144789894682909, "eval_loss": 0.008818663656711578, "eval_runtime": 116.7061, "eval_samples_per_second": 17.137, "eval_steps_per_second": 4.284, "step": 154000 }, { "epoch": 0.78, "learning_rate": 0.000183449959891227, "loss": 0.011, "step": 154010 }, { "epoch": 0.78, "learning_rate": 0.00018344239219821298, "loss": 0.0127, "step": 154020 }, { "epoch": 0.78, "learning_rate": 0.00018343482450519898, "loss": 0.0111, "step": 154030 }, { "epoch": 0.78, "learning_rate": 0.00018342725681218497, "loss": 0.0127, "step": 154040 }, { "epoch": 0.78, "learning_rate": 0.00018341968911917095, "loss": 0.0114, "step": 154050 }, { "epoch": 0.78, "learning_rate": 0.00018341212142615696, "loss": 0.0101, "step": 154060 }, { "epoch": 0.78, "learning_rate": 0.00018340455373314294, "loss": 0.0143, "step": 154070 }, { "epoch": 0.78, "learning_rate": 0.00018339698604012892, "loss": 0.013, "step": 154080 }, { "epoch": 0.78, "learning_rate": 0.0001833894183471149, "loss": 0.0121, "step": 154090 }, { "epoch": 0.78, "learning_rate": 0.0001833818506541009, "loss": 0.0158, "step": 154100 }, { "epoch": 0.78, "learning_rate": 0.0001833742829610869, "loss": 0.013, "step": 154110 }, { "epoch": 0.78, "learning_rate": 0.00018336671526807287, "loss": 0.0161, "step": 154120 }, { "epoch": 0.78, "learning_rate": 0.00018335914757505888, "loss": 0.0153, "step": 154130 }, { "epoch": 0.78, "learning_rate": 0.00018335157988204486, "loss": 0.0163, "step": 154140 }, { "epoch": 0.78, "learning_rate": 0.00018334401218903084, "loss": 0.014, "step": 154150 }, { "epoch": 0.78, "learning_rate": 0.00018333644449601685, "loss": 0.011, "step": 154160 }, { "epoch": 0.78, "learning_rate": 0.00018332887680300283, "loss": 0.0134, "step": 154170 }, { "epoch": 0.78, "learning_rate": 0.00018332130910998881, "loss": 0.0101, "step": 154180 }, { "epoch": 0.78, "learning_rate": 0.00018331374141697482, "loss": 0.014, "step": 154190 }, { "epoch": 0.78, "learning_rate": 0.0001833061737239608, "loss": 0.0103, "step": 154200 }, { "epoch": 0.78, "learning_rate": 0.00018329860603094679, "loss": 0.0127, "step": 154210 }, { "epoch": 0.78, "learning_rate": 0.0001832910383379328, "loss": 0.0098, "step": 154220 }, { "epoch": 0.78, "learning_rate": 0.00018328347064491878, "loss": 0.0135, "step": 154230 }, { "epoch": 0.78, "learning_rate": 0.00018327590295190476, "loss": 0.012, "step": 154240 }, { "epoch": 0.78, "learning_rate": 0.00018326833525889077, "loss": 0.0125, "step": 154250 }, { "epoch": 0.78, "learning_rate": 0.00018326076756587675, "loss": 0.0116, "step": 154260 }, { "epoch": 0.78, "learning_rate": 0.00018325319987286273, "loss": 0.0137, "step": 154270 }, { "epoch": 0.78, "learning_rate": 0.0001832456321798487, "loss": 0.0114, "step": 154280 }, { "epoch": 0.78, "learning_rate": 0.00018323806448683472, "loss": 0.0127, "step": 154290 }, { "epoch": 0.78, "learning_rate": 0.0001832304967938207, "loss": 0.0126, "step": 154300 }, { "epoch": 0.78, "learning_rate": 0.00018322292910080668, "loss": 0.0166, "step": 154310 }, { "epoch": 0.78, "learning_rate": 0.0001832153614077927, "loss": 0.0135, "step": 154320 }, { "epoch": 0.78, "learning_rate": 0.00018320779371477867, "loss": 0.0116, "step": 154330 }, { "epoch": 0.78, "learning_rate": 0.00018320022602176465, "loss": 0.0122, "step": 154340 }, { "epoch": 0.78, "learning_rate": 0.00018319265832875066, "loss": 0.0115, "step": 154350 }, { "epoch": 0.78, "learning_rate": 0.00018318509063573664, "loss": 0.0096, "step": 154360 }, { "epoch": 0.78, "learning_rate": 0.00018317752294272262, "loss": 0.0114, "step": 154370 }, { "epoch": 0.78, "learning_rate": 0.00018316995524970863, "loss": 0.0115, "step": 154380 }, { "epoch": 0.78, "learning_rate": 0.00018316238755669461, "loss": 0.0101, "step": 154390 }, { "epoch": 0.78, "learning_rate": 0.0001831548198636806, "loss": 0.0109, "step": 154400 }, { "epoch": 0.78, "learning_rate": 0.0001831472521706666, "loss": 0.0094, "step": 154410 }, { "epoch": 0.78, "learning_rate": 0.00018313968447765259, "loss": 0.0119, "step": 154420 }, { "epoch": 0.78, "learning_rate": 0.00018313211678463857, "loss": 0.0128, "step": 154430 }, { "epoch": 0.78, "learning_rate": 0.00018312454909162455, "loss": 0.0131, "step": 154440 }, { "epoch": 0.78, "learning_rate": 0.00018311698139861056, "loss": 0.0112, "step": 154450 }, { "epoch": 0.78, "learning_rate": 0.00018310941370559654, "loss": 0.0107, "step": 154460 }, { "epoch": 0.78, "learning_rate": 0.00018310184601258252, "loss": 0.0141, "step": 154470 }, { "epoch": 0.78, "learning_rate": 0.00018309427831956853, "loss": 0.0112, "step": 154480 }, { "epoch": 0.78, "learning_rate": 0.0001830867106265545, "loss": 0.0154, "step": 154490 }, { "epoch": 0.78, "learning_rate": 0.0001830791429335405, "loss": 0.0103, "step": 154500 }, { "epoch": 0.78, "learning_rate": 0.0001830715752405265, "loss": 0.0175, "step": 154510 }, { "epoch": 0.78, "learning_rate": 0.00018306400754751248, "loss": 0.0152, "step": 154520 }, { "epoch": 0.78, "learning_rate": 0.00018305643985449846, "loss": 0.0131, "step": 154530 }, { "epoch": 0.78, "learning_rate": 0.00018304887216148447, "loss": 0.013, "step": 154540 }, { "epoch": 0.78, "learning_rate": 0.00018304130446847045, "loss": 0.0145, "step": 154550 }, { "epoch": 0.78, "learning_rate": 0.00018303373677545643, "loss": 0.0134, "step": 154560 }, { "epoch": 0.78, "learning_rate": 0.00018302616908244244, "loss": 0.0129, "step": 154570 }, { "epoch": 0.78, "learning_rate": 0.00018301860138942842, "loss": 0.0149, "step": 154580 }, { "epoch": 0.78, "learning_rate": 0.0001830110336964144, "loss": 0.0105, "step": 154590 }, { "epoch": 0.78, "learning_rate": 0.0001830034660034004, "loss": 0.0161, "step": 154600 }, { "epoch": 0.78, "learning_rate": 0.0001829958983103864, "loss": 0.0127, "step": 154610 }, { "epoch": 0.78, "learning_rate": 0.00018298833061737238, "loss": 0.0137, "step": 154620 }, { "epoch": 0.78, "learning_rate": 0.00018298076292435836, "loss": 0.012, "step": 154630 }, { "epoch": 0.78, "learning_rate": 0.00018297319523134437, "loss": 0.0128, "step": 154640 }, { "epoch": 0.78, "learning_rate": 0.00018296562753833035, "loss": 0.0123, "step": 154650 }, { "epoch": 0.78, "learning_rate": 0.00018295805984531633, "loss": 0.0124, "step": 154660 }, { "epoch": 0.78, "learning_rate": 0.00018295049215230234, "loss": 0.0133, "step": 154670 }, { "epoch": 0.78, "learning_rate": 0.00018294292445928832, "loss": 0.013, "step": 154680 }, { "epoch": 0.78, "learning_rate": 0.0001829353567662743, "loss": 0.0147, "step": 154690 }, { "epoch": 0.78, "learning_rate": 0.0001829277890732603, "loss": 0.0109, "step": 154700 }, { "epoch": 0.78, "learning_rate": 0.0001829202213802463, "loss": 0.0137, "step": 154710 }, { "epoch": 0.78, "learning_rate": 0.00018291265368723227, "loss": 0.0109, "step": 154720 }, { "epoch": 0.78, "learning_rate": 0.00018290508599421828, "loss": 0.0137, "step": 154730 }, { "epoch": 0.78, "learning_rate": 0.00018289751830120426, "loss": 0.0115, "step": 154740 }, { "epoch": 0.78, "learning_rate": 0.00018288995060819024, "loss": 0.0111, "step": 154750 }, { "epoch": 0.78, "learning_rate": 0.00018288238291517625, "loss": 0.0122, "step": 154760 }, { "epoch": 0.78, "learning_rate": 0.00018287481522216223, "loss": 0.011, "step": 154770 }, { "epoch": 0.78, "learning_rate": 0.00018286724752914822, "loss": 0.0113, "step": 154780 }, { "epoch": 0.78, "learning_rate": 0.0001828596798361342, "loss": 0.0159, "step": 154790 }, { "epoch": 0.78, "learning_rate": 0.0001828521121431202, "loss": 0.0114, "step": 154800 }, { "epoch": 0.78, "learning_rate": 0.0001828445444501062, "loss": 0.0116, "step": 154810 }, { "epoch": 0.78, "learning_rate": 0.00018283697675709217, "loss": 0.0101, "step": 154820 }, { "epoch": 0.78, "learning_rate": 0.00018282940906407818, "loss": 0.0133, "step": 154830 }, { "epoch": 0.78, "learning_rate": 0.00018282184137106416, "loss": 0.0113, "step": 154840 }, { "epoch": 0.78, "learning_rate": 0.00018281427367805014, "loss": 0.013, "step": 154850 }, { "epoch": 0.78, "learning_rate": 0.00018280670598503615, "loss": 0.0141, "step": 154860 }, { "epoch": 0.78, "learning_rate": 0.00018279913829202213, "loss": 0.0136, "step": 154870 }, { "epoch": 0.78, "learning_rate": 0.0001827915705990081, "loss": 0.0107, "step": 154880 }, { "epoch": 0.78, "learning_rate": 0.00018278400290599412, "loss": 0.0158, "step": 154890 }, { "epoch": 0.78, "learning_rate": 0.0001827764352129801, "loss": 0.0116, "step": 154900 }, { "epoch": 0.78, "learning_rate": 0.00018276886751996608, "loss": 0.0114, "step": 154910 }, { "epoch": 0.78, "learning_rate": 0.0001827612998269521, "loss": 0.0124, "step": 154920 }, { "epoch": 0.78, "learning_rate": 0.00018275373213393807, "loss": 0.0138, "step": 154930 }, { "epoch": 0.78, "learning_rate": 0.00018274616444092405, "loss": 0.0102, "step": 154940 }, { "epoch": 0.78, "learning_rate": 0.00018273859674791004, "loss": 0.013, "step": 154950 }, { "epoch": 0.78, "learning_rate": 0.00018273102905489604, "loss": 0.0128, "step": 154960 }, { "epoch": 0.78, "learning_rate": 0.00018272346136188203, "loss": 0.0162, "step": 154970 }, { "epoch": 0.78, "learning_rate": 0.000182715893668868, "loss": 0.014, "step": 154980 }, { "epoch": 0.78, "learning_rate": 0.00018270832597585402, "loss": 0.0116, "step": 154990 }, { "epoch": 0.78, "learning_rate": 0.00018270075828284, "loss": 0.012, "step": 155000 }, { "epoch": 0.78, "eval_cer": 0.9144731670915385, "eval_loss": 0.009108257479965687, "eval_runtime": 116.7273, "eval_samples_per_second": 17.134, "eval_steps_per_second": 4.283, "step": 155000 }, { "epoch": 0.78, "learning_rate": 0.00018269319058982598, "loss": 0.0115, "step": 155010 }, { "epoch": 0.78, "learning_rate": 0.000182685622896812, "loss": 0.0206, "step": 155020 }, { "epoch": 0.78, "learning_rate": 0.00018267805520379797, "loss": 0.0122, "step": 155030 }, { "epoch": 0.78, "learning_rate": 0.00018267048751078395, "loss": 0.0132, "step": 155040 }, { "epoch": 0.78, "learning_rate": 0.00018266291981776996, "loss": 0.0166, "step": 155050 }, { "epoch": 0.78, "learning_rate": 0.00018265535212475594, "loss": 0.0127, "step": 155060 }, { "epoch": 0.78, "learning_rate": 0.00018264778443174192, "loss": 0.0139, "step": 155070 }, { "epoch": 0.78, "learning_rate": 0.00018264021673872793, "loss": 0.0103, "step": 155080 }, { "epoch": 0.78, "learning_rate": 0.0001826326490457139, "loss": 0.0136, "step": 155090 }, { "epoch": 0.78, "learning_rate": 0.0001826250813526999, "loss": 0.0147, "step": 155100 }, { "epoch": 0.78, "learning_rate": 0.00018261751365968587, "loss": 0.0111, "step": 155110 }, { "epoch": 0.78, "learning_rate": 0.00018260994596667188, "loss": 0.0137, "step": 155120 }, { "epoch": 0.78, "learning_rate": 0.00018260237827365786, "loss": 0.0121, "step": 155130 }, { "epoch": 0.78, "learning_rate": 0.00018259481058064385, "loss": 0.0143, "step": 155140 }, { "epoch": 0.78, "learning_rate": 0.00018258724288762985, "loss": 0.0134, "step": 155150 }, { "epoch": 0.78, "learning_rate": 0.00018257967519461584, "loss": 0.0147, "step": 155160 }, { "epoch": 0.78, "learning_rate": 0.00018257210750160182, "loss": 0.0109, "step": 155170 }, { "epoch": 0.78, "learning_rate": 0.00018256453980858783, "loss": 0.0182, "step": 155180 }, { "epoch": 0.78, "learning_rate": 0.0001825569721155738, "loss": 0.0164, "step": 155190 }, { "epoch": 0.78, "learning_rate": 0.0001825494044225598, "loss": 0.017, "step": 155200 }, { "epoch": 0.78, "learning_rate": 0.0001825418367295458, "loss": 0.012, "step": 155210 }, { "epoch": 0.78, "learning_rate": 0.00018253426903653178, "loss": 0.015, "step": 155220 }, { "epoch": 0.78, "learning_rate": 0.00018252670134351773, "loss": 0.0128, "step": 155230 }, { "epoch": 0.78, "learning_rate": 0.00018251913365050371, "loss": 0.0164, "step": 155240 }, { "epoch": 0.78, "learning_rate": 0.00018251156595748972, "loss": 0.0184, "step": 155250 }, { "epoch": 0.78, "learning_rate": 0.0001825039982644757, "loss": 0.0144, "step": 155260 }, { "epoch": 0.78, "learning_rate": 0.00018249643057146169, "loss": 0.0143, "step": 155270 }, { "epoch": 0.78, "learning_rate": 0.0001824888628784477, "loss": 0.0101, "step": 155280 }, { "epoch": 0.78, "learning_rate": 0.00018248129518543368, "loss": 0.0154, "step": 155290 }, { "epoch": 0.78, "learning_rate": 0.00018247372749241966, "loss": 0.0149, "step": 155300 }, { "epoch": 0.78, "learning_rate": 0.00018246615979940567, "loss": 0.0109, "step": 155310 }, { "epoch": 0.78, "learning_rate": 0.00018245859210639165, "loss": 0.0128, "step": 155320 }, { "epoch": 0.78, "learning_rate": 0.00018245102441337763, "loss": 0.0135, "step": 155330 }, { "epoch": 0.78, "learning_rate": 0.0001824434567203636, "loss": 0.014, "step": 155340 }, { "epoch": 0.78, "learning_rate": 0.00018243588902734962, "loss": 0.0136, "step": 155350 }, { "epoch": 0.78, "learning_rate": 0.0001824283213343356, "loss": 0.0132, "step": 155360 }, { "epoch": 0.78, "learning_rate": 0.00018242075364132158, "loss": 0.0132, "step": 155370 }, { "epoch": 0.78, "learning_rate": 0.0001824131859483076, "loss": 0.0131, "step": 155380 }, { "epoch": 0.78, "learning_rate": 0.00018240561825529357, "loss": 0.0112, "step": 155390 }, { "epoch": 0.78, "learning_rate": 0.00018239805056227955, "loss": 0.0143, "step": 155400 }, { "epoch": 0.78, "learning_rate": 0.00018239048286926556, "loss": 0.0127, "step": 155410 }, { "epoch": 0.78, "learning_rate": 0.00018238291517625154, "loss": 0.0128, "step": 155420 }, { "epoch": 0.78, "learning_rate": 0.00018237534748323752, "loss": 0.0122, "step": 155430 }, { "epoch": 0.78, "learning_rate": 0.00018236777979022353, "loss": 0.0105, "step": 155440 }, { "epoch": 0.78, "learning_rate": 0.00018236021209720951, "loss": 0.0133, "step": 155450 }, { "epoch": 0.78, "learning_rate": 0.0001823526444041955, "loss": 0.0129, "step": 155460 }, { "epoch": 0.78, "learning_rate": 0.0001823450767111815, "loss": 0.0138, "step": 155470 }, { "epoch": 0.78, "learning_rate": 0.00018233750901816749, "loss": 0.0088, "step": 155480 }, { "epoch": 0.78, "learning_rate": 0.00018232994132515347, "loss": 0.0127, "step": 155490 }, { "epoch": 0.78, "learning_rate": 0.00018232237363213945, "loss": 0.0125, "step": 155500 }, { "epoch": 0.78, "learning_rate": 0.00018231480593912546, "loss": 0.0124, "step": 155510 }, { "epoch": 0.78, "learning_rate": 0.00018230723824611144, "loss": 0.0138, "step": 155520 }, { "epoch": 0.78, "learning_rate": 0.00018229967055309742, "loss": 0.0122, "step": 155530 }, { "epoch": 0.78, "learning_rate": 0.00018229210286008343, "loss": 0.0136, "step": 155540 }, { "epoch": 0.78, "learning_rate": 0.0001822845351670694, "loss": 0.0114, "step": 155550 }, { "epoch": 0.78, "learning_rate": 0.0001822769674740554, "loss": 0.0147, "step": 155560 }, { "epoch": 0.78, "learning_rate": 0.0001822693997810414, "loss": 0.0114, "step": 155570 }, { "epoch": 0.78, "learning_rate": 0.00018226183208802738, "loss": 0.0108, "step": 155580 }, { "epoch": 0.78, "learning_rate": 0.00018225426439501336, "loss": 0.0138, "step": 155590 }, { "epoch": 0.79, "learning_rate": 0.00018224669670199937, "loss": 0.014, "step": 155600 }, { "epoch": 0.79, "learning_rate": 0.00018223912900898535, "loss": 0.0133, "step": 155610 }, { "epoch": 0.79, "learning_rate": 0.00018223156131597133, "loss": 0.0132, "step": 155620 }, { "epoch": 0.79, "learning_rate": 0.00018222399362295734, "loss": 0.0134, "step": 155630 }, { "epoch": 0.79, "learning_rate": 0.00018221642592994332, "loss": 0.0174, "step": 155640 }, { "epoch": 0.79, "learning_rate": 0.0001822088582369293, "loss": 0.013, "step": 155650 }, { "epoch": 0.79, "learning_rate": 0.00018220129054391531, "loss": 0.012, "step": 155660 }, { "epoch": 0.79, "learning_rate": 0.0001821937228509013, "loss": 0.0115, "step": 155670 }, { "epoch": 0.79, "learning_rate": 0.00018218615515788728, "loss": 0.0114, "step": 155680 }, { "epoch": 0.79, "learning_rate": 0.00018217858746487326, "loss": 0.0108, "step": 155690 }, { "epoch": 0.79, "learning_rate": 0.00018217101977185927, "loss": 0.0118, "step": 155700 }, { "epoch": 0.79, "learning_rate": 0.00018216345207884525, "loss": 0.0119, "step": 155710 }, { "epoch": 0.79, "learning_rate": 0.00018215588438583123, "loss": 0.0112, "step": 155720 }, { "epoch": 0.79, "learning_rate": 0.00018214831669281724, "loss": 0.0102, "step": 155730 }, { "epoch": 0.79, "learning_rate": 0.00018214074899980322, "loss": 0.0129, "step": 155740 }, { "epoch": 0.79, "learning_rate": 0.0001821331813067892, "loss": 0.0142, "step": 155750 }, { "epoch": 0.79, "learning_rate": 0.0001821256136137752, "loss": 0.0108, "step": 155760 }, { "epoch": 0.79, "learning_rate": 0.0001821180459207612, "loss": 0.0133, "step": 155770 }, { "epoch": 0.79, "learning_rate": 0.00018211047822774717, "loss": 0.0161, "step": 155780 }, { "epoch": 0.79, "learning_rate": 0.00018210291053473318, "loss": 0.0138, "step": 155790 }, { "epoch": 0.79, "learning_rate": 0.00018209534284171916, "loss": 0.011, "step": 155800 }, { "epoch": 0.79, "learning_rate": 0.00018208777514870514, "loss": 0.0129, "step": 155810 }, { "epoch": 0.79, "learning_rate": 0.00018208020745569115, "loss": 0.0124, "step": 155820 }, { "epoch": 0.79, "learning_rate": 0.00018207263976267713, "loss": 0.0126, "step": 155830 }, { "epoch": 0.79, "learning_rate": 0.00018206507206966312, "loss": 0.0143, "step": 155840 }, { "epoch": 0.79, "learning_rate": 0.0001820575043766491, "loss": 0.0099, "step": 155850 }, { "epoch": 0.79, "learning_rate": 0.0001820499366836351, "loss": 0.0129, "step": 155860 }, { "epoch": 0.79, "learning_rate": 0.0001820423689906211, "loss": 0.0159, "step": 155870 }, { "epoch": 0.79, "learning_rate": 0.00018203480129760707, "loss": 0.0127, "step": 155880 }, { "epoch": 0.79, "learning_rate": 0.00018202723360459308, "loss": 0.0144, "step": 155890 }, { "epoch": 0.79, "learning_rate": 0.00018201966591157906, "loss": 0.0133, "step": 155900 }, { "epoch": 0.79, "learning_rate": 0.00018201209821856504, "loss": 0.0155, "step": 155910 }, { "epoch": 0.79, "learning_rate": 0.00018200453052555105, "loss": 0.0125, "step": 155920 }, { "epoch": 0.79, "learning_rate": 0.00018199696283253703, "loss": 0.0125, "step": 155930 }, { "epoch": 0.79, "learning_rate": 0.000181989395139523, "loss": 0.0128, "step": 155940 }, { "epoch": 0.79, "learning_rate": 0.00018198182744650902, "loss": 0.0123, "step": 155950 }, { "epoch": 0.79, "learning_rate": 0.000181974259753495, "loss": 0.0128, "step": 155960 }, { "epoch": 0.79, "learning_rate": 0.00018196669206048098, "loss": 0.0139, "step": 155970 }, { "epoch": 0.79, "learning_rate": 0.000181959124367467, "loss": 0.0133, "step": 155980 }, { "epoch": 0.79, "learning_rate": 0.00018195155667445297, "loss": 0.01, "step": 155990 }, { "epoch": 0.79, "learning_rate": 0.00018194398898143895, "loss": 0.013, "step": 156000 }, { "epoch": 0.79, "eval_cer": 0.9144838414489178, "eval_loss": 0.00919434055685997, "eval_runtime": 116.631, "eval_samples_per_second": 17.148, "eval_steps_per_second": 4.287, "step": 156000 }, { "epoch": 0.79, "learning_rate": 0.00018193642128842494, "loss": 0.0116, "step": 156010 }, { "epoch": 0.79, "learning_rate": 0.00018192885359541094, "loss": 0.0135, "step": 156020 }, { "epoch": 0.79, "learning_rate": 0.00018192128590239693, "loss": 0.0128, "step": 156030 }, { "epoch": 0.79, "learning_rate": 0.0001819137182093829, "loss": 0.0144, "step": 156040 }, { "epoch": 0.79, "learning_rate": 0.00018190615051636892, "loss": 0.0157, "step": 156050 }, { "epoch": 0.79, "learning_rate": 0.0001818985828233549, "loss": 0.0149, "step": 156060 }, { "epoch": 0.79, "learning_rate": 0.00018189101513034088, "loss": 0.0116, "step": 156070 }, { "epoch": 0.79, "learning_rate": 0.0001818834474373269, "loss": 0.0124, "step": 156080 }, { "epoch": 0.79, "learning_rate": 0.00018187587974431287, "loss": 0.0116, "step": 156090 }, { "epoch": 0.79, "learning_rate": 0.00018186831205129885, "loss": 0.014, "step": 156100 }, { "epoch": 0.79, "learning_rate": 0.00018186074435828486, "loss": 0.0123, "step": 156110 }, { "epoch": 0.79, "learning_rate": 0.00018185317666527084, "loss": 0.0124, "step": 156120 }, { "epoch": 0.79, "learning_rate": 0.00018184560897225682, "loss": 0.0124, "step": 156130 }, { "epoch": 0.79, "learning_rate": 0.00018183804127924283, "loss": 0.0112, "step": 156140 }, { "epoch": 0.79, "learning_rate": 0.0001818304735862288, "loss": 0.012, "step": 156150 }, { "epoch": 0.79, "learning_rate": 0.0001818229058932148, "loss": 0.0125, "step": 156160 }, { "epoch": 0.79, "learning_rate": 0.0001818153382002008, "loss": 0.013, "step": 156170 }, { "epoch": 0.79, "learning_rate": 0.00018180777050718678, "loss": 0.0136, "step": 156180 }, { "epoch": 0.79, "learning_rate": 0.00018180020281417276, "loss": 0.0117, "step": 156190 }, { "epoch": 0.79, "learning_rate": 0.00018179263512115875, "loss": 0.0137, "step": 156200 }, { "epoch": 0.79, "learning_rate": 0.00018178506742814475, "loss": 0.0122, "step": 156210 }, { "epoch": 0.79, "learning_rate": 0.00018177749973513074, "loss": 0.0134, "step": 156220 }, { "epoch": 0.79, "learning_rate": 0.00018176993204211672, "loss": 0.0133, "step": 156230 }, { "epoch": 0.79, "learning_rate": 0.00018176236434910273, "loss": 0.0091, "step": 156240 }, { "epoch": 0.79, "learning_rate": 0.0001817547966560887, "loss": 0.0171, "step": 156250 }, { "epoch": 0.79, "learning_rate": 0.0001817472289630747, "loss": 0.0132, "step": 156260 }, { "epoch": 0.79, "learning_rate": 0.0001817396612700607, "loss": 0.0129, "step": 156270 }, { "epoch": 0.79, "learning_rate": 0.00018173209357704668, "loss": 0.0103, "step": 156280 }, { "epoch": 0.79, "learning_rate": 0.00018172452588403266, "loss": 0.014, "step": 156290 }, { "epoch": 0.79, "learning_rate": 0.00018171695819101867, "loss": 0.0107, "step": 156300 }, { "epoch": 0.79, "learning_rate": 0.00018170939049800465, "loss": 0.013, "step": 156310 }, { "epoch": 0.79, "learning_rate": 0.00018170182280499063, "loss": 0.0106, "step": 156320 }, { "epoch": 0.79, "learning_rate": 0.00018169425511197664, "loss": 0.0093, "step": 156330 }, { "epoch": 0.79, "learning_rate": 0.00018168668741896262, "loss": 0.012, "step": 156340 }, { "epoch": 0.79, "learning_rate": 0.0001816791197259486, "loss": 0.0085, "step": 156350 }, { "epoch": 0.79, "learning_rate": 0.00018167155203293459, "loss": 0.0136, "step": 156360 }, { "epoch": 0.79, "learning_rate": 0.0001816639843399206, "loss": 0.0105, "step": 156370 }, { "epoch": 0.79, "learning_rate": 0.00018165641664690657, "loss": 0.0127, "step": 156380 }, { "epoch": 0.79, "learning_rate": 0.00018164884895389256, "loss": 0.011, "step": 156390 }, { "epoch": 0.79, "learning_rate": 0.00018164128126087856, "loss": 0.01, "step": 156400 }, { "epoch": 0.79, "learning_rate": 0.00018163371356786455, "loss": 0.0115, "step": 156410 }, { "epoch": 0.79, "learning_rate": 0.00018162614587485053, "loss": 0.0155, "step": 156420 }, { "epoch": 0.79, "learning_rate": 0.00018161857818183654, "loss": 0.011, "step": 156430 }, { "epoch": 0.79, "learning_rate": 0.00018161101048882252, "loss": 0.0144, "step": 156440 }, { "epoch": 0.79, "learning_rate": 0.0001816034427958085, "loss": 0.0128, "step": 156450 }, { "epoch": 0.79, "learning_rate": 0.0001815958751027945, "loss": 0.0154, "step": 156460 }, { "epoch": 0.79, "learning_rate": 0.0001815883074097805, "loss": 0.0142, "step": 156470 }, { "epoch": 0.79, "learning_rate": 0.00018158073971676647, "loss": 0.0153, "step": 156480 }, { "epoch": 0.79, "learning_rate": 0.00018157317202375243, "loss": 0.0105, "step": 156490 }, { "epoch": 0.79, "learning_rate": 0.00018156560433073843, "loss": 0.0127, "step": 156500 }, { "epoch": 0.79, "learning_rate": 0.00018155803663772442, "loss": 0.0116, "step": 156510 }, { "epoch": 0.79, "learning_rate": 0.0001815504689447104, "loss": 0.0123, "step": 156520 }, { "epoch": 0.79, "learning_rate": 0.0001815429012516964, "loss": 0.0115, "step": 156530 }, { "epoch": 0.79, "learning_rate": 0.0001815353335586824, "loss": 0.0195, "step": 156540 }, { "epoch": 0.79, "learning_rate": 0.00018152776586566837, "loss": 0.0108, "step": 156550 }, { "epoch": 0.79, "learning_rate": 0.00018152019817265438, "loss": 0.014, "step": 156560 }, { "epoch": 0.79, "learning_rate": 0.00018151263047964036, "loss": 0.0119, "step": 156570 }, { "epoch": 0.79, "learning_rate": 0.00018150506278662634, "loss": 0.0114, "step": 156580 }, { "epoch": 0.79, "learning_rate": 0.00018149749509361232, "loss": 0.0134, "step": 156590 }, { "epoch": 0.79, "learning_rate": 0.00018148992740059833, "loss": 0.012, "step": 156600 }, { "epoch": 0.79, "learning_rate": 0.0001814823597075843, "loss": 0.0273, "step": 156610 }, { "epoch": 0.79, "learning_rate": 0.0001814747920145703, "loss": 0.0154, "step": 156620 }, { "epoch": 0.79, "learning_rate": 0.0001814672243215563, "loss": 0.0153, "step": 156630 }, { "epoch": 0.79, "learning_rate": 0.00018145965662854228, "loss": 0.0129, "step": 156640 }, { "epoch": 0.79, "learning_rate": 0.00018145208893552826, "loss": 0.0135, "step": 156650 }, { "epoch": 0.79, "learning_rate": 0.00018144452124251427, "loss": 0.0116, "step": 156660 }, { "epoch": 0.79, "learning_rate": 0.00018143695354950025, "loss": 0.0133, "step": 156670 }, { "epoch": 0.79, "learning_rate": 0.00018142938585648624, "loss": 0.0105, "step": 156680 }, { "epoch": 0.79, "learning_rate": 0.00018142181816347224, "loss": 0.0111, "step": 156690 }, { "epoch": 0.79, "learning_rate": 0.00018141425047045823, "loss": 0.0115, "step": 156700 }, { "epoch": 0.79, "learning_rate": 0.0001814066827774442, "loss": 0.0133, "step": 156710 }, { "epoch": 0.79, "learning_rate": 0.00018139911508443022, "loss": 0.0111, "step": 156720 }, { "epoch": 0.79, "learning_rate": 0.0001813915473914162, "loss": 0.0119, "step": 156730 }, { "epoch": 0.79, "learning_rate": 0.00018138397969840218, "loss": 0.0122, "step": 156740 }, { "epoch": 0.79, "learning_rate": 0.00018137641200538816, "loss": 0.014, "step": 156750 }, { "epoch": 0.79, "learning_rate": 0.00018136884431237417, "loss": 0.0091, "step": 156760 }, { "epoch": 0.79, "learning_rate": 0.00018136127661936015, "loss": 0.0101, "step": 156770 }, { "epoch": 0.79, "learning_rate": 0.00018135370892634613, "loss": 0.0108, "step": 156780 }, { "epoch": 0.79, "learning_rate": 0.00018134614123333214, "loss": 0.0159, "step": 156790 }, { "epoch": 0.79, "learning_rate": 0.00018133857354031812, "loss": 0.0131, "step": 156800 }, { "epoch": 0.79, "learning_rate": 0.0001813310058473041, "loss": 0.011, "step": 156810 }, { "epoch": 0.79, "learning_rate": 0.0001813234381542901, "loss": 0.0105, "step": 156820 }, { "epoch": 0.79, "learning_rate": 0.0001813158704612761, "loss": 0.0155, "step": 156830 }, { "epoch": 0.79, "learning_rate": 0.00018130830276826207, "loss": 0.0148, "step": 156840 }, { "epoch": 0.79, "learning_rate": 0.00018130073507524808, "loss": 0.0139, "step": 156850 }, { "epoch": 0.79, "learning_rate": 0.00018129316738223406, "loss": 0.0119, "step": 156860 }, { "epoch": 0.79, "learning_rate": 0.00018128559968922005, "loss": 0.0145, "step": 156870 }, { "epoch": 0.79, "learning_rate": 0.00018127803199620605, "loss": 0.0132, "step": 156880 }, { "epoch": 0.79, "learning_rate": 0.00018127046430319204, "loss": 0.0132, "step": 156890 }, { "epoch": 0.79, "learning_rate": 0.00018126289661017802, "loss": 0.012, "step": 156900 }, { "epoch": 0.79, "learning_rate": 0.000181255328917164, "loss": 0.012, "step": 156910 }, { "epoch": 0.79, "learning_rate": 0.00018124776122415, "loss": 0.0128, "step": 156920 }, { "epoch": 0.79, "learning_rate": 0.000181240193531136, "loss": 0.0122, "step": 156930 }, { "epoch": 0.79, "learning_rate": 0.00018123262583812197, "loss": 0.0125, "step": 156940 }, { "epoch": 0.79, "learning_rate": 0.00018122505814510798, "loss": 0.0148, "step": 156950 }, { "epoch": 0.79, "learning_rate": 0.00018121749045209396, "loss": 0.0116, "step": 156960 }, { "epoch": 0.79, "learning_rate": 0.00018120992275907994, "loss": 0.0112, "step": 156970 }, { "epoch": 0.79, "learning_rate": 0.00018120235506606595, "loss": 0.0101, "step": 156980 }, { "epoch": 0.79, "learning_rate": 0.00018119478737305193, "loss": 0.0123, "step": 156990 }, { "epoch": 0.79, "learning_rate": 0.0001811872196800379, "loss": 0.0119, "step": 157000 }, { "epoch": 0.79, "eval_cer": 0.9144983973907989, "eval_loss": 0.009071653708815575, "eval_runtime": 116.5721, "eval_samples_per_second": 17.157, "eval_steps_per_second": 4.289, "step": 157000 }, { "epoch": 0.79, "learning_rate": 0.00018117965198702392, "loss": 0.0129, "step": 157010 }, { "epoch": 0.79, "learning_rate": 0.0001811720842940099, "loss": 0.0134, "step": 157020 }, { "epoch": 0.79, "learning_rate": 0.00018116451660099588, "loss": 0.0115, "step": 157030 }, { "epoch": 0.79, "learning_rate": 0.0001811569489079819, "loss": 0.015, "step": 157040 }, { "epoch": 0.79, "learning_rate": 0.00018114938121496787, "loss": 0.0136, "step": 157050 }, { "epoch": 0.79, "learning_rate": 0.00018114181352195386, "loss": 0.0166, "step": 157060 }, { "epoch": 0.79, "learning_rate": 0.00018113424582893984, "loss": 0.0115, "step": 157070 }, { "epoch": 0.79, "learning_rate": 0.00018112667813592585, "loss": 0.0144, "step": 157080 }, { "epoch": 0.79, "learning_rate": 0.00018111911044291183, "loss": 0.019, "step": 157090 }, { "epoch": 0.79, "learning_rate": 0.0001811115427498978, "loss": 0.0121, "step": 157100 }, { "epoch": 0.79, "learning_rate": 0.00018110397505688382, "loss": 0.0156, "step": 157110 }, { "epoch": 0.79, "learning_rate": 0.0001810964073638698, "loss": 0.014, "step": 157120 }, { "epoch": 0.79, "learning_rate": 0.00018108883967085578, "loss": 0.0136, "step": 157130 }, { "epoch": 0.79, "learning_rate": 0.0001810812719778418, "loss": 0.0128, "step": 157140 }, { "epoch": 0.79, "learning_rate": 0.00018107370428482777, "loss": 0.0151, "step": 157150 }, { "epoch": 0.79, "learning_rate": 0.00018106613659181375, "loss": 0.0142, "step": 157160 }, { "epoch": 0.79, "learning_rate": 0.00018105856889879976, "loss": 0.0154, "step": 157170 }, { "epoch": 0.79, "learning_rate": 0.00018105100120578574, "loss": 0.0146, "step": 157180 }, { "epoch": 0.79, "learning_rate": 0.00018104343351277172, "loss": 0.0104, "step": 157190 }, { "epoch": 0.79, "learning_rate": 0.00018103586581975773, "loss": 0.0094, "step": 157200 }, { "epoch": 0.79, "learning_rate": 0.0001810282981267437, "loss": 0.0141, "step": 157210 }, { "epoch": 0.79, "learning_rate": 0.0001810207304337297, "loss": 0.0138, "step": 157220 }, { "epoch": 0.79, "learning_rate": 0.0001810131627407157, "loss": 0.0128, "step": 157230 }, { "epoch": 0.79, "learning_rate": 0.00018100559504770168, "loss": 0.0136, "step": 157240 }, { "epoch": 0.79, "learning_rate": 0.00018099802735468767, "loss": 0.0148, "step": 157250 }, { "epoch": 0.79, "learning_rate": 0.00018099045966167365, "loss": 0.0119, "step": 157260 }, { "epoch": 0.79, "learning_rate": 0.00018098289196865966, "loss": 0.0152, "step": 157270 }, { "epoch": 0.79, "learning_rate": 0.00018097532427564564, "loss": 0.0164, "step": 157280 }, { "epoch": 0.79, "learning_rate": 0.00018096775658263162, "loss": 0.0145, "step": 157290 }, { "epoch": 0.79, "learning_rate": 0.00018096018888961763, "loss": 0.0142, "step": 157300 }, { "epoch": 0.79, "learning_rate": 0.0001809526211966036, "loss": 0.0148, "step": 157310 }, { "epoch": 0.79, "learning_rate": 0.0001809450535035896, "loss": 0.012, "step": 157320 }, { "epoch": 0.79, "learning_rate": 0.0001809374858105756, "loss": 0.0153, "step": 157330 }, { "epoch": 0.79, "learning_rate": 0.00018092991811756158, "loss": 0.0122, "step": 157340 }, { "epoch": 0.79, "learning_rate": 0.00018092235042454756, "loss": 0.0111, "step": 157350 }, { "epoch": 0.79, "learning_rate": 0.00018091478273153357, "loss": 0.012, "step": 157360 }, { "epoch": 0.79, "learning_rate": 0.00018090721503851955, "loss": 0.0133, "step": 157370 }, { "epoch": 0.79, "learning_rate": 0.00018089964734550553, "loss": 0.0125, "step": 157380 }, { "epoch": 0.79, "learning_rate": 0.00018089207965249154, "loss": 0.0117, "step": 157390 }, { "epoch": 0.79, "learning_rate": 0.00018088451195947752, "loss": 0.0113, "step": 157400 }, { "epoch": 0.79, "learning_rate": 0.0001808769442664635, "loss": 0.0109, "step": 157410 }, { "epoch": 0.79, "learning_rate": 0.00018086937657344949, "loss": 0.0105, "step": 157420 }, { "epoch": 0.79, "learning_rate": 0.0001808618088804355, "loss": 0.0119, "step": 157430 }, { "epoch": 0.79, "learning_rate": 0.00018085424118742148, "loss": 0.0085, "step": 157440 }, { "epoch": 0.79, "learning_rate": 0.00018084667349440746, "loss": 0.0113, "step": 157450 }, { "epoch": 0.79, "learning_rate": 0.00018083910580139347, "loss": 0.0113, "step": 157460 }, { "epoch": 0.79, "learning_rate": 0.00018083153810837945, "loss": 0.0138, "step": 157470 }, { "epoch": 0.79, "learning_rate": 0.00018082397041536543, "loss": 0.011, "step": 157480 }, { "epoch": 0.79, "learning_rate": 0.00018081640272235144, "loss": 0.0103, "step": 157490 }, { "epoch": 0.79, "learning_rate": 0.00018080883502933742, "loss": 0.0204, "step": 157500 }, { "epoch": 0.79, "learning_rate": 0.0001808012673363234, "loss": 0.0136, "step": 157510 }, { "epoch": 0.79, "learning_rate": 0.0001807936996433094, "loss": 0.0155, "step": 157520 }, { "epoch": 0.79, "learning_rate": 0.0001807861319502954, "loss": 0.0137, "step": 157530 }, { "epoch": 0.79, "learning_rate": 0.00018077856425728137, "loss": 0.0102, "step": 157540 }, { "epoch": 0.79, "learning_rate": 0.00018077099656426738, "loss": 0.012, "step": 157550 }, { "epoch": 0.79, "learning_rate": 0.00018076342887125336, "loss": 0.0117, "step": 157560 }, { "epoch": 0.79, "learning_rate": 0.00018075586117823934, "loss": 0.0141, "step": 157570 }, { "epoch": 0.8, "learning_rate": 0.00018074829348522532, "loss": 0.0114, "step": 157580 }, { "epoch": 0.8, "learning_rate": 0.00018074072579221133, "loss": 0.0129, "step": 157590 }, { "epoch": 0.8, "learning_rate": 0.00018073315809919731, "loss": 0.0117, "step": 157600 }, { "epoch": 0.8, "learning_rate": 0.0001807255904061833, "loss": 0.0122, "step": 157610 }, { "epoch": 0.8, "learning_rate": 0.0001807180227131693, "loss": 0.0169, "step": 157620 }, { "epoch": 0.8, "learning_rate": 0.00018071045502015529, "loss": 0.0116, "step": 157630 }, { "epoch": 0.8, "learning_rate": 0.00018070288732714127, "loss": 0.0102, "step": 157640 }, { "epoch": 0.8, "learning_rate": 0.00018069531963412728, "loss": 0.0117, "step": 157650 }, { "epoch": 0.8, "learning_rate": 0.00018068775194111326, "loss": 0.0149, "step": 157660 }, { "epoch": 0.8, "learning_rate": 0.00018068018424809924, "loss": 0.0128, "step": 157670 }, { "epoch": 0.8, "learning_rate": 0.00018067261655508525, "loss": 0.0141, "step": 157680 }, { "epoch": 0.8, "learning_rate": 0.00018066504886207123, "loss": 0.0116, "step": 157690 }, { "epoch": 0.8, "learning_rate": 0.0001806574811690572, "loss": 0.0113, "step": 157700 }, { "epoch": 0.8, "learning_rate": 0.00018064991347604322, "loss": 0.0129, "step": 157710 }, { "epoch": 0.8, "learning_rate": 0.0001806423457830292, "loss": 0.0115, "step": 157720 }, { "epoch": 0.8, "learning_rate": 0.00018063477809001518, "loss": 0.0133, "step": 157730 }, { "epoch": 0.8, "learning_rate": 0.00018062721039700114, "loss": 0.0121, "step": 157740 }, { "epoch": 0.8, "learning_rate": 0.00018061964270398714, "loss": 0.0122, "step": 157750 }, { "epoch": 0.8, "learning_rate": 0.00018061207501097313, "loss": 0.0114, "step": 157760 }, { "epoch": 0.8, "learning_rate": 0.0001806045073179591, "loss": 0.0107, "step": 157770 }, { "epoch": 0.8, "learning_rate": 0.00018059693962494512, "loss": 0.013, "step": 157780 }, { "epoch": 0.8, "learning_rate": 0.0001805893719319311, "loss": 0.0116, "step": 157790 }, { "epoch": 0.8, "learning_rate": 0.00018058180423891708, "loss": 0.012, "step": 157800 }, { "epoch": 0.8, "learning_rate": 0.00018057423654590306, "loss": 0.0123, "step": 157810 }, { "epoch": 0.8, "learning_rate": 0.00018056666885288907, "loss": 0.0151, "step": 157820 }, { "epoch": 0.8, "learning_rate": 0.00018055910115987505, "loss": 0.0102, "step": 157830 }, { "epoch": 0.8, "learning_rate": 0.00018055153346686103, "loss": 0.013, "step": 157840 }, { "epoch": 0.8, "learning_rate": 0.00018054396577384704, "loss": 0.0131, "step": 157850 }, { "epoch": 0.8, "learning_rate": 0.00018053639808083302, "loss": 0.014, "step": 157860 }, { "epoch": 0.8, "learning_rate": 0.000180528830387819, "loss": 0.0152, "step": 157870 }, { "epoch": 0.8, "learning_rate": 0.000180521262694805, "loss": 0.012, "step": 157880 }, { "epoch": 0.8, "learning_rate": 0.000180513695001791, "loss": 0.013, "step": 157890 }, { "epoch": 0.8, "learning_rate": 0.00018050612730877697, "loss": 0.0118, "step": 157900 }, { "epoch": 0.8, "learning_rate": 0.00018049855961576298, "loss": 0.0138, "step": 157910 }, { "epoch": 0.8, "learning_rate": 0.00018049099192274896, "loss": 0.0125, "step": 157920 }, { "epoch": 0.8, "learning_rate": 0.00018048342422973495, "loss": 0.0118, "step": 157930 }, { "epoch": 0.8, "learning_rate": 0.00018047585653672095, "loss": 0.0112, "step": 157940 }, { "epoch": 0.8, "learning_rate": 0.00018046828884370694, "loss": 0.0108, "step": 157950 }, { "epoch": 0.8, "learning_rate": 0.00018046072115069292, "loss": 0.01, "step": 157960 }, { "epoch": 0.8, "learning_rate": 0.0001804531534576789, "loss": 0.0122, "step": 157970 }, { "epoch": 0.8, "learning_rate": 0.0001804455857646649, "loss": 0.0122, "step": 157980 }, { "epoch": 0.8, "learning_rate": 0.0001804380180716509, "loss": 0.0087, "step": 157990 }, { "epoch": 0.8, "learning_rate": 0.00018043045037863687, "loss": 0.0117, "step": 158000 }, { "epoch": 0.8, "eval_cer": 0.914447936792278, "eval_loss": 0.008715854957699776, "eval_runtime": 116.7633, "eval_samples_per_second": 17.129, "eval_steps_per_second": 4.282, "step": 158000 }, { "epoch": 0.8, "learning_rate": 0.00018042288268562288, "loss": 0.0173, "step": 158010 }, { "epoch": 0.8, "learning_rate": 0.00018041531499260886, "loss": 0.0147, "step": 158020 }, { "epoch": 0.8, "learning_rate": 0.00018040774729959484, "loss": 0.0137, "step": 158030 }, { "epoch": 0.8, "learning_rate": 0.00018040017960658085, "loss": 0.0125, "step": 158040 }, { "epoch": 0.8, "learning_rate": 0.00018039261191356683, "loss": 0.0133, "step": 158050 }, { "epoch": 0.8, "learning_rate": 0.0001803850442205528, "loss": 0.0181, "step": 158060 }, { "epoch": 0.8, "learning_rate": 0.00018037747652753882, "loss": 0.0132, "step": 158070 }, { "epoch": 0.8, "learning_rate": 0.0001803699088345248, "loss": 0.0106, "step": 158080 }, { "epoch": 0.8, "learning_rate": 0.00018036234114151078, "loss": 0.011, "step": 158090 }, { "epoch": 0.8, "learning_rate": 0.0001803547734484968, "loss": 0.013, "step": 158100 }, { "epoch": 0.8, "learning_rate": 0.00018034720575548277, "loss": 0.0116, "step": 158110 }, { "epoch": 0.8, "learning_rate": 0.00018033963806246876, "loss": 0.0122, "step": 158120 }, { "epoch": 0.8, "learning_rate": 0.00018033207036945476, "loss": 0.0159, "step": 158130 }, { "epoch": 0.8, "learning_rate": 0.00018032450267644075, "loss": 0.0092, "step": 158140 }, { "epoch": 0.8, "learning_rate": 0.00018031693498342673, "loss": 0.0128, "step": 158150 }, { "epoch": 0.8, "learning_rate": 0.0001803093672904127, "loss": 0.0155, "step": 158160 }, { "epoch": 0.8, "learning_rate": 0.00018030179959739872, "loss": 0.0114, "step": 158170 }, { "epoch": 0.8, "learning_rate": 0.0001802942319043847, "loss": 0.0131, "step": 158180 }, { "epoch": 0.8, "learning_rate": 0.00018028666421137068, "loss": 0.0101, "step": 158190 }, { "epoch": 0.8, "learning_rate": 0.0001802790965183567, "loss": 0.0129, "step": 158200 }, { "epoch": 0.8, "learning_rate": 0.00018027152882534267, "loss": 0.0118, "step": 158210 }, { "epoch": 0.8, "learning_rate": 0.00018026396113232865, "loss": 0.0122, "step": 158220 }, { "epoch": 0.8, "learning_rate": 0.00018025639343931466, "loss": 0.0133, "step": 158230 }, { "epoch": 0.8, "learning_rate": 0.00018024882574630064, "loss": 0.0115, "step": 158240 }, { "epoch": 0.8, "learning_rate": 0.00018024125805328662, "loss": 0.0151, "step": 158250 }, { "epoch": 0.8, "learning_rate": 0.00018023369036027263, "loss": 0.014, "step": 158260 }, { "epoch": 0.8, "learning_rate": 0.0001802261226672586, "loss": 0.0101, "step": 158270 }, { "epoch": 0.8, "learning_rate": 0.0001802185549742446, "loss": 0.0135, "step": 158280 }, { "epoch": 0.8, "learning_rate": 0.0001802109872812306, "loss": 0.0105, "step": 158290 }, { "epoch": 0.8, "learning_rate": 0.00018020341958821658, "loss": 0.0109, "step": 158300 }, { "epoch": 0.8, "learning_rate": 0.00018019585189520257, "loss": 0.013, "step": 158310 }, { "epoch": 0.8, "learning_rate": 0.00018018828420218855, "loss": 0.0156, "step": 158320 }, { "epoch": 0.8, "learning_rate": 0.00018018071650917456, "loss": 0.018, "step": 158330 }, { "epoch": 0.8, "learning_rate": 0.00018017314881616054, "loss": 0.0102, "step": 158340 }, { "epoch": 0.8, "learning_rate": 0.00018016558112314652, "loss": 0.0142, "step": 158350 }, { "epoch": 0.8, "learning_rate": 0.00018015801343013253, "loss": 0.0117, "step": 158360 }, { "epoch": 0.8, "learning_rate": 0.0001801504457371185, "loss": 0.012, "step": 158370 }, { "epoch": 0.8, "learning_rate": 0.0001801428780441045, "loss": 0.0158, "step": 158380 }, { "epoch": 0.8, "learning_rate": 0.0001801353103510905, "loss": 0.0143, "step": 158390 }, { "epoch": 0.8, "learning_rate": 0.00018012774265807648, "loss": 0.013, "step": 158400 }, { "epoch": 0.8, "learning_rate": 0.00018012017496506246, "loss": 0.0131, "step": 158410 }, { "epoch": 0.8, "learning_rate": 0.00018011260727204847, "loss": 0.0107, "step": 158420 }, { "epoch": 0.8, "learning_rate": 0.00018010503957903445, "loss": 0.0126, "step": 158430 }, { "epoch": 0.8, "learning_rate": 0.00018009747188602043, "loss": 0.0111, "step": 158440 }, { "epoch": 0.8, "learning_rate": 0.00018008990419300644, "loss": 0.0099, "step": 158450 }, { "epoch": 0.8, "learning_rate": 0.00018008233649999242, "loss": 0.0132, "step": 158460 }, { "epoch": 0.8, "learning_rate": 0.0001800747688069784, "loss": 0.0148, "step": 158470 }, { "epoch": 0.8, "learning_rate": 0.00018006720111396439, "loss": 0.0158, "step": 158480 }, { "epoch": 0.8, "learning_rate": 0.0001800596334209504, "loss": 0.0129, "step": 158490 }, { "epoch": 0.8, "learning_rate": 0.00018005206572793638, "loss": 0.0093, "step": 158500 }, { "epoch": 0.8, "learning_rate": 0.00018004449803492236, "loss": 0.0131, "step": 158510 }, { "epoch": 0.8, "learning_rate": 0.00018003693034190837, "loss": 0.0118, "step": 158520 }, { "epoch": 0.8, "learning_rate": 0.00018002936264889435, "loss": 0.0135, "step": 158530 }, { "epoch": 0.8, "learning_rate": 0.00018002179495588033, "loss": 0.0108, "step": 158540 }, { "epoch": 0.8, "learning_rate": 0.00018001422726286634, "loss": 0.0139, "step": 158550 }, { "epoch": 0.8, "learning_rate": 0.00018000665956985232, "loss": 0.0124, "step": 158560 }, { "epoch": 0.8, "learning_rate": 0.0001799990918768383, "loss": 0.0103, "step": 158570 }, { "epoch": 0.8, "learning_rate": 0.0001799915241838243, "loss": 0.0095, "step": 158580 }, { "epoch": 0.8, "learning_rate": 0.0001799839564908103, "loss": 0.0132, "step": 158590 }, { "epoch": 0.8, "learning_rate": 0.00017997638879779627, "loss": 0.0116, "step": 158600 }, { "epoch": 0.8, "learning_rate": 0.00017996882110478228, "loss": 0.013, "step": 158610 }, { "epoch": 0.8, "learning_rate": 0.00017996125341176826, "loss": 0.015, "step": 158620 }, { "epoch": 0.8, "learning_rate": 0.00017995368571875424, "loss": 0.0121, "step": 158630 }, { "epoch": 0.8, "learning_rate": 0.00017994611802574025, "loss": 0.0111, "step": 158640 }, { "epoch": 0.8, "learning_rate": 0.00017993855033272623, "loss": 0.013, "step": 158650 }, { "epoch": 0.8, "learning_rate": 0.00017993098263971221, "loss": 0.0107, "step": 158660 }, { "epoch": 0.8, "learning_rate": 0.0001799234149466982, "loss": 0.0101, "step": 158670 }, { "epoch": 0.8, "learning_rate": 0.0001799158472536842, "loss": 0.0116, "step": 158680 }, { "epoch": 0.8, "learning_rate": 0.00017990827956067019, "loss": 0.0124, "step": 158690 }, { "epoch": 0.8, "learning_rate": 0.00017990071186765617, "loss": 0.0127, "step": 158700 }, { "epoch": 0.8, "learning_rate": 0.00017989314417464218, "loss": 0.0143, "step": 158710 }, { "epoch": 0.8, "learning_rate": 0.00017988557648162816, "loss": 0.0103, "step": 158720 }, { "epoch": 0.8, "learning_rate": 0.00017987800878861414, "loss": 0.0103, "step": 158730 }, { "epoch": 0.8, "learning_rate": 0.00017987044109560015, "loss": 0.0143, "step": 158740 }, { "epoch": 0.8, "learning_rate": 0.00017986287340258613, "loss": 0.0149, "step": 158750 }, { "epoch": 0.8, "learning_rate": 0.0001798553057095721, "loss": 0.0141, "step": 158760 }, { "epoch": 0.8, "learning_rate": 0.00017984773801655812, "loss": 0.0097, "step": 158770 }, { "epoch": 0.8, "learning_rate": 0.0001798401703235441, "loss": 0.0136, "step": 158780 }, { "epoch": 0.8, "learning_rate": 0.00017983260263053008, "loss": 0.0129, "step": 158790 }, { "epoch": 0.8, "learning_rate": 0.0001798250349375161, "loss": 0.0104, "step": 158800 }, { "epoch": 0.8, "learning_rate": 0.00017981746724450207, "loss": 0.0119, "step": 158810 }, { "epoch": 0.8, "learning_rate": 0.00017980989955148805, "loss": 0.0171, "step": 158820 }, { "epoch": 0.8, "learning_rate": 0.00017980233185847403, "loss": 0.0094, "step": 158830 }, { "epoch": 0.8, "learning_rate": 0.00017979476416546004, "loss": 0.0098, "step": 158840 }, { "epoch": 0.8, "learning_rate": 0.00017978719647244602, "loss": 0.014, "step": 158850 }, { "epoch": 0.8, "learning_rate": 0.000179779628779432, "loss": 0.012, "step": 158860 }, { "epoch": 0.8, "learning_rate": 0.00017977206108641801, "loss": 0.0127, "step": 158870 }, { "epoch": 0.8, "learning_rate": 0.000179764493393404, "loss": 0.0169, "step": 158880 }, { "epoch": 0.8, "learning_rate": 0.00017975692570038998, "loss": 0.0093, "step": 158890 }, { "epoch": 0.8, "learning_rate": 0.00017974935800737599, "loss": 0.0186, "step": 158900 }, { "epoch": 0.8, "learning_rate": 0.00017974179031436197, "loss": 0.013, "step": 158910 }, { "epoch": 0.8, "learning_rate": 0.00017973422262134795, "loss": 0.0127, "step": 158920 }, { "epoch": 0.8, "learning_rate": 0.00017972665492833396, "loss": 0.0131, "step": 158930 }, { "epoch": 0.8, "learning_rate": 0.00017971908723531994, "loss": 0.013, "step": 158940 }, { "epoch": 0.8, "learning_rate": 0.00017971151954230592, "loss": 0.0113, "step": 158950 }, { "epoch": 0.8, "learning_rate": 0.00017970395184929193, "loss": 0.0098, "step": 158960 }, { "epoch": 0.8, "learning_rate": 0.0001796963841562779, "loss": 0.0105, "step": 158970 }, { "epoch": 0.8, "learning_rate": 0.0001796888164632639, "loss": 0.0108, "step": 158980 }, { "epoch": 0.8, "learning_rate": 0.00017968124877024987, "loss": 0.0124, "step": 158990 }, { "epoch": 0.8, "learning_rate": 0.00017967368107723585, "loss": 0.012, "step": 159000 }, { "epoch": 0.8, "eval_cer": 0.9144945158062973, "eval_loss": 0.00861455500125885, "eval_runtime": 116.6046, "eval_samples_per_second": 17.152, "eval_steps_per_second": 4.288, "step": 159000 }, { "epoch": 0.8, "learning_rate": 0.00017966611338422184, "loss": 0.0116, "step": 159010 }, { "epoch": 0.8, "learning_rate": 0.00017965854569120782, "loss": 0.0118, "step": 159020 }, { "epoch": 0.8, "learning_rate": 0.00017965097799819383, "loss": 0.0135, "step": 159030 }, { "epoch": 0.8, "learning_rate": 0.0001796434103051798, "loss": 0.011, "step": 159040 }, { "epoch": 0.8, "learning_rate": 0.0001796358426121658, "loss": 0.0123, "step": 159050 }, { "epoch": 0.8, "learning_rate": 0.00017962827491915177, "loss": 0.0132, "step": 159060 }, { "epoch": 0.8, "learning_rate": 0.00017962070722613778, "loss": 0.0123, "step": 159070 }, { "epoch": 0.8, "learning_rate": 0.00017961313953312376, "loss": 0.0127, "step": 159080 }, { "epoch": 0.8, "learning_rate": 0.00017960557184010974, "loss": 0.0141, "step": 159090 }, { "epoch": 0.8, "learning_rate": 0.00017959800414709575, "loss": 0.0123, "step": 159100 }, { "epoch": 0.8, "learning_rate": 0.00017959043645408173, "loss": 0.0098, "step": 159110 }, { "epoch": 0.8, "learning_rate": 0.0001795828687610677, "loss": 0.0104, "step": 159120 }, { "epoch": 0.8, "learning_rate": 0.00017957530106805372, "loss": 0.0117, "step": 159130 }, { "epoch": 0.8, "learning_rate": 0.0001795677333750397, "loss": 0.012, "step": 159140 }, { "epoch": 0.8, "learning_rate": 0.00017956016568202568, "loss": 0.0123, "step": 159150 }, { "epoch": 0.8, "learning_rate": 0.0001795525979890117, "loss": 0.0127, "step": 159160 }, { "epoch": 0.8, "learning_rate": 0.00017954503029599767, "loss": 0.0131, "step": 159170 }, { "epoch": 0.8, "learning_rate": 0.00017953746260298366, "loss": 0.0109, "step": 159180 }, { "epoch": 0.8, "learning_rate": 0.00017952989490996966, "loss": 0.0125, "step": 159190 }, { "epoch": 0.8, "learning_rate": 0.00017952232721695565, "loss": 0.0111, "step": 159200 }, { "epoch": 0.8, "learning_rate": 0.00017951475952394163, "loss": 0.0191, "step": 159210 }, { "epoch": 0.8, "learning_rate": 0.0001795071918309276, "loss": 0.0091, "step": 159220 }, { "epoch": 0.8, "learning_rate": 0.00017949962413791362, "loss": 0.0133, "step": 159230 }, { "epoch": 0.8, "learning_rate": 0.0001794920564448996, "loss": 0.0126, "step": 159240 }, { "epoch": 0.8, "learning_rate": 0.00017948448875188558, "loss": 0.012, "step": 159250 }, { "epoch": 0.8, "learning_rate": 0.0001794769210588716, "loss": 0.0124, "step": 159260 }, { "epoch": 0.8, "learning_rate": 0.00017946935336585757, "loss": 0.0115, "step": 159270 }, { "epoch": 0.8, "learning_rate": 0.00017946178567284355, "loss": 0.0193, "step": 159280 }, { "epoch": 0.8, "learning_rate": 0.00017945421797982956, "loss": 0.0141, "step": 159290 }, { "epoch": 0.8, "learning_rate": 0.00017944665028681554, "loss": 0.0113, "step": 159300 }, { "epoch": 0.8, "learning_rate": 0.00017943908259380152, "loss": 0.0142, "step": 159310 }, { "epoch": 0.8, "learning_rate": 0.00017943151490078753, "loss": 0.0114, "step": 159320 }, { "epoch": 0.8, "learning_rate": 0.0001794239472077735, "loss": 0.0111, "step": 159330 }, { "epoch": 0.8, "learning_rate": 0.0001794163795147595, "loss": 0.02, "step": 159340 }, { "epoch": 0.8, "learning_rate": 0.0001794088118217455, "loss": 0.0143, "step": 159350 }, { "epoch": 0.8, "learning_rate": 0.00017940124412873148, "loss": 0.0158, "step": 159360 }, { "epoch": 0.8, "learning_rate": 0.00017939367643571747, "loss": 0.0125, "step": 159370 }, { "epoch": 0.8, "learning_rate": 0.00017938610874270345, "loss": 0.0116, "step": 159380 }, { "epoch": 0.8, "learning_rate": 0.00017937854104968946, "loss": 0.0107, "step": 159390 }, { "epoch": 0.8, "learning_rate": 0.00017937097335667544, "loss": 0.0139, "step": 159400 }, { "epoch": 0.8, "learning_rate": 0.00017936340566366142, "loss": 0.0131, "step": 159410 }, { "epoch": 0.8, "learning_rate": 0.00017935583797064743, "loss": 0.0109, "step": 159420 }, { "epoch": 0.8, "learning_rate": 0.0001793482702776334, "loss": 0.014, "step": 159430 }, { "epoch": 0.8, "learning_rate": 0.0001793407025846194, "loss": 0.011, "step": 159440 }, { "epoch": 0.8, "learning_rate": 0.0001793331348916054, "loss": 0.0121, "step": 159450 }, { "epoch": 0.8, "learning_rate": 0.00017932556719859138, "loss": 0.0132, "step": 159460 }, { "epoch": 0.8, "learning_rate": 0.00017931799950557736, "loss": 0.0112, "step": 159470 }, { "epoch": 0.8, "learning_rate": 0.00017931043181256337, "loss": 0.0158, "step": 159480 }, { "epoch": 0.8, "learning_rate": 0.00017930286411954935, "loss": 0.0108, "step": 159490 }, { "epoch": 0.8, "learning_rate": 0.00017929529642653533, "loss": 0.0115, "step": 159500 }, { "epoch": 0.8, "learning_rate": 0.00017928772873352134, "loss": 0.013, "step": 159510 }, { "epoch": 0.8, "learning_rate": 0.00017928016104050732, "loss": 0.0108, "step": 159520 }, { "epoch": 0.8, "learning_rate": 0.0001792725933474933, "loss": 0.0116, "step": 159530 }, { "epoch": 0.8, "learning_rate": 0.0001792650256544793, "loss": 0.0105, "step": 159540 }, { "epoch": 0.8, "learning_rate": 0.0001792574579614653, "loss": 0.0127, "step": 159550 }, { "epoch": 0.8, "learning_rate": 0.00017924989026845128, "loss": 0.0139, "step": 159560 }, { "epoch": 0.81, "learning_rate": 0.00017924232257543726, "loss": 0.011, "step": 159570 }, { "epoch": 0.81, "learning_rate": 0.00017923475488242327, "loss": 0.0143, "step": 159580 }, { "epoch": 0.81, "learning_rate": 0.00017922718718940925, "loss": 0.0109, "step": 159590 }, { "epoch": 0.81, "learning_rate": 0.00017921961949639523, "loss": 0.0108, "step": 159600 }, { "epoch": 0.81, "learning_rate": 0.00017921205180338124, "loss": 0.0119, "step": 159610 }, { "epoch": 0.81, "learning_rate": 0.00017920448411036722, "loss": 0.0187, "step": 159620 }, { "epoch": 0.81, "learning_rate": 0.0001791969164173532, "loss": 0.0142, "step": 159630 }, { "epoch": 0.81, "learning_rate": 0.0001791893487243392, "loss": 0.0135, "step": 159640 }, { "epoch": 0.81, "learning_rate": 0.0001791817810313252, "loss": 0.015, "step": 159650 }, { "epoch": 0.81, "learning_rate": 0.00017917421333831117, "loss": 0.0122, "step": 159660 }, { "epoch": 0.81, "learning_rate": 0.00017916664564529718, "loss": 0.0115, "step": 159670 }, { "epoch": 0.81, "learning_rate": 0.00017915907795228316, "loss": 0.0106, "step": 159680 }, { "epoch": 0.81, "learning_rate": 0.00017915151025926914, "loss": 0.0127, "step": 159690 }, { "epoch": 0.81, "learning_rate": 0.00017914394256625515, "loss": 0.0124, "step": 159700 }, { "epoch": 0.81, "learning_rate": 0.00017913637487324113, "loss": 0.0161, "step": 159710 }, { "epoch": 0.81, "learning_rate": 0.00017912880718022711, "loss": 0.0138, "step": 159720 }, { "epoch": 0.81, "learning_rate": 0.0001791212394872131, "loss": 0.0105, "step": 159730 }, { "epoch": 0.81, "learning_rate": 0.0001791136717941991, "loss": 0.0097, "step": 159740 }, { "epoch": 0.81, "learning_rate": 0.00017910610410118509, "loss": 0.0126, "step": 159750 }, { "epoch": 0.81, "learning_rate": 0.00017909853640817107, "loss": 0.0131, "step": 159760 }, { "epoch": 0.81, "learning_rate": 0.00017909096871515708, "loss": 0.0107, "step": 159770 }, { "epoch": 0.81, "learning_rate": 0.00017908340102214306, "loss": 0.0111, "step": 159780 }, { "epoch": 0.81, "learning_rate": 0.00017907583332912904, "loss": 0.0144, "step": 159790 }, { "epoch": 0.81, "learning_rate": 0.00017906826563611505, "loss": 0.0123, "step": 159800 }, { "epoch": 0.81, "learning_rate": 0.00017906069794310103, "loss": 0.0135, "step": 159810 }, { "epoch": 0.81, "learning_rate": 0.000179053130250087, "loss": 0.0127, "step": 159820 }, { "epoch": 0.81, "learning_rate": 0.00017904556255707302, "loss": 0.0131, "step": 159830 }, { "epoch": 0.81, "learning_rate": 0.000179037994864059, "loss": 0.0153, "step": 159840 }, { "epoch": 0.81, "learning_rate": 0.00017903042717104498, "loss": 0.0109, "step": 159850 }, { "epoch": 0.81, "learning_rate": 0.000179022859478031, "loss": 0.0116, "step": 159860 }, { "epoch": 0.81, "learning_rate": 0.00017901529178501697, "loss": 0.0124, "step": 159870 }, { "epoch": 0.81, "learning_rate": 0.00017900772409200295, "loss": 0.0109, "step": 159880 }, { "epoch": 0.81, "learning_rate": 0.00017900015639898893, "loss": 0.0117, "step": 159890 }, { "epoch": 0.81, "learning_rate": 0.00017899258870597494, "loss": 0.0133, "step": 159900 }, { "epoch": 0.81, "learning_rate": 0.00017898502101296092, "loss": 0.0131, "step": 159910 }, { "epoch": 0.81, "learning_rate": 0.0001789774533199469, "loss": 0.0113, "step": 159920 }, { "epoch": 0.81, "learning_rate": 0.00017896988562693291, "loss": 0.0105, "step": 159930 }, { "epoch": 0.81, "learning_rate": 0.0001789623179339189, "loss": 0.0135, "step": 159940 }, { "epoch": 0.81, "learning_rate": 0.00017895475024090488, "loss": 0.0128, "step": 159950 }, { "epoch": 0.81, "learning_rate": 0.00017894718254789089, "loss": 0.0129, "step": 159960 }, { "epoch": 0.81, "learning_rate": 0.00017893961485487687, "loss": 0.0184, "step": 159970 }, { "epoch": 0.81, "learning_rate": 0.00017893204716186285, "loss": 0.0144, "step": 159980 }, { "epoch": 0.81, "learning_rate": 0.00017892447946884886, "loss": 0.0096, "step": 159990 }, { "epoch": 0.81, "learning_rate": 0.00017891691177583484, "loss": 0.0133, "step": 160000 }, { "epoch": 0.81, "eval_cer": 0.9144867526372941, "eval_loss": 0.008828338235616684, "eval_runtime": 116.6369, "eval_samples_per_second": 17.147, "eval_steps_per_second": 4.287, "step": 160000 }, { "epoch": 0.81, "learning_rate": 0.00017890934408282082, "loss": 0.0108, "step": 160010 }, { "epoch": 0.81, "learning_rate": 0.00017890177638980683, "loss": 0.013, "step": 160020 }, { "epoch": 0.81, "learning_rate": 0.0001788942086967928, "loss": 0.0134, "step": 160030 }, { "epoch": 0.81, "learning_rate": 0.0001788866410037788, "loss": 0.0124, "step": 160040 }, { "epoch": 0.81, "learning_rate": 0.0001788790733107648, "loss": 0.0117, "step": 160050 }, { "epoch": 0.81, "learning_rate": 0.00017887150561775078, "loss": 0.0132, "step": 160060 }, { "epoch": 0.81, "learning_rate": 0.00017886393792473676, "loss": 0.0121, "step": 160070 }, { "epoch": 0.81, "learning_rate": 0.00017885637023172274, "loss": 0.0138, "step": 160080 }, { "epoch": 0.81, "learning_rate": 0.00017884880253870875, "loss": 0.0117, "step": 160090 }, { "epoch": 0.81, "learning_rate": 0.00017884123484569473, "loss": 0.0116, "step": 160100 }, { "epoch": 0.81, "learning_rate": 0.00017883366715268072, "loss": 0.0141, "step": 160110 }, { "epoch": 0.81, "learning_rate": 0.00017882609945966672, "loss": 0.0142, "step": 160120 }, { "epoch": 0.81, "learning_rate": 0.0001788185317666527, "loss": 0.0164, "step": 160130 }, { "epoch": 0.81, "learning_rate": 0.0001788109640736387, "loss": 0.0105, "step": 160140 }, { "epoch": 0.81, "learning_rate": 0.0001788033963806247, "loss": 0.0151, "step": 160150 }, { "epoch": 0.81, "learning_rate": 0.00017879582868761068, "loss": 0.0183, "step": 160160 }, { "epoch": 0.81, "learning_rate": 0.00017878826099459666, "loss": 0.0106, "step": 160170 }, { "epoch": 0.81, "learning_rate": 0.00017878069330158267, "loss": 0.0155, "step": 160180 }, { "epoch": 0.81, "learning_rate": 0.00017877312560856865, "loss": 0.0123, "step": 160190 }, { "epoch": 0.81, "learning_rate": 0.00017876555791555463, "loss": 0.0141, "step": 160200 }, { "epoch": 0.81, "learning_rate": 0.00017875799022254064, "loss": 0.0124, "step": 160210 }, { "epoch": 0.81, "learning_rate": 0.00017875042252952662, "loss": 0.0151, "step": 160220 }, { "epoch": 0.81, "learning_rate": 0.0001787428548365126, "loss": 0.0108, "step": 160230 }, { "epoch": 0.81, "learning_rate": 0.00017873528714349858, "loss": 0.0112, "step": 160240 }, { "epoch": 0.81, "learning_rate": 0.0001787277194504846, "loss": 0.0133, "step": 160250 }, { "epoch": 0.81, "learning_rate": 0.00017872015175747055, "loss": 0.0109, "step": 160260 }, { "epoch": 0.81, "learning_rate": 0.00017871258406445653, "loss": 0.013, "step": 160270 }, { "epoch": 0.81, "learning_rate": 0.0001787050163714425, "loss": 0.0102, "step": 160280 }, { "epoch": 0.81, "learning_rate": 0.00017869744867842852, "loss": 0.0133, "step": 160290 }, { "epoch": 0.81, "learning_rate": 0.0001786898809854145, "loss": 0.0137, "step": 160300 }, { "epoch": 0.81, "learning_rate": 0.00017868231329240048, "loss": 0.0132, "step": 160310 }, { "epoch": 0.81, "learning_rate": 0.0001786747455993865, "loss": 0.013, "step": 160320 }, { "epoch": 0.81, "learning_rate": 0.00017866717790637247, "loss": 0.0109, "step": 160330 }, { "epoch": 0.81, "learning_rate": 0.00017865961021335845, "loss": 0.0129, "step": 160340 }, { "epoch": 0.81, "learning_rate": 0.00017865204252034446, "loss": 0.0106, "step": 160350 }, { "epoch": 0.81, "learning_rate": 0.00017864447482733044, "loss": 0.0135, "step": 160360 }, { "epoch": 0.81, "learning_rate": 0.00017863690713431642, "loss": 0.0097, "step": 160370 }, { "epoch": 0.81, "learning_rate": 0.00017862933944130243, "loss": 0.0139, "step": 160380 }, { "epoch": 0.81, "learning_rate": 0.0001786217717482884, "loss": 0.0092, "step": 160390 }, { "epoch": 0.81, "learning_rate": 0.0001786142040552744, "loss": 0.0143, "step": 160400 }, { "epoch": 0.81, "learning_rate": 0.0001786066363622604, "loss": 0.0108, "step": 160410 }, { "epoch": 0.81, "learning_rate": 0.00017859906866924638, "loss": 0.0146, "step": 160420 }, { "epoch": 0.81, "learning_rate": 0.00017859150097623237, "loss": 0.0118, "step": 160430 }, { "epoch": 0.81, "learning_rate": 0.00017858393328321837, "loss": 0.0136, "step": 160440 }, { "epoch": 0.81, "learning_rate": 0.00017857636559020436, "loss": 0.0121, "step": 160450 }, { "epoch": 0.81, "learning_rate": 0.00017856879789719034, "loss": 0.0147, "step": 160460 }, { "epoch": 0.81, "learning_rate": 0.00017856123020417632, "loss": 0.0117, "step": 160470 }, { "epoch": 0.81, "learning_rate": 0.00017855366251116233, "loss": 0.0129, "step": 160480 }, { "epoch": 0.81, "learning_rate": 0.0001785460948181483, "loss": 0.0139, "step": 160490 }, { "epoch": 0.81, "learning_rate": 0.0001785385271251343, "loss": 0.0111, "step": 160500 }, { "epoch": 0.81, "learning_rate": 0.0001785309594321203, "loss": 0.013, "step": 160510 }, { "epoch": 0.81, "learning_rate": 0.00017852339173910628, "loss": 0.0109, "step": 160520 }, { "epoch": 0.81, "learning_rate": 0.00017851582404609226, "loss": 0.0127, "step": 160530 }, { "epoch": 0.81, "learning_rate": 0.00017850825635307827, "loss": 0.0139, "step": 160540 }, { "epoch": 0.81, "learning_rate": 0.00017850068866006425, "loss": 0.0095, "step": 160550 }, { "epoch": 0.81, "learning_rate": 0.00017849312096705023, "loss": 0.0111, "step": 160560 }, { "epoch": 0.81, "learning_rate": 0.00017848555327403624, "loss": 0.0126, "step": 160570 }, { "epoch": 0.81, "learning_rate": 0.00017847798558102222, "loss": 0.0107, "step": 160580 }, { "epoch": 0.81, "learning_rate": 0.0001784704178880082, "loss": 0.0107, "step": 160590 }, { "epoch": 0.81, "learning_rate": 0.0001784628501949942, "loss": 0.0111, "step": 160600 }, { "epoch": 0.81, "learning_rate": 0.0001784552825019802, "loss": 0.0118, "step": 160610 }, { "epoch": 0.81, "learning_rate": 0.00017844771480896618, "loss": 0.0118, "step": 160620 }, { "epoch": 0.81, "learning_rate": 0.00017844014711595216, "loss": 0.0115, "step": 160630 }, { "epoch": 0.81, "learning_rate": 0.00017843257942293817, "loss": 0.01, "step": 160640 }, { "epoch": 0.81, "learning_rate": 0.00017842501172992415, "loss": 0.0114, "step": 160650 }, { "epoch": 0.81, "learning_rate": 0.00017841744403691013, "loss": 0.0137, "step": 160660 }, { "epoch": 0.81, "learning_rate": 0.00017840987634389614, "loss": 0.0107, "step": 160670 }, { "epoch": 0.81, "learning_rate": 0.00017840230865088212, "loss": 0.01, "step": 160680 }, { "epoch": 0.81, "learning_rate": 0.0001783947409578681, "loss": 0.0131, "step": 160690 }, { "epoch": 0.81, "learning_rate": 0.0001783871732648541, "loss": 0.0122, "step": 160700 }, { "epoch": 0.81, "learning_rate": 0.0001783796055718401, "loss": 0.0114, "step": 160710 }, { "epoch": 0.81, "learning_rate": 0.00017837203787882607, "loss": 0.0138, "step": 160720 }, { "epoch": 0.81, "learning_rate": 0.00017836447018581208, "loss": 0.0136, "step": 160730 }, { "epoch": 0.81, "learning_rate": 0.00017835690249279806, "loss": 0.0107, "step": 160740 }, { "epoch": 0.81, "learning_rate": 0.00017834933479978404, "loss": 0.0095, "step": 160750 }, { "epoch": 0.81, "learning_rate": 0.00017834176710677005, "loss": 0.0146, "step": 160760 }, { "epoch": 0.81, "learning_rate": 0.00017833419941375603, "loss": 0.0109, "step": 160770 }, { "epoch": 0.81, "learning_rate": 0.00017832663172074201, "loss": 0.0089, "step": 160780 }, { "epoch": 0.81, "learning_rate": 0.000178319064027728, "loss": 0.013, "step": 160790 }, { "epoch": 0.81, "learning_rate": 0.000178311496334714, "loss": 0.0118, "step": 160800 }, { "epoch": 0.81, "learning_rate": 0.00017830392864169999, "loss": 0.0137, "step": 160810 }, { "epoch": 0.81, "learning_rate": 0.00017829636094868597, "loss": 0.0128, "step": 160820 }, { "epoch": 0.81, "learning_rate": 0.00017828879325567198, "loss": 0.0109, "step": 160830 }, { "epoch": 0.81, "learning_rate": 0.00017828122556265796, "loss": 0.0167, "step": 160840 }, { "epoch": 0.81, "learning_rate": 0.00017827365786964394, "loss": 0.0137, "step": 160850 }, { "epoch": 0.81, "learning_rate": 0.00017826609017662995, "loss": 0.0107, "step": 160860 }, { "epoch": 0.81, "learning_rate": 0.00017825852248361593, "loss": 0.0119, "step": 160870 }, { "epoch": 0.81, "learning_rate": 0.0001782509547906019, "loss": 0.0135, "step": 160880 }, { "epoch": 0.81, "learning_rate": 0.00017824338709758792, "loss": 0.0102, "step": 160890 }, { "epoch": 0.81, "learning_rate": 0.0001782358194045739, "loss": 0.0138, "step": 160900 }, { "epoch": 0.81, "learning_rate": 0.00017822825171155988, "loss": 0.0143, "step": 160910 }, { "epoch": 0.81, "learning_rate": 0.0001782206840185459, "loss": 0.0113, "step": 160920 }, { "epoch": 0.81, "learning_rate": 0.00017821311632553187, "loss": 0.0144, "step": 160930 }, { "epoch": 0.81, "learning_rate": 0.00017820554863251785, "loss": 0.0107, "step": 160940 }, { "epoch": 0.81, "learning_rate": 0.00017819798093950383, "loss": 0.0136, "step": 160950 }, { "epoch": 0.81, "learning_rate": 0.00017819041324648984, "loss": 0.0118, "step": 160960 }, { "epoch": 0.81, "learning_rate": 0.00017818284555347582, "loss": 0.0134, "step": 160970 }, { "epoch": 0.81, "learning_rate": 0.0001781752778604618, "loss": 0.013, "step": 160980 }, { "epoch": 0.81, "learning_rate": 0.00017816771016744781, "loss": 0.0126, "step": 160990 }, { "epoch": 0.81, "learning_rate": 0.0001781601424744338, "loss": 0.0127, "step": 161000 }, { "epoch": 0.81, "eval_cer": 0.9144789894682909, "eval_loss": 0.008487106300890446, "eval_runtime": 116.5295, "eval_samples_per_second": 17.163, "eval_steps_per_second": 4.291, "step": 161000 }, { "epoch": 0.81, "learning_rate": 0.00017815257478141978, "loss": 0.013, "step": 161010 }, { "epoch": 0.81, "learning_rate": 0.00017814500708840579, "loss": 0.0154, "step": 161020 }, { "epoch": 0.81, "learning_rate": 0.00017813743939539177, "loss": 0.0145, "step": 161030 }, { "epoch": 0.81, "learning_rate": 0.00017812987170237775, "loss": 0.0103, "step": 161040 }, { "epoch": 0.81, "learning_rate": 0.00017812230400936376, "loss": 0.0117, "step": 161050 }, { "epoch": 0.81, "learning_rate": 0.00017811473631634974, "loss": 0.0102, "step": 161060 }, { "epoch": 0.81, "learning_rate": 0.00017810716862333572, "loss": 0.0116, "step": 161070 }, { "epoch": 0.81, "learning_rate": 0.00017809960093032173, "loss": 0.0136, "step": 161080 }, { "epoch": 0.81, "learning_rate": 0.0001780920332373077, "loss": 0.0112, "step": 161090 }, { "epoch": 0.81, "learning_rate": 0.0001780844655442937, "loss": 0.0114, "step": 161100 }, { "epoch": 0.81, "learning_rate": 0.0001780768978512797, "loss": 0.013, "step": 161110 }, { "epoch": 0.81, "learning_rate": 0.00017806933015826568, "loss": 0.012, "step": 161120 }, { "epoch": 0.81, "learning_rate": 0.00017806176246525166, "loss": 0.0091, "step": 161130 }, { "epoch": 0.81, "learning_rate": 0.00017805419477223764, "loss": 0.0154, "step": 161140 }, { "epoch": 0.81, "learning_rate": 0.00017804662707922365, "loss": 0.0104, "step": 161150 }, { "epoch": 0.81, "learning_rate": 0.00017803905938620963, "loss": 0.0115, "step": 161160 }, { "epoch": 0.81, "learning_rate": 0.00017803149169319562, "loss": 0.0114, "step": 161170 }, { "epoch": 0.81, "learning_rate": 0.00017802392400018162, "loss": 0.0143, "step": 161180 }, { "epoch": 0.81, "learning_rate": 0.0001780163563071676, "loss": 0.0102, "step": 161190 }, { "epoch": 0.81, "learning_rate": 0.0001780087886141536, "loss": 0.0117, "step": 161200 }, { "epoch": 0.81, "learning_rate": 0.0001780012209211396, "loss": 0.0116, "step": 161210 }, { "epoch": 0.81, "learning_rate": 0.00017799365322812558, "loss": 0.0114, "step": 161220 }, { "epoch": 0.81, "learning_rate": 0.00017798608553511156, "loss": 0.0126, "step": 161230 }, { "epoch": 0.81, "learning_rate": 0.00017797851784209757, "loss": 0.013, "step": 161240 }, { "epoch": 0.81, "learning_rate": 0.00017797095014908355, "loss": 0.0143, "step": 161250 }, { "epoch": 0.81, "learning_rate": 0.00017796338245606953, "loss": 0.0134, "step": 161260 }, { "epoch": 0.81, "learning_rate": 0.00017795581476305554, "loss": 0.0098, "step": 161270 }, { "epoch": 0.81, "learning_rate": 0.00017794824707004152, "loss": 0.0118, "step": 161280 }, { "epoch": 0.81, "learning_rate": 0.0001779406793770275, "loss": 0.0133, "step": 161290 }, { "epoch": 0.81, "learning_rate": 0.00017793311168401348, "loss": 0.0139, "step": 161300 }, { "epoch": 0.81, "learning_rate": 0.0001779255439909995, "loss": 0.0132, "step": 161310 }, { "epoch": 0.81, "learning_rate": 0.00017791797629798547, "loss": 0.0124, "step": 161320 }, { "epoch": 0.81, "learning_rate": 0.00017791040860497145, "loss": 0.0137, "step": 161330 }, { "epoch": 0.81, "learning_rate": 0.00017790284091195746, "loss": 0.0127, "step": 161340 }, { "epoch": 0.81, "learning_rate": 0.00017789527321894344, "loss": 0.0129, "step": 161350 }, { "epoch": 0.81, "learning_rate": 0.00017788770552592943, "loss": 0.0149, "step": 161360 }, { "epoch": 0.81, "learning_rate": 0.00017788013783291543, "loss": 0.0113, "step": 161370 }, { "epoch": 0.81, "learning_rate": 0.00017787257013990142, "loss": 0.0116, "step": 161380 }, { "epoch": 0.81, "learning_rate": 0.0001778650024468874, "loss": 0.0111, "step": 161390 }, { "epoch": 0.81, "learning_rate": 0.0001778574347538734, "loss": 0.0127, "step": 161400 }, { "epoch": 0.81, "learning_rate": 0.0001778498670608594, "loss": 0.0114, "step": 161410 }, { "epoch": 0.81, "learning_rate": 0.00017784229936784537, "loss": 0.0104, "step": 161420 }, { "epoch": 0.81, "learning_rate": 0.00017783473167483138, "loss": 0.014, "step": 161430 }, { "epoch": 0.81, "learning_rate": 0.00017782716398181736, "loss": 0.0135, "step": 161440 }, { "epoch": 0.81, "learning_rate": 0.00017781959628880334, "loss": 0.0104, "step": 161450 }, { "epoch": 0.81, "learning_rate": 0.00017781202859578932, "loss": 0.0124, "step": 161460 }, { "epoch": 0.81, "learning_rate": 0.00017780446090277533, "loss": 0.0107, "step": 161470 }, { "epoch": 0.81, "learning_rate": 0.0001777968932097613, "loss": 0.0119, "step": 161480 }, { "epoch": 0.81, "learning_rate": 0.0001777893255167473, "loss": 0.0158, "step": 161490 }, { "epoch": 0.81, "learning_rate": 0.0001777817578237333, "loss": 0.0112, "step": 161500 }, { "epoch": 0.81, "learning_rate": 0.00017777419013071926, "loss": 0.012, "step": 161510 }, { "epoch": 0.81, "learning_rate": 0.00017776662243770524, "loss": 0.0122, "step": 161520 }, { "epoch": 0.81, "learning_rate": 0.00017775905474469122, "loss": 0.0116, "step": 161530 }, { "epoch": 0.81, "learning_rate": 0.00017775148705167723, "loss": 0.0106, "step": 161540 }, { "epoch": 0.82, "learning_rate": 0.0001777439193586632, "loss": 0.0106, "step": 161550 }, { "epoch": 0.82, "learning_rate": 0.0001777363516656492, "loss": 0.0102, "step": 161560 }, { "epoch": 0.82, "learning_rate": 0.0001777287839726352, "loss": 0.0144, "step": 161570 }, { "epoch": 0.82, "learning_rate": 0.00017772121627962118, "loss": 0.014, "step": 161580 }, { "epoch": 0.82, "learning_rate": 0.00017771364858660716, "loss": 0.0132, "step": 161590 }, { "epoch": 0.82, "learning_rate": 0.00017770608089359317, "loss": 0.0104, "step": 161600 }, { "epoch": 0.82, "learning_rate": 0.00017769851320057915, "loss": 0.0104, "step": 161610 }, { "epoch": 0.82, "learning_rate": 0.00017769094550756513, "loss": 0.0104, "step": 161620 }, { "epoch": 0.82, "learning_rate": 0.00017768337781455114, "loss": 0.0127, "step": 161630 }, { "epoch": 0.82, "learning_rate": 0.00017767581012153712, "loss": 0.0128, "step": 161640 }, { "epoch": 0.82, "learning_rate": 0.0001776682424285231, "loss": 0.0155, "step": 161650 }, { "epoch": 0.82, "learning_rate": 0.0001776606747355091, "loss": 0.0119, "step": 161660 }, { "epoch": 0.82, "learning_rate": 0.0001776531070424951, "loss": 0.0106, "step": 161670 }, { "epoch": 0.82, "learning_rate": 0.00017764553934948108, "loss": 0.0149, "step": 161680 }, { "epoch": 0.82, "learning_rate": 0.00017763797165646706, "loss": 0.0144, "step": 161690 }, { "epoch": 0.82, "learning_rate": 0.00017763040396345307, "loss": 0.0103, "step": 161700 }, { "epoch": 0.82, "learning_rate": 0.00017762283627043905, "loss": 0.0131, "step": 161710 }, { "epoch": 0.82, "learning_rate": 0.00017761526857742503, "loss": 0.0096, "step": 161720 }, { "epoch": 0.82, "learning_rate": 0.00017760770088441104, "loss": 0.011, "step": 161730 }, { "epoch": 0.82, "learning_rate": 0.00017760013319139702, "loss": 0.0119, "step": 161740 }, { "epoch": 0.82, "learning_rate": 0.000177592565498383, "loss": 0.0118, "step": 161750 }, { "epoch": 0.82, "learning_rate": 0.000177584997805369, "loss": 0.0106, "step": 161760 }, { "epoch": 0.82, "learning_rate": 0.000177577430112355, "loss": 0.0101, "step": 161770 }, { "epoch": 0.82, "learning_rate": 0.00017756986241934097, "loss": 0.0228, "step": 161780 }, { "epoch": 0.82, "learning_rate": 0.00017756229472632698, "loss": 0.0153, "step": 161790 }, { "epoch": 0.82, "learning_rate": 0.00017755472703331296, "loss": 0.0118, "step": 161800 }, { "epoch": 0.82, "learning_rate": 0.00017754715934029894, "loss": 0.013, "step": 161810 }, { "epoch": 0.82, "learning_rate": 0.00017753959164728495, "loss": 0.0125, "step": 161820 }, { "epoch": 0.82, "learning_rate": 0.00017753202395427093, "loss": 0.0141, "step": 161830 }, { "epoch": 0.82, "learning_rate": 0.00017752445626125691, "loss": 0.0116, "step": 161840 }, { "epoch": 0.82, "learning_rate": 0.0001775168885682429, "loss": 0.0099, "step": 161850 }, { "epoch": 0.82, "learning_rate": 0.0001775093208752289, "loss": 0.0132, "step": 161860 }, { "epoch": 0.82, "learning_rate": 0.00017750175318221489, "loss": 0.0111, "step": 161870 }, { "epoch": 0.82, "learning_rate": 0.00017749418548920087, "loss": 0.0105, "step": 161880 }, { "epoch": 0.82, "learning_rate": 0.00017748661779618688, "loss": 0.0139, "step": 161890 }, { "epoch": 0.82, "learning_rate": 0.00017747905010317286, "loss": 0.0133, "step": 161900 }, { "epoch": 0.82, "learning_rate": 0.00017747148241015884, "loss": 0.0111, "step": 161910 }, { "epoch": 0.82, "learning_rate": 0.00017746391471714485, "loss": 0.0119, "step": 161920 }, { "epoch": 0.82, "learning_rate": 0.00017745634702413083, "loss": 0.0188, "step": 161930 }, { "epoch": 0.82, "learning_rate": 0.0001774487793311168, "loss": 0.0113, "step": 161940 }, { "epoch": 0.82, "learning_rate": 0.00017744121163810282, "loss": 0.0133, "step": 161950 }, { "epoch": 0.82, "learning_rate": 0.0001774336439450888, "loss": 0.0144, "step": 161960 }, { "epoch": 0.82, "learning_rate": 0.00017742607625207478, "loss": 0.0112, "step": 161970 }, { "epoch": 0.82, "learning_rate": 0.0001774185085590608, "loss": 0.0123, "step": 161980 }, { "epoch": 0.82, "learning_rate": 0.00017741094086604677, "loss": 0.0088, "step": 161990 }, { "epoch": 0.82, "learning_rate": 0.00017740337317303275, "loss": 0.0211, "step": 162000 }, { "epoch": 0.82, "eval_cer": 0.9144663743186606, "eval_loss": 0.008896621875464916, "eval_runtime": 115.9502, "eval_samples_per_second": 17.249, "eval_steps_per_second": 4.312, "step": 162000 }, { "epoch": 0.82, "learning_rate": 0.00017739580548001876, "loss": 0.0128, "step": 162010 }, { "epoch": 0.82, "learning_rate": 0.00017738823778700474, "loss": 0.0124, "step": 162020 }, { "epoch": 0.82, "learning_rate": 0.00017738067009399072, "loss": 0.0148, "step": 162030 }, { "epoch": 0.82, "learning_rate": 0.0001773731024009767, "loss": 0.0181, "step": 162040 }, { "epoch": 0.82, "learning_rate": 0.00017736553470796271, "loss": 0.012, "step": 162050 }, { "epoch": 0.82, "learning_rate": 0.0001773579670149487, "loss": 0.0131, "step": 162060 }, { "epoch": 0.82, "learning_rate": 0.00017735039932193468, "loss": 0.0103, "step": 162070 }, { "epoch": 0.82, "learning_rate": 0.00017734283162892069, "loss": 0.0133, "step": 162080 }, { "epoch": 0.82, "learning_rate": 0.00017733526393590667, "loss": 0.0112, "step": 162090 }, { "epoch": 0.82, "learning_rate": 0.00017732769624289265, "loss": 0.0136, "step": 162100 }, { "epoch": 0.82, "learning_rate": 0.00017732012854987866, "loss": 0.0141, "step": 162110 }, { "epoch": 0.82, "learning_rate": 0.00017731256085686464, "loss": 0.0125, "step": 162120 }, { "epoch": 0.82, "learning_rate": 0.00017730499316385062, "loss": 0.0113, "step": 162130 }, { "epoch": 0.82, "learning_rate": 0.00017729742547083663, "loss": 0.0113, "step": 162140 }, { "epoch": 0.82, "learning_rate": 0.0001772898577778226, "loss": 0.0118, "step": 162150 }, { "epoch": 0.82, "learning_rate": 0.0001772822900848086, "loss": 0.0096, "step": 162160 }, { "epoch": 0.82, "learning_rate": 0.0001772747223917946, "loss": 0.0131, "step": 162170 }, { "epoch": 0.82, "learning_rate": 0.00017726715469878058, "loss": 0.0102, "step": 162180 }, { "epoch": 0.82, "learning_rate": 0.00017725958700576656, "loss": 0.013, "step": 162190 }, { "epoch": 0.82, "learning_rate": 0.00017725201931275255, "loss": 0.0102, "step": 162200 }, { "epoch": 0.82, "learning_rate": 0.00017724445161973855, "loss": 0.0093, "step": 162210 }, { "epoch": 0.82, "learning_rate": 0.00017723688392672454, "loss": 0.0157, "step": 162220 }, { "epoch": 0.82, "learning_rate": 0.00017722931623371052, "loss": 0.0124, "step": 162230 }, { "epoch": 0.82, "learning_rate": 0.00017722174854069653, "loss": 0.0108, "step": 162240 }, { "epoch": 0.82, "learning_rate": 0.0001772141808476825, "loss": 0.0122, "step": 162250 }, { "epoch": 0.82, "learning_rate": 0.0001772066131546685, "loss": 0.0154, "step": 162260 }, { "epoch": 0.82, "learning_rate": 0.0001771990454616545, "loss": 0.0118, "step": 162270 }, { "epoch": 0.82, "learning_rate": 0.00017719147776864048, "loss": 0.0111, "step": 162280 }, { "epoch": 0.82, "learning_rate": 0.00017718391007562646, "loss": 0.0093, "step": 162290 }, { "epoch": 0.82, "learning_rate": 0.00017717634238261247, "loss": 0.0132, "step": 162300 }, { "epoch": 0.82, "learning_rate": 0.00017716877468959845, "loss": 0.0119, "step": 162310 }, { "epoch": 0.82, "learning_rate": 0.00017716120699658443, "loss": 0.0105, "step": 162320 }, { "epoch": 0.82, "learning_rate": 0.00017715363930357044, "loss": 0.0126, "step": 162330 }, { "epoch": 0.82, "learning_rate": 0.00017714607161055642, "loss": 0.0177, "step": 162340 }, { "epoch": 0.82, "learning_rate": 0.0001771385039175424, "loss": 0.0147, "step": 162350 }, { "epoch": 0.82, "learning_rate": 0.00017713093622452838, "loss": 0.0197, "step": 162360 }, { "epoch": 0.82, "learning_rate": 0.0001771233685315144, "loss": 0.0111, "step": 162370 }, { "epoch": 0.82, "learning_rate": 0.00017711580083850037, "loss": 0.0146, "step": 162380 }, { "epoch": 0.82, "learning_rate": 0.00017710823314548636, "loss": 0.0105, "step": 162390 }, { "epoch": 0.82, "learning_rate": 0.00017710066545247236, "loss": 0.0119, "step": 162400 }, { "epoch": 0.82, "learning_rate": 0.00017709309775945835, "loss": 0.0127, "step": 162410 }, { "epoch": 0.82, "learning_rate": 0.00017708553006644433, "loss": 0.0151, "step": 162420 }, { "epoch": 0.82, "learning_rate": 0.00017707796237343034, "loss": 0.0123, "step": 162430 }, { "epoch": 0.82, "learning_rate": 0.00017707039468041632, "loss": 0.0156, "step": 162440 }, { "epoch": 0.82, "learning_rate": 0.0001770628269874023, "loss": 0.0119, "step": 162450 }, { "epoch": 0.82, "learning_rate": 0.0001770552592943883, "loss": 0.0128, "step": 162460 }, { "epoch": 0.82, "learning_rate": 0.0001770476916013743, "loss": 0.011, "step": 162470 }, { "epoch": 0.82, "learning_rate": 0.00017704012390836027, "loss": 0.0122, "step": 162480 }, { "epoch": 0.82, "learning_rate": 0.00017703255621534628, "loss": 0.0121, "step": 162490 }, { "epoch": 0.82, "learning_rate": 0.00017702498852233226, "loss": 0.0117, "step": 162500 }, { "epoch": 0.82, "learning_rate": 0.00017701742082931824, "loss": 0.0103, "step": 162510 }, { "epoch": 0.82, "learning_rate": 0.00017700985313630425, "loss": 0.0104, "step": 162520 }, { "epoch": 0.82, "learning_rate": 0.00017700228544329023, "loss": 0.0142, "step": 162530 }, { "epoch": 0.82, "learning_rate": 0.0001769947177502762, "loss": 0.0133, "step": 162540 }, { "epoch": 0.82, "learning_rate": 0.0001769871500572622, "loss": 0.0139, "step": 162550 }, { "epoch": 0.82, "learning_rate": 0.0001769795823642482, "loss": 0.0116, "step": 162560 }, { "epoch": 0.82, "learning_rate": 0.00017697201467123418, "loss": 0.0139, "step": 162570 }, { "epoch": 0.82, "learning_rate": 0.00017696444697822017, "loss": 0.015, "step": 162580 }, { "epoch": 0.82, "learning_rate": 0.00017695687928520617, "loss": 0.0108, "step": 162590 }, { "epoch": 0.82, "learning_rate": 0.00017694931159219216, "loss": 0.0144, "step": 162600 }, { "epoch": 0.82, "learning_rate": 0.00017694174389917814, "loss": 0.0124, "step": 162610 }, { "epoch": 0.82, "learning_rate": 0.00017693417620616415, "loss": 0.0102, "step": 162620 }, { "epoch": 0.82, "learning_rate": 0.00017692660851315013, "loss": 0.0106, "step": 162630 }, { "epoch": 0.82, "learning_rate": 0.0001769190408201361, "loss": 0.0111, "step": 162640 }, { "epoch": 0.82, "learning_rate": 0.00017691147312712212, "loss": 0.0154, "step": 162650 }, { "epoch": 0.82, "learning_rate": 0.0001769039054341081, "loss": 0.0169, "step": 162660 }, { "epoch": 0.82, "learning_rate": 0.00017689633774109408, "loss": 0.013, "step": 162670 }, { "epoch": 0.82, "learning_rate": 0.0001768887700480801, "loss": 0.0133, "step": 162680 }, { "epoch": 0.82, "learning_rate": 0.00017688120235506607, "loss": 0.011, "step": 162690 }, { "epoch": 0.82, "learning_rate": 0.00017687363466205205, "loss": 0.0106, "step": 162700 }, { "epoch": 0.82, "learning_rate": 0.00017686606696903803, "loss": 0.0114, "step": 162710 }, { "epoch": 0.82, "learning_rate": 0.00017685849927602404, "loss": 0.0147, "step": 162720 }, { "epoch": 0.82, "learning_rate": 0.00017685093158301002, "loss": 0.0114, "step": 162730 }, { "epoch": 0.82, "learning_rate": 0.000176843363889996, "loss": 0.0111, "step": 162740 }, { "epoch": 0.82, "learning_rate": 0.000176835796196982, "loss": 0.0099, "step": 162750 }, { "epoch": 0.82, "learning_rate": 0.000176828228503968, "loss": 0.0131, "step": 162760 }, { "epoch": 0.82, "learning_rate": 0.00017682066081095395, "loss": 0.0133, "step": 162770 }, { "epoch": 0.82, "learning_rate": 0.00017681309311793993, "loss": 0.0119, "step": 162780 }, { "epoch": 0.82, "learning_rate": 0.00017680552542492594, "loss": 0.0145, "step": 162790 }, { "epoch": 0.82, "learning_rate": 0.00017679795773191192, "loss": 0.0131, "step": 162800 }, { "epoch": 0.82, "learning_rate": 0.0001767903900388979, "loss": 0.0152, "step": 162810 }, { "epoch": 0.82, "learning_rate": 0.0001767828223458839, "loss": 0.0176, "step": 162820 }, { "epoch": 0.82, "learning_rate": 0.0001767752546528699, "loss": 0.014, "step": 162830 }, { "epoch": 0.82, "learning_rate": 0.00017676768695985587, "loss": 0.0114, "step": 162840 }, { "epoch": 0.82, "learning_rate": 0.00017676011926684188, "loss": 0.0139, "step": 162850 }, { "epoch": 0.82, "learning_rate": 0.00017675255157382786, "loss": 0.0103, "step": 162860 }, { "epoch": 0.82, "learning_rate": 0.00017674498388081384, "loss": 0.0114, "step": 162870 }, { "epoch": 0.82, "learning_rate": 0.00017673741618779985, "loss": 0.0123, "step": 162880 }, { "epoch": 0.82, "learning_rate": 0.00017672984849478583, "loss": 0.0173, "step": 162890 }, { "epoch": 0.82, "learning_rate": 0.00017672228080177182, "loss": 0.0135, "step": 162900 }, { "epoch": 0.82, "learning_rate": 0.00017671471310875782, "loss": 0.0136, "step": 162910 }, { "epoch": 0.82, "learning_rate": 0.0001767071454157438, "loss": 0.0115, "step": 162920 }, { "epoch": 0.82, "learning_rate": 0.0001766995777227298, "loss": 0.0139, "step": 162930 }, { "epoch": 0.82, "learning_rate": 0.00017669201002971577, "loss": 0.0116, "step": 162940 }, { "epoch": 0.82, "learning_rate": 0.00017668444233670178, "loss": 0.0155, "step": 162950 }, { "epoch": 0.82, "learning_rate": 0.00017667687464368776, "loss": 0.0123, "step": 162960 }, { "epoch": 0.82, "learning_rate": 0.00017666930695067374, "loss": 0.0093, "step": 162970 }, { "epoch": 0.82, "learning_rate": 0.00017666173925765975, "loss": 0.0114, "step": 162980 }, { "epoch": 0.82, "learning_rate": 0.00017665417156464573, "loss": 0.0108, "step": 162990 }, { "epoch": 0.82, "learning_rate": 0.0001766466038716317, "loss": 0.0087, "step": 163000 }, { "epoch": 0.82, "eval_cer": 0.9144401736232748, "eval_loss": 0.00887399259954691, "eval_runtime": 116.6416, "eval_samples_per_second": 17.147, "eval_steps_per_second": 4.287, "step": 163000 }, { "epoch": 0.82, "learning_rate": 0.00017663903617861772, "loss": 0.0108, "step": 163010 }, { "epoch": 0.82, "learning_rate": 0.0001766314684856037, "loss": 0.0116, "step": 163020 }, { "epoch": 0.82, "learning_rate": 0.00017662390079258968, "loss": 0.0129, "step": 163030 }, { "epoch": 0.82, "learning_rate": 0.0001766163330995757, "loss": 0.011, "step": 163040 }, { "epoch": 0.82, "learning_rate": 0.00017660876540656167, "loss": 0.0127, "step": 163050 }, { "epoch": 0.82, "learning_rate": 0.00017660119771354765, "loss": 0.014, "step": 163060 }, { "epoch": 0.82, "learning_rate": 0.00017659363002053366, "loss": 0.0137, "step": 163070 }, { "epoch": 0.82, "learning_rate": 0.00017658606232751964, "loss": 0.0109, "step": 163080 }, { "epoch": 0.82, "learning_rate": 0.00017657849463450563, "loss": 0.0148, "step": 163090 }, { "epoch": 0.82, "learning_rate": 0.0001765709269414916, "loss": 0.0113, "step": 163100 }, { "epoch": 0.82, "learning_rate": 0.00017656335924847762, "loss": 0.0107, "step": 163110 }, { "epoch": 0.82, "learning_rate": 0.0001765557915554636, "loss": 0.0121, "step": 163120 }, { "epoch": 0.82, "learning_rate": 0.00017654822386244958, "loss": 0.0124, "step": 163130 }, { "epoch": 0.82, "learning_rate": 0.0001765406561694356, "loss": 0.0104, "step": 163140 }, { "epoch": 0.82, "learning_rate": 0.00017653308847642157, "loss": 0.0127, "step": 163150 }, { "epoch": 0.82, "learning_rate": 0.00017652552078340755, "loss": 0.0112, "step": 163160 }, { "epoch": 0.82, "learning_rate": 0.00017651795309039356, "loss": 0.014, "step": 163170 }, { "epoch": 0.82, "learning_rate": 0.00017651038539737954, "loss": 0.0109, "step": 163180 }, { "epoch": 0.82, "learning_rate": 0.00017650281770436552, "loss": 0.0139, "step": 163190 }, { "epoch": 0.82, "learning_rate": 0.00017649525001135153, "loss": 0.0115, "step": 163200 }, { "epoch": 0.82, "learning_rate": 0.0001764876823183375, "loss": 0.0113, "step": 163210 }, { "epoch": 0.82, "learning_rate": 0.0001764801146253235, "loss": 0.0175, "step": 163220 }, { "epoch": 0.82, "learning_rate": 0.0001764725469323095, "loss": 0.0156, "step": 163230 }, { "epoch": 0.82, "learning_rate": 0.00017646497923929548, "loss": 0.0146, "step": 163240 }, { "epoch": 0.82, "learning_rate": 0.00017645741154628146, "loss": 0.0101, "step": 163250 }, { "epoch": 0.82, "learning_rate": 0.00017644984385326745, "loss": 0.0131, "step": 163260 }, { "epoch": 0.82, "learning_rate": 0.00017644227616025345, "loss": 0.0115, "step": 163270 }, { "epoch": 0.82, "learning_rate": 0.00017643470846723944, "loss": 0.0112, "step": 163280 }, { "epoch": 0.82, "learning_rate": 0.00017642714077422542, "loss": 0.0121, "step": 163290 }, { "epoch": 0.82, "learning_rate": 0.00017641957308121143, "loss": 0.0116, "step": 163300 }, { "epoch": 0.82, "learning_rate": 0.0001764120053881974, "loss": 0.0129, "step": 163310 }, { "epoch": 0.82, "learning_rate": 0.0001764044376951834, "loss": 0.0151, "step": 163320 }, { "epoch": 0.82, "learning_rate": 0.0001763968700021694, "loss": 0.0129, "step": 163330 }, { "epoch": 0.82, "learning_rate": 0.00017638930230915538, "loss": 0.0104, "step": 163340 }, { "epoch": 0.82, "learning_rate": 0.00017638173461614136, "loss": 0.0112, "step": 163350 }, { "epoch": 0.82, "learning_rate": 0.00017637416692312737, "loss": 0.0176, "step": 163360 }, { "epoch": 0.82, "learning_rate": 0.00017636659923011335, "loss": 0.013, "step": 163370 }, { "epoch": 0.82, "learning_rate": 0.00017635903153709933, "loss": 0.0107, "step": 163380 }, { "epoch": 0.82, "learning_rate": 0.00017635146384408534, "loss": 0.0144, "step": 163390 }, { "epoch": 0.82, "learning_rate": 0.00017634389615107132, "loss": 0.0103, "step": 163400 }, { "epoch": 0.82, "learning_rate": 0.0001763363284580573, "loss": 0.0186, "step": 163410 }, { "epoch": 0.82, "learning_rate": 0.0001763287607650433, "loss": 0.0119, "step": 163420 }, { "epoch": 0.82, "learning_rate": 0.0001763211930720293, "loss": 0.0118, "step": 163430 }, { "epoch": 0.82, "learning_rate": 0.00017631362537901527, "loss": 0.0124, "step": 163440 }, { "epoch": 0.82, "learning_rate": 0.00017630605768600126, "loss": 0.0119, "step": 163450 }, { "epoch": 0.82, "learning_rate": 0.00017629848999298726, "loss": 0.0149, "step": 163460 }, { "epoch": 0.82, "learning_rate": 0.00017629092229997325, "loss": 0.013, "step": 163470 }, { "epoch": 0.82, "learning_rate": 0.00017628335460695923, "loss": 0.0112, "step": 163480 }, { "epoch": 0.82, "learning_rate": 0.00017627578691394524, "loss": 0.011, "step": 163490 }, { "epoch": 0.82, "learning_rate": 0.00017626821922093122, "loss": 0.0104, "step": 163500 }, { "epoch": 0.82, "learning_rate": 0.0001762606515279172, "loss": 0.0106, "step": 163510 }, { "epoch": 0.82, "learning_rate": 0.0001762530838349032, "loss": 0.0114, "step": 163520 }, { "epoch": 0.83, "learning_rate": 0.0001762455161418892, "loss": 0.012, "step": 163530 }, { "epoch": 0.83, "learning_rate": 0.00017623794844887517, "loss": 0.0131, "step": 163540 }, { "epoch": 0.83, "learning_rate": 0.00017623038075586118, "loss": 0.0114, "step": 163550 }, { "epoch": 0.83, "learning_rate": 0.00017622281306284716, "loss": 0.0109, "step": 163560 }, { "epoch": 0.83, "learning_rate": 0.00017621524536983314, "loss": 0.0081, "step": 163570 }, { "epoch": 0.83, "learning_rate": 0.00017620767767681915, "loss": 0.0116, "step": 163580 }, { "epoch": 0.83, "learning_rate": 0.00017620010998380513, "loss": 0.0141, "step": 163590 }, { "epoch": 0.83, "learning_rate": 0.0001761925422907911, "loss": 0.0126, "step": 163600 }, { "epoch": 0.83, "learning_rate": 0.0001761849745977771, "loss": 0.0111, "step": 163610 }, { "epoch": 0.83, "learning_rate": 0.0001761774069047631, "loss": 0.0096, "step": 163620 }, { "epoch": 0.83, "learning_rate": 0.00017616983921174908, "loss": 0.01, "step": 163630 }, { "epoch": 0.83, "learning_rate": 0.00017616227151873507, "loss": 0.0098, "step": 163640 }, { "epoch": 0.83, "learning_rate": 0.00017615470382572107, "loss": 0.0147, "step": 163650 }, { "epoch": 0.83, "learning_rate": 0.00017614713613270706, "loss": 0.0122, "step": 163660 }, { "epoch": 0.83, "learning_rate": 0.00017613956843969304, "loss": 0.0112, "step": 163670 }, { "epoch": 0.83, "learning_rate": 0.00017613200074667905, "loss": 0.0117, "step": 163680 }, { "epoch": 0.83, "learning_rate": 0.00017612443305366503, "loss": 0.0117, "step": 163690 }, { "epoch": 0.83, "learning_rate": 0.000176116865360651, "loss": 0.013, "step": 163700 }, { "epoch": 0.83, "learning_rate": 0.00017610929766763702, "loss": 0.0121, "step": 163710 }, { "epoch": 0.83, "learning_rate": 0.000176101729974623, "loss": 0.0133, "step": 163720 }, { "epoch": 0.83, "learning_rate": 0.00017609416228160898, "loss": 0.0118, "step": 163730 }, { "epoch": 0.83, "learning_rate": 0.000176086594588595, "loss": 0.0106, "step": 163740 }, { "epoch": 0.83, "learning_rate": 0.00017607902689558097, "loss": 0.0129, "step": 163750 }, { "epoch": 0.83, "learning_rate": 0.00017607145920256695, "loss": 0.012, "step": 163760 }, { "epoch": 0.83, "learning_rate": 0.00017606389150955293, "loss": 0.0138, "step": 163770 }, { "epoch": 0.83, "learning_rate": 0.00017605632381653894, "loss": 0.0132, "step": 163780 }, { "epoch": 0.83, "learning_rate": 0.00017604875612352492, "loss": 0.0206, "step": 163790 }, { "epoch": 0.83, "learning_rate": 0.0001760411884305109, "loss": 0.0131, "step": 163800 }, { "epoch": 0.83, "learning_rate": 0.0001760336207374969, "loss": 0.0162, "step": 163810 }, { "epoch": 0.83, "learning_rate": 0.0001760260530444829, "loss": 0.0125, "step": 163820 }, { "epoch": 0.83, "learning_rate": 0.00017601848535146888, "loss": 0.0117, "step": 163830 }, { "epoch": 0.83, "learning_rate": 0.00017601091765845488, "loss": 0.0132, "step": 163840 }, { "epoch": 0.83, "learning_rate": 0.00017600334996544087, "loss": 0.0109, "step": 163850 }, { "epoch": 0.83, "learning_rate": 0.00017599578227242685, "loss": 0.0156, "step": 163860 }, { "epoch": 0.83, "learning_rate": 0.00017598821457941286, "loss": 0.0141, "step": 163870 }, { "epoch": 0.83, "learning_rate": 0.00017598064688639884, "loss": 0.0145, "step": 163880 }, { "epoch": 0.83, "learning_rate": 0.00017597307919338482, "loss": 0.0128, "step": 163890 }, { "epoch": 0.83, "learning_rate": 0.00017596551150037083, "loss": 0.0138, "step": 163900 }, { "epoch": 0.83, "learning_rate": 0.0001759579438073568, "loss": 0.0102, "step": 163910 }, { "epoch": 0.83, "learning_rate": 0.0001759503761143428, "loss": 0.016, "step": 163920 }, { "epoch": 0.83, "learning_rate": 0.0001759428084213288, "loss": 0.016, "step": 163930 }, { "epoch": 0.83, "learning_rate": 0.00017593524072831478, "loss": 0.0106, "step": 163940 }, { "epoch": 0.83, "learning_rate": 0.00017592767303530076, "loss": 0.0141, "step": 163950 }, { "epoch": 0.83, "learning_rate": 0.00017592010534228674, "loss": 0.0091, "step": 163960 }, { "epoch": 0.83, "learning_rate": 0.00017591253764927275, "loss": 0.0125, "step": 163970 }, { "epoch": 0.83, "learning_rate": 0.00017590496995625873, "loss": 0.0139, "step": 163980 }, { "epoch": 0.83, "learning_rate": 0.00017589740226324471, "loss": 0.0128, "step": 163990 }, { "epoch": 0.83, "learning_rate": 0.00017588983457023072, "loss": 0.0148, "step": 164000 }, { "epoch": 0.83, "eval_cer": 0.914481900656667, "eval_loss": 0.009098981507122517, "eval_runtime": 116.6318, "eval_samples_per_second": 17.148, "eval_steps_per_second": 4.287, "step": 164000 }, { "epoch": 0.83, "learning_rate": 0.0001758822668772167, "loss": 0.0169, "step": 164010 }, { "epoch": 0.83, "learning_rate": 0.00017587469918420269, "loss": 0.0105, "step": 164020 }, { "epoch": 0.83, "learning_rate": 0.00017586713149118864, "loss": 0.0115, "step": 164030 }, { "epoch": 0.83, "learning_rate": 0.00017585956379817465, "loss": 0.011, "step": 164040 }, { "epoch": 0.83, "learning_rate": 0.00017585199610516063, "loss": 0.0092, "step": 164050 }, { "epoch": 0.83, "learning_rate": 0.0001758444284121466, "loss": 0.0128, "step": 164060 }, { "epoch": 0.83, "learning_rate": 0.00017583686071913262, "loss": 0.0118, "step": 164070 }, { "epoch": 0.83, "learning_rate": 0.0001758292930261186, "loss": 0.0104, "step": 164080 }, { "epoch": 0.83, "learning_rate": 0.00017582172533310458, "loss": 0.0117, "step": 164090 }, { "epoch": 0.83, "learning_rate": 0.0001758141576400906, "loss": 0.0123, "step": 164100 }, { "epoch": 0.83, "learning_rate": 0.00017580658994707657, "loss": 0.0113, "step": 164110 }, { "epoch": 0.83, "learning_rate": 0.00017579902225406255, "loss": 0.0085, "step": 164120 }, { "epoch": 0.83, "learning_rate": 0.00017579145456104856, "loss": 0.01, "step": 164130 }, { "epoch": 0.83, "learning_rate": 0.00017578388686803454, "loss": 0.0129, "step": 164140 }, { "epoch": 0.83, "learning_rate": 0.00017577631917502053, "loss": 0.0115, "step": 164150 }, { "epoch": 0.83, "learning_rate": 0.0001757687514820065, "loss": 0.0104, "step": 164160 }, { "epoch": 0.83, "learning_rate": 0.00017576118378899252, "loss": 0.0162, "step": 164170 }, { "epoch": 0.83, "learning_rate": 0.0001757536160959785, "loss": 0.0133, "step": 164180 }, { "epoch": 0.83, "learning_rate": 0.00017574604840296448, "loss": 0.0133, "step": 164190 }, { "epoch": 0.83, "learning_rate": 0.0001757384807099505, "loss": 0.0137, "step": 164200 }, { "epoch": 0.83, "learning_rate": 0.00017573091301693647, "loss": 0.0119, "step": 164210 }, { "epoch": 0.83, "learning_rate": 0.00017572334532392245, "loss": 0.0125, "step": 164220 }, { "epoch": 0.83, "learning_rate": 0.00017571577763090846, "loss": 0.0117, "step": 164230 }, { "epoch": 0.83, "learning_rate": 0.00017570820993789444, "loss": 0.0152, "step": 164240 }, { "epoch": 0.83, "learning_rate": 0.00017570064224488042, "loss": 0.0141, "step": 164250 }, { "epoch": 0.83, "learning_rate": 0.00017569307455186643, "loss": 0.0122, "step": 164260 }, { "epoch": 0.83, "learning_rate": 0.0001756855068588524, "loss": 0.0126, "step": 164270 }, { "epoch": 0.83, "learning_rate": 0.0001756779391658384, "loss": 0.0112, "step": 164280 }, { "epoch": 0.83, "learning_rate": 0.0001756703714728244, "loss": 0.0101, "step": 164290 }, { "epoch": 0.83, "learning_rate": 0.00017566280377981038, "loss": 0.0127, "step": 164300 }, { "epoch": 0.83, "learning_rate": 0.00017565523608679636, "loss": 0.0159, "step": 164310 }, { "epoch": 0.83, "learning_rate": 0.00017564766839378237, "loss": 0.0124, "step": 164320 }, { "epoch": 0.83, "learning_rate": 0.00017564010070076835, "loss": 0.0119, "step": 164330 }, { "epoch": 0.83, "learning_rate": 0.00017563253300775434, "loss": 0.013, "step": 164340 }, { "epoch": 0.83, "learning_rate": 0.00017562496531474032, "loss": 0.0102, "step": 164350 }, { "epoch": 0.83, "learning_rate": 0.00017561739762172633, "loss": 0.0148, "step": 164360 }, { "epoch": 0.83, "learning_rate": 0.0001756098299287123, "loss": 0.0117, "step": 164370 }, { "epoch": 0.83, "learning_rate": 0.0001756022622356983, "loss": 0.0124, "step": 164380 }, { "epoch": 0.83, "learning_rate": 0.0001755946945426843, "loss": 0.0129, "step": 164390 }, { "epoch": 0.83, "learning_rate": 0.00017558712684967028, "loss": 0.0101, "step": 164400 }, { "epoch": 0.83, "learning_rate": 0.00017557955915665626, "loss": 0.0136, "step": 164410 }, { "epoch": 0.83, "learning_rate": 0.00017557199146364227, "loss": 0.0121, "step": 164420 }, { "epoch": 0.83, "learning_rate": 0.00017556442377062825, "loss": 0.0123, "step": 164430 }, { "epoch": 0.83, "learning_rate": 0.00017555685607761423, "loss": 0.0108, "step": 164440 }, { "epoch": 0.83, "learning_rate": 0.00017554928838460024, "loss": 0.0126, "step": 164450 }, { "epoch": 0.83, "learning_rate": 0.00017554172069158622, "loss": 0.012, "step": 164460 }, { "epoch": 0.83, "learning_rate": 0.0001755341529985722, "loss": 0.0112, "step": 164470 }, { "epoch": 0.83, "learning_rate": 0.0001755265853055582, "loss": 0.0139, "step": 164480 }, { "epoch": 0.83, "learning_rate": 0.0001755190176125442, "loss": 0.0129, "step": 164490 }, { "epoch": 0.83, "learning_rate": 0.00017551144991953017, "loss": 0.012, "step": 164500 }, { "epoch": 0.83, "learning_rate": 0.00017550388222651616, "loss": 0.0103, "step": 164510 }, { "epoch": 0.83, "learning_rate": 0.00017549631453350216, "loss": 0.0139, "step": 164520 }, { "epoch": 0.83, "learning_rate": 0.00017548874684048815, "loss": 0.01, "step": 164530 }, { "epoch": 0.83, "learning_rate": 0.00017548117914747413, "loss": 0.0083, "step": 164540 }, { "epoch": 0.83, "learning_rate": 0.00017547361145446014, "loss": 0.015, "step": 164550 }, { "epoch": 0.83, "learning_rate": 0.00017546604376144612, "loss": 0.0137, "step": 164560 }, { "epoch": 0.83, "learning_rate": 0.0001754584760684321, "loss": 0.0121, "step": 164570 }, { "epoch": 0.83, "learning_rate": 0.0001754509083754181, "loss": 0.0107, "step": 164580 }, { "epoch": 0.83, "learning_rate": 0.0001754433406824041, "loss": 0.0125, "step": 164590 }, { "epoch": 0.83, "learning_rate": 0.00017543577298939007, "loss": 0.014, "step": 164600 }, { "epoch": 0.83, "learning_rate": 0.00017542820529637608, "loss": 0.0104, "step": 164610 }, { "epoch": 0.83, "learning_rate": 0.00017542063760336206, "loss": 0.016, "step": 164620 }, { "epoch": 0.83, "learning_rate": 0.00017541306991034804, "loss": 0.0153, "step": 164630 }, { "epoch": 0.83, "learning_rate": 0.00017540550221733405, "loss": 0.0118, "step": 164640 }, { "epoch": 0.83, "learning_rate": 0.00017539793452432003, "loss": 0.0119, "step": 164650 }, { "epoch": 0.83, "learning_rate": 0.000175390366831306, "loss": 0.0114, "step": 164660 }, { "epoch": 0.83, "learning_rate": 0.000175382799138292, "loss": 0.0138, "step": 164670 }, { "epoch": 0.83, "learning_rate": 0.000175375231445278, "loss": 0.0159, "step": 164680 }, { "epoch": 0.83, "learning_rate": 0.00017536766375226398, "loss": 0.013, "step": 164690 }, { "epoch": 0.83, "learning_rate": 0.00017536009605924997, "loss": 0.0117, "step": 164700 }, { "epoch": 0.83, "learning_rate": 0.00017535252836623597, "loss": 0.011, "step": 164710 }, { "epoch": 0.83, "learning_rate": 0.00017534496067322196, "loss": 0.0126, "step": 164720 }, { "epoch": 0.83, "learning_rate": 0.00017533739298020794, "loss": 0.0095, "step": 164730 }, { "epoch": 0.83, "learning_rate": 0.00017532982528719395, "loss": 0.0147, "step": 164740 }, { "epoch": 0.83, "learning_rate": 0.00017532225759417993, "loss": 0.0116, "step": 164750 }, { "epoch": 0.83, "learning_rate": 0.0001753146899011659, "loss": 0.0159, "step": 164760 }, { "epoch": 0.83, "learning_rate": 0.00017530712220815192, "loss": 0.016, "step": 164770 }, { "epoch": 0.83, "learning_rate": 0.0001752995545151379, "loss": 0.0113, "step": 164780 }, { "epoch": 0.83, "learning_rate": 0.00017529198682212388, "loss": 0.0161, "step": 164790 }, { "epoch": 0.83, "learning_rate": 0.0001752844191291099, "loss": 0.0122, "step": 164800 }, { "epoch": 0.83, "learning_rate": 0.00017527685143609587, "loss": 0.0103, "step": 164810 }, { "epoch": 0.83, "learning_rate": 0.00017526928374308185, "loss": 0.0138, "step": 164820 }, { "epoch": 0.83, "learning_rate": 0.00017526171605006783, "loss": 0.0142, "step": 164830 }, { "epoch": 0.83, "learning_rate": 0.00017525414835705384, "loss": 0.0111, "step": 164840 }, { "epoch": 0.83, "learning_rate": 0.00017524658066403982, "loss": 0.012, "step": 164850 }, { "epoch": 0.83, "learning_rate": 0.0001752390129710258, "loss": 0.0133, "step": 164860 }, { "epoch": 0.83, "learning_rate": 0.0001752314452780118, "loss": 0.0146, "step": 164870 }, { "epoch": 0.83, "learning_rate": 0.0001752238775849978, "loss": 0.013, "step": 164880 }, { "epoch": 0.83, "learning_rate": 0.00017521630989198378, "loss": 0.0146, "step": 164890 }, { "epoch": 0.83, "learning_rate": 0.00017520874219896978, "loss": 0.0109, "step": 164900 }, { "epoch": 0.83, "learning_rate": 0.00017520117450595577, "loss": 0.0128, "step": 164910 }, { "epoch": 0.83, "learning_rate": 0.00017519360681294175, "loss": 0.0135, "step": 164920 }, { "epoch": 0.83, "learning_rate": 0.00017518603911992776, "loss": 0.015, "step": 164930 }, { "epoch": 0.83, "learning_rate": 0.00017517847142691374, "loss": 0.0097, "step": 164940 }, { "epoch": 0.83, "learning_rate": 0.00017517090373389972, "loss": 0.013, "step": 164950 }, { "epoch": 0.83, "learning_rate": 0.00017516333604088573, "loss": 0.0096, "step": 164960 }, { "epoch": 0.83, "learning_rate": 0.0001751557683478717, "loss": 0.0137, "step": 164970 }, { "epoch": 0.83, "learning_rate": 0.0001751482006548577, "loss": 0.0133, "step": 164980 }, { "epoch": 0.83, "learning_rate": 0.0001751406329618437, "loss": 0.0143, "step": 164990 }, { "epoch": 0.83, "learning_rate": 0.00017513306526882968, "loss": 0.0129, "step": 165000 }, { "epoch": 0.83, "eval_cer": 0.9144586111496574, "eval_loss": 0.008332598023116589, "eval_runtime": 116.7175, "eval_samples_per_second": 17.135, "eval_steps_per_second": 4.284, "step": 165000 }, { "epoch": 0.83, "learning_rate": 0.00017512549757581566, "loss": 0.0141, "step": 165010 }, { "epoch": 0.83, "learning_rate": 0.00017511792988280164, "loss": 0.0119, "step": 165020 }, { "epoch": 0.83, "learning_rate": 0.00017511036218978765, "loss": 0.0104, "step": 165030 }, { "epoch": 0.83, "learning_rate": 0.00017510279449677363, "loss": 0.0161, "step": 165040 }, { "epoch": 0.83, "learning_rate": 0.00017509522680375961, "loss": 0.0128, "step": 165050 }, { "epoch": 0.83, "learning_rate": 0.00017508765911074562, "loss": 0.0116, "step": 165060 }, { "epoch": 0.83, "learning_rate": 0.0001750800914177316, "loss": 0.0123, "step": 165070 }, { "epoch": 0.83, "learning_rate": 0.00017507252372471759, "loss": 0.0106, "step": 165080 }, { "epoch": 0.83, "learning_rate": 0.0001750649560317036, "loss": 0.0124, "step": 165090 }, { "epoch": 0.83, "learning_rate": 0.00017505738833868958, "loss": 0.0103, "step": 165100 }, { "epoch": 0.83, "learning_rate": 0.00017504982064567556, "loss": 0.0126, "step": 165110 }, { "epoch": 0.83, "learning_rate": 0.00017504225295266157, "loss": 0.0129, "step": 165120 }, { "epoch": 0.83, "learning_rate": 0.00017503468525964755, "loss": 0.0126, "step": 165130 }, { "epoch": 0.83, "learning_rate": 0.00017502711756663353, "loss": 0.0123, "step": 165140 }, { "epoch": 0.83, "learning_rate": 0.00017501954987361954, "loss": 0.015, "step": 165150 }, { "epoch": 0.83, "learning_rate": 0.00017501198218060552, "loss": 0.0114, "step": 165160 }, { "epoch": 0.83, "learning_rate": 0.0001750044144875915, "loss": 0.0114, "step": 165170 }, { "epoch": 0.83, "learning_rate": 0.00017499684679457748, "loss": 0.0153, "step": 165180 }, { "epoch": 0.83, "learning_rate": 0.0001749892791015635, "loss": 0.0112, "step": 165190 }, { "epoch": 0.83, "learning_rate": 0.00017498171140854947, "loss": 0.01, "step": 165200 }, { "epoch": 0.83, "learning_rate": 0.00017497414371553545, "loss": 0.0115, "step": 165210 }, { "epoch": 0.83, "learning_rate": 0.00017496657602252146, "loss": 0.0123, "step": 165220 }, { "epoch": 0.83, "learning_rate": 0.00017495900832950744, "loss": 0.0108, "step": 165230 }, { "epoch": 0.83, "learning_rate": 0.00017495144063649342, "loss": 0.0118, "step": 165240 }, { "epoch": 0.83, "learning_rate": 0.00017494387294347943, "loss": 0.0105, "step": 165250 }, { "epoch": 0.83, "learning_rate": 0.00017493630525046541, "loss": 0.0114, "step": 165260 }, { "epoch": 0.83, "learning_rate": 0.0001749287375574514, "loss": 0.0103, "step": 165270 }, { "epoch": 0.83, "learning_rate": 0.0001749211698644374, "loss": 0.0143, "step": 165280 }, { "epoch": 0.83, "learning_rate": 0.00017491360217142336, "loss": 0.0137, "step": 165290 }, { "epoch": 0.83, "learning_rate": 0.00017490603447840934, "loss": 0.011, "step": 165300 }, { "epoch": 0.83, "learning_rate": 0.00017489846678539532, "loss": 0.0081, "step": 165310 }, { "epoch": 0.83, "learning_rate": 0.00017489089909238133, "loss": 0.0122, "step": 165320 }, { "epoch": 0.83, "learning_rate": 0.0001748833313993673, "loss": 0.0095, "step": 165330 }, { "epoch": 0.83, "learning_rate": 0.0001748757637063533, "loss": 0.0117, "step": 165340 }, { "epoch": 0.83, "learning_rate": 0.0001748681960133393, "loss": 0.0125, "step": 165350 }, { "epoch": 0.83, "learning_rate": 0.00017486062832032528, "loss": 0.0095, "step": 165360 }, { "epoch": 0.83, "learning_rate": 0.00017485306062731126, "loss": 0.0132, "step": 165370 }, { "epoch": 0.83, "learning_rate": 0.00017484549293429727, "loss": 0.0103, "step": 165380 }, { "epoch": 0.83, "learning_rate": 0.00017483792524128325, "loss": 0.0107, "step": 165390 }, { "epoch": 0.83, "learning_rate": 0.00017483035754826924, "loss": 0.0107, "step": 165400 }, { "epoch": 0.83, "learning_rate": 0.00017482278985525522, "loss": 0.0115, "step": 165410 }, { "epoch": 0.83, "learning_rate": 0.00017481522216224123, "loss": 0.0117, "step": 165420 }, { "epoch": 0.83, "learning_rate": 0.0001748076544692272, "loss": 0.0134, "step": 165430 }, { "epoch": 0.83, "learning_rate": 0.0001748000867762132, "loss": 0.0156, "step": 165440 }, { "epoch": 0.83, "learning_rate": 0.0001747925190831992, "loss": 0.0152, "step": 165450 }, { "epoch": 0.83, "learning_rate": 0.00017478495139018518, "loss": 0.0143, "step": 165460 }, { "epoch": 0.83, "learning_rate": 0.00017477738369717116, "loss": 0.0114, "step": 165470 }, { "epoch": 0.83, "learning_rate": 0.00017476981600415717, "loss": 0.0118, "step": 165480 }, { "epoch": 0.83, "learning_rate": 0.00017476224831114315, "loss": 0.0091, "step": 165490 }, { "epoch": 0.83, "learning_rate": 0.00017475468061812913, "loss": 0.0112, "step": 165500 }, { "epoch": 0.84, "learning_rate": 0.00017474711292511514, "loss": 0.0143, "step": 165510 }, { "epoch": 0.84, "learning_rate": 0.00017473954523210112, "loss": 0.0131, "step": 165520 }, { "epoch": 0.84, "learning_rate": 0.0001747319775390871, "loss": 0.0116, "step": 165530 }, { "epoch": 0.84, "learning_rate": 0.0001747244098460731, "loss": 0.0138, "step": 165540 }, { "epoch": 0.84, "learning_rate": 0.0001747168421530591, "loss": 0.0124, "step": 165550 }, { "epoch": 0.84, "learning_rate": 0.00017470927446004507, "loss": 0.0114, "step": 165560 }, { "epoch": 0.84, "learning_rate": 0.00017470170676703106, "loss": 0.0123, "step": 165570 }, { "epoch": 0.84, "learning_rate": 0.00017469413907401706, "loss": 0.0143, "step": 165580 }, { "epoch": 0.84, "learning_rate": 0.00017468657138100305, "loss": 0.0184, "step": 165590 }, { "epoch": 0.84, "learning_rate": 0.00017467900368798903, "loss": 0.0129, "step": 165600 }, { "epoch": 0.84, "learning_rate": 0.00017467143599497504, "loss": 0.012, "step": 165610 }, { "epoch": 0.84, "learning_rate": 0.00017466386830196102, "loss": 0.0108, "step": 165620 }, { "epoch": 0.84, "learning_rate": 0.000174656300608947, "loss": 0.0095, "step": 165630 }, { "epoch": 0.84, "learning_rate": 0.000174648732915933, "loss": 0.0122, "step": 165640 }, { "epoch": 0.84, "learning_rate": 0.000174641165222919, "loss": 0.013, "step": 165650 }, { "epoch": 0.84, "learning_rate": 0.00017463359752990497, "loss": 0.0153, "step": 165660 }, { "epoch": 0.84, "learning_rate": 0.00017462602983689098, "loss": 0.012, "step": 165670 }, { "epoch": 0.84, "learning_rate": 0.00017461846214387696, "loss": 0.0134, "step": 165680 }, { "epoch": 0.84, "learning_rate": 0.00017461089445086294, "loss": 0.0123, "step": 165690 }, { "epoch": 0.84, "learning_rate": 0.00017460332675784895, "loss": 0.0107, "step": 165700 }, { "epoch": 0.84, "learning_rate": 0.00017459575906483493, "loss": 0.012, "step": 165710 }, { "epoch": 0.84, "learning_rate": 0.0001745881913718209, "loss": 0.0105, "step": 165720 }, { "epoch": 0.84, "learning_rate": 0.0001745806236788069, "loss": 0.0115, "step": 165730 }, { "epoch": 0.84, "learning_rate": 0.0001745730559857929, "loss": 0.0161, "step": 165740 }, { "epoch": 0.84, "learning_rate": 0.00017456548829277888, "loss": 0.0111, "step": 165750 }, { "epoch": 0.84, "learning_rate": 0.00017455792059976487, "loss": 0.0125, "step": 165760 }, { "epoch": 0.84, "learning_rate": 0.00017455035290675087, "loss": 0.0112, "step": 165770 }, { "epoch": 0.84, "learning_rate": 0.00017454278521373686, "loss": 0.0128, "step": 165780 }, { "epoch": 0.84, "learning_rate": 0.00017453521752072284, "loss": 0.0127, "step": 165790 }, { "epoch": 0.84, "learning_rate": 0.00017452764982770885, "loss": 0.012, "step": 165800 }, { "epoch": 0.84, "learning_rate": 0.00017452008213469483, "loss": 0.0095, "step": 165810 }, { "epoch": 0.84, "learning_rate": 0.0001745125144416808, "loss": 0.0107, "step": 165820 }, { "epoch": 0.84, "learning_rate": 0.00017450494674866682, "loss": 0.0116, "step": 165830 }, { "epoch": 0.84, "learning_rate": 0.0001744973790556528, "loss": 0.0088, "step": 165840 }, { "epoch": 0.84, "learning_rate": 0.00017448981136263878, "loss": 0.0102, "step": 165850 }, { "epoch": 0.84, "learning_rate": 0.0001744822436696248, "loss": 0.01, "step": 165860 }, { "epoch": 0.84, "learning_rate": 0.00017447467597661077, "loss": 0.0103, "step": 165870 }, { "epoch": 0.84, "learning_rate": 0.00017446710828359675, "loss": 0.0114, "step": 165880 }, { "epoch": 0.84, "learning_rate": 0.00017445954059058276, "loss": 0.0148, "step": 165890 }, { "epoch": 0.84, "learning_rate": 0.00017445197289756874, "loss": 0.0133, "step": 165900 }, { "epoch": 0.84, "learning_rate": 0.00017444440520455472, "loss": 0.0115, "step": 165910 }, { "epoch": 0.84, "learning_rate": 0.0001744368375115407, "loss": 0.0105, "step": 165920 }, { "epoch": 0.84, "learning_rate": 0.0001744292698185267, "loss": 0.0107, "step": 165930 }, { "epoch": 0.84, "learning_rate": 0.0001744217021255127, "loss": 0.0098, "step": 165940 }, { "epoch": 0.84, "learning_rate": 0.00017441413443249868, "loss": 0.0108, "step": 165950 }, { "epoch": 0.84, "learning_rate": 0.00017440656673948468, "loss": 0.0116, "step": 165960 }, { "epoch": 0.84, "learning_rate": 0.00017439899904647067, "loss": 0.01, "step": 165970 }, { "epoch": 0.84, "learning_rate": 0.00017439143135345665, "loss": 0.0128, "step": 165980 }, { "epoch": 0.84, "learning_rate": 0.00017438386366044266, "loss": 0.0129, "step": 165990 }, { "epoch": 0.84, "learning_rate": 0.00017437629596742864, "loss": 0.0114, "step": 166000 }, { "epoch": 0.84, "eval_cer": 0.9144508479806542, "eval_loss": 0.008648986928164959, "eval_runtime": 116.5926, "eval_samples_per_second": 17.154, "eval_steps_per_second": 4.288, "step": 166000 }, { "epoch": 0.84, "learning_rate": 0.00017436872827441462, "loss": 0.0157, "step": 166010 }, { "epoch": 0.84, "learning_rate": 0.00017436116058140063, "loss": 0.0134, "step": 166020 }, { "epoch": 0.84, "learning_rate": 0.0001743535928883866, "loss": 0.0149, "step": 166030 }, { "epoch": 0.84, "learning_rate": 0.0001743460251953726, "loss": 0.0105, "step": 166040 }, { "epoch": 0.84, "learning_rate": 0.0001743384575023586, "loss": 0.0075, "step": 166050 }, { "epoch": 0.84, "learning_rate": 0.00017433088980934458, "loss": 0.0124, "step": 166060 }, { "epoch": 0.84, "learning_rate": 0.00017432332211633056, "loss": 0.011, "step": 166070 }, { "epoch": 0.84, "learning_rate": 0.00017431575442331654, "loss": 0.0146, "step": 166080 }, { "epoch": 0.84, "learning_rate": 0.00017430818673030255, "loss": 0.0113, "step": 166090 }, { "epoch": 0.84, "learning_rate": 0.00017430061903728853, "loss": 0.0151, "step": 166100 }, { "epoch": 0.84, "learning_rate": 0.00017429305134427451, "loss": 0.0094, "step": 166110 }, { "epoch": 0.84, "learning_rate": 0.00017428548365126052, "loss": 0.0113, "step": 166120 }, { "epoch": 0.84, "learning_rate": 0.0001742779159582465, "loss": 0.0137, "step": 166130 }, { "epoch": 0.84, "learning_rate": 0.00017427034826523249, "loss": 0.0128, "step": 166140 }, { "epoch": 0.84, "learning_rate": 0.0001742627805722185, "loss": 0.0154, "step": 166150 }, { "epoch": 0.84, "learning_rate": 0.00017425521287920448, "loss": 0.013, "step": 166160 }, { "epoch": 0.84, "learning_rate": 0.00017424764518619046, "loss": 0.0152, "step": 166170 }, { "epoch": 0.84, "learning_rate": 0.00017424007749317647, "loss": 0.0132, "step": 166180 }, { "epoch": 0.84, "learning_rate": 0.00017423250980016245, "loss": 0.0114, "step": 166190 }, { "epoch": 0.84, "learning_rate": 0.00017422494210714843, "loss": 0.0114, "step": 166200 }, { "epoch": 0.84, "learning_rate": 0.00017421737441413444, "loss": 0.0129, "step": 166210 }, { "epoch": 0.84, "learning_rate": 0.00017420980672112042, "loss": 0.0129, "step": 166220 }, { "epoch": 0.84, "learning_rate": 0.0001742022390281064, "loss": 0.0094, "step": 166230 }, { "epoch": 0.84, "learning_rate": 0.00017419467133509238, "loss": 0.0112, "step": 166240 }, { "epoch": 0.84, "learning_rate": 0.0001741871036420784, "loss": 0.0107, "step": 166250 }, { "epoch": 0.84, "learning_rate": 0.00017417953594906437, "loss": 0.0133, "step": 166260 }, { "epoch": 0.84, "learning_rate": 0.00017417196825605035, "loss": 0.0128, "step": 166270 }, { "epoch": 0.84, "learning_rate": 0.00017416440056303636, "loss": 0.0112, "step": 166280 }, { "epoch": 0.84, "learning_rate": 0.00017415683287002234, "loss": 0.013, "step": 166290 }, { "epoch": 0.84, "learning_rate": 0.00017414926517700832, "loss": 0.0125, "step": 166300 }, { "epoch": 0.84, "learning_rate": 0.00017414169748399433, "loss": 0.0129, "step": 166310 }, { "epoch": 0.84, "learning_rate": 0.00017413412979098031, "loss": 0.0122, "step": 166320 }, { "epoch": 0.84, "learning_rate": 0.0001741265620979663, "loss": 0.0102, "step": 166330 }, { "epoch": 0.84, "learning_rate": 0.0001741189944049523, "loss": 0.0123, "step": 166340 }, { "epoch": 0.84, "learning_rate": 0.00017411142671193829, "loss": 0.0116, "step": 166350 }, { "epoch": 0.84, "learning_rate": 0.00017410385901892427, "loss": 0.0143, "step": 166360 }, { "epoch": 0.84, "learning_rate": 0.00017409629132591028, "loss": 0.0112, "step": 166370 }, { "epoch": 0.84, "learning_rate": 0.00017408872363289626, "loss": 0.0116, "step": 166380 }, { "epoch": 0.84, "learning_rate": 0.00017408115593988224, "loss": 0.0101, "step": 166390 }, { "epoch": 0.84, "learning_rate": 0.00017407358824686825, "loss": 0.0112, "step": 166400 }, { "epoch": 0.84, "learning_rate": 0.00017406602055385423, "loss": 0.0138, "step": 166410 }, { "epoch": 0.84, "learning_rate": 0.0001740584528608402, "loss": 0.0123, "step": 166420 }, { "epoch": 0.84, "learning_rate": 0.0001740508851678262, "loss": 0.0136, "step": 166430 }, { "epoch": 0.84, "learning_rate": 0.0001740433174748122, "loss": 0.0097, "step": 166440 }, { "epoch": 0.84, "learning_rate": 0.00017403574978179818, "loss": 0.012, "step": 166450 }, { "epoch": 0.84, "learning_rate": 0.00017402818208878416, "loss": 0.0113, "step": 166460 }, { "epoch": 0.84, "learning_rate": 0.00017402061439577017, "loss": 0.0106, "step": 166470 }, { "epoch": 0.84, "learning_rate": 0.00017401304670275615, "loss": 0.0121, "step": 166480 }, { "epoch": 0.84, "learning_rate": 0.00017400547900974213, "loss": 0.012, "step": 166490 }, { "epoch": 0.84, "learning_rate": 0.00017399791131672814, "loss": 0.0156, "step": 166500 }, { "epoch": 0.84, "learning_rate": 0.00017399034362371412, "loss": 0.0114, "step": 166510 }, { "epoch": 0.84, "learning_rate": 0.0001739827759307001, "loss": 0.0105, "step": 166520 }, { "epoch": 0.84, "learning_rate": 0.00017397520823768611, "loss": 0.011, "step": 166530 }, { "epoch": 0.84, "learning_rate": 0.00017396764054467207, "loss": 0.0108, "step": 166540 }, { "epoch": 0.84, "learning_rate": 0.00017396007285165805, "loss": 0.0133, "step": 166550 }, { "epoch": 0.84, "learning_rate": 0.00017395250515864403, "loss": 0.0113, "step": 166560 }, { "epoch": 0.84, "learning_rate": 0.00017394493746563004, "loss": 0.0152, "step": 166570 }, { "epoch": 0.84, "learning_rate": 0.00017393736977261602, "loss": 0.0163, "step": 166580 }, { "epoch": 0.84, "learning_rate": 0.000173929802079602, "loss": 0.0113, "step": 166590 }, { "epoch": 0.84, "learning_rate": 0.000173922234386588, "loss": 0.0157, "step": 166600 }, { "epoch": 0.84, "learning_rate": 0.000173914666693574, "loss": 0.0118, "step": 166610 }, { "epoch": 0.84, "learning_rate": 0.00017390709900055997, "loss": 0.016, "step": 166620 }, { "epoch": 0.84, "learning_rate": 0.00017389953130754596, "loss": 0.0121, "step": 166630 }, { "epoch": 0.84, "learning_rate": 0.00017389196361453196, "loss": 0.0125, "step": 166640 }, { "epoch": 0.84, "learning_rate": 0.00017388439592151795, "loss": 0.0123, "step": 166650 }, { "epoch": 0.84, "learning_rate": 0.00017387682822850393, "loss": 0.0106, "step": 166660 }, { "epoch": 0.84, "learning_rate": 0.00017386926053548994, "loss": 0.0118, "step": 166670 }, { "epoch": 0.84, "learning_rate": 0.00017386169284247592, "loss": 0.0119, "step": 166680 }, { "epoch": 0.84, "learning_rate": 0.0001738541251494619, "loss": 0.0081, "step": 166690 }, { "epoch": 0.84, "learning_rate": 0.0001738465574564479, "loss": 0.0124, "step": 166700 }, { "epoch": 0.84, "learning_rate": 0.0001738389897634339, "loss": 0.0149, "step": 166710 }, { "epoch": 0.84, "learning_rate": 0.00017383142207041987, "loss": 0.0119, "step": 166720 }, { "epoch": 0.84, "learning_rate": 0.00017382385437740588, "loss": 0.0129, "step": 166730 }, { "epoch": 0.84, "learning_rate": 0.00017381628668439186, "loss": 0.0107, "step": 166740 }, { "epoch": 0.84, "learning_rate": 0.00017380871899137784, "loss": 0.0131, "step": 166750 }, { "epoch": 0.84, "learning_rate": 0.00017380115129836385, "loss": 0.0118, "step": 166760 }, { "epoch": 0.84, "learning_rate": 0.00017379358360534983, "loss": 0.0103, "step": 166770 }, { "epoch": 0.84, "learning_rate": 0.0001737860159123358, "loss": 0.0115, "step": 166780 }, { "epoch": 0.84, "learning_rate": 0.00017377844821932182, "loss": 0.0114, "step": 166790 }, { "epoch": 0.84, "learning_rate": 0.0001737708805263078, "loss": 0.0098, "step": 166800 }, { "epoch": 0.84, "learning_rate": 0.00017376331283329378, "loss": 0.0121, "step": 166810 }, { "epoch": 0.84, "learning_rate": 0.00017375574514027977, "loss": 0.0119, "step": 166820 }, { "epoch": 0.84, "learning_rate": 0.00017374817744726577, "loss": 0.0106, "step": 166830 }, { "epoch": 0.84, "learning_rate": 0.00017374060975425176, "loss": 0.0118, "step": 166840 }, { "epoch": 0.84, "learning_rate": 0.00017373304206123774, "loss": 0.0119, "step": 166850 }, { "epoch": 0.84, "learning_rate": 0.00017372547436822375, "loss": 0.0102, "step": 166860 }, { "epoch": 0.84, "learning_rate": 0.00017371790667520973, "loss": 0.0139, "step": 166870 }, { "epoch": 0.84, "learning_rate": 0.0001737103389821957, "loss": 0.0119, "step": 166880 }, { "epoch": 0.84, "learning_rate": 0.00017370277128918172, "loss": 0.0108, "step": 166890 }, { "epoch": 0.84, "learning_rate": 0.0001736952035961677, "loss": 0.0122, "step": 166900 }, { "epoch": 0.84, "learning_rate": 0.00017368763590315368, "loss": 0.0102, "step": 166910 }, { "epoch": 0.84, "learning_rate": 0.0001736800682101397, "loss": 0.0112, "step": 166920 }, { "epoch": 0.84, "learning_rate": 0.00017367250051712567, "loss": 0.01, "step": 166930 }, { "epoch": 0.84, "learning_rate": 0.00017366493282411165, "loss": 0.0123, "step": 166940 }, { "epoch": 0.84, "learning_rate": 0.00017365736513109766, "loss": 0.0113, "step": 166950 }, { "epoch": 0.84, "learning_rate": 0.00017364979743808364, "loss": 0.0096, "step": 166960 }, { "epoch": 0.84, "learning_rate": 0.00017364222974506962, "loss": 0.0096, "step": 166970 }, { "epoch": 0.84, "learning_rate": 0.0001736346620520556, "loss": 0.0114, "step": 166980 }, { "epoch": 0.84, "learning_rate": 0.0001736270943590416, "loss": 0.0108, "step": 166990 }, { "epoch": 0.84, "learning_rate": 0.0001736195266660276, "loss": 0.0144, "step": 167000 }, { "epoch": 0.84, "eval_cer": 0.9144906342217957, "eval_loss": 0.008696102537214756, "eval_runtime": 116.717, "eval_samples_per_second": 17.135, "eval_steps_per_second": 4.284, "step": 167000 }, { "epoch": 0.84, "learning_rate": 0.00017361195897301358, "loss": 0.0094, "step": 167010 }, { "epoch": 0.84, "learning_rate": 0.00017360439127999958, "loss": 0.0124, "step": 167020 }, { "epoch": 0.84, "learning_rate": 0.00017359682358698557, "loss": 0.0132, "step": 167030 }, { "epoch": 0.84, "learning_rate": 0.00017358925589397155, "loss": 0.01, "step": 167040 }, { "epoch": 0.84, "learning_rate": 0.00017358168820095756, "loss": 0.0132, "step": 167050 }, { "epoch": 0.84, "learning_rate": 0.00017357412050794354, "loss": 0.0123, "step": 167060 }, { "epoch": 0.84, "learning_rate": 0.00017356655281492952, "loss": 0.0114, "step": 167070 }, { "epoch": 0.84, "learning_rate": 0.00017355898512191553, "loss": 0.0145, "step": 167080 }, { "epoch": 0.84, "learning_rate": 0.0001735514174289015, "loss": 0.01, "step": 167090 }, { "epoch": 0.84, "learning_rate": 0.0001735438497358875, "loss": 0.0122, "step": 167100 }, { "epoch": 0.84, "learning_rate": 0.0001735362820428735, "loss": 0.0117, "step": 167110 }, { "epoch": 0.84, "learning_rate": 0.00017352871434985948, "loss": 0.0097, "step": 167120 }, { "epoch": 0.84, "learning_rate": 0.00017352114665684546, "loss": 0.013, "step": 167130 }, { "epoch": 0.84, "learning_rate": 0.00017351357896383144, "loss": 0.0112, "step": 167140 }, { "epoch": 0.84, "learning_rate": 0.00017350601127081745, "loss": 0.0142, "step": 167150 }, { "epoch": 0.84, "learning_rate": 0.00017349844357780343, "loss": 0.0128, "step": 167160 }, { "epoch": 0.84, "learning_rate": 0.00017349087588478941, "loss": 0.0121, "step": 167170 }, { "epoch": 0.84, "learning_rate": 0.00017348330819177542, "loss": 0.0113, "step": 167180 }, { "epoch": 0.84, "learning_rate": 0.0001734757404987614, "loss": 0.0109, "step": 167190 }, { "epoch": 0.84, "learning_rate": 0.00017346817280574739, "loss": 0.0136, "step": 167200 }, { "epoch": 0.84, "learning_rate": 0.0001734606051127334, "loss": 0.0099, "step": 167210 }, { "epoch": 0.84, "learning_rate": 0.00017345303741971938, "loss": 0.0107, "step": 167220 }, { "epoch": 0.84, "learning_rate": 0.00017344546972670536, "loss": 0.0121, "step": 167230 }, { "epoch": 0.84, "learning_rate": 0.00017343790203369137, "loss": 0.011, "step": 167240 }, { "epoch": 0.84, "learning_rate": 0.00017343033434067735, "loss": 0.0119, "step": 167250 }, { "epoch": 0.84, "learning_rate": 0.00017342276664766333, "loss": 0.0121, "step": 167260 }, { "epoch": 0.84, "learning_rate": 0.00017341519895464934, "loss": 0.0112, "step": 167270 }, { "epoch": 0.84, "learning_rate": 0.00017340763126163532, "loss": 0.0117, "step": 167280 }, { "epoch": 0.84, "learning_rate": 0.0001734000635686213, "loss": 0.012, "step": 167290 }, { "epoch": 0.84, "learning_rate": 0.0001733924958756073, "loss": 0.0103, "step": 167300 }, { "epoch": 0.84, "learning_rate": 0.0001733849281825933, "loss": 0.0111, "step": 167310 }, { "epoch": 0.84, "learning_rate": 0.00017337736048957927, "loss": 0.0115, "step": 167320 }, { "epoch": 0.84, "learning_rate": 0.00017336979279656525, "loss": 0.0086, "step": 167330 }, { "epoch": 0.84, "learning_rate": 0.00017336222510355126, "loss": 0.0151, "step": 167340 }, { "epoch": 0.84, "learning_rate": 0.00017335465741053724, "loss": 0.0096, "step": 167350 }, { "epoch": 0.84, "learning_rate": 0.00017334708971752322, "loss": 0.0109, "step": 167360 }, { "epoch": 0.84, "learning_rate": 0.00017333952202450923, "loss": 0.0148, "step": 167370 }, { "epoch": 0.84, "learning_rate": 0.00017333195433149521, "loss": 0.013, "step": 167380 }, { "epoch": 0.84, "learning_rate": 0.0001733243866384812, "loss": 0.0121, "step": 167390 }, { "epoch": 0.84, "learning_rate": 0.0001733168189454672, "loss": 0.0105, "step": 167400 }, { "epoch": 0.84, "learning_rate": 0.00017330925125245319, "loss": 0.0123, "step": 167410 }, { "epoch": 0.84, "learning_rate": 0.00017330168355943917, "loss": 0.0119, "step": 167420 }, { "epoch": 0.84, "learning_rate": 0.00017329411586642518, "loss": 0.0118, "step": 167430 }, { "epoch": 0.84, "learning_rate": 0.00017328654817341116, "loss": 0.0103, "step": 167440 }, { "epoch": 0.84, "learning_rate": 0.00017327898048039714, "loss": 0.0102, "step": 167450 }, { "epoch": 0.84, "learning_rate": 0.00017327141278738315, "loss": 0.0108, "step": 167460 }, { "epoch": 0.84, "learning_rate": 0.00017326384509436913, "loss": 0.0096, "step": 167470 }, { "epoch": 0.84, "learning_rate": 0.0001732562774013551, "loss": 0.0141, "step": 167480 }, { "epoch": 0.85, "learning_rate": 0.0001732487097083411, "loss": 0.0153, "step": 167490 }, { "epoch": 0.85, "learning_rate": 0.0001732411420153271, "loss": 0.0126, "step": 167500 }, { "epoch": 0.85, "learning_rate": 0.00017323357432231308, "loss": 0.0137, "step": 167510 }, { "epoch": 0.85, "learning_rate": 0.00017322600662929906, "loss": 0.015, "step": 167520 }, { "epoch": 0.85, "learning_rate": 0.00017321843893628507, "loss": 0.0118, "step": 167530 }, { "epoch": 0.85, "learning_rate": 0.00017321087124327105, "loss": 0.0108, "step": 167540 }, { "epoch": 0.85, "learning_rate": 0.00017320330355025703, "loss": 0.0101, "step": 167550 }, { "epoch": 0.85, "learning_rate": 0.00017319573585724304, "loss": 0.0102, "step": 167560 }, { "epoch": 0.85, "learning_rate": 0.00017318816816422902, "loss": 0.0129, "step": 167570 }, { "epoch": 0.85, "learning_rate": 0.000173180600471215, "loss": 0.0145, "step": 167580 }, { "epoch": 0.85, "learning_rate": 0.00017317303277820101, "loss": 0.012, "step": 167590 }, { "epoch": 0.85, "learning_rate": 0.000173165465085187, "loss": 0.0163, "step": 167600 }, { "epoch": 0.85, "learning_rate": 0.00017315789739217298, "loss": 0.0091, "step": 167610 }, { "epoch": 0.85, "learning_rate": 0.00017315032969915899, "loss": 0.0127, "step": 167620 }, { "epoch": 0.85, "learning_rate": 0.00017314276200614497, "loss": 0.0114, "step": 167630 }, { "epoch": 0.85, "learning_rate": 0.00017313519431313095, "loss": 0.0142, "step": 167640 }, { "epoch": 0.85, "learning_rate": 0.00017312762662011693, "loss": 0.0122, "step": 167650 }, { "epoch": 0.85, "learning_rate": 0.00017312005892710294, "loss": 0.011, "step": 167660 }, { "epoch": 0.85, "learning_rate": 0.00017311249123408892, "loss": 0.0138, "step": 167670 }, { "epoch": 0.85, "learning_rate": 0.0001731049235410749, "loss": 0.014, "step": 167680 }, { "epoch": 0.85, "learning_rate": 0.0001730973558480609, "loss": 0.0115, "step": 167690 }, { "epoch": 0.85, "learning_rate": 0.0001730897881550469, "loss": 0.0123, "step": 167700 }, { "epoch": 0.85, "learning_rate": 0.00017308222046203287, "loss": 0.0152, "step": 167710 }, { "epoch": 0.85, "learning_rate": 0.00017307465276901888, "loss": 0.0124, "step": 167720 }, { "epoch": 0.85, "learning_rate": 0.00017306708507600486, "loss": 0.0114, "step": 167730 }, { "epoch": 0.85, "learning_rate": 0.00017305951738299084, "loss": 0.0119, "step": 167740 }, { "epoch": 0.85, "learning_rate": 0.00017305194968997685, "loss": 0.0122, "step": 167750 }, { "epoch": 0.85, "learning_rate": 0.00017304438199696283, "loss": 0.0202, "step": 167760 }, { "epoch": 0.85, "learning_rate": 0.00017303681430394882, "loss": 0.012, "step": 167770 }, { "epoch": 0.85, "learning_rate": 0.00017302924661093482, "loss": 0.0115, "step": 167780 }, { "epoch": 0.85, "learning_rate": 0.0001730216789179208, "loss": 0.011, "step": 167790 }, { "epoch": 0.85, "learning_rate": 0.00017301411122490676, "loss": 0.0136, "step": 167800 }, { "epoch": 0.85, "learning_rate": 0.00017300654353189274, "loss": 0.012, "step": 167810 }, { "epoch": 0.85, "learning_rate": 0.00017299897583887875, "loss": 0.0144, "step": 167820 }, { "epoch": 0.85, "learning_rate": 0.00017299140814586473, "loss": 0.0135, "step": 167830 }, { "epoch": 0.85, "learning_rate": 0.00017298384045285071, "loss": 0.0133, "step": 167840 }, { "epoch": 0.85, "learning_rate": 0.00017297627275983672, "loss": 0.012, "step": 167850 }, { "epoch": 0.85, "learning_rate": 0.0001729687050668227, "loss": 0.0126, "step": 167860 }, { "epoch": 0.85, "learning_rate": 0.00017296113737380869, "loss": 0.0136, "step": 167870 }, { "epoch": 0.85, "learning_rate": 0.00017295356968079467, "loss": 0.0127, "step": 167880 }, { "epoch": 0.85, "learning_rate": 0.00017294600198778067, "loss": 0.0127, "step": 167890 }, { "epoch": 0.85, "learning_rate": 0.00017293843429476666, "loss": 0.0118, "step": 167900 }, { "epoch": 0.85, "learning_rate": 0.00017293086660175264, "loss": 0.0123, "step": 167910 }, { "epoch": 0.85, "learning_rate": 0.00017292329890873865, "loss": 0.0128, "step": 167920 }, { "epoch": 0.85, "learning_rate": 0.00017291573121572463, "loss": 0.0128, "step": 167930 }, { "epoch": 0.85, "learning_rate": 0.0001729081635227106, "loss": 0.0138, "step": 167940 }, { "epoch": 0.85, "learning_rate": 0.00017290059582969662, "loss": 0.0138, "step": 167950 }, { "epoch": 0.85, "learning_rate": 0.0001728930281366826, "loss": 0.0106, "step": 167960 }, { "epoch": 0.85, "learning_rate": 0.00017288546044366858, "loss": 0.0127, "step": 167970 }, { "epoch": 0.85, "learning_rate": 0.0001728778927506546, "loss": 0.0111, "step": 167980 }, { "epoch": 0.85, "learning_rate": 0.00017287032505764057, "loss": 0.0111, "step": 167990 }, { "epoch": 0.85, "learning_rate": 0.00017286275736462655, "loss": 0.012, "step": 168000 }, { "epoch": 0.85, "eval_cer": 0.9144615223380336, "eval_loss": 0.008770990185439587, "eval_runtime": 116.7217, "eval_samples_per_second": 17.135, "eval_steps_per_second": 4.284, "step": 168000 }, { "epoch": 0.85, "learning_rate": 0.00017285518967161256, "loss": 0.0147, "step": 168010 }, { "epoch": 0.85, "learning_rate": 0.00017284762197859854, "loss": 0.0125, "step": 168020 }, { "epoch": 0.85, "learning_rate": 0.00017284005428558452, "loss": 0.012, "step": 168030 }, { "epoch": 0.85, "learning_rate": 0.0001728324865925705, "loss": 0.0086, "step": 168040 }, { "epoch": 0.85, "learning_rate": 0.00017282491889955651, "loss": 0.0135, "step": 168050 }, { "epoch": 0.85, "learning_rate": 0.0001728173512065425, "loss": 0.0141, "step": 168060 }, { "epoch": 0.85, "learning_rate": 0.00017280978351352848, "loss": 0.0135, "step": 168070 }, { "epoch": 0.85, "learning_rate": 0.00017280221582051449, "loss": 0.0137, "step": 168080 }, { "epoch": 0.85, "learning_rate": 0.00017279464812750047, "loss": 0.01, "step": 168090 }, { "epoch": 0.85, "learning_rate": 0.00017278708043448645, "loss": 0.0123, "step": 168100 }, { "epoch": 0.85, "learning_rate": 0.00017277951274147246, "loss": 0.013, "step": 168110 }, { "epoch": 0.85, "learning_rate": 0.00017277194504845844, "loss": 0.01, "step": 168120 }, { "epoch": 0.85, "learning_rate": 0.00017276437735544442, "loss": 0.0123, "step": 168130 }, { "epoch": 0.85, "learning_rate": 0.00017275680966243043, "loss": 0.0131, "step": 168140 }, { "epoch": 0.85, "learning_rate": 0.0001727492419694164, "loss": 0.01, "step": 168150 }, { "epoch": 0.85, "learning_rate": 0.0001727416742764024, "loss": 0.0154, "step": 168160 }, { "epoch": 0.85, "learning_rate": 0.0001727341065833884, "loss": 0.0103, "step": 168170 }, { "epoch": 0.85, "learning_rate": 0.00017272653889037438, "loss": 0.0105, "step": 168180 }, { "epoch": 0.85, "learning_rate": 0.00017271897119736036, "loss": 0.0125, "step": 168190 }, { "epoch": 0.85, "learning_rate": 0.00017271140350434637, "loss": 0.0122, "step": 168200 }, { "epoch": 0.85, "learning_rate": 0.00017270383581133235, "loss": 0.0112, "step": 168210 }, { "epoch": 0.85, "learning_rate": 0.00017269626811831833, "loss": 0.0126, "step": 168220 }, { "epoch": 0.85, "learning_rate": 0.00017268870042530432, "loss": 0.0117, "step": 168230 }, { "epoch": 0.85, "learning_rate": 0.00017268113273229032, "loss": 0.0132, "step": 168240 }, { "epoch": 0.85, "learning_rate": 0.0001726735650392763, "loss": 0.0142, "step": 168250 }, { "epoch": 0.85, "learning_rate": 0.0001726659973462623, "loss": 0.0142, "step": 168260 }, { "epoch": 0.85, "learning_rate": 0.0001726584296532483, "loss": 0.0155, "step": 168270 }, { "epoch": 0.85, "learning_rate": 0.00017265086196023428, "loss": 0.0107, "step": 168280 }, { "epoch": 0.85, "learning_rate": 0.00017264329426722026, "loss": 0.0107, "step": 168290 }, { "epoch": 0.85, "learning_rate": 0.00017263572657420627, "loss": 0.0151, "step": 168300 }, { "epoch": 0.85, "learning_rate": 0.00017262815888119225, "loss": 0.0118, "step": 168310 }, { "epoch": 0.85, "learning_rate": 0.00017262059118817823, "loss": 0.014, "step": 168320 }, { "epoch": 0.85, "learning_rate": 0.00017261302349516424, "loss": 0.0142, "step": 168330 }, { "epoch": 0.85, "learning_rate": 0.00017260545580215022, "loss": 0.0116, "step": 168340 }, { "epoch": 0.85, "learning_rate": 0.0001725978881091362, "loss": 0.0125, "step": 168350 }, { "epoch": 0.85, "learning_rate": 0.0001725903204161222, "loss": 0.0129, "step": 168360 }, { "epoch": 0.85, "learning_rate": 0.0001725827527231082, "loss": 0.0115, "step": 168370 }, { "epoch": 0.85, "learning_rate": 0.00017257518503009417, "loss": 0.0126, "step": 168380 }, { "epoch": 0.85, "learning_rate": 0.00017256761733708015, "loss": 0.014, "step": 168390 }, { "epoch": 0.85, "learning_rate": 0.00017256004964406616, "loss": 0.0147, "step": 168400 }, { "epoch": 0.85, "learning_rate": 0.00017255248195105214, "loss": 0.0114, "step": 168410 }, { "epoch": 0.85, "learning_rate": 0.00017254491425803813, "loss": 0.0113, "step": 168420 }, { "epoch": 0.85, "learning_rate": 0.00017253734656502413, "loss": 0.0099, "step": 168430 }, { "epoch": 0.85, "learning_rate": 0.00017252977887201012, "loss": 0.0123, "step": 168440 }, { "epoch": 0.85, "learning_rate": 0.0001725222111789961, "loss": 0.0137, "step": 168450 }, { "epoch": 0.85, "learning_rate": 0.0001725146434859821, "loss": 0.0128, "step": 168460 }, { "epoch": 0.85, "learning_rate": 0.0001725070757929681, "loss": 0.0117, "step": 168470 }, { "epoch": 0.85, "learning_rate": 0.00017249950809995407, "loss": 0.0119, "step": 168480 }, { "epoch": 0.85, "learning_rate": 0.00017249194040694008, "loss": 0.0117, "step": 168490 }, { "epoch": 0.85, "learning_rate": 0.00017248437271392606, "loss": 0.0097, "step": 168500 }, { "epoch": 0.85, "learning_rate": 0.00017247680502091204, "loss": 0.0095, "step": 168510 }, { "epoch": 0.85, "learning_rate": 0.00017246923732789805, "loss": 0.0114, "step": 168520 }, { "epoch": 0.85, "learning_rate": 0.00017246166963488403, "loss": 0.0118, "step": 168530 }, { "epoch": 0.85, "learning_rate": 0.00017245410194187, "loss": 0.0109, "step": 168540 }, { "epoch": 0.85, "learning_rate": 0.000172446534248856, "loss": 0.0108, "step": 168550 }, { "epoch": 0.85, "learning_rate": 0.000172438966555842, "loss": 0.0125, "step": 168560 }, { "epoch": 0.85, "learning_rate": 0.00017243139886282798, "loss": 0.0102, "step": 168570 }, { "epoch": 0.85, "learning_rate": 0.00017242383116981396, "loss": 0.0117, "step": 168580 }, { "epoch": 0.85, "learning_rate": 0.00017241626347679997, "loss": 0.0107, "step": 168590 }, { "epoch": 0.85, "learning_rate": 0.00017240869578378595, "loss": 0.0119, "step": 168600 }, { "epoch": 0.85, "learning_rate": 0.00017240112809077194, "loss": 0.0104, "step": 168610 }, { "epoch": 0.85, "learning_rate": 0.00017239356039775794, "loss": 0.013, "step": 168620 }, { "epoch": 0.85, "learning_rate": 0.00017238599270474393, "loss": 0.0133, "step": 168630 }, { "epoch": 0.85, "learning_rate": 0.0001723784250117299, "loss": 0.014, "step": 168640 }, { "epoch": 0.85, "learning_rate": 0.00017237085731871592, "loss": 0.0151, "step": 168650 }, { "epoch": 0.85, "learning_rate": 0.0001723632896257019, "loss": 0.0118, "step": 168660 }, { "epoch": 0.85, "learning_rate": 0.00017235572193268788, "loss": 0.017, "step": 168670 }, { "epoch": 0.85, "learning_rate": 0.0001723481542396739, "loss": 0.0123, "step": 168680 }, { "epoch": 0.85, "learning_rate": 0.00017234058654665987, "loss": 0.0113, "step": 168690 }, { "epoch": 0.85, "learning_rate": 0.00017233301885364585, "loss": 0.0135, "step": 168700 }, { "epoch": 0.85, "learning_rate": 0.00017232545116063183, "loss": 0.0087, "step": 168710 }, { "epoch": 0.85, "learning_rate": 0.00017231788346761784, "loss": 0.0144, "step": 168720 }, { "epoch": 0.85, "learning_rate": 0.00017231031577460382, "loss": 0.0153, "step": 168730 }, { "epoch": 0.85, "learning_rate": 0.0001723027480815898, "loss": 0.0119, "step": 168740 }, { "epoch": 0.85, "learning_rate": 0.0001722951803885758, "loss": 0.0116, "step": 168750 }, { "epoch": 0.85, "learning_rate": 0.0001722876126955618, "loss": 0.0104, "step": 168760 }, { "epoch": 0.85, "learning_rate": 0.00017228004500254777, "loss": 0.0118, "step": 168770 }, { "epoch": 0.85, "learning_rate": 0.00017227247730953378, "loss": 0.0119, "step": 168780 }, { "epoch": 0.85, "learning_rate": 0.00017226490961651976, "loss": 0.0123, "step": 168790 }, { "epoch": 0.85, "learning_rate": 0.00017225734192350575, "loss": 0.0121, "step": 168800 }, { "epoch": 0.85, "learning_rate": 0.00017224977423049175, "loss": 0.0109, "step": 168810 }, { "epoch": 0.85, "learning_rate": 0.00017224220653747774, "loss": 0.0138, "step": 168820 }, { "epoch": 0.85, "learning_rate": 0.00017223463884446372, "loss": 0.014, "step": 168830 }, { "epoch": 0.85, "learning_rate": 0.00017222707115144973, "loss": 0.011, "step": 168840 }, { "epoch": 0.85, "learning_rate": 0.0001722195034584357, "loss": 0.0108, "step": 168850 }, { "epoch": 0.85, "learning_rate": 0.0001722119357654217, "loss": 0.0111, "step": 168860 }, { "epoch": 0.85, "learning_rate": 0.0001722043680724077, "loss": 0.0112, "step": 168870 }, { "epoch": 0.85, "learning_rate": 0.00017219680037939368, "loss": 0.0131, "step": 168880 }, { "epoch": 0.85, "learning_rate": 0.00017218923268637966, "loss": 0.014, "step": 168890 }, { "epoch": 0.85, "learning_rate": 0.00017218166499336564, "loss": 0.0154, "step": 168900 }, { "epoch": 0.85, "learning_rate": 0.00017217409730035165, "loss": 0.0108, "step": 168910 }, { "epoch": 0.85, "learning_rate": 0.00017216652960733763, "loss": 0.0129, "step": 168920 }, { "epoch": 0.85, "learning_rate": 0.0001721589619143236, "loss": 0.0135, "step": 168930 }, { "epoch": 0.85, "learning_rate": 0.00017215139422130962, "loss": 0.0101, "step": 168940 }, { "epoch": 0.85, "learning_rate": 0.0001721438265282956, "loss": 0.0124, "step": 168950 }, { "epoch": 0.85, "learning_rate": 0.00017213625883528158, "loss": 0.0111, "step": 168960 }, { "epoch": 0.85, "learning_rate": 0.0001721286911422676, "loss": 0.0107, "step": 168970 }, { "epoch": 0.85, "learning_rate": 0.00017212112344925357, "loss": 0.0089, "step": 168980 }, { "epoch": 0.85, "learning_rate": 0.00017211355575623956, "loss": 0.0138, "step": 168990 }, { "epoch": 0.85, "learning_rate": 0.00017210598806322556, "loss": 0.0129, "step": 169000 }, { "epoch": 0.85, "eval_cer": 0.9144751078837893, "eval_loss": 0.008490633219480515, "eval_runtime": 116.745, "eval_samples_per_second": 17.131, "eval_steps_per_second": 4.283, "step": 169000 }, { "epoch": 0.85, "learning_rate": 0.00017209842037021155, "loss": 0.0123, "step": 169010 }, { "epoch": 0.85, "learning_rate": 0.00017209085267719753, "loss": 0.0113, "step": 169020 }, { "epoch": 0.85, "learning_rate": 0.00017208328498418354, "loss": 0.017, "step": 169030 }, { "epoch": 0.85, "learning_rate": 0.00017207571729116952, "loss": 0.0104, "step": 169040 }, { "epoch": 0.85, "learning_rate": 0.0001720681495981555, "loss": 0.0144, "step": 169050 }, { "epoch": 0.85, "learning_rate": 0.00017206058190514145, "loss": 0.0148, "step": 169060 }, { "epoch": 0.85, "learning_rate": 0.00017205301421212746, "loss": 0.0138, "step": 169070 }, { "epoch": 0.85, "learning_rate": 0.00017204544651911344, "loss": 0.0138, "step": 169080 }, { "epoch": 0.85, "learning_rate": 0.00017203787882609942, "loss": 0.0119, "step": 169090 }, { "epoch": 0.85, "learning_rate": 0.00017203031113308543, "loss": 0.0121, "step": 169100 }, { "epoch": 0.85, "learning_rate": 0.00017202274344007141, "loss": 0.0147, "step": 169110 }, { "epoch": 0.85, "learning_rate": 0.0001720151757470574, "loss": 0.0131, "step": 169120 }, { "epoch": 0.85, "learning_rate": 0.00017200760805404338, "loss": 0.0117, "step": 169130 }, { "epoch": 0.85, "learning_rate": 0.00017200004036102939, "loss": 0.0119, "step": 169140 }, { "epoch": 0.85, "learning_rate": 0.00017199247266801537, "loss": 0.0121, "step": 169150 }, { "epoch": 0.85, "learning_rate": 0.00017198490497500135, "loss": 0.0098, "step": 169160 }, { "epoch": 0.85, "learning_rate": 0.00017197733728198736, "loss": 0.0112, "step": 169170 }, { "epoch": 0.85, "learning_rate": 0.00017196976958897334, "loss": 0.0108, "step": 169180 }, { "epoch": 0.85, "learning_rate": 0.00017196220189595932, "loss": 0.0121, "step": 169190 }, { "epoch": 0.85, "learning_rate": 0.00017195463420294533, "loss": 0.0125, "step": 169200 }, { "epoch": 0.85, "learning_rate": 0.0001719470665099313, "loss": 0.0115, "step": 169210 }, { "epoch": 0.85, "learning_rate": 0.0001719394988169173, "loss": 0.0125, "step": 169220 }, { "epoch": 0.85, "learning_rate": 0.0001719319311239033, "loss": 0.0139, "step": 169230 }, { "epoch": 0.85, "learning_rate": 0.00017192436343088928, "loss": 0.01, "step": 169240 }, { "epoch": 0.85, "learning_rate": 0.00017191679573787526, "loss": 0.0127, "step": 169250 }, { "epoch": 0.85, "learning_rate": 0.00017190922804486127, "loss": 0.012, "step": 169260 }, { "epoch": 0.85, "learning_rate": 0.00017190166035184725, "loss": 0.0133, "step": 169270 }, { "epoch": 0.85, "learning_rate": 0.00017189409265883323, "loss": 0.0124, "step": 169280 }, { "epoch": 0.85, "learning_rate": 0.00017188652496581922, "loss": 0.0108, "step": 169290 }, { "epoch": 0.85, "learning_rate": 0.00017187895727280522, "loss": 0.0101, "step": 169300 }, { "epoch": 0.85, "learning_rate": 0.0001718713895797912, "loss": 0.0131, "step": 169310 }, { "epoch": 0.85, "learning_rate": 0.0001718638218867772, "loss": 0.0193, "step": 169320 }, { "epoch": 0.85, "learning_rate": 0.0001718562541937632, "loss": 0.0136, "step": 169330 }, { "epoch": 0.85, "learning_rate": 0.00017184868650074918, "loss": 0.012, "step": 169340 }, { "epoch": 0.85, "learning_rate": 0.00017184111880773516, "loss": 0.0128, "step": 169350 }, { "epoch": 0.85, "learning_rate": 0.00017183355111472117, "loss": 0.0118, "step": 169360 }, { "epoch": 0.85, "learning_rate": 0.00017182598342170715, "loss": 0.0119, "step": 169370 }, { "epoch": 0.85, "learning_rate": 0.00017181841572869313, "loss": 0.0135, "step": 169380 }, { "epoch": 0.85, "learning_rate": 0.00017181084803567914, "loss": 0.013, "step": 169390 }, { "epoch": 0.85, "learning_rate": 0.00017180328034266512, "loss": 0.0116, "step": 169400 }, { "epoch": 0.85, "learning_rate": 0.0001717957126496511, "loss": 0.015, "step": 169410 }, { "epoch": 0.85, "learning_rate": 0.0001717881449566371, "loss": 0.0127, "step": 169420 }, { "epoch": 0.85, "learning_rate": 0.0001717805772636231, "loss": 0.0144, "step": 169430 }, { "epoch": 0.85, "learning_rate": 0.00017177300957060907, "loss": 0.0112, "step": 169440 }, { "epoch": 0.85, "learning_rate": 0.00017176544187759505, "loss": 0.0133, "step": 169450 }, { "epoch": 0.85, "learning_rate": 0.00017175787418458106, "loss": 0.0128, "step": 169460 }, { "epoch": 0.85, "learning_rate": 0.00017175030649156704, "loss": 0.014, "step": 169470 }, { "epoch": 0.86, "learning_rate": 0.00017174273879855303, "loss": 0.0123, "step": 169480 }, { "epoch": 0.86, "learning_rate": 0.00017173517110553903, "loss": 0.012, "step": 169490 }, { "epoch": 0.86, "learning_rate": 0.00017172760341252502, "loss": 0.0136, "step": 169500 }, { "epoch": 0.86, "learning_rate": 0.000171720035719511, "loss": 0.0091, "step": 169510 }, { "epoch": 0.86, "learning_rate": 0.000171712468026497, "loss": 0.0108, "step": 169520 }, { "epoch": 0.86, "learning_rate": 0.000171704900333483, "loss": 0.0122, "step": 169530 }, { "epoch": 0.86, "learning_rate": 0.00017169733264046897, "loss": 0.0137, "step": 169540 }, { "epoch": 0.86, "learning_rate": 0.00017168976494745498, "loss": 0.0132, "step": 169550 }, { "epoch": 0.86, "learning_rate": 0.00017168219725444096, "loss": 0.0103, "step": 169560 }, { "epoch": 0.86, "learning_rate": 0.00017167462956142694, "loss": 0.0129, "step": 169570 }, { "epoch": 0.86, "learning_rate": 0.00017166706186841295, "loss": 0.0103, "step": 169580 }, { "epoch": 0.86, "learning_rate": 0.00017165949417539893, "loss": 0.01, "step": 169590 }, { "epoch": 0.86, "learning_rate": 0.0001716519264823849, "loss": 0.0152, "step": 169600 }, { "epoch": 0.86, "learning_rate": 0.0001716443587893709, "loss": 0.0107, "step": 169610 }, { "epoch": 0.86, "learning_rate": 0.0001716367910963569, "loss": 0.011, "step": 169620 }, { "epoch": 0.86, "learning_rate": 0.00017162922340334288, "loss": 0.0135, "step": 169630 }, { "epoch": 0.86, "learning_rate": 0.00017162165571032886, "loss": 0.0098, "step": 169640 }, { "epoch": 0.86, "learning_rate": 0.00017161408801731487, "loss": 0.0088, "step": 169650 }, { "epoch": 0.86, "learning_rate": 0.00017160652032430085, "loss": 0.0099, "step": 169660 }, { "epoch": 0.86, "learning_rate": 0.00017159895263128684, "loss": 0.0094, "step": 169670 }, { "epoch": 0.86, "learning_rate": 0.00017159138493827284, "loss": 0.0123, "step": 169680 }, { "epoch": 0.86, "learning_rate": 0.00017158381724525883, "loss": 0.0152, "step": 169690 }, { "epoch": 0.86, "learning_rate": 0.0001715762495522448, "loss": 0.0108, "step": 169700 }, { "epoch": 0.86, "learning_rate": 0.00017156868185923082, "loss": 0.0098, "step": 169710 }, { "epoch": 0.86, "learning_rate": 0.0001715611141662168, "loss": 0.0096, "step": 169720 }, { "epoch": 0.86, "learning_rate": 0.00017155354647320278, "loss": 0.0138, "step": 169730 }, { "epoch": 0.86, "learning_rate": 0.0001715459787801888, "loss": 0.0136, "step": 169740 }, { "epoch": 0.86, "learning_rate": 0.00017153841108717477, "loss": 0.0111, "step": 169750 }, { "epoch": 0.86, "learning_rate": 0.00017153084339416075, "loss": 0.0103, "step": 169760 }, { "epoch": 0.86, "learning_rate": 0.00017152327570114676, "loss": 0.0115, "step": 169770 }, { "epoch": 0.86, "learning_rate": 0.00017151570800813274, "loss": 0.0116, "step": 169780 }, { "epoch": 0.86, "learning_rate": 0.00017150814031511872, "loss": 0.01, "step": 169790 }, { "epoch": 0.86, "learning_rate": 0.0001715005726221047, "loss": 0.0111, "step": 169800 }, { "epoch": 0.86, "learning_rate": 0.0001714930049290907, "loss": 0.012, "step": 169810 }, { "epoch": 0.86, "learning_rate": 0.0001714854372360767, "loss": 0.011, "step": 169820 }, { "epoch": 0.86, "learning_rate": 0.00017147786954306267, "loss": 0.0097, "step": 169830 }, { "epoch": 0.86, "learning_rate": 0.00017147030185004868, "loss": 0.0122, "step": 169840 }, { "epoch": 0.86, "learning_rate": 0.00017146273415703466, "loss": 0.0112, "step": 169850 }, { "epoch": 0.86, "learning_rate": 0.00017145516646402065, "loss": 0.0126, "step": 169860 }, { "epoch": 0.86, "learning_rate": 0.00017144759877100665, "loss": 0.0124, "step": 169870 }, { "epoch": 0.86, "learning_rate": 0.00017144003107799264, "loss": 0.0147, "step": 169880 }, { "epoch": 0.86, "learning_rate": 0.00017143246338497862, "loss": 0.0113, "step": 169890 }, { "epoch": 0.86, "learning_rate": 0.00017142489569196463, "loss": 0.0103, "step": 169900 }, { "epoch": 0.86, "learning_rate": 0.0001714173279989506, "loss": 0.0116, "step": 169910 }, { "epoch": 0.86, "learning_rate": 0.0001714097603059366, "loss": 0.0103, "step": 169920 }, { "epoch": 0.86, "learning_rate": 0.0001714021926129226, "loss": 0.0128, "step": 169930 }, { "epoch": 0.86, "learning_rate": 0.00017139462491990858, "loss": 0.0119, "step": 169940 }, { "epoch": 0.86, "learning_rate": 0.00017138705722689456, "loss": 0.0113, "step": 169950 }, { "epoch": 0.86, "learning_rate": 0.00017137948953388054, "loss": 0.0139, "step": 169960 }, { "epoch": 0.86, "learning_rate": 0.00017137192184086655, "loss": 0.0115, "step": 169970 }, { "epoch": 0.86, "learning_rate": 0.00017136435414785253, "loss": 0.0093, "step": 169980 }, { "epoch": 0.86, "learning_rate": 0.0001713567864548385, "loss": 0.0162, "step": 169990 }, { "epoch": 0.86, "learning_rate": 0.00017134921876182452, "loss": 0.015, "step": 170000 }, { "epoch": 0.86, "eval_cer": 0.9144799598644162, "eval_loss": 0.00878238771110773, "eval_runtime": 116.6286, "eval_samples_per_second": 17.148, "eval_steps_per_second": 4.287, "step": 170000 }, { "epoch": 0.86, "learning_rate": 0.0001713416510688105, "loss": 0.0126, "step": 170010 }, { "epoch": 0.86, "learning_rate": 0.00017133408337579648, "loss": 0.0136, "step": 170020 }, { "epoch": 0.86, "learning_rate": 0.0001713265156827825, "loss": 0.0109, "step": 170030 }, { "epoch": 0.86, "learning_rate": 0.00017131894798976847, "loss": 0.0117, "step": 170040 }, { "epoch": 0.86, "learning_rate": 0.00017131138029675446, "loss": 0.0139, "step": 170050 }, { "epoch": 0.86, "learning_rate": 0.00017130381260374046, "loss": 0.0119, "step": 170060 }, { "epoch": 0.86, "learning_rate": 0.00017129624491072645, "loss": 0.011, "step": 170070 }, { "epoch": 0.86, "learning_rate": 0.00017128867721771243, "loss": 0.0101, "step": 170080 }, { "epoch": 0.86, "learning_rate": 0.00017128110952469844, "loss": 0.0131, "step": 170090 }, { "epoch": 0.86, "learning_rate": 0.00017127354183168442, "loss": 0.0118, "step": 170100 }, { "epoch": 0.86, "learning_rate": 0.0001712659741386704, "loss": 0.0122, "step": 170110 }, { "epoch": 0.86, "learning_rate": 0.00017125840644565638, "loss": 0.0124, "step": 170120 }, { "epoch": 0.86, "learning_rate": 0.0001712508387526424, "loss": 0.0122, "step": 170130 }, { "epoch": 0.86, "learning_rate": 0.00017124327105962837, "loss": 0.0124, "step": 170140 }, { "epoch": 0.86, "learning_rate": 0.00017123570336661435, "loss": 0.0128, "step": 170150 }, { "epoch": 0.86, "learning_rate": 0.00017122813567360036, "loss": 0.0099, "step": 170160 }, { "epoch": 0.86, "learning_rate": 0.00017122056798058634, "loss": 0.0125, "step": 170170 }, { "epoch": 0.86, "learning_rate": 0.00017121300028757232, "loss": 0.0101, "step": 170180 }, { "epoch": 0.86, "learning_rate": 0.00017120543259455833, "loss": 0.0121, "step": 170190 }, { "epoch": 0.86, "learning_rate": 0.0001711978649015443, "loss": 0.0113, "step": 170200 }, { "epoch": 0.86, "learning_rate": 0.0001711902972085303, "loss": 0.011, "step": 170210 }, { "epoch": 0.86, "learning_rate": 0.0001711827295155163, "loss": 0.0158, "step": 170220 }, { "epoch": 0.86, "learning_rate": 0.00017117516182250228, "loss": 0.0129, "step": 170230 }, { "epoch": 0.86, "learning_rate": 0.00017116759412948827, "loss": 0.0127, "step": 170240 }, { "epoch": 0.86, "learning_rate": 0.00017116002643647427, "loss": 0.0115, "step": 170250 }, { "epoch": 0.86, "learning_rate": 0.00017115245874346026, "loss": 0.0271, "step": 170260 }, { "epoch": 0.86, "learning_rate": 0.00017114489105044624, "loss": 0.0112, "step": 170270 }, { "epoch": 0.86, "learning_rate": 0.00017113732335743225, "loss": 0.0129, "step": 170280 }, { "epoch": 0.86, "learning_rate": 0.00017112975566441823, "loss": 0.0123, "step": 170290 }, { "epoch": 0.86, "learning_rate": 0.0001711221879714042, "loss": 0.0142, "step": 170300 }, { "epoch": 0.86, "learning_rate": 0.00017111462027839016, "loss": 0.0148, "step": 170310 }, { "epoch": 0.86, "learning_rate": 0.00017110705258537617, "loss": 0.0113, "step": 170320 }, { "epoch": 0.86, "learning_rate": 0.00017109948489236215, "loss": 0.012, "step": 170330 }, { "epoch": 0.86, "learning_rate": 0.00017109191719934813, "loss": 0.011, "step": 170340 }, { "epoch": 0.86, "learning_rate": 0.00017108434950633412, "loss": 0.0127, "step": 170350 }, { "epoch": 0.86, "learning_rate": 0.00017107678181332012, "loss": 0.0173, "step": 170360 }, { "epoch": 0.86, "learning_rate": 0.0001710692141203061, "loss": 0.015, "step": 170370 }, { "epoch": 0.86, "learning_rate": 0.0001710616464272921, "loss": 0.0106, "step": 170380 }, { "epoch": 0.86, "learning_rate": 0.0001710540787342781, "loss": 0.0098, "step": 170390 }, { "epoch": 0.86, "learning_rate": 0.00017104651104126408, "loss": 0.0113, "step": 170400 }, { "epoch": 0.86, "learning_rate": 0.00017103894334825006, "loss": 0.023, "step": 170410 }, { "epoch": 0.86, "learning_rate": 0.00017103137565523607, "loss": 0.0125, "step": 170420 }, { "epoch": 0.86, "learning_rate": 0.00017102380796222205, "loss": 0.0142, "step": 170430 }, { "epoch": 0.86, "learning_rate": 0.00017101624026920803, "loss": 0.0121, "step": 170440 }, { "epoch": 0.86, "learning_rate": 0.00017100867257619404, "loss": 0.0095, "step": 170450 }, { "epoch": 0.86, "learning_rate": 0.00017100110488318002, "loss": 0.0118, "step": 170460 }, { "epoch": 0.86, "learning_rate": 0.000170993537190166, "loss": 0.0098, "step": 170470 }, { "epoch": 0.86, "learning_rate": 0.000170985969497152, "loss": 0.0096, "step": 170480 }, { "epoch": 0.86, "learning_rate": 0.000170978401804138, "loss": 0.0117, "step": 170490 }, { "epoch": 0.86, "learning_rate": 0.00017097083411112397, "loss": 0.0129, "step": 170500 }, { "epoch": 0.86, "learning_rate": 0.00017096326641810995, "loss": 0.0102, "step": 170510 }, { "epoch": 0.86, "learning_rate": 0.00017095569872509596, "loss": 0.0144, "step": 170520 }, { "epoch": 0.86, "learning_rate": 0.00017094813103208194, "loss": 0.0121, "step": 170530 }, { "epoch": 0.86, "learning_rate": 0.00017094056333906793, "loss": 0.0141, "step": 170540 }, { "epoch": 0.86, "learning_rate": 0.00017093299564605393, "loss": 0.0121, "step": 170550 }, { "epoch": 0.86, "learning_rate": 0.00017092542795303992, "loss": 0.0126, "step": 170560 }, { "epoch": 0.86, "learning_rate": 0.0001709178602600259, "loss": 0.0125, "step": 170570 }, { "epoch": 0.86, "learning_rate": 0.0001709102925670119, "loss": 0.0105, "step": 170580 }, { "epoch": 0.86, "learning_rate": 0.0001709027248739979, "loss": 0.0116, "step": 170590 }, { "epoch": 0.86, "learning_rate": 0.00017089515718098387, "loss": 0.0133, "step": 170600 }, { "epoch": 0.86, "learning_rate": 0.00017088758948796988, "loss": 0.0117, "step": 170610 }, { "epoch": 0.86, "learning_rate": 0.00017088002179495586, "loss": 0.0116, "step": 170620 }, { "epoch": 0.86, "learning_rate": 0.00017087245410194184, "loss": 0.0113, "step": 170630 }, { "epoch": 0.86, "learning_rate": 0.00017086488640892785, "loss": 0.0117, "step": 170640 }, { "epoch": 0.86, "learning_rate": 0.00017085731871591383, "loss": 0.0138, "step": 170650 }, { "epoch": 0.86, "learning_rate": 0.0001708497510228998, "loss": 0.0104, "step": 170660 }, { "epoch": 0.86, "learning_rate": 0.00017084218332988582, "loss": 0.0165, "step": 170670 }, { "epoch": 0.86, "learning_rate": 0.0001708346156368718, "loss": 0.0107, "step": 170680 }, { "epoch": 0.86, "learning_rate": 0.00017082704794385778, "loss": 0.0118, "step": 170690 }, { "epoch": 0.86, "learning_rate": 0.00017081948025084376, "loss": 0.0125, "step": 170700 }, { "epoch": 0.86, "learning_rate": 0.00017081191255782977, "loss": 0.0113, "step": 170710 }, { "epoch": 0.86, "learning_rate": 0.00017080434486481575, "loss": 0.0132, "step": 170720 }, { "epoch": 0.86, "learning_rate": 0.00017079677717180174, "loss": 0.0098, "step": 170730 }, { "epoch": 0.86, "learning_rate": 0.00017078920947878774, "loss": 0.0098, "step": 170740 }, { "epoch": 0.86, "learning_rate": 0.00017078164178577373, "loss": 0.0121, "step": 170750 }, { "epoch": 0.86, "learning_rate": 0.0001707740740927597, "loss": 0.0148, "step": 170760 }, { "epoch": 0.86, "learning_rate": 0.00017076650639974572, "loss": 0.0139, "step": 170770 }, { "epoch": 0.86, "learning_rate": 0.0001707589387067317, "loss": 0.0155, "step": 170780 }, { "epoch": 0.86, "learning_rate": 0.00017075137101371768, "loss": 0.0094, "step": 170790 }, { "epoch": 0.86, "learning_rate": 0.0001707438033207037, "loss": 0.0137, "step": 170800 }, { "epoch": 0.86, "learning_rate": 0.00017073623562768967, "loss": 0.0097, "step": 170810 }, { "epoch": 0.86, "learning_rate": 0.00017072866793467565, "loss": 0.0095, "step": 170820 }, { "epoch": 0.86, "learning_rate": 0.00017072110024166166, "loss": 0.0162, "step": 170830 }, { "epoch": 0.86, "learning_rate": 0.00017071353254864764, "loss": 0.0122, "step": 170840 }, { "epoch": 0.86, "learning_rate": 0.00017070596485563362, "loss": 0.0098, "step": 170850 }, { "epoch": 0.86, "learning_rate": 0.0001706983971626196, "loss": 0.0128, "step": 170860 }, { "epoch": 0.86, "learning_rate": 0.0001706908294696056, "loss": 0.0116, "step": 170870 }, { "epoch": 0.86, "learning_rate": 0.0001706832617765916, "loss": 0.0118, "step": 170880 }, { "epoch": 0.86, "learning_rate": 0.00017067569408357757, "loss": 0.0102, "step": 170890 }, { "epoch": 0.86, "learning_rate": 0.00017066812639056358, "loss": 0.0121, "step": 170900 }, { "epoch": 0.86, "learning_rate": 0.00017066055869754956, "loss": 0.0111, "step": 170910 }, { "epoch": 0.86, "learning_rate": 0.00017065299100453555, "loss": 0.0113, "step": 170920 }, { "epoch": 0.86, "learning_rate": 0.00017064542331152155, "loss": 0.0141, "step": 170930 }, { "epoch": 0.86, "learning_rate": 0.00017063785561850754, "loss": 0.0115, "step": 170940 }, { "epoch": 0.86, "learning_rate": 0.00017063028792549352, "loss": 0.0227, "step": 170950 }, { "epoch": 0.86, "learning_rate": 0.00017062272023247953, "loss": 0.0105, "step": 170960 }, { "epoch": 0.86, "learning_rate": 0.0001706151525394655, "loss": 0.0113, "step": 170970 }, { "epoch": 0.86, "learning_rate": 0.0001706075848464515, "loss": 0.0103, "step": 170980 }, { "epoch": 0.86, "learning_rate": 0.0001706000171534375, "loss": 0.0109, "step": 170990 }, { "epoch": 0.86, "learning_rate": 0.00017059244946042348, "loss": 0.0112, "step": 171000 }, { "epoch": 0.86, "eval_cer": 0.914508101352053, "eval_loss": 0.008454186841845512, "eval_runtime": 116.644, "eval_samples_per_second": 17.146, "eval_steps_per_second": 4.287, "step": 171000 }, { "epoch": 0.86, "learning_rate": 0.00017058488176740946, "loss": 0.0105, "step": 171010 }, { "epoch": 0.86, "learning_rate": 0.00017057731407439544, "loss": 0.0115, "step": 171020 }, { "epoch": 0.86, "learning_rate": 0.00017056974638138145, "loss": 0.0135, "step": 171030 }, { "epoch": 0.86, "learning_rate": 0.00017056217868836743, "loss": 0.0112, "step": 171040 }, { "epoch": 0.86, "learning_rate": 0.0001705546109953534, "loss": 0.0095, "step": 171050 }, { "epoch": 0.86, "learning_rate": 0.00017054704330233942, "loss": 0.0116, "step": 171060 }, { "epoch": 0.86, "learning_rate": 0.0001705394756093254, "loss": 0.0101, "step": 171070 }, { "epoch": 0.86, "learning_rate": 0.00017053190791631138, "loss": 0.0124, "step": 171080 }, { "epoch": 0.86, "learning_rate": 0.0001705243402232974, "loss": 0.0097, "step": 171090 }, { "epoch": 0.86, "learning_rate": 0.00017051677253028337, "loss": 0.011, "step": 171100 }, { "epoch": 0.86, "learning_rate": 0.00017050920483726936, "loss": 0.0133, "step": 171110 }, { "epoch": 0.86, "learning_rate": 0.00017050163714425536, "loss": 0.0121, "step": 171120 }, { "epoch": 0.86, "learning_rate": 0.00017049406945124135, "loss": 0.0109, "step": 171130 }, { "epoch": 0.86, "learning_rate": 0.00017048650175822733, "loss": 0.0118, "step": 171140 }, { "epoch": 0.86, "learning_rate": 0.00017047893406521334, "loss": 0.0097, "step": 171150 }, { "epoch": 0.86, "learning_rate": 0.00017047136637219932, "loss": 0.0131, "step": 171160 }, { "epoch": 0.86, "learning_rate": 0.0001704637986791853, "loss": 0.0114, "step": 171170 }, { "epoch": 0.86, "learning_rate": 0.0001704562309861713, "loss": 0.01, "step": 171180 }, { "epoch": 0.86, "learning_rate": 0.0001704486632931573, "loss": 0.0127, "step": 171190 }, { "epoch": 0.86, "learning_rate": 0.00017044109560014327, "loss": 0.0152, "step": 171200 }, { "epoch": 0.86, "learning_rate": 0.00017043352790712925, "loss": 0.0144, "step": 171210 }, { "epoch": 0.86, "learning_rate": 0.00017042596021411526, "loss": 0.0109, "step": 171220 }, { "epoch": 0.86, "learning_rate": 0.00017041839252110124, "loss": 0.0093, "step": 171230 }, { "epoch": 0.86, "learning_rate": 0.00017041082482808722, "loss": 0.0102, "step": 171240 }, { "epoch": 0.86, "learning_rate": 0.00017040325713507323, "loss": 0.0106, "step": 171250 }, { "epoch": 0.86, "learning_rate": 0.0001703956894420592, "loss": 0.012, "step": 171260 }, { "epoch": 0.86, "learning_rate": 0.0001703881217490452, "loss": 0.0092, "step": 171270 }, { "epoch": 0.86, "learning_rate": 0.0001703805540560312, "loss": 0.0085, "step": 171280 }, { "epoch": 0.86, "learning_rate": 0.00017037298636301718, "loss": 0.0103, "step": 171290 }, { "epoch": 0.86, "learning_rate": 0.00017036541867000317, "loss": 0.0119, "step": 171300 }, { "epoch": 0.86, "learning_rate": 0.00017035785097698917, "loss": 0.0116, "step": 171310 }, { "epoch": 0.86, "learning_rate": 0.00017035028328397516, "loss": 0.0106, "step": 171320 }, { "epoch": 0.86, "learning_rate": 0.00017034271559096114, "loss": 0.0105, "step": 171330 }, { "epoch": 0.86, "learning_rate": 0.00017033514789794715, "loss": 0.009, "step": 171340 }, { "epoch": 0.86, "learning_rate": 0.00017032758020493313, "loss": 0.0111, "step": 171350 }, { "epoch": 0.86, "learning_rate": 0.0001703200125119191, "loss": 0.0101, "step": 171360 }, { "epoch": 0.86, "learning_rate": 0.0001703124448189051, "loss": 0.0129, "step": 171370 }, { "epoch": 0.86, "learning_rate": 0.0001703048771258911, "loss": 0.0114, "step": 171380 }, { "epoch": 0.86, "learning_rate": 0.00017029730943287708, "loss": 0.0128, "step": 171390 }, { "epoch": 0.86, "learning_rate": 0.00017028974173986306, "loss": 0.011, "step": 171400 }, { "epoch": 0.86, "learning_rate": 0.00017028217404684907, "loss": 0.0086, "step": 171410 }, { "epoch": 0.86, "learning_rate": 0.00017027460635383505, "loss": 0.0116, "step": 171420 }, { "epoch": 0.86, "learning_rate": 0.00017026703866082103, "loss": 0.012, "step": 171430 }, { "epoch": 0.86, "learning_rate": 0.00017025947096780704, "loss": 0.0109, "step": 171440 }, { "epoch": 0.86, "learning_rate": 0.00017025190327479302, "loss": 0.0098, "step": 171450 }, { "epoch": 0.87, "learning_rate": 0.000170244335581779, "loss": 0.0105, "step": 171460 }, { "epoch": 0.87, "learning_rate": 0.000170236767888765, "loss": 0.0107, "step": 171470 }, { "epoch": 0.87, "learning_rate": 0.000170229200195751, "loss": 0.0118, "step": 171480 }, { "epoch": 0.87, "learning_rate": 0.00017022163250273698, "loss": 0.0116, "step": 171490 }, { "epoch": 0.87, "learning_rate": 0.00017021406480972298, "loss": 0.0115, "step": 171500 }, { "epoch": 0.87, "learning_rate": 0.00017020649711670897, "loss": 0.0115, "step": 171510 }, { "epoch": 0.87, "learning_rate": 0.00017019892942369495, "loss": 0.01, "step": 171520 }, { "epoch": 0.87, "learning_rate": 0.00017019136173068093, "loss": 0.0124, "step": 171530 }, { "epoch": 0.87, "learning_rate": 0.00017018379403766694, "loss": 0.0118, "step": 171540 }, { "epoch": 0.87, "learning_rate": 0.00017017622634465292, "loss": 0.0116, "step": 171550 }, { "epoch": 0.87, "learning_rate": 0.0001701686586516389, "loss": 0.0131, "step": 171560 }, { "epoch": 0.87, "learning_rate": 0.00017016109095862488, "loss": 0.0154, "step": 171570 }, { "epoch": 0.87, "learning_rate": 0.00017015352326561086, "loss": 0.0102, "step": 171580 }, { "epoch": 0.87, "learning_rate": 0.00017014595557259684, "loss": 0.011, "step": 171590 }, { "epoch": 0.87, "learning_rate": 0.00017013838787958283, "loss": 0.0132, "step": 171600 }, { "epoch": 0.87, "learning_rate": 0.00017013082018656883, "loss": 0.0096, "step": 171610 }, { "epoch": 0.87, "learning_rate": 0.00017012325249355482, "loss": 0.0092, "step": 171620 }, { "epoch": 0.87, "learning_rate": 0.0001701156848005408, "loss": 0.017, "step": 171630 }, { "epoch": 0.87, "learning_rate": 0.0001701081171075268, "loss": 0.0112, "step": 171640 }, { "epoch": 0.87, "learning_rate": 0.0001701005494145128, "loss": 0.0108, "step": 171650 }, { "epoch": 0.87, "learning_rate": 0.00017009298172149877, "loss": 0.0099, "step": 171660 }, { "epoch": 0.87, "learning_rate": 0.00017008541402848478, "loss": 0.0111, "step": 171670 }, { "epoch": 0.87, "learning_rate": 0.00017007784633547076, "loss": 0.0118, "step": 171680 }, { "epoch": 0.87, "learning_rate": 0.00017007027864245674, "loss": 0.0108, "step": 171690 }, { "epoch": 0.87, "learning_rate": 0.00017006271094944275, "loss": 0.0088, "step": 171700 }, { "epoch": 0.87, "learning_rate": 0.00017005514325642873, "loss": 0.0282, "step": 171710 }, { "epoch": 0.87, "learning_rate": 0.0001700475755634147, "loss": 0.0125, "step": 171720 }, { "epoch": 0.87, "learning_rate": 0.00017004000787040072, "loss": 0.0127, "step": 171730 }, { "epoch": 0.87, "learning_rate": 0.0001700324401773867, "loss": 0.0111, "step": 171740 }, { "epoch": 0.87, "learning_rate": 0.00017002487248437268, "loss": 0.0106, "step": 171750 }, { "epoch": 0.87, "learning_rate": 0.00017001730479135866, "loss": 0.0117, "step": 171760 }, { "epoch": 0.87, "learning_rate": 0.00017000973709834467, "loss": 0.0125, "step": 171770 }, { "epoch": 0.87, "learning_rate": 0.00017000216940533065, "loss": 0.0092, "step": 171780 }, { "epoch": 0.87, "learning_rate": 0.00016999460171231664, "loss": 0.0109, "step": 171790 }, { "epoch": 0.87, "learning_rate": 0.00016998703401930264, "loss": 0.0102, "step": 171800 }, { "epoch": 0.87, "learning_rate": 0.00016997946632628863, "loss": 0.012, "step": 171810 }, { "epoch": 0.87, "learning_rate": 0.0001699718986332746, "loss": 0.0099, "step": 171820 }, { "epoch": 0.87, "learning_rate": 0.00016996433094026062, "loss": 0.0109, "step": 171830 }, { "epoch": 0.87, "learning_rate": 0.0001699567632472466, "loss": 0.0103, "step": 171840 }, { "epoch": 0.87, "learning_rate": 0.00016994919555423258, "loss": 0.0121, "step": 171850 }, { "epoch": 0.87, "learning_rate": 0.0001699416278612186, "loss": 0.0107, "step": 171860 }, { "epoch": 0.87, "learning_rate": 0.00016993406016820457, "loss": 0.0111, "step": 171870 }, { "epoch": 0.87, "learning_rate": 0.00016992649247519055, "loss": 0.009, "step": 171880 }, { "epoch": 0.87, "learning_rate": 0.00016991892478217656, "loss": 0.0139, "step": 171890 }, { "epoch": 0.87, "learning_rate": 0.00016991135708916254, "loss": 0.009, "step": 171900 }, { "epoch": 0.87, "learning_rate": 0.00016990378939614852, "loss": 0.0108, "step": 171910 }, { "epoch": 0.87, "learning_rate": 0.0001698962217031345, "loss": 0.011, "step": 171920 }, { "epoch": 0.87, "learning_rate": 0.0001698886540101205, "loss": 0.0123, "step": 171930 }, { "epoch": 0.87, "learning_rate": 0.0001698810863171065, "loss": 0.0106, "step": 171940 }, { "epoch": 0.87, "learning_rate": 0.00016987351862409247, "loss": 0.0106, "step": 171950 }, { "epoch": 0.87, "learning_rate": 0.00016986595093107848, "loss": 0.0097, "step": 171960 }, { "epoch": 0.87, "learning_rate": 0.00016985838323806446, "loss": 0.016, "step": 171970 }, { "epoch": 0.87, "learning_rate": 0.00016985081554505045, "loss": 0.0124, "step": 171980 }, { "epoch": 0.87, "learning_rate": 0.00016984324785203645, "loss": 0.012, "step": 171990 }, { "epoch": 0.87, "learning_rate": 0.00016983568015902244, "loss": 0.011, "step": 172000 }, { "epoch": 0.87, "eval_cer": 0.9145003381830497, "eval_loss": 0.00847652181982994, "eval_runtime": 116.6974, "eval_samples_per_second": 17.138, "eval_steps_per_second": 4.285, "step": 172000 }, { "epoch": 0.87, "learning_rate": 0.00016982811246600842, "loss": 0.0102, "step": 172010 }, { "epoch": 0.87, "learning_rate": 0.00016982054477299443, "loss": 0.0126, "step": 172020 }, { "epoch": 0.87, "learning_rate": 0.0001698129770799804, "loss": 0.01, "step": 172030 }, { "epoch": 0.87, "learning_rate": 0.0001698054093869664, "loss": 0.0121, "step": 172040 }, { "epoch": 0.87, "learning_rate": 0.0001697978416939524, "loss": 0.0103, "step": 172050 }, { "epoch": 0.87, "learning_rate": 0.00016979027400093838, "loss": 0.0138, "step": 172060 }, { "epoch": 0.87, "learning_rate": 0.00016978270630792436, "loss": 0.0139, "step": 172070 }, { "epoch": 0.87, "learning_rate": 0.00016977513861491037, "loss": 0.0152, "step": 172080 }, { "epoch": 0.87, "learning_rate": 0.00016976757092189635, "loss": 0.0113, "step": 172090 }, { "epoch": 0.87, "learning_rate": 0.00016976000322888233, "loss": 0.0123, "step": 172100 }, { "epoch": 0.87, "learning_rate": 0.0001697524355358683, "loss": 0.0147, "step": 172110 }, { "epoch": 0.87, "learning_rate": 0.00016974486784285432, "loss": 0.0077, "step": 172120 }, { "epoch": 0.87, "learning_rate": 0.0001697373001498403, "loss": 0.0108, "step": 172130 }, { "epoch": 0.87, "learning_rate": 0.00016972973245682628, "loss": 0.0153, "step": 172140 }, { "epoch": 0.87, "learning_rate": 0.0001697221647638123, "loss": 0.01, "step": 172150 }, { "epoch": 0.87, "learning_rate": 0.00016971459707079827, "loss": 0.0128, "step": 172160 }, { "epoch": 0.87, "learning_rate": 0.00016970702937778426, "loss": 0.0133, "step": 172170 }, { "epoch": 0.87, "learning_rate": 0.00016969946168477026, "loss": 0.013, "step": 172180 }, { "epoch": 0.87, "learning_rate": 0.00016969189399175625, "loss": 0.0123, "step": 172190 }, { "epoch": 0.87, "learning_rate": 0.00016968432629874223, "loss": 0.0142, "step": 172200 }, { "epoch": 0.87, "learning_rate": 0.00016967675860572824, "loss": 0.0098, "step": 172210 }, { "epoch": 0.87, "learning_rate": 0.00016966919091271422, "loss": 0.0096, "step": 172220 }, { "epoch": 0.87, "learning_rate": 0.0001696616232197002, "loss": 0.0123, "step": 172230 }, { "epoch": 0.87, "learning_rate": 0.0001696540555266862, "loss": 0.0134, "step": 172240 }, { "epoch": 0.87, "learning_rate": 0.0001696464878336722, "loss": 0.0133, "step": 172250 }, { "epoch": 0.87, "learning_rate": 0.00016963892014065817, "loss": 0.0122, "step": 172260 }, { "epoch": 0.87, "learning_rate": 0.00016963135244764415, "loss": 0.0126, "step": 172270 }, { "epoch": 0.87, "learning_rate": 0.00016962378475463016, "loss": 0.0114, "step": 172280 }, { "epoch": 0.87, "learning_rate": 0.00016961621706161614, "loss": 0.0126, "step": 172290 }, { "epoch": 0.87, "learning_rate": 0.00016960864936860212, "loss": 0.0121, "step": 172300 }, { "epoch": 0.87, "learning_rate": 0.00016960108167558813, "loss": 0.0157, "step": 172310 }, { "epoch": 0.87, "learning_rate": 0.0001695935139825741, "loss": 0.0136, "step": 172320 }, { "epoch": 0.87, "learning_rate": 0.0001695859462895601, "loss": 0.0127, "step": 172330 }, { "epoch": 0.87, "learning_rate": 0.0001695783785965461, "loss": 0.0127, "step": 172340 }, { "epoch": 0.87, "learning_rate": 0.00016957081090353208, "loss": 0.0112, "step": 172350 }, { "epoch": 0.87, "learning_rate": 0.00016956324321051807, "loss": 0.0104, "step": 172360 }, { "epoch": 0.87, "learning_rate": 0.00016955567551750407, "loss": 0.0099, "step": 172370 }, { "epoch": 0.87, "learning_rate": 0.00016954810782449006, "loss": 0.0114, "step": 172380 }, { "epoch": 0.87, "learning_rate": 0.00016954054013147604, "loss": 0.013, "step": 172390 }, { "epoch": 0.87, "learning_rate": 0.00016953297243846205, "loss": 0.0135, "step": 172400 }, { "epoch": 0.87, "learning_rate": 0.00016952540474544803, "loss": 0.0131, "step": 172410 }, { "epoch": 0.87, "learning_rate": 0.000169517837052434, "loss": 0.0124, "step": 172420 }, { "epoch": 0.87, "learning_rate": 0.00016951026935942, "loss": 0.0106, "step": 172430 }, { "epoch": 0.87, "learning_rate": 0.000169502701666406, "loss": 0.0102, "step": 172440 }, { "epoch": 0.87, "learning_rate": 0.00016949513397339198, "loss": 0.0116, "step": 172450 }, { "epoch": 0.87, "learning_rate": 0.00016948756628037796, "loss": 0.0109, "step": 172460 }, { "epoch": 0.87, "learning_rate": 0.00016947999858736397, "loss": 0.0129, "step": 172470 }, { "epoch": 0.87, "learning_rate": 0.00016947243089434995, "loss": 0.0124, "step": 172480 }, { "epoch": 0.87, "learning_rate": 0.00016946486320133593, "loss": 0.0147, "step": 172490 }, { "epoch": 0.87, "learning_rate": 0.00016945729550832194, "loss": 0.0126, "step": 172500 }, { "epoch": 0.87, "learning_rate": 0.00016944972781530792, "loss": 0.0113, "step": 172510 }, { "epoch": 0.87, "learning_rate": 0.0001694421601222939, "loss": 0.0116, "step": 172520 }, { "epoch": 0.87, "learning_rate": 0.0001694345924292799, "loss": 0.0178, "step": 172530 }, { "epoch": 0.87, "learning_rate": 0.0001694270247362659, "loss": 0.0161, "step": 172540 }, { "epoch": 0.87, "learning_rate": 0.00016941945704325188, "loss": 0.0105, "step": 172550 }, { "epoch": 0.87, "learning_rate": 0.00016941188935023788, "loss": 0.0102, "step": 172560 }, { "epoch": 0.87, "learning_rate": 0.00016940432165722387, "loss": 0.0096, "step": 172570 }, { "epoch": 0.87, "learning_rate": 0.00016939675396420985, "loss": 0.0099, "step": 172580 }, { "epoch": 0.87, "learning_rate": 0.00016938918627119583, "loss": 0.012, "step": 172590 }, { "epoch": 0.87, "learning_rate": 0.00016938161857818184, "loss": 0.0118, "step": 172600 }, { "epoch": 0.87, "learning_rate": 0.00016937405088516782, "loss": 0.0129, "step": 172610 }, { "epoch": 0.87, "learning_rate": 0.0001693664831921538, "loss": 0.0124, "step": 172620 }, { "epoch": 0.87, "learning_rate": 0.0001693589154991398, "loss": 0.0109, "step": 172630 }, { "epoch": 0.87, "learning_rate": 0.0001693513478061258, "loss": 0.0111, "step": 172640 }, { "epoch": 0.87, "learning_rate": 0.00016934378011311177, "loss": 0.0121, "step": 172650 }, { "epoch": 0.87, "learning_rate": 0.00016933621242009778, "loss": 0.0125, "step": 172660 }, { "epoch": 0.87, "learning_rate": 0.00016932864472708376, "loss": 0.0118, "step": 172670 }, { "epoch": 0.87, "learning_rate": 0.00016932107703406974, "loss": 0.0128, "step": 172680 }, { "epoch": 0.87, "learning_rate": 0.00016931350934105575, "loss": 0.0122, "step": 172690 }, { "epoch": 0.87, "learning_rate": 0.00016930594164804173, "loss": 0.012, "step": 172700 }, { "epoch": 0.87, "learning_rate": 0.00016929837395502771, "loss": 0.0111, "step": 172710 }, { "epoch": 0.87, "learning_rate": 0.00016929080626201372, "loss": 0.012, "step": 172720 }, { "epoch": 0.87, "learning_rate": 0.0001692832385689997, "loss": 0.0109, "step": 172730 }, { "epoch": 0.87, "learning_rate": 0.00016927567087598569, "loss": 0.0133, "step": 172740 }, { "epoch": 0.87, "learning_rate": 0.0001692681031829717, "loss": 0.0126, "step": 172750 }, { "epoch": 0.87, "learning_rate": 0.00016926053548995768, "loss": 0.0131, "step": 172760 }, { "epoch": 0.87, "learning_rate": 0.00016925296779694366, "loss": 0.0128, "step": 172770 }, { "epoch": 0.87, "learning_rate": 0.00016924540010392964, "loss": 0.0091, "step": 172780 }, { "epoch": 0.87, "learning_rate": 0.00016923783241091565, "loss": 0.0085, "step": 172790 }, { "epoch": 0.87, "learning_rate": 0.00016923026471790163, "loss": 0.0116, "step": 172800 }, { "epoch": 0.87, "learning_rate": 0.0001692226970248876, "loss": 0.0147, "step": 172810 }, { "epoch": 0.87, "learning_rate": 0.00016921512933187362, "loss": 0.0115, "step": 172820 }, { "epoch": 0.87, "learning_rate": 0.00016920756163885957, "loss": 0.0095, "step": 172830 }, { "epoch": 0.87, "learning_rate": 0.00016919999394584555, "loss": 0.012, "step": 172840 }, { "epoch": 0.87, "learning_rate": 0.00016919242625283154, "loss": 0.0104, "step": 172850 }, { "epoch": 0.87, "learning_rate": 0.00016918485855981754, "loss": 0.011, "step": 172860 }, { "epoch": 0.87, "learning_rate": 0.00016917729086680353, "loss": 0.0128, "step": 172870 }, { "epoch": 0.87, "learning_rate": 0.0001691697231737895, "loss": 0.0164, "step": 172880 }, { "epoch": 0.87, "learning_rate": 0.00016916215548077552, "loss": 0.0117, "step": 172890 }, { "epoch": 0.87, "learning_rate": 0.0001691545877877615, "loss": 0.012, "step": 172900 }, { "epoch": 0.87, "learning_rate": 0.00016914702009474748, "loss": 0.014, "step": 172910 }, { "epoch": 0.87, "learning_rate": 0.0001691394524017335, "loss": 0.0113, "step": 172920 }, { "epoch": 0.87, "learning_rate": 0.00016913188470871947, "loss": 0.0157, "step": 172930 }, { "epoch": 0.87, "learning_rate": 0.00016912431701570545, "loss": 0.0115, "step": 172940 }, { "epoch": 0.87, "learning_rate": 0.00016911674932269146, "loss": 0.0128, "step": 172950 }, { "epoch": 0.87, "learning_rate": 0.00016910918162967744, "loss": 0.0118, "step": 172960 }, { "epoch": 0.87, "learning_rate": 0.00016910161393666342, "loss": 0.0147, "step": 172970 }, { "epoch": 0.87, "learning_rate": 0.00016909404624364943, "loss": 0.0104, "step": 172980 }, { "epoch": 0.87, "learning_rate": 0.0001690864785506354, "loss": 0.0115, "step": 172990 }, { "epoch": 0.87, "learning_rate": 0.0001690789108576214, "loss": 0.0146, "step": 173000 }, { "epoch": 0.87, "eval_cer": 0.9145003381830497, "eval_loss": 0.008254943415522575, "eval_runtime": 116.8302, "eval_samples_per_second": 17.119, "eval_steps_per_second": 4.28, "step": 173000 }, { "epoch": 0.87, "learning_rate": 0.00016907134316460737, "loss": 0.0116, "step": 173010 }, { "epoch": 0.87, "learning_rate": 0.00016906377547159338, "loss": 0.0118, "step": 173020 }, { "epoch": 0.87, "learning_rate": 0.00016905620777857936, "loss": 0.0114, "step": 173030 }, { "epoch": 0.87, "learning_rate": 0.00016904864008556535, "loss": 0.0126, "step": 173040 }, { "epoch": 0.87, "learning_rate": 0.00016904107239255135, "loss": 0.0095, "step": 173050 }, { "epoch": 0.87, "learning_rate": 0.00016903350469953734, "loss": 0.0099, "step": 173060 }, { "epoch": 0.87, "learning_rate": 0.00016902593700652332, "loss": 0.0109, "step": 173070 }, { "epoch": 0.87, "learning_rate": 0.00016901836931350933, "loss": 0.0124, "step": 173080 }, { "epoch": 0.87, "learning_rate": 0.0001690108016204953, "loss": 0.0124, "step": 173090 }, { "epoch": 0.87, "learning_rate": 0.0001690032339274813, "loss": 0.0123, "step": 173100 }, { "epoch": 0.87, "learning_rate": 0.0001689956662344673, "loss": 0.0135, "step": 173110 }, { "epoch": 0.87, "learning_rate": 0.00016898809854145328, "loss": 0.0114, "step": 173120 }, { "epoch": 0.87, "learning_rate": 0.00016898053084843926, "loss": 0.0131, "step": 173130 }, { "epoch": 0.87, "learning_rate": 0.00016897296315542527, "loss": 0.0121, "step": 173140 }, { "epoch": 0.87, "learning_rate": 0.00016896539546241125, "loss": 0.0107, "step": 173150 }, { "epoch": 0.87, "learning_rate": 0.00016895782776939723, "loss": 0.0147, "step": 173160 }, { "epoch": 0.87, "learning_rate": 0.0001689502600763832, "loss": 0.0129, "step": 173170 }, { "epoch": 0.87, "learning_rate": 0.00016894269238336922, "loss": 0.0115, "step": 173180 }, { "epoch": 0.87, "learning_rate": 0.0001689351246903552, "loss": 0.0149, "step": 173190 }, { "epoch": 0.87, "learning_rate": 0.00016892755699734118, "loss": 0.0107, "step": 173200 }, { "epoch": 0.87, "learning_rate": 0.0001689199893043272, "loss": 0.0116, "step": 173210 }, { "epoch": 0.87, "learning_rate": 0.00016891242161131317, "loss": 0.0092, "step": 173220 }, { "epoch": 0.87, "learning_rate": 0.00016890485391829916, "loss": 0.0112, "step": 173230 }, { "epoch": 0.87, "learning_rate": 0.00016889728622528516, "loss": 0.0091, "step": 173240 }, { "epoch": 0.87, "learning_rate": 0.00016888971853227115, "loss": 0.0133, "step": 173250 }, { "epoch": 0.87, "learning_rate": 0.00016888215083925713, "loss": 0.0127, "step": 173260 }, { "epoch": 0.87, "learning_rate": 0.00016887458314624314, "loss": 0.0124, "step": 173270 }, { "epoch": 0.87, "learning_rate": 0.00016886701545322912, "loss": 0.0125, "step": 173280 }, { "epoch": 0.87, "learning_rate": 0.0001688594477602151, "loss": 0.0104, "step": 173290 }, { "epoch": 0.87, "learning_rate": 0.0001688518800672011, "loss": 0.0155, "step": 173300 }, { "epoch": 0.87, "learning_rate": 0.0001688443123741871, "loss": 0.0156, "step": 173310 }, { "epoch": 0.87, "learning_rate": 0.00016883674468117307, "loss": 0.0135, "step": 173320 }, { "epoch": 0.87, "learning_rate": 0.00016882917698815905, "loss": 0.0126, "step": 173330 }, { "epoch": 0.87, "learning_rate": 0.00016882160929514506, "loss": 0.0139, "step": 173340 }, { "epoch": 0.87, "learning_rate": 0.00016881404160213104, "loss": 0.0113, "step": 173350 }, { "epoch": 0.87, "learning_rate": 0.00016880647390911702, "loss": 0.0099, "step": 173360 }, { "epoch": 0.87, "learning_rate": 0.00016879890621610303, "loss": 0.0102, "step": 173370 }, { "epoch": 0.87, "learning_rate": 0.000168791338523089, "loss": 0.01, "step": 173380 }, { "epoch": 0.87, "learning_rate": 0.000168783770830075, "loss": 0.0125, "step": 173390 }, { "epoch": 0.87, "learning_rate": 0.000168776203137061, "loss": 0.0106, "step": 173400 }, { "epoch": 0.87, "learning_rate": 0.00016876863544404698, "loss": 0.0115, "step": 173410 }, { "epoch": 0.87, "learning_rate": 0.00016876106775103297, "loss": 0.0119, "step": 173420 }, { "epoch": 0.87, "learning_rate": 0.00016875350005801897, "loss": 0.013, "step": 173430 }, { "epoch": 0.88, "learning_rate": 0.00016874593236500496, "loss": 0.013, "step": 173440 }, { "epoch": 0.88, "learning_rate": 0.00016873836467199094, "loss": 0.012, "step": 173450 }, { "epoch": 0.88, "learning_rate": 0.00016873079697897695, "loss": 0.0103, "step": 173460 }, { "epoch": 0.88, "learning_rate": 0.00016872322928596293, "loss": 0.0123, "step": 173470 }, { "epoch": 0.88, "learning_rate": 0.0001687156615929489, "loss": 0.0134, "step": 173480 }, { "epoch": 0.88, "learning_rate": 0.0001687080938999349, "loss": 0.0126, "step": 173490 }, { "epoch": 0.88, "learning_rate": 0.0001687005262069209, "loss": 0.0122, "step": 173500 }, { "epoch": 0.88, "learning_rate": 0.00016869295851390688, "loss": 0.0121, "step": 173510 }, { "epoch": 0.88, "learning_rate": 0.00016868539082089286, "loss": 0.0143, "step": 173520 }, { "epoch": 0.88, "learning_rate": 0.00016867782312787887, "loss": 0.0112, "step": 173530 }, { "epoch": 0.88, "learning_rate": 0.00016867025543486485, "loss": 0.0152, "step": 173540 }, { "epoch": 0.88, "learning_rate": 0.00016866268774185083, "loss": 0.0105, "step": 173550 }, { "epoch": 0.88, "learning_rate": 0.00016865512004883684, "loss": 0.0091, "step": 173560 }, { "epoch": 0.88, "learning_rate": 0.00016864755235582282, "loss": 0.01, "step": 173570 }, { "epoch": 0.88, "learning_rate": 0.0001686399846628088, "loss": 0.0158, "step": 173580 }, { "epoch": 0.88, "learning_rate": 0.0001686324169697948, "loss": 0.01, "step": 173590 }, { "epoch": 0.88, "learning_rate": 0.0001686248492767808, "loss": 0.0135, "step": 173600 }, { "epoch": 0.88, "learning_rate": 0.00016861728158376678, "loss": 0.0092, "step": 173610 }, { "epoch": 0.88, "learning_rate": 0.00016860971389075278, "loss": 0.0101, "step": 173620 }, { "epoch": 0.88, "learning_rate": 0.00016860214619773877, "loss": 0.013, "step": 173630 }, { "epoch": 0.88, "learning_rate": 0.00016859457850472475, "loss": 0.0092, "step": 173640 }, { "epoch": 0.88, "learning_rate": 0.00016858701081171076, "loss": 0.0128, "step": 173650 }, { "epoch": 0.88, "learning_rate": 0.00016857944311869674, "loss": 0.0123, "step": 173660 }, { "epoch": 0.88, "learning_rate": 0.00016857187542568272, "loss": 0.0131, "step": 173670 }, { "epoch": 0.88, "learning_rate": 0.0001685643077326687, "loss": 0.012, "step": 173680 }, { "epoch": 0.88, "learning_rate": 0.0001685567400396547, "loss": 0.0117, "step": 173690 }, { "epoch": 0.88, "learning_rate": 0.0001685491723466407, "loss": 0.0113, "step": 173700 }, { "epoch": 0.88, "learning_rate": 0.00016854160465362667, "loss": 0.0143, "step": 173710 }, { "epoch": 0.88, "learning_rate": 0.00016853403696061268, "loss": 0.0109, "step": 173720 }, { "epoch": 0.88, "learning_rate": 0.00016852646926759866, "loss": 0.0139, "step": 173730 }, { "epoch": 0.88, "learning_rate": 0.00016851890157458464, "loss": 0.0117, "step": 173740 }, { "epoch": 0.88, "learning_rate": 0.00016851133388157065, "loss": 0.0112, "step": 173750 }, { "epoch": 0.88, "learning_rate": 0.00016850376618855663, "loss": 0.0101, "step": 173760 }, { "epoch": 0.88, "learning_rate": 0.00016849619849554261, "loss": 0.0126, "step": 173770 }, { "epoch": 0.88, "learning_rate": 0.00016848863080252862, "loss": 0.0122, "step": 173780 }, { "epoch": 0.88, "learning_rate": 0.0001684810631095146, "loss": 0.0147, "step": 173790 }, { "epoch": 0.88, "learning_rate": 0.00016847349541650059, "loss": 0.0124, "step": 173800 }, { "epoch": 0.88, "learning_rate": 0.0001684659277234866, "loss": 0.0127, "step": 173810 }, { "epoch": 0.88, "learning_rate": 0.00016845836003047258, "loss": 0.0084, "step": 173820 }, { "epoch": 0.88, "learning_rate": 0.00016845079233745856, "loss": 0.0099, "step": 173830 }, { "epoch": 0.88, "learning_rate": 0.00016844322464444454, "loss": 0.0115, "step": 173840 }, { "epoch": 0.88, "learning_rate": 0.00016843565695143055, "loss": 0.0107, "step": 173850 }, { "epoch": 0.88, "learning_rate": 0.00016842808925841653, "loss": 0.0147, "step": 173860 }, { "epoch": 0.88, "learning_rate": 0.0001684205215654025, "loss": 0.0123, "step": 173870 }, { "epoch": 0.88, "learning_rate": 0.00016841295387238852, "loss": 0.0131, "step": 173880 }, { "epoch": 0.88, "learning_rate": 0.0001684053861793745, "loss": 0.0166, "step": 173890 }, { "epoch": 0.88, "learning_rate": 0.00016839781848636048, "loss": 0.0117, "step": 173900 }, { "epoch": 0.88, "learning_rate": 0.0001683902507933465, "loss": 0.0117, "step": 173910 }, { "epoch": 0.88, "learning_rate": 0.00016838268310033247, "loss": 0.0101, "step": 173920 }, { "epoch": 0.88, "learning_rate": 0.00016837511540731845, "loss": 0.0107, "step": 173930 }, { "epoch": 0.88, "learning_rate": 0.00016836754771430446, "loss": 0.0134, "step": 173940 }, { "epoch": 0.88, "learning_rate": 0.00016835998002129044, "loss": 0.0124, "step": 173950 }, { "epoch": 0.88, "learning_rate": 0.00016835241232827643, "loss": 0.0116, "step": 173960 }, { "epoch": 0.88, "learning_rate": 0.00016834484463526243, "loss": 0.01, "step": 173970 }, { "epoch": 0.88, "learning_rate": 0.00016833727694224842, "loss": 0.012, "step": 173980 }, { "epoch": 0.88, "learning_rate": 0.0001683297092492344, "loss": 0.012, "step": 173990 }, { "epoch": 0.88, "learning_rate": 0.00016832214155622038, "loss": 0.0158, "step": 174000 }, { "epoch": 0.88, "eval_cer": 0.9144935454101719, "eval_loss": 0.008368046954274178, "eval_runtime": 116.7718, "eval_samples_per_second": 17.127, "eval_steps_per_second": 4.282, "step": 174000 }, { "epoch": 0.88, "learning_rate": 0.0001683145738632064, "loss": 0.0139, "step": 174010 }, { "epoch": 0.88, "learning_rate": 0.00016830700617019237, "loss": 0.0124, "step": 174020 }, { "epoch": 0.88, "learning_rate": 0.00016829943847717835, "loss": 0.0109, "step": 174030 }, { "epoch": 0.88, "learning_rate": 0.00016829187078416436, "loss": 0.0119, "step": 174040 }, { "epoch": 0.88, "learning_rate": 0.00016828430309115034, "loss": 0.0109, "step": 174050 }, { "epoch": 0.88, "learning_rate": 0.00016827673539813632, "loss": 0.0111, "step": 174060 }, { "epoch": 0.88, "learning_rate": 0.00016826916770512233, "loss": 0.0111, "step": 174070 }, { "epoch": 0.88, "learning_rate": 0.00016826160001210828, "loss": 0.0125, "step": 174080 }, { "epoch": 0.88, "learning_rate": 0.00016825403231909427, "loss": 0.0105, "step": 174090 }, { "epoch": 0.88, "learning_rate": 0.00016824646462608025, "loss": 0.0113, "step": 174100 }, { "epoch": 0.88, "learning_rate": 0.00016823889693306626, "loss": 0.01, "step": 174110 }, { "epoch": 0.88, "learning_rate": 0.00016823132924005224, "loss": 0.0127, "step": 174120 }, { "epoch": 0.88, "learning_rate": 0.00016822376154703822, "loss": 0.0127, "step": 174130 }, { "epoch": 0.88, "learning_rate": 0.00016821619385402423, "loss": 0.0132, "step": 174140 }, { "epoch": 0.88, "learning_rate": 0.0001682086261610102, "loss": 0.0115, "step": 174150 }, { "epoch": 0.88, "learning_rate": 0.0001682010584679962, "loss": 0.016, "step": 174160 }, { "epoch": 0.88, "learning_rate": 0.0001681934907749822, "loss": 0.0159, "step": 174170 }, { "epoch": 0.88, "learning_rate": 0.00016818592308196818, "loss": 0.0128, "step": 174180 }, { "epoch": 0.88, "learning_rate": 0.00016817835538895416, "loss": 0.0096, "step": 174190 }, { "epoch": 0.88, "learning_rate": 0.00016817078769594017, "loss": 0.0148, "step": 174200 }, { "epoch": 0.88, "learning_rate": 0.00016816322000292615, "loss": 0.0113, "step": 174210 }, { "epoch": 0.88, "learning_rate": 0.00016815565230991213, "loss": 0.0112, "step": 174220 }, { "epoch": 0.88, "learning_rate": 0.00016814808461689811, "loss": 0.0109, "step": 174230 }, { "epoch": 0.88, "learning_rate": 0.00016814051692388412, "loss": 0.0105, "step": 174240 }, { "epoch": 0.88, "learning_rate": 0.0001681329492308701, "loss": 0.0129, "step": 174250 }, { "epoch": 0.88, "learning_rate": 0.00016812538153785609, "loss": 0.0125, "step": 174260 }, { "epoch": 0.88, "learning_rate": 0.0001681178138448421, "loss": 0.01, "step": 174270 }, { "epoch": 0.88, "learning_rate": 0.00016811024615182808, "loss": 0.0126, "step": 174280 }, { "epoch": 0.88, "learning_rate": 0.00016810267845881406, "loss": 0.0113, "step": 174290 }, { "epoch": 0.88, "learning_rate": 0.00016809511076580007, "loss": 0.0104, "step": 174300 }, { "epoch": 0.88, "learning_rate": 0.00016808754307278605, "loss": 0.0091, "step": 174310 }, { "epoch": 0.88, "learning_rate": 0.00016807997537977203, "loss": 0.0122, "step": 174320 }, { "epoch": 0.88, "learning_rate": 0.00016807240768675804, "loss": 0.0118, "step": 174330 }, { "epoch": 0.88, "learning_rate": 0.00016806483999374402, "loss": 0.0109, "step": 174340 }, { "epoch": 0.88, "learning_rate": 0.00016805727230073, "loss": 0.0142, "step": 174350 }, { "epoch": 0.88, "learning_rate": 0.000168049704607716, "loss": 0.0124, "step": 174360 }, { "epoch": 0.88, "learning_rate": 0.000168042136914702, "loss": 0.0108, "step": 174370 }, { "epoch": 0.88, "learning_rate": 0.00016803456922168797, "loss": 0.0127, "step": 174380 }, { "epoch": 0.88, "learning_rate": 0.00016802700152867395, "loss": 0.0171, "step": 174390 }, { "epoch": 0.88, "learning_rate": 0.00016801943383565996, "loss": 0.0124, "step": 174400 }, { "epoch": 0.88, "learning_rate": 0.00016801186614264594, "loss": 0.012, "step": 174410 }, { "epoch": 0.88, "learning_rate": 0.00016800429844963192, "loss": 0.0125, "step": 174420 }, { "epoch": 0.88, "learning_rate": 0.00016799673075661793, "loss": 0.0132, "step": 174430 }, { "epoch": 0.88, "learning_rate": 0.00016798916306360391, "loss": 0.0117, "step": 174440 }, { "epoch": 0.88, "learning_rate": 0.0001679815953705899, "loss": 0.0106, "step": 174450 }, { "epoch": 0.88, "learning_rate": 0.0001679740276775759, "loss": 0.0155, "step": 174460 }, { "epoch": 0.88, "learning_rate": 0.00016796645998456189, "loss": 0.0109, "step": 174470 }, { "epoch": 0.88, "learning_rate": 0.00016795889229154787, "loss": 0.0123, "step": 174480 }, { "epoch": 0.88, "learning_rate": 0.00016795132459853388, "loss": 0.0099, "step": 174490 }, { "epoch": 0.88, "learning_rate": 0.00016794375690551986, "loss": 0.0129, "step": 174500 }, { "epoch": 0.88, "learning_rate": 0.00016793618921250584, "loss": 0.0128, "step": 174510 }, { "epoch": 0.88, "learning_rate": 0.00016792862151949185, "loss": 0.0121, "step": 174520 }, { "epoch": 0.88, "learning_rate": 0.00016792105382647783, "loss": 0.0142, "step": 174530 }, { "epoch": 0.88, "learning_rate": 0.0001679134861334638, "loss": 0.0112, "step": 174540 }, { "epoch": 0.88, "learning_rate": 0.00016790591844044982, "loss": 0.0118, "step": 174550 }, { "epoch": 0.88, "learning_rate": 0.0001678983507474358, "loss": 0.0131, "step": 174560 }, { "epoch": 0.88, "learning_rate": 0.00016789078305442178, "loss": 0.0134, "step": 174570 }, { "epoch": 0.88, "learning_rate": 0.00016788321536140776, "loss": 0.0129, "step": 174580 }, { "epoch": 0.88, "learning_rate": 0.00016787564766839377, "loss": 0.0142, "step": 174590 }, { "epoch": 0.88, "learning_rate": 0.00016786807997537975, "loss": 0.0105, "step": 174600 }, { "epoch": 0.88, "learning_rate": 0.00016786051228236573, "loss": 0.0125, "step": 174610 }, { "epoch": 0.88, "learning_rate": 0.00016785294458935174, "loss": 0.0111, "step": 174620 }, { "epoch": 0.88, "learning_rate": 0.00016784537689633772, "loss": 0.0116, "step": 174630 }, { "epoch": 0.88, "learning_rate": 0.0001678378092033237, "loss": 0.0102, "step": 174640 }, { "epoch": 0.88, "learning_rate": 0.00016783024151030971, "loss": 0.012, "step": 174650 }, { "epoch": 0.88, "learning_rate": 0.0001678226738172957, "loss": 0.0114, "step": 174660 }, { "epoch": 0.88, "learning_rate": 0.00016781510612428168, "loss": 0.0125, "step": 174670 }, { "epoch": 0.88, "learning_rate": 0.00016780753843126769, "loss": 0.0111, "step": 174680 }, { "epoch": 0.88, "learning_rate": 0.00016779997073825367, "loss": 0.0131, "step": 174690 }, { "epoch": 0.88, "learning_rate": 0.00016779240304523965, "loss": 0.0107, "step": 174700 }, { "epoch": 0.88, "learning_rate": 0.00016778483535222566, "loss": 0.0114, "step": 174710 }, { "epoch": 0.88, "learning_rate": 0.00016777726765921164, "loss": 0.0112, "step": 174720 }, { "epoch": 0.88, "learning_rate": 0.00016776969996619762, "loss": 0.0146, "step": 174730 }, { "epoch": 0.88, "learning_rate": 0.0001677621322731836, "loss": 0.0094, "step": 174740 }, { "epoch": 0.88, "learning_rate": 0.0001677545645801696, "loss": 0.0108, "step": 174750 }, { "epoch": 0.88, "learning_rate": 0.0001677469968871556, "loss": 0.0112, "step": 174760 }, { "epoch": 0.88, "learning_rate": 0.00016773942919414157, "loss": 0.0125, "step": 174770 }, { "epoch": 0.88, "learning_rate": 0.00016773186150112758, "loss": 0.0134, "step": 174780 }, { "epoch": 0.88, "learning_rate": 0.00016772429380811356, "loss": 0.0144, "step": 174790 }, { "epoch": 0.88, "learning_rate": 0.00016771672611509954, "loss": 0.0119, "step": 174800 }, { "epoch": 0.88, "learning_rate": 0.00016770915842208555, "loss": 0.0101, "step": 174810 }, { "epoch": 0.88, "learning_rate": 0.00016770159072907153, "loss": 0.0094, "step": 174820 }, { "epoch": 0.88, "learning_rate": 0.00016769402303605752, "loss": 0.0108, "step": 174830 }, { "epoch": 0.88, "learning_rate": 0.00016768645534304352, "loss": 0.0135, "step": 174840 }, { "epoch": 0.88, "learning_rate": 0.0001676788876500295, "loss": 0.012, "step": 174850 }, { "epoch": 0.88, "learning_rate": 0.0001676713199570155, "loss": 0.0097, "step": 174860 }, { "epoch": 0.88, "learning_rate": 0.0001676637522640015, "loss": 0.0116, "step": 174870 }, { "epoch": 0.88, "learning_rate": 0.00016765618457098748, "loss": 0.0154, "step": 174880 }, { "epoch": 0.88, "learning_rate": 0.00016764861687797346, "loss": 0.0117, "step": 174890 }, { "epoch": 0.88, "learning_rate": 0.00016764104918495944, "loss": 0.0136, "step": 174900 }, { "epoch": 0.88, "learning_rate": 0.00016763348149194545, "loss": 0.0115, "step": 174910 }, { "epoch": 0.88, "learning_rate": 0.00016762591379893143, "loss": 0.0115, "step": 174920 }, { "epoch": 0.88, "learning_rate": 0.0001676183461059174, "loss": 0.0157, "step": 174930 }, { "epoch": 0.88, "learning_rate": 0.00016761077841290342, "loss": 0.0141, "step": 174940 }, { "epoch": 0.88, "learning_rate": 0.0001676032107198894, "loss": 0.0148, "step": 174950 }, { "epoch": 0.88, "learning_rate": 0.00016759564302687538, "loss": 0.0887, "step": 174960 }, { "epoch": 0.88, "learning_rate": 0.0001675880753338614, "loss": 0.0107, "step": 174970 }, { "epoch": 0.88, "learning_rate": 0.00016758050764084737, "loss": 0.0109, "step": 174980 }, { "epoch": 0.88, "learning_rate": 0.00016757293994783335, "loss": 0.0149, "step": 174990 }, { "epoch": 0.88, "learning_rate": 0.00016756537225481936, "loss": 0.0152, "step": 175000 }, { "epoch": 0.88, "eval_cer": 0.9144993677869243, "eval_loss": 0.008513858541846275, "eval_runtime": 116.6209, "eval_samples_per_second": 17.15, "eval_steps_per_second": 4.287, "step": 175000 }, { "epoch": 0.88, "learning_rate": 0.00016755780456180534, "loss": 0.011, "step": 175010 }, { "epoch": 0.88, "learning_rate": 0.00016755023686879133, "loss": 0.0107, "step": 175020 }, { "epoch": 0.88, "learning_rate": 0.00016754266917577733, "loss": 0.0094, "step": 175030 }, { "epoch": 0.88, "learning_rate": 0.00016753510148276332, "loss": 0.0135, "step": 175040 }, { "epoch": 0.88, "learning_rate": 0.0001675275337897493, "loss": 0.0135, "step": 175050 }, { "epoch": 0.88, "learning_rate": 0.0001675199660967353, "loss": 0.0105, "step": 175060 }, { "epoch": 0.88, "learning_rate": 0.0001675123984037213, "loss": 0.0112, "step": 175070 }, { "epoch": 0.88, "learning_rate": 0.00016750483071070727, "loss": 0.0127, "step": 175080 }, { "epoch": 0.88, "learning_rate": 0.00016749726301769325, "loss": 0.0088, "step": 175090 }, { "epoch": 0.88, "learning_rate": 0.00016748969532467926, "loss": 0.013, "step": 175100 }, { "epoch": 0.88, "learning_rate": 0.00016748212763166524, "loss": 0.0099, "step": 175110 }, { "epoch": 0.88, "learning_rate": 0.00016747455993865122, "loss": 0.0102, "step": 175120 }, { "epoch": 0.88, "learning_rate": 0.00016746699224563723, "loss": 0.0136, "step": 175130 }, { "epoch": 0.88, "learning_rate": 0.0001674594245526232, "loss": 0.01, "step": 175140 }, { "epoch": 0.88, "learning_rate": 0.0001674518568596092, "loss": 0.0104, "step": 175150 }, { "epoch": 0.88, "learning_rate": 0.0001674442891665952, "loss": 0.0131, "step": 175160 }, { "epoch": 0.88, "learning_rate": 0.00016743672147358118, "loss": 0.0118, "step": 175170 }, { "epoch": 0.88, "learning_rate": 0.00016742915378056716, "loss": 0.0116, "step": 175180 }, { "epoch": 0.88, "learning_rate": 0.00016742158608755317, "loss": 0.0102, "step": 175190 }, { "epoch": 0.88, "learning_rate": 0.00016741401839453915, "loss": 0.0098, "step": 175200 }, { "epoch": 0.88, "learning_rate": 0.00016740645070152514, "loss": 0.0161, "step": 175210 }, { "epoch": 0.88, "learning_rate": 0.00016739888300851114, "loss": 0.0142, "step": 175220 }, { "epoch": 0.88, "learning_rate": 0.00016739131531549713, "loss": 0.0103, "step": 175230 }, { "epoch": 0.88, "learning_rate": 0.0001673837476224831, "loss": 0.0101, "step": 175240 }, { "epoch": 0.88, "learning_rate": 0.0001673761799294691, "loss": 0.0103, "step": 175250 }, { "epoch": 0.88, "learning_rate": 0.0001673686122364551, "loss": 0.0115, "step": 175260 }, { "epoch": 0.88, "learning_rate": 0.00016736104454344108, "loss": 0.0131, "step": 175270 }, { "epoch": 0.88, "learning_rate": 0.00016735347685042706, "loss": 0.0109, "step": 175280 }, { "epoch": 0.88, "learning_rate": 0.00016734590915741307, "loss": 0.0166, "step": 175290 }, { "epoch": 0.88, "learning_rate": 0.00016733834146439905, "loss": 0.0112, "step": 175300 }, { "epoch": 0.88, "learning_rate": 0.00016733077377138503, "loss": 0.0108, "step": 175310 }, { "epoch": 0.88, "learning_rate": 0.00016732320607837104, "loss": 0.0121, "step": 175320 }, { "epoch": 0.88, "learning_rate": 0.00016731563838535702, "loss": 0.0146, "step": 175330 }, { "epoch": 0.88, "learning_rate": 0.00016730807069234298, "loss": 0.0115, "step": 175340 }, { "epoch": 0.88, "learning_rate": 0.00016730050299932896, "loss": 0.01, "step": 175350 }, { "epoch": 0.88, "learning_rate": 0.00016729293530631497, "loss": 0.0127, "step": 175360 }, { "epoch": 0.88, "learning_rate": 0.00016728536761330095, "loss": 0.0126, "step": 175370 }, { "epoch": 0.88, "learning_rate": 0.00016727779992028693, "loss": 0.0124, "step": 175380 }, { "epoch": 0.88, "learning_rate": 0.00016727023222727294, "loss": 0.0123, "step": 175390 }, { "epoch": 0.88, "learning_rate": 0.00016726266453425892, "loss": 0.0139, "step": 175400 }, { "epoch": 0.88, "learning_rate": 0.0001672550968412449, "loss": 0.0119, "step": 175410 }, { "epoch": 0.89, "learning_rate": 0.0001672475291482309, "loss": 0.0114, "step": 175420 }, { "epoch": 0.89, "learning_rate": 0.0001672399614552169, "loss": 0.0104, "step": 175430 }, { "epoch": 0.89, "learning_rate": 0.00016723239376220287, "loss": 0.0096, "step": 175440 }, { "epoch": 0.89, "learning_rate": 0.00016722482606918888, "loss": 0.0138, "step": 175450 }, { "epoch": 0.89, "learning_rate": 0.00016721725837617486, "loss": 0.0134, "step": 175460 }, { "epoch": 0.89, "learning_rate": 0.00016720969068316084, "loss": 0.01, "step": 175470 }, { "epoch": 0.89, "learning_rate": 0.00016720212299014682, "loss": 0.0178, "step": 175480 }, { "epoch": 0.89, "learning_rate": 0.00016719455529713283, "loss": 0.0152, "step": 175490 }, { "epoch": 0.89, "learning_rate": 0.00016718698760411881, "loss": 0.0124, "step": 175500 }, { "epoch": 0.89, "learning_rate": 0.0001671794199111048, "loss": 0.0128, "step": 175510 }, { "epoch": 0.89, "learning_rate": 0.0001671718522180908, "loss": 0.0107, "step": 175520 }, { "epoch": 0.89, "learning_rate": 0.00016716428452507679, "loss": 0.0123, "step": 175530 }, { "epoch": 0.89, "learning_rate": 0.00016715671683206277, "loss": 0.0117, "step": 175540 }, { "epoch": 0.89, "learning_rate": 0.00016714914913904878, "loss": 0.0108, "step": 175550 }, { "epoch": 0.89, "learning_rate": 0.00016714158144603476, "loss": 0.0101, "step": 175560 }, { "epoch": 0.89, "learning_rate": 0.00016713401375302074, "loss": 0.0141, "step": 175570 }, { "epoch": 0.89, "learning_rate": 0.00016712644606000675, "loss": 0.012, "step": 175580 }, { "epoch": 0.89, "learning_rate": 0.00016711887836699273, "loss": 0.0092, "step": 175590 }, { "epoch": 0.89, "learning_rate": 0.0001671113106739787, "loss": 0.0102, "step": 175600 }, { "epoch": 0.89, "learning_rate": 0.00016710374298096472, "loss": 0.0124, "step": 175610 }, { "epoch": 0.89, "learning_rate": 0.0001670961752879507, "loss": 0.0137, "step": 175620 }, { "epoch": 0.89, "learning_rate": 0.00016708860759493668, "loss": 0.0117, "step": 175630 }, { "epoch": 0.89, "learning_rate": 0.00016708103990192266, "loss": 0.015, "step": 175640 }, { "epoch": 0.89, "learning_rate": 0.00016707347220890867, "loss": 0.0104, "step": 175650 }, { "epoch": 0.89, "learning_rate": 0.00016706590451589465, "loss": 0.0118, "step": 175660 }, { "epoch": 0.89, "learning_rate": 0.00016705833682288063, "loss": 0.0121, "step": 175670 }, { "epoch": 0.89, "learning_rate": 0.00016705076912986664, "loss": 0.012, "step": 175680 }, { "epoch": 0.89, "learning_rate": 0.00016704320143685262, "loss": 0.0092, "step": 175690 }, { "epoch": 0.89, "learning_rate": 0.0001670356337438386, "loss": 0.0102, "step": 175700 }, { "epoch": 0.89, "learning_rate": 0.00016702806605082461, "loss": 0.0163, "step": 175710 }, { "epoch": 0.89, "learning_rate": 0.0001670204983578106, "loss": 0.011, "step": 175720 }, { "epoch": 0.89, "learning_rate": 0.00016701293066479658, "loss": 0.011, "step": 175730 }, { "epoch": 0.89, "learning_rate": 0.00016700536297178259, "loss": 0.0099, "step": 175740 }, { "epoch": 0.89, "learning_rate": 0.00016699779527876857, "loss": 0.0122, "step": 175750 }, { "epoch": 0.89, "learning_rate": 0.00016699022758575455, "loss": 0.0118, "step": 175760 }, { "epoch": 0.89, "learning_rate": 0.00016698265989274056, "loss": 0.0109, "step": 175770 }, { "epoch": 0.89, "learning_rate": 0.00016697509219972654, "loss": 0.0132, "step": 175780 }, { "epoch": 0.89, "learning_rate": 0.00016696752450671252, "loss": 0.0105, "step": 175790 }, { "epoch": 0.89, "learning_rate": 0.0001669599568136985, "loss": 0.0131, "step": 175800 }, { "epoch": 0.89, "learning_rate": 0.0001669523891206845, "loss": 0.0215, "step": 175810 }, { "epoch": 0.89, "learning_rate": 0.0001669448214276705, "loss": 0.0096, "step": 175820 }, { "epoch": 0.89, "learning_rate": 0.00016693725373465647, "loss": 0.0115, "step": 175830 }, { "epoch": 0.89, "learning_rate": 0.00016692968604164248, "loss": 0.0108, "step": 175840 }, { "epoch": 0.89, "learning_rate": 0.00016692211834862846, "loss": 0.0099, "step": 175850 }, { "epoch": 0.89, "learning_rate": 0.00016691455065561444, "loss": 0.0117, "step": 175860 }, { "epoch": 0.89, "learning_rate": 0.00016690698296260045, "loss": 0.0157, "step": 175870 }, { "epoch": 0.89, "learning_rate": 0.00016689941526958643, "loss": 0.0113, "step": 175880 }, { "epoch": 0.89, "learning_rate": 0.00016689184757657242, "loss": 0.0156, "step": 175890 }, { "epoch": 0.89, "learning_rate": 0.00016688427988355842, "loss": 0.0122, "step": 175900 }, { "epoch": 0.89, "learning_rate": 0.0001668767121905444, "loss": 0.0163, "step": 175910 }, { "epoch": 0.89, "learning_rate": 0.0001668691444975304, "loss": 0.0128, "step": 175920 }, { "epoch": 0.89, "learning_rate": 0.0001668615768045164, "loss": 0.0168, "step": 175930 }, { "epoch": 0.89, "learning_rate": 0.00016685400911150238, "loss": 0.0131, "step": 175940 }, { "epoch": 0.89, "learning_rate": 0.00016684644141848836, "loss": 0.0127, "step": 175950 }, { "epoch": 0.89, "learning_rate": 0.00016683887372547437, "loss": 0.0095, "step": 175960 }, { "epoch": 0.89, "learning_rate": 0.00016683130603246035, "loss": 0.011, "step": 175970 }, { "epoch": 0.89, "learning_rate": 0.00016682373833944633, "loss": 0.0107, "step": 175980 }, { "epoch": 0.89, "learning_rate": 0.0001668161706464323, "loss": 0.0119, "step": 175990 }, { "epoch": 0.89, "learning_rate": 0.00016680860295341832, "loss": 0.0114, "step": 176000 }, { "epoch": 0.89, "eval_cer": 0.9145032493714259, "eval_loss": 0.008152415975928307, "eval_runtime": 116.6203, "eval_samples_per_second": 17.15, "eval_steps_per_second": 4.287, "step": 176000 }, { "epoch": 0.89, "learning_rate": 0.0001668010352604043, "loss": 0.012, "step": 176010 }, { "epoch": 0.89, "learning_rate": 0.00016679346756739028, "loss": 0.0134, "step": 176020 }, { "epoch": 0.89, "learning_rate": 0.0001667858998743763, "loss": 0.0097, "step": 176030 }, { "epoch": 0.89, "learning_rate": 0.00016677833218136227, "loss": 0.0114, "step": 176040 }, { "epoch": 0.89, "learning_rate": 0.00016677076448834825, "loss": 0.0141, "step": 176050 }, { "epoch": 0.89, "learning_rate": 0.00016676319679533426, "loss": 0.0126, "step": 176060 }, { "epoch": 0.89, "learning_rate": 0.00016675562910232024, "loss": 0.0097, "step": 176070 }, { "epoch": 0.89, "learning_rate": 0.00016674806140930623, "loss": 0.0143, "step": 176080 }, { "epoch": 0.89, "learning_rate": 0.00016674049371629223, "loss": 0.0112, "step": 176090 }, { "epoch": 0.89, "learning_rate": 0.00016673292602327822, "loss": 0.0103, "step": 176100 }, { "epoch": 0.89, "learning_rate": 0.0001667253583302642, "loss": 0.0131, "step": 176110 }, { "epoch": 0.89, "learning_rate": 0.0001667177906372502, "loss": 0.0111, "step": 176120 }, { "epoch": 0.89, "learning_rate": 0.0001667102229442362, "loss": 0.0116, "step": 176130 }, { "epoch": 0.89, "learning_rate": 0.00016670265525122217, "loss": 0.0107, "step": 176140 }, { "epoch": 0.89, "learning_rate": 0.00016669508755820815, "loss": 0.0139, "step": 176150 }, { "epoch": 0.89, "learning_rate": 0.00016668751986519416, "loss": 0.0087, "step": 176160 }, { "epoch": 0.89, "learning_rate": 0.00016667995217218014, "loss": 0.0136, "step": 176170 }, { "epoch": 0.89, "learning_rate": 0.00016667238447916612, "loss": 0.0155, "step": 176180 }, { "epoch": 0.89, "learning_rate": 0.00016666481678615213, "loss": 0.0128, "step": 176190 }, { "epoch": 0.89, "learning_rate": 0.0001666572490931381, "loss": 0.0107, "step": 176200 }, { "epoch": 0.89, "learning_rate": 0.0001666496814001241, "loss": 0.0107, "step": 176210 }, { "epoch": 0.89, "learning_rate": 0.0001666421137071101, "loss": 0.0126, "step": 176220 }, { "epoch": 0.89, "learning_rate": 0.00016663454601409608, "loss": 0.0119, "step": 176230 }, { "epoch": 0.89, "learning_rate": 0.00016662697832108206, "loss": 0.0121, "step": 176240 }, { "epoch": 0.89, "learning_rate": 0.00016661941062806807, "loss": 0.0124, "step": 176250 }, { "epoch": 0.89, "learning_rate": 0.00016661184293505405, "loss": 0.0137, "step": 176260 }, { "epoch": 0.89, "learning_rate": 0.00016660427524204004, "loss": 0.009, "step": 176270 }, { "epoch": 0.89, "learning_rate": 0.00016659670754902604, "loss": 0.0101, "step": 176280 }, { "epoch": 0.89, "learning_rate": 0.00016658913985601203, "loss": 0.0126, "step": 176290 }, { "epoch": 0.89, "learning_rate": 0.000166581572162998, "loss": 0.0102, "step": 176300 }, { "epoch": 0.89, "learning_rate": 0.000166574004469984, "loss": 0.0139, "step": 176310 }, { "epoch": 0.89, "learning_rate": 0.00016656643677697, "loss": 0.0113, "step": 176320 }, { "epoch": 0.89, "learning_rate": 0.00016655886908395598, "loss": 0.0105, "step": 176330 }, { "epoch": 0.89, "learning_rate": 0.00016655130139094196, "loss": 0.0149, "step": 176340 }, { "epoch": 0.89, "learning_rate": 0.00016654373369792797, "loss": 0.0111, "step": 176350 }, { "epoch": 0.89, "learning_rate": 0.00016653616600491395, "loss": 0.0099, "step": 176360 }, { "epoch": 0.89, "learning_rate": 0.00016652859831189993, "loss": 0.0152, "step": 176370 }, { "epoch": 0.89, "learning_rate": 0.00016652103061888594, "loss": 0.0116, "step": 176380 }, { "epoch": 0.89, "learning_rate": 0.00016651346292587192, "loss": 0.0129, "step": 176390 }, { "epoch": 0.89, "learning_rate": 0.0001665058952328579, "loss": 0.0108, "step": 176400 }, { "epoch": 0.89, "learning_rate": 0.0001664983275398439, "loss": 0.0099, "step": 176410 }, { "epoch": 0.89, "learning_rate": 0.0001664907598468299, "loss": 0.0125, "step": 176420 }, { "epoch": 0.89, "learning_rate": 0.00016648319215381587, "loss": 0.0105, "step": 176430 }, { "epoch": 0.89, "learning_rate": 0.00016647562446080188, "loss": 0.0093, "step": 176440 }, { "epoch": 0.89, "learning_rate": 0.00016646805676778786, "loss": 0.0127, "step": 176450 }, { "epoch": 0.89, "learning_rate": 0.00016646048907477385, "loss": 0.0106, "step": 176460 }, { "epoch": 0.89, "learning_rate": 0.00016645292138175983, "loss": 0.0101, "step": 176470 }, { "epoch": 0.89, "learning_rate": 0.00016644535368874584, "loss": 0.0106, "step": 176480 }, { "epoch": 0.89, "learning_rate": 0.00016643778599573182, "loss": 0.0145, "step": 176490 }, { "epoch": 0.89, "learning_rate": 0.0001664302183027178, "loss": 0.011, "step": 176500 }, { "epoch": 0.89, "learning_rate": 0.0001664226506097038, "loss": 0.0113, "step": 176510 }, { "epoch": 0.89, "learning_rate": 0.0001664150829166898, "loss": 0.0117, "step": 176520 }, { "epoch": 0.89, "learning_rate": 0.00016640751522367577, "loss": 0.0112, "step": 176530 }, { "epoch": 0.89, "learning_rate": 0.00016639994753066178, "loss": 0.0115, "step": 176540 }, { "epoch": 0.89, "learning_rate": 0.00016639237983764776, "loss": 0.0113, "step": 176550 }, { "epoch": 0.89, "learning_rate": 0.00016638481214463374, "loss": 0.0119, "step": 176560 }, { "epoch": 0.89, "learning_rate": 0.00016637724445161975, "loss": 0.0118, "step": 176570 }, { "epoch": 0.89, "learning_rate": 0.00016636967675860573, "loss": 0.0123, "step": 176580 }, { "epoch": 0.89, "learning_rate": 0.0001663621090655917, "loss": 0.0141, "step": 176590 }, { "epoch": 0.89, "learning_rate": 0.00016635454137257767, "loss": 0.0099, "step": 176600 }, { "epoch": 0.89, "learning_rate": 0.00016634697367956368, "loss": 0.014, "step": 176610 }, { "epoch": 0.89, "learning_rate": 0.00016633940598654966, "loss": 0.0104, "step": 176620 }, { "epoch": 0.89, "learning_rate": 0.00016633183829353564, "loss": 0.0137, "step": 176630 }, { "epoch": 0.89, "learning_rate": 0.00016632427060052165, "loss": 0.0104, "step": 176640 }, { "epoch": 0.89, "learning_rate": 0.00016631670290750763, "loss": 0.0122, "step": 176650 }, { "epoch": 0.89, "learning_rate": 0.0001663091352144936, "loss": 0.0109, "step": 176660 }, { "epoch": 0.89, "learning_rate": 0.00016630156752147962, "loss": 0.0146, "step": 176670 }, { "epoch": 0.89, "learning_rate": 0.0001662939998284656, "loss": 0.0109, "step": 176680 }, { "epoch": 0.89, "learning_rate": 0.00016628643213545158, "loss": 0.0111, "step": 176690 }, { "epoch": 0.89, "learning_rate": 0.00016627886444243756, "loss": 0.0116, "step": 176700 }, { "epoch": 0.89, "learning_rate": 0.00016627129674942357, "loss": 0.0106, "step": 176710 }, { "epoch": 0.89, "learning_rate": 0.00016626372905640955, "loss": 0.0113, "step": 176720 }, { "epoch": 0.89, "learning_rate": 0.00016625616136339553, "loss": 0.0096, "step": 176730 }, { "epoch": 0.89, "learning_rate": 0.00016624859367038154, "loss": 0.0116, "step": 176740 }, { "epoch": 0.89, "learning_rate": 0.00016624102597736752, "loss": 0.0119, "step": 176750 }, { "epoch": 0.89, "learning_rate": 0.0001662334582843535, "loss": 0.0125, "step": 176760 }, { "epoch": 0.89, "learning_rate": 0.00016622589059133951, "loss": 0.0121, "step": 176770 }, { "epoch": 0.89, "learning_rate": 0.0001662183228983255, "loss": 0.0131, "step": 176780 }, { "epoch": 0.89, "learning_rate": 0.00016621075520531148, "loss": 0.0092, "step": 176790 }, { "epoch": 0.89, "learning_rate": 0.00016620318751229749, "loss": 0.0084, "step": 176800 }, { "epoch": 0.89, "learning_rate": 0.00016619561981928347, "loss": 0.0123, "step": 176810 }, { "epoch": 0.89, "learning_rate": 0.00016618805212626945, "loss": 0.0105, "step": 176820 }, { "epoch": 0.89, "learning_rate": 0.00016618048443325546, "loss": 0.0109, "step": 176830 }, { "epoch": 0.89, "learning_rate": 0.00016617291674024144, "loss": 0.0094, "step": 176840 }, { "epoch": 0.89, "learning_rate": 0.00016616534904722742, "loss": 0.012, "step": 176850 }, { "epoch": 0.89, "learning_rate": 0.00016615778135421343, "loss": 0.012, "step": 176860 }, { "epoch": 0.89, "learning_rate": 0.0001661502136611994, "loss": 0.0131, "step": 176870 }, { "epoch": 0.89, "learning_rate": 0.0001661426459681854, "loss": 0.0097, "step": 176880 }, { "epoch": 0.89, "learning_rate": 0.00016613507827517137, "loss": 0.0148, "step": 176890 }, { "epoch": 0.89, "learning_rate": 0.00016612751058215738, "loss": 0.0123, "step": 176900 }, { "epoch": 0.89, "learning_rate": 0.00016611994288914336, "loss": 0.0119, "step": 176910 }, { "epoch": 0.89, "learning_rate": 0.00016611237519612934, "loss": 0.0106, "step": 176920 }, { "epoch": 0.89, "learning_rate": 0.00016610480750311535, "loss": 0.0088, "step": 176930 }, { "epoch": 0.89, "learning_rate": 0.00016609723981010133, "loss": 0.0113, "step": 176940 }, { "epoch": 0.89, "learning_rate": 0.00016608967211708732, "loss": 0.0096, "step": 176950 }, { "epoch": 0.89, "learning_rate": 0.00016608210442407332, "loss": 0.0113, "step": 176960 }, { "epoch": 0.89, "learning_rate": 0.0001660745367310593, "loss": 0.0123, "step": 176970 }, { "epoch": 0.89, "learning_rate": 0.0001660669690380453, "loss": 0.0134, "step": 176980 }, { "epoch": 0.89, "learning_rate": 0.0001660594013450313, "loss": 0.0113, "step": 176990 }, { "epoch": 0.89, "learning_rate": 0.00016605183365201728, "loss": 0.0093, "step": 177000 }, { "epoch": 0.89, "eval_cer": 0.9144896638256703, "eval_loss": 0.00848294422030449, "eval_runtime": 116.4993, "eval_samples_per_second": 17.167, "eval_steps_per_second": 4.292, "step": 177000 }, { "epoch": 0.89, "learning_rate": 0.00016604426595900326, "loss": 0.0126, "step": 177010 }, { "epoch": 0.89, "learning_rate": 0.00016603669826598927, "loss": 0.0146, "step": 177020 }, { "epoch": 0.89, "learning_rate": 0.00016602913057297525, "loss": 0.013, "step": 177030 }, { "epoch": 0.89, "learning_rate": 0.00016602156287996123, "loss": 0.0131, "step": 177040 }, { "epoch": 0.89, "learning_rate": 0.0001660139951869472, "loss": 0.0125, "step": 177050 }, { "epoch": 0.89, "learning_rate": 0.00016600642749393322, "loss": 0.0099, "step": 177060 }, { "epoch": 0.89, "learning_rate": 0.0001659988598009192, "loss": 0.0114, "step": 177070 }, { "epoch": 0.89, "learning_rate": 0.00016599129210790518, "loss": 0.0134, "step": 177080 }, { "epoch": 0.89, "learning_rate": 0.0001659837244148912, "loss": 0.018, "step": 177090 }, { "epoch": 0.89, "learning_rate": 0.00016597615672187717, "loss": 0.0149, "step": 177100 }, { "epoch": 0.89, "learning_rate": 0.00016596858902886315, "loss": 0.0111, "step": 177110 }, { "epoch": 0.89, "learning_rate": 0.00016596102133584916, "loss": 0.0115, "step": 177120 }, { "epoch": 0.89, "learning_rate": 0.00016595345364283514, "loss": 0.0112, "step": 177130 }, { "epoch": 0.89, "learning_rate": 0.00016594588594982113, "loss": 0.0123, "step": 177140 }, { "epoch": 0.89, "learning_rate": 0.00016593831825680713, "loss": 0.0109, "step": 177150 }, { "epoch": 0.89, "learning_rate": 0.00016593075056379312, "loss": 0.0133, "step": 177160 }, { "epoch": 0.89, "learning_rate": 0.0001659231828707791, "loss": 0.012, "step": 177170 }, { "epoch": 0.89, "learning_rate": 0.0001659156151777651, "loss": 0.0112, "step": 177180 }, { "epoch": 0.89, "learning_rate": 0.0001659080474847511, "loss": 0.011, "step": 177190 }, { "epoch": 0.89, "learning_rate": 0.00016590047979173707, "loss": 0.0091, "step": 177200 }, { "epoch": 0.89, "learning_rate": 0.00016589291209872305, "loss": 0.0114, "step": 177210 }, { "epoch": 0.89, "learning_rate": 0.00016588534440570906, "loss": 0.0109, "step": 177220 }, { "epoch": 0.89, "learning_rate": 0.00016587777671269504, "loss": 0.0131, "step": 177230 }, { "epoch": 0.89, "learning_rate": 0.00016587020901968102, "loss": 0.0106, "step": 177240 }, { "epoch": 0.89, "learning_rate": 0.00016586264132666703, "loss": 0.0126, "step": 177250 }, { "epoch": 0.89, "learning_rate": 0.000165855073633653, "loss": 0.011, "step": 177260 }, { "epoch": 0.89, "learning_rate": 0.000165847505940639, "loss": 0.0116, "step": 177270 }, { "epoch": 0.89, "learning_rate": 0.000165839938247625, "loss": 0.0139, "step": 177280 }, { "epoch": 0.89, "learning_rate": 0.00016583237055461098, "loss": 0.0102, "step": 177290 }, { "epoch": 0.89, "learning_rate": 0.00016582480286159696, "loss": 0.0112, "step": 177300 }, { "epoch": 0.89, "learning_rate": 0.00016581723516858297, "loss": 0.013, "step": 177310 }, { "epoch": 0.89, "learning_rate": 0.00016580966747556895, "loss": 0.0123, "step": 177320 }, { "epoch": 0.89, "learning_rate": 0.00016580209978255494, "loss": 0.0143, "step": 177330 }, { "epoch": 0.89, "learning_rate": 0.00016579453208954094, "loss": 0.0107, "step": 177340 }, { "epoch": 0.89, "learning_rate": 0.00016578696439652693, "loss": 0.0089, "step": 177350 }, { "epoch": 0.89, "learning_rate": 0.0001657793967035129, "loss": 0.0101, "step": 177360 }, { "epoch": 0.89, "learning_rate": 0.0001657718290104989, "loss": 0.0096, "step": 177370 }, { "epoch": 0.89, "learning_rate": 0.0001657642613174849, "loss": 0.0106, "step": 177380 }, { "epoch": 0.89, "learning_rate": 0.00016575669362447088, "loss": 0.0082, "step": 177390 }, { "epoch": 0.9, "learning_rate": 0.00016574912593145686, "loss": 0.0158, "step": 177400 }, { "epoch": 0.9, "learning_rate": 0.00016574155823844287, "loss": 0.0124, "step": 177410 }, { "epoch": 0.9, "learning_rate": 0.00016573399054542885, "loss": 0.0128, "step": 177420 }, { "epoch": 0.9, "learning_rate": 0.00016572642285241483, "loss": 0.0123, "step": 177430 }, { "epoch": 0.9, "learning_rate": 0.00016571885515940084, "loss": 0.0099, "step": 177440 }, { "epoch": 0.9, "learning_rate": 0.00016571128746638682, "loss": 0.0121, "step": 177450 }, { "epoch": 0.9, "learning_rate": 0.0001657037197733728, "loss": 0.0099, "step": 177460 }, { "epoch": 0.9, "learning_rate": 0.0001656961520803588, "loss": 0.0106, "step": 177470 }, { "epoch": 0.9, "learning_rate": 0.0001656885843873448, "loss": 0.0113, "step": 177480 }, { "epoch": 0.9, "learning_rate": 0.00016568101669433077, "loss": 0.0092, "step": 177490 }, { "epoch": 0.9, "learning_rate": 0.00016567344900131678, "loss": 0.0106, "step": 177500 }, { "epoch": 0.9, "learning_rate": 0.00016566588130830276, "loss": 0.0098, "step": 177510 }, { "epoch": 0.9, "learning_rate": 0.00016565831361528875, "loss": 0.0162, "step": 177520 }, { "epoch": 0.9, "learning_rate": 0.00016565074592227475, "loss": 0.0133, "step": 177530 }, { "epoch": 0.9, "learning_rate": 0.00016564317822926074, "loss": 0.0104, "step": 177540 }, { "epoch": 0.9, "learning_rate": 0.00016563561053624672, "loss": 0.0091, "step": 177550 }, { "epoch": 0.9, "learning_rate": 0.0001656280428432327, "loss": 0.0135, "step": 177560 }, { "epoch": 0.9, "learning_rate": 0.0001656204751502187, "loss": 0.0117, "step": 177570 }, { "epoch": 0.9, "learning_rate": 0.0001656129074572047, "loss": 0.01, "step": 177580 }, { "epoch": 0.9, "learning_rate": 0.00016560533976419067, "loss": 0.0166, "step": 177590 }, { "epoch": 0.9, "learning_rate": 0.00016559777207117668, "loss": 0.0102, "step": 177600 }, { "epoch": 0.9, "learning_rate": 0.00016559020437816266, "loss": 0.0112, "step": 177610 }, { "epoch": 0.9, "learning_rate": 0.00016558263668514864, "loss": 0.0122, "step": 177620 }, { "epoch": 0.9, "learning_rate": 0.00016557506899213465, "loss": 0.0108, "step": 177630 }, { "epoch": 0.9, "learning_rate": 0.00016556750129912063, "loss": 0.0107, "step": 177640 }, { "epoch": 0.9, "learning_rate": 0.0001655599336061066, "loss": 0.0129, "step": 177650 }, { "epoch": 0.9, "learning_rate": 0.00016555236591309262, "loss": 0.0106, "step": 177660 }, { "epoch": 0.9, "learning_rate": 0.0001655447982200786, "loss": 0.0116, "step": 177670 }, { "epoch": 0.9, "learning_rate": 0.00016553723052706458, "loss": 0.0121, "step": 177680 }, { "epoch": 0.9, "learning_rate": 0.0001655296628340506, "loss": 0.0112, "step": 177690 }, { "epoch": 0.9, "learning_rate": 0.00016552209514103657, "loss": 0.0124, "step": 177700 }, { "epoch": 0.9, "learning_rate": 0.00016551452744802256, "loss": 0.0113, "step": 177710 }, { "epoch": 0.9, "learning_rate": 0.00016550695975500854, "loss": 0.0122, "step": 177720 }, { "epoch": 0.9, "learning_rate": 0.00016549939206199455, "loss": 0.0115, "step": 177730 }, { "epoch": 0.9, "learning_rate": 0.00016549182436898053, "loss": 0.0121, "step": 177740 }, { "epoch": 0.9, "learning_rate": 0.0001654842566759665, "loss": 0.0118, "step": 177750 }, { "epoch": 0.9, "learning_rate": 0.00016547668898295252, "loss": 0.0126, "step": 177760 }, { "epoch": 0.9, "learning_rate": 0.0001654691212899385, "loss": 0.0077, "step": 177770 }, { "epoch": 0.9, "learning_rate": 0.00016546155359692448, "loss": 0.0153, "step": 177780 }, { "epoch": 0.9, "learning_rate": 0.0001654539859039105, "loss": 0.012, "step": 177790 }, { "epoch": 0.9, "learning_rate": 0.00016544641821089647, "loss": 0.0099, "step": 177800 }, { "epoch": 0.9, "learning_rate": 0.00016543885051788245, "loss": 0.0112, "step": 177810 }, { "epoch": 0.9, "learning_rate": 0.00016543128282486846, "loss": 0.0144, "step": 177820 }, { "epoch": 0.9, "learning_rate": 0.00016542371513185444, "loss": 0.0089, "step": 177830 }, { "epoch": 0.9, "learning_rate": 0.00016541614743884042, "loss": 0.0104, "step": 177840 }, { "epoch": 0.9, "learning_rate": 0.00016540857974582638, "loss": 0.0141, "step": 177850 }, { "epoch": 0.9, "learning_rate": 0.00016540101205281239, "loss": 0.0095, "step": 177860 }, { "epoch": 0.9, "learning_rate": 0.00016539344435979837, "loss": 0.0119, "step": 177870 }, { "epoch": 0.9, "learning_rate": 0.00016538587666678435, "loss": 0.0143, "step": 177880 }, { "epoch": 0.9, "learning_rate": 0.00016537830897377036, "loss": 0.0156, "step": 177890 }, { "epoch": 0.9, "learning_rate": 0.00016537074128075634, "loss": 0.0145, "step": 177900 }, { "epoch": 0.9, "learning_rate": 0.00016536317358774232, "loss": 0.0121, "step": 177910 }, { "epoch": 0.9, "learning_rate": 0.00016535560589472833, "loss": 0.0112, "step": 177920 }, { "epoch": 0.9, "learning_rate": 0.0001653480382017143, "loss": 0.0126, "step": 177930 }, { "epoch": 0.9, "learning_rate": 0.0001653404705087003, "loss": 0.0139, "step": 177940 }, { "epoch": 0.9, "learning_rate": 0.00016533290281568627, "loss": 0.0114, "step": 177950 }, { "epoch": 0.9, "learning_rate": 0.00016532533512267228, "loss": 0.0107, "step": 177960 }, { "epoch": 0.9, "learning_rate": 0.00016531776742965826, "loss": 0.014, "step": 177970 }, { "epoch": 0.9, "learning_rate": 0.00016531019973664424, "loss": 0.0126, "step": 177980 }, { "epoch": 0.9, "learning_rate": 0.00016530263204363025, "loss": 0.0126, "step": 177990 }, { "epoch": 0.9, "learning_rate": 0.00016529506435061623, "loss": 0.0134, "step": 178000 }, { "epoch": 0.9, "eval_cer": 0.9144828710527925, "eval_loss": 0.008248904719948769, "eval_runtime": 116.6185, "eval_samples_per_second": 17.15, "eval_steps_per_second": 4.287, "step": 178000 }, { "epoch": 0.9, "learning_rate": 0.00016528749665760222, "loss": 0.0122, "step": 178010 }, { "epoch": 0.9, "learning_rate": 0.00016527992896458822, "loss": 0.0117, "step": 178020 }, { "epoch": 0.9, "learning_rate": 0.0001652723612715742, "loss": 0.0117, "step": 178030 }, { "epoch": 0.9, "learning_rate": 0.0001652647935785602, "loss": 0.0159, "step": 178040 }, { "epoch": 0.9, "learning_rate": 0.0001652572258855462, "loss": 0.0093, "step": 178050 }, { "epoch": 0.9, "learning_rate": 0.00016524965819253218, "loss": 0.0128, "step": 178060 }, { "epoch": 0.9, "learning_rate": 0.00016524209049951816, "loss": 0.0107, "step": 178070 }, { "epoch": 0.9, "learning_rate": 0.00016523452280650417, "loss": 0.011, "step": 178080 }, { "epoch": 0.9, "learning_rate": 0.00016522695511349015, "loss": 0.0162, "step": 178090 }, { "epoch": 0.9, "learning_rate": 0.00016521938742047613, "loss": 0.0101, "step": 178100 }, { "epoch": 0.9, "learning_rate": 0.0001652118197274621, "loss": 0.0091, "step": 178110 }, { "epoch": 0.9, "learning_rate": 0.00016520425203444812, "loss": 0.013, "step": 178120 }, { "epoch": 0.9, "learning_rate": 0.0001651966843414341, "loss": 0.0117, "step": 178130 }, { "epoch": 0.9, "learning_rate": 0.00016518911664842008, "loss": 0.0081, "step": 178140 }, { "epoch": 0.9, "learning_rate": 0.0001651815489554061, "loss": 0.0124, "step": 178150 }, { "epoch": 0.9, "learning_rate": 0.00016517398126239207, "loss": 0.0127, "step": 178160 }, { "epoch": 0.9, "learning_rate": 0.00016516641356937805, "loss": 0.0122, "step": 178170 }, { "epoch": 0.9, "learning_rate": 0.00016515884587636406, "loss": 0.0115, "step": 178180 }, { "epoch": 0.9, "learning_rate": 0.00016515127818335004, "loss": 0.0107, "step": 178190 }, { "epoch": 0.9, "learning_rate": 0.00016514371049033603, "loss": 0.0114, "step": 178200 }, { "epoch": 0.9, "learning_rate": 0.00016513614279732203, "loss": 0.0128, "step": 178210 }, { "epoch": 0.9, "learning_rate": 0.00016512857510430802, "loss": 0.0123, "step": 178220 }, { "epoch": 0.9, "learning_rate": 0.000165121007411294, "loss": 0.0114, "step": 178230 }, { "epoch": 0.9, "learning_rate": 0.00016511343971828, "loss": 0.0152, "step": 178240 }, { "epoch": 0.9, "learning_rate": 0.000165105872025266, "loss": 0.0131, "step": 178250 }, { "epoch": 0.9, "learning_rate": 0.00016509830433225197, "loss": 0.0113, "step": 178260 }, { "epoch": 0.9, "learning_rate": 0.00016509073663923795, "loss": 0.0172, "step": 178270 }, { "epoch": 0.9, "learning_rate": 0.00016508316894622396, "loss": 0.0128, "step": 178280 }, { "epoch": 0.9, "learning_rate": 0.00016507560125320994, "loss": 0.013, "step": 178290 }, { "epoch": 0.9, "learning_rate": 0.00016506803356019592, "loss": 0.0119, "step": 178300 }, { "epoch": 0.9, "learning_rate": 0.00016506046586718193, "loss": 0.0099, "step": 178310 }, { "epoch": 0.9, "learning_rate": 0.0001650528981741679, "loss": 0.0118, "step": 178320 }, { "epoch": 0.9, "learning_rate": 0.0001650453304811539, "loss": 0.0095, "step": 178330 }, { "epoch": 0.9, "learning_rate": 0.0001650377627881399, "loss": 0.0099, "step": 178340 }, { "epoch": 0.9, "learning_rate": 0.00016503019509512588, "loss": 0.0137, "step": 178350 }, { "epoch": 0.9, "learning_rate": 0.00016502262740211186, "loss": 0.011, "step": 178360 }, { "epoch": 0.9, "learning_rate": 0.00016501505970909787, "loss": 0.0138, "step": 178370 }, { "epoch": 0.9, "learning_rate": 0.00016500749201608385, "loss": 0.0089, "step": 178380 }, { "epoch": 0.9, "learning_rate": 0.00016499992432306984, "loss": 0.0141, "step": 178390 }, { "epoch": 0.9, "learning_rate": 0.00016499235663005584, "loss": 0.0121, "step": 178400 }, { "epoch": 0.9, "learning_rate": 0.00016498478893704183, "loss": 0.013, "step": 178410 }, { "epoch": 0.9, "learning_rate": 0.0001649772212440278, "loss": 0.0124, "step": 178420 }, { "epoch": 0.9, "learning_rate": 0.00016496965355101382, "loss": 0.0107, "step": 178430 }, { "epoch": 0.9, "learning_rate": 0.0001649620858579998, "loss": 0.0146, "step": 178440 }, { "epoch": 0.9, "learning_rate": 0.00016495451816498578, "loss": 0.0133, "step": 178450 }, { "epoch": 0.9, "learning_rate": 0.00016494695047197176, "loss": 0.0119, "step": 178460 }, { "epoch": 0.9, "learning_rate": 0.00016493938277895777, "loss": 0.0093, "step": 178470 }, { "epoch": 0.9, "learning_rate": 0.00016493181508594375, "loss": 0.0112, "step": 178480 }, { "epoch": 0.9, "learning_rate": 0.00016492424739292973, "loss": 0.0208, "step": 178490 }, { "epoch": 0.9, "learning_rate": 0.00016491667969991574, "loss": 0.0219, "step": 178500 }, { "epoch": 0.9, "learning_rate": 0.00016490911200690172, "loss": 0.0107, "step": 178510 }, { "epoch": 0.9, "learning_rate": 0.0001649015443138877, "loss": 0.0267, "step": 178520 }, { "epoch": 0.9, "learning_rate": 0.0001648939766208737, "loss": 0.0128, "step": 178530 }, { "epoch": 0.9, "learning_rate": 0.0001648864089278597, "loss": 0.0128, "step": 178540 }, { "epoch": 0.9, "learning_rate": 0.00016487884123484567, "loss": 0.0115, "step": 178550 }, { "epoch": 0.9, "learning_rate": 0.00016487127354183168, "loss": 0.0133, "step": 178560 }, { "epoch": 0.9, "learning_rate": 0.00016486370584881766, "loss": 0.0131, "step": 178570 }, { "epoch": 0.9, "learning_rate": 0.00016485613815580365, "loss": 0.0102, "step": 178580 }, { "epoch": 0.9, "learning_rate": 0.00016484857046278965, "loss": 0.0105, "step": 178590 }, { "epoch": 0.9, "learning_rate": 0.00016484100276977564, "loss": 0.0111, "step": 178600 }, { "epoch": 0.9, "learning_rate": 0.00016483343507676162, "loss": 0.012, "step": 178610 }, { "epoch": 0.9, "learning_rate": 0.0001648258673837476, "loss": 0.0086, "step": 178620 }, { "epoch": 0.9, "learning_rate": 0.0001648182996907336, "loss": 0.0113, "step": 178630 }, { "epoch": 0.9, "learning_rate": 0.0001648107319977196, "loss": 0.0101, "step": 178640 }, { "epoch": 0.9, "learning_rate": 0.00016480316430470557, "loss": 0.0119, "step": 178650 }, { "epoch": 0.9, "learning_rate": 0.00016479559661169158, "loss": 0.0107, "step": 178660 }, { "epoch": 0.9, "learning_rate": 0.00016478802891867756, "loss": 0.0094, "step": 178670 }, { "epoch": 0.9, "learning_rate": 0.00016478046122566354, "loss": 0.0101, "step": 178680 }, { "epoch": 0.9, "learning_rate": 0.00016477289353264955, "loss": 0.0115, "step": 178690 }, { "epoch": 0.9, "learning_rate": 0.00016476532583963553, "loss": 0.01, "step": 178700 }, { "epoch": 0.9, "learning_rate": 0.0001647577581466215, "loss": 0.0104, "step": 178710 }, { "epoch": 0.9, "learning_rate": 0.00016475019045360752, "loss": 0.0112, "step": 178720 }, { "epoch": 0.9, "learning_rate": 0.0001647426227605935, "loss": 0.0117, "step": 178730 }, { "epoch": 0.9, "learning_rate": 0.00016473505506757948, "loss": 0.0123, "step": 178740 }, { "epoch": 0.9, "learning_rate": 0.0001647274873745655, "loss": 0.0158, "step": 178750 }, { "epoch": 0.9, "learning_rate": 0.00016471991968155147, "loss": 0.0112, "step": 178760 }, { "epoch": 0.9, "learning_rate": 0.00016471235198853746, "loss": 0.0115, "step": 178770 }, { "epoch": 0.9, "learning_rate": 0.00016470478429552344, "loss": 0.0109, "step": 178780 }, { "epoch": 0.9, "learning_rate": 0.00016469721660250945, "loss": 0.0146, "step": 178790 }, { "epoch": 0.9, "learning_rate": 0.00016468964890949543, "loss": 0.0112, "step": 178800 }, { "epoch": 0.9, "learning_rate": 0.0001646820812164814, "loss": 0.0119, "step": 178810 }, { "epoch": 0.9, "learning_rate": 0.00016467451352346742, "loss": 0.0112, "step": 178820 }, { "epoch": 0.9, "learning_rate": 0.0001646669458304534, "loss": 0.0146, "step": 178830 }, { "epoch": 0.9, "learning_rate": 0.00016465937813743938, "loss": 0.0134, "step": 178840 }, { "epoch": 0.9, "learning_rate": 0.0001646518104444254, "loss": 0.012, "step": 178850 }, { "epoch": 0.9, "learning_rate": 0.00016464424275141137, "loss": 0.0108, "step": 178860 }, { "epoch": 0.9, "learning_rate": 0.00016463667505839735, "loss": 0.0084, "step": 178870 }, { "epoch": 0.9, "learning_rate": 0.00016462910736538336, "loss": 0.0092, "step": 178880 }, { "epoch": 0.9, "learning_rate": 0.00016462153967236934, "loss": 0.0154, "step": 178890 }, { "epoch": 0.9, "learning_rate": 0.00016461397197935532, "loss": 0.0109, "step": 178900 }, { "epoch": 0.9, "learning_rate": 0.00016460640428634133, "loss": 0.0132, "step": 178910 }, { "epoch": 0.9, "learning_rate": 0.0001645988365933273, "loss": 0.0105, "step": 178920 }, { "epoch": 0.9, "learning_rate": 0.0001645912689003133, "loss": 0.0105, "step": 178930 }, { "epoch": 0.9, "learning_rate": 0.0001645837012072993, "loss": 0.0108, "step": 178940 }, { "epoch": 0.9, "learning_rate": 0.00016457613351428528, "loss": 0.0109, "step": 178950 }, { "epoch": 0.9, "learning_rate": 0.00016456856582127127, "loss": 0.0113, "step": 178960 }, { "epoch": 0.9, "learning_rate": 0.00016456099812825725, "loss": 0.0142, "step": 178970 }, { "epoch": 0.9, "learning_rate": 0.00016455343043524326, "loss": 0.0113, "step": 178980 }, { "epoch": 0.9, "learning_rate": 0.00016454586274222924, "loss": 0.0103, "step": 178990 }, { "epoch": 0.9, "learning_rate": 0.00016453829504921522, "loss": 0.0116, "step": 179000 }, { "epoch": 0.9, "eval_cer": 0.914462492734159, "eval_loss": 0.008126331493258476, "eval_runtime": 116.7985, "eval_samples_per_second": 17.124, "eval_steps_per_second": 4.281, "step": 179000 }, { "epoch": 0.9, "learning_rate": 0.00016453072735620123, "loss": 0.0122, "step": 179010 }, { "epoch": 0.9, "learning_rate": 0.0001645231596631872, "loss": 0.0112, "step": 179020 }, { "epoch": 0.9, "learning_rate": 0.0001645155919701732, "loss": 0.0103, "step": 179030 }, { "epoch": 0.9, "learning_rate": 0.0001645080242771592, "loss": 0.0118, "step": 179040 }, { "epoch": 0.9, "learning_rate": 0.00016450045658414518, "loss": 0.0124, "step": 179050 }, { "epoch": 0.9, "learning_rate": 0.00016449288889113116, "loss": 0.0115, "step": 179060 }, { "epoch": 0.9, "learning_rate": 0.00016448532119811717, "loss": 0.0093, "step": 179070 }, { "epoch": 0.9, "learning_rate": 0.00016447775350510315, "loss": 0.0099, "step": 179080 }, { "epoch": 0.9, "learning_rate": 0.00016447018581208913, "loss": 0.0112, "step": 179090 }, { "epoch": 0.9, "learning_rate": 0.00016446261811907514, "loss": 0.011, "step": 179100 }, { "epoch": 0.9, "learning_rate": 0.0001644550504260611, "loss": 0.0172, "step": 179110 }, { "epoch": 0.9, "learning_rate": 0.00016444748273304708, "loss": 0.0158, "step": 179120 }, { "epoch": 0.9, "learning_rate": 0.00016443991504003306, "loss": 0.0119, "step": 179130 }, { "epoch": 0.9, "learning_rate": 0.00016443234734701907, "loss": 0.0134, "step": 179140 }, { "epoch": 0.9, "learning_rate": 0.00016442477965400505, "loss": 0.0099, "step": 179150 }, { "epoch": 0.9, "learning_rate": 0.00016441721196099103, "loss": 0.0115, "step": 179160 }, { "epoch": 0.9, "learning_rate": 0.000164409644267977, "loss": 0.0117, "step": 179170 }, { "epoch": 0.9, "learning_rate": 0.00016440207657496302, "loss": 0.0097, "step": 179180 }, { "epoch": 0.9, "learning_rate": 0.000164394508881949, "loss": 0.0103, "step": 179190 }, { "epoch": 0.9, "learning_rate": 0.00016438694118893498, "loss": 0.0105, "step": 179200 }, { "epoch": 0.9, "learning_rate": 0.000164379373495921, "loss": 0.0112, "step": 179210 }, { "epoch": 0.9, "learning_rate": 0.00016437180580290697, "loss": 0.0147, "step": 179220 }, { "epoch": 0.9, "learning_rate": 0.00016436423810989295, "loss": 0.0154, "step": 179230 }, { "epoch": 0.9, "learning_rate": 0.00016435667041687896, "loss": 0.0091, "step": 179240 }, { "epoch": 0.9, "learning_rate": 0.00016434910272386494, "loss": 0.0099, "step": 179250 }, { "epoch": 0.9, "learning_rate": 0.00016434153503085093, "loss": 0.0115, "step": 179260 }, { "epoch": 0.9, "learning_rate": 0.00016433396733783693, "loss": 0.0138, "step": 179270 }, { "epoch": 0.9, "learning_rate": 0.00016432639964482292, "loss": 0.0116, "step": 179280 }, { "epoch": 0.9, "learning_rate": 0.0001643188319518089, "loss": 0.0104, "step": 179290 }, { "epoch": 0.9, "learning_rate": 0.0001643112642587949, "loss": 0.0115, "step": 179300 }, { "epoch": 0.9, "learning_rate": 0.0001643036965657809, "loss": 0.0136, "step": 179310 }, { "epoch": 0.9, "learning_rate": 0.00016429612887276687, "loss": 0.0123, "step": 179320 }, { "epoch": 0.9, "learning_rate": 0.00016428856117975288, "loss": 0.0089, "step": 179330 }, { "epoch": 0.9, "learning_rate": 0.00016428099348673886, "loss": 0.0113, "step": 179340 }, { "epoch": 0.9, "learning_rate": 0.00016427342579372484, "loss": 0.0096, "step": 179350 }, { "epoch": 0.9, "learning_rate": 0.00016426585810071082, "loss": 0.0138, "step": 179360 }, { "epoch": 0.9, "learning_rate": 0.00016425829040769683, "loss": 0.0143, "step": 179370 }, { "epoch": 0.9, "learning_rate": 0.0001642507227146828, "loss": 0.011, "step": 179380 }, { "epoch": 0.91, "learning_rate": 0.0001642431550216688, "loss": 0.016, "step": 179390 }, { "epoch": 0.91, "learning_rate": 0.0001642355873286548, "loss": 0.0085, "step": 179400 }, { "epoch": 0.91, "learning_rate": 0.00016422801963564078, "loss": 0.0114, "step": 179410 }, { "epoch": 0.91, "learning_rate": 0.00016422045194262676, "loss": 0.0136, "step": 179420 }, { "epoch": 0.91, "learning_rate": 0.00016421288424961277, "loss": 0.0112, "step": 179430 }, { "epoch": 0.91, "learning_rate": 0.00016420531655659875, "loss": 0.0095, "step": 179440 }, { "epoch": 0.91, "learning_rate": 0.00016419774886358474, "loss": 0.0133, "step": 179450 }, { "epoch": 0.91, "learning_rate": 0.00016419018117057074, "loss": 0.0114, "step": 179460 }, { "epoch": 0.91, "learning_rate": 0.00016418261347755673, "loss": 0.0114, "step": 179470 }, { "epoch": 0.91, "learning_rate": 0.0001641750457845427, "loss": 0.0123, "step": 179480 }, { "epoch": 0.91, "learning_rate": 0.00016416747809152872, "loss": 0.0099, "step": 179490 }, { "epoch": 0.91, "learning_rate": 0.0001641599103985147, "loss": 0.0091, "step": 179500 }, { "epoch": 0.91, "learning_rate": 0.00016415234270550068, "loss": 0.0111, "step": 179510 }, { "epoch": 0.91, "learning_rate": 0.00016414477501248666, "loss": 0.0107, "step": 179520 }, { "epoch": 0.91, "learning_rate": 0.00016413720731947267, "loss": 0.0132, "step": 179530 }, { "epoch": 0.91, "learning_rate": 0.00016412963962645865, "loss": 0.013, "step": 179540 }, { "epoch": 0.91, "learning_rate": 0.00016412207193344463, "loss": 0.0153, "step": 179550 }, { "epoch": 0.91, "learning_rate": 0.00016411450424043064, "loss": 0.0129, "step": 179560 }, { "epoch": 0.91, "learning_rate": 0.00016410693654741662, "loss": 0.0094, "step": 179570 }, { "epoch": 0.91, "learning_rate": 0.0001640993688544026, "loss": 0.0216, "step": 179580 }, { "epoch": 0.91, "learning_rate": 0.0001640918011613886, "loss": 0.0112, "step": 179590 }, { "epoch": 0.91, "learning_rate": 0.0001640842334683746, "loss": 0.0135, "step": 179600 }, { "epoch": 0.91, "learning_rate": 0.00016407666577536058, "loss": 0.0111, "step": 179610 }, { "epoch": 0.91, "learning_rate": 0.00016406909808234658, "loss": 0.0102, "step": 179620 }, { "epoch": 0.91, "learning_rate": 0.00016406153038933257, "loss": 0.0128, "step": 179630 }, { "epoch": 0.91, "learning_rate": 0.00016405396269631855, "loss": 0.0116, "step": 179640 }, { "epoch": 0.91, "learning_rate": 0.00016404639500330455, "loss": 0.0101, "step": 179650 }, { "epoch": 0.91, "learning_rate": 0.00016403882731029054, "loss": 0.0109, "step": 179660 }, { "epoch": 0.91, "learning_rate": 0.00016403125961727652, "loss": 0.0108, "step": 179670 }, { "epoch": 0.91, "learning_rate": 0.0001640236919242625, "loss": 0.0129, "step": 179680 }, { "epoch": 0.91, "learning_rate": 0.0001640161242312485, "loss": 0.017, "step": 179690 }, { "epoch": 0.91, "learning_rate": 0.0001640085565382345, "loss": 0.0116, "step": 179700 }, { "epoch": 0.91, "learning_rate": 0.00016400098884522047, "loss": 0.0136, "step": 179710 }, { "epoch": 0.91, "learning_rate": 0.00016399342115220648, "loss": 0.0121, "step": 179720 }, { "epoch": 0.91, "learning_rate": 0.00016398585345919246, "loss": 0.0084, "step": 179730 }, { "epoch": 0.91, "learning_rate": 0.00016397828576617844, "loss": 0.0114, "step": 179740 }, { "epoch": 0.91, "learning_rate": 0.00016397071807316445, "loss": 0.0114, "step": 179750 }, { "epoch": 0.91, "learning_rate": 0.00016396315038015043, "loss": 0.0088, "step": 179760 }, { "epoch": 0.91, "learning_rate": 0.00016395558268713641, "loss": 0.0116, "step": 179770 }, { "epoch": 0.91, "learning_rate": 0.00016394801499412242, "loss": 0.0152, "step": 179780 }, { "epoch": 0.91, "learning_rate": 0.0001639404473011084, "loss": 0.0115, "step": 179790 }, { "epoch": 0.91, "learning_rate": 0.00016393287960809439, "loss": 0.0113, "step": 179800 }, { "epoch": 0.91, "learning_rate": 0.0001639253119150804, "loss": 0.0165, "step": 179810 }, { "epoch": 0.91, "learning_rate": 0.00016391774422206638, "loss": 0.0098, "step": 179820 }, { "epoch": 0.91, "learning_rate": 0.00016391017652905236, "loss": 0.0113, "step": 179830 }, { "epoch": 0.91, "learning_rate": 0.00016390260883603837, "loss": 0.0115, "step": 179840 }, { "epoch": 0.91, "learning_rate": 0.00016389504114302435, "loss": 0.0126, "step": 179850 }, { "epoch": 0.91, "learning_rate": 0.00016388747345001033, "loss": 0.0115, "step": 179860 }, { "epoch": 0.91, "learning_rate": 0.0001638799057569963, "loss": 0.0117, "step": 179870 }, { "epoch": 0.91, "learning_rate": 0.00016387233806398232, "loss": 0.0093, "step": 179880 }, { "epoch": 0.91, "learning_rate": 0.0001638647703709683, "loss": 0.0101, "step": 179890 }, { "epoch": 0.91, "learning_rate": 0.00016385720267795428, "loss": 0.0081, "step": 179900 }, { "epoch": 0.91, "learning_rate": 0.0001638496349849403, "loss": 0.0092, "step": 179910 }, { "epoch": 0.91, "learning_rate": 0.00016384206729192627, "loss": 0.01, "step": 179920 }, { "epoch": 0.91, "learning_rate": 0.00016383449959891225, "loss": 0.0094, "step": 179930 }, { "epoch": 0.91, "learning_rate": 0.00016382693190589826, "loss": 0.0129, "step": 179940 }, { "epoch": 0.91, "learning_rate": 0.00016381936421288424, "loss": 0.0149, "step": 179950 }, { "epoch": 0.91, "learning_rate": 0.00016381179651987022, "loss": 0.0094, "step": 179960 }, { "epoch": 0.91, "learning_rate": 0.00016380422882685623, "loss": 0.0134, "step": 179970 }, { "epoch": 0.91, "learning_rate": 0.00016379666113384221, "loss": 0.0091, "step": 179980 }, { "epoch": 0.91, "learning_rate": 0.0001637890934408282, "loss": 0.0098, "step": 179990 }, { "epoch": 0.91, "learning_rate": 0.0001637815257478142, "loss": 0.0102, "step": 180000 }, { "epoch": 0.91, "eval_cer": 0.9144857822411687, "eval_loss": 0.008224265649914742, "eval_runtime": 116.6551, "eval_samples_per_second": 17.145, "eval_steps_per_second": 4.286, "step": 180000 }, { "epoch": 0.91, "learning_rate": 0.00016377395805480019, "loss": 0.0104, "step": 180010 }, { "epoch": 0.91, "learning_rate": 0.00016376639036178617, "loss": 0.009, "step": 180020 }, { "epoch": 0.91, "learning_rate": 0.00016375882266877215, "loss": 0.0138, "step": 180030 }, { "epoch": 0.91, "learning_rate": 0.00016375125497575816, "loss": 0.0099, "step": 180040 }, { "epoch": 0.91, "learning_rate": 0.00016374368728274414, "loss": 0.0122, "step": 180050 }, { "epoch": 0.91, "learning_rate": 0.00016373611958973012, "loss": 0.0136, "step": 180060 }, { "epoch": 0.91, "learning_rate": 0.00016372855189671613, "loss": 0.0124, "step": 180070 }, { "epoch": 0.91, "learning_rate": 0.0001637209842037021, "loss": 0.012, "step": 180080 }, { "epoch": 0.91, "learning_rate": 0.0001637134165106881, "loss": 0.0144, "step": 180090 }, { "epoch": 0.91, "learning_rate": 0.0001637058488176741, "loss": 0.0098, "step": 180100 }, { "epoch": 0.91, "learning_rate": 0.00016369828112466008, "loss": 0.0116, "step": 180110 }, { "epoch": 0.91, "learning_rate": 0.00016369071343164606, "loss": 0.0117, "step": 180120 }, { "epoch": 0.91, "learning_rate": 0.00016368314573863207, "loss": 0.0141, "step": 180130 }, { "epoch": 0.91, "learning_rate": 0.00016367557804561805, "loss": 0.0137, "step": 180140 }, { "epoch": 0.91, "learning_rate": 0.00016366801035260403, "loss": 0.0102, "step": 180150 }, { "epoch": 0.91, "learning_rate": 0.00016366044265959004, "loss": 0.01, "step": 180160 }, { "epoch": 0.91, "learning_rate": 0.00016365287496657602, "loss": 0.0135, "step": 180170 }, { "epoch": 0.91, "learning_rate": 0.000163645307273562, "loss": 0.0099, "step": 180180 }, { "epoch": 0.91, "learning_rate": 0.000163637739580548, "loss": 0.0117, "step": 180190 }, { "epoch": 0.91, "learning_rate": 0.000163630171887534, "loss": 0.0101, "step": 180200 }, { "epoch": 0.91, "learning_rate": 0.00016362260419451998, "loss": 0.0106, "step": 180210 }, { "epoch": 0.91, "learning_rate": 0.00016361503650150596, "loss": 0.0133, "step": 180220 }, { "epoch": 0.91, "learning_rate": 0.00016360746880849197, "loss": 0.0111, "step": 180230 }, { "epoch": 0.91, "learning_rate": 0.00016359990111547795, "loss": 0.0166, "step": 180240 }, { "epoch": 0.91, "learning_rate": 0.00016359233342246393, "loss": 0.0103, "step": 180250 }, { "epoch": 0.91, "learning_rate": 0.00016358476572944994, "loss": 0.012, "step": 180260 }, { "epoch": 0.91, "learning_rate": 0.00016357719803643592, "loss": 0.0113, "step": 180270 }, { "epoch": 0.91, "learning_rate": 0.0001635696303434219, "loss": 0.0109, "step": 180280 }, { "epoch": 0.91, "learning_rate": 0.0001635620626504079, "loss": 0.0108, "step": 180290 }, { "epoch": 0.91, "learning_rate": 0.0001635544949573939, "loss": 0.0105, "step": 180300 }, { "epoch": 0.91, "learning_rate": 0.00016354692726437987, "loss": 0.0112, "step": 180310 }, { "epoch": 0.91, "learning_rate": 0.00016353935957136588, "loss": 0.0114, "step": 180320 }, { "epoch": 0.91, "learning_rate": 0.00016353179187835186, "loss": 0.0118, "step": 180330 }, { "epoch": 0.91, "learning_rate": 0.00016352422418533784, "loss": 0.009, "step": 180340 }, { "epoch": 0.91, "learning_rate": 0.00016351665649232383, "loss": 0.0114, "step": 180350 }, { "epoch": 0.91, "learning_rate": 0.00016350908879930983, "loss": 0.0112, "step": 180360 }, { "epoch": 0.91, "learning_rate": 0.0001635015211062958, "loss": 0.0081, "step": 180370 }, { "epoch": 0.91, "learning_rate": 0.00016349395341328177, "loss": 0.0107, "step": 180380 }, { "epoch": 0.91, "learning_rate": 0.00016348638572026778, "loss": 0.0115, "step": 180390 }, { "epoch": 0.91, "learning_rate": 0.00016347881802725376, "loss": 0.0102, "step": 180400 }, { "epoch": 0.91, "learning_rate": 0.00016347125033423974, "loss": 0.0083, "step": 180410 }, { "epoch": 0.91, "learning_rate": 0.00016346368264122572, "loss": 0.0111, "step": 180420 }, { "epoch": 0.91, "learning_rate": 0.00016345611494821173, "loss": 0.0124, "step": 180430 }, { "epoch": 0.91, "learning_rate": 0.0001634485472551977, "loss": 0.0153, "step": 180440 }, { "epoch": 0.91, "learning_rate": 0.0001634409795621837, "loss": 0.0101, "step": 180450 }, { "epoch": 0.91, "learning_rate": 0.0001634334118691697, "loss": 0.0124, "step": 180460 }, { "epoch": 0.91, "learning_rate": 0.00016342584417615568, "loss": 0.0147, "step": 180470 }, { "epoch": 0.91, "learning_rate": 0.00016341827648314167, "loss": 0.0126, "step": 180480 }, { "epoch": 0.91, "learning_rate": 0.00016341070879012767, "loss": 0.0176, "step": 180490 }, { "epoch": 0.91, "learning_rate": 0.00016340314109711366, "loss": 0.0105, "step": 180500 }, { "epoch": 0.91, "learning_rate": 0.00016339557340409964, "loss": 0.0094, "step": 180510 }, { "epoch": 0.91, "learning_rate": 0.00016338800571108565, "loss": 0.011, "step": 180520 }, { "epoch": 0.91, "learning_rate": 0.00016338043801807163, "loss": 0.014, "step": 180530 }, { "epoch": 0.91, "learning_rate": 0.0001633728703250576, "loss": 0.0174, "step": 180540 }, { "epoch": 0.91, "learning_rate": 0.00016336530263204362, "loss": 0.0089, "step": 180550 }, { "epoch": 0.91, "learning_rate": 0.0001633577349390296, "loss": 0.0105, "step": 180560 }, { "epoch": 0.91, "learning_rate": 0.00016335016724601558, "loss": 0.0146, "step": 180570 }, { "epoch": 0.91, "learning_rate": 0.00016334259955300156, "loss": 0.0176, "step": 180580 }, { "epoch": 0.91, "learning_rate": 0.00016333503185998757, "loss": 0.0107, "step": 180590 }, { "epoch": 0.91, "learning_rate": 0.00016332746416697355, "loss": 0.0103, "step": 180600 }, { "epoch": 0.91, "learning_rate": 0.00016331989647395953, "loss": 0.0107, "step": 180610 }, { "epoch": 0.91, "learning_rate": 0.00016331232878094554, "loss": 0.0107, "step": 180620 }, { "epoch": 0.91, "learning_rate": 0.00016330476108793152, "loss": 0.0095, "step": 180630 }, { "epoch": 0.91, "learning_rate": 0.0001632971933949175, "loss": 0.0116, "step": 180640 }, { "epoch": 0.91, "learning_rate": 0.0001632896257019035, "loss": 0.0131, "step": 180650 }, { "epoch": 0.91, "learning_rate": 0.0001632820580088895, "loss": 0.0107, "step": 180660 }, { "epoch": 0.91, "learning_rate": 0.00016327449031587548, "loss": 0.01, "step": 180670 }, { "epoch": 0.91, "learning_rate": 0.00016326692262286148, "loss": 0.0089, "step": 180680 }, { "epoch": 0.91, "learning_rate": 0.00016325935492984747, "loss": 0.0114, "step": 180690 }, { "epoch": 0.91, "learning_rate": 0.00016325178723683345, "loss": 0.0102, "step": 180700 }, { "epoch": 0.91, "learning_rate": 0.00016324421954381946, "loss": 0.0129, "step": 180710 }, { "epoch": 0.91, "learning_rate": 0.00016323665185080544, "loss": 0.01, "step": 180720 }, { "epoch": 0.91, "learning_rate": 0.00016322908415779142, "loss": 0.011, "step": 180730 }, { "epoch": 0.91, "learning_rate": 0.00016322151646477743, "loss": 0.0117, "step": 180740 }, { "epoch": 0.91, "learning_rate": 0.0001632139487717634, "loss": 0.0103, "step": 180750 }, { "epoch": 0.91, "learning_rate": 0.0001632063810787494, "loss": 0.0158, "step": 180760 }, { "epoch": 0.91, "learning_rate": 0.00016319881338573537, "loss": 0.0128, "step": 180770 }, { "epoch": 0.91, "learning_rate": 0.00016319124569272138, "loss": 0.01, "step": 180780 }, { "epoch": 0.91, "learning_rate": 0.00016318367799970736, "loss": 0.0094, "step": 180790 }, { "epoch": 0.91, "learning_rate": 0.00016317611030669334, "loss": 0.0103, "step": 180800 }, { "epoch": 0.91, "learning_rate": 0.00016316854261367935, "loss": 0.0106, "step": 180810 }, { "epoch": 0.91, "learning_rate": 0.00016316097492066533, "loss": 0.0114, "step": 180820 }, { "epoch": 0.91, "learning_rate": 0.00016315340722765131, "loss": 0.0127, "step": 180830 }, { "epoch": 0.91, "learning_rate": 0.00016314583953463732, "loss": 0.0129, "step": 180840 }, { "epoch": 0.91, "learning_rate": 0.0001631382718416233, "loss": 0.0116, "step": 180850 }, { "epoch": 0.91, "learning_rate": 0.00016313070414860929, "loss": 0.0113, "step": 180860 }, { "epoch": 0.91, "learning_rate": 0.0001631231364555953, "loss": 0.0112, "step": 180870 }, { "epoch": 0.91, "learning_rate": 0.00016311556876258128, "loss": 0.0123, "step": 180880 }, { "epoch": 0.91, "learning_rate": 0.00016310800106956726, "loss": 0.0102, "step": 180890 }, { "epoch": 0.91, "learning_rate": 0.00016310043337655327, "loss": 0.0144, "step": 180900 }, { "epoch": 0.91, "learning_rate": 0.00016309286568353925, "loss": 0.0112, "step": 180910 }, { "epoch": 0.91, "learning_rate": 0.00016308529799052523, "loss": 0.0092, "step": 180920 }, { "epoch": 0.91, "learning_rate": 0.0001630777302975112, "loss": 0.0096, "step": 180930 }, { "epoch": 0.91, "learning_rate": 0.00016307016260449722, "loss": 0.0115, "step": 180940 }, { "epoch": 0.91, "learning_rate": 0.0001630625949114832, "loss": 0.0128, "step": 180950 }, { "epoch": 0.91, "learning_rate": 0.00016305502721846918, "loss": 0.0105, "step": 180960 }, { "epoch": 0.91, "learning_rate": 0.0001630474595254552, "loss": 0.0122, "step": 180970 }, { "epoch": 0.91, "learning_rate": 0.00016303989183244117, "loss": 0.0095, "step": 180980 }, { "epoch": 0.91, "learning_rate": 0.00016303232413942715, "loss": 0.011, "step": 180990 }, { "epoch": 0.91, "learning_rate": 0.00016302475644641316, "loss": 0.0117, "step": 181000 }, { "epoch": 0.91, "eval_cer": 0.9144751078837893, "eval_loss": 0.008274085819721222, "eval_runtime": 116.712, "eval_samples_per_second": 17.136, "eval_steps_per_second": 4.284, "step": 181000 }, { "epoch": 0.91, "learning_rate": 0.00016301718875339914, "loss": 0.0135, "step": 181010 }, { "epoch": 0.91, "learning_rate": 0.00016300962106038512, "loss": 0.0104, "step": 181020 }, { "epoch": 0.91, "learning_rate": 0.00016300205336737113, "loss": 0.0161, "step": 181030 }, { "epoch": 0.91, "learning_rate": 0.00016299448567435711, "loss": 0.0133, "step": 181040 }, { "epoch": 0.91, "learning_rate": 0.0001629869179813431, "loss": 0.0125, "step": 181050 }, { "epoch": 0.91, "learning_rate": 0.0001629793502883291, "loss": 0.01, "step": 181060 }, { "epoch": 0.91, "learning_rate": 0.00016297178259531509, "loss": 0.011, "step": 181070 }, { "epoch": 0.91, "learning_rate": 0.00016296421490230107, "loss": 0.012, "step": 181080 }, { "epoch": 0.91, "learning_rate": 0.00016295664720928705, "loss": 0.0172, "step": 181090 }, { "epoch": 0.91, "learning_rate": 0.00016294907951627306, "loss": 0.0121, "step": 181100 }, { "epoch": 0.91, "learning_rate": 0.00016294151182325904, "loss": 0.0132, "step": 181110 }, { "epoch": 0.91, "learning_rate": 0.00016293394413024502, "loss": 0.0124, "step": 181120 }, { "epoch": 0.91, "learning_rate": 0.00016292637643723103, "loss": 0.0106, "step": 181130 }, { "epoch": 0.91, "learning_rate": 0.000162918808744217, "loss": 0.0103, "step": 181140 }, { "epoch": 0.91, "learning_rate": 0.000162911241051203, "loss": 0.0125, "step": 181150 }, { "epoch": 0.91, "learning_rate": 0.000162903673358189, "loss": 0.0085, "step": 181160 }, { "epoch": 0.91, "learning_rate": 0.00016289610566517498, "loss": 0.0128, "step": 181170 }, { "epoch": 0.91, "learning_rate": 0.00016288853797216096, "loss": 0.0177, "step": 181180 }, { "epoch": 0.91, "learning_rate": 0.00016288097027914697, "loss": 0.0123, "step": 181190 }, { "epoch": 0.91, "learning_rate": 0.00016287340258613295, "loss": 0.0179, "step": 181200 }, { "epoch": 0.91, "learning_rate": 0.00016286583489311893, "loss": 0.0151, "step": 181210 }, { "epoch": 0.91, "learning_rate": 0.00016285826720010494, "loss": 0.0134, "step": 181220 }, { "epoch": 0.91, "learning_rate": 0.00016285069950709092, "loss": 0.0125, "step": 181230 }, { "epoch": 0.91, "learning_rate": 0.0001628431318140769, "loss": 0.0148, "step": 181240 }, { "epoch": 0.91, "learning_rate": 0.0001628355641210629, "loss": 0.0166, "step": 181250 }, { "epoch": 0.91, "learning_rate": 0.0001628279964280489, "loss": 0.0099, "step": 181260 }, { "epoch": 0.91, "learning_rate": 0.00016282042873503488, "loss": 0.0088, "step": 181270 }, { "epoch": 0.91, "learning_rate": 0.00016281286104202086, "loss": 0.0117, "step": 181280 }, { "epoch": 0.91, "learning_rate": 0.00016280529334900687, "loss": 0.0105, "step": 181290 }, { "epoch": 0.91, "learning_rate": 0.00016279772565599285, "loss": 0.0113, "step": 181300 }, { "epoch": 0.91, "learning_rate": 0.00016279015796297883, "loss": 0.0119, "step": 181310 }, { "epoch": 0.91, "learning_rate": 0.00016278259026996484, "loss": 0.0134, "step": 181320 }, { "epoch": 0.91, "learning_rate": 0.00016277502257695082, "loss": 0.0111, "step": 181330 }, { "epoch": 0.91, "learning_rate": 0.0001627674548839368, "loss": 0.0132, "step": 181340 }, { "epoch": 0.91, "learning_rate": 0.0001627598871909228, "loss": 0.0114, "step": 181350 }, { "epoch": 0.91, "learning_rate": 0.0001627523194979088, "loss": 0.0106, "step": 181360 }, { "epoch": 0.92, "learning_rate": 0.00016274475180489477, "loss": 0.0103, "step": 181370 }, { "epoch": 0.92, "learning_rate": 0.00016273718411188078, "loss": 0.011, "step": 181380 }, { "epoch": 0.92, "learning_rate": 0.00016272961641886676, "loss": 0.0136, "step": 181390 }, { "epoch": 0.92, "learning_rate": 0.00016272204872585274, "loss": 0.0108, "step": 181400 }, { "epoch": 0.92, "learning_rate": 0.00016271448103283875, "loss": 0.0122, "step": 181410 }, { "epoch": 0.92, "learning_rate": 0.00016270691333982473, "loss": 0.0108, "step": 181420 }, { "epoch": 0.92, "learning_rate": 0.00016269934564681072, "loss": 0.0103, "step": 181430 }, { "epoch": 0.92, "learning_rate": 0.0001626917779537967, "loss": 0.0096, "step": 181440 }, { "epoch": 0.92, "learning_rate": 0.0001626842102607827, "loss": 0.0135, "step": 181450 }, { "epoch": 0.92, "learning_rate": 0.0001626766425677687, "loss": 0.011, "step": 181460 }, { "epoch": 0.92, "learning_rate": 0.00016266907487475467, "loss": 0.0131, "step": 181470 }, { "epoch": 0.92, "learning_rate": 0.00016266150718174068, "loss": 0.0087, "step": 181480 }, { "epoch": 0.92, "learning_rate": 0.00016265393948872666, "loss": 0.0126, "step": 181490 }, { "epoch": 0.92, "learning_rate": 0.00016264637179571264, "loss": 0.0088, "step": 181500 }, { "epoch": 0.92, "learning_rate": 0.00016263880410269865, "loss": 0.0153, "step": 181510 }, { "epoch": 0.92, "learning_rate": 0.00016263123640968463, "loss": 0.0109, "step": 181520 }, { "epoch": 0.92, "learning_rate": 0.0001626236687166706, "loss": 0.0104, "step": 181530 }, { "epoch": 0.92, "learning_rate": 0.00016261610102365662, "loss": 0.011, "step": 181540 }, { "epoch": 0.92, "learning_rate": 0.0001626085333306426, "loss": 0.0116, "step": 181550 }, { "epoch": 0.92, "learning_rate": 0.00016260096563762858, "loss": 0.0135, "step": 181560 }, { "epoch": 0.92, "learning_rate": 0.0001625933979446146, "loss": 0.0114, "step": 181570 }, { "epoch": 0.92, "learning_rate": 0.00016258583025160057, "loss": 0.0148, "step": 181580 }, { "epoch": 0.92, "learning_rate": 0.00016257826255858655, "loss": 0.0096, "step": 181590 }, { "epoch": 0.92, "learning_rate": 0.00016257069486557254, "loss": 0.0137, "step": 181600 }, { "epoch": 0.92, "learning_rate": 0.00016256312717255854, "loss": 0.0126, "step": 181610 }, { "epoch": 0.92, "learning_rate": 0.00016255555947954453, "loss": 0.0123, "step": 181620 }, { "epoch": 0.92, "learning_rate": 0.00016254799178653048, "loss": 0.0162, "step": 181630 }, { "epoch": 0.92, "learning_rate": 0.00016254042409351646, "loss": 0.0096, "step": 181640 }, { "epoch": 0.92, "learning_rate": 0.00016253285640050247, "loss": 0.0105, "step": 181650 }, { "epoch": 0.92, "learning_rate": 0.00016252528870748845, "loss": 0.0104, "step": 181660 }, { "epoch": 0.92, "learning_rate": 0.00016251772101447443, "loss": 0.0139, "step": 181670 }, { "epoch": 0.92, "learning_rate": 0.00016251015332146044, "loss": 0.0111, "step": 181680 }, { "epoch": 0.92, "learning_rate": 0.00016250258562844642, "loss": 0.013, "step": 181690 }, { "epoch": 0.92, "learning_rate": 0.0001624950179354324, "loss": 0.0112, "step": 181700 }, { "epoch": 0.92, "learning_rate": 0.0001624874502424184, "loss": 0.0107, "step": 181710 }, { "epoch": 0.92, "learning_rate": 0.0001624798825494044, "loss": 0.0107, "step": 181720 }, { "epoch": 0.92, "learning_rate": 0.00016247231485639038, "loss": 0.0094, "step": 181730 }, { "epoch": 0.92, "learning_rate": 0.00016246474716337638, "loss": 0.0124, "step": 181740 }, { "epoch": 0.92, "learning_rate": 0.00016245717947036237, "loss": 0.0122, "step": 181750 }, { "epoch": 0.92, "learning_rate": 0.00016244961177734835, "loss": 0.012, "step": 181760 }, { "epoch": 0.92, "learning_rate": 0.00016244204408433436, "loss": 0.0091, "step": 181770 }, { "epoch": 0.92, "learning_rate": 0.00016243447639132034, "loss": 0.0115, "step": 181780 }, { "epoch": 0.92, "learning_rate": 0.00016242690869830632, "loss": 0.0116, "step": 181790 }, { "epoch": 0.92, "learning_rate": 0.00016241934100529233, "loss": 0.0138, "step": 181800 }, { "epoch": 0.92, "learning_rate": 0.0001624117733122783, "loss": 0.013, "step": 181810 }, { "epoch": 0.92, "learning_rate": 0.0001624042056192643, "loss": 0.0126, "step": 181820 }, { "epoch": 0.92, "learning_rate": 0.00016239663792625027, "loss": 0.0116, "step": 181830 }, { "epoch": 0.92, "learning_rate": 0.00016238907023323628, "loss": 0.0132, "step": 181840 }, { "epoch": 0.92, "learning_rate": 0.00016238150254022226, "loss": 0.0107, "step": 181850 }, { "epoch": 0.92, "learning_rate": 0.00016237393484720824, "loss": 0.0105, "step": 181860 }, { "epoch": 0.92, "learning_rate": 0.00016236636715419425, "loss": 0.0109, "step": 181870 }, { "epoch": 0.92, "learning_rate": 0.00016235879946118023, "loss": 0.0103, "step": 181880 }, { "epoch": 0.92, "learning_rate": 0.00016235123176816621, "loss": 0.0159, "step": 181890 }, { "epoch": 0.92, "learning_rate": 0.00016234366407515222, "loss": 0.0104, "step": 181900 }, { "epoch": 0.92, "learning_rate": 0.0001623360963821382, "loss": 0.0095, "step": 181910 }, { "epoch": 0.92, "learning_rate": 0.00016232852868912419, "loss": 0.0142, "step": 181920 }, { "epoch": 0.92, "learning_rate": 0.0001623209609961102, "loss": 0.0138, "step": 181930 }, { "epoch": 0.92, "learning_rate": 0.00016231339330309618, "loss": 0.0173, "step": 181940 }, { "epoch": 0.92, "learning_rate": 0.00016230582561008216, "loss": 0.0096, "step": 181950 }, { "epoch": 0.92, "learning_rate": 0.00016229825791706817, "loss": 0.0109, "step": 181960 }, { "epoch": 0.92, "learning_rate": 0.00016229069022405415, "loss": 0.0121, "step": 181970 }, { "epoch": 0.92, "learning_rate": 0.00016228312253104013, "loss": 0.0156, "step": 181980 }, { "epoch": 0.92, "learning_rate": 0.0001622755548380261, "loss": 0.0107, "step": 181990 }, { "epoch": 0.92, "learning_rate": 0.00016226798714501212, "loss": 0.0104, "step": 182000 }, { "epoch": 0.92, "eval_cer": 0.9144857822411687, "eval_loss": 0.008326300419867039, "eval_runtime": 116.6222, "eval_samples_per_second": 17.149, "eval_steps_per_second": 4.287, "step": 182000 }, { "epoch": 0.92, "learning_rate": 0.0001622604194519981, "loss": 0.0137, "step": 182010 }, { "epoch": 0.92, "learning_rate": 0.00016225285175898408, "loss": 0.0108, "step": 182020 }, { "epoch": 0.92, "learning_rate": 0.0001622452840659701, "loss": 0.013, "step": 182030 }, { "epoch": 0.92, "learning_rate": 0.00016223771637295607, "loss": 0.0097, "step": 182040 }, { "epoch": 0.92, "learning_rate": 0.00016223014867994205, "loss": 0.0102, "step": 182050 }, { "epoch": 0.92, "learning_rate": 0.00016222258098692806, "loss": 0.0127, "step": 182060 }, { "epoch": 0.92, "learning_rate": 0.00016221501329391404, "loss": 0.0123, "step": 182070 }, { "epoch": 0.92, "learning_rate": 0.00016220744560090002, "loss": 0.01, "step": 182080 }, { "epoch": 0.92, "learning_rate": 0.00016219987790788603, "loss": 0.0126, "step": 182090 }, { "epoch": 0.92, "learning_rate": 0.00016219231021487201, "loss": 0.0107, "step": 182100 }, { "epoch": 0.92, "learning_rate": 0.000162184742521858, "loss": 0.014, "step": 182110 }, { "epoch": 0.92, "learning_rate": 0.000162177174828844, "loss": 0.0118, "step": 182120 }, { "epoch": 0.92, "learning_rate": 0.00016216960713582999, "loss": 0.012, "step": 182130 }, { "epoch": 0.92, "learning_rate": 0.00016216203944281597, "loss": 0.0107, "step": 182140 }, { "epoch": 0.92, "learning_rate": 0.00016215447174980195, "loss": 0.0109, "step": 182150 }, { "epoch": 0.92, "learning_rate": 0.00016214690405678796, "loss": 0.0099, "step": 182160 }, { "epoch": 0.92, "learning_rate": 0.00016213933636377394, "loss": 0.0134, "step": 182170 }, { "epoch": 0.92, "learning_rate": 0.00016213176867075992, "loss": 0.0115, "step": 182180 }, { "epoch": 0.92, "learning_rate": 0.00016212420097774593, "loss": 0.0097, "step": 182190 }, { "epoch": 0.92, "learning_rate": 0.0001621166332847319, "loss": 0.0098, "step": 182200 }, { "epoch": 0.92, "learning_rate": 0.0001621090655917179, "loss": 0.0168, "step": 182210 }, { "epoch": 0.92, "learning_rate": 0.0001621014978987039, "loss": 0.0137, "step": 182220 }, { "epoch": 0.92, "learning_rate": 0.00016209393020568988, "loss": 0.012, "step": 182230 }, { "epoch": 0.92, "learning_rate": 0.00016208636251267586, "loss": 0.0123, "step": 182240 }, { "epoch": 0.92, "learning_rate": 0.00016207879481966187, "loss": 0.0098, "step": 182250 }, { "epoch": 0.92, "learning_rate": 0.00016207122712664785, "loss": 0.0173, "step": 182260 }, { "epoch": 0.92, "learning_rate": 0.00016206365943363383, "loss": 0.0123, "step": 182270 }, { "epoch": 0.92, "learning_rate": 0.00016205609174061984, "loss": 0.0121, "step": 182280 }, { "epoch": 0.92, "learning_rate": 0.00016204852404760582, "loss": 0.0148, "step": 182290 }, { "epoch": 0.92, "learning_rate": 0.0001620409563545918, "loss": 0.0107, "step": 182300 }, { "epoch": 0.92, "learning_rate": 0.00016203338866157781, "loss": 0.009, "step": 182310 }, { "epoch": 0.92, "learning_rate": 0.0001620258209685638, "loss": 0.0131, "step": 182320 }, { "epoch": 0.92, "learning_rate": 0.00016201825327554978, "loss": 0.0131, "step": 182330 }, { "epoch": 0.92, "learning_rate": 0.00016201068558253576, "loss": 0.0108, "step": 182340 }, { "epoch": 0.92, "learning_rate": 0.00016200311788952177, "loss": 0.0116, "step": 182350 }, { "epoch": 0.92, "learning_rate": 0.00016199555019650775, "loss": 0.0144, "step": 182360 }, { "epoch": 0.92, "learning_rate": 0.00016198798250349373, "loss": 0.0092, "step": 182370 }, { "epoch": 0.92, "learning_rate": 0.00016198041481047974, "loss": 0.0136, "step": 182380 }, { "epoch": 0.92, "learning_rate": 0.00016197284711746572, "loss": 0.0104, "step": 182390 }, { "epoch": 0.92, "learning_rate": 0.0001619652794244517, "loss": 0.013, "step": 182400 }, { "epoch": 0.92, "learning_rate": 0.0001619577117314377, "loss": 0.012, "step": 182410 }, { "epoch": 0.92, "learning_rate": 0.0001619501440384237, "loss": 0.0091, "step": 182420 }, { "epoch": 0.92, "learning_rate": 0.00016194257634540967, "loss": 0.0109, "step": 182430 }, { "epoch": 0.92, "learning_rate": 0.00016193500865239568, "loss": 0.0111, "step": 182440 }, { "epoch": 0.92, "learning_rate": 0.00016192744095938166, "loss": 0.0112, "step": 182450 }, { "epoch": 0.92, "learning_rate": 0.00016191987326636764, "loss": 0.0128, "step": 182460 }, { "epoch": 0.92, "learning_rate": 0.00016191230557335365, "loss": 0.0102, "step": 182470 }, { "epoch": 0.92, "learning_rate": 0.00016190473788033963, "loss": 0.0112, "step": 182480 }, { "epoch": 0.92, "learning_rate": 0.00016189717018732562, "loss": 0.0114, "step": 182490 }, { "epoch": 0.92, "learning_rate": 0.0001618896024943116, "loss": 0.0104, "step": 182500 }, { "epoch": 0.92, "learning_rate": 0.0001618820348012976, "loss": 0.0094, "step": 182510 }, { "epoch": 0.92, "learning_rate": 0.0001618744671082836, "loss": 0.0097, "step": 182520 }, { "epoch": 0.92, "learning_rate": 0.00016186689941526957, "loss": 0.011, "step": 182530 }, { "epoch": 0.92, "learning_rate": 0.00016185933172225558, "loss": 0.0113, "step": 182540 }, { "epoch": 0.92, "learning_rate": 0.00016185176402924156, "loss": 0.0093, "step": 182550 }, { "epoch": 0.92, "learning_rate": 0.00016184419633622754, "loss": 0.0122, "step": 182560 }, { "epoch": 0.92, "learning_rate": 0.00016183662864321355, "loss": 0.0116, "step": 182570 }, { "epoch": 0.92, "learning_rate": 0.00016182906095019953, "loss": 0.0103, "step": 182580 }, { "epoch": 0.92, "learning_rate": 0.0001618214932571855, "loss": 0.009, "step": 182590 }, { "epoch": 0.92, "learning_rate": 0.00016181392556417152, "loss": 0.0122, "step": 182600 }, { "epoch": 0.92, "learning_rate": 0.0001618063578711575, "loss": 0.0111, "step": 182610 }, { "epoch": 0.92, "learning_rate": 0.00016179879017814348, "loss": 0.0125, "step": 182620 }, { "epoch": 0.92, "learning_rate": 0.0001617912224851295, "loss": 0.0121, "step": 182630 }, { "epoch": 0.92, "learning_rate": 0.00016178365479211547, "loss": 0.0105, "step": 182640 }, { "epoch": 0.92, "learning_rate": 0.00016177608709910145, "loss": 0.012, "step": 182650 }, { "epoch": 0.92, "learning_rate": 0.00016176851940608744, "loss": 0.0107, "step": 182660 }, { "epoch": 0.92, "learning_rate": 0.00016176095171307344, "loss": 0.0109, "step": 182670 }, { "epoch": 0.92, "learning_rate": 0.00016175338402005943, "loss": 0.0112, "step": 182680 }, { "epoch": 0.92, "learning_rate": 0.0001617458163270454, "loss": 0.0118, "step": 182690 }, { "epoch": 0.92, "learning_rate": 0.00016173824863403142, "loss": 0.0108, "step": 182700 }, { "epoch": 0.92, "learning_rate": 0.0001617306809410174, "loss": 0.0108, "step": 182710 }, { "epoch": 0.92, "learning_rate": 0.00016172311324800338, "loss": 0.0114, "step": 182720 }, { "epoch": 0.92, "learning_rate": 0.0001617155455549894, "loss": 0.014, "step": 182730 }, { "epoch": 0.92, "learning_rate": 0.00016170797786197537, "loss": 0.01, "step": 182740 }, { "epoch": 0.92, "learning_rate": 0.00016170041016896135, "loss": 0.0113, "step": 182750 }, { "epoch": 0.92, "learning_rate": 0.00016169284247594736, "loss": 0.0113, "step": 182760 }, { "epoch": 0.92, "learning_rate": 0.00016168527478293334, "loss": 0.0131, "step": 182770 }, { "epoch": 0.92, "learning_rate": 0.00016167770708991932, "loss": 0.0108, "step": 182780 }, { "epoch": 0.92, "learning_rate": 0.00016167013939690533, "loss": 0.0106, "step": 182790 }, { "epoch": 0.92, "learning_rate": 0.0001616625717038913, "loss": 0.0112, "step": 182800 }, { "epoch": 0.92, "learning_rate": 0.0001616550040108773, "loss": 0.0129, "step": 182810 }, { "epoch": 0.92, "learning_rate": 0.0001616474363178633, "loss": 0.0116, "step": 182820 }, { "epoch": 0.92, "learning_rate": 0.00016163986862484928, "loss": 0.0122, "step": 182830 }, { "epoch": 0.92, "learning_rate": 0.00016163230093183526, "loss": 0.01, "step": 182840 }, { "epoch": 0.92, "learning_rate": 0.00016162473323882125, "loss": 0.0095, "step": 182850 }, { "epoch": 0.92, "learning_rate": 0.00016161716554580725, "loss": 0.0092, "step": 182860 }, { "epoch": 0.92, "learning_rate": 0.00016160959785279324, "loss": 0.0118, "step": 182870 }, { "epoch": 0.92, "learning_rate": 0.0001616020301597792, "loss": 0.0093, "step": 182880 }, { "epoch": 0.92, "learning_rate": 0.00016159446246676517, "loss": 0.0098, "step": 182890 }, { "epoch": 0.92, "learning_rate": 0.00016158689477375118, "loss": 0.0131, "step": 182900 }, { "epoch": 0.92, "learning_rate": 0.00016157932708073716, "loss": 0.0083, "step": 182910 }, { "epoch": 0.92, "learning_rate": 0.00016157175938772314, "loss": 0.0105, "step": 182920 }, { "epoch": 0.92, "learning_rate": 0.00016156419169470915, "loss": 0.0119, "step": 182930 }, { "epoch": 0.92, "learning_rate": 0.00016155662400169513, "loss": 0.0091, "step": 182940 }, { "epoch": 0.92, "learning_rate": 0.00016154905630868111, "loss": 0.0129, "step": 182950 }, { "epoch": 0.92, "learning_rate": 0.00016154148861566712, "loss": 0.012, "step": 182960 }, { "epoch": 0.92, "learning_rate": 0.0001615339209226531, "loss": 0.0135, "step": 182970 }, { "epoch": 0.92, "learning_rate": 0.00016152635322963909, "loss": 0.0092, "step": 182980 }, { "epoch": 0.92, "learning_rate": 0.0001615187855366251, "loss": 0.0105, "step": 182990 }, { "epoch": 0.92, "learning_rate": 0.00016151121784361108, "loss": 0.0101, "step": 183000 }, { "epoch": 0.92, "eval_cer": 0.9144828710527925, "eval_loss": 0.00819355621933937, "eval_runtime": 116.6466, "eval_samples_per_second": 17.146, "eval_steps_per_second": 4.286, "step": 183000 }, { "epoch": 0.92, "learning_rate": 0.00016150365015059706, "loss": 0.0082, "step": 183010 }, { "epoch": 0.92, "learning_rate": 0.00016149608245758307, "loss": 0.0146, "step": 183020 }, { "epoch": 0.92, "learning_rate": 0.00016148851476456905, "loss": 0.0106, "step": 183030 }, { "epoch": 0.92, "learning_rate": 0.00016148094707155503, "loss": 0.0108, "step": 183040 }, { "epoch": 0.92, "learning_rate": 0.000161473379378541, "loss": 0.0117, "step": 183050 }, { "epoch": 0.92, "learning_rate": 0.00016146581168552702, "loss": 0.0125, "step": 183060 }, { "epoch": 0.92, "learning_rate": 0.000161458243992513, "loss": 0.0097, "step": 183070 }, { "epoch": 0.92, "learning_rate": 0.00016145067629949898, "loss": 0.0123, "step": 183080 }, { "epoch": 0.92, "learning_rate": 0.000161443108606485, "loss": 0.0116, "step": 183090 }, { "epoch": 0.92, "learning_rate": 0.00016143554091347097, "loss": 0.0129, "step": 183100 }, { "epoch": 0.92, "learning_rate": 0.00016142797322045695, "loss": 0.0113, "step": 183110 }, { "epoch": 0.92, "learning_rate": 0.00016142040552744296, "loss": 0.0136, "step": 183120 }, { "epoch": 0.92, "learning_rate": 0.00016141283783442894, "loss": 0.0117, "step": 183130 }, { "epoch": 0.92, "learning_rate": 0.00016140527014141492, "loss": 0.0092, "step": 183140 }, { "epoch": 0.92, "learning_rate": 0.00016139770244840093, "loss": 0.0105, "step": 183150 }, { "epoch": 0.92, "learning_rate": 0.00016139013475538691, "loss": 0.0102, "step": 183160 }, { "epoch": 0.92, "learning_rate": 0.0001613825670623729, "loss": 0.0096, "step": 183170 }, { "epoch": 0.92, "learning_rate": 0.0001613749993693589, "loss": 0.011, "step": 183180 }, { "epoch": 0.92, "learning_rate": 0.00016136743167634489, "loss": 0.011, "step": 183190 }, { "epoch": 0.92, "learning_rate": 0.00016135986398333087, "loss": 0.0123, "step": 183200 }, { "epoch": 0.92, "learning_rate": 0.00016135229629031688, "loss": 0.0118, "step": 183210 }, { "epoch": 0.92, "learning_rate": 0.00016134472859730286, "loss": 0.0118, "step": 183220 }, { "epoch": 0.92, "learning_rate": 0.00016133716090428884, "loss": 0.0127, "step": 183230 }, { "epoch": 0.92, "learning_rate": 0.00016132959321127482, "loss": 0.0103, "step": 183240 }, { "epoch": 0.92, "learning_rate": 0.00016132202551826083, "loss": 0.0096, "step": 183250 }, { "epoch": 0.92, "learning_rate": 0.0001613144578252468, "loss": 0.0119, "step": 183260 }, { "epoch": 0.92, "learning_rate": 0.0001613068901322328, "loss": 0.0098, "step": 183270 }, { "epoch": 0.92, "learning_rate": 0.0001612993224392188, "loss": 0.0092, "step": 183280 }, { "epoch": 0.92, "learning_rate": 0.00016129175474620478, "loss": 0.0099, "step": 183290 }, { "epoch": 0.92, "learning_rate": 0.00016128418705319076, "loss": 0.0108, "step": 183300 }, { "epoch": 0.92, "learning_rate": 0.00016127661936017677, "loss": 0.0104, "step": 183310 }, { "epoch": 0.92, "learning_rate": 0.00016126905166716275, "loss": 0.0088, "step": 183320 }, { "epoch": 0.92, "learning_rate": 0.00016126148397414873, "loss": 0.0098, "step": 183330 }, { "epoch": 0.92, "learning_rate": 0.00016125391628113474, "loss": 0.015, "step": 183340 }, { "epoch": 0.93, "learning_rate": 0.00016124634858812072, "loss": 0.0126, "step": 183350 }, { "epoch": 0.93, "learning_rate": 0.0001612387808951067, "loss": 0.01, "step": 183360 }, { "epoch": 0.93, "learning_rate": 0.00016123121320209271, "loss": 0.0171, "step": 183370 }, { "epoch": 0.93, "learning_rate": 0.0001612236455090787, "loss": 0.0222, "step": 183380 }, { "epoch": 0.93, "learning_rate": 0.00016121607781606468, "loss": 0.0118, "step": 183390 }, { "epoch": 0.93, "learning_rate": 0.00016120851012305066, "loss": 0.0094, "step": 183400 }, { "epoch": 0.93, "learning_rate": 0.00016120094243003667, "loss": 0.0139, "step": 183410 }, { "epoch": 0.93, "learning_rate": 0.00016119337473702265, "loss": 0.0157, "step": 183420 }, { "epoch": 0.93, "learning_rate": 0.00016118580704400863, "loss": 0.0113, "step": 183430 }, { "epoch": 0.93, "learning_rate": 0.00016117823935099464, "loss": 0.0094, "step": 183440 }, { "epoch": 0.93, "learning_rate": 0.00016117067165798062, "loss": 0.0139, "step": 183450 }, { "epoch": 0.93, "learning_rate": 0.0001611631039649666, "loss": 0.011, "step": 183460 }, { "epoch": 0.93, "learning_rate": 0.0001611555362719526, "loss": 0.0089, "step": 183470 }, { "epoch": 0.93, "learning_rate": 0.0001611479685789386, "loss": 0.0136, "step": 183480 }, { "epoch": 0.93, "learning_rate": 0.00016114040088592457, "loss": 0.0109, "step": 183490 }, { "epoch": 0.93, "learning_rate": 0.00016113283319291058, "loss": 0.0132, "step": 183500 }, { "epoch": 0.93, "learning_rate": 0.00016112526549989656, "loss": 0.0117, "step": 183510 }, { "epoch": 0.93, "learning_rate": 0.00016111769780688254, "loss": 0.011, "step": 183520 }, { "epoch": 0.93, "learning_rate": 0.00016111013011386855, "loss": 0.0126, "step": 183530 }, { "epoch": 0.93, "learning_rate": 0.00016110256242085453, "loss": 0.0114, "step": 183540 }, { "epoch": 0.93, "learning_rate": 0.00016109499472784052, "loss": 0.0094, "step": 183550 }, { "epoch": 0.93, "learning_rate": 0.0001610874270348265, "loss": 0.0107, "step": 183560 }, { "epoch": 0.93, "learning_rate": 0.0001610798593418125, "loss": 0.0107, "step": 183570 }, { "epoch": 0.93, "learning_rate": 0.0001610722916487985, "loss": 0.0081, "step": 183580 }, { "epoch": 0.93, "learning_rate": 0.00016106472395578447, "loss": 0.0158, "step": 183590 }, { "epoch": 0.93, "learning_rate": 0.00016105715626277048, "loss": 0.0106, "step": 183600 }, { "epoch": 0.93, "learning_rate": 0.00016104958856975646, "loss": 0.0113, "step": 183610 }, { "epoch": 0.93, "learning_rate": 0.00016104202087674244, "loss": 0.0147, "step": 183620 }, { "epoch": 0.93, "learning_rate": 0.00016103445318372845, "loss": 0.0113, "step": 183630 }, { "epoch": 0.93, "learning_rate": 0.00016102688549071443, "loss": 0.0127, "step": 183640 }, { "epoch": 0.93, "learning_rate": 0.0001610193177977004, "loss": 0.0099, "step": 183650 }, { "epoch": 0.93, "learning_rate": 0.00016101175010468642, "loss": 0.013, "step": 183660 }, { "epoch": 0.93, "learning_rate": 0.0001610041824116724, "loss": 0.0105, "step": 183670 }, { "epoch": 0.93, "learning_rate": 0.00016099661471865838, "loss": 0.0097, "step": 183680 }, { "epoch": 0.93, "learning_rate": 0.0001609890470256444, "loss": 0.0115, "step": 183690 }, { "epoch": 0.93, "learning_rate": 0.00016098147933263037, "loss": 0.0127, "step": 183700 }, { "epoch": 0.93, "learning_rate": 0.00016097391163961635, "loss": 0.0105, "step": 183710 }, { "epoch": 0.93, "learning_rate": 0.00016096634394660236, "loss": 0.0127, "step": 183720 }, { "epoch": 0.93, "learning_rate": 0.00016095877625358834, "loss": 0.0094, "step": 183730 }, { "epoch": 0.93, "learning_rate": 0.00016095120856057433, "loss": 0.0105, "step": 183740 }, { "epoch": 0.93, "learning_rate": 0.0001609436408675603, "loss": 0.014, "step": 183750 }, { "epoch": 0.93, "learning_rate": 0.00016093607317454632, "loss": 0.0123, "step": 183760 }, { "epoch": 0.93, "learning_rate": 0.0001609285054815323, "loss": 0.0107, "step": 183770 }, { "epoch": 0.93, "learning_rate": 0.00016092093778851828, "loss": 0.0095, "step": 183780 }, { "epoch": 0.93, "learning_rate": 0.0001609133700955043, "loss": 0.0098, "step": 183790 }, { "epoch": 0.93, "learning_rate": 0.00016090580240249027, "loss": 0.01, "step": 183800 }, { "epoch": 0.93, "learning_rate": 0.00016089823470947625, "loss": 0.0118, "step": 183810 }, { "epoch": 0.93, "learning_rate": 0.00016089066701646226, "loss": 0.0103, "step": 183820 }, { "epoch": 0.93, "learning_rate": 0.00016088309932344824, "loss": 0.01, "step": 183830 }, { "epoch": 0.93, "learning_rate": 0.00016087553163043422, "loss": 0.0098, "step": 183840 }, { "epoch": 0.93, "learning_rate": 0.00016086796393742023, "loss": 0.0106, "step": 183850 }, { "epoch": 0.93, "learning_rate": 0.0001608603962444062, "loss": 0.0108, "step": 183860 }, { "epoch": 0.93, "learning_rate": 0.0001608528285513922, "loss": 0.0115, "step": 183870 }, { "epoch": 0.93, "learning_rate": 0.0001608452608583782, "loss": 0.0119, "step": 183880 }, { "epoch": 0.93, "learning_rate": 0.00016083769316536418, "loss": 0.0106, "step": 183890 }, { "epoch": 0.93, "learning_rate": 0.00016083012547235016, "loss": 0.009, "step": 183900 }, { "epoch": 0.93, "learning_rate": 0.00016082255777933615, "loss": 0.0097, "step": 183910 }, { "epoch": 0.93, "learning_rate": 0.00016081499008632215, "loss": 0.0123, "step": 183920 }, { "epoch": 0.93, "learning_rate": 0.00016080742239330814, "loss": 0.0105, "step": 183930 }, { "epoch": 0.93, "learning_rate": 0.00016079985470029412, "loss": 0.0112, "step": 183940 }, { "epoch": 0.93, "learning_rate": 0.00016079228700728013, "loss": 0.0093, "step": 183950 }, { "epoch": 0.93, "learning_rate": 0.0001607847193142661, "loss": 0.013, "step": 183960 }, { "epoch": 0.93, "learning_rate": 0.0001607771516212521, "loss": 0.0111, "step": 183970 }, { "epoch": 0.93, "learning_rate": 0.0001607695839282381, "loss": 0.0076, "step": 183980 }, { "epoch": 0.93, "learning_rate": 0.00016076201623522408, "loss": 0.0103, "step": 183990 }, { "epoch": 0.93, "learning_rate": 0.00016075444854221006, "loss": 0.0133, "step": 184000 }, { "epoch": 0.93, "eval_cer": 0.9144731670915385, "eval_loss": 0.00799303688108921, "eval_runtime": 116.5635, "eval_samples_per_second": 17.158, "eval_steps_per_second": 4.29, "step": 184000 }, { "epoch": 0.93, "learning_rate": 0.00016074688084919607, "loss": 0.0113, "step": 184010 }, { "epoch": 0.93, "learning_rate": 0.00016073931315618205, "loss": 0.0116, "step": 184020 }, { "epoch": 0.93, "learning_rate": 0.00016073174546316803, "loss": 0.0128, "step": 184030 }, { "epoch": 0.93, "learning_rate": 0.00016072417777015404, "loss": 0.0098, "step": 184040 }, { "epoch": 0.93, "learning_rate": 0.00016071661007714002, "loss": 0.0088, "step": 184050 }, { "epoch": 0.93, "learning_rate": 0.000160709042384126, "loss": 0.0113, "step": 184060 }, { "epoch": 0.93, "learning_rate": 0.00016070147469111198, "loss": 0.0136, "step": 184070 }, { "epoch": 0.93, "learning_rate": 0.000160693906998098, "loss": 0.0109, "step": 184080 }, { "epoch": 0.93, "learning_rate": 0.00016068633930508397, "loss": 0.0123, "step": 184090 }, { "epoch": 0.93, "learning_rate": 0.00016067877161206996, "loss": 0.0156, "step": 184100 }, { "epoch": 0.93, "learning_rate": 0.00016067120391905596, "loss": 0.0137, "step": 184110 }, { "epoch": 0.93, "learning_rate": 0.00016066363622604195, "loss": 0.0103, "step": 184120 }, { "epoch": 0.93, "learning_rate": 0.00016065606853302793, "loss": 0.0108, "step": 184130 }, { "epoch": 0.93, "learning_rate": 0.00016064850084001388, "loss": 0.0084, "step": 184140 }, { "epoch": 0.93, "learning_rate": 0.0001606409331469999, "loss": 0.0106, "step": 184150 }, { "epoch": 0.93, "learning_rate": 0.00016063336545398587, "loss": 0.0109, "step": 184160 }, { "epoch": 0.93, "learning_rate": 0.00016062579776097185, "loss": 0.0114, "step": 184170 }, { "epoch": 0.93, "learning_rate": 0.00016061823006795786, "loss": 0.0116, "step": 184180 }, { "epoch": 0.93, "learning_rate": 0.00016061066237494384, "loss": 0.0105, "step": 184190 }, { "epoch": 0.93, "learning_rate": 0.00016060309468192982, "loss": 0.0093, "step": 184200 }, { "epoch": 0.93, "learning_rate": 0.00016059552698891583, "loss": 0.0096, "step": 184210 }, { "epoch": 0.93, "learning_rate": 0.00016058795929590181, "loss": 0.011, "step": 184220 }, { "epoch": 0.93, "learning_rate": 0.0001605803916028878, "loss": 0.0117, "step": 184230 }, { "epoch": 0.93, "learning_rate": 0.0001605728239098738, "loss": 0.0124, "step": 184240 }, { "epoch": 0.93, "learning_rate": 0.00016056525621685979, "loss": 0.0107, "step": 184250 }, { "epoch": 0.93, "learning_rate": 0.00016055768852384577, "loss": 0.0086, "step": 184260 }, { "epoch": 0.93, "learning_rate": 0.00016055012083083178, "loss": 0.0119, "step": 184270 }, { "epoch": 0.93, "learning_rate": 0.00016054255313781776, "loss": 0.0097, "step": 184280 }, { "epoch": 0.93, "learning_rate": 0.00016053498544480374, "loss": 0.0094, "step": 184290 }, { "epoch": 0.93, "learning_rate": 0.00016052741775178972, "loss": 0.0095, "step": 184300 }, { "epoch": 0.93, "learning_rate": 0.00016051985005877573, "loss": 0.012, "step": 184310 }, { "epoch": 0.93, "learning_rate": 0.0001605122823657617, "loss": 0.0118, "step": 184320 }, { "epoch": 0.93, "learning_rate": 0.0001605047146727477, "loss": 0.0119, "step": 184330 }, { "epoch": 0.93, "learning_rate": 0.0001604971469797337, "loss": 0.012, "step": 184340 }, { "epoch": 0.93, "learning_rate": 0.00016048957928671968, "loss": 0.0113, "step": 184350 }, { "epoch": 0.93, "learning_rate": 0.00016048201159370566, "loss": 0.0116, "step": 184360 }, { "epoch": 0.93, "learning_rate": 0.00016047444390069167, "loss": 0.0111, "step": 184370 }, { "epoch": 0.93, "learning_rate": 0.00016046687620767765, "loss": 0.0139, "step": 184380 }, { "epoch": 0.93, "learning_rate": 0.00016045930851466363, "loss": 0.0134, "step": 184390 }, { "epoch": 0.93, "learning_rate": 0.00016045174082164964, "loss": 0.0121, "step": 184400 }, { "epoch": 0.93, "learning_rate": 0.00016044417312863562, "loss": 0.0099, "step": 184410 }, { "epoch": 0.93, "learning_rate": 0.0001604366054356216, "loss": 0.0129, "step": 184420 }, { "epoch": 0.93, "learning_rate": 0.00016042903774260761, "loss": 0.0103, "step": 184430 }, { "epoch": 0.93, "learning_rate": 0.0001604214700495936, "loss": 0.0097, "step": 184440 }, { "epoch": 0.93, "learning_rate": 0.00016041390235657958, "loss": 0.0121, "step": 184450 }, { "epoch": 0.93, "learning_rate": 0.00016040633466356556, "loss": 0.0102, "step": 184460 }, { "epoch": 0.93, "learning_rate": 0.00016039876697055157, "loss": 0.0102, "step": 184470 }, { "epoch": 0.93, "learning_rate": 0.00016039119927753755, "loss": 0.0109, "step": 184480 }, { "epoch": 0.93, "learning_rate": 0.00016038363158452353, "loss": 0.0106, "step": 184490 }, { "epoch": 0.93, "learning_rate": 0.00016037606389150954, "loss": 0.0125, "step": 184500 }, { "epoch": 0.93, "learning_rate": 0.00016036849619849552, "loss": 0.0113, "step": 184510 }, { "epoch": 0.93, "learning_rate": 0.0001603609285054815, "loss": 0.0113, "step": 184520 }, { "epoch": 0.93, "learning_rate": 0.0001603533608124675, "loss": 0.0108, "step": 184530 }, { "epoch": 0.93, "learning_rate": 0.0001603457931194535, "loss": 0.0141, "step": 184540 }, { "epoch": 0.93, "learning_rate": 0.00016033822542643947, "loss": 0.0106, "step": 184550 }, { "epoch": 0.93, "learning_rate": 0.00016033065773342548, "loss": 0.0121, "step": 184560 }, { "epoch": 0.93, "learning_rate": 0.00016032309004041146, "loss": 0.0114, "step": 184570 }, { "epoch": 0.93, "learning_rate": 0.00016031552234739744, "loss": 0.0122, "step": 184580 }, { "epoch": 0.93, "learning_rate": 0.00016030795465438345, "loss": 0.0107, "step": 184590 }, { "epoch": 0.93, "learning_rate": 0.00016030038696136943, "loss": 0.0139, "step": 184600 }, { "epoch": 0.93, "learning_rate": 0.00016029281926835542, "loss": 0.0121, "step": 184610 }, { "epoch": 0.93, "learning_rate": 0.00016028525157534142, "loss": 0.01, "step": 184620 }, { "epoch": 0.93, "learning_rate": 0.0001602776838823274, "loss": 0.0155, "step": 184630 }, { "epoch": 0.93, "learning_rate": 0.0001602701161893134, "loss": 0.0135, "step": 184640 }, { "epoch": 0.93, "learning_rate": 0.00016026254849629937, "loss": 0.01, "step": 184650 }, { "epoch": 0.93, "learning_rate": 0.00016025498080328538, "loss": 0.012, "step": 184660 }, { "epoch": 0.93, "learning_rate": 0.00016024741311027136, "loss": 0.0103, "step": 184670 }, { "epoch": 0.93, "learning_rate": 0.00016023984541725734, "loss": 0.012, "step": 184680 }, { "epoch": 0.93, "learning_rate": 0.00016023227772424335, "loss": 0.0099, "step": 184690 }, { "epoch": 0.93, "learning_rate": 0.00016022471003122933, "loss": 0.0115, "step": 184700 }, { "epoch": 0.93, "learning_rate": 0.0001602171423382153, "loss": 0.0085, "step": 184710 }, { "epoch": 0.93, "learning_rate": 0.00016020957464520132, "loss": 0.0135, "step": 184720 }, { "epoch": 0.93, "learning_rate": 0.0001602020069521873, "loss": 0.0145, "step": 184730 }, { "epoch": 0.93, "learning_rate": 0.00016019443925917328, "loss": 0.0088, "step": 184740 }, { "epoch": 0.93, "learning_rate": 0.0001601868715661593, "loss": 0.0118, "step": 184750 }, { "epoch": 0.93, "learning_rate": 0.00016017930387314527, "loss": 0.0097, "step": 184760 }, { "epoch": 0.93, "learning_rate": 0.00016017173618013125, "loss": 0.0103, "step": 184770 }, { "epoch": 0.93, "learning_rate": 0.00016016416848711726, "loss": 0.0126, "step": 184780 }, { "epoch": 0.93, "learning_rate": 0.00016015660079410324, "loss": 0.0096, "step": 184790 }, { "epoch": 0.93, "learning_rate": 0.00016014903310108923, "loss": 0.0148, "step": 184800 }, { "epoch": 0.93, "learning_rate": 0.0001601414654080752, "loss": 0.01, "step": 184810 }, { "epoch": 0.93, "learning_rate": 0.00016013389771506122, "loss": 0.0127, "step": 184820 }, { "epoch": 0.93, "learning_rate": 0.0001601263300220472, "loss": 0.0108, "step": 184830 }, { "epoch": 0.93, "learning_rate": 0.00016011876232903318, "loss": 0.012, "step": 184840 }, { "epoch": 0.93, "learning_rate": 0.0001601111946360192, "loss": 0.0105, "step": 184850 }, { "epoch": 0.93, "learning_rate": 0.00016010362694300517, "loss": 0.0103, "step": 184860 }, { "epoch": 0.93, "learning_rate": 0.00016009605924999115, "loss": 0.011, "step": 184870 }, { "epoch": 0.93, "learning_rate": 0.00016008849155697716, "loss": 0.0081, "step": 184880 }, { "epoch": 0.93, "learning_rate": 0.00016008092386396314, "loss": 0.0086, "step": 184890 }, { "epoch": 0.93, "learning_rate": 0.00016007335617094912, "loss": 0.0127, "step": 184900 }, { "epoch": 0.93, "learning_rate": 0.00016006578847793513, "loss": 0.0155, "step": 184910 }, { "epoch": 0.93, "learning_rate": 0.0001600582207849211, "loss": 0.0109, "step": 184920 }, { "epoch": 0.93, "learning_rate": 0.0001600506530919071, "loss": 0.0155, "step": 184930 }, { "epoch": 0.93, "learning_rate": 0.0001600430853988931, "loss": 0.0117, "step": 184940 }, { "epoch": 0.93, "learning_rate": 0.00016003551770587908, "loss": 0.0119, "step": 184950 }, { "epoch": 0.93, "learning_rate": 0.00016002795001286506, "loss": 0.011, "step": 184960 }, { "epoch": 0.93, "learning_rate": 0.00016002038231985105, "loss": 0.0149, "step": 184970 }, { "epoch": 0.93, "learning_rate": 0.00016001281462683705, "loss": 0.0125, "step": 184980 }, { "epoch": 0.93, "learning_rate": 0.00016000524693382304, "loss": 0.0125, "step": 184990 }, { "epoch": 0.93, "learning_rate": 0.00015999767924080902, "loss": 0.011, "step": 185000 }, { "epoch": 0.93, "eval_cer": 0.914462492734159, "eval_loss": 0.007860948331654072, "eval_runtime": 116.6063, "eval_samples_per_second": 17.152, "eval_steps_per_second": 4.288, "step": 185000 }, { "epoch": 0.93, "learning_rate": 0.00015999011154779503, "loss": 0.0116, "step": 185010 }, { "epoch": 0.93, "learning_rate": 0.000159982543854781, "loss": 0.012, "step": 185020 }, { "epoch": 0.93, "learning_rate": 0.000159974976161767, "loss": 0.0116, "step": 185030 }, { "epoch": 0.93, "learning_rate": 0.000159967408468753, "loss": 0.0079, "step": 185040 }, { "epoch": 0.93, "learning_rate": 0.00015995984077573898, "loss": 0.0121, "step": 185050 }, { "epoch": 0.93, "learning_rate": 0.00015995227308272496, "loss": 0.0135, "step": 185060 }, { "epoch": 0.93, "learning_rate": 0.00015994470538971097, "loss": 0.0115, "step": 185070 }, { "epoch": 0.93, "learning_rate": 0.00015993713769669695, "loss": 0.014, "step": 185080 }, { "epoch": 0.93, "learning_rate": 0.00015992957000368293, "loss": 0.0133, "step": 185090 }, { "epoch": 0.93, "learning_rate": 0.00015992200231066894, "loss": 0.0094, "step": 185100 }, { "epoch": 0.93, "learning_rate": 0.00015991443461765492, "loss": 0.0103, "step": 185110 }, { "epoch": 0.93, "learning_rate": 0.0001599068669246409, "loss": 0.0099, "step": 185120 }, { "epoch": 0.93, "learning_rate": 0.00015989929923162688, "loss": 0.0108, "step": 185130 }, { "epoch": 0.93, "learning_rate": 0.0001598917315386129, "loss": 0.0136, "step": 185140 }, { "epoch": 0.93, "learning_rate": 0.00015988416384559887, "loss": 0.0139, "step": 185150 }, { "epoch": 0.93, "learning_rate": 0.00015987659615258486, "loss": 0.0114, "step": 185160 }, { "epoch": 0.93, "learning_rate": 0.00015986902845957086, "loss": 0.0136, "step": 185170 }, { "epoch": 0.93, "learning_rate": 0.00015986146076655685, "loss": 0.0112, "step": 185180 }, { "epoch": 0.93, "learning_rate": 0.00015985389307354283, "loss": 0.0153, "step": 185190 }, { "epoch": 0.93, "learning_rate": 0.00015984632538052884, "loss": 0.0131, "step": 185200 }, { "epoch": 0.93, "learning_rate": 0.00015983875768751482, "loss": 0.0103, "step": 185210 }, { "epoch": 0.93, "learning_rate": 0.0001598311899945008, "loss": 0.0106, "step": 185220 }, { "epoch": 0.93, "learning_rate": 0.0001598236223014868, "loss": 0.0123, "step": 185230 }, { "epoch": 0.93, "learning_rate": 0.0001598160546084728, "loss": 0.008, "step": 185240 }, { "epoch": 0.93, "learning_rate": 0.00015980848691545877, "loss": 0.012, "step": 185250 }, { "epoch": 0.93, "learning_rate": 0.00015980091922244478, "loss": 0.0121, "step": 185260 }, { "epoch": 0.93, "learning_rate": 0.00015979335152943076, "loss": 0.0111, "step": 185270 }, { "epoch": 0.93, "learning_rate": 0.00015978578383641674, "loss": 0.0146, "step": 185280 }, { "epoch": 0.93, "learning_rate": 0.00015977821614340275, "loss": 0.0119, "step": 185290 }, { "epoch": 0.93, "learning_rate": 0.00015977064845038873, "loss": 0.0132, "step": 185300 }, { "epoch": 0.93, "learning_rate": 0.0001597630807573747, "loss": 0.0096, "step": 185310 }, { "epoch": 0.93, "learning_rate": 0.0001597555130643607, "loss": 0.0105, "step": 185320 }, { "epoch": 0.94, "learning_rate": 0.0001597479453713467, "loss": 0.0112, "step": 185330 }, { "epoch": 0.94, "learning_rate": 0.00015974037767833268, "loss": 0.0115, "step": 185340 }, { "epoch": 0.94, "learning_rate": 0.00015973280998531867, "loss": 0.012, "step": 185350 }, { "epoch": 0.94, "learning_rate": 0.00015972524229230467, "loss": 0.011, "step": 185360 }, { "epoch": 0.94, "learning_rate": 0.00015971767459929066, "loss": 0.0108, "step": 185370 }, { "epoch": 0.94, "learning_rate": 0.00015971010690627664, "loss": 0.0099, "step": 185380 }, { "epoch": 0.94, "learning_rate": 0.00015970253921326265, "loss": 0.0129, "step": 185390 }, { "epoch": 0.94, "learning_rate": 0.0001596949715202486, "loss": 0.0131, "step": 185400 }, { "epoch": 0.94, "learning_rate": 0.00015968740382723458, "loss": 0.0116, "step": 185410 }, { "epoch": 0.94, "learning_rate": 0.00015967983613422056, "loss": 0.01, "step": 185420 }, { "epoch": 0.94, "learning_rate": 0.00015967226844120657, "loss": 0.0126, "step": 185430 }, { "epoch": 0.94, "learning_rate": 0.00015966470074819255, "loss": 0.012, "step": 185440 }, { "epoch": 0.94, "learning_rate": 0.00015965713305517854, "loss": 0.0098, "step": 185450 }, { "epoch": 0.94, "learning_rate": 0.00015964956536216454, "loss": 0.0106, "step": 185460 }, { "epoch": 0.94, "learning_rate": 0.00015964199766915053, "loss": 0.0097, "step": 185470 }, { "epoch": 0.94, "learning_rate": 0.0001596344299761365, "loss": 0.0099, "step": 185480 }, { "epoch": 0.94, "learning_rate": 0.00015962686228312252, "loss": 0.0096, "step": 185490 }, { "epoch": 0.94, "learning_rate": 0.0001596192945901085, "loss": 0.0108, "step": 185500 }, { "epoch": 0.94, "learning_rate": 0.00015961172689709448, "loss": 0.0105, "step": 185510 }, { "epoch": 0.94, "learning_rate": 0.00015960415920408046, "loss": 0.0134, "step": 185520 }, { "epoch": 0.94, "learning_rate": 0.00015959659151106647, "loss": 0.0107, "step": 185530 }, { "epoch": 0.94, "learning_rate": 0.00015958902381805245, "loss": 0.0136, "step": 185540 }, { "epoch": 0.94, "learning_rate": 0.00015958145612503843, "loss": 0.0106, "step": 185550 }, { "epoch": 0.94, "learning_rate": 0.00015957388843202444, "loss": 0.0099, "step": 185560 }, { "epoch": 0.94, "learning_rate": 0.00015956632073901042, "loss": 0.0086, "step": 185570 }, { "epoch": 0.94, "learning_rate": 0.0001595587530459964, "loss": 0.0096, "step": 185580 }, { "epoch": 0.94, "learning_rate": 0.0001595511853529824, "loss": 0.0106, "step": 185590 }, { "epoch": 0.94, "learning_rate": 0.0001595436176599684, "loss": 0.0107, "step": 185600 }, { "epoch": 0.94, "learning_rate": 0.00015953604996695437, "loss": 0.0132, "step": 185610 }, { "epoch": 0.94, "learning_rate": 0.00015952848227394038, "loss": 0.0111, "step": 185620 }, { "epoch": 0.94, "learning_rate": 0.00015952091458092636, "loss": 0.0099, "step": 185630 }, { "epoch": 0.94, "learning_rate": 0.00015951334688791235, "loss": 0.0086, "step": 185640 }, { "epoch": 0.94, "learning_rate": 0.00015950577919489835, "loss": 0.0127, "step": 185650 }, { "epoch": 0.94, "learning_rate": 0.00015949821150188434, "loss": 0.0112, "step": 185660 }, { "epoch": 0.94, "learning_rate": 0.00015949064380887032, "loss": 0.0113, "step": 185670 }, { "epoch": 0.94, "learning_rate": 0.00015948307611585633, "loss": 0.0143, "step": 185680 }, { "epoch": 0.94, "learning_rate": 0.0001594755084228423, "loss": 0.0089, "step": 185690 }, { "epoch": 0.94, "learning_rate": 0.0001594679407298283, "loss": 0.0097, "step": 185700 }, { "epoch": 0.94, "learning_rate": 0.00015946037303681427, "loss": 0.0129, "step": 185710 }, { "epoch": 0.94, "learning_rate": 0.00015945280534380028, "loss": 0.0104, "step": 185720 }, { "epoch": 0.94, "learning_rate": 0.00015944523765078626, "loss": 0.013, "step": 185730 }, { "epoch": 0.94, "learning_rate": 0.00015943766995777224, "loss": 0.0126, "step": 185740 }, { "epoch": 0.94, "learning_rate": 0.00015943010226475825, "loss": 0.0141, "step": 185750 }, { "epoch": 0.94, "learning_rate": 0.00015942253457174423, "loss": 0.0103, "step": 185760 }, { "epoch": 0.94, "learning_rate": 0.0001594149668787302, "loss": 0.0125, "step": 185770 }, { "epoch": 0.94, "learning_rate": 0.00015940739918571622, "loss": 0.0082, "step": 185780 }, { "epoch": 0.94, "learning_rate": 0.0001593998314927022, "loss": 0.0079, "step": 185790 }, { "epoch": 0.94, "learning_rate": 0.00015939226379968818, "loss": 0.01, "step": 185800 }, { "epoch": 0.94, "learning_rate": 0.0001593846961066742, "loss": 0.0102, "step": 185810 }, { "epoch": 0.94, "learning_rate": 0.00015937712841366017, "loss": 0.0099, "step": 185820 }, { "epoch": 0.94, "learning_rate": 0.00015936956072064616, "loss": 0.0109, "step": 185830 }, { "epoch": 0.94, "learning_rate": 0.00015936199302763216, "loss": 0.0145, "step": 185840 }, { "epoch": 0.94, "learning_rate": 0.00015935442533461815, "loss": 0.01, "step": 185850 }, { "epoch": 0.94, "learning_rate": 0.00015934685764160413, "loss": 0.0086, "step": 185860 }, { "epoch": 0.94, "learning_rate": 0.0001593392899485901, "loss": 0.0128, "step": 185870 }, { "epoch": 0.94, "learning_rate": 0.00015933172225557612, "loss": 0.0136, "step": 185880 }, { "epoch": 0.94, "learning_rate": 0.0001593241545625621, "loss": 0.0108, "step": 185890 }, { "epoch": 0.94, "learning_rate": 0.00015931658686954808, "loss": 0.0102, "step": 185900 }, { "epoch": 0.94, "learning_rate": 0.0001593090191765341, "loss": 0.0113, "step": 185910 }, { "epoch": 0.94, "learning_rate": 0.00015930145148352007, "loss": 0.0132, "step": 185920 }, { "epoch": 0.94, "learning_rate": 0.00015929388379050605, "loss": 0.0095, "step": 185930 }, { "epoch": 0.94, "learning_rate": 0.00015928631609749206, "loss": 0.0114, "step": 185940 }, { "epoch": 0.94, "learning_rate": 0.00015927874840447804, "loss": 0.0119, "step": 185950 }, { "epoch": 0.94, "learning_rate": 0.00015927118071146402, "loss": 0.0126, "step": 185960 }, { "epoch": 0.94, "learning_rate": 0.00015926361301845003, "loss": 0.011, "step": 185970 }, { "epoch": 0.94, "learning_rate": 0.000159256045325436, "loss": 0.0141, "step": 185980 }, { "epoch": 0.94, "learning_rate": 0.000159248477632422, "loss": 0.015, "step": 185990 }, { "epoch": 0.94, "learning_rate": 0.000159240909939408, "loss": 0.009, "step": 186000 }, { "epoch": 0.94, "eval_cer": 0.9144770486760401, "eval_loss": 0.007943259552121162, "eval_runtime": 116.7604, "eval_samples_per_second": 17.129, "eval_steps_per_second": 4.282, "step": 186000 }, { "epoch": 0.94, "learning_rate": 0.00015923334224639398, "loss": 0.0097, "step": 186010 }, { "epoch": 0.94, "learning_rate": 0.00015922577455337997, "loss": 0.0079, "step": 186020 }, { "epoch": 0.94, "learning_rate": 0.00015921820686036595, "loss": 0.0128, "step": 186030 }, { "epoch": 0.94, "learning_rate": 0.00015921063916735196, "loss": 0.0144, "step": 186040 }, { "epoch": 0.94, "learning_rate": 0.00015920307147433794, "loss": 0.0111, "step": 186050 }, { "epoch": 0.94, "learning_rate": 0.00015919550378132392, "loss": 0.0096, "step": 186060 }, { "epoch": 0.94, "learning_rate": 0.00015918793608830993, "loss": 0.013, "step": 186070 }, { "epoch": 0.94, "learning_rate": 0.0001591803683952959, "loss": 0.0161, "step": 186080 }, { "epoch": 0.94, "learning_rate": 0.0001591728007022819, "loss": 0.0114, "step": 186090 }, { "epoch": 0.94, "learning_rate": 0.0001591652330092679, "loss": 0.0094, "step": 186100 }, { "epoch": 0.94, "learning_rate": 0.00015915766531625388, "loss": 0.0103, "step": 186110 }, { "epoch": 0.94, "learning_rate": 0.00015915009762323986, "loss": 0.0126, "step": 186120 }, { "epoch": 0.94, "learning_rate": 0.00015914252993022587, "loss": 0.0112, "step": 186130 }, { "epoch": 0.94, "learning_rate": 0.00015913496223721185, "loss": 0.0088, "step": 186140 }, { "epoch": 0.94, "learning_rate": 0.00015912739454419783, "loss": 0.0111, "step": 186150 }, { "epoch": 0.94, "learning_rate": 0.00015911982685118384, "loss": 0.0117, "step": 186160 }, { "epoch": 0.94, "learning_rate": 0.00015911225915816982, "loss": 0.0117, "step": 186170 }, { "epoch": 0.94, "learning_rate": 0.0001591046914651558, "loss": 0.012, "step": 186180 }, { "epoch": 0.94, "learning_rate": 0.0001590971237721418, "loss": 0.0109, "step": 186190 }, { "epoch": 0.94, "learning_rate": 0.0001590895560791278, "loss": 0.0093, "step": 186200 }, { "epoch": 0.94, "learning_rate": 0.00015908198838611378, "loss": 0.0102, "step": 186210 }, { "epoch": 0.94, "learning_rate": 0.00015907442069309976, "loss": 0.0135, "step": 186220 }, { "epoch": 0.94, "learning_rate": 0.00015906685300008577, "loss": 0.0086, "step": 186230 }, { "epoch": 0.94, "learning_rate": 0.00015905928530707175, "loss": 0.0155, "step": 186240 }, { "epoch": 0.94, "learning_rate": 0.00015905171761405773, "loss": 0.0118, "step": 186250 }, { "epoch": 0.94, "learning_rate": 0.00015904414992104374, "loss": 0.0116, "step": 186260 }, { "epoch": 0.94, "learning_rate": 0.00015903658222802972, "loss": 0.0095, "step": 186270 }, { "epoch": 0.94, "learning_rate": 0.0001590290145350157, "loss": 0.0111, "step": 186280 }, { "epoch": 0.94, "learning_rate": 0.0001590214468420017, "loss": 0.0091, "step": 186290 }, { "epoch": 0.94, "learning_rate": 0.0001590138791489877, "loss": 0.0104, "step": 186300 }, { "epoch": 0.94, "learning_rate": 0.00015900631145597367, "loss": 0.0116, "step": 186310 }, { "epoch": 0.94, "learning_rate": 0.00015899874376295968, "loss": 0.0112, "step": 186320 }, { "epoch": 0.94, "learning_rate": 0.00015899117606994566, "loss": 0.0107, "step": 186330 }, { "epoch": 0.94, "learning_rate": 0.00015898360837693164, "loss": 0.0101, "step": 186340 }, { "epoch": 0.94, "learning_rate": 0.00015897604068391765, "loss": 0.0103, "step": 186350 }, { "epoch": 0.94, "learning_rate": 0.00015896847299090363, "loss": 0.0118, "step": 186360 }, { "epoch": 0.94, "learning_rate": 0.00015896090529788961, "loss": 0.0097, "step": 186370 }, { "epoch": 0.94, "learning_rate": 0.0001589533376048756, "loss": 0.0106, "step": 186380 }, { "epoch": 0.94, "learning_rate": 0.0001589457699118616, "loss": 0.0124, "step": 186390 }, { "epoch": 0.94, "learning_rate": 0.00015893820221884759, "loss": 0.0153, "step": 186400 }, { "epoch": 0.94, "learning_rate": 0.00015893063452583357, "loss": 0.0115, "step": 186410 }, { "epoch": 0.94, "learning_rate": 0.00015892306683281958, "loss": 0.012, "step": 186420 }, { "epoch": 0.94, "learning_rate": 0.00015891549913980556, "loss": 0.009, "step": 186430 }, { "epoch": 0.94, "learning_rate": 0.00015890793144679154, "loss": 0.0108, "step": 186440 }, { "epoch": 0.94, "learning_rate": 0.00015890036375377755, "loss": 0.0126, "step": 186450 }, { "epoch": 0.94, "learning_rate": 0.00015889279606076353, "loss": 0.0138, "step": 186460 }, { "epoch": 0.94, "learning_rate": 0.0001588852283677495, "loss": 0.0125, "step": 186470 }, { "epoch": 0.94, "learning_rate": 0.00015887766067473552, "loss": 0.0121, "step": 186480 }, { "epoch": 0.94, "learning_rate": 0.0001588700929817215, "loss": 0.0104, "step": 186490 }, { "epoch": 0.94, "learning_rate": 0.00015886252528870748, "loss": 0.0107, "step": 186500 }, { "epoch": 0.94, "learning_rate": 0.0001588549575956935, "loss": 0.0085, "step": 186510 }, { "epoch": 0.94, "learning_rate": 0.00015884738990267947, "loss": 0.0113, "step": 186520 }, { "epoch": 0.94, "learning_rate": 0.00015883982220966545, "loss": 0.0113, "step": 186530 }, { "epoch": 0.94, "learning_rate": 0.00015883225451665143, "loss": 0.0158, "step": 186540 }, { "epoch": 0.94, "learning_rate": 0.00015882468682363744, "loss": 0.0127, "step": 186550 }, { "epoch": 0.94, "learning_rate": 0.00015881711913062342, "loss": 0.0126, "step": 186560 }, { "epoch": 0.94, "learning_rate": 0.0001588095514376094, "loss": 0.0101, "step": 186570 }, { "epoch": 0.94, "learning_rate": 0.00015880198374459541, "loss": 0.0081, "step": 186580 }, { "epoch": 0.94, "learning_rate": 0.0001587944160515814, "loss": 0.0106, "step": 186590 }, { "epoch": 0.94, "learning_rate": 0.00015878684835856738, "loss": 0.011, "step": 186600 }, { "epoch": 0.94, "learning_rate": 0.00015877928066555339, "loss": 0.011, "step": 186610 }, { "epoch": 0.94, "learning_rate": 0.00015877171297253937, "loss": 0.0128, "step": 186620 }, { "epoch": 0.94, "learning_rate": 0.00015876414527952535, "loss": 0.0105, "step": 186630 }, { "epoch": 0.94, "learning_rate": 0.00015875657758651136, "loss": 0.0107, "step": 186640 }, { "epoch": 0.94, "learning_rate": 0.0001587490098934973, "loss": 0.0127, "step": 186650 }, { "epoch": 0.94, "learning_rate": 0.0001587414422004833, "loss": 0.0122, "step": 186660 }, { "epoch": 0.94, "learning_rate": 0.00015873387450746927, "loss": 0.0093, "step": 186670 }, { "epoch": 0.94, "learning_rate": 0.00015872630681445528, "loss": 0.0083, "step": 186680 }, { "epoch": 0.94, "learning_rate": 0.00015871873912144126, "loss": 0.0115, "step": 186690 }, { "epoch": 0.94, "learning_rate": 0.00015871117142842725, "loss": 0.0109, "step": 186700 }, { "epoch": 0.94, "learning_rate": 0.00015870360373541325, "loss": 0.0138, "step": 186710 }, { "epoch": 0.94, "learning_rate": 0.00015869603604239924, "loss": 0.0147, "step": 186720 }, { "epoch": 0.94, "learning_rate": 0.00015868846834938522, "loss": 0.0085, "step": 186730 }, { "epoch": 0.94, "learning_rate": 0.00015868090065637123, "loss": 0.0137, "step": 186740 }, { "epoch": 0.94, "learning_rate": 0.0001586733329633572, "loss": 0.009, "step": 186750 }, { "epoch": 0.94, "learning_rate": 0.0001586657652703432, "loss": 0.0097, "step": 186760 }, { "epoch": 0.94, "learning_rate": 0.00015865819757732917, "loss": 0.0115, "step": 186770 }, { "epoch": 0.94, "learning_rate": 0.00015865062988431518, "loss": 0.0125, "step": 186780 }, { "epoch": 0.94, "learning_rate": 0.00015864306219130116, "loss": 0.0111, "step": 186790 }, { "epoch": 0.94, "learning_rate": 0.00015863549449828714, "loss": 0.0114, "step": 186800 }, { "epoch": 0.94, "learning_rate": 0.00015862792680527315, "loss": 0.0077, "step": 186810 }, { "epoch": 0.94, "learning_rate": 0.00015862035911225913, "loss": 0.0107, "step": 186820 }, { "epoch": 0.94, "learning_rate": 0.0001586127914192451, "loss": 0.0151, "step": 186830 }, { "epoch": 0.94, "learning_rate": 0.00015860522372623112, "loss": 0.0114, "step": 186840 }, { "epoch": 0.94, "learning_rate": 0.0001585976560332171, "loss": 0.0116, "step": 186850 }, { "epoch": 0.94, "learning_rate": 0.00015859008834020308, "loss": 0.0129, "step": 186860 }, { "epoch": 0.94, "learning_rate": 0.0001585825206471891, "loss": 0.0098, "step": 186870 }, { "epoch": 0.94, "learning_rate": 0.00015857495295417507, "loss": 0.0087, "step": 186880 }, { "epoch": 0.94, "learning_rate": 0.00015856738526116106, "loss": 0.01, "step": 186890 }, { "epoch": 0.94, "learning_rate": 0.00015855981756814706, "loss": 0.0097, "step": 186900 }, { "epoch": 0.94, "learning_rate": 0.00015855224987513305, "loss": 0.0105, "step": 186910 }, { "epoch": 0.94, "learning_rate": 0.00015854468218211903, "loss": 0.0258, "step": 186920 }, { "epoch": 0.94, "learning_rate": 0.000158537114489105, "loss": 0.0128, "step": 186930 }, { "epoch": 0.94, "learning_rate": 0.00015852954679609102, "loss": 0.0108, "step": 186940 }, { "epoch": 0.94, "learning_rate": 0.000158521979103077, "loss": 0.0101, "step": 186950 }, { "epoch": 0.94, "learning_rate": 0.00015851441141006298, "loss": 0.0141, "step": 186960 }, { "epoch": 0.94, "learning_rate": 0.000158506843717049, "loss": 0.0093, "step": 186970 }, { "epoch": 0.94, "learning_rate": 0.00015849927602403497, "loss": 0.013, "step": 186980 }, { "epoch": 0.94, "learning_rate": 0.00015849170833102095, "loss": 0.0117, "step": 186990 }, { "epoch": 0.94, "learning_rate": 0.00015848414063800696, "loss": 0.0092, "step": 187000 }, { "epoch": 0.94, "eval_cer": 0.9144683151109114, "eval_loss": 0.008203052915632725, "eval_runtime": 116.5799, "eval_samples_per_second": 17.156, "eval_steps_per_second": 4.289, "step": 187000 }, { "epoch": 0.94, "learning_rate": 0.00015847657294499294, "loss": 0.0105, "step": 187010 }, { "epoch": 0.94, "learning_rate": 0.00015846900525197892, "loss": 0.0123, "step": 187020 }, { "epoch": 0.94, "learning_rate": 0.00015846143755896493, "loss": 0.0105, "step": 187030 }, { "epoch": 0.94, "learning_rate": 0.0001584538698659509, "loss": 0.0101, "step": 187040 }, { "epoch": 0.94, "learning_rate": 0.0001584463021729369, "loss": 0.011, "step": 187050 }, { "epoch": 0.94, "learning_rate": 0.0001584387344799229, "loss": 0.0118, "step": 187060 }, { "epoch": 0.94, "learning_rate": 0.00015843116678690888, "loss": 0.0107, "step": 187070 }, { "epoch": 0.94, "learning_rate": 0.00015842359909389487, "loss": 0.0115, "step": 187080 }, { "epoch": 0.94, "learning_rate": 0.00015841603140088087, "loss": 0.0144, "step": 187090 }, { "epoch": 0.94, "learning_rate": 0.00015840846370786686, "loss": 0.0095, "step": 187100 }, { "epoch": 0.94, "learning_rate": 0.00015840089601485284, "loss": 0.0094, "step": 187110 }, { "epoch": 0.94, "learning_rate": 0.00015839332832183882, "loss": 0.0117, "step": 187120 }, { "epoch": 0.94, "learning_rate": 0.00015838576062882483, "loss": 0.0097, "step": 187130 }, { "epoch": 0.94, "learning_rate": 0.0001583781929358108, "loss": 0.0117, "step": 187140 }, { "epoch": 0.94, "learning_rate": 0.0001583706252427968, "loss": 0.0119, "step": 187150 }, { "epoch": 0.94, "learning_rate": 0.0001583630575497828, "loss": 0.0154, "step": 187160 }, { "epoch": 0.94, "learning_rate": 0.00015835548985676878, "loss": 0.0117, "step": 187170 }, { "epoch": 0.94, "learning_rate": 0.00015834792216375476, "loss": 0.0104, "step": 187180 }, { "epoch": 0.94, "learning_rate": 0.00015834035447074077, "loss": 0.0125, "step": 187190 }, { "epoch": 0.94, "learning_rate": 0.00015833278677772675, "loss": 0.0103, "step": 187200 }, { "epoch": 0.94, "learning_rate": 0.00015832521908471273, "loss": 0.0092, "step": 187210 }, { "epoch": 0.94, "learning_rate": 0.00015831765139169874, "loss": 0.0115, "step": 187220 }, { "epoch": 0.94, "learning_rate": 0.00015831008369868472, "loss": 0.0091, "step": 187230 }, { "epoch": 0.94, "learning_rate": 0.0001583025160056707, "loss": 0.012, "step": 187240 }, { "epoch": 0.94, "learning_rate": 0.0001582949483126567, "loss": 0.0107, "step": 187250 }, { "epoch": 0.94, "learning_rate": 0.0001582873806196427, "loss": 0.013, "step": 187260 }, { "epoch": 0.94, "learning_rate": 0.00015827981292662868, "loss": 0.0093, "step": 187270 }, { "epoch": 0.94, "learning_rate": 0.00015827224523361466, "loss": 0.01, "step": 187280 }, { "epoch": 0.94, "learning_rate": 0.00015826467754060067, "loss": 0.0129, "step": 187290 }, { "epoch": 0.94, "learning_rate": 0.00015825710984758665, "loss": 0.0106, "step": 187300 }, { "epoch": 0.94, "learning_rate": 0.00015824954215457263, "loss": 0.0137, "step": 187310 }, { "epoch": 0.95, "learning_rate": 0.00015824197446155864, "loss": 0.0125, "step": 187320 }, { "epoch": 0.95, "learning_rate": 0.00015823440676854462, "loss": 0.0132, "step": 187330 }, { "epoch": 0.95, "learning_rate": 0.0001582268390755306, "loss": 0.009, "step": 187340 }, { "epoch": 0.95, "learning_rate": 0.0001582192713825166, "loss": 0.01, "step": 187350 }, { "epoch": 0.95, "learning_rate": 0.0001582117036895026, "loss": 0.0105, "step": 187360 }, { "epoch": 0.95, "learning_rate": 0.00015820413599648857, "loss": 0.0109, "step": 187370 }, { "epoch": 0.95, "learning_rate": 0.00015819656830347458, "loss": 0.0111, "step": 187380 }, { "epoch": 0.95, "learning_rate": 0.00015818900061046056, "loss": 0.0111, "step": 187390 }, { "epoch": 0.95, "learning_rate": 0.00015818143291744654, "loss": 0.0107, "step": 187400 }, { "epoch": 0.95, "learning_rate": 0.00015817386522443255, "loss": 0.0106, "step": 187410 }, { "epoch": 0.95, "learning_rate": 0.00015816629753141853, "loss": 0.0117, "step": 187420 }, { "epoch": 0.95, "learning_rate": 0.00015815872983840451, "loss": 0.0103, "step": 187430 }, { "epoch": 0.95, "learning_rate": 0.0001581511621453905, "loss": 0.0115, "step": 187440 }, { "epoch": 0.95, "learning_rate": 0.0001581435944523765, "loss": 0.009, "step": 187450 }, { "epoch": 0.95, "learning_rate": 0.00015813602675936249, "loss": 0.0094, "step": 187460 }, { "epoch": 0.95, "learning_rate": 0.00015812845906634847, "loss": 0.0108, "step": 187470 }, { "epoch": 0.95, "learning_rate": 0.00015812089137333448, "loss": 0.011, "step": 187480 }, { "epoch": 0.95, "learning_rate": 0.00015811332368032046, "loss": 0.014, "step": 187490 }, { "epoch": 0.95, "learning_rate": 0.00015810575598730644, "loss": 0.0104, "step": 187500 }, { "epoch": 0.95, "learning_rate": 0.00015809818829429245, "loss": 0.0112, "step": 187510 }, { "epoch": 0.95, "learning_rate": 0.00015809062060127843, "loss": 0.0125, "step": 187520 }, { "epoch": 0.95, "learning_rate": 0.0001580830529082644, "loss": 0.0116, "step": 187530 }, { "epoch": 0.95, "learning_rate": 0.00015807548521525042, "loss": 0.0097, "step": 187540 }, { "epoch": 0.95, "learning_rate": 0.0001580679175222364, "loss": 0.0106, "step": 187550 }, { "epoch": 0.95, "learning_rate": 0.00015806034982922238, "loss": 0.0099, "step": 187560 }, { "epoch": 0.95, "learning_rate": 0.0001580527821362084, "loss": 0.0089, "step": 187570 }, { "epoch": 0.95, "learning_rate": 0.00015804521444319437, "loss": 0.0098, "step": 187580 }, { "epoch": 0.95, "learning_rate": 0.00015803764675018035, "loss": 0.0096, "step": 187590 }, { "epoch": 0.95, "learning_rate": 0.00015803007905716636, "loss": 0.0102, "step": 187600 }, { "epoch": 0.95, "learning_rate": 0.00015802251136415234, "loss": 0.0095, "step": 187610 }, { "epoch": 0.95, "learning_rate": 0.00015801494367113832, "loss": 0.0086, "step": 187620 }, { "epoch": 0.95, "learning_rate": 0.0001580073759781243, "loss": 0.0103, "step": 187630 }, { "epoch": 0.95, "learning_rate": 0.00015799980828511031, "loss": 0.0101, "step": 187640 }, { "epoch": 0.95, "learning_rate": 0.0001579922405920963, "loss": 0.0092, "step": 187650 }, { "epoch": 0.95, "learning_rate": 0.00015798467289908228, "loss": 0.012, "step": 187660 }, { "epoch": 0.95, "learning_rate": 0.00015797710520606829, "loss": 0.0101, "step": 187670 }, { "epoch": 0.95, "learning_rate": 0.00015796953751305427, "loss": 0.0102, "step": 187680 }, { "epoch": 0.95, "learning_rate": 0.00015796196982004025, "loss": 0.0162, "step": 187690 }, { "epoch": 0.95, "learning_rate": 0.00015795440212702626, "loss": 0.0118, "step": 187700 }, { "epoch": 0.95, "learning_rate": 0.00015794683443401224, "loss": 0.0115, "step": 187710 }, { "epoch": 0.95, "learning_rate": 0.00015793926674099822, "loss": 0.0102, "step": 187720 }, { "epoch": 0.95, "learning_rate": 0.00015793169904798423, "loss": 0.0111, "step": 187730 }, { "epoch": 0.95, "learning_rate": 0.0001579241313549702, "loss": 0.0103, "step": 187740 }, { "epoch": 0.95, "learning_rate": 0.0001579165636619562, "loss": 0.01, "step": 187750 }, { "epoch": 0.95, "learning_rate": 0.0001579089959689422, "loss": 0.0111, "step": 187760 }, { "epoch": 0.95, "learning_rate": 0.00015790142827592818, "loss": 0.013, "step": 187770 }, { "epoch": 0.95, "learning_rate": 0.00015789386058291416, "loss": 0.0097, "step": 187780 }, { "epoch": 0.95, "learning_rate": 0.00015788629288990014, "loss": 0.0103, "step": 187790 }, { "epoch": 0.95, "learning_rate": 0.00015787872519688615, "loss": 0.0123, "step": 187800 }, { "epoch": 0.95, "learning_rate": 0.00015787115750387213, "loss": 0.0122, "step": 187810 }, { "epoch": 0.95, "learning_rate": 0.00015786358981085812, "loss": 0.0125, "step": 187820 }, { "epoch": 0.95, "learning_rate": 0.00015785602211784412, "loss": 0.0115, "step": 187830 }, { "epoch": 0.95, "learning_rate": 0.0001578484544248301, "loss": 0.0089, "step": 187840 }, { "epoch": 0.95, "learning_rate": 0.0001578408867318161, "loss": 0.0115, "step": 187850 }, { "epoch": 0.95, "learning_rate": 0.0001578333190388021, "loss": 0.0122, "step": 187860 }, { "epoch": 0.95, "learning_rate": 0.00015782575134578808, "loss": 0.0133, "step": 187870 }, { "epoch": 0.95, "learning_rate": 0.00015781818365277406, "loss": 0.0117, "step": 187880 }, { "epoch": 0.95, "learning_rate": 0.00015781061595976007, "loss": 0.012, "step": 187890 }, { "epoch": 0.95, "learning_rate": 0.00015780304826674605, "loss": 0.0097, "step": 187900 }, { "epoch": 0.95, "learning_rate": 0.000157795480573732, "loss": 0.01, "step": 187910 }, { "epoch": 0.95, "learning_rate": 0.00015778791288071798, "loss": 0.0114, "step": 187920 }, { "epoch": 0.95, "learning_rate": 0.000157780345187704, "loss": 0.0124, "step": 187930 }, { "epoch": 0.95, "learning_rate": 0.00015777277749468997, "loss": 0.0115, "step": 187940 }, { "epoch": 0.95, "learning_rate": 0.00015776520980167596, "loss": 0.0108, "step": 187950 }, { "epoch": 0.95, "learning_rate": 0.00015775764210866196, "loss": 0.0098, "step": 187960 }, { "epoch": 0.95, "learning_rate": 0.00015775007441564795, "loss": 0.0136, "step": 187970 }, { "epoch": 0.95, "learning_rate": 0.00015774250672263393, "loss": 0.0113, "step": 187980 }, { "epoch": 0.95, "learning_rate": 0.00015773493902961994, "loss": 0.0107, "step": 187990 }, { "epoch": 0.95, "learning_rate": 0.00015772737133660592, "loss": 0.0113, "step": 188000 }, { "epoch": 0.95, "eval_cer": 0.9144634631302844, "eval_loss": 0.007855391129851341, "eval_runtime": 116.599, "eval_samples_per_second": 17.153, "eval_steps_per_second": 4.288, "step": 188000 }, { "epoch": 0.95, "learning_rate": 0.0001577198036435919, "loss": 0.0129, "step": 188010 }, { "epoch": 0.95, "learning_rate": 0.00015771223595057788, "loss": 0.0086, "step": 188020 }, { "epoch": 0.95, "learning_rate": 0.0001577046682575639, "loss": 0.0094, "step": 188030 }, { "epoch": 0.95, "learning_rate": 0.00015769710056454987, "loss": 0.0116, "step": 188040 }, { "epoch": 0.95, "learning_rate": 0.00015768953287153585, "loss": 0.0123, "step": 188050 }, { "epoch": 0.95, "learning_rate": 0.00015768196517852186, "loss": 0.0144, "step": 188060 }, { "epoch": 0.95, "learning_rate": 0.00015767439748550784, "loss": 0.0107, "step": 188070 }, { "epoch": 0.95, "learning_rate": 0.00015766682979249382, "loss": 0.0162, "step": 188080 }, { "epoch": 0.95, "learning_rate": 0.00015765926209947983, "loss": 0.0106, "step": 188090 }, { "epoch": 0.95, "learning_rate": 0.0001576516944064658, "loss": 0.0096, "step": 188100 }, { "epoch": 0.95, "learning_rate": 0.0001576441267134518, "loss": 0.0101, "step": 188110 }, { "epoch": 0.95, "learning_rate": 0.0001576365590204378, "loss": 0.0105, "step": 188120 }, { "epoch": 0.95, "learning_rate": 0.00015762899132742378, "loss": 0.0114, "step": 188130 }, { "epoch": 0.95, "learning_rate": 0.00015762142363440977, "loss": 0.0119, "step": 188140 }, { "epoch": 0.95, "learning_rate": 0.00015761385594139577, "loss": 0.0193, "step": 188150 }, { "epoch": 0.95, "learning_rate": 0.00015760628824838176, "loss": 0.0105, "step": 188160 }, { "epoch": 0.95, "learning_rate": 0.00015759872055536774, "loss": 0.0125, "step": 188170 }, { "epoch": 0.95, "learning_rate": 0.00015759115286235372, "loss": 0.0126, "step": 188180 }, { "epoch": 0.95, "learning_rate": 0.00015758358516933973, "loss": 0.0122, "step": 188190 }, { "epoch": 0.95, "learning_rate": 0.0001575760174763257, "loss": 0.0094, "step": 188200 }, { "epoch": 0.95, "learning_rate": 0.0001575684497833117, "loss": 0.0111, "step": 188210 }, { "epoch": 0.95, "learning_rate": 0.0001575608820902977, "loss": 0.0177, "step": 188220 }, { "epoch": 0.95, "learning_rate": 0.00015755331439728368, "loss": 0.0131, "step": 188230 }, { "epoch": 0.95, "learning_rate": 0.00015754574670426966, "loss": 0.0095, "step": 188240 }, { "epoch": 0.95, "learning_rate": 0.00015753817901125567, "loss": 0.0118, "step": 188250 }, { "epoch": 0.95, "learning_rate": 0.00015753061131824165, "loss": 0.0136, "step": 188260 }, { "epoch": 0.95, "learning_rate": 0.00015752304362522763, "loss": 0.0103, "step": 188270 }, { "epoch": 0.95, "learning_rate": 0.00015751547593221364, "loss": 0.0129, "step": 188280 }, { "epoch": 0.95, "learning_rate": 0.00015750790823919962, "loss": 0.008, "step": 188290 }, { "epoch": 0.95, "learning_rate": 0.0001575003405461856, "loss": 0.0145, "step": 188300 }, { "epoch": 0.95, "learning_rate": 0.0001574927728531716, "loss": 0.0092, "step": 188310 }, { "epoch": 0.95, "learning_rate": 0.0001574852051601576, "loss": 0.0074, "step": 188320 }, { "epoch": 0.95, "learning_rate": 0.00015747763746714358, "loss": 0.0131, "step": 188330 }, { "epoch": 0.95, "learning_rate": 0.00015747006977412956, "loss": 0.0084, "step": 188340 }, { "epoch": 0.95, "learning_rate": 0.00015746250208111557, "loss": 0.009, "step": 188350 }, { "epoch": 0.95, "learning_rate": 0.00015745493438810155, "loss": 0.0124, "step": 188360 }, { "epoch": 0.95, "learning_rate": 0.00015744736669508753, "loss": 0.0099, "step": 188370 }, { "epoch": 0.95, "learning_rate": 0.00015743979900207354, "loss": 0.0109, "step": 188380 }, { "epoch": 0.95, "learning_rate": 0.00015743223130905952, "loss": 0.0141, "step": 188390 }, { "epoch": 0.95, "learning_rate": 0.0001574246636160455, "loss": 0.0107, "step": 188400 }, { "epoch": 0.95, "learning_rate": 0.0001574170959230315, "loss": 0.01, "step": 188410 }, { "epoch": 0.95, "learning_rate": 0.0001574095282300175, "loss": 0.0109, "step": 188420 }, { "epoch": 0.95, "learning_rate": 0.00015740196053700347, "loss": 0.011, "step": 188430 }, { "epoch": 0.95, "learning_rate": 0.00015739439284398948, "loss": 0.0098, "step": 188440 }, { "epoch": 0.95, "learning_rate": 0.00015738682515097546, "loss": 0.0111, "step": 188450 }, { "epoch": 0.95, "learning_rate": 0.00015737925745796144, "loss": 0.012, "step": 188460 }, { "epoch": 0.95, "learning_rate": 0.00015737168976494745, "loss": 0.0101, "step": 188470 }, { "epoch": 0.95, "learning_rate": 0.00015736412207193343, "loss": 0.0145, "step": 188480 }, { "epoch": 0.95, "learning_rate": 0.00015735655437891941, "loss": 0.0085, "step": 188490 }, { "epoch": 0.95, "learning_rate": 0.00015734898668590542, "loss": 0.0097, "step": 188500 }, { "epoch": 0.95, "learning_rate": 0.0001573414189928914, "loss": 0.0104, "step": 188510 }, { "epoch": 0.95, "learning_rate": 0.00015733385129987739, "loss": 0.0106, "step": 188520 }, { "epoch": 0.95, "learning_rate": 0.00015732628360686337, "loss": 0.011, "step": 188530 }, { "epoch": 0.95, "learning_rate": 0.00015731871591384938, "loss": 0.0121, "step": 188540 }, { "epoch": 0.95, "learning_rate": 0.00015731114822083536, "loss": 0.01, "step": 188550 }, { "epoch": 0.95, "learning_rate": 0.00015730358052782134, "loss": 0.0083, "step": 188560 }, { "epoch": 0.95, "learning_rate": 0.00015729601283480735, "loss": 0.0116, "step": 188570 }, { "epoch": 0.95, "learning_rate": 0.00015728844514179333, "loss": 0.0102, "step": 188580 }, { "epoch": 0.95, "learning_rate": 0.0001572808774487793, "loss": 0.0147, "step": 188590 }, { "epoch": 0.95, "learning_rate": 0.00015727330975576532, "loss": 0.0122, "step": 188600 }, { "epoch": 0.95, "learning_rate": 0.0001572657420627513, "loss": 0.0106, "step": 188610 }, { "epoch": 0.95, "learning_rate": 0.00015725817436973728, "loss": 0.0098, "step": 188620 }, { "epoch": 0.95, "learning_rate": 0.0001572506066767233, "loss": 0.0113, "step": 188630 }, { "epoch": 0.95, "learning_rate": 0.00015724303898370927, "loss": 0.0146, "step": 188640 }, { "epoch": 0.95, "learning_rate": 0.00015723547129069525, "loss": 0.0117, "step": 188650 }, { "epoch": 0.95, "learning_rate": 0.00015722790359768126, "loss": 0.0104, "step": 188660 }, { "epoch": 0.95, "learning_rate": 0.00015722033590466724, "loss": 0.0114, "step": 188670 }, { "epoch": 0.95, "learning_rate": 0.00015721276821165322, "loss": 0.01, "step": 188680 }, { "epoch": 0.95, "learning_rate": 0.0001572052005186392, "loss": 0.0117, "step": 188690 }, { "epoch": 0.95, "learning_rate": 0.00015719763282562521, "loss": 0.0088, "step": 188700 }, { "epoch": 0.95, "learning_rate": 0.0001571900651326112, "loss": 0.0097, "step": 188710 }, { "epoch": 0.95, "learning_rate": 0.00015718249743959718, "loss": 0.0093, "step": 188720 }, { "epoch": 0.95, "learning_rate": 0.00015717492974658319, "loss": 0.0149, "step": 188730 }, { "epoch": 0.95, "learning_rate": 0.00015716736205356917, "loss": 0.0106, "step": 188740 }, { "epoch": 0.95, "learning_rate": 0.00015715979436055515, "loss": 0.0145, "step": 188750 }, { "epoch": 0.95, "learning_rate": 0.00015715222666754116, "loss": 0.0096, "step": 188760 }, { "epoch": 0.95, "learning_rate": 0.00015714465897452714, "loss": 0.0119, "step": 188770 }, { "epoch": 0.95, "learning_rate": 0.00015713709128151312, "loss": 0.013, "step": 188780 }, { "epoch": 0.95, "learning_rate": 0.00015712952358849913, "loss": 0.0107, "step": 188790 }, { "epoch": 0.95, "learning_rate": 0.0001571219558954851, "loss": 0.012, "step": 188800 }, { "epoch": 0.95, "learning_rate": 0.0001571143882024711, "loss": 0.0102, "step": 188810 }, { "epoch": 0.95, "learning_rate": 0.0001571068205094571, "loss": 0.0105, "step": 188820 }, { "epoch": 0.95, "learning_rate": 0.00015709925281644308, "loss": 0.0123, "step": 188830 }, { "epoch": 0.95, "learning_rate": 0.00015709168512342906, "loss": 0.0121, "step": 188840 }, { "epoch": 0.95, "learning_rate": 0.00015708411743041504, "loss": 0.0089, "step": 188850 }, { "epoch": 0.95, "learning_rate": 0.00015707654973740105, "loss": 0.0112, "step": 188860 }, { "epoch": 0.95, "learning_rate": 0.00015706898204438703, "loss": 0.0091, "step": 188870 }, { "epoch": 0.95, "learning_rate": 0.00015706141435137302, "loss": 0.0136, "step": 188880 }, { "epoch": 0.95, "learning_rate": 0.00015705384665835902, "loss": 0.0114, "step": 188890 }, { "epoch": 0.95, "learning_rate": 0.000157046278965345, "loss": 0.0123, "step": 188900 }, { "epoch": 0.95, "learning_rate": 0.000157038711272331, "loss": 0.012, "step": 188910 }, { "epoch": 0.95, "learning_rate": 0.000157031143579317, "loss": 0.0139, "step": 188920 }, { "epoch": 0.95, "learning_rate": 0.00015702357588630298, "loss": 0.0113, "step": 188930 }, { "epoch": 0.95, "learning_rate": 0.00015701600819328896, "loss": 0.011, "step": 188940 }, { "epoch": 0.95, "learning_rate": 0.00015700844050027497, "loss": 0.011, "step": 188950 }, { "epoch": 0.95, "learning_rate": 0.00015700087280726095, "loss": 0.014, "step": 188960 }, { "epoch": 0.95, "learning_rate": 0.00015699330511424693, "loss": 0.0108, "step": 188970 }, { "epoch": 0.95, "learning_rate": 0.00015698573742123294, "loss": 0.0092, "step": 188980 }, { "epoch": 0.95, "learning_rate": 0.00015697816972821892, "loss": 0.0115, "step": 188990 }, { "epoch": 0.95, "learning_rate": 0.0001569706020352049, "loss": 0.011, "step": 189000 }, { "epoch": 0.95, "eval_cer": 0.914452788772905, "eval_loss": 0.00806601531803608, "eval_runtime": 116.7489, "eval_samples_per_second": 17.131, "eval_steps_per_second": 4.283, "step": 189000 }, { "epoch": 0.95, "learning_rate": 0.00015696303434219088, "loss": 0.0111, "step": 189010 }, { "epoch": 0.95, "learning_rate": 0.0001569554666491769, "loss": 0.0127, "step": 189020 }, { "epoch": 0.95, "learning_rate": 0.00015694789895616287, "loss": 0.0139, "step": 189030 }, { "epoch": 0.95, "learning_rate": 0.00015694033126314885, "loss": 0.0113, "step": 189040 }, { "epoch": 0.95, "learning_rate": 0.00015693276357013486, "loss": 0.0078, "step": 189050 }, { "epoch": 0.95, "learning_rate": 0.00015692519587712084, "loss": 0.0086, "step": 189060 }, { "epoch": 0.95, "learning_rate": 0.00015691762818410683, "loss": 0.0113, "step": 189070 }, { "epoch": 0.95, "learning_rate": 0.00015691006049109283, "loss": 0.01, "step": 189080 }, { "epoch": 0.95, "learning_rate": 0.00015690249279807882, "loss": 0.0086, "step": 189090 }, { "epoch": 0.95, "learning_rate": 0.0001568949251050648, "loss": 0.0109, "step": 189100 }, { "epoch": 0.95, "learning_rate": 0.0001568873574120508, "loss": 0.0137, "step": 189110 }, { "epoch": 0.95, "learning_rate": 0.0001568797897190368, "loss": 0.0101, "step": 189120 }, { "epoch": 0.95, "learning_rate": 0.00015687222202602277, "loss": 0.0116, "step": 189130 }, { "epoch": 0.95, "learning_rate": 0.00015686465433300878, "loss": 0.0092, "step": 189140 }, { "epoch": 0.95, "learning_rate": 0.00015685708663999476, "loss": 0.0101, "step": 189150 }, { "epoch": 0.95, "learning_rate": 0.00015684951894698074, "loss": 0.0123, "step": 189160 }, { "epoch": 0.95, "learning_rate": 0.0001568419512539667, "loss": 0.0086, "step": 189170 }, { "epoch": 0.95, "learning_rate": 0.0001568343835609527, "loss": 0.0103, "step": 189180 }, { "epoch": 0.95, "learning_rate": 0.00015682681586793868, "loss": 0.0126, "step": 189190 }, { "epoch": 0.95, "learning_rate": 0.00015681924817492467, "loss": 0.01, "step": 189200 }, { "epoch": 0.95, "learning_rate": 0.00015681168048191067, "loss": 0.0118, "step": 189210 }, { "epoch": 0.95, "learning_rate": 0.00015680411278889666, "loss": 0.0127, "step": 189220 }, { "epoch": 0.95, "learning_rate": 0.00015679654509588264, "loss": 0.0202, "step": 189230 }, { "epoch": 0.95, "learning_rate": 0.00015678897740286862, "loss": 0.0107, "step": 189240 }, { "epoch": 0.95, "learning_rate": 0.00015678140970985463, "loss": 0.0112, "step": 189250 }, { "epoch": 0.95, "learning_rate": 0.0001567738420168406, "loss": 0.0098, "step": 189260 }, { "epoch": 0.95, "learning_rate": 0.0001567662743238266, "loss": 0.0149, "step": 189270 }, { "epoch": 0.95, "learning_rate": 0.0001567587066308126, "loss": 0.0101, "step": 189280 }, { "epoch": 0.95, "learning_rate": 0.00015675113893779858, "loss": 0.0107, "step": 189290 }, { "epoch": 0.96, "learning_rate": 0.00015674357124478456, "loss": 0.0113, "step": 189300 }, { "epoch": 0.96, "learning_rate": 0.00015673600355177057, "loss": 0.0112, "step": 189310 }, { "epoch": 0.96, "learning_rate": 0.00015672843585875655, "loss": 0.0077, "step": 189320 }, { "epoch": 0.96, "learning_rate": 0.00015672086816574253, "loss": 0.0113, "step": 189330 }, { "epoch": 0.96, "learning_rate": 0.00015671330047272854, "loss": 0.0103, "step": 189340 }, { "epoch": 0.96, "learning_rate": 0.00015670573277971452, "loss": 0.0102, "step": 189350 }, { "epoch": 0.96, "learning_rate": 0.0001566981650867005, "loss": 0.0132, "step": 189360 }, { "epoch": 0.96, "learning_rate": 0.0001566905973936865, "loss": 0.0088, "step": 189370 }, { "epoch": 0.96, "learning_rate": 0.0001566830297006725, "loss": 0.0096, "step": 189380 }, { "epoch": 0.96, "learning_rate": 0.00015667546200765848, "loss": 0.0092, "step": 189390 }, { "epoch": 0.96, "learning_rate": 0.00015666789431464446, "loss": 0.0115, "step": 189400 }, { "epoch": 0.96, "learning_rate": 0.00015666032662163047, "loss": 0.0137, "step": 189410 }, { "epoch": 0.96, "learning_rate": 0.00015665275892861645, "loss": 0.011, "step": 189420 }, { "epoch": 0.96, "learning_rate": 0.00015664519123560243, "loss": 0.0121, "step": 189430 }, { "epoch": 0.96, "learning_rate": 0.00015663762354258844, "loss": 0.012, "step": 189440 }, { "epoch": 0.96, "learning_rate": 0.00015663005584957442, "loss": 0.011, "step": 189450 }, { "epoch": 0.96, "learning_rate": 0.0001566224881565604, "loss": 0.0103, "step": 189460 }, { "epoch": 0.96, "learning_rate": 0.0001566149204635464, "loss": 0.0119, "step": 189470 }, { "epoch": 0.96, "learning_rate": 0.0001566073527705324, "loss": 0.0121, "step": 189480 }, { "epoch": 0.96, "learning_rate": 0.00015659978507751837, "loss": 0.0132, "step": 189490 }, { "epoch": 0.96, "learning_rate": 0.00015659221738450438, "loss": 0.013, "step": 189500 }, { "epoch": 0.96, "learning_rate": 0.00015658464969149036, "loss": 0.0111, "step": 189510 }, { "epoch": 0.96, "learning_rate": 0.00015657708199847634, "loss": 0.0101, "step": 189520 }, { "epoch": 0.96, "learning_rate": 0.00015656951430546235, "loss": 0.0119, "step": 189530 }, { "epoch": 0.96, "learning_rate": 0.00015656194661244833, "loss": 0.0144, "step": 189540 }, { "epoch": 0.96, "learning_rate": 0.00015655437891943431, "loss": 0.0126, "step": 189550 }, { "epoch": 0.96, "learning_rate": 0.00015654681122642032, "loss": 0.0141, "step": 189560 }, { "epoch": 0.96, "learning_rate": 0.0001565392435334063, "loss": 0.0121, "step": 189570 }, { "epoch": 0.96, "learning_rate": 0.00015653167584039229, "loss": 0.0121, "step": 189580 }, { "epoch": 0.96, "learning_rate": 0.00015652410814737827, "loss": 0.0111, "step": 189590 }, { "epoch": 0.96, "learning_rate": 0.00015651654045436428, "loss": 0.0164, "step": 189600 }, { "epoch": 0.96, "learning_rate": 0.00015650897276135026, "loss": 0.0104, "step": 189610 }, { "epoch": 0.96, "learning_rate": 0.00015650140506833624, "loss": 0.01, "step": 189620 }, { "epoch": 0.96, "learning_rate": 0.00015649383737532225, "loss": 0.0107, "step": 189630 }, { "epoch": 0.96, "learning_rate": 0.00015648626968230823, "loss": 0.009, "step": 189640 }, { "epoch": 0.96, "learning_rate": 0.0001564787019892942, "loss": 0.01, "step": 189650 }, { "epoch": 0.96, "learning_rate": 0.00015647113429628022, "loss": 0.0113, "step": 189660 }, { "epoch": 0.96, "learning_rate": 0.0001564635666032662, "loss": 0.01, "step": 189670 }, { "epoch": 0.96, "learning_rate": 0.00015645599891025218, "loss": 0.0103, "step": 189680 }, { "epoch": 0.96, "learning_rate": 0.0001564484312172382, "loss": 0.0125, "step": 189690 }, { "epoch": 0.96, "learning_rate": 0.00015644086352422417, "loss": 0.0104, "step": 189700 }, { "epoch": 0.96, "learning_rate": 0.00015643329583121015, "loss": 0.0115, "step": 189710 }, { "epoch": 0.96, "learning_rate": 0.00015642572813819616, "loss": 0.0115, "step": 189720 }, { "epoch": 0.96, "learning_rate": 0.00015641816044518214, "loss": 0.0129, "step": 189730 }, { "epoch": 0.96, "learning_rate": 0.00015641059275216812, "loss": 0.0112, "step": 189740 }, { "epoch": 0.96, "learning_rate": 0.0001564030250591541, "loss": 0.0146, "step": 189750 }, { "epoch": 0.96, "learning_rate": 0.00015639545736614011, "loss": 0.0113, "step": 189760 }, { "epoch": 0.96, "learning_rate": 0.0001563878896731261, "loss": 0.0109, "step": 189770 }, { "epoch": 0.96, "learning_rate": 0.00015638032198011208, "loss": 0.0087, "step": 189780 }, { "epoch": 0.96, "learning_rate": 0.00015637275428709809, "loss": 0.013, "step": 189790 }, { "epoch": 0.96, "learning_rate": 0.00015636518659408407, "loss": 0.0112, "step": 189800 }, { "epoch": 0.96, "learning_rate": 0.00015635761890107005, "loss": 0.0089, "step": 189810 }, { "epoch": 0.96, "learning_rate": 0.00015635005120805606, "loss": 0.0102, "step": 189820 }, { "epoch": 0.96, "learning_rate": 0.00015634248351504204, "loss": 0.0118, "step": 189830 }, { "epoch": 0.96, "learning_rate": 0.00015633491582202802, "loss": 0.0108, "step": 189840 }, { "epoch": 0.96, "learning_rate": 0.00015632734812901403, "loss": 0.0128, "step": 189850 }, { "epoch": 0.96, "learning_rate": 0.000156319780436, "loss": 0.0129, "step": 189860 }, { "epoch": 0.96, "learning_rate": 0.000156312212742986, "loss": 0.0146, "step": 189870 }, { "epoch": 0.96, "learning_rate": 0.000156304645049972, "loss": 0.0115, "step": 189880 }, { "epoch": 0.96, "learning_rate": 0.00015629707735695798, "loss": 0.0125, "step": 189890 }, { "epoch": 0.96, "learning_rate": 0.00015628950966394396, "loss": 0.0111, "step": 189900 }, { "epoch": 0.96, "learning_rate": 0.00015628194197092994, "loss": 0.0099, "step": 189910 }, { "epoch": 0.96, "learning_rate": 0.00015627437427791595, "loss": 0.0115, "step": 189920 }, { "epoch": 0.96, "learning_rate": 0.00015626680658490193, "loss": 0.0115, "step": 189930 }, { "epoch": 0.96, "learning_rate": 0.00015625923889188792, "loss": 0.0134, "step": 189940 }, { "epoch": 0.96, "learning_rate": 0.00015625167119887392, "loss": 0.0137, "step": 189950 }, { "epoch": 0.96, "learning_rate": 0.0001562441035058599, "loss": 0.0102, "step": 189960 }, { "epoch": 0.96, "learning_rate": 0.0001562365358128459, "loss": 0.0099, "step": 189970 }, { "epoch": 0.96, "learning_rate": 0.0001562289681198319, "loss": 0.0129, "step": 189980 }, { "epoch": 0.96, "learning_rate": 0.00015622140042681788, "loss": 0.0099, "step": 189990 }, { "epoch": 0.96, "learning_rate": 0.00015621383273380386, "loss": 0.0097, "step": 190000 }, { "epoch": 0.96, "eval_cer": 0.9144372624348985, "eval_loss": 0.007905209437012672, "eval_runtime": 116.6163, "eval_samples_per_second": 17.15, "eval_steps_per_second": 4.288, "step": 190000 }, { "epoch": 0.96, "learning_rate": 0.00015620626504078987, "loss": 0.0084, "step": 190010 }, { "epoch": 0.96, "learning_rate": 0.00015619869734777585, "loss": 0.0122, "step": 190020 }, { "epoch": 0.96, "learning_rate": 0.00015619112965476183, "loss": 0.0101, "step": 190030 }, { "epoch": 0.96, "learning_rate": 0.00015618356196174784, "loss": 0.0118, "step": 190040 }, { "epoch": 0.96, "learning_rate": 0.00015617599426873382, "loss": 0.0215, "step": 190050 }, { "epoch": 0.96, "learning_rate": 0.0001561684265757198, "loss": 0.0112, "step": 190060 }, { "epoch": 0.96, "learning_rate": 0.0001561608588827058, "loss": 0.0125, "step": 190070 }, { "epoch": 0.96, "learning_rate": 0.0001561532911896918, "loss": 0.0126, "step": 190080 }, { "epoch": 0.96, "learning_rate": 0.00015614572349667777, "loss": 0.0125, "step": 190090 }, { "epoch": 0.96, "learning_rate": 0.00015613815580366375, "loss": 0.0092, "step": 190100 }, { "epoch": 0.96, "learning_rate": 0.00015613058811064976, "loss": 0.0112, "step": 190110 }, { "epoch": 0.96, "learning_rate": 0.00015612302041763574, "loss": 0.0096, "step": 190120 }, { "epoch": 0.96, "learning_rate": 0.00015611545272462173, "loss": 0.0126, "step": 190130 }, { "epoch": 0.96, "learning_rate": 0.00015610788503160773, "loss": 0.0112, "step": 190140 }, { "epoch": 0.96, "learning_rate": 0.00015610031733859372, "loss": 0.0103, "step": 190150 }, { "epoch": 0.96, "learning_rate": 0.0001560927496455797, "loss": 0.0125, "step": 190160 }, { "epoch": 0.96, "learning_rate": 0.0001560851819525657, "loss": 0.0109, "step": 190170 }, { "epoch": 0.96, "learning_rate": 0.0001560776142595517, "loss": 0.0121, "step": 190180 }, { "epoch": 0.96, "learning_rate": 0.00015607004656653767, "loss": 0.0132, "step": 190190 }, { "epoch": 0.96, "learning_rate": 0.00015606247887352368, "loss": 0.0111, "step": 190200 }, { "epoch": 0.96, "learning_rate": 0.00015605491118050966, "loss": 0.0108, "step": 190210 }, { "epoch": 0.96, "learning_rate": 0.00015604734348749564, "loss": 0.0111, "step": 190220 }, { "epoch": 0.96, "learning_rate": 0.00015603977579448165, "loss": 0.0101, "step": 190230 }, { "epoch": 0.96, "learning_rate": 0.00015603220810146763, "loss": 0.0088, "step": 190240 }, { "epoch": 0.96, "learning_rate": 0.0001560246404084536, "loss": 0.0106, "step": 190250 }, { "epoch": 0.96, "learning_rate": 0.0001560170727154396, "loss": 0.0122, "step": 190260 }, { "epoch": 0.96, "learning_rate": 0.0001560095050224256, "loss": 0.009, "step": 190270 }, { "epoch": 0.96, "learning_rate": 0.00015600193732941158, "loss": 0.0112, "step": 190280 }, { "epoch": 0.96, "learning_rate": 0.00015599436963639756, "loss": 0.0135, "step": 190290 }, { "epoch": 0.96, "learning_rate": 0.00015598680194338357, "loss": 0.01, "step": 190300 }, { "epoch": 0.96, "learning_rate": 0.00015597923425036955, "loss": 0.0093, "step": 190310 }, { "epoch": 0.96, "learning_rate": 0.00015597166655735554, "loss": 0.0127, "step": 190320 }, { "epoch": 0.96, "learning_rate": 0.00015596409886434154, "loss": 0.0094, "step": 190330 }, { "epoch": 0.96, "learning_rate": 0.00015595653117132753, "loss": 0.011, "step": 190340 }, { "epoch": 0.96, "learning_rate": 0.0001559489634783135, "loss": 0.0144, "step": 190350 }, { "epoch": 0.96, "learning_rate": 0.00015594139578529952, "loss": 0.0136, "step": 190360 }, { "epoch": 0.96, "learning_rate": 0.0001559338280922855, "loss": 0.0114, "step": 190370 }, { "epoch": 0.96, "learning_rate": 0.00015592626039927148, "loss": 0.0125, "step": 190380 }, { "epoch": 0.96, "learning_rate": 0.0001559186927062575, "loss": 0.0101, "step": 190390 }, { "epoch": 0.96, "learning_rate": 0.00015591112501324347, "loss": 0.0085, "step": 190400 }, { "epoch": 0.96, "learning_rate": 0.00015590355732022945, "loss": 0.0114, "step": 190410 }, { "epoch": 0.96, "learning_rate": 0.0001558959896272154, "loss": 0.0112, "step": 190420 }, { "epoch": 0.96, "learning_rate": 0.0001558884219342014, "loss": 0.0115, "step": 190430 }, { "epoch": 0.96, "learning_rate": 0.0001558808542411874, "loss": 0.0117, "step": 190440 }, { "epoch": 0.96, "learning_rate": 0.00015587328654817338, "loss": 0.0104, "step": 190450 }, { "epoch": 0.96, "learning_rate": 0.00015586571885515938, "loss": 0.0103, "step": 190460 }, { "epoch": 0.96, "learning_rate": 0.00015585815116214537, "loss": 0.0116, "step": 190470 }, { "epoch": 0.96, "learning_rate": 0.00015585058346913135, "loss": 0.0113, "step": 190480 }, { "epoch": 0.96, "learning_rate": 0.00015584301577611733, "loss": 0.0103, "step": 190490 }, { "epoch": 0.96, "learning_rate": 0.00015583544808310334, "loss": 0.0102, "step": 190500 }, { "epoch": 0.96, "learning_rate": 0.00015582788039008932, "loss": 0.0087, "step": 190510 }, { "epoch": 0.96, "learning_rate": 0.0001558203126970753, "loss": 0.0127, "step": 190520 }, { "epoch": 0.96, "learning_rate": 0.0001558127450040613, "loss": 0.013, "step": 190530 }, { "epoch": 0.96, "learning_rate": 0.0001558051773110473, "loss": 0.0117, "step": 190540 }, { "epoch": 0.96, "learning_rate": 0.00015579760961803327, "loss": 0.0135, "step": 190550 }, { "epoch": 0.96, "learning_rate": 0.00015579004192501928, "loss": 0.0127, "step": 190560 }, { "epoch": 0.96, "learning_rate": 0.00015578247423200526, "loss": 0.0109, "step": 190570 }, { "epoch": 0.96, "learning_rate": 0.00015577490653899124, "loss": 0.0144, "step": 190580 }, { "epoch": 0.96, "learning_rate": 0.00015576733884597725, "loss": 0.0103, "step": 190590 }, { "epoch": 0.96, "learning_rate": 0.00015575977115296323, "loss": 0.0139, "step": 190600 }, { "epoch": 0.96, "learning_rate": 0.00015575220345994921, "loss": 0.0113, "step": 190610 }, { "epoch": 0.96, "learning_rate": 0.00015574463576693522, "loss": 0.0121, "step": 190620 }, { "epoch": 0.96, "learning_rate": 0.0001557370680739212, "loss": 0.0111, "step": 190630 }, { "epoch": 0.96, "learning_rate": 0.00015572950038090719, "loss": 0.0127, "step": 190640 }, { "epoch": 0.96, "learning_rate": 0.00015572193268789317, "loss": 0.0088, "step": 190650 }, { "epoch": 0.96, "learning_rate": 0.00015571436499487918, "loss": 0.0107, "step": 190660 }, { "epoch": 0.96, "learning_rate": 0.00015570679730186516, "loss": 0.0117, "step": 190670 }, { "epoch": 0.96, "learning_rate": 0.00015569922960885114, "loss": 0.0096, "step": 190680 }, { "epoch": 0.96, "learning_rate": 0.00015569166191583715, "loss": 0.0086, "step": 190690 }, { "epoch": 0.96, "learning_rate": 0.00015568409422282313, "loss": 0.0094, "step": 190700 }, { "epoch": 0.96, "learning_rate": 0.0001556765265298091, "loss": 0.0124, "step": 190710 }, { "epoch": 0.96, "learning_rate": 0.00015566895883679512, "loss": 0.0153, "step": 190720 }, { "epoch": 0.96, "learning_rate": 0.0001556613911437811, "loss": 0.0129, "step": 190730 }, { "epoch": 0.96, "learning_rate": 0.00015565382345076708, "loss": 0.0149, "step": 190740 }, { "epoch": 0.96, "learning_rate": 0.0001556462557577531, "loss": 0.0097, "step": 190750 }, { "epoch": 0.96, "learning_rate": 0.00015563868806473907, "loss": 0.0132, "step": 190760 }, { "epoch": 0.96, "learning_rate": 0.00015563112037172505, "loss": 0.0123, "step": 190770 }, { "epoch": 0.96, "learning_rate": 0.00015562355267871106, "loss": 0.0087, "step": 190780 }, { "epoch": 0.96, "learning_rate": 0.00015561598498569704, "loss": 0.0105, "step": 190790 }, { "epoch": 0.96, "learning_rate": 0.00015560841729268302, "loss": 0.011, "step": 190800 }, { "epoch": 0.96, "learning_rate": 0.000155600849599669, "loss": 0.0134, "step": 190810 }, { "epoch": 0.96, "learning_rate": 0.00015559328190665501, "loss": 0.0107, "step": 190820 }, { "epoch": 0.96, "learning_rate": 0.000155585714213641, "loss": 0.0108, "step": 190830 }, { "epoch": 0.96, "learning_rate": 0.00015557814652062698, "loss": 0.0093, "step": 190840 }, { "epoch": 0.96, "learning_rate": 0.00015557057882761299, "loss": 0.0116, "step": 190850 }, { "epoch": 0.96, "learning_rate": 0.00015556301113459897, "loss": 0.0125, "step": 190860 }, { "epoch": 0.96, "learning_rate": 0.00015555544344158495, "loss": 0.0064, "step": 190870 }, { "epoch": 0.96, "learning_rate": 0.00015554787574857096, "loss": 0.0104, "step": 190880 }, { "epoch": 0.96, "learning_rate": 0.00015554030805555694, "loss": 0.0098, "step": 190890 }, { "epoch": 0.96, "learning_rate": 0.00015553274036254292, "loss": 0.0099, "step": 190900 }, { "epoch": 0.96, "learning_rate": 0.00015552517266952893, "loss": 0.0113, "step": 190910 }, { "epoch": 0.96, "learning_rate": 0.0001555176049765149, "loss": 0.0112, "step": 190920 }, { "epoch": 0.96, "learning_rate": 0.0001555100372835009, "loss": 0.0103, "step": 190930 }, { "epoch": 0.96, "learning_rate": 0.0001555024695904869, "loss": 0.0096, "step": 190940 }, { "epoch": 0.96, "learning_rate": 0.00015549490189747288, "loss": 0.0077, "step": 190950 }, { "epoch": 0.96, "learning_rate": 0.00015548733420445886, "loss": 0.0111, "step": 190960 }, { "epoch": 0.96, "learning_rate": 0.00015547976651144487, "loss": 0.0095, "step": 190970 }, { "epoch": 0.96, "learning_rate": 0.00015547219881843085, "loss": 0.0123, "step": 190980 }, { "epoch": 0.96, "learning_rate": 0.00015546463112541683, "loss": 0.0103, "step": 190990 }, { "epoch": 0.96, "learning_rate": 0.00015545706343240282, "loss": 0.0124, "step": 191000 }, { "epoch": 0.96, "eval_cer": 0.9144634631302844, "eval_loss": 0.007862123660743237, "eval_runtime": 115.5241, "eval_samples_per_second": 17.312, "eval_steps_per_second": 4.328, "step": 191000 }, { "epoch": 0.96, "learning_rate": 0.00015544949573938882, "loss": 0.0109, "step": 191010 }, { "epoch": 0.96, "learning_rate": 0.0001554419280463748, "loss": 0.0134, "step": 191020 }, { "epoch": 0.96, "learning_rate": 0.0001554343603533608, "loss": 0.0088, "step": 191030 }, { "epoch": 0.96, "learning_rate": 0.0001554267926603468, "loss": 0.0132, "step": 191040 }, { "epoch": 0.96, "learning_rate": 0.00015541922496733278, "loss": 0.0101, "step": 191050 }, { "epoch": 0.96, "learning_rate": 0.00015541165727431876, "loss": 0.0096, "step": 191060 }, { "epoch": 0.96, "learning_rate": 0.00015540408958130477, "loss": 0.012, "step": 191070 }, { "epoch": 0.96, "learning_rate": 0.00015539652188829075, "loss": 0.0157, "step": 191080 }, { "epoch": 0.96, "learning_rate": 0.00015538895419527673, "loss": 0.0133, "step": 191090 }, { "epoch": 0.96, "learning_rate": 0.00015538138650226274, "loss": 0.0113, "step": 191100 }, { "epoch": 0.96, "learning_rate": 0.00015537381880924872, "loss": 0.0111, "step": 191110 }, { "epoch": 0.96, "learning_rate": 0.0001553662511162347, "loss": 0.0125, "step": 191120 }, { "epoch": 0.96, "learning_rate": 0.0001553586834232207, "loss": 0.0174, "step": 191130 }, { "epoch": 0.96, "learning_rate": 0.0001553511157302067, "loss": 0.0111, "step": 191140 }, { "epoch": 0.96, "learning_rate": 0.00015534354803719267, "loss": 0.0113, "step": 191150 }, { "epoch": 0.96, "learning_rate": 0.00015533598034417865, "loss": 0.0129, "step": 191160 }, { "epoch": 0.96, "learning_rate": 0.00015532841265116466, "loss": 0.0097, "step": 191170 }, { "epoch": 0.96, "learning_rate": 0.00015532084495815064, "loss": 0.0103, "step": 191180 }, { "epoch": 0.96, "learning_rate": 0.00015531327726513663, "loss": 0.0137, "step": 191190 }, { "epoch": 0.96, "learning_rate": 0.00015530570957212263, "loss": 0.0101, "step": 191200 }, { "epoch": 0.96, "learning_rate": 0.00015529814187910862, "loss": 0.0096, "step": 191210 }, { "epoch": 0.96, "learning_rate": 0.0001552905741860946, "loss": 0.0109, "step": 191220 }, { "epoch": 0.96, "learning_rate": 0.0001552830064930806, "loss": 0.0105, "step": 191230 }, { "epoch": 0.96, "learning_rate": 0.0001552754388000666, "loss": 0.0102, "step": 191240 }, { "epoch": 0.96, "learning_rate": 0.00015526787110705257, "loss": 0.0149, "step": 191250 }, { "epoch": 0.96, "learning_rate": 0.00015526030341403858, "loss": 0.014, "step": 191260 }, { "epoch": 0.96, "learning_rate": 0.00015525273572102456, "loss": 0.0121, "step": 191270 }, { "epoch": 0.97, "learning_rate": 0.00015524516802801054, "loss": 0.0118, "step": 191280 }, { "epoch": 0.97, "learning_rate": 0.00015523760033499655, "loss": 0.0139, "step": 191290 }, { "epoch": 0.97, "learning_rate": 0.00015523003264198253, "loss": 0.0105, "step": 191300 }, { "epoch": 0.97, "learning_rate": 0.0001552224649489685, "loss": 0.0109, "step": 191310 }, { "epoch": 0.97, "learning_rate": 0.0001552148972559545, "loss": 0.0119, "step": 191320 }, { "epoch": 0.97, "learning_rate": 0.0001552073295629405, "loss": 0.0111, "step": 191330 }, { "epoch": 0.97, "learning_rate": 0.00015519976186992648, "loss": 0.0105, "step": 191340 }, { "epoch": 0.97, "learning_rate": 0.00015519219417691247, "loss": 0.0094, "step": 191350 }, { "epoch": 0.97, "learning_rate": 0.00015518462648389847, "loss": 0.0137, "step": 191360 }, { "epoch": 0.97, "learning_rate": 0.00015517705879088446, "loss": 0.0113, "step": 191370 }, { "epoch": 0.97, "learning_rate": 0.00015516949109787044, "loss": 0.0098, "step": 191380 }, { "epoch": 0.97, "learning_rate": 0.00015516192340485645, "loss": 0.0133, "step": 191390 }, { "epoch": 0.97, "learning_rate": 0.00015515435571184243, "loss": 0.0125, "step": 191400 }, { "epoch": 0.97, "learning_rate": 0.0001551467880188284, "loss": 0.0124, "step": 191410 }, { "epoch": 0.97, "learning_rate": 0.00015513922032581442, "loss": 0.0136, "step": 191420 }, { "epoch": 0.97, "learning_rate": 0.0001551316526328004, "loss": 0.015, "step": 191430 }, { "epoch": 0.97, "learning_rate": 0.00015512408493978638, "loss": 0.0105, "step": 191440 }, { "epoch": 0.97, "learning_rate": 0.0001551165172467724, "loss": 0.0105, "step": 191450 }, { "epoch": 0.97, "learning_rate": 0.00015510894955375837, "loss": 0.0118, "step": 191460 }, { "epoch": 0.97, "learning_rate": 0.00015510138186074435, "loss": 0.0096, "step": 191470 }, { "epoch": 0.97, "learning_rate": 0.00015509381416773036, "loss": 0.0122, "step": 191480 }, { "epoch": 0.97, "learning_rate": 0.00015508624647471634, "loss": 0.0097, "step": 191490 }, { "epoch": 0.97, "learning_rate": 0.00015507867878170232, "loss": 0.0143, "step": 191500 }, { "epoch": 0.97, "learning_rate": 0.0001550711110886883, "loss": 0.0116, "step": 191510 }, { "epoch": 0.97, "learning_rate": 0.0001550635433956743, "loss": 0.0118, "step": 191520 }, { "epoch": 0.97, "learning_rate": 0.0001550559757026603, "loss": 0.0116, "step": 191530 }, { "epoch": 0.97, "learning_rate": 0.00015504840800964628, "loss": 0.0128, "step": 191540 }, { "epoch": 0.97, "learning_rate": 0.00015504084031663228, "loss": 0.0136, "step": 191550 }, { "epoch": 0.97, "learning_rate": 0.00015503327262361827, "loss": 0.01, "step": 191560 }, { "epoch": 0.97, "learning_rate": 0.00015502570493060425, "loss": 0.0093, "step": 191570 }, { "epoch": 0.97, "learning_rate": 0.00015501813723759026, "loss": 0.0115, "step": 191580 }, { "epoch": 0.97, "learning_rate": 0.00015501056954457624, "loss": 0.0097, "step": 191590 }, { "epoch": 0.97, "learning_rate": 0.00015500300185156222, "loss": 0.0102, "step": 191600 }, { "epoch": 0.97, "learning_rate": 0.00015499543415854823, "loss": 0.0102, "step": 191610 }, { "epoch": 0.97, "learning_rate": 0.0001549878664655342, "loss": 0.0096, "step": 191620 }, { "epoch": 0.97, "learning_rate": 0.0001549802987725202, "loss": 0.0115, "step": 191630 }, { "epoch": 0.97, "learning_rate": 0.0001549727310795062, "loss": 0.0141, "step": 191640 }, { "epoch": 0.97, "learning_rate": 0.00015496516338649218, "loss": 0.0089, "step": 191650 }, { "epoch": 0.97, "learning_rate": 0.00015495759569347816, "loss": 0.0128, "step": 191660 }, { "epoch": 0.97, "learning_rate": 0.00015495002800046414, "loss": 0.0102, "step": 191670 }, { "epoch": 0.97, "learning_rate": 0.00015494246030745012, "loss": 0.0107, "step": 191680 }, { "epoch": 0.97, "learning_rate": 0.0001549348926144361, "loss": 0.0121, "step": 191690 }, { "epoch": 0.97, "learning_rate": 0.0001549273249214221, "loss": 0.0103, "step": 191700 }, { "epoch": 0.97, "learning_rate": 0.00015491975722840807, "loss": 0.011, "step": 191710 }, { "epoch": 0.97, "learning_rate": 0.00015491218953539408, "loss": 0.0096, "step": 191720 }, { "epoch": 0.97, "learning_rate": 0.00015490462184238006, "loss": 0.0097, "step": 191730 }, { "epoch": 0.97, "learning_rate": 0.00015489705414936604, "loss": 0.0122, "step": 191740 }, { "epoch": 0.97, "learning_rate": 0.00015488948645635205, "loss": 0.0105, "step": 191750 }, { "epoch": 0.97, "learning_rate": 0.00015488191876333803, "loss": 0.0092, "step": 191760 }, { "epoch": 0.97, "learning_rate": 0.000154874351070324, "loss": 0.012, "step": 191770 }, { "epoch": 0.97, "learning_rate": 0.00015486678337731002, "loss": 0.0089, "step": 191780 }, { "epoch": 0.97, "learning_rate": 0.000154859215684296, "loss": 0.0121, "step": 191790 }, { "epoch": 0.97, "learning_rate": 0.00015485164799128198, "loss": 0.0087, "step": 191800 }, { "epoch": 0.97, "learning_rate": 0.000154844080298268, "loss": 0.0121, "step": 191810 }, { "epoch": 0.97, "learning_rate": 0.00015483651260525397, "loss": 0.0108, "step": 191820 }, { "epoch": 0.97, "learning_rate": 0.00015482894491223995, "loss": 0.0094, "step": 191830 }, { "epoch": 0.97, "learning_rate": 0.00015482137721922596, "loss": 0.0091, "step": 191840 }, { "epoch": 0.97, "learning_rate": 0.00015481380952621194, "loss": 0.0105, "step": 191850 }, { "epoch": 0.97, "learning_rate": 0.00015480624183319793, "loss": 0.0096, "step": 191860 }, { "epoch": 0.97, "learning_rate": 0.00015479867414018393, "loss": 0.0118, "step": 191870 }, { "epoch": 0.97, "learning_rate": 0.00015479110644716992, "loss": 0.0118, "step": 191880 }, { "epoch": 0.97, "learning_rate": 0.0001547835387541559, "loss": 0.0119, "step": 191890 }, { "epoch": 0.97, "learning_rate": 0.00015477597106114188, "loss": 0.0101, "step": 191900 }, { "epoch": 0.97, "learning_rate": 0.0001547684033681279, "loss": 0.0118, "step": 191910 }, { "epoch": 0.97, "learning_rate": 0.00015476083567511387, "loss": 0.0104, "step": 191920 }, { "epoch": 0.97, "learning_rate": 0.00015475326798209985, "loss": 0.0099, "step": 191930 }, { "epoch": 0.97, "learning_rate": 0.00015474570028908586, "loss": 0.0072, "step": 191940 }, { "epoch": 0.97, "learning_rate": 0.00015473813259607184, "loss": 0.0123, "step": 191950 }, { "epoch": 0.97, "learning_rate": 0.00015473056490305782, "loss": 0.0141, "step": 191960 }, { "epoch": 0.97, "learning_rate": 0.00015472299721004383, "loss": 0.012, "step": 191970 }, { "epoch": 0.97, "learning_rate": 0.0001547154295170298, "loss": 0.0118, "step": 191980 }, { "epoch": 0.97, "learning_rate": 0.0001547078618240158, "loss": 0.0105, "step": 191990 }, { "epoch": 0.97, "learning_rate": 0.0001547002941310018, "loss": 0.0106, "step": 192000 }, { "epoch": 0.97, "eval_cer": 0.9144411440194001, "eval_loss": 0.008027549833059311, "eval_runtime": 116.6747, "eval_samples_per_second": 17.142, "eval_steps_per_second": 4.285, "step": 192000 }, { "epoch": 0.97, "learning_rate": 0.00015469272643798778, "loss": 0.0119, "step": 192010 }, { "epoch": 0.97, "learning_rate": 0.00015468515874497376, "loss": 0.0099, "step": 192020 }, { "epoch": 0.97, "learning_rate": 0.00015467759105195977, "loss": 0.0094, "step": 192030 }, { "epoch": 0.97, "learning_rate": 0.00015467002335894575, "loss": 0.008, "step": 192040 }, { "epoch": 0.97, "learning_rate": 0.00015466245566593174, "loss": 0.0118, "step": 192050 }, { "epoch": 0.97, "learning_rate": 0.00015465488797291772, "loss": 0.0108, "step": 192060 }, { "epoch": 0.97, "learning_rate": 0.00015464732027990373, "loss": 0.0099, "step": 192070 }, { "epoch": 0.97, "learning_rate": 0.0001546397525868897, "loss": 0.0101, "step": 192080 }, { "epoch": 0.97, "learning_rate": 0.0001546321848938757, "loss": 0.0125, "step": 192090 }, { "epoch": 0.97, "learning_rate": 0.0001546246172008617, "loss": 0.0163, "step": 192100 }, { "epoch": 0.97, "learning_rate": 0.00015461704950784768, "loss": 0.0126, "step": 192110 }, { "epoch": 0.97, "learning_rate": 0.00015460948181483366, "loss": 0.0115, "step": 192120 }, { "epoch": 0.97, "learning_rate": 0.00015460191412181967, "loss": 0.0102, "step": 192130 }, { "epoch": 0.97, "learning_rate": 0.00015459434642880565, "loss": 0.0107, "step": 192140 }, { "epoch": 0.97, "learning_rate": 0.00015458677873579163, "loss": 0.0112, "step": 192150 }, { "epoch": 0.97, "learning_rate": 0.00015457921104277764, "loss": 0.0111, "step": 192160 }, { "epoch": 0.97, "learning_rate": 0.00015457164334976362, "loss": 0.0125, "step": 192170 }, { "epoch": 0.97, "learning_rate": 0.0001545640756567496, "loss": 0.0113, "step": 192180 }, { "epoch": 0.97, "learning_rate": 0.0001545565079637356, "loss": 0.0102, "step": 192190 }, { "epoch": 0.97, "learning_rate": 0.0001545489402707216, "loss": 0.0126, "step": 192200 }, { "epoch": 0.97, "learning_rate": 0.00015454137257770757, "loss": 0.0102, "step": 192210 }, { "epoch": 0.97, "learning_rate": 0.00015453380488469356, "loss": 0.0116, "step": 192220 }, { "epoch": 0.97, "learning_rate": 0.00015452623719167956, "loss": 0.0105, "step": 192230 }, { "epoch": 0.97, "learning_rate": 0.00015451866949866555, "loss": 0.0082, "step": 192240 }, { "epoch": 0.97, "learning_rate": 0.00015451110180565153, "loss": 0.0119, "step": 192250 }, { "epoch": 0.97, "learning_rate": 0.00015450353411263754, "loss": 0.0085, "step": 192260 }, { "epoch": 0.97, "learning_rate": 0.00015449596641962352, "loss": 0.0105, "step": 192270 }, { "epoch": 0.97, "learning_rate": 0.0001544883987266095, "loss": 0.0113, "step": 192280 }, { "epoch": 0.97, "learning_rate": 0.0001544808310335955, "loss": 0.0121, "step": 192290 }, { "epoch": 0.97, "learning_rate": 0.0001544732633405815, "loss": 0.0097, "step": 192300 }, { "epoch": 0.97, "learning_rate": 0.00015446569564756747, "loss": 0.0103, "step": 192310 }, { "epoch": 0.97, "learning_rate": 0.00015445812795455348, "loss": 0.0088, "step": 192320 }, { "epoch": 0.97, "learning_rate": 0.00015445056026153946, "loss": 0.0123, "step": 192330 }, { "epoch": 0.97, "learning_rate": 0.00015444299256852544, "loss": 0.0099, "step": 192340 }, { "epoch": 0.97, "learning_rate": 0.00015443542487551145, "loss": 0.009, "step": 192350 }, { "epoch": 0.97, "learning_rate": 0.00015442785718249743, "loss": 0.0097, "step": 192360 }, { "epoch": 0.97, "learning_rate": 0.0001544202894894834, "loss": 0.0091, "step": 192370 }, { "epoch": 0.97, "learning_rate": 0.00015441272179646942, "loss": 0.0096, "step": 192380 }, { "epoch": 0.97, "learning_rate": 0.0001544051541034554, "loss": 0.0127, "step": 192390 }, { "epoch": 0.97, "learning_rate": 0.00015439758641044138, "loss": 0.0105, "step": 192400 }, { "epoch": 0.97, "learning_rate": 0.00015439001871742737, "loss": 0.0099, "step": 192410 }, { "epoch": 0.97, "learning_rate": 0.00015438245102441337, "loss": 0.0112, "step": 192420 }, { "epoch": 0.97, "learning_rate": 0.00015437488333139936, "loss": 0.012, "step": 192430 }, { "epoch": 0.97, "learning_rate": 0.00015436731563838534, "loss": 0.0103, "step": 192440 }, { "epoch": 0.97, "learning_rate": 0.00015435974794537135, "loss": 0.0123, "step": 192450 }, { "epoch": 0.97, "learning_rate": 0.00015435218025235733, "loss": 0.0104, "step": 192460 }, { "epoch": 0.97, "learning_rate": 0.0001543446125593433, "loss": 0.0112, "step": 192470 }, { "epoch": 0.97, "learning_rate": 0.00015433704486632932, "loss": 0.0115, "step": 192480 }, { "epoch": 0.97, "learning_rate": 0.0001543294771733153, "loss": 0.0091, "step": 192490 }, { "epoch": 0.97, "learning_rate": 0.00015432190948030128, "loss": 0.0106, "step": 192500 }, { "epoch": 0.97, "learning_rate": 0.0001543143417872873, "loss": 0.0088, "step": 192510 }, { "epoch": 0.97, "learning_rate": 0.00015430677409427327, "loss": 0.0106, "step": 192520 }, { "epoch": 0.97, "learning_rate": 0.00015429920640125925, "loss": 0.0108, "step": 192530 }, { "epoch": 0.97, "learning_rate": 0.00015429163870824526, "loss": 0.0144, "step": 192540 }, { "epoch": 0.97, "learning_rate": 0.00015428407101523124, "loss": 0.0077, "step": 192550 }, { "epoch": 0.97, "learning_rate": 0.00015427650332221722, "loss": 0.0112, "step": 192560 }, { "epoch": 0.97, "learning_rate": 0.0001542689356292032, "loss": 0.0129, "step": 192570 }, { "epoch": 0.97, "learning_rate": 0.0001542613679361892, "loss": 0.007, "step": 192580 }, { "epoch": 0.97, "learning_rate": 0.0001542538002431752, "loss": 0.0119, "step": 192590 }, { "epoch": 0.97, "learning_rate": 0.00015424623255016118, "loss": 0.0097, "step": 192600 }, { "epoch": 0.97, "learning_rate": 0.00015423866485714718, "loss": 0.0095, "step": 192610 }, { "epoch": 0.97, "learning_rate": 0.00015423109716413317, "loss": 0.0093, "step": 192620 }, { "epoch": 0.97, "learning_rate": 0.00015422352947111915, "loss": 0.0111, "step": 192630 }, { "epoch": 0.97, "learning_rate": 0.00015421596177810516, "loss": 0.0098, "step": 192640 }, { "epoch": 0.97, "learning_rate": 0.00015420839408509114, "loss": 0.0118, "step": 192650 }, { "epoch": 0.97, "learning_rate": 0.00015420082639207712, "loss": 0.0117, "step": 192660 }, { "epoch": 0.97, "learning_rate": 0.00015419325869906313, "loss": 0.0115, "step": 192670 }, { "epoch": 0.97, "learning_rate": 0.0001541856910060491, "loss": 0.01, "step": 192680 }, { "epoch": 0.97, "learning_rate": 0.0001541781233130351, "loss": 0.0101, "step": 192690 }, { "epoch": 0.97, "learning_rate": 0.0001541705556200211, "loss": 0.012, "step": 192700 }, { "epoch": 0.97, "learning_rate": 0.00015416298792700708, "loss": 0.0107, "step": 192710 }, { "epoch": 0.97, "learning_rate": 0.00015415542023399306, "loss": 0.012, "step": 192720 }, { "epoch": 0.97, "learning_rate": 0.00015414785254097904, "loss": 0.0115, "step": 192730 }, { "epoch": 0.97, "learning_rate": 0.00015414028484796505, "loss": 0.0107, "step": 192740 }, { "epoch": 0.97, "learning_rate": 0.00015413271715495103, "loss": 0.0091, "step": 192750 }, { "epoch": 0.97, "learning_rate": 0.00015412514946193701, "loss": 0.009, "step": 192760 }, { "epoch": 0.97, "learning_rate": 0.00015411758176892302, "loss": 0.0102, "step": 192770 }, { "epoch": 0.97, "learning_rate": 0.000154110014075909, "loss": 0.0153, "step": 192780 }, { "epoch": 0.97, "learning_rate": 0.00015410244638289499, "loss": 0.0095, "step": 192790 }, { "epoch": 0.97, "learning_rate": 0.000154094878689881, "loss": 0.01, "step": 192800 }, { "epoch": 0.97, "learning_rate": 0.00015408731099686698, "loss": 0.0119, "step": 192810 }, { "epoch": 0.97, "learning_rate": 0.00015407974330385296, "loss": 0.0095, "step": 192820 }, { "epoch": 0.97, "learning_rate": 0.00015407217561083897, "loss": 0.0129, "step": 192830 }, { "epoch": 0.97, "learning_rate": 0.00015406460791782495, "loss": 0.0119, "step": 192840 }, { "epoch": 0.97, "learning_rate": 0.00015405704022481093, "loss": 0.0105, "step": 192850 }, { "epoch": 0.97, "learning_rate": 0.00015404947253179694, "loss": 0.012, "step": 192860 }, { "epoch": 0.97, "learning_rate": 0.00015404190483878292, "loss": 0.0119, "step": 192870 }, { "epoch": 0.97, "learning_rate": 0.0001540343371457689, "loss": 0.0109, "step": 192880 }, { "epoch": 0.97, "learning_rate": 0.00015402676945275488, "loss": 0.0098, "step": 192890 }, { "epoch": 0.97, "learning_rate": 0.0001540192017597409, "loss": 0.0125, "step": 192900 }, { "epoch": 0.97, "learning_rate": 0.00015401163406672687, "loss": 0.0094, "step": 192910 }, { "epoch": 0.97, "learning_rate": 0.00015400406637371285, "loss": 0.0079, "step": 192920 }, { "epoch": 0.97, "learning_rate": 0.00015399649868069886, "loss": 0.0101, "step": 192930 }, { "epoch": 0.97, "learning_rate": 0.00015398893098768482, "loss": 0.01, "step": 192940 }, { "epoch": 0.97, "learning_rate": 0.0001539813632946708, "loss": 0.0104, "step": 192950 }, { "epoch": 0.97, "learning_rate": 0.00015397379560165678, "loss": 0.0133, "step": 192960 }, { "epoch": 0.97, "learning_rate": 0.0001539662279086428, "loss": 0.008, "step": 192970 }, { "epoch": 0.97, "learning_rate": 0.00015395866021562877, "loss": 0.0126, "step": 192980 }, { "epoch": 0.97, "learning_rate": 0.00015395109252261475, "loss": 0.009, "step": 192990 }, { "epoch": 0.97, "learning_rate": 0.00015394352482960076, "loss": 0.0111, "step": 193000 }, { "epoch": 0.97, "eval_cer": 0.9144644335264098, "eval_loss": 0.008065390400588512, "eval_runtime": 116.6291, "eval_samples_per_second": 17.148, "eval_steps_per_second": 4.287, "step": 193000 }, { "epoch": 0.97, "learning_rate": 0.00015393595713658674, "loss": 0.012, "step": 193010 }, { "epoch": 0.97, "learning_rate": 0.00015392838944357272, "loss": 0.0106, "step": 193020 }, { "epoch": 0.97, "learning_rate": 0.00015392082175055873, "loss": 0.0099, "step": 193030 }, { "epoch": 0.97, "learning_rate": 0.0001539132540575447, "loss": 0.0106, "step": 193040 }, { "epoch": 0.97, "learning_rate": 0.0001539056863645307, "loss": 0.0093, "step": 193050 }, { "epoch": 0.97, "learning_rate": 0.0001538981186715167, "loss": 0.0099, "step": 193060 }, { "epoch": 0.97, "learning_rate": 0.00015389055097850268, "loss": 0.0127, "step": 193070 }, { "epoch": 0.97, "learning_rate": 0.00015388298328548866, "loss": 0.0098, "step": 193080 }, { "epoch": 0.97, "learning_rate": 0.00015387541559247467, "loss": 0.0118, "step": 193090 }, { "epoch": 0.97, "learning_rate": 0.00015386784789946065, "loss": 0.0098, "step": 193100 }, { "epoch": 0.97, "learning_rate": 0.00015386028020644664, "loss": 0.0134, "step": 193110 }, { "epoch": 0.97, "learning_rate": 0.00015385271251343262, "loss": 0.0149, "step": 193120 }, { "epoch": 0.97, "learning_rate": 0.00015384514482041863, "loss": 0.0102, "step": 193130 }, { "epoch": 0.97, "learning_rate": 0.0001538375771274046, "loss": 0.012, "step": 193140 }, { "epoch": 0.97, "learning_rate": 0.0001538300094343906, "loss": 0.0105, "step": 193150 }, { "epoch": 0.97, "learning_rate": 0.0001538224417413766, "loss": 0.0114, "step": 193160 }, { "epoch": 0.97, "learning_rate": 0.00015381487404836258, "loss": 0.0105, "step": 193170 }, { "epoch": 0.97, "learning_rate": 0.00015380730635534856, "loss": 0.0096, "step": 193180 }, { "epoch": 0.97, "learning_rate": 0.00015379973866233457, "loss": 0.0123, "step": 193190 }, { "epoch": 0.97, "learning_rate": 0.00015379217096932055, "loss": 0.0125, "step": 193200 }, { "epoch": 0.97, "learning_rate": 0.00015378460327630653, "loss": 0.0095, "step": 193210 }, { "epoch": 0.97, "learning_rate": 0.00015377703558329254, "loss": 0.0122, "step": 193220 }, { "epoch": 0.97, "learning_rate": 0.00015376946789027852, "loss": 0.0094, "step": 193230 }, { "epoch": 0.97, "learning_rate": 0.0001537619001972645, "loss": 0.0091, "step": 193240 }, { "epoch": 0.97, "learning_rate": 0.0001537543325042505, "loss": 0.0111, "step": 193250 }, { "epoch": 0.98, "learning_rate": 0.0001537467648112365, "loss": 0.0102, "step": 193260 }, { "epoch": 0.98, "learning_rate": 0.00015373919711822247, "loss": 0.0114, "step": 193270 }, { "epoch": 0.98, "learning_rate": 0.00015373162942520846, "loss": 0.0129, "step": 193280 }, { "epoch": 0.98, "learning_rate": 0.00015372406173219446, "loss": 0.0123, "step": 193290 }, { "epoch": 0.98, "learning_rate": 0.00015371649403918045, "loss": 0.0087, "step": 193300 }, { "epoch": 0.98, "learning_rate": 0.00015370892634616643, "loss": 0.0124, "step": 193310 }, { "epoch": 0.98, "learning_rate": 0.00015370135865315244, "loss": 0.0096, "step": 193320 }, { "epoch": 0.98, "learning_rate": 0.00015369379096013842, "loss": 0.012, "step": 193330 }, { "epoch": 0.98, "learning_rate": 0.0001536862232671244, "loss": 0.0097, "step": 193340 }, { "epoch": 0.98, "learning_rate": 0.0001536786555741104, "loss": 0.0152, "step": 193350 }, { "epoch": 0.98, "learning_rate": 0.0001536710878810964, "loss": 0.012, "step": 193360 }, { "epoch": 0.98, "learning_rate": 0.00015366352018808237, "loss": 0.0105, "step": 193370 }, { "epoch": 0.98, "learning_rate": 0.00015365595249506838, "loss": 0.012, "step": 193380 }, { "epoch": 0.98, "learning_rate": 0.00015364838480205436, "loss": 0.0124, "step": 193390 }, { "epoch": 0.98, "learning_rate": 0.00015364081710904034, "loss": 0.0136, "step": 193400 }, { "epoch": 0.98, "learning_rate": 0.00015363324941602635, "loss": 0.0138, "step": 193410 }, { "epoch": 0.98, "learning_rate": 0.00015362568172301233, "loss": 0.0086, "step": 193420 }, { "epoch": 0.98, "learning_rate": 0.0001536181140299983, "loss": 0.013, "step": 193430 }, { "epoch": 0.98, "learning_rate": 0.00015361054633698432, "loss": 0.0126, "step": 193440 }, { "epoch": 0.98, "learning_rate": 0.0001536029786439703, "loss": 0.012, "step": 193450 }, { "epoch": 0.98, "learning_rate": 0.00015359541095095628, "loss": 0.0092, "step": 193460 }, { "epoch": 0.98, "learning_rate": 0.00015358784325794227, "loss": 0.0109, "step": 193470 }, { "epoch": 0.98, "learning_rate": 0.00015358027556492827, "loss": 0.009, "step": 193480 }, { "epoch": 0.98, "learning_rate": 0.00015357270787191426, "loss": 0.008, "step": 193490 }, { "epoch": 0.98, "learning_rate": 0.00015356514017890024, "loss": 0.0128, "step": 193500 }, { "epoch": 0.98, "learning_rate": 0.00015355757248588625, "loss": 0.0126, "step": 193510 }, { "epoch": 0.98, "learning_rate": 0.00015355000479287223, "loss": 0.0099, "step": 193520 }, { "epoch": 0.98, "learning_rate": 0.0001535424370998582, "loss": 0.0096, "step": 193530 }, { "epoch": 0.98, "learning_rate": 0.00015353486940684422, "loss": 0.015, "step": 193540 }, { "epoch": 0.98, "learning_rate": 0.0001535273017138302, "loss": 0.0099, "step": 193550 }, { "epoch": 0.98, "learning_rate": 0.00015351973402081618, "loss": 0.0115, "step": 193560 }, { "epoch": 0.98, "learning_rate": 0.0001535121663278022, "loss": 0.0111, "step": 193570 }, { "epoch": 0.98, "learning_rate": 0.00015350459863478817, "loss": 0.0124, "step": 193580 }, { "epoch": 0.98, "learning_rate": 0.00015349703094177415, "loss": 0.0122, "step": 193590 }, { "epoch": 0.98, "learning_rate": 0.00015348946324876016, "loss": 0.0093, "step": 193600 }, { "epoch": 0.98, "learning_rate": 0.00015348189555574614, "loss": 0.0123, "step": 193610 }, { "epoch": 0.98, "learning_rate": 0.00015347432786273212, "loss": 0.0137, "step": 193620 }, { "epoch": 0.98, "learning_rate": 0.0001534667601697181, "loss": 0.0125, "step": 193630 }, { "epoch": 0.98, "learning_rate": 0.0001534591924767041, "loss": 0.0102, "step": 193640 }, { "epoch": 0.98, "learning_rate": 0.0001534516247836901, "loss": 0.0126, "step": 193650 }, { "epoch": 0.98, "learning_rate": 0.00015344405709067608, "loss": 0.0097, "step": 193660 }, { "epoch": 0.98, "learning_rate": 0.00015343648939766208, "loss": 0.009, "step": 193670 }, { "epoch": 0.98, "learning_rate": 0.00015342892170464807, "loss": 0.0105, "step": 193680 }, { "epoch": 0.98, "learning_rate": 0.00015342135401163405, "loss": 0.0094, "step": 193690 }, { "epoch": 0.98, "learning_rate": 0.00015341378631862006, "loss": 0.0143, "step": 193700 }, { "epoch": 0.98, "learning_rate": 0.00015340621862560604, "loss": 0.0107, "step": 193710 }, { "epoch": 0.98, "learning_rate": 0.00015339865093259202, "loss": 0.01, "step": 193720 }, { "epoch": 0.98, "learning_rate": 0.00015339108323957803, "loss": 0.0105, "step": 193730 }, { "epoch": 0.98, "learning_rate": 0.000153383515546564, "loss": 0.0106, "step": 193740 }, { "epoch": 0.98, "learning_rate": 0.00015337594785355, "loss": 0.0155, "step": 193750 }, { "epoch": 0.98, "learning_rate": 0.000153368380160536, "loss": 0.0095, "step": 193760 }, { "epoch": 0.98, "learning_rate": 0.00015336081246752198, "loss": 0.0122, "step": 193770 }, { "epoch": 0.98, "learning_rate": 0.00015335324477450796, "loss": 0.0157, "step": 193780 }, { "epoch": 0.98, "learning_rate": 0.00015334567708149394, "loss": 0.0108, "step": 193790 }, { "epoch": 0.98, "learning_rate": 0.00015333810938847995, "loss": 0.0107, "step": 193800 }, { "epoch": 0.98, "learning_rate": 0.00015333054169546593, "loss": 0.0117, "step": 193810 }, { "epoch": 0.98, "learning_rate": 0.00015332297400245191, "loss": 0.0104, "step": 193820 }, { "epoch": 0.98, "learning_rate": 0.00015331540630943792, "loss": 0.0082, "step": 193830 }, { "epoch": 0.98, "learning_rate": 0.0001533078386164239, "loss": 0.0086, "step": 193840 }, { "epoch": 0.98, "learning_rate": 0.00015330027092340989, "loss": 0.0109, "step": 193850 }, { "epoch": 0.98, "learning_rate": 0.0001532927032303959, "loss": 0.0091, "step": 193860 }, { "epoch": 0.98, "learning_rate": 0.00015328513553738188, "loss": 0.0115, "step": 193870 }, { "epoch": 0.98, "learning_rate": 0.00015327756784436786, "loss": 0.0104, "step": 193880 }, { "epoch": 0.98, "learning_rate": 0.00015327000015135387, "loss": 0.013, "step": 193890 }, { "epoch": 0.98, "learning_rate": 0.00015326243245833985, "loss": 0.0127, "step": 193900 }, { "epoch": 0.98, "learning_rate": 0.00015325486476532583, "loss": 0.0122, "step": 193910 }, { "epoch": 0.98, "learning_rate": 0.00015324729707231184, "loss": 0.0101, "step": 193920 }, { "epoch": 0.98, "learning_rate": 0.00015323972937929782, "loss": 0.0115, "step": 193930 }, { "epoch": 0.98, "learning_rate": 0.0001532321616862838, "loss": 0.0139, "step": 193940 }, { "epoch": 0.98, "learning_rate": 0.0001532245939932698, "loss": 0.0138, "step": 193950 }, { "epoch": 0.98, "learning_rate": 0.0001532170263002558, "loss": 0.0119, "step": 193960 }, { "epoch": 0.98, "learning_rate": 0.00015320945860724177, "loss": 0.0128, "step": 193970 }, { "epoch": 0.98, "learning_rate": 0.00015320189091422775, "loss": 0.0111, "step": 193980 }, { "epoch": 0.98, "learning_rate": 0.00015319432322121376, "loss": 0.012, "step": 193990 }, { "epoch": 0.98, "learning_rate": 0.00015318675552819974, "loss": 0.0134, "step": 194000 }, { "epoch": 0.98, "eval_cer": 0.9144683151109114, "eval_loss": 0.007887054234743118, "eval_runtime": 116.7404, "eval_samples_per_second": 17.132, "eval_steps_per_second": 4.283, "step": 194000 }, { "epoch": 0.98, "learning_rate": 0.00015317918783518572, "loss": 0.0082, "step": 194010 }, { "epoch": 0.98, "learning_rate": 0.00015317162014217173, "loss": 0.0086, "step": 194020 }, { "epoch": 0.98, "learning_rate": 0.00015316405244915771, "loss": 0.0106, "step": 194030 }, { "epoch": 0.98, "learning_rate": 0.0001531564847561437, "loss": 0.0085, "step": 194040 }, { "epoch": 0.98, "learning_rate": 0.0001531489170631297, "loss": 0.0112, "step": 194050 }, { "epoch": 0.98, "learning_rate": 0.00015314134937011569, "loss": 0.0109, "step": 194060 }, { "epoch": 0.98, "learning_rate": 0.00015313378167710167, "loss": 0.0111, "step": 194070 }, { "epoch": 0.98, "learning_rate": 0.00015312621398408768, "loss": 0.0089, "step": 194080 }, { "epoch": 0.98, "learning_rate": 0.00015311864629107366, "loss": 0.0121, "step": 194090 }, { "epoch": 0.98, "learning_rate": 0.00015311107859805964, "loss": 0.0137, "step": 194100 }, { "epoch": 0.98, "learning_rate": 0.00015310351090504565, "loss": 0.0094, "step": 194110 }, { "epoch": 0.98, "learning_rate": 0.00015309594321203163, "loss": 0.0129, "step": 194120 }, { "epoch": 0.98, "learning_rate": 0.0001530883755190176, "loss": 0.0112, "step": 194130 }, { "epoch": 0.98, "learning_rate": 0.0001530808078260036, "loss": 0.0109, "step": 194140 }, { "epoch": 0.98, "learning_rate": 0.0001530732401329896, "loss": 0.0101, "step": 194150 }, { "epoch": 0.98, "learning_rate": 0.00015306567243997558, "loss": 0.0143, "step": 194160 }, { "epoch": 0.98, "learning_rate": 0.00015305810474696156, "loss": 0.0102, "step": 194170 }, { "epoch": 0.98, "learning_rate": 0.00015305053705394757, "loss": 0.0096, "step": 194180 }, { "epoch": 0.98, "learning_rate": 0.00015304296936093353, "loss": 0.0097, "step": 194190 }, { "epoch": 0.98, "learning_rate": 0.0001530354016679195, "loss": 0.0104, "step": 194200 }, { "epoch": 0.98, "learning_rate": 0.0001530278339749055, "loss": 0.0098, "step": 194210 }, { "epoch": 0.98, "learning_rate": 0.0001530202662818915, "loss": 0.0093, "step": 194220 }, { "epoch": 0.98, "learning_rate": 0.00015301269858887748, "loss": 0.0117, "step": 194230 }, { "epoch": 0.98, "learning_rate": 0.00015300513089586346, "loss": 0.0089, "step": 194240 }, { "epoch": 0.98, "learning_rate": 0.00015299756320284947, "loss": 0.0105, "step": 194250 }, { "epoch": 0.98, "learning_rate": 0.00015298999550983545, "loss": 0.0093, "step": 194260 }, { "epoch": 0.98, "learning_rate": 0.00015298242781682143, "loss": 0.0135, "step": 194270 }, { "epoch": 0.98, "learning_rate": 0.00015297486012380744, "loss": 0.0088, "step": 194280 }, { "epoch": 0.98, "learning_rate": 0.00015296729243079342, "loss": 0.0123, "step": 194290 }, { "epoch": 0.98, "learning_rate": 0.0001529597247377794, "loss": 0.0091, "step": 194300 }, { "epoch": 0.98, "learning_rate": 0.0001529521570447654, "loss": 0.0092, "step": 194310 }, { "epoch": 0.98, "learning_rate": 0.0001529445893517514, "loss": 0.0111, "step": 194320 }, { "epoch": 0.98, "learning_rate": 0.00015293702165873737, "loss": 0.0114, "step": 194330 }, { "epoch": 0.98, "learning_rate": 0.00015292945396572338, "loss": 0.012, "step": 194340 }, { "epoch": 0.98, "learning_rate": 0.00015292188627270936, "loss": 0.0145, "step": 194350 }, { "epoch": 0.98, "learning_rate": 0.00015291431857969535, "loss": 0.01, "step": 194360 }, { "epoch": 0.98, "learning_rate": 0.00015290675088668133, "loss": 0.0097, "step": 194370 }, { "epoch": 0.98, "learning_rate": 0.00015289918319366734, "loss": 0.0097, "step": 194380 }, { "epoch": 0.98, "learning_rate": 0.00015289161550065332, "loss": 0.0125, "step": 194390 }, { "epoch": 0.98, "learning_rate": 0.0001528840478076393, "loss": 0.0107, "step": 194400 }, { "epoch": 0.98, "learning_rate": 0.0001528764801146253, "loss": 0.0139, "step": 194410 }, { "epoch": 0.98, "learning_rate": 0.0001528689124216113, "loss": 0.0107, "step": 194420 }, { "epoch": 0.98, "learning_rate": 0.00015286134472859727, "loss": 0.0116, "step": 194430 }, { "epoch": 0.98, "learning_rate": 0.00015285377703558328, "loss": 0.0113, "step": 194440 }, { "epoch": 0.98, "learning_rate": 0.00015284620934256926, "loss": 0.0108, "step": 194450 }, { "epoch": 0.98, "learning_rate": 0.00015283864164955524, "loss": 0.0131, "step": 194460 }, { "epoch": 0.98, "learning_rate": 0.00015283107395654125, "loss": 0.0117, "step": 194470 }, { "epoch": 0.98, "learning_rate": 0.00015282350626352723, "loss": 0.0105, "step": 194480 }, { "epoch": 0.98, "learning_rate": 0.0001528159385705132, "loss": 0.0112, "step": 194490 }, { "epoch": 0.98, "learning_rate": 0.00015280837087749922, "loss": 0.0104, "step": 194500 }, { "epoch": 0.98, "learning_rate": 0.0001528008031844852, "loss": 0.0089, "step": 194510 }, { "epoch": 0.98, "learning_rate": 0.00015279323549147118, "loss": 0.0178, "step": 194520 }, { "epoch": 0.98, "learning_rate": 0.00015278566779845717, "loss": 0.0098, "step": 194530 }, { "epoch": 0.98, "learning_rate": 0.00015277810010544317, "loss": 0.0131, "step": 194540 }, { "epoch": 0.98, "learning_rate": 0.00015277053241242916, "loss": 0.0108, "step": 194550 }, { "epoch": 0.98, "learning_rate": 0.00015276296471941514, "loss": 0.0086, "step": 194560 }, { "epoch": 0.98, "learning_rate": 0.00015275539702640115, "loss": 0.0103, "step": 194570 }, { "epoch": 0.98, "learning_rate": 0.00015274782933338713, "loss": 0.0094, "step": 194580 }, { "epoch": 0.98, "learning_rate": 0.0001527402616403731, "loss": 0.0123, "step": 194590 }, { "epoch": 0.98, "learning_rate": 0.00015273269394735912, "loss": 0.009, "step": 194600 }, { "epoch": 0.98, "learning_rate": 0.0001527251262543451, "loss": 0.0103, "step": 194610 }, { "epoch": 0.98, "learning_rate": 0.00015271755856133108, "loss": 0.0107, "step": 194620 }, { "epoch": 0.98, "learning_rate": 0.0001527099908683171, "loss": 0.0152, "step": 194630 }, { "epoch": 0.98, "learning_rate": 0.00015270242317530307, "loss": 0.0113, "step": 194640 }, { "epoch": 0.98, "learning_rate": 0.00015269485548228905, "loss": 0.0099, "step": 194650 }, { "epoch": 0.98, "learning_rate": 0.00015268728778927506, "loss": 0.014, "step": 194660 }, { "epoch": 0.98, "learning_rate": 0.00015267972009626104, "loss": 0.0133, "step": 194670 }, { "epoch": 0.98, "learning_rate": 0.00015267215240324702, "loss": 0.0085, "step": 194680 }, { "epoch": 0.98, "learning_rate": 0.000152664584710233, "loss": 0.0111, "step": 194690 }, { "epoch": 0.98, "learning_rate": 0.000152657017017219, "loss": 0.0128, "step": 194700 }, { "epoch": 0.98, "learning_rate": 0.000152649449324205, "loss": 0.0087, "step": 194710 }, { "epoch": 0.98, "learning_rate": 0.00015264188163119098, "loss": 0.0094, "step": 194720 }, { "epoch": 0.98, "learning_rate": 0.00015263431393817698, "loss": 0.0116, "step": 194730 }, { "epoch": 0.98, "learning_rate": 0.00015262674624516297, "loss": 0.0089, "step": 194740 }, { "epoch": 0.98, "learning_rate": 0.00015261917855214895, "loss": 0.011, "step": 194750 }, { "epoch": 0.98, "learning_rate": 0.00015261161085913496, "loss": 0.0102, "step": 194760 }, { "epoch": 0.98, "learning_rate": 0.00015260404316612094, "loss": 0.0115, "step": 194770 }, { "epoch": 0.98, "learning_rate": 0.00015259647547310692, "loss": 0.0125, "step": 194780 }, { "epoch": 0.98, "learning_rate": 0.00015258890778009293, "loss": 0.0104, "step": 194790 }, { "epoch": 0.98, "learning_rate": 0.0001525813400870789, "loss": 0.0103, "step": 194800 }, { "epoch": 0.98, "learning_rate": 0.0001525737723940649, "loss": 0.0087, "step": 194810 }, { "epoch": 0.98, "learning_rate": 0.0001525662047010509, "loss": 0.0113, "step": 194820 }, { "epoch": 0.98, "learning_rate": 0.00015255863700803688, "loss": 0.0118, "step": 194830 }, { "epoch": 0.98, "learning_rate": 0.00015255106931502286, "loss": 0.009, "step": 194840 }, { "epoch": 0.98, "learning_rate": 0.00015254350162200887, "loss": 0.0114, "step": 194850 }, { "epoch": 0.98, "learning_rate": 0.00015253593392899485, "loss": 0.0105, "step": 194860 }, { "epoch": 0.98, "learning_rate": 0.00015252836623598083, "loss": 0.0108, "step": 194870 }, { "epoch": 0.98, "learning_rate": 0.00015252079854296681, "loss": 0.01, "step": 194880 }, { "epoch": 0.98, "learning_rate": 0.00015251323084995282, "loss": 0.0099, "step": 194890 }, { "epoch": 0.98, "learning_rate": 0.0001525056631569388, "loss": 0.014, "step": 194900 }, { "epoch": 0.98, "learning_rate": 0.00015249809546392479, "loss": 0.0111, "step": 194910 }, { "epoch": 0.98, "learning_rate": 0.0001524905277709108, "loss": 0.0115, "step": 194920 }, { "epoch": 0.98, "learning_rate": 0.00015248296007789678, "loss": 0.0086, "step": 194930 }, { "epoch": 0.98, "learning_rate": 0.00015247539238488276, "loss": 0.0092, "step": 194940 }, { "epoch": 0.98, "learning_rate": 0.00015246782469186877, "loss": 0.0107, "step": 194950 }, { "epoch": 0.98, "learning_rate": 0.00015246025699885475, "loss": 0.0105, "step": 194960 }, { "epoch": 0.98, "learning_rate": 0.00015245268930584073, "loss": 0.0094, "step": 194970 }, { "epoch": 0.98, "learning_rate": 0.00015244512161282674, "loss": 0.0114, "step": 194980 }, { "epoch": 0.98, "learning_rate": 0.00015243755391981272, "loss": 0.0114, "step": 194990 }, { "epoch": 0.98, "learning_rate": 0.0001524299862267987, "loss": 0.0132, "step": 195000 }, { "epoch": 0.98, "eval_cer": 0.9144712262992877, "eval_loss": 0.007762947119772434, "eval_runtime": 116.6633, "eval_samples_per_second": 17.143, "eval_steps_per_second": 4.286, "step": 195000 }, { "epoch": 0.98, "learning_rate": 0.0001524224185337847, "loss": 0.0093, "step": 195010 }, { "epoch": 0.98, "learning_rate": 0.0001524148508407707, "loss": 0.0135, "step": 195020 }, { "epoch": 0.98, "learning_rate": 0.00015240728314775667, "loss": 0.0125, "step": 195030 }, { "epoch": 0.98, "learning_rate": 0.00015239971545474265, "loss": 0.011, "step": 195040 }, { "epoch": 0.98, "learning_rate": 0.00015239214776172866, "loss": 0.0137, "step": 195050 }, { "epoch": 0.98, "learning_rate": 0.00015238458006871464, "loss": 0.0117, "step": 195060 }, { "epoch": 0.98, "learning_rate": 0.00015237701237570062, "loss": 0.0097, "step": 195070 }, { "epoch": 0.98, "learning_rate": 0.00015236944468268663, "loss": 0.0099, "step": 195080 }, { "epoch": 0.98, "learning_rate": 0.00015236187698967261, "loss": 0.0106, "step": 195090 }, { "epoch": 0.98, "learning_rate": 0.0001523543092966586, "loss": 0.01, "step": 195100 }, { "epoch": 0.98, "learning_rate": 0.0001523467416036446, "loss": 0.0105, "step": 195110 }, { "epoch": 0.98, "learning_rate": 0.00015233917391063059, "loss": 0.0126, "step": 195120 }, { "epoch": 0.98, "learning_rate": 0.00015233160621761657, "loss": 0.0124, "step": 195130 }, { "epoch": 0.98, "learning_rate": 0.00015232403852460258, "loss": 0.0135, "step": 195140 }, { "epoch": 0.98, "learning_rate": 0.00015231647083158856, "loss": 0.0106, "step": 195150 }, { "epoch": 0.98, "learning_rate": 0.00015230890313857454, "loss": 0.0124, "step": 195160 }, { "epoch": 0.98, "learning_rate": 0.00015230133544556055, "loss": 0.0138, "step": 195170 }, { "epoch": 0.98, "learning_rate": 0.00015229376775254653, "loss": 0.0099, "step": 195180 }, { "epoch": 0.98, "learning_rate": 0.0001522862000595325, "loss": 0.0104, "step": 195190 }, { "epoch": 0.98, "learning_rate": 0.0001522786323665185, "loss": 0.0143, "step": 195200 }, { "epoch": 0.98, "learning_rate": 0.0001522710646735045, "loss": 0.0134, "step": 195210 }, { "epoch": 0.98, "learning_rate": 0.00015226349698049048, "loss": 0.0109, "step": 195220 }, { "epoch": 0.98, "learning_rate": 0.00015225592928747646, "loss": 0.012, "step": 195230 }, { "epoch": 0.99, "learning_rate": 0.00015224836159446247, "loss": 0.0086, "step": 195240 }, { "epoch": 0.99, "learning_rate": 0.00015224079390144845, "loss": 0.0093, "step": 195250 }, { "epoch": 0.99, "learning_rate": 0.00015223322620843443, "loss": 0.0089, "step": 195260 }, { "epoch": 0.99, "learning_rate": 0.00015222565851542044, "loss": 0.0094, "step": 195270 }, { "epoch": 0.99, "learning_rate": 0.00015221809082240642, "loss": 0.0097, "step": 195280 }, { "epoch": 0.99, "learning_rate": 0.0001522105231293924, "loss": 0.0091, "step": 195290 }, { "epoch": 0.99, "learning_rate": 0.00015220295543637841, "loss": 0.0097, "step": 195300 }, { "epoch": 0.99, "learning_rate": 0.0001521953877433644, "loss": 0.0132, "step": 195310 }, { "epoch": 0.99, "learning_rate": 0.00015218782005035038, "loss": 0.0126, "step": 195320 }, { "epoch": 0.99, "learning_rate": 0.00015218025235733639, "loss": 0.009, "step": 195330 }, { "epoch": 0.99, "learning_rate": 0.00015217268466432237, "loss": 0.0102, "step": 195340 }, { "epoch": 0.99, "learning_rate": 0.00015216511697130835, "loss": 0.0111, "step": 195350 }, { "epoch": 0.99, "learning_rate": 0.00015215754927829436, "loss": 0.0133, "step": 195360 }, { "epoch": 0.99, "learning_rate": 0.00015214998158528034, "loss": 0.0106, "step": 195370 }, { "epoch": 0.99, "learning_rate": 0.00015214241389226632, "loss": 0.0111, "step": 195380 }, { "epoch": 0.99, "learning_rate": 0.0001521348461992523, "loss": 0.0114, "step": 195390 }, { "epoch": 0.99, "learning_rate": 0.0001521272785062383, "loss": 0.0075, "step": 195400 }, { "epoch": 0.99, "learning_rate": 0.0001521197108132243, "loss": 0.0108, "step": 195410 }, { "epoch": 0.99, "learning_rate": 0.00015211214312021027, "loss": 0.0077, "step": 195420 }, { "epoch": 0.99, "learning_rate": 0.00015210457542719628, "loss": 0.0118, "step": 195430 }, { "epoch": 0.99, "learning_rate": 0.00015209700773418226, "loss": 0.0112, "step": 195440 }, { "epoch": 0.99, "learning_rate": 0.00015208944004116822, "loss": 0.0097, "step": 195450 }, { "epoch": 0.99, "learning_rate": 0.0001520818723481542, "loss": 0.0108, "step": 195460 }, { "epoch": 0.99, "learning_rate": 0.0001520743046551402, "loss": 0.0113, "step": 195470 }, { "epoch": 0.99, "learning_rate": 0.0001520667369621262, "loss": 0.0109, "step": 195480 }, { "epoch": 0.99, "learning_rate": 0.00015205916926911217, "loss": 0.0128, "step": 195490 }, { "epoch": 0.99, "learning_rate": 0.00015205160157609818, "loss": 0.0097, "step": 195500 }, { "epoch": 0.99, "learning_rate": 0.00015204403388308416, "loss": 0.0096, "step": 195510 }, { "epoch": 0.99, "learning_rate": 0.00015203646619007014, "loss": 0.0098, "step": 195520 }, { "epoch": 0.99, "learning_rate": 0.00015202889849705615, "loss": 0.0086, "step": 195530 }, { "epoch": 0.99, "learning_rate": 0.00015202133080404213, "loss": 0.0157, "step": 195540 }, { "epoch": 0.99, "learning_rate": 0.0001520137631110281, "loss": 0.0133, "step": 195550 }, { "epoch": 0.99, "learning_rate": 0.00015200619541801412, "loss": 0.0097, "step": 195560 }, { "epoch": 0.99, "learning_rate": 0.0001519986277250001, "loss": 0.0097, "step": 195570 }, { "epoch": 0.99, "learning_rate": 0.00015199106003198608, "loss": 0.0118, "step": 195580 }, { "epoch": 0.99, "learning_rate": 0.00015198349233897207, "loss": 0.0098, "step": 195590 }, { "epoch": 0.99, "learning_rate": 0.00015197592464595807, "loss": 0.0127, "step": 195600 }, { "epoch": 0.99, "learning_rate": 0.00015196835695294406, "loss": 0.0136, "step": 195610 }, { "epoch": 0.99, "learning_rate": 0.00015196078925993004, "loss": 0.0123, "step": 195620 }, { "epoch": 0.99, "learning_rate": 0.00015195322156691605, "loss": 0.0114, "step": 195630 }, { "epoch": 0.99, "learning_rate": 0.00015194565387390203, "loss": 0.0092, "step": 195640 }, { "epoch": 0.99, "learning_rate": 0.000151938086180888, "loss": 0.0101, "step": 195650 }, { "epoch": 0.99, "learning_rate": 0.00015193051848787402, "loss": 0.0125, "step": 195660 }, { "epoch": 0.99, "learning_rate": 0.00015192295079486, "loss": 0.0104, "step": 195670 }, { "epoch": 0.99, "learning_rate": 0.00015191538310184598, "loss": 0.0102, "step": 195680 }, { "epoch": 0.99, "learning_rate": 0.000151907815408832, "loss": 0.0131, "step": 195690 }, { "epoch": 0.99, "learning_rate": 0.00015190024771581797, "loss": 0.0127, "step": 195700 }, { "epoch": 0.99, "learning_rate": 0.00015189268002280395, "loss": 0.0101, "step": 195710 }, { "epoch": 0.99, "learning_rate": 0.00015188511232978996, "loss": 0.0131, "step": 195720 }, { "epoch": 0.99, "learning_rate": 0.00015187754463677594, "loss": 0.0087, "step": 195730 }, { "epoch": 0.99, "learning_rate": 0.00015186997694376192, "loss": 0.0106, "step": 195740 }, { "epoch": 0.99, "learning_rate": 0.00015186240925074793, "loss": 0.0141, "step": 195750 }, { "epoch": 0.99, "learning_rate": 0.0001518548415577339, "loss": 0.0104, "step": 195760 }, { "epoch": 0.99, "learning_rate": 0.0001518472738647199, "loss": 0.0098, "step": 195770 }, { "epoch": 0.99, "learning_rate": 0.00015183970617170588, "loss": 0.0118, "step": 195780 }, { "epoch": 0.99, "learning_rate": 0.00015183213847869188, "loss": 0.0087, "step": 195790 }, { "epoch": 0.99, "learning_rate": 0.00015182457078567787, "loss": 0.0139, "step": 195800 }, { "epoch": 0.99, "learning_rate": 0.00015181700309266385, "loss": 0.0104, "step": 195810 }, { "epoch": 0.99, "learning_rate": 0.00015180943539964986, "loss": 0.0083, "step": 195820 }, { "epoch": 0.99, "learning_rate": 0.00015180186770663584, "loss": 0.0112, "step": 195830 }, { "epoch": 0.99, "learning_rate": 0.00015179430001362182, "loss": 0.0091, "step": 195840 }, { "epoch": 0.99, "learning_rate": 0.00015178673232060783, "loss": 0.0149, "step": 195850 }, { "epoch": 0.99, "learning_rate": 0.0001517791646275938, "loss": 0.0119, "step": 195860 }, { "epoch": 0.99, "learning_rate": 0.0001517715969345798, "loss": 0.0122, "step": 195870 }, { "epoch": 0.99, "learning_rate": 0.0001517640292415658, "loss": 0.0137, "step": 195880 }, { "epoch": 0.99, "learning_rate": 0.00015175646154855178, "loss": 0.0138, "step": 195890 }, { "epoch": 0.99, "learning_rate": 0.00015174889385553776, "loss": 0.0124, "step": 195900 }, { "epoch": 0.99, "learning_rate": 0.00015174132616252377, "loss": 0.0103, "step": 195910 }, { "epoch": 0.99, "learning_rate": 0.00015173375846950975, "loss": 0.0112, "step": 195920 }, { "epoch": 0.99, "learning_rate": 0.00015172619077649573, "loss": 0.0118, "step": 195930 }, { "epoch": 0.99, "learning_rate": 0.00015171862308348171, "loss": 0.0128, "step": 195940 }, { "epoch": 0.99, "learning_rate": 0.00015171105539046772, "loss": 0.0135, "step": 195950 }, { "epoch": 0.99, "learning_rate": 0.0001517034876974537, "loss": 0.0157, "step": 195960 }, { "epoch": 0.99, "learning_rate": 0.00015169592000443969, "loss": 0.0106, "step": 195970 }, { "epoch": 0.99, "learning_rate": 0.0001516883523114257, "loss": 0.0113, "step": 195980 }, { "epoch": 0.99, "learning_rate": 0.00015168078461841168, "loss": 0.0105, "step": 195990 }, { "epoch": 0.99, "learning_rate": 0.00015167321692539766, "loss": 0.01, "step": 196000 }, { "epoch": 0.99, "eval_cer": 0.9144450256039017, "eval_loss": 0.007811464369297028, "eval_runtime": 116.6323, "eval_samples_per_second": 17.148, "eval_steps_per_second": 4.287, "step": 196000 }, { "epoch": 0.99, "learning_rate": 0.00015166564923238367, "loss": 0.008, "step": 196010 }, { "epoch": 0.99, "learning_rate": 0.00015165808153936965, "loss": 0.0087, "step": 196020 }, { "epoch": 0.99, "learning_rate": 0.00015165051384635563, "loss": 0.0119, "step": 196030 }, { "epoch": 0.99, "learning_rate": 0.00015164294615334164, "loss": 0.012, "step": 196040 }, { "epoch": 0.99, "learning_rate": 0.00015163537846032762, "loss": 0.0102, "step": 196050 }, { "epoch": 0.99, "learning_rate": 0.0001516278107673136, "loss": 0.0088, "step": 196060 }, { "epoch": 0.99, "learning_rate": 0.0001516202430742996, "loss": 0.0115, "step": 196070 }, { "epoch": 0.99, "learning_rate": 0.0001516126753812856, "loss": 0.0124, "step": 196080 }, { "epoch": 0.99, "learning_rate": 0.00015160510768827157, "loss": 0.0101, "step": 196090 }, { "epoch": 0.99, "learning_rate": 0.00015159753999525755, "loss": 0.0102, "step": 196100 }, { "epoch": 0.99, "learning_rate": 0.00015158997230224356, "loss": 0.0099, "step": 196110 }, { "epoch": 0.99, "learning_rate": 0.00015158240460922954, "loss": 0.0108, "step": 196120 }, { "epoch": 0.99, "learning_rate": 0.00015157483691621552, "loss": 0.0086, "step": 196130 }, { "epoch": 0.99, "learning_rate": 0.00015156726922320153, "loss": 0.0108, "step": 196140 }, { "epoch": 0.99, "learning_rate": 0.00015155970153018751, "loss": 0.01, "step": 196150 }, { "epoch": 0.99, "learning_rate": 0.0001515521338371735, "loss": 0.0099, "step": 196160 }, { "epoch": 0.99, "learning_rate": 0.0001515445661441595, "loss": 0.0139, "step": 196170 }, { "epoch": 0.99, "learning_rate": 0.00015153699845114549, "loss": 0.0098, "step": 196180 }, { "epoch": 0.99, "learning_rate": 0.00015152943075813147, "loss": 0.0104, "step": 196190 }, { "epoch": 0.99, "learning_rate": 0.00015152186306511748, "loss": 0.0084, "step": 196200 }, { "epoch": 0.99, "learning_rate": 0.00015151429537210346, "loss": 0.0101, "step": 196210 }, { "epoch": 0.99, "learning_rate": 0.00015150672767908944, "loss": 0.0088, "step": 196220 }, { "epoch": 0.99, "learning_rate": 0.00015149915998607545, "loss": 0.0108, "step": 196230 }, { "epoch": 0.99, "learning_rate": 0.00015149159229306143, "loss": 0.0084, "step": 196240 }, { "epoch": 0.99, "learning_rate": 0.0001514840246000474, "loss": 0.0101, "step": 196250 }, { "epoch": 0.99, "learning_rate": 0.00015147645690703342, "loss": 0.0127, "step": 196260 }, { "epoch": 0.99, "learning_rate": 0.0001514688892140194, "loss": 0.0091, "step": 196270 }, { "epoch": 0.99, "learning_rate": 0.00015146132152100538, "loss": 0.0094, "step": 196280 }, { "epoch": 0.99, "learning_rate": 0.00015145375382799136, "loss": 0.0096, "step": 196290 }, { "epoch": 0.99, "learning_rate": 0.00015144618613497737, "loss": 0.0099, "step": 196300 }, { "epoch": 0.99, "learning_rate": 0.00015143861844196335, "loss": 0.0109, "step": 196310 }, { "epoch": 0.99, "learning_rate": 0.00015143105074894933, "loss": 0.0106, "step": 196320 }, { "epoch": 0.99, "learning_rate": 0.00015142348305593534, "loss": 0.0102, "step": 196330 }, { "epoch": 0.99, "learning_rate": 0.00015141591536292132, "loss": 0.0124, "step": 196340 }, { "epoch": 0.99, "learning_rate": 0.0001514083476699073, "loss": 0.0113, "step": 196350 }, { "epoch": 0.99, "learning_rate": 0.00015140077997689331, "loss": 0.0102, "step": 196360 }, { "epoch": 0.99, "learning_rate": 0.0001513932122838793, "loss": 0.0113, "step": 196370 }, { "epoch": 0.99, "learning_rate": 0.00015138564459086528, "loss": 0.012, "step": 196380 }, { "epoch": 0.99, "learning_rate": 0.00015137807689785129, "loss": 0.0122, "step": 196390 }, { "epoch": 0.99, "learning_rate": 0.00015137050920483727, "loss": 0.0109, "step": 196400 }, { "epoch": 0.99, "learning_rate": 0.00015136294151182325, "loss": 0.0115, "step": 196410 }, { "epoch": 0.99, "learning_rate": 0.00015135537381880926, "loss": 0.0084, "step": 196420 }, { "epoch": 0.99, "learning_rate": 0.00015134780612579524, "loss": 0.0127, "step": 196430 }, { "epoch": 0.99, "learning_rate": 0.00015134023843278122, "loss": 0.0121, "step": 196440 }, { "epoch": 0.99, "learning_rate": 0.0001513326707397672, "loss": 0.0089, "step": 196450 }, { "epoch": 0.99, "learning_rate": 0.0001513251030467532, "loss": 0.0097, "step": 196460 }, { "epoch": 0.99, "learning_rate": 0.0001513175353537392, "loss": 0.0083, "step": 196470 }, { "epoch": 0.99, "learning_rate": 0.00015130996766072517, "loss": 0.0098, "step": 196480 }, { "epoch": 0.99, "learning_rate": 0.00015130239996771118, "loss": 0.0106, "step": 196490 }, { "epoch": 0.99, "learning_rate": 0.00015129483227469716, "loss": 0.0163, "step": 196500 }, { "epoch": 0.99, "learning_rate": 0.00015128726458168314, "loss": 0.0097, "step": 196510 }, { "epoch": 0.99, "learning_rate": 0.00015127969688866915, "loss": 0.0095, "step": 196520 }, { "epoch": 0.99, "learning_rate": 0.00015127212919565513, "loss": 0.0121, "step": 196530 }, { "epoch": 0.99, "learning_rate": 0.00015126456150264112, "loss": 0.0082, "step": 196540 }, { "epoch": 0.99, "learning_rate": 0.00015125699380962712, "loss": 0.0093, "step": 196550 }, { "epoch": 0.99, "learning_rate": 0.0001512494261166131, "loss": 0.0099, "step": 196560 }, { "epoch": 0.99, "learning_rate": 0.0001512418584235991, "loss": 0.0099, "step": 196570 }, { "epoch": 0.99, "learning_rate": 0.0001512342907305851, "loss": 0.0079, "step": 196580 }, { "epoch": 0.99, "learning_rate": 0.00015122672303757108, "loss": 0.0116, "step": 196590 }, { "epoch": 0.99, "learning_rate": 0.00015121915534455706, "loss": 0.0108, "step": 196600 }, { "epoch": 0.99, "learning_rate": 0.00015121158765154304, "loss": 0.0091, "step": 196610 }, { "epoch": 0.99, "learning_rate": 0.00015120401995852905, "loss": 0.0125, "step": 196620 }, { "epoch": 0.99, "learning_rate": 0.00015119645226551503, "loss": 0.0112, "step": 196630 }, { "epoch": 0.99, "learning_rate": 0.000151188884572501, "loss": 0.0094, "step": 196640 }, { "epoch": 0.99, "learning_rate": 0.00015118131687948702, "loss": 0.0148, "step": 196650 }, { "epoch": 0.99, "learning_rate": 0.000151173749186473, "loss": 0.0133, "step": 196660 }, { "epoch": 0.99, "learning_rate": 0.00015116618149345898, "loss": 0.0141, "step": 196670 }, { "epoch": 0.99, "learning_rate": 0.000151158613800445, "loss": 0.0078, "step": 196680 }, { "epoch": 0.99, "learning_rate": 0.00015115104610743097, "loss": 0.0129, "step": 196690 }, { "epoch": 0.99, "learning_rate": 0.00015114347841441695, "loss": 0.0119, "step": 196700 }, { "epoch": 0.99, "learning_rate": 0.0001511359107214029, "loss": 0.0118, "step": 196710 }, { "epoch": 0.99, "learning_rate": 0.00015112834302838892, "loss": 0.0108, "step": 196720 }, { "epoch": 0.99, "learning_rate": 0.0001511207753353749, "loss": 0.0094, "step": 196730 }, { "epoch": 0.99, "learning_rate": 0.00015111320764236088, "loss": 0.0107, "step": 196740 }, { "epoch": 0.99, "learning_rate": 0.0001511056399493469, "loss": 0.0111, "step": 196750 }, { "epoch": 0.99, "learning_rate": 0.00015109807225633287, "loss": 0.0135, "step": 196760 }, { "epoch": 0.99, "learning_rate": 0.00015109050456331885, "loss": 0.0098, "step": 196770 }, { "epoch": 0.99, "learning_rate": 0.00015108293687030486, "loss": 0.0173, "step": 196780 }, { "epoch": 0.99, "learning_rate": 0.00015107536917729084, "loss": 0.011, "step": 196790 }, { "epoch": 0.99, "learning_rate": 0.00015106780148427682, "loss": 0.011, "step": 196800 }, { "epoch": 0.99, "learning_rate": 0.00015106023379126283, "loss": 0.0121, "step": 196810 }, { "epoch": 0.99, "learning_rate": 0.0001510526660982488, "loss": 0.0112, "step": 196820 }, { "epoch": 0.99, "learning_rate": 0.0001510450984052348, "loss": 0.0111, "step": 196830 }, { "epoch": 0.99, "learning_rate": 0.00015103753071222078, "loss": 0.0096, "step": 196840 }, { "epoch": 0.99, "learning_rate": 0.00015102996301920678, "loss": 0.0128, "step": 196850 }, { "epoch": 0.99, "learning_rate": 0.00015102239532619277, "loss": 0.0096, "step": 196860 }, { "epoch": 0.99, "learning_rate": 0.00015101482763317875, "loss": 0.0112, "step": 196870 }, { "epoch": 0.99, "learning_rate": 0.00015100725994016476, "loss": 0.0132, "step": 196880 }, { "epoch": 0.99, "learning_rate": 0.00015099969224715074, "loss": 0.0111, "step": 196890 }, { "epoch": 0.99, "learning_rate": 0.00015099212455413672, "loss": 0.0099, "step": 196900 }, { "epoch": 0.99, "learning_rate": 0.00015098455686112273, "loss": 0.0134, "step": 196910 }, { "epoch": 0.99, "learning_rate": 0.0001509769891681087, "loss": 0.0098, "step": 196920 }, { "epoch": 0.99, "learning_rate": 0.0001509694214750947, "loss": 0.0121, "step": 196930 }, { "epoch": 0.99, "learning_rate": 0.0001509618537820807, "loss": 0.0112, "step": 196940 }, { "epoch": 0.99, "learning_rate": 0.00015095428608906668, "loss": 0.0115, "step": 196950 }, { "epoch": 0.99, "learning_rate": 0.00015094671839605266, "loss": 0.0111, "step": 196960 }, { "epoch": 0.99, "learning_rate": 0.00015093915070303867, "loss": 0.0105, "step": 196970 }, { "epoch": 0.99, "learning_rate": 0.00015093158301002465, "loss": 0.0087, "step": 196980 }, { "epoch": 0.99, "learning_rate": 0.00015092401531701063, "loss": 0.0118, "step": 196990 }, { "epoch": 0.99, "learning_rate": 0.00015091644762399662, "loss": 0.0106, "step": 197000 }, { "epoch": 0.99, "eval_cer": 0.9144877230334195, "eval_loss": 0.007818542420864105, "eval_runtime": 116.7928, "eval_samples_per_second": 17.124, "eval_steps_per_second": 4.281, "step": 197000 }, { "epoch": 0.99, "learning_rate": 0.00015090887993098262, "loss": 0.0102, "step": 197010 }, { "epoch": 0.99, "learning_rate": 0.0001509013122379686, "loss": 0.0127, "step": 197020 }, { "epoch": 0.99, "learning_rate": 0.0001508937445449546, "loss": 0.0101, "step": 197030 }, { "epoch": 0.99, "learning_rate": 0.0001508861768519406, "loss": 0.0111, "step": 197040 }, { "epoch": 0.99, "learning_rate": 0.00015087860915892658, "loss": 0.0098, "step": 197050 }, { "epoch": 0.99, "learning_rate": 0.00015087104146591256, "loss": 0.0121, "step": 197060 }, { "epoch": 0.99, "learning_rate": 0.00015086347377289857, "loss": 0.0101, "step": 197070 }, { "epoch": 0.99, "learning_rate": 0.00015085590607988455, "loss": 0.0107, "step": 197080 }, { "epoch": 0.99, "learning_rate": 0.00015084833838687053, "loss": 0.0124, "step": 197090 }, { "epoch": 0.99, "learning_rate": 0.00015084077069385654, "loss": 0.0102, "step": 197100 }, { "epoch": 0.99, "learning_rate": 0.00015083320300084252, "loss": 0.0111, "step": 197110 }, { "epoch": 0.99, "learning_rate": 0.0001508256353078285, "loss": 0.0092, "step": 197120 }, { "epoch": 0.99, "learning_rate": 0.0001508180676148145, "loss": 0.0094, "step": 197130 }, { "epoch": 0.99, "learning_rate": 0.0001508104999218005, "loss": 0.0127, "step": 197140 }, { "epoch": 0.99, "learning_rate": 0.00015080293222878647, "loss": 0.0106, "step": 197150 }, { "epoch": 0.99, "learning_rate": 0.00015079536453577245, "loss": 0.0106, "step": 197160 }, { "epoch": 0.99, "learning_rate": 0.00015078779684275846, "loss": 0.0103, "step": 197170 }, { "epoch": 0.99, "learning_rate": 0.00015078022914974444, "loss": 0.0134, "step": 197180 }, { "epoch": 0.99, "learning_rate": 0.00015077266145673043, "loss": 0.0124, "step": 197190 }, { "epoch": 0.99, "learning_rate": 0.00015076509376371643, "loss": 0.0109, "step": 197200 }, { "epoch": 0.99, "learning_rate": 0.00015075752607070242, "loss": 0.016, "step": 197210 }, { "epoch": 0.99, "learning_rate": 0.0001507499583776884, "loss": 0.0101, "step": 197220 }, { "epoch": 1.0, "learning_rate": 0.0001507423906846744, "loss": 0.0101, "step": 197230 }, { "epoch": 1.0, "learning_rate": 0.0001507348229916604, "loss": 0.0124, "step": 197240 }, { "epoch": 1.0, "learning_rate": 0.00015072725529864637, "loss": 0.011, "step": 197250 }, { "epoch": 1.0, "learning_rate": 0.00015071968760563238, "loss": 0.0118, "step": 197260 }, { "epoch": 1.0, "learning_rate": 0.00015071211991261836, "loss": 0.0135, "step": 197270 }, { "epoch": 1.0, "learning_rate": 0.00015070455221960434, "loss": 0.0103, "step": 197280 }, { "epoch": 1.0, "learning_rate": 0.00015069698452659035, "loss": 0.0112, "step": 197290 }, { "epoch": 1.0, "learning_rate": 0.00015068941683357633, "loss": 0.0096, "step": 197300 }, { "epoch": 1.0, "learning_rate": 0.0001506818491405623, "loss": 0.0117, "step": 197310 }, { "epoch": 1.0, "learning_rate": 0.00015067428144754832, "loss": 0.0114, "step": 197320 }, { "epoch": 1.0, "learning_rate": 0.0001506667137545343, "loss": 0.0112, "step": 197330 }, { "epoch": 1.0, "learning_rate": 0.00015065914606152028, "loss": 0.0129, "step": 197340 }, { "epoch": 1.0, "learning_rate": 0.00015065157836850626, "loss": 0.0166, "step": 197350 }, { "epoch": 1.0, "learning_rate": 0.00015064401067549227, "loss": 0.0115, "step": 197360 }, { "epoch": 1.0, "learning_rate": 0.00015063644298247825, "loss": 0.0096, "step": 197370 }, { "epoch": 1.0, "learning_rate": 0.00015062887528946424, "loss": 0.0094, "step": 197380 }, { "epoch": 1.0, "learning_rate": 0.00015062130759645024, "loss": 0.0089, "step": 197390 }, { "epoch": 1.0, "learning_rate": 0.00015061373990343623, "loss": 0.0114, "step": 197400 }, { "epoch": 1.0, "learning_rate": 0.0001506061722104222, "loss": 0.008, "step": 197410 }, { "epoch": 1.0, "learning_rate": 0.00015059860451740822, "loss": 0.0102, "step": 197420 }, { "epoch": 1.0, "learning_rate": 0.0001505910368243942, "loss": 0.0113, "step": 197430 }, { "epoch": 1.0, "learning_rate": 0.00015058346913138018, "loss": 0.0086, "step": 197440 }, { "epoch": 1.0, "learning_rate": 0.0001505759014383662, "loss": 0.0109, "step": 197450 }, { "epoch": 1.0, "learning_rate": 0.00015056833374535217, "loss": 0.0096, "step": 197460 }, { "epoch": 1.0, "learning_rate": 0.00015056076605233815, "loss": 0.0111, "step": 197470 }, { "epoch": 1.0, "learning_rate": 0.00015055319835932416, "loss": 0.0107, "step": 197480 }, { "epoch": 1.0, "learning_rate": 0.00015054563066631014, "loss": 0.0103, "step": 197490 }, { "epoch": 1.0, "learning_rate": 0.00015053806297329612, "loss": 0.0103, "step": 197500 }, { "epoch": 1.0, "learning_rate": 0.0001505304952802821, "loss": 0.0098, "step": 197510 }, { "epoch": 1.0, "learning_rate": 0.0001505229275872681, "loss": 0.0097, "step": 197520 }, { "epoch": 1.0, "learning_rate": 0.0001505153598942541, "loss": 0.0122, "step": 197530 }, { "epoch": 1.0, "learning_rate": 0.00015050779220124007, "loss": 0.0116, "step": 197540 }, { "epoch": 1.0, "learning_rate": 0.00015050022450822608, "loss": 0.0107, "step": 197550 }, { "epoch": 1.0, "learning_rate": 0.00015049265681521206, "loss": 0.0085, "step": 197560 }, { "epoch": 1.0, "learning_rate": 0.00015048508912219805, "loss": 0.0086, "step": 197570 }, { "epoch": 1.0, "learning_rate": 0.00015047752142918405, "loss": 0.0131, "step": 197580 }, { "epoch": 1.0, "learning_rate": 0.00015046995373617004, "loss": 0.0094, "step": 197590 }, { "epoch": 1.0, "learning_rate": 0.00015046238604315602, "loss": 0.0102, "step": 197600 }, { "epoch": 1.0, "learning_rate": 0.00015045481835014203, "loss": 0.0099, "step": 197610 }, { "epoch": 1.0, "learning_rate": 0.000150447250657128, "loss": 0.0079, "step": 197620 }, { "epoch": 1.0, "learning_rate": 0.000150439682964114, "loss": 0.011, "step": 197630 }, { "epoch": 1.0, "learning_rate": 0.0001504321152711, "loss": 0.0078, "step": 197640 }, { "epoch": 1.0, "learning_rate": 0.00015042454757808598, "loss": 0.0097, "step": 197650 }, { "epoch": 1.0, "learning_rate": 0.00015041697988507196, "loss": 0.0119, "step": 197660 }, { "epoch": 1.0, "learning_rate": 0.00015040941219205794, "loss": 0.011, "step": 197670 }, { "epoch": 1.0, "learning_rate": 0.00015040184449904395, "loss": 0.0128, "step": 197680 }, { "epoch": 1.0, "learning_rate": 0.00015039427680602993, "loss": 0.0114, "step": 197690 }, { "epoch": 1.0, "learning_rate": 0.0001503867091130159, "loss": 0.0098, "step": 197700 }, { "epoch": 1.0, "learning_rate": 0.00015037914142000192, "loss": 0.0092, "step": 197710 }, { "epoch": 1.0, "learning_rate": 0.0001503715737269879, "loss": 0.0114, "step": 197720 }, { "epoch": 1.0, "learning_rate": 0.00015036400603397388, "loss": 0.0096, "step": 197730 }, { "epoch": 1.0, "learning_rate": 0.0001503564383409599, "loss": 0.0112, "step": 197740 }, { "epoch": 1.0, "learning_rate": 0.00015034887064794587, "loss": 0.0099, "step": 197750 }, { "epoch": 1.0, "learning_rate": 0.00015034130295493186, "loss": 0.0086, "step": 197760 }, { "epoch": 1.0, "learning_rate": 0.00015033373526191786, "loss": 0.0073, "step": 197770 }, { "epoch": 1.0, "learning_rate": 0.00015032616756890385, "loss": 0.0081, "step": 197780 }, { "epoch": 1.0, "learning_rate": 0.00015031859987588983, "loss": 0.0086, "step": 197790 }, { "epoch": 1.0, "learning_rate": 0.00015031103218287584, "loss": 0.0102, "step": 197800 }, { "epoch": 1.0, "learning_rate": 0.00015030346448986182, "loss": 0.0136, "step": 197810 }, { "epoch": 1.0, "learning_rate": 0.0001502958967968478, "loss": 0.011, "step": 197820 }, { "epoch": 1.0, "learning_rate": 0.0001502883291038338, "loss": 0.013, "step": 197830 }, { "epoch": 1.0, "learning_rate": 0.0001502807614108198, "loss": 0.0079, "step": 197840 }, { "epoch": 1.0, "learning_rate": 0.00015027319371780577, "loss": 0.0102, "step": 197850 }, { "epoch": 1.0, "learning_rate": 0.00015026562602479175, "loss": 0.0109, "step": 197860 }, { "epoch": 1.0, "learning_rate": 0.00015025805833177776, "loss": 0.0102, "step": 197870 }, { "epoch": 1.0, "learning_rate": 0.00015025049063876374, "loss": 0.0104, "step": 197880 }, { "epoch": 1.0, "learning_rate": 0.00015024292294574972, "loss": 0.0114, "step": 197890 }, { "epoch": 1.0, "learning_rate": 0.00015023535525273573, "loss": 0.0141, "step": 197900 }, { "epoch": 1.0, "learning_rate": 0.0001502277875597217, "loss": 0.0093, "step": 197910 }, { "epoch": 1.0, "learning_rate": 0.0001502202198667077, "loss": 0.0095, "step": 197920 }, { "epoch": 1.0, "learning_rate": 0.0001502126521736937, "loss": 0.0093, "step": 197930 }, { "epoch": 1.0, "learning_rate": 0.00015020508448067968, "loss": 0.0118, "step": 197940 }, { "epoch": 1.0, "learning_rate": 0.00015019751678766567, "loss": 0.009, "step": 197950 }, { "epoch": 1.0, "learning_rate": 0.00015018994909465162, "loss": 0.0109, "step": 197960 }, { "epoch": 1.0, "learning_rate": 0.00015018238140163763, "loss": 0.0111, "step": 197970 }, { "epoch": 1.0, "learning_rate": 0.0001501748137086236, "loss": 0.0077, "step": 197980 }, { "epoch": 1.0, "learning_rate": 0.0001501672460156096, "loss": 0.0113, "step": 197990 }, { "epoch": 1.0, "learning_rate": 0.0001501596783225956, "loss": 0.0091, "step": 198000 }, { "epoch": 1.0, "eval_cer": 0.9144508479806542, "eval_loss": 0.007899566553533077, "eval_runtime": 116.6273, "eval_samples_per_second": 17.149, "eval_steps_per_second": 4.287, "step": 198000 }, { "epoch": 1.0, "learning_rate": 0.00015015211062958158, "loss": 0.0115, "step": 198010 }, { "epoch": 1.0, "learning_rate": 0.00015014454293656756, "loss": 0.0108, "step": 198020 }, { "epoch": 1.0, "learning_rate": 0.00015013697524355357, "loss": 0.0132, "step": 198030 }, { "epoch": 1.0, "learning_rate": 0.00015012940755053955, "loss": 0.0086, "step": 198040 }, { "epoch": 1.0, "learning_rate": 0.00015012183985752553, "loss": 0.0124, "step": 198050 }, { "epoch": 1.0, "learning_rate": 0.00015011427216451152, "loss": 0.0122, "step": 198060 }, { "epoch": 1.0, "learning_rate": 0.00015010670447149752, "loss": 0.013, "step": 198070 }, { "epoch": 1.0, "learning_rate": 0.0001500991367784835, "loss": 0.0101, "step": 198080 }, { "epoch": 1.0, "learning_rate": 0.0001500915690854695, "loss": 0.007, "step": 198090 }, { "epoch": 1.0, "learning_rate": 0.0001500840013924555, "loss": 0.0124, "step": 198100 }, { "epoch": 1.0, "learning_rate": 0.00015007643369944148, "loss": 0.0075, "step": 198110 }, { "epoch": 1.0, "learning_rate": 0.00015006886600642746, "loss": 0.0101, "step": 198120 }, { "epoch": 1.0, "learning_rate": 0.00015006129831341347, "loss": 0.0134, "step": 198130 }, { "epoch": 1.0, "learning_rate": 0.00015005373062039945, "loss": 0.0106, "step": 198140 }, { "epoch": 1.0, "learning_rate": 0.00015004616292738543, "loss": 0.0164, "step": 198150 }, { "epoch": 1.0, "learning_rate": 0.00015003859523437144, "loss": 0.0095, "step": 198160 }, { "epoch": 1.0, "learning_rate": 0.00015003102754135742, "loss": 0.0103, "step": 198170 }, { "epoch": 1.0, "learning_rate": 0.0001500234598483434, "loss": 0.0145, "step": 198180 }, { "epoch": 1.0, "learning_rate": 0.0001500158921553294, "loss": 0.0115, "step": 198190 }, { "epoch": 1.0, "learning_rate": 0.0001500083244623154, "loss": 0.0108, "step": 198200 }, { "epoch": 1.0, "learning_rate": 0.00015000075676930137, "loss": 0.0138, "step": 198210 }, { "epoch": 1.0, "learning_rate": 0.00014999318907628738, "loss": 0.0088, "step": 198220 }, { "epoch": 1.0, "learning_rate": 0.00014998562138327336, "loss": 0.01, "step": 198230 }, { "epoch": 1.0, "learning_rate": 0.00014997805369025937, "loss": 0.0105, "step": 198240 }, { "epoch": 1.0, "learning_rate": 0.00014997048599724535, "loss": 0.0092, "step": 198250 }, { "epoch": 1.0, "learning_rate": 0.00014996291830423133, "loss": 0.0114, "step": 198260 }, { "epoch": 1.0, "learning_rate": 0.00014995535061121734, "loss": 0.0114, "step": 198270 }, { "epoch": 1.0, "learning_rate": 0.0001499477829182033, "loss": 0.0106, "step": 198280 }, { "epoch": 1.0, "learning_rate": 0.0001499402152251893, "loss": 0.0107, "step": 198290 }, { "epoch": 1.0, "learning_rate": 0.0001499326475321753, "loss": 0.0087, "step": 198300 }, { "epoch": 1.0, "learning_rate": 0.00014992507983916127, "loss": 0.0094, "step": 198310 }, { "epoch": 1.0, "learning_rate": 0.00014991751214614728, "loss": 0.0105, "step": 198320 }, { "epoch": 1.0, "learning_rate": 0.00014990994445313326, "loss": 0.0088, "step": 198330 }, { "epoch": 1.0, "learning_rate": 0.00014990237676011924, "loss": 0.0093, "step": 198340 }, { "epoch": 1.0, "learning_rate": 0.00014989480906710525, "loss": 0.0089, "step": 198350 }, { "epoch": 1.0, "learning_rate": 0.00014988724137409123, "loss": 0.0106, "step": 198360 }, { "epoch": 1.0, "learning_rate": 0.0001498796736810772, "loss": 0.0083, "step": 198370 }, { "epoch": 1.0, "learning_rate": 0.00014987210598806322, "loss": 0.0092, "step": 198380 }, { "epoch": 1.0, "learning_rate": 0.0001498645382950492, "loss": 0.0089, "step": 198390 }, { "epoch": 1.0, "learning_rate": 0.00014985697060203518, "loss": 0.0096, "step": 198400 }, { "epoch": 1.0, "learning_rate": 0.00014984940290902116, "loss": 0.0117, "step": 198410 }, { "epoch": 1.0, "learning_rate": 0.00014984183521600717, "loss": 0.01, "step": 198420 }, { "epoch": 1.0, "learning_rate": 0.00014983426752299315, "loss": 0.0067, "step": 198430 }, { "epoch": 1.0, "learning_rate": 0.00014982669982997914, "loss": 0.011, "step": 198440 }, { "epoch": 1.0, "learning_rate": 0.00014981913213696514, "loss": 0.0089, "step": 198450 }, { "epoch": 1.0, "learning_rate": 0.00014981156444395113, "loss": 0.0103, "step": 198460 }, { "epoch": 1.0, "learning_rate": 0.0001498039967509371, "loss": 0.0125, "step": 198470 }, { "epoch": 1.0, "learning_rate": 0.00014979642905792312, "loss": 0.0086, "step": 198480 }, { "epoch": 1.0, "learning_rate": 0.0001497888613649091, "loss": 0.0097, "step": 198490 }, { "epoch": 1.0, "learning_rate": 0.00014978129367189508, "loss": 0.0067, "step": 198500 }, { "epoch": 1.0, "learning_rate": 0.0001497737259788811, "loss": 0.0101, "step": 198510 }, { "epoch": 1.0, "learning_rate": 0.00014976615828586707, "loss": 0.0114, "step": 198520 }, { "epoch": 1.0, "learning_rate": 0.00014975859059285305, "loss": 0.009, "step": 198530 }, { "epoch": 1.0, "learning_rate": 0.00014975102289983906, "loss": 0.0081, "step": 198540 }, { "epoch": 1.0, "learning_rate": 0.00014974345520682504, "loss": 0.0108, "step": 198550 }, { "epoch": 1.0, "learning_rate": 0.00014973588751381102, "loss": 0.0095, "step": 198560 }, { "epoch": 1.0, "learning_rate": 0.000149728319820797, "loss": 0.0093, "step": 198570 }, { "epoch": 1.0, "learning_rate": 0.000149720752127783, "loss": 0.01, "step": 198580 }, { "epoch": 1.0, "learning_rate": 0.000149713184434769, "loss": 0.0128, "step": 198590 }, { "epoch": 1.0, "learning_rate": 0.00014970561674175497, "loss": 0.0158, "step": 198600 }, { "epoch": 1.0, "learning_rate": 0.00014969804904874098, "loss": 0.015, "step": 198610 }, { "epoch": 1.0, "learning_rate": 0.00014969048135572696, "loss": 0.0128, "step": 198620 }, { "epoch": 1.0, "learning_rate": 0.00014968291366271295, "loss": 0.011, "step": 198630 }, { "epoch": 1.0, "learning_rate": 0.00014967534596969895, "loss": 0.0096, "step": 198640 }, { "epoch": 1.0, "learning_rate": 0.00014966777827668494, "loss": 0.0108, "step": 198650 }, { "epoch": 1.0, "learning_rate": 0.00014966021058367092, "loss": 0.0095, "step": 198660 }, { "epoch": 1.0, "learning_rate": 0.00014965264289065693, "loss": 0.0113, "step": 198670 }, { "epoch": 1.0, "learning_rate": 0.0001496450751976429, "loss": 0.0095, "step": 198680 }, { "epoch": 1.0, "learning_rate": 0.0001496375075046289, "loss": 0.0101, "step": 198690 }, { "epoch": 1.0, "learning_rate": 0.0001496299398116149, "loss": 0.0108, "step": 198700 }, { "epoch": 1.0, "learning_rate": 0.00014962237211860088, "loss": 0.0107, "step": 198710 }, { "epoch": 1.0, "learning_rate": 0.00014961480442558686, "loss": 0.0074, "step": 198720 }, { "epoch": 1.0, "learning_rate": 0.00014960723673257287, "loss": 0.0135, "step": 198730 }, { "epoch": 1.0, "learning_rate": 0.00014959966903955885, "loss": 0.0103, "step": 198740 }, { "epoch": 1.0, "learning_rate": 0.00014959210134654483, "loss": 0.0113, "step": 198750 }, { "epoch": 1.0, "learning_rate": 0.0001495845336535308, "loss": 0.0097, "step": 198760 }, { "epoch": 1.0, "learning_rate": 0.00014957696596051682, "loss": 0.0079, "step": 198770 }, { "epoch": 1.0, "learning_rate": 0.0001495693982675028, "loss": 0.009, "step": 198780 }, { "epoch": 1.0, "learning_rate": 0.00014956183057448878, "loss": 0.011, "step": 198790 }, { "epoch": 1.0, "learning_rate": 0.0001495542628814748, "loss": 0.0112, "step": 198800 }, { "epoch": 1.0, "learning_rate": 0.00014954669518846077, "loss": 0.011, "step": 198810 }, { "epoch": 1.0, "learning_rate": 0.00014953912749544676, "loss": 0.0096, "step": 198820 }, { "epoch": 1.0, "learning_rate": 0.00014953155980243276, "loss": 0.0077, "step": 198830 }, { "epoch": 1.0, "learning_rate": 0.00014952399210941875, "loss": 0.012, "step": 198840 }, { "epoch": 1.0, "learning_rate": 0.00014951642441640473, "loss": 0.0103, "step": 198850 }, { "epoch": 1.0, "learning_rate": 0.00014950885672339074, "loss": 0.0099, "step": 198860 }, { "epoch": 1.0, "learning_rate": 0.00014950128903037672, "loss": 0.0119, "step": 198870 }, { "epoch": 1.0, "learning_rate": 0.0001494937213373627, "loss": 0.0111, "step": 198880 }, { "epoch": 1.0, "learning_rate": 0.0001494861536443487, "loss": 0.0093, "step": 198890 }, { "epoch": 1.0, "learning_rate": 0.0001494785859513347, "loss": 0.0116, "step": 198900 }, { "epoch": 1.0, "learning_rate": 0.00014947101825832067, "loss": 0.0091, "step": 198910 }, { "epoch": 1.0, "learning_rate": 0.00014946345056530665, "loss": 0.0067, "step": 198920 }, { "epoch": 1.0, "learning_rate": 0.00014945588287229263, "loss": 0.0138, "step": 198930 }, { "epoch": 1.0, "learning_rate": 0.00014944831517927861, "loss": 0.0096, "step": 198940 }, { "epoch": 1.0, "learning_rate": 0.00014944074748626462, "loss": 0.0139, "step": 198950 }, { "epoch": 1.0, "learning_rate": 0.0001494331797932506, "loss": 0.0083, "step": 198960 }, { "epoch": 1.0, "learning_rate": 0.00014942561210023659, "loss": 0.0093, "step": 198970 }, { "epoch": 1.0, "learning_rate": 0.0001494180444072226, "loss": 0.0119, "step": 198980 }, { "epoch": 1.0, "learning_rate": 0.00014941047671420858, "loss": 0.0098, "step": 198990 }, { "epoch": 1.0, "learning_rate": 0.00014940290902119456, "loss": 0.0085, "step": 199000 }, { "epoch": 1.0, "eval_cer": 0.914462492734159, "eval_loss": 0.00810973159968853, "eval_runtime": 117.6891, "eval_samples_per_second": 16.994, "eval_steps_per_second": 4.248, "step": 199000 }, { "epoch": 1.0, "learning_rate": 0.00014939534132818057, "loss": 0.009, "step": 199010 }, { "epoch": 1.0, "learning_rate": 0.00014938777363516655, "loss": 0.0097, "step": 199020 }, { "epoch": 1.0, "learning_rate": 0.00014938020594215253, "loss": 0.0093, "step": 199030 }, { "epoch": 1.0, "learning_rate": 0.00014937263824913854, "loss": 0.0087, "step": 199040 }, { "epoch": 1.0, "learning_rate": 0.00014936507055612452, "loss": 0.008, "step": 199050 }, { "epoch": 1.0, "learning_rate": 0.0001493575028631105, "loss": 0.0094, "step": 199060 }, { "epoch": 1.0, "learning_rate": 0.0001493499351700965, "loss": 0.0084, "step": 199070 }, { "epoch": 1.0, "learning_rate": 0.0001493423674770825, "loss": 0.0079, "step": 199080 }, { "epoch": 1.0, "learning_rate": 0.00014933479978406847, "loss": 0.0093, "step": 199090 }, { "epoch": 1.0, "learning_rate": 0.00014932723209105445, "loss": 0.0095, "step": 199100 }, { "epoch": 1.0, "learning_rate": 0.00014931966439804046, "loss": 0.0083, "step": 199110 }, { "epoch": 1.0, "learning_rate": 0.00014931209670502644, "loss": 0.0098, "step": 199120 }, { "epoch": 1.0, "learning_rate": 0.00014930452901201242, "loss": 0.0098, "step": 199130 }, { "epoch": 1.0, "learning_rate": 0.00014929696131899843, "loss": 0.0107, "step": 199140 }, { "epoch": 1.0, "learning_rate": 0.00014928939362598441, "loss": 0.0079, "step": 199150 }, { "epoch": 1.0, "learning_rate": 0.0001492818259329704, "loss": 0.0087, "step": 199160 }, { "epoch": 1.0, "learning_rate": 0.0001492742582399564, "loss": 0.0103, "step": 199170 }, { "epoch": 1.0, "learning_rate": 0.00014926669054694239, "loss": 0.0108, "step": 199180 }, { "epoch": 1.0, "learning_rate": 0.00014925912285392837, "loss": 0.0162, "step": 199190 }, { "epoch": 1.0, "learning_rate": 0.00014925155516091438, "loss": 0.0074, "step": 199200 }, { "epoch": 1.01, "learning_rate": 0.00014924398746790036, "loss": 0.011, "step": 199210 }, { "epoch": 1.01, "learning_rate": 0.00014923641977488634, "loss": 0.0111, "step": 199220 }, { "epoch": 1.01, "learning_rate": 0.00014922885208187235, "loss": 0.0081, "step": 199230 }, { "epoch": 1.01, "learning_rate": 0.00014922128438885833, "loss": 0.0115, "step": 199240 }, { "epoch": 1.01, "learning_rate": 0.0001492137166958443, "loss": 0.0077, "step": 199250 }, { "epoch": 1.01, "learning_rate": 0.00014920614900283032, "loss": 0.0101, "step": 199260 }, { "epoch": 1.01, "learning_rate": 0.0001491985813098163, "loss": 0.01, "step": 199270 }, { "epoch": 1.01, "learning_rate": 0.00014919101361680228, "loss": 0.0098, "step": 199280 }, { "epoch": 1.01, "learning_rate": 0.00014918344592378826, "loss": 0.0078, "step": 199290 }, { "epoch": 1.01, "learning_rate": 0.00014917587823077427, "loss": 0.0102, "step": 199300 }, { "epoch": 1.01, "learning_rate": 0.00014916831053776025, "loss": 0.0084, "step": 199310 }, { "epoch": 1.01, "learning_rate": 0.00014916074284474623, "loss": 0.0094, "step": 199320 }, { "epoch": 1.01, "learning_rate": 0.00014915317515173224, "loss": 0.0081, "step": 199330 }, { "epoch": 1.01, "learning_rate": 0.00014914560745871822, "loss": 0.0102, "step": 199340 }, { "epoch": 1.01, "learning_rate": 0.0001491380397657042, "loss": 0.0083, "step": 199350 }, { "epoch": 1.01, "learning_rate": 0.00014913047207269021, "loss": 0.0084, "step": 199360 }, { "epoch": 1.01, "learning_rate": 0.0001491229043796762, "loss": 0.0101, "step": 199370 }, { "epoch": 1.01, "learning_rate": 0.00014911533668666218, "loss": 0.0096, "step": 199380 }, { "epoch": 1.01, "learning_rate": 0.00014910776899364819, "loss": 0.008, "step": 199390 }, { "epoch": 1.01, "learning_rate": 0.00014910020130063417, "loss": 0.0093, "step": 199400 }, { "epoch": 1.01, "learning_rate": 0.00014909263360762015, "loss": 0.0102, "step": 199410 }, { "epoch": 1.01, "learning_rate": 0.00014908506591460616, "loss": 0.0093, "step": 199420 }, { "epoch": 1.01, "learning_rate": 0.00014907749822159214, "loss": 0.0085, "step": 199430 }, { "epoch": 1.01, "learning_rate": 0.00014906993052857812, "loss": 0.0085, "step": 199440 }, { "epoch": 1.01, "learning_rate": 0.0001490623628355641, "loss": 0.0091, "step": 199450 }, { "epoch": 1.01, "learning_rate": 0.0001490547951425501, "loss": 0.012, "step": 199460 }, { "epoch": 1.01, "learning_rate": 0.0001490472274495361, "loss": 0.0105, "step": 199470 }, { "epoch": 1.01, "learning_rate": 0.00014903965975652207, "loss": 0.0089, "step": 199480 }, { "epoch": 1.01, "learning_rate": 0.00014903209206350808, "loss": 0.0097, "step": 199490 }, { "epoch": 1.01, "learning_rate": 0.00014902452437049406, "loss": 0.0127, "step": 199500 }, { "epoch": 1.01, "learning_rate": 0.00014901695667748004, "loss": 0.0092, "step": 199510 }, { "epoch": 1.01, "learning_rate": 0.00014900938898446605, "loss": 0.01, "step": 199520 }, { "epoch": 1.01, "learning_rate": 0.00014900182129145203, "loss": 0.0153, "step": 199530 }, { "epoch": 1.01, "learning_rate": 0.00014899425359843802, "loss": 0.0097, "step": 199540 }, { "epoch": 1.01, "learning_rate": 0.000148986685905424, "loss": 0.0117, "step": 199550 }, { "epoch": 1.01, "learning_rate": 0.00014897911821240998, "loss": 0.0114, "step": 199560 }, { "epoch": 1.01, "learning_rate": 0.000148971550519396, "loss": 0.0081, "step": 199570 }, { "epoch": 1.01, "learning_rate": 0.00014896398282638197, "loss": 0.0093, "step": 199580 }, { "epoch": 1.01, "learning_rate": 0.00014895641513336795, "loss": 0.0107, "step": 199590 }, { "epoch": 1.01, "learning_rate": 0.00014894884744035396, "loss": 0.0106, "step": 199600 }, { "epoch": 1.01, "learning_rate": 0.00014894127974733994, "loss": 0.0105, "step": 199610 }, { "epoch": 1.01, "learning_rate": 0.00014893371205432592, "loss": 0.0102, "step": 199620 }, { "epoch": 1.01, "learning_rate": 0.00014892614436131193, "loss": 0.0113, "step": 199630 }, { "epoch": 1.01, "learning_rate": 0.0001489185766682979, "loss": 0.009, "step": 199640 }, { "epoch": 1.01, "learning_rate": 0.0001489110089752839, "loss": 0.0085, "step": 199650 }, { "epoch": 1.01, "learning_rate": 0.00014890344128226987, "loss": 0.0095, "step": 199660 }, { "epoch": 1.01, "learning_rate": 0.00014889587358925588, "loss": 0.0142, "step": 199670 }, { "epoch": 1.01, "learning_rate": 0.00014888830589624186, "loss": 0.0162, "step": 199680 }, { "epoch": 1.01, "learning_rate": 0.00014888073820322785, "loss": 0.0112, "step": 199690 }, { "epoch": 1.01, "learning_rate": 0.00014887317051021385, "loss": 0.01, "step": 199700 }, { "epoch": 1.01, "learning_rate": 0.00014886560281719984, "loss": 0.0089, "step": 199710 }, { "epoch": 1.01, "learning_rate": 0.00014885803512418582, "loss": 0.0101, "step": 199720 }, { "epoch": 1.01, "learning_rate": 0.00014885046743117183, "loss": 0.0114, "step": 199730 }, { "epoch": 1.01, "learning_rate": 0.0001488428997381578, "loss": 0.0106, "step": 199740 }, { "epoch": 1.01, "learning_rate": 0.0001488353320451438, "loss": 0.0077, "step": 199750 }, { "epoch": 1.01, "learning_rate": 0.0001488277643521298, "loss": 0.0069, "step": 199760 }, { "epoch": 1.01, "learning_rate": 0.00014882019665911578, "loss": 0.0109, "step": 199770 }, { "epoch": 1.01, "learning_rate": 0.00014881262896610176, "loss": 0.0105, "step": 199780 }, { "epoch": 1.01, "learning_rate": 0.00014880506127308777, "loss": 0.0082, "step": 199790 }, { "epoch": 1.01, "learning_rate": 0.00014879749358007375, "loss": 0.0137, "step": 199800 }, { "epoch": 1.01, "learning_rate": 0.00014878992588705973, "loss": 0.0094, "step": 199810 }, { "epoch": 1.01, "learning_rate": 0.0001487823581940457, "loss": 0.0089, "step": 199820 }, { "epoch": 1.01, "learning_rate": 0.00014877479050103172, "loss": 0.0105, "step": 199830 }, { "epoch": 1.01, "learning_rate": 0.0001487672228080177, "loss": 0.0118, "step": 199840 }, { "epoch": 1.01, "learning_rate": 0.00014875965511500368, "loss": 0.0099, "step": 199850 }, { "epoch": 1.01, "learning_rate": 0.0001487520874219897, "loss": 0.0095, "step": 199860 }, { "epoch": 1.01, "learning_rate": 0.00014874451972897567, "loss": 0.009, "step": 199870 }, { "epoch": 1.01, "learning_rate": 0.00014873695203596166, "loss": 0.0112, "step": 199880 }, { "epoch": 1.01, "learning_rate": 0.00014872938434294766, "loss": 0.0104, "step": 199890 }, { "epoch": 1.01, "learning_rate": 0.00014872181664993365, "loss": 0.0079, "step": 199900 }, { "epoch": 1.01, "learning_rate": 0.00014871424895691963, "loss": 0.0098, "step": 199910 }, { "epoch": 1.01, "learning_rate": 0.00014870668126390564, "loss": 0.0096, "step": 199920 }, { "epoch": 1.01, "learning_rate": 0.00014869911357089162, "loss": 0.0091, "step": 199930 }, { "epoch": 1.01, "learning_rate": 0.0001486915458778776, "loss": 0.0114, "step": 199940 }, { "epoch": 1.01, "learning_rate": 0.0001486839781848636, "loss": 0.0097, "step": 199950 }, { "epoch": 1.01, "learning_rate": 0.0001486764104918496, "loss": 0.0089, "step": 199960 }, { "epoch": 1.01, "learning_rate": 0.00014866884279883557, "loss": 0.0083, "step": 199970 }, { "epoch": 1.01, "learning_rate": 0.00014866127510582155, "loss": 0.0083, "step": 199980 }, { "epoch": 1.01, "learning_rate": 0.00014865370741280756, "loss": 0.0102, "step": 199990 }, { "epoch": 1.01, "learning_rate": 0.00014864613971979354, "loss": 0.0085, "step": 200000 }, { "epoch": 1.01, "eval_cer": 0.9144615223380336, "eval_loss": 0.007801192346960306, "eval_runtime": 117.4252, "eval_samples_per_second": 17.032, "eval_steps_per_second": 4.258, "step": 200000 }, { "epoch": 1.01, "learning_rate": 0.00014863857202677952, "loss": 0.0097, "step": 200010 }, { "epoch": 1.01, "learning_rate": 0.00014863100433376553, "loss": 0.0116, "step": 200020 }, { "epoch": 1.01, "learning_rate": 0.0001486234366407515, "loss": 0.01, "step": 200030 }, { "epoch": 1.01, "learning_rate": 0.0001486158689477375, "loss": 0.0106, "step": 200040 }, { "epoch": 1.01, "learning_rate": 0.0001486083012547235, "loss": 0.009, "step": 200050 }, { "epoch": 1.01, "learning_rate": 0.00014860073356170948, "loss": 0.0097, "step": 200060 }, { "epoch": 1.01, "learning_rate": 0.00014859316586869547, "loss": 0.0088, "step": 200070 }, { "epoch": 1.01, "learning_rate": 0.00014858559817568147, "loss": 0.0089, "step": 200080 }, { "epoch": 1.01, "learning_rate": 0.00014857803048266746, "loss": 0.0094, "step": 200090 }, { "epoch": 1.01, "learning_rate": 0.00014857046278965344, "loss": 0.0099, "step": 200100 }, { "epoch": 1.01, "learning_rate": 0.00014856289509663945, "loss": 0.0111, "step": 200110 }, { "epoch": 1.01, "learning_rate": 0.00014855532740362543, "loss": 0.0089, "step": 200120 }, { "epoch": 1.01, "learning_rate": 0.0001485477597106114, "loss": 0.009, "step": 200130 }, { "epoch": 1.01, "learning_rate": 0.00014854019201759742, "loss": 0.0108, "step": 200140 }, { "epoch": 1.01, "learning_rate": 0.0001485326243245834, "loss": 0.0074, "step": 200150 }, { "epoch": 1.01, "learning_rate": 0.00014852505663156938, "loss": 0.0089, "step": 200160 }, { "epoch": 1.01, "learning_rate": 0.00014851748893855536, "loss": 0.0093, "step": 200170 }, { "epoch": 1.01, "learning_rate": 0.00014850992124554134, "loss": 0.0089, "step": 200180 }, { "epoch": 1.01, "learning_rate": 0.00014850235355252732, "loss": 0.0087, "step": 200190 }, { "epoch": 1.01, "learning_rate": 0.00014849478585951333, "loss": 0.0114, "step": 200200 }, { "epoch": 1.01, "learning_rate": 0.00014848721816649931, "loss": 0.0094, "step": 200210 }, { "epoch": 1.01, "learning_rate": 0.0001484796504734853, "loss": 0.0091, "step": 200220 }, { "epoch": 1.01, "learning_rate": 0.0001484720827804713, "loss": 0.0075, "step": 200230 }, { "epoch": 1.01, "learning_rate": 0.00014846451508745729, "loss": 0.0082, "step": 200240 }, { "epoch": 1.01, "learning_rate": 0.00014845694739444327, "loss": 0.0095, "step": 200250 }, { "epoch": 1.01, "learning_rate": 0.00014844937970142928, "loss": 0.0083, "step": 200260 }, { "epoch": 1.01, "learning_rate": 0.00014844181200841526, "loss": 0.0106, "step": 200270 }, { "epoch": 1.01, "learning_rate": 0.00014843424431540124, "loss": 0.0085, "step": 200280 }, { "epoch": 1.01, "learning_rate": 0.00014842667662238725, "loss": 0.0112, "step": 200290 }, { "epoch": 1.01, "learning_rate": 0.00014841910892937323, "loss": 0.0095, "step": 200300 }, { "epoch": 1.01, "learning_rate": 0.0001484115412363592, "loss": 0.0104, "step": 200310 }, { "epoch": 1.01, "learning_rate": 0.00014840397354334522, "loss": 0.0104, "step": 200320 }, { "epoch": 1.01, "learning_rate": 0.0001483964058503312, "loss": 0.0079, "step": 200330 }, { "epoch": 1.01, "learning_rate": 0.00014838883815731718, "loss": 0.0083, "step": 200340 }, { "epoch": 1.01, "learning_rate": 0.00014838127046430316, "loss": 0.0099, "step": 200350 }, { "epoch": 1.01, "learning_rate": 0.00014837370277128917, "loss": 0.0074, "step": 200360 }, { "epoch": 1.01, "learning_rate": 0.00014836613507827515, "loss": 0.0176, "step": 200370 }, { "epoch": 1.01, "learning_rate": 0.00014835856738526113, "loss": 0.0103, "step": 200380 }, { "epoch": 1.01, "learning_rate": 0.00014835099969224714, "loss": 0.0098, "step": 200390 }, { "epoch": 1.01, "learning_rate": 0.00014834343199923312, "loss": 0.0109, "step": 200400 }, { "epoch": 1.01, "learning_rate": 0.0001483358643062191, "loss": 0.0095, "step": 200410 }, { "epoch": 1.01, "learning_rate": 0.00014832829661320511, "loss": 0.0097, "step": 200420 }, { "epoch": 1.01, "learning_rate": 0.0001483207289201911, "loss": 0.0099, "step": 200430 }, { "epoch": 1.01, "learning_rate": 0.00014831316122717708, "loss": 0.015, "step": 200440 }, { "epoch": 1.01, "learning_rate": 0.00014830559353416309, "loss": 0.0131, "step": 200450 }, { "epoch": 1.01, "learning_rate": 0.00014829802584114907, "loss": 0.0498, "step": 200460 }, { "epoch": 1.01, "learning_rate": 0.00014829045814813505, "loss": 0.0123, "step": 200470 }, { "epoch": 1.01, "learning_rate": 0.00014828289045512106, "loss": 0.0098, "step": 200480 }, { "epoch": 1.01, "learning_rate": 0.00014827532276210704, "loss": 0.0117, "step": 200490 }, { "epoch": 1.01, "learning_rate": 0.00014826775506909302, "loss": 0.0111, "step": 200500 }, { "epoch": 1.01, "learning_rate": 0.000148260187376079, "loss": 0.0098, "step": 200510 }, { "epoch": 1.01, "learning_rate": 0.000148252619683065, "loss": 0.0111, "step": 200520 }, { "epoch": 1.01, "learning_rate": 0.000148245051990051, "loss": 0.008, "step": 200530 }, { "epoch": 1.01, "learning_rate": 0.00014823748429703697, "loss": 0.0123, "step": 200540 }, { "epoch": 1.01, "learning_rate": 0.00014822991660402298, "loss": 0.0089, "step": 200550 }, { "epoch": 1.01, "learning_rate": 0.00014822234891100896, "loss": 0.008, "step": 200560 }, { "epoch": 1.01, "learning_rate": 0.00014821478121799494, "loss": 0.0079, "step": 200570 }, { "epoch": 1.01, "learning_rate": 0.00014820721352498095, "loss": 0.0071, "step": 200580 }, { "epoch": 1.01, "learning_rate": 0.00014819964583196693, "loss": 0.0119, "step": 200590 }, { "epoch": 1.01, "learning_rate": 0.00014819207813895292, "loss": 0.0127, "step": 200600 }, { "epoch": 1.01, "learning_rate": 0.00014818451044593892, "loss": 0.0112, "step": 200610 }, { "epoch": 1.01, "learning_rate": 0.0001481769427529249, "loss": 0.0087, "step": 200620 }, { "epoch": 1.01, "learning_rate": 0.0001481693750599109, "loss": 0.01, "step": 200630 }, { "epoch": 1.01, "learning_rate": 0.0001481618073668969, "loss": 0.0106, "step": 200640 }, { "epoch": 1.01, "learning_rate": 0.00014815423967388288, "loss": 0.0104, "step": 200650 }, { "epoch": 1.01, "learning_rate": 0.00014814667198086886, "loss": 0.0076, "step": 200660 }, { "epoch": 1.01, "learning_rate": 0.00014813910428785487, "loss": 0.0091, "step": 200670 }, { "epoch": 1.01, "learning_rate": 0.00014813153659484085, "loss": 0.0104, "step": 200680 }, { "epoch": 1.01, "learning_rate": 0.00014812396890182683, "loss": 0.0108, "step": 200690 }, { "epoch": 1.01, "learning_rate": 0.0001481164012088128, "loss": 0.0101, "step": 200700 }, { "epoch": 1.01, "learning_rate": 0.00014810883351579882, "loss": 0.0098, "step": 200710 }, { "epoch": 1.01, "learning_rate": 0.0001481012658227848, "loss": 0.0102, "step": 200720 }, { "epoch": 1.01, "learning_rate": 0.00014809369812977078, "loss": 0.0089, "step": 200730 }, { "epoch": 1.01, "learning_rate": 0.0001480861304367568, "loss": 0.0109, "step": 200740 }, { "epoch": 1.01, "learning_rate": 0.00014807856274374277, "loss": 0.0091, "step": 200750 }, { "epoch": 1.01, "learning_rate": 0.00014807099505072875, "loss": 0.0095, "step": 200760 }, { "epoch": 1.01, "learning_rate": 0.00014806342735771476, "loss": 0.0106, "step": 200770 }, { "epoch": 1.01, "learning_rate": 0.00014805585966470074, "loss": 0.0088, "step": 200780 }, { "epoch": 1.01, "learning_rate": 0.00014804829197168673, "loss": 0.0124, "step": 200790 }, { "epoch": 1.01, "learning_rate": 0.0001480407242786727, "loss": 0.0088, "step": 200800 }, { "epoch": 1.01, "learning_rate": 0.0001480331565856587, "loss": 0.0109, "step": 200810 }, { "epoch": 1.01, "learning_rate": 0.0001480255888926447, "loss": 0.0111, "step": 200820 }, { "epoch": 1.01, "learning_rate": 0.00014801802119963068, "loss": 0.0091, "step": 200830 }, { "epoch": 1.01, "learning_rate": 0.00014801045350661666, "loss": 0.0111, "step": 200840 }, { "epoch": 1.01, "learning_rate": 0.00014800288581360267, "loss": 0.0117, "step": 200850 }, { "epoch": 1.01, "learning_rate": 0.00014799531812058865, "loss": 0.0105, "step": 200860 }, { "epoch": 1.01, "learning_rate": 0.00014798775042757463, "loss": 0.0085, "step": 200870 }, { "epoch": 1.01, "learning_rate": 0.0001479801827345606, "loss": 0.0118, "step": 200880 }, { "epoch": 1.01, "learning_rate": 0.00014797261504154662, "loss": 0.0112, "step": 200890 }, { "epoch": 1.01, "learning_rate": 0.0001479650473485326, "loss": 0.0112, "step": 200900 }, { "epoch": 1.01, "learning_rate": 0.00014795747965551858, "loss": 0.0099, "step": 200910 }, { "epoch": 1.01, "learning_rate": 0.0001479499119625046, "loss": 0.0114, "step": 200920 }, { "epoch": 1.01, "learning_rate": 0.00014794234426949057, "loss": 0.0092, "step": 200930 }, { "epoch": 1.01, "learning_rate": 0.00014793477657647656, "loss": 0.0111, "step": 200940 }, { "epoch": 1.01, "learning_rate": 0.00014792720888346256, "loss": 0.0083, "step": 200950 }, { "epoch": 1.01, "learning_rate": 0.00014791964119044855, "loss": 0.0099, "step": 200960 }, { "epoch": 1.01, "learning_rate": 0.00014791207349743453, "loss": 0.0085, "step": 200970 }, { "epoch": 1.01, "learning_rate": 0.00014790450580442054, "loss": 0.0159, "step": 200980 }, { "epoch": 1.01, "learning_rate": 0.00014789693811140652, "loss": 0.0129, "step": 200990 }, { "epoch": 1.01, "learning_rate": 0.0001478893704183925, "loss": 0.0094, "step": 201000 }, { "epoch": 1.01, "eval_cer": 0.914447936792278, "eval_loss": 0.007961818017065525, "eval_runtime": 117.347, "eval_samples_per_second": 17.043, "eval_steps_per_second": 4.261, "step": 201000 }, { "epoch": 1.01, "learning_rate": 0.0001478818027253785, "loss": 0.0099, "step": 201010 }, { "epoch": 1.01, "learning_rate": 0.0001478742350323645, "loss": 0.0091, "step": 201020 }, { "epoch": 1.01, "learning_rate": 0.00014786666733935047, "loss": 0.0101, "step": 201030 }, { "epoch": 1.01, "learning_rate": 0.00014785909964633645, "loss": 0.0135, "step": 201040 }, { "epoch": 1.01, "learning_rate": 0.00014785153195332246, "loss": 0.0141, "step": 201050 }, { "epoch": 1.01, "learning_rate": 0.00014784396426030844, "loss": 0.0078, "step": 201060 }, { "epoch": 1.01, "learning_rate": 0.00014783639656729442, "loss": 0.011, "step": 201070 }, { "epoch": 1.01, "learning_rate": 0.00014782882887428043, "loss": 0.0122, "step": 201080 }, { "epoch": 1.01, "learning_rate": 0.0001478212611812664, "loss": 0.01, "step": 201090 }, { "epoch": 1.01, "learning_rate": 0.0001478136934882524, "loss": 0.0103, "step": 201100 }, { "epoch": 1.01, "learning_rate": 0.0001478061257952384, "loss": 0.0109, "step": 201110 }, { "epoch": 1.01, "learning_rate": 0.00014779855810222438, "loss": 0.0091, "step": 201120 }, { "epoch": 1.01, "learning_rate": 0.00014779099040921037, "loss": 0.0093, "step": 201130 }, { "epoch": 1.01, "learning_rate": 0.00014778342271619637, "loss": 0.0084, "step": 201140 }, { "epoch": 1.01, "learning_rate": 0.00014777585502318236, "loss": 0.0116, "step": 201150 }, { "epoch": 1.01, "learning_rate": 0.00014776828733016834, "loss": 0.0088, "step": 201160 }, { "epoch": 1.01, "learning_rate": 0.00014776071963715435, "loss": 0.0102, "step": 201170 }, { "epoch": 1.01, "learning_rate": 0.00014775315194414033, "loss": 0.0106, "step": 201180 }, { "epoch": 1.02, "learning_rate": 0.0001477455842511263, "loss": 0.0099, "step": 201190 }, { "epoch": 1.02, "learning_rate": 0.00014773801655811232, "loss": 0.0082, "step": 201200 }, { "epoch": 1.02, "learning_rate": 0.0001477304488650983, "loss": 0.0084, "step": 201210 }, { "epoch": 1.02, "learning_rate": 0.00014772288117208428, "loss": 0.0108, "step": 201220 }, { "epoch": 1.02, "learning_rate": 0.00014771531347907026, "loss": 0.0087, "step": 201230 }, { "epoch": 1.02, "learning_rate": 0.00014770774578605627, "loss": 0.0091, "step": 201240 }, { "epoch": 1.02, "learning_rate": 0.00014770017809304225, "loss": 0.0095, "step": 201250 }, { "epoch": 1.02, "learning_rate": 0.00014769261040002823, "loss": 0.012, "step": 201260 }, { "epoch": 1.02, "learning_rate": 0.00014768504270701424, "loss": 0.0117, "step": 201270 }, { "epoch": 1.02, "learning_rate": 0.00014767747501400022, "loss": 0.0094, "step": 201280 }, { "epoch": 1.02, "learning_rate": 0.0001476699073209862, "loss": 0.0102, "step": 201290 }, { "epoch": 1.02, "learning_rate": 0.0001476623396279722, "loss": 0.0091, "step": 201300 }, { "epoch": 1.02, "learning_rate": 0.0001476547719349582, "loss": 0.0099, "step": 201310 }, { "epoch": 1.02, "learning_rate": 0.00014764720424194418, "loss": 0.0094, "step": 201320 }, { "epoch": 1.02, "learning_rate": 0.00014763963654893018, "loss": 0.0101, "step": 201330 }, { "epoch": 1.02, "learning_rate": 0.00014763206885591617, "loss": 0.0078, "step": 201340 }, { "epoch": 1.02, "learning_rate": 0.00014762450116290215, "loss": 0.011, "step": 201350 }, { "epoch": 1.02, "learning_rate": 0.00014761693346988816, "loss": 0.0092, "step": 201360 }, { "epoch": 1.02, "learning_rate": 0.00014760936577687414, "loss": 0.0096, "step": 201370 }, { "epoch": 1.02, "learning_rate": 0.00014760179808386012, "loss": 0.0086, "step": 201380 }, { "epoch": 1.02, "learning_rate": 0.0001475942303908461, "loss": 0.0102, "step": 201390 }, { "epoch": 1.02, "learning_rate": 0.0001475866626978321, "loss": 0.0091, "step": 201400 }, { "epoch": 1.02, "learning_rate": 0.0001475790950048181, "loss": 0.0143, "step": 201410 }, { "epoch": 1.02, "learning_rate": 0.00014757152731180407, "loss": 0.0086, "step": 201420 }, { "epoch": 1.02, "learning_rate": 0.00014756395961879005, "loss": 0.0101, "step": 201430 }, { "epoch": 1.02, "learning_rate": 0.00014755639192577603, "loss": 0.0089, "step": 201440 }, { "epoch": 1.02, "learning_rate": 0.00014754882423276204, "loss": 0.0119, "step": 201450 }, { "epoch": 1.02, "learning_rate": 0.00014754125653974802, "loss": 0.0099, "step": 201460 }, { "epoch": 1.02, "learning_rate": 0.000147533688846734, "loss": 0.0092, "step": 201470 }, { "epoch": 1.02, "learning_rate": 0.00014752612115372001, "loss": 0.0099, "step": 201480 }, { "epoch": 1.02, "learning_rate": 0.000147518553460706, "loss": 0.0089, "step": 201490 }, { "epoch": 1.02, "learning_rate": 0.00014751098576769198, "loss": 0.0093, "step": 201500 }, { "epoch": 1.02, "learning_rate": 0.00014750341807467799, "loss": 0.0085, "step": 201510 }, { "epoch": 1.02, "learning_rate": 0.00014749585038166397, "loss": 0.0085, "step": 201520 }, { "epoch": 1.02, "learning_rate": 0.00014748828268864995, "loss": 0.0117, "step": 201530 }, { "epoch": 1.02, "learning_rate": 0.00014748071499563596, "loss": 0.0107, "step": 201540 }, { "epoch": 1.02, "learning_rate": 0.00014747314730262194, "loss": 0.0091, "step": 201550 }, { "epoch": 1.02, "learning_rate": 0.00014746557960960792, "loss": 0.0093, "step": 201560 }, { "epoch": 1.02, "learning_rate": 0.00014745801191659393, "loss": 0.0087, "step": 201570 }, { "epoch": 1.02, "learning_rate": 0.0001474504442235799, "loss": 0.0122, "step": 201580 }, { "epoch": 1.02, "learning_rate": 0.0001474428765305659, "loss": 0.009, "step": 201590 }, { "epoch": 1.02, "learning_rate": 0.00014743530883755187, "loss": 0.0093, "step": 201600 }, { "epoch": 1.02, "learning_rate": 0.00014742774114453788, "loss": 0.0069, "step": 201610 }, { "epoch": 1.02, "learning_rate": 0.00014742017345152386, "loss": 0.008, "step": 201620 }, { "epoch": 1.02, "learning_rate": 0.00014741260575850984, "loss": 0.0137, "step": 201630 }, { "epoch": 1.02, "learning_rate": 0.00014740503806549585, "loss": 0.0089, "step": 201640 }, { "epoch": 1.02, "learning_rate": 0.00014739747037248183, "loss": 0.0082, "step": 201650 }, { "epoch": 1.02, "learning_rate": 0.00014738990267946782, "loss": 0.0107, "step": 201660 }, { "epoch": 1.02, "learning_rate": 0.00014738233498645382, "loss": 0.0089, "step": 201670 }, { "epoch": 1.02, "learning_rate": 0.0001473747672934398, "loss": 0.0077, "step": 201680 }, { "epoch": 1.02, "learning_rate": 0.0001473671996004258, "loss": 0.0103, "step": 201690 }, { "epoch": 1.02, "learning_rate": 0.0001473596319074118, "loss": 0.0092, "step": 201700 }, { "epoch": 1.02, "learning_rate": 0.00014735206421439778, "loss": 0.0083, "step": 201710 }, { "epoch": 1.02, "learning_rate": 0.00014734449652138376, "loss": 0.0103, "step": 201720 }, { "epoch": 1.02, "learning_rate": 0.00014733692882836977, "loss": 0.015, "step": 201730 }, { "epoch": 1.02, "learning_rate": 0.00014732936113535575, "loss": 0.0099, "step": 201740 }, { "epoch": 1.02, "learning_rate": 0.00014732179344234173, "loss": 0.0091, "step": 201750 }, { "epoch": 1.02, "learning_rate": 0.0001473142257493277, "loss": 0.0131, "step": 201760 }, { "epoch": 1.02, "learning_rate": 0.00014730665805631372, "loss": 0.0111, "step": 201770 }, { "epoch": 1.02, "learning_rate": 0.0001472990903632997, "loss": 0.0105, "step": 201780 }, { "epoch": 1.02, "learning_rate": 0.00014729152267028568, "loss": 0.0094, "step": 201790 }, { "epoch": 1.02, "learning_rate": 0.0001472839549772717, "loss": 0.0139, "step": 201800 }, { "epoch": 1.02, "learning_rate": 0.00014727638728425767, "loss": 0.0096, "step": 201810 }, { "epoch": 1.02, "learning_rate": 0.00014726881959124365, "loss": 0.0109, "step": 201820 }, { "epoch": 1.02, "learning_rate": 0.00014726125189822966, "loss": 0.011, "step": 201830 }, { "epoch": 1.02, "learning_rate": 0.00014725368420521564, "loss": 0.0092, "step": 201840 }, { "epoch": 1.02, "learning_rate": 0.00014724611651220163, "loss": 0.0099, "step": 201850 }, { "epoch": 1.02, "learning_rate": 0.00014723854881918763, "loss": 0.0108, "step": 201860 }, { "epoch": 1.02, "learning_rate": 0.00014723098112617362, "loss": 0.0077, "step": 201870 }, { "epoch": 1.02, "learning_rate": 0.0001472234134331596, "loss": 0.012, "step": 201880 }, { "epoch": 1.02, "learning_rate": 0.0001472158457401456, "loss": 0.0085, "step": 201890 }, { "epoch": 1.02, "learning_rate": 0.0001472082780471316, "loss": 0.0081, "step": 201900 }, { "epoch": 1.02, "learning_rate": 0.00014720071035411757, "loss": 0.0077, "step": 201910 }, { "epoch": 1.02, "learning_rate": 0.00014719314266110355, "loss": 0.009, "step": 201920 }, { "epoch": 1.02, "learning_rate": 0.00014718557496808956, "loss": 0.0094, "step": 201930 }, { "epoch": 1.02, "learning_rate": 0.00014717800727507554, "loss": 0.011, "step": 201940 }, { "epoch": 1.02, "learning_rate": 0.00014717043958206152, "loss": 0.0107, "step": 201950 }, { "epoch": 1.02, "learning_rate": 0.00014716287188904753, "loss": 0.0086, "step": 201960 }, { "epoch": 1.02, "learning_rate": 0.0001471553041960335, "loss": 0.0099, "step": 201970 }, { "epoch": 1.02, "learning_rate": 0.0001471477365030195, "loss": 0.0105, "step": 201980 }, { "epoch": 1.02, "learning_rate": 0.0001471401688100055, "loss": 0.008, "step": 201990 }, { "epoch": 1.02, "learning_rate": 0.00014713260111699148, "loss": 0.009, "step": 202000 }, { "epoch": 1.02, "eval_cer": 0.9144954862024227, "eval_loss": 0.007912137545645237, "eval_runtime": 117.0882, "eval_samples_per_second": 17.081, "eval_steps_per_second": 4.27, "step": 202000 }, { "epoch": 1.02, "learning_rate": 0.00014712503342397746, "loss": 0.0113, "step": 202010 }, { "epoch": 1.02, "learning_rate": 0.00014711746573096347, "loss": 0.0106, "step": 202020 }, { "epoch": 1.02, "learning_rate": 0.00014710989803794945, "loss": 0.0126, "step": 202030 }, { "epoch": 1.02, "learning_rate": 0.00014710233034493544, "loss": 0.0107, "step": 202040 }, { "epoch": 1.02, "learning_rate": 0.00014709476265192142, "loss": 0.0111, "step": 202050 }, { "epoch": 1.02, "learning_rate": 0.0001470871949589074, "loss": 0.0086, "step": 202060 }, { "epoch": 1.02, "learning_rate": 0.0001470796272658934, "loss": 0.0098, "step": 202070 }, { "epoch": 1.02, "learning_rate": 0.0001470720595728794, "loss": 0.009, "step": 202080 }, { "epoch": 1.02, "learning_rate": 0.00014706449187986537, "loss": 0.0108, "step": 202090 }, { "epoch": 1.02, "learning_rate": 0.00014705692418685138, "loss": 0.0099, "step": 202100 }, { "epoch": 1.02, "learning_rate": 0.00014704935649383736, "loss": 0.0098, "step": 202110 }, { "epoch": 1.02, "learning_rate": 0.00014704178880082334, "loss": 0.0108, "step": 202120 }, { "epoch": 1.02, "learning_rate": 0.00014703422110780932, "loss": 0.0107, "step": 202130 }, { "epoch": 1.02, "learning_rate": 0.00014702665341479533, "loss": 0.0092, "step": 202140 }, { "epoch": 1.02, "learning_rate": 0.0001470190857217813, "loss": 0.009, "step": 202150 }, { "epoch": 1.02, "learning_rate": 0.0001470115180287673, "loss": 0.0084, "step": 202160 }, { "epoch": 1.02, "learning_rate": 0.0001470039503357533, "loss": 0.0118, "step": 202170 }, { "epoch": 1.02, "learning_rate": 0.00014699638264273928, "loss": 0.0094, "step": 202180 }, { "epoch": 1.02, "learning_rate": 0.00014698881494972527, "loss": 0.0087, "step": 202190 }, { "epoch": 1.02, "learning_rate": 0.00014698124725671127, "loss": 0.0129, "step": 202200 }, { "epoch": 1.02, "learning_rate": 0.00014697367956369726, "loss": 0.0133, "step": 202210 }, { "epoch": 1.02, "learning_rate": 0.00014696611187068324, "loss": 0.0087, "step": 202220 }, { "epoch": 1.02, "learning_rate": 0.00014695854417766925, "loss": 0.0078, "step": 202230 }, { "epoch": 1.02, "learning_rate": 0.00014695097648465523, "loss": 0.0098, "step": 202240 }, { "epoch": 1.02, "learning_rate": 0.0001469434087916412, "loss": 0.0114, "step": 202250 }, { "epoch": 1.02, "learning_rate": 0.00014693584109862722, "loss": 0.0098, "step": 202260 }, { "epoch": 1.02, "learning_rate": 0.0001469282734056132, "loss": 0.0074, "step": 202270 }, { "epoch": 1.02, "learning_rate": 0.00014692070571259918, "loss": 0.0088, "step": 202280 }, { "epoch": 1.02, "learning_rate": 0.00014691313801958516, "loss": 0.0101, "step": 202290 }, { "epoch": 1.02, "learning_rate": 0.00014690557032657117, "loss": 0.0098, "step": 202300 }, { "epoch": 1.02, "learning_rate": 0.00014689800263355715, "loss": 0.0111, "step": 202310 }, { "epoch": 1.02, "learning_rate": 0.00014689043494054313, "loss": 0.0127, "step": 202320 }, { "epoch": 1.02, "learning_rate": 0.00014688286724752914, "loss": 0.0075, "step": 202330 }, { "epoch": 1.02, "learning_rate": 0.00014687529955451512, "loss": 0.0084, "step": 202340 }, { "epoch": 1.02, "learning_rate": 0.0001468677318615011, "loss": 0.0105, "step": 202350 }, { "epoch": 1.02, "learning_rate": 0.0001468601641684871, "loss": 0.0088, "step": 202360 }, { "epoch": 1.02, "learning_rate": 0.0001468525964754731, "loss": 0.0096, "step": 202370 }, { "epoch": 1.02, "learning_rate": 0.00014684502878245908, "loss": 0.0097, "step": 202380 }, { "epoch": 1.02, "learning_rate": 0.00014683746108944508, "loss": 0.0119, "step": 202390 }, { "epoch": 1.02, "learning_rate": 0.00014682989339643107, "loss": 0.0079, "step": 202400 }, { "epoch": 1.02, "learning_rate": 0.00014682232570341705, "loss": 0.0113, "step": 202410 }, { "epoch": 1.02, "learning_rate": 0.00014681475801040306, "loss": 0.0093, "step": 202420 }, { "epoch": 1.02, "learning_rate": 0.00014680719031738904, "loss": 0.0107, "step": 202430 }, { "epoch": 1.02, "learning_rate": 0.00014679962262437502, "loss": 0.0089, "step": 202440 }, { "epoch": 1.02, "learning_rate": 0.000146792054931361, "loss": 0.0079, "step": 202450 }, { "epoch": 1.02, "learning_rate": 0.000146784487238347, "loss": 0.0108, "step": 202460 }, { "epoch": 1.02, "learning_rate": 0.000146776919545333, "loss": 0.011, "step": 202470 }, { "epoch": 1.02, "learning_rate": 0.00014676935185231897, "loss": 0.0095, "step": 202480 }, { "epoch": 1.02, "learning_rate": 0.00014676178415930498, "loss": 0.0083, "step": 202490 }, { "epoch": 1.02, "learning_rate": 0.00014675421646629096, "loss": 0.0087, "step": 202500 }, { "epoch": 1.02, "learning_rate": 0.00014674664877327694, "loss": 0.009, "step": 202510 }, { "epoch": 1.02, "learning_rate": 0.00014673908108026295, "loss": 0.0089, "step": 202520 }, { "epoch": 1.02, "learning_rate": 0.00014673151338724893, "loss": 0.0103, "step": 202530 }, { "epoch": 1.02, "learning_rate": 0.00014672394569423491, "loss": 0.0107, "step": 202540 }, { "epoch": 1.02, "learning_rate": 0.00014671637800122092, "loss": 0.0122, "step": 202550 }, { "epoch": 1.02, "learning_rate": 0.0001467088103082069, "loss": 0.0078, "step": 202560 }, { "epoch": 1.02, "learning_rate": 0.00014670124261519289, "loss": 0.0089, "step": 202570 }, { "epoch": 1.02, "learning_rate": 0.0001466936749221789, "loss": 0.0092, "step": 202580 }, { "epoch": 1.02, "learning_rate": 0.00014668610722916488, "loss": 0.0077, "step": 202590 }, { "epoch": 1.02, "learning_rate": 0.00014667853953615086, "loss": 0.0095, "step": 202600 }, { "epoch": 1.02, "learning_rate": 0.00014667097184313687, "loss": 0.0124, "step": 202610 }, { "epoch": 1.02, "learning_rate": 0.00014666340415012285, "loss": 0.0125, "step": 202620 }, { "epoch": 1.02, "learning_rate": 0.00014665583645710883, "loss": 0.0091, "step": 202630 }, { "epoch": 1.02, "learning_rate": 0.0001466482687640948, "loss": 0.0127, "step": 202640 }, { "epoch": 1.02, "learning_rate": 0.00014664070107108082, "loss": 0.0093, "step": 202650 }, { "epoch": 1.02, "learning_rate": 0.0001466331333780668, "loss": 0.0077, "step": 202660 }, { "epoch": 1.02, "learning_rate": 0.00014662556568505278, "loss": 0.009, "step": 202670 }, { "epoch": 1.02, "learning_rate": 0.00014661799799203876, "loss": 0.009, "step": 202680 }, { "epoch": 1.02, "learning_rate": 0.00014661043029902474, "loss": 0.0097, "step": 202690 }, { "epoch": 1.02, "learning_rate": 0.00014660286260601075, "loss": 0.0108, "step": 202700 }, { "epoch": 1.02, "learning_rate": 0.00014659529491299673, "loss": 0.008, "step": 202710 }, { "epoch": 1.02, "learning_rate": 0.00014658772721998272, "loss": 0.0108, "step": 202720 }, { "epoch": 1.02, "learning_rate": 0.00014658015952696872, "loss": 0.0106, "step": 202730 }, { "epoch": 1.02, "learning_rate": 0.0001465725918339547, "loss": 0.0076, "step": 202740 }, { "epoch": 1.02, "learning_rate": 0.0001465650241409407, "loss": 0.0103, "step": 202750 }, { "epoch": 1.02, "learning_rate": 0.0001465574564479267, "loss": 0.0091, "step": 202760 }, { "epoch": 1.02, "learning_rate": 0.00014654988875491268, "loss": 0.0123, "step": 202770 }, { "epoch": 1.02, "learning_rate": 0.00014654232106189866, "loss": 0.0091, "step": 202780 }, { "epoch": 1.02, "learning_rate": 0.00014653475336888467, "loss": 0.0102, "step": 202790 }, { "epoch": 1.02, "learning_rate": 0.00014652718567587065, "loss": 0.0102, "step": 202800 }, { "epoch": 1.02, "learning_rate": 0.00014651961798285663, "loss": 0.008, "step": 202810 }, { "epoch": 1.02, "learning_rate": 0.0001465120502898426, "loss": 0.009, "step": 202820 }, { "epoch": 1.02, "learning_rate": 0.00014650448259682862, "loss": 0.0087, "step": 202830 }, { "epoch": 1.02, "learning_rate": 0.0001464969149038146, "loss": 0.0105, "step": 202840 }, { "epoch": 1.02, "learning_rate": 0.00014648934721080058, "loss": 0.0101, "step": 202850 }, { "epoch": 1.02, "learning_rate": 0.0001464817795177866, "loss": 0.0102, "step": 202860 }, { "epoch": 1.02, "learning_rate": 0.00014647421182477257, "loss": 0.0074, "step": 202870 }, { "epoch": 1.02, "learning_rate": 0.00014646664413175856, "loss": 0.0104, "step": 202880 }, { "epoch": 1.02, "learning_rate": 0.00014645907643874456, "loss": 0.0068, "step": 202890 }, { "epoch": 1.02, "learning_rate": 0.00014645150874573055, "loss": 0.0109, "step": 202900 }, { "epoch": 1.02, "learning_rate": 0.00014644394105271653, "loss": 0.0077, "step": 202910 }, { "epoch": 1.02, "learning_rate": 0.00014643637335970254, "loss": 0.0091, "step": 202920 }, { "epoch": 1.02, "learning_rate": 0.00014642880566668852, "loss": 0.0073, "step": 202930 }, { "epoch": 1.02, "learning_rate": 0.0001464212379736745, "loss": 0.0098, "step": 202940 }, { "epoch": 1.02, "learning_rate": 0.0001464136702806605, "loss": 0.0105, "step": 202950 }, { "epoch": 1.02, "learning_rate": 0.0001464061025876465, "loss": 0.0083, "step": 202960 }, { "epoch": 1.02, "learning_rate": 0.00014639853489463247, "loss": 0.0143, "step": 202970 }, { "epoch": 1.02, "learning_rate": 0.00014639096720161845, "loss": 0.0102, "step": 202980 }, { "epoch": 1.02, "learning_rate": 0.00014638339950860446, "loss": 0.0104, "step": 202990 }, { "epoch": 1.02, "learning_rate": 0.00014637583181559044, "loss": 0.0112, "step": 203000 }, { "epoch": 1.02, "eval_cer": 0.9144663743186606, "eval_loss": 0.0076591866090893745, "eval_runtime": 117.2192, "eval_samples_per_second": 17.062, "eval_steps_per_second": 4.266, "step": 203000 }, { "epoch": 1.02, "learning_rate": 0.00014636826412257642, "loss": 0.0068, "step": 203010 }, { "epoch": 1.02, "learning_rate": 0.00014636069642956243, "loss": 0.0078, "step": 203020 }, { "epoch": 1.02, "learning_rate": 0.0001463531287365484, "loss": 0.0119, "step": 203030 }, { "epoch": 1.02, "learning_rate": 0.0001463455610435344, "loss": 0.0111, "step": 203040 }, { "epoch": 1.02, "learning_rate": 0.0001463379933505204, "loss": 0.0103, "step": 203050 }, { "epoch": 1.02, "learning_rate": 0.00014633042565750638, "loss": 0.0069, "step": 203060 }, { "epoch": 1.02, "learning_rate": 0.00014632285796449237, "loss": 0.0126, "step": 203070 }, { "epoch": 1.02, "learning_rate": 0.00014631529027147837, "loss": 0.0096, "step": 203080 }, { "epoch": 1.02, "learning_rate": 0.00014630772257846436, "loss": 0.0093, "step": 203090 }, { "epoch": 1.02, "learning_rate": 0.00014630015488545034, "loss": 0.0112, "step": 203100 }, { "epoch": 1.02, "learning_rate": 0.00014629258719243635, "loss": 0.0092, "step": 203110 }, { "epoch": 1.02, "learning_rate": 0.00014628501949942233, "loss": 0.0113, "step": 203120 }, { "epoch": 1.02, "learning_rate": 0.0001462774518064083, "loss": 0.0084, "step": 203130 }, { "epoch": 1.02, "learning_rate": 0.00014626988411339432, "loss": 0.0112, "step": 203140 }, { "epoch": 1.02, "learning_rate": 0.0001462623164203803, "loss": 0.0112, "step": 203150 }, { "epoch": 1.02, "learning_rate": 0.00014625474872736628, "loss": 0.0124, "step": 203160 }, { "epoch": 1.03, "learning_rate": 0.00014624718103435226, "loss": 0.0087, "step": 203170 }, { "epoch": 1.03, "learning_rate": 0.00014623961334133827, "loss": 0.0082, "step": 203180 }, { "epoch": 1.03, "learning_rate": 0.00014623204564832425, "loss": 0.0099, "step": 203190 }, { "epoch": 1.03, "learning_rate": 0.00014622447795531023, "loss": 0.0091, "step": 203200 }, { "epoch": 1.03, "learning_rate": 0.00014621691026229624, "loss": 0.0085, "step": 203210 }, { "epoch": 1.03, "learning_rate": 0.00014620934256928222, "loss": 0.01, "step": 203220 }, { "epoch": 1.03, "learning_rate": 0.0001462017748762682, "loss": 0.0103, "step": 203230 }, { "epoch": 1.03, "learning_rate": 0.0001461942071832542, "loss": 0.0097, "step": 203240 }, { "epoch": 1.03, "learning_rate": 0.0001461866394902402, "loss": 0.0103, "step": 203250 }, { "epoch": 1.03, "learning_rate": 0.00014617907179722618, "loss": 0.0112, "step": 203260 }, { "epoch": 1.03, "learning_rate": 0.00014617150410421218, "loss": 0.0121, "step": 203270 }, { "epoch": 1.03, "learning_rate": 0.00014616393641119817, "loss": 0.0097, "step": 203280 }, { "epoch": 1.03, "learning_rate": 0.00014615636871818415, "loss": 0.0122, "step": 203290 }, { "epoch": 1.03, "learning_rate": 0.00014614880102517016, "loss": 0.0086, "step": 203300 }, { "epoch": 1.03, "learning_rate": 0.0001461412333321561, "loss": 0.011, "step": 203310 }, { "epoch": 1.03, "learning_rate": 0.00014613366563914212, "loss": 0.0109, "step": 203320 }, { "epoch": 1.03, "learning_rate": 0.0001461260979461281, "loss": 0.0095, "step": 203330 }, { "epoch": 1.03, "learning_rate": 0.00014611853025311408, "loss": 0.0088, "step": 203340 }, { "epoch": 1.03, "learning_rate": 0.00014611096256010006, "loss": 0.0085, "step": 203350 }, { "epoch": 1.03, "learning_rate": 0.00014610339486708607, "loss": 0.0097, "step": 203360 }, { "epoch": 1.03, "learning_rate": 0.00014609582717407205, "loss": 0.0085, "step": 203370 }, { "epoch": 1.03, "learning_rate": 0.00014608825948105803, "loss": 0.0098, "step": 203380 }, { "epoch": 1.03, "learning_rate": 0.00014608069178804404, "loss": 0.0085, "step": 203390 }, { "epoch": 1.03, "learning_rate": 0.00014607312409503002, "loss": 0.0095, "step": 203400 }, { "epoch": 1.03, "learning_rate": 0.000146065556402016, "loss": 0.0063, "step": 203410 }, { "epoch": 1.03, "learning_rate": 0.00014605798870900201, "loss": 0.0093, "step": 203420 }, { "epoch": 1.03, "learning_rate": 0.000146050421015988, "loss": 0.01, "step": 203430 }, { "epoch": 1.03, "learning_rate": 0.00014604285332297398, "loss": 0.0097, "step": 203440 }, { "epoch": 1.03, "learning_rate": 0.00014603528562995999, "loss": 0.009, "step": 203450 }, { "epoch": 1.03, "learning_rate": 0.00014602771793694597, "loss": 0.0107, "step": 203460 }, { "epoch": 1.03, "learning_rate": 0.00014602015024393195, "loss": 0.008, "step": 203470 }, { "epoch": 1.03, "learning_rate": 0.00014601258255091796, "loss": 0.0097, "step": 203480 }, { "epoch": 1.03, "learning_rate": 0.00014600501485790394, "loss": 0.0107, "step": 203490 }, { "epoch": 1.03, "learning_rate": 0.00014599744716488992, "loss": 0.0069, "step": 203500 }, { "epoch": 1.03, "learning_rate": 0.00014598987947187593, "loss": 0.0118, "step": 203510 }, { "epoch": 1.03, "learning_rate": 0.0001459823117788619, "loss": 0.0086, "step": 203520 }, { "epoch": 1.03, "learning_rate": 0.0001459747440858479, "loss": 0.0093, "step": 203530 }, { "epoch": 1.03, "learning_rate": 0.00014596717639283387, "loss": 0.0102, "step": 203540 }, { "epoch": 1.03, "learning_rate": 0.00014595960869981988, "loss": 0.009, "step": 203550 }, { "epoch": 1.03, "learning_rate": 0.00014595204100680586, "loss": 0.0115, "step": 203560 }, { "epoch": 1.03, "learning_rate": 0.00014594447331379184, "loss": 0.0093, "step": 203570 }, { "epoch": 1.03, "learning_rate": 0.00014593690562077785, "loss": 0.0092, "step": 203580 }, { "epoch": 1.03, "learning_rate": 0.00014592933792776383, "loss": 0.0089, "step": 203590 }, { "epoch": 1.03, "learning_rate": 0.00014592177023474982, "loss": 0.0102, "step": 203600 }, { "epoch": 1.03, "learning_rate": 0.00014591420254173582, "loss": 0.0102, "step": 203610 }, { "epoch": 1.03, "learning_rate": 0.0001459066348487218, "loss": 0.0117, "step": 203620 }, { "epoch": 1.03, "learning_rate": 0.0001458990671557078, "loss": 0.0095, "step": 203630 }, { "epoch": 1.03, "learning_rate": 0.0001458914994626938, "loss": 0.0096, "step": 203640 }, { "epoch": 1.03, "learning_rate": 0.00014588393176967978, "loss": 0.0098, "step": 203650 }, { "epoch": 1.03, "learning_rate": 0.00014587636407666576, "loss": 0.0112, "step": 203660 }, { "epoch": 1.03, "learning_rate": 0.00014586879638365177, "loss": 0.0091, "step": 203670 }, { "epoch": 1.03, "learning_rate": 0.00014586122869063775, "loss": 0.0091, "step": 203680 }, { "epoch": 1.03, "learning_rate": 0.00014585366099762373, "loss": 0.0123, "step": 203690 }, { "epoch": 1.03, "learning_rate": 0.0001458460933046097, "loss": 0.0098, "step": 203700 }, { "epoch": 1.03, "learning_rate": 0.00014583852561159572, "loss": 0.0117, "step": 203710 }, { "epoch": 1.03, "learning_rate": 0.0001458309579185817, "loss": 0.0095, "step": 203720 }, { "epoch": 1.03, "learning_rate": 0.00014582339022556768, "loss": 0.0101, "step": 203730 }, { "epoch": 1.03, "learning_rate": 0.0001458158225325537, "loss": 0.0086, "step": 203740 }, { "epoch": 1.03, "learning_rate": 0.00014580825483953967, "loss": 0.0114, "step": 203750 }, { "epoch": 1.03, "learning_rate": 0.00014580068714652565, "loss": 0.0103, "step": 203760 }, { "epoch": 1.03, "learning_rate": 0.00014579311945351166, "loss": 0.009, "step": 203770 }, { "epoch": 1.03, "learning_rate": 0.00014578555176049764, "loss": 0.0099, "step": 203780 }, { "epoch": 1.03, "learning_rate": 0.00014577798406748363, "loss": 0.0109, "step": 203790 }, { "epoch": 1.03, "learning_rate": 0.00014577041637446963, "loss": 0.0094, "step": 203800 }, { "epoch": 1.03, "learning_rate": 0.00014576284868145562, "loss": 0.0113, "step": 203810 }, { "epoch": 1.03, "learning_rate": 0.0001457552809884416, "loss": 0.0124, "step": 203820 }, { "epoch": 1.03, "learning_rate": 0.0001457477132954276, "loss": 0.0104, "step": 203830 }, { "epoch": 1.03, "learning_rate": 0.0001457401456024136, "loss": 0.0105, "step": 203840 }, { "epoch": 1.03, "learning_rate": 0.00014573257790939957, "loss": 0.0132, "step": 203850 }, { "epoch": 1.03, "learning_rate": 0.00014572501021638555, "loss": 0.0131, "step": 203860 }, { "epoch": 1.03, "learning_rate": 0.00014571744252337156, "loss": 0.0109, "step": 203870 }, { "epoch": 1.03, "learning_rate": 0.00014570987483035754, "loss": 0.0103, "step": 203880 }, { "epoch": 1.03, "learning_rate": 0.00014570230713734352, "loss": 0.0121, "step": 203890 }, { "epoch": 1.03, "learning_rate": 0.00014569473944432953, "loss": 0.0119, "step": 203900 }, { "epoch": 1.03, "learning_rate": 0.0001456871717513155, "loss": 0.0101, "step": 203910 }, { "epoch": 1.03, "learning_rate": 0.0001456796040583015, "loss": 0.0117, "step": 203920 }, { "epoch": 1.03, "learning_rate": 0.00014567203636528747, "loss": 0.0107, "step": 203930 }, { "epoch": 1.03, "learning_rate": 0.00014566446867227346, "loss": 0.0096, "step": 203940 }, { "epoch": 1.03, "learning_rate": 0.00014565690097925946, "loss": 0.0089, "step": 203950 }, { "epoch": 1.03, "learning_rate": 0.00014564933328624545, "loss": 0.0073, "step": 203960 }, { "epoch": 1.03, "learning_rate": 0.00014564176559323143, "loss": 0.0089, "step": 203970 }, { "epoch": 1.03, "learning_rate": 0.00014563419790021744, "loss": 0.0104, "step": 203980 }, { "epoch": 1.03, "learning_rate": 0.00014562663020720342, "loss": 0.0087, "step": 203990 }, { "epoch": 1.03, "learning_rate": 0.0001456190625141894, "loss": 0.0129, "step": 204000 }, { "epoch": 1.03, "eval_cer": 0.9144741374876638, "eval_loss": 0.007685788441449404, "eval_runtime": 116.7131, "eval_samples_per_second": 17.136, "eval_steps_per_second": 4.284, "step": 204000 }, { "epoch": 1.03, "learning_rate": 0.0001456114948211754, "loss": 0.0097, "step": 204010 }, { "epoch": 1.03, "learning_rate": 0.0001456039271281614, "loss": 0.0117, "step": 204020 }, { "epoch": 1.03, "learning_rate": 0.00014559635943514737, "loss": 0.0079, "step": 204030 }, { "epoch": 1.03, "learning_rate": 0.00014558879174213338, "loss": 0.0103, "step": 204040 }, { "epoch": 1.03, "learning_rate": 0.00014558122404911936, "loss": 0.0096, "step": 204050 }, { "epoch": 1.03, "learning_rate": 0.00014557365635610534, "loss": 0.008, "step": 204060 }, { "epoch": 1.03, "learning_rate": 0.00014556608866309132, "loss": 0.0097, "step": 204070 }, { "epoch": 1.03, "learning_rate": 0.00014555852097007733, "loss": 0.0095, "step": 204080 }, { "epoch": 1.03, "learning_rate": 0.0001455509532770633, "loss": 0.0104, "step": 204090 }, { "epoch": 1.03, "learning_rate": 0.0001455433855840493, "loss": 0.0104, "step": 204100 }, { "epoch": 1.03, "learning_rate": 0.0001455358178910353, "loss": 0.0085, "step": 204110 }, { "epoch": 1.03, "learning_rate": 0.00014552825019802128, "loss": 0.0133, "step": 204120 }, { "epoch": 1.03, "learning_rate": 0.00014552068250500727, "loss": 0.0113, "step": 204130 }, { "epoch": 1.03, "learning_rate": 0.00014551311481199327, "loss": 0.0101, "step": 204140 }, { "epoch": 1.03, "learning_rate": 0.00014550554711897926, "loss": 0.008, "step": 204150 }, { "epoch": 1.03, "learning_rate": 0.00014549797942596524, "loss": 0.0104, "step": 204160 }, { "epoch": 1.03, "learning_rate": 0.00014549041173295125, "loss": 0.0104, "step": 204170 }, { "epoch": 1.03, "learning_rate": 0.00014548284403993723, "loss": 0.0098, "step": 204180 }, { "epoch": 1.03, "learning_rate": 0.0001454752763469232, "loss": 0.009, "step": 204190 }, { "epoch": 1.03, "learning_rate": 0.00014546770865390922, "loss": 0.0093, "step": 204200 }, { "epoch": 1.03, "learning_rate": 0.0001454601409608952, "loss": 0.0102, "step": 204210 }, { "epoch": 1.03, "learning_rate": 0.00014545257326788118, "loss": 0.0134, "step": 204220 }, { "epoch": 1.03, "learning_rate": 0.00014544500557486716, "loss": 0.0116, "step": 204230 }, { "epoch": 1.03, "learning_rate": 0.00014543743788185317, "loss": 0.0145, "step": 204240 }, { "epoch": 1.03, "learning_rate": 0.00014542987018883915, "loss": 0.0131, "step": 204250 }, { "epoch": 1.03, "learning_rate": 0.00014542230249582513, "loss": 0.0092, "step": 204260 }, { "epoch": 1.03, "learning_rate": 0.00014541473480281114, "loss": 0.0095, "step": 204270 }, { "epoch": 1.03, "learning_rate": 0.00014540716710979712, "loss": 0.0092, "step": 204280 }, { "epoch": 1.03, "learning_rate": 0.0001453995994167831, "loss": 0.0087, "step": 204290 }, { "epoch": 1.03, "learning_rate": 0.0001453920317237691, "loss": 0.0116, "step": 204300 }, { "epoch": 1.03, "learning_rate": 0.0001453844640307551, "loss": 0.0102, "step": 204310 }, { "epoch": 1.03, "learning_rate": 0.00014537689633774108, "loss": 0.0114, "step": 204320 }, { "epoch": 1.03, "learning_rate": 0.00014536932864472708, "loss": 0.0109, "step": 204330 }, { "epoch": 1.03, "learning_rate": 0.00014536176095171307, "loss": 0.0112, "step": 204340 }, { "epoch": 1.03, "learning_rate": 0.00014535419325869905, "loss": 0.0093, "step": 204350 }, { "epoch": 1.03, "learning_rate": 0.00014534662556568506, "loss": 0.0092, "step": 204360 }, { "epoch": 1.03, "learning_rate": 0.00014533905787267104, "loss": 0.0123, "step": 204370 }, { "epoch": 1.03, "learning_rate": 0.00014533149017965702, "loss": 0.009, "step": 204380 }, { "epoch": 1.03, "learning_rate": 0.000145323922486643, "loss": 0.0106, "step": 204390 }, { "epoch": 1.03, "learning_rate": 0.000145316354793629, "loss": 0.0101, "step": 204400 }, { "epoch": 1.03, "learning_rate": 0.000145308787100615, "loss": 0.0129, "step": 204410 }, { "epoch": 1.03, "learning_rate": 0.00014530121940760097, "loss": 0.0094, "step": 204420 }, { "epoch": 1.03, "learning_rate": 0.00014529365171458698, "loss": 0.0116, "step": 204430 }, { "epoch": 1.03, "learning_rate": 0.00014528608402157296, "loss": 0.0095, "step": 204440 }, { "epoch": 1.03, "learning_rate": 0.00014527851632855894, "loss": 0.0114, "step": 204450 }, { "epoch": 1.03, "learning_rate": 0.00014527094863554495, "loss": 0.0093, "step": 204460 }, { "epoch": 1.03, "learning_rate": 0.00014526338094253093, "loss": 0.0084, "step": 204470 }, { "epoch": 1.03, "learning_rate": 0.00014525581324951691, "loss": 0.0095, "step": 204480 }, { "epoch": 1.03, "learning_rate": 0.00014524824555650292, "loss": 0.0102, "step": 204490 }, { "epoch": 1.03, "learning_rate": 0.0001452406778634889, "loss": 0.0102, "step": 204500 }, { "epoch": 1.03, "learning_rate": 0.00014523311017047489, "loss": 0.0083, "step": 204510 }, { "epoch": 1.03, "learning_rate": 0.0001452255424774609, "loss": 0.0098, "step": 204520 }, { "epoch": 1.03, "learning_rate": 0.00014521797478444688, "loss": 0.0112, "step": 204530 }, { "epoch": 1.03, "learning_rate": 0.00014521040709143286, "loss": 0.0112, "step": 204540 }, { "epoch": 1.03, "learning_rate": 0.00014520283939841887, "loss": 0.0103, "step": 204550 }, { "epoch": 1.03, "learning_rate": 0.00014519527170540482, "loss": 0.0103, "step": 204560 }, { "epoch": 1.03, "learning_rate": 0.00014518770401239083, "loss": 0.0155, "step": 204570 }, { "epoch": 1.03, "learning_rate": 0.0001451801363193768, "loss": 0.0085, "step": 204580 }, { "epoch": 1.03, "learning_rate": 0.0001451725686263628, "loss": 0.009, "step": 204590 }, { "epoch": 1.03, "learning_rate": 0.00014516500093334877, "loss": 0.0116, "step": 204600 }, { "epoch": 1.03, "learning_rate": 0.00014515743324033478, "loss": 0.0101, "step": 204610 }, { "epoch": 1.03, "learning_rate": 0.00014514986554732076, "loss": 0.0123, "step": 204620 }, { "epoch": 1.03, "learning_rate": 0.00014514229785430674, "loss": 0.0081, "step": 204630 }, { "epoch": 1.03, "learning_rate": 0.00014513473016129275, "loss": 0.01, "step": 204640 }, { "epoch": 1.03, "learning_rate": 0.00014512716246827873, "loss": 0.013, "step": 204650 }, { "epoch": 1.03, "learning_rate": 0.00014511959477526472, "loss": 0.009, "step": 204660 }, { "epoch": 1.03, "learning_rate": 0.00014511202708225072, "loss": 0.0089, "step": 204670 }, { "epoch": 1.03, "learning_rate": 0.0001451044593892367, "loss": 0.0136, "step": 204680 }, { "epoch": 1.03, "learning_rate": 0.0001450968916962227, "loss": 0.0098, "step": 204690 }, { "epoch": 1.03, "learning_rate": 0.0001450893240032087, "loss": 0.0125, "step": 204700 }, { "epoch": 1.03, "learning_rate": 0.00014508175631019468, "loss": 0.0101, "step": 204710 }, { "epoch": 1.03, "learning_rate": 0.00014507418861718066, "loss": 0.0109, "step": 204720 }, { "epoch": 1.03, "learning_rate": 0.00014506662092416667, "loss": 0.0129, "step": 204730 }, { "epoch": 1.03, "learning_rate": 0.00014505905323115265, "loss": 0.0087, "step": 204740 }, { "epoch": 1.03, "learning_rate": 0.00014505148553813863, "loss": 0.0107, "step": 204750 }, { "epoch": 1.03, "learning_rate": 0.0001450439178451246, "loss": 0.0156, "step": 204760 }, { "epoch": 1.03, "learning_rate": 0.00014503635015211062, "loss": 0.0087, "step": 204770 }, { "epoch": 1.03, "learning_rate": 0.0001450287824590966, "loss": 0.0073, "step": 204780 }, { "epoch": 1.03, "learning_rate": 0.00014502121476608258, "loss": 0.008, "step": 204790 }, { "epoch": 1.03, "learning_rate": 0.0001450136470730686, "loss": 0.0084, "step": 204800 }, { "epoch": 1.03, "learning_rate": 0.00014500607938005457, "loss": 0.0102, "step": 204810 }, { "epoch": 1.03, "learning_rate": 0.00014499851168704055, "loss": 0.0112, "step": 204820 }, { "epoch": 1.03, "learning_rate": 0.00014499094399402656, "loss": 0.0088, "step": 204830 }, { "epoch": 1.03, "learning_rate": 0.00014498337630101254, "loss": 0.0097, "step": 204840 }, { "epoch": 1.03, "learning_rate": 0.00014497580860799853, "loss": 0.0086, "step": 204850 }, { "epoch": 1.03, "learning_rate": 0.00014496824091498453, "loss": 0.0077, "step": 204860 }, { "epoch": 1.03, "learning_rate": 0.00014496067322197052, "loss": 0.0092, "step": 204870 }, { "epoch": 1.03, "learning_rate": 0.0001449531055289565, "loss": 0.0108, "step": 204880 }, { "epoch": 1.03, "learning_rate": 0.0001449455378359425, "loss": 0.0111, "step": 204890 }, { "epoch": 1.03, "learning_rate": 0.0001449379701429285, "loss": 0.0098, "step": 204900 }, { "epoch": 1.03, "learning_rate": 0.00014493040244991447, "loss": 0.0112, "step": 204910 }, { "epoch": 1.03, "learning_rate": 0.00014492283475690045, "loss": 0.0082, "step": 204920 }, { "epoch": 1.03, "learning_rate": 0.00014491526706388646, "loss": 0.0109, "step": 204930 }, { "epoch": 1.03, "learning_rate": 0.00014490769937087244, "loss": 0.0086, "step": 204940 }, { "epoch": 1.03, "learning_rate": 0.00014490013167785842, "loss": 0.0087, "step": 204950 }, { "epoch": 1.03, "learning_rate": 0.00014489256398484443, "loss": 0.0114, "step": 204960 }, { "epoch": 1.03, "learning_rate": 0.0001448849962918304, "loss": 0.01, "step": 204970 }, { "epoch": 1.03, "learning_rate": 0.0001448774285988164, "loss": 0.0073, "step": 204980 }, { "epoch": 1.03, "learning_rate": 0.0001448698609058024, "loss": 0.0077, "step": 204990 }, { "epoch": 1.03, "learning_rate": 0.00014486229321278838, "loss": 0.0101, "step": 205000 }, { "epoch": 1.03, "eval_cer": 0.9144615223380336, "eval_loss": 0.007726417388767004, "eval_runtime": 116.6083, "eval_samples_per_second": 17.151, "eval_steps_per_second": 4.288, "step": 205000 }, { "epoch": 1.03, "learning_rate": 0.00014485472551977436, "loss": 0.0074, "step": 205010 }, { "epoch": 1.03, "learning_rate": 0.00014484715782676037, "loss": 0.0116, "step": 205020 }, { "epoch": 1.03, "learning_rate": 0.00014483959013374635, "loss": 0.0089, "step": 205030 }, { "epoch": 1.03, "learning_rate": 0.00014483202244073234, "loss": 0.0081, "step": 205040 }, { "epoch": 1.03, "learning_rate": 0.00014482445474771834, "loss": 0.0119, "step": 205050 }, { "epoch": 1.03, "learning_rate": 0.00014481688705470433, "loss": 0.0079, "step": 205060 }, { "epoch": 1.03, "learning_rate": 0.0001448093193616903, "loss": 0.0084, "step": 205070 }, { "epoch": 1.03, "learning_rate": 0.00014480175166867632, "loss": 0.0103, "step": 205080 }, { "epoch": 1.03, "learning_rate": 0.0001447941839756623, "loss": 0.013, "step": 205090 }, { "epoch": 1.03, "learning_rate": 0.00014478661628264828, "loss": 0.0105, "step": 205100 }, { "epoch": 1.03, "learning_rate": 0.00014477904858963426, "loss": 0.0088, "step": 205110 }, { "epoch": 1.03, "learning_rate": 0.00014477148089662027, "loss": 0.0107, "step": 205120 }, { "epoch": 1.03, "learning_rate": 0.00014476391320360625, "loss": 0.0088, "step": 205130 }, { "epoch": 1.03, "learning_rate": 0.00014475634551059223, "loss": 0.0085, "step": 205140 }, { "epoch": 1.04, "learning_rate": 0.00014474877781757824, "loss": 0.0087, "step": 205150 }, { "epoch": 1.04, "learning_rate": 0.00014474121012456422, "loss": 0.0076, "step": 205160 }, { "epoch": 1.04, "learning_rate": 0.0001447336424315502, "loss": 0.011, "step": 205170 }, { "epoch": 1.04, "learning_rate": 0.0001447260747385362, "loss": 0.012, "step": 205180 }, { "epoch": 1.04, "learning_rate": 0.00014471850704552217, "loss": 0.011, "step": 205190 }, { "epoch": 1.04, "learning_rate": 0.00014471093935250817, "loss": 0.01, "step": 205200 }, { "epoch": 1.04, "learning_rate": 0.00014470337165949416, "loss": 0.0123, "step": 205210 }, { "epoch": 1.04, "learning_rate": 0.00014469580396648014, "loss": 0.0109, "step": 205220 }, { "epoch": 1.04, "learning_rate": 0.00014468823627346615, "loss": 0.0093, "step": 205230 }, { "epoch": 1.04, "learning_rate": 0.00014468066858045213, "loss": 0.0094, "step": 205240 }, { "epoch": 1.04, "learning_rate": 0.0001446731008874381, "loss": 0.0103, "step": 205250 }, { "epoch": 1.04, "learning_rate": 0.00014466553319442412, "loss": 0.0082, "step": 205260 }, { "epoch": 1.04, "learning_rate": 0.0001446579655014101, "loss": 0.009, "step": 205270 }, { "epoch": 1.04, "learning_rate": 0.00014465039780839608, "loss": 0.0119, "step": 205280 }, { "epoch": 1.04, "learning_rate": 0.00014464283011538206, "loss": 0.0084, "step": 205290 }, { "epoch": 1.04, "learning_rate": 0.00014463526242236807, "loss": 0.0083, "step": 205300 }, { "epoch": 1.04, "learning_rate": 0.00014462769472935405, "loss": 0.0115, "step": 205310 }, { "epoch": 1.04, "learning_rate": 0.00014462012703634003, "loss": 0.0095, "step": 205320 }, { "epoch": 1.04, "learning_rate": 0.00014461255934332604, "loss": 0.009, "step": 205330 }, { "epoch": 1.04, "learning_rate": 0.00014460499165031202, "loss": 0.0096, "step": 205340 }, { "epoch": 1.04, "learning_rate": 0.000144597423957298, "loss": 0.0134, "step": 205350 }, { "epoch": 1.04, "learning_rate": 0.000144589856264284, "loss": 0.0081, "step": 205360 }, { "epoch": 1.04, "learning_rate": 0.00014458228857127, "loss": 0.0103, "step": 205370 }, { "epoch": 1.04, "learning_rate": 0.00014457472087825598, "loss": 0.0089, "step": 205380 }, { "epoch": 1.04, "learning_rate": 0.00014456715318524198, "loss": 0.0101, "step": 205390 }, { "epoch": 1.04, "learning_rate": 0.00014455958549222797, "loss": 0.0081, "step": 205400 }, { "epoch": 1.04, "learning_rate": 0.00014455201779921395, "loss": 0.0104, "step": 205410 }, { "epoch": 1.04, "learning_rate": 0.00014454445010619996, "loss": 0.0136, "step": 205420 }, { "epoch": 1.04, "learning_rate": 0.00014453688241318594, "loss": 0.0105, "step": 205430 }, { "epoch": 1.04, "learning_rate": 0.00014452931472017192, "loss": 0.0083, "step": 205440 }, { "epoch": 1.04, "learning_rate": 0.00014452174702715793, "loss": 0.0091, "step": 205450 }, { "epoch": 1.04, "learning_rate": 0.0001445141793341439, "loss": 0.0103, "step": 205460 }, { "epoch": 1.04, "learning_rate": 0.0001445066116411299, "loss": 0.0091, "step": 205470 }, { "epoch": 1.04, "learning_rate": 0.00014449904394811587, "loss": 0.0117, "step": 205480 }, { "epoch": 1.04, "learning_rate": 0.00014449147625510188, "loss": 0.011, "step": 205490 }, { "epoch": 1.04, "learning_rate": 0.00014448390856208786, "loss": 0.0097, "step": 205500 }, { "epoch": 1.04, "learning_rate": 0.00014447634086907384, "loss": 0.0082, "step": 205510 }, { "epoch": 1.04, "learning_rate": 0.00014446877317605985, "loss": 0.0077, "step": 205520 }, { "epoch": 1.04, "learning_rate": 0.00014446120548304583, "loss": 0.0106, "step": 205530 }, { "epoch": 1.04, "learning_rate": 0.00014445363779003181, "loss": 0.0116, "step": 205540 }, { "epoch": 1.04, "learning_rate": 0.00014444607009701782, "loss": 0.0111, "step": 205550 }, { "epoch": 1.04, "learning_rate": 0.0001444385024040038, "loss": 0.0081, "step": 205560 }, { "epoch": 1.04, "learning_rate": 0.00014443093471098979, "loss": 0.0096, "step": 205570 }, { "epoch": 1.04, "learning_rate": 0.0001444233670179758, "loss": 0.0108, "step": 205580 }, { "epoch": 1.04, "learning_rate": 0.00014441579932496178, "loss": 0.0076, "step": 205590 }, { "epoch": 1.04, "learning_rate": 0.00014440823163194776, "loss": 0.0106, "step": 205600 }, { "epoch": 1.04, "learning_rate": 0.00014440066393893377, "loss": 0.0106, "step": 205610 }, { "epoch": 1.04, "learning_rate": 0.00014439309624591975, "loss": 0.0089, "step": 205620 }, { "epoch": 1.04, "learning_rate": 0.00014438552855290573, "loss": 0.0099, "step": 205630 }, { "epoch": 1.04, "learning_rate": 0.0001443779608598917, "loss": 0.0117, "step": 205640 }, { "epoch": 1.04, "learning_rate": 0.00014437039316687772, "loss": 0.0088, "step": 205650 }, { "epoch": 1.04, "learning_rate": 0.0001443628254738637, "loss": 0.0078, "step": 205660 }, { "epoch": 1.04, "learning_rate": 0.00014435525778084968, "loss": 0.0135, "step": 205670 }, { "epoch": 1.04, "learning_rate": 0.0001443476900878357, "loss": 0.0093, "step": 205680 }, { "epoch": 1.04, "learning_rate": 0.00014434012239482167, "loss": 0.0097, "step": 205690 }, { "epoch": 1.04, "learning_rate": 0.00014433255470180765, "loss": 0.0102, "step": 205700 }, { "epoch": 1.04, "learning_rate": 0.00014432498700879366, "loss": 0.0102, "step": 205710 }, { "epoch": 1.04, "learning_rate": 0.00014431741931577964, "loss": 0.011, "step": 205720 }, { "epoch": 1.04, "learning_rate": 0.00014430985162276562, "loss": 0.0096, "step": 205730 }, { "epoch": 1.04, "learning_rate": 0.00014430228392975163, "loss": 0.0122, "step": 205740 }, { "epoch": 1.04, "learning_rate": 0.00014429471623673761, "loss": 0.0117, "step": 205750 }, { "epoch": 1.04, "learning_rate": 0.0001442871485437236, "loss": 0.0094, "step": 205760 }, { "epoch": 1.04, "learning_rate": 0.0001442795808507096, "loss": 0.01, "step": 205770 }, { "epoch": 1.04, "learning_rate": 0.00014427201315769559, "loss": 0.0115, "step": 205780 }, { "epoch": 1.04, "learning_rate": 0.00014426444546468157, "loss": 0.0081, "step": 205790 }, { "epoch": 1.04, "learning_rate": 0.00014425687777166755, "loss": 0.0088, "step": 205800 }, { "epoch": 1.04, "learning_rate": 0.00014424931007865356, "loss": 0.0095, "step": 205810 }, { "epoch": 1.04, "learning_rate": 0.0001442417423856395, "loss": 0.0092, "step": 205820 }, { "epoch": 1.04, "learning_rate": 0.00014423417469262552, "loss": 0.0106, "step": 205830 }, { "epoch": 1.04, "learning_rate": 0.0001442266069996115, "loss": 0.0065, "step": 205840 }, { "epoch": 1.04, "learning_rate": 0.00014421903930659748, "loss": 0.0106, "step": 205850 }, { "epoch": 1.04, "learning_rate": 0.0001442114716135835, "loss": 0.0092, "step": 205860 }, { "epoch": 1.04, "learning_rate": 0.00014420390392056947, "loss": 0.0094, "step": 205870 }, { "epoch": 1.04, "learning_rate": 0.00014419633622755545, "loss": 0.0103, "step": 205880 }, { "epoch": 1.04, "learning_rate": 0.00014418876853454146, "loss": 0.0116, "step": 205890 }, { "epoch": 1.04, "learning_rate": 0.00014418120084152744, "loss": 0.0106, "step": 205900 }, { "epoch": 1.04, "learning_rate": 0.00014417363314851343, "loss": 0.0106, "step": 205910 }, { "epoch": 1.04, "learning_rate": 0.00014416606545549943, "loss": 0.0135, "step": 205920 }, { "epoch": 1.04, "learning_rate": 0.00014415849776248542, "loss": 0.0098, "step": 205930 }, { "epoch": 1.04, "learning_rate": 0.0001441509300694714, "loss": 0.0085, "step": 205940 }, { "epoch": 1.04, "learning_rate": 0.0001441433623764574, "loss": 0.0087, "step": 205950 }, { "epoch": 1.04, "learning_rate": 0.0001441357946834434, "loss": 0.0073, "step": 205960 }, { "epoch": 1.04, "learning_rate": 0.00014412822699042937, "loss": 0.0101, "step": 205970 }, { "epoch": 1.04, "learning_rate": 0.00014412065929741538, "loss": 0.0088, "step": 205980 }, { "epoch": 1.04, "learning_rate": 0.00014411309160440136, "loss": 0.0084, "step": 205990 }, { "epoch": 1.04, "learning_rate": 0.00014410552391138734, "loss": 0.0122, "step": 206000 }, { "epoch": 1.04, "eval_cer": 0.914452788772905, "eval_loss": 0.007414559833705425, "eval_runtime": 116.657, "eval_samples_per_second": 17.144, "eval_steps_per_second": 4.286, "step": 206000 }, { "epoch": 1.04, "learning_rate": 0.00014409795621837332, "loss": 0.0079, "step": 206010 }, { "epoch": 1.04, "learning_rate": 0.00014409038852535933, "loss": 0.0104, "step": 206020 }, { "epoch": 1.04, "learning_rate": 0.0001440828208323453, "loss": 0.0149, "step": 206030 }, { "epoch": 1.04, "learning_rate": 0.0001440752531393313, "loss": 0.0109, "step": 206040 }, { "epoch": 1.04, "learning_rate": 0.0001440676854463173, "loss": 0.0074, "step": 206050 }, { "epoch": 1.04, "learning_rate": 0.00014406011775330328, "loss": 0.0079, "step": 206060 }, { "epoch": 1.04, "learning_rate": 0.00014405255006028926, "loss": 0.0116, "step": 206070 }, { "epoch": 1.04, "learning_rate": 0.00014404498236727527, "loss": 0.0102, "step": 206080 }, { "epoch": 1.04, "learning_rate": 0.00014403741467426125, "loss": 0.0083, "step": 206090 }, { "epoch": 1.04, "learning_rate": 0.00014402984698124724, "loss": 0.0103, "step": 206100 }, { "epoch": 1.04, "learning_rate": 0.00014402227928823324, "loss": 0.0104, "step": 206110 }, { "epoch": 1.04, "learning_rate": 0.00014401471159521923, "loss": 0.0131, "step": 206120 }, { "epoch": 1.04, "learning_rate": 0.0001440071439022052, "loss": 0.0095, "step": 206130 }, { "epoch": 1.04, "learning_rate": 0.00014399957620919122, "loss": 0.0094, "step": 206140 }, { "epoch": 1.04, "learning_rate": 0.0001439920085161772, "loss": 0.0094, "step": 206150 }, { "epoch": 1.04, "learning_rate": 0.00014398444082316318, "loss": 0.0097, "step": 206160 }, { "epoch": 1.04, "learning_rate": 0.00014397687313014916, "loss": 0.0098, "step": 206170 }, { "epoch": 1.04, "learning_rate": 0.00014396930543713517, "loss": 0.0089, "step": 206180 }, { "epoch": 1.04, "learning_rate": 0.00014396173774412115, "loss": 0.0111, "step": 206190 }, { "epoch": 1.04, "learning_rate": 0.00014395417005110713, "loss": 0.0104, "step": 206200 }, { "epoch": 1.04, "learning_rate": 0.00014394660235809314, "loss": 0.0091, "step": 206210 }, { "epoch": 1.04, "learning_rate": 0.00014393903466507912, "loss": 0.0094, "step": 206220 }, { "epoch": 1.04, "learning_rate": 0.0001439314669720651, "loss": 0.0101, "step": 206230 }, { "epoch": 1.04, "learning_rate": 0.0001439238992790511, "loss": 0.0108, "step": 206240 }, { "epoch": 1.04, "learning_rate": 0.0001439163315860371, "loss": 0.0113, "step": 206250 }, { "epoch": 1.04, "learning_rate": 0.00014390876389302307, "loss": 0.0099, "step": 206260 }, { "epoch": 1.04, "learning_rate": 0.00014390119620000908, "loss": 0.0088, "step": 206270 }, { "epoch": 1.04, "learning_rate": 0.00014389362850699506, "loss": 0.0087, "step": 206280 }, { "epoch": 1.04, "learning_rate": 0.00014388606081398105, "loss": 0.0105, "step": 206290 }, { "epoch": 1.04, "learning_rate": 0.00014387849312096705, "loss": 0.0109, "step": 206300 }, { "epoch": 1.04, "learning_rate": 0.00014387092542795304, "loss": 0.0121, "step": 206310 }, { "epoch": 1.04, "learning_rate": 0.00014386335773493902, "loss": 0.012, "step": 206320 }, { "epoch": 1.04, "learning_rate": 0.000143855790041925, "loss": 0.0095, "step": 206330 }, { "epoch": 1.04, "learning_rate": 0.000143848222348911, "loss": 0.0087, "step": 206340 }, { "epoch": 1.04, "learning_rate": 0.000143840654655897, "loss": 0.0126, "step": 206350 }, { "epoch": 1.04, "learning_rate": 0.00014383308696288297, "loss": 0.0082, "step": 206360 }, { "epoch": 1.04, "learning_rate": 0.00014382551926986898, "loss": 0.0112, "step": 206370 }, { "epoch": 1.04, "learning_rate": 0.00014381795157685496, "loss": 0.0122, "step": 206380 }, { "epoch": 1.04, "learning_rate": 0.00014381038388384094, "loss": 0.0088, "step": 206390 }, { "epoch": 1.04, "learning_rate": 0.00014380281619082695, "loss": 0.0093, "step": 206400 }, { "epoch": 1.04, "learning_rate": 0.00014379524849781293, "loss": 0.0104, "step": 206410 }, { "epoch": 1.04, "learning_rate": 0.0001437876808047989, "loss": 0.0111, "step": 206420 }, { "epoch": 1.04, "learning_rate": 0.00014378011311178492, "loss": 0.008, "step": 206430 }, { "epoch": 1.04, "learning_rate": 0.0001437725454187709, "loss": 0.0107, "step": 206440 }, { "epoch": 1.04, "learning_rate": 0.00014376497772575688, "loss": 0.0085, "step": 206450 }, { "epoch": 1.04, "learning_rate": 0.00014375741003274287, "loss": 0.0103, "step": 206460 }, { "epoch": 1.04, "learning_rate": 0.00014374984233972885, "loss": 0.0108, "step": 206470 }, { "epoch": 1.04, "learning_rate": 0.00014374227464671486, "loss": 0.0081, "step": 206480 }, { "epoch": 1.04, "learning_rate": 0.00014373470695370084, "loss": 0.0088, "step": 206490 }, { "epoch": 1.04, "learning_rate": 0.00014372713926068682, "loss": 0.0113, "step": 206500 }, { "epoch": 1.04, "learning_rate": 0.00014371957156767283, "loss": 0.0102, "step": 206510 }, { "epoch": 1.04, "learning_rate": 0.0001437120038746588, "loss": 0.0089, "step": 206520 }, { "epoch": 1.04, "learning_rate": 0.0001437044361816448, "loss": 0.009, "step": 206530 }, { "epoch": 1.04, "learning_rate": 0.00014369686848863077, "loss": 0.0105, "step": 206540 }, { "epoch": 1.04, "learning_rate": 0.00014368930079561678, "loss": 0.0127, "step": 206550 }, { "epoch": 1.04, "learning_rate": 0.00014368173310260276, "loss": 0.0067, "step": 206560 }, { "epoch": 1.04, "learning_rate": 0.00014367416540958874, "loss": 0.0093, "step": 206570 }, { "epoch": 1.04, "learning_rate": 0.00014366659771657475, "loss": 0.0078, "step": 206580 }, { "epoch": 1.04, "learning_rate": 0.00014365903002356073, "loss": 0.0135, "step": 206590 }, { "epoch": 1.04, "learning_rate": 0.00014365146233054671, "loss": 0.0105, "step": 206600 }, { "epoch": 1.04, "learning_rate": 0.00014364389463753272, "loss": 0.0101, "step": 206610 }, { "epoch": 1.04, "learning_rate": 0.0001436363269445187, "loss": 0.0074, "step": 206620 }, { "epoch": 1.04, "learning_rate": 0.00014362875925150469, "loss": 0.0101, "step": 206630 }, { "epoch": 1.04, "learning_rate": 0.0001436211915584907, "loss": 0.0096, "step": 206640 }, { "epoch": 1.04, "learning_rate": 0.00014361362386547668, "loss": 0.0105, "step": 206650 }, { "epoch": 1.04, "learning_rate": 0.00014360605617246266, "loss": 0.0078, "step": 206660 }, { "epoch": 1.04, "learning_rate": 0.00014359848847944867, "loss": 0.0106, "step": 206670 }, { "epoch": 1.04, "learning_rate": 0.00014359092078643465, "loss": 0.0088, "step": 206680 }, { "epoch": 1.04, "learning_rate": 0.00014358335309342063, "loss": 0.0138, "step": 206690 }, { "epoch": 1.04, "learning_rate": 0.0001435757854004066, "loss": 0.0087, "step": 206700 }, { "epoch": 1.04, "learning_rate": 0.00014356821770739262, "loss": 0.009, "step": 206710 }, { "epoch": 1.04, "learning_rate": 0.0001435606500143786, "loss": 0.0091, "step": 206720 }, { "epoch": 1.04, "learning_rate": 0.00014355308232136458, "loss": 0.0081, "step": 206730 }, { "epoch": 1.04, "learning_rate": 0.0001435455146283506, "loss": 0.007, "step": 206740 }, { "epoch": 1.04, "learning_rate": 0.00014353794693533657, "loss": 0.0106, "step": 206750 }, { "epoch": 1.04, "learning_rate": 0.00014353037924232255, "loss": 0.0101, "step": 206760 }, { "epoch": 1.04, "learning_rate": 0.00014352281154930856, "loss": 0.0093, "step": 206770 }, { "epoch": 1.04, "learning_rate": 0.00014351524385629454, "loss": 0.009, "step": 206780 }, { "epoch": 1.04, "learning_rate": 0.00014350767616328052, "loss": 0.0087, "step": 206790 }, { "epoch": 1.04, "learning_rate": 0.00014350010847026653, "loss": 0.0115, "step": 206800 }, { "epoch": 1.04, "learning_rate": 0.00014349254077725251, "loss": 0.0087, "step": 206810 }, { "epoch": 1.04, "learning_rate": 0.0001434849730842385, "loss": 0.0115, "step": 206820 }, { "epoch": 1.04, "learning_rate": 0.0001434774053912245, "loss": 0.0096, "step": 206830 }, { "epoch": 1.04, "learning_rate": 0.00014346983769821049, "loss": 0.0115, "step": 206840 }, { "epoch": 1.04, "learning_rate": 0.00014346227000519647, "loss": 0.0089, "step": 206850 }, { "epoch": 1.04, "learning_rate": 0.00014345470231218245, "loss": 0.0098, "step": 206860 }, { "epoch": 1.04, "learning_rate": 0.00014344713461916846, "loss": 0.0089, "step": 206870 }, { "epoch": 1.04, "learning_rate": 0.00014343956692615444, "loss": 0.0102, "step": 206880 }, { "epoch": 1.04, "learning_rate": 0.00014343199923314042, "loss": 0.0076, "step": 206890 }, { "epoch": 1.04, "learning_rate": 0.00014342443154012643, "loss": 0.0109, "step": 206900 }, { "epoch": 1.04, "learning_rate": 0.0001434168638471124, "loss": 0.0108, "step": 206910 }, { "epoch": 1.04, "learning_rate": 0.0001434092961540984, "loss": 0.0112, "step": 206920 }, { "epoch": 1.04, "learning_rate": 0.0001434017284610844, "loss": 0.0116, "step": 206930 }, { "epoch": 1.04, "learning_rate": 0.00014339416076807038, "loss": 0.0086, "step": 206940 }, { "epoch": 1.04, "learning_rate": 0.00014338659307505636, "loss": 0.01, "step": 206950 }, { "epoch": 1.04, "learning_rate": 0.00014337902538204237, "loss": 0.011, "step": 206960 }, { "epoch": 1.04, "learning_rate": 0.00014337145768902835, "loss": 0.0092, "step": 206970 }, { "epoch": 1.04, "learning_rate": 0.00014336388999601433, "loss": 0.0086, "step": 206980 }, { "epoch": 1.04, "learning_rate": 0.00014335632230300034, "loss": 0.0102, "step": 206990 }, { "epoch": 1.04, "learning_rate": 0.00014334875460998632, "loss": 0.0136, "step": 207000 }, { "epoch": 1.04, "eval_cer": 0.9144566703574066, "eval_loss": 0.0076129864901304245, "eval_runtime": 116.5362, "eval_samples_per_second": 17.162, "eval_steps_per_second": 4.291, "step": 207000 }, { "epoch": 1.04, "learning_rate": 0.0001433411869169723, "loss": 0.008, "step": 207010 }, { "epoch": 1.04, "learning_rate": 0.00014333361922395831, "loss": 0.0079, "step": 207020 }, { "epoch": 1.04, "learning_rate": 0.0001433260515309443, "loss": 0.0077, "step": 207030 }, { "epoch": 1.04, "learning_rate": 0.00014331848383793028, "loss": 0.0097, "step": 207040 }, { "epoch": 1.04, "learning_rate": 0.00014331091614491626, "loss": 0.0083, "step": 207050 }, { "epoch": 1.04, "learning_rate": 0.00014330334845190227, "loss": 0.01, "step": 207060 }, { "epoch": 1.04, "learning_rate": 0.00014329578075888825, "loss": 0.0084, "step": 207070 }, { "epoch": 1.04, "learning_rate": 0.00014328821306587423, "loss": 0.0112, "step": 207080 }, { "epoch": 1.04, "learning_rate": 0.0001432806453728602, "loss": 0.0095, "step": 207090 }, { "epoch": 1.04, "learning_rate": 0.0001432730776798462, "loss": 0.0095, "step": 207100 }, { "epoch": 1.04, "learning_rate": 0.0001432655099868322, "loss": 0.0097, "step": 207110 }, { "epoch": 1.04, "learning_rate": 0.00014325794229381818, "loss": 0.009, "step": 207120 }, { "epoch": 1.04, "learning_rate": 0.00014325037460080416, "loss": 0.0101, "step": 207130 }, { "epoch": 1.05, "learning_rate": 0.00014324280690779017, "loss": 0.0084, "step": 207140 }, { "epoch": 1.05, "learning_rate": 0.00014323523921477615, "loss": 0.0075, "step": 207150 }, { "epoch": 1.05, "learning_rate": 0.00014322767152176214, "loss": 0.0094, "step": 207160 }, { "epoch": 1.05, "learning_rate": 0.00014322010382874814, "loss": 0.0112, "step": 207170 }, { "epoch": 1.05, "learning_rate": 0.00014321253613573413, "loss": 0.0117, "step": 207180 }, { "epoch": 1.05, "learning_rate": 0.0001432049684427201, "loss": 0.0074, "step": 207190 }, { "epoch": 1.05, "learning_rate": 0.00014319740074970612, "loss": 0.0109, "step": 207200 }, { "epoch": 1.05, "learning_rate": 0.0001431898330566921, "loss": 0.0093, "step": 207210 }, { "epoch": 1.05, "learning_rate": 0.00014318226536367808, "loss": 0.0128, "step": 207220 }, { "epoch": 1.05, "learning_rate": 0.00014317469767066406, "loss": 0.0111, "step": 207230 }, { "epoch": 1.05, "learning_rate": 0.00014316712997765007, "loss": 0.0089, "step": 207240 }, { "epoch": 1.05, "learning_rate": 0.00014315956228463605, "loss": 0.008, "step": 207250 }, { "epoch": 1.05, "learning_rate": 0.00014315199459162203, "loss": 0.0119, "step": 207260 }, { "epoch": 1.05, "learning_rate": 0.00014314442689860804, "loss": 0.0091, "step": 207270 }, { "epoch": 1.05, "learning_rate": 0.00014313685920559402, "loss": 0.0106, "step": 207280 }, { "epoch": 1.05, "learning_rate": 0.00014312929151258, "loss": 0.0084, "step": 207290 }, { "epoch": 1.05, "learning_rate": 0.000143121723819566, "loss": 0.0105, "step": 207300 }, { "epoch": 1.05, "learning_rate": 0.000143114156126552, "loss": 0.008, "step": 207310 }, { "epoch": 1.05, "learning_rate": 0.00014310658843353797, "loss": 0.0087, "step": 207320 }, { "epoch": 1.05, "learning_rate": 0.00014309902074052398, "loss": 0.0114, "step": 207330 }, { "epoch": 1.05, "learning_rate": 0.00014309145304750996, "loss": 0.0097, "step": 207340 }, { "epoch": 1.05, "learning_rate": 0.00014308388535449595, "loss": 0.0109, "step": 207350 }, { "epoch": 1.05, "learning_rate": 0.00014307631766148195, "loss": 0.0163, "step": 207360 }, { "epoch": 1.05, "learning_rate": 0.00014306874996846794, "loss": 0.0126, "step": 207370 }, { "epoch": 1.05, "learning_rate": 0.00014306118227545392, "loss": 0.0112, "step": 207380 }, { "epoch": 1.05, "learning_rate": 0.00014305361458243993, "loss": 0.013, "step": 207390 }, { "epoch": 1.05, "learning_rate": 0.0001430460468894259, "loss": 0.0105, "step": 207400 }, { "epoch": 1.05, "learning_rate": 0.0001430384791964119, "loss": 0.0108, "step": 207410 }, { "epoch": 1.05, "learning_rate": 0.00014303091150339787, "loss": 0.0096, "step": 207420 }, { "epoch": 1.05, "learning_rate": 0.00014302334381038388, "loss": 0.0102, "step": 207430 }, { "epoch": 1.05, "learning_rate": 0.00014301577611736986, "loss": 0.0116, "step": 207440 }, { "epoch": 1.05, "learning_rate": 0.00014300820842435584, "loss": 0.0106, "step": 207450 }, { "epoch": 1.05, "learning_rate": 0.00014300064073134185, "loss": 0.01, "step": 207460 }, { "epoch": 1.05, "learning_rate": 0.00014299307303832783, "loss": 0.0103, "step": 207470 }, { "epoch": 1.05, "learning_rate": 0.0001429855053453138, "loss": 0.0099, "step": 207480 }, { "epoch": 1.05, "learning_rate": 0.00014297793765229982, "loss": 0.0084, "step": 207490 }, { "epoch": 1.05, "learning_rate": 0.0001429703699592858, "loss": 0.009, "step": 207500 }, { "epoch": 1.05, "learning_rate": 0.00014296280226627178, "loss": 0.0084, "step": 207510 }, { "epoch": 1.05, "learning_rate": 0.0001429552345732578, "loss": 0.0081, "step": 207520 }, { "epoch": 1.05, "learning_rate": 0.00014294766688024377, "loss": 0.0101, "step": 207530 }, { "epoch": 1.05, "learning_rate": 0.00014294009918722976, "loss": 0.0114, "step": 207540 }, { "epoch": 1.05, "learning_rate": 0.00014293253149421576, "loss": 0.0085, "step": 207550 }, { "epoch": 1.05, "learning_rate": 0.00014292496380120175, "loss": 0.009, "step": 207560 }, { "epoch": 1.05, "learning_rate": 0.00014291739610818773, "loss": 0.011, "step": 207570 }, { "epoch": 1.05, "learning_rate": 0.0001429098284151737, "loss": 0.0102, "step": 207580 }, { "epoch": 1.05, "learning_rate": 0.00014290226072215972, "loss": 0.0092, "step": 207590 }, { "epoch": 1.05, "learning_rate": 0.0001428946930291457, "loss": 0.0109, "step": 207600 }, { "epoch": 1.05, "learning_rate": 0.00014288712533613168, "loss": 0.0101, "step": 207610 }, { "epoch": 1.05, "learning_rate": 0.0001428795576431177, "loss": 0.0094, "step": 207620 }, { "epoch": 1.05, "learning_rate": 0.00014287198995010367, "loss": 0.0094, "step": 207630 }, { "epoch": 1.05, "learning_rate": 0.00014286442225708965, "loss": 0.0098, "step": 207640 }, { "epoch": 1.05, "learning_rate": 0.00014285685456407566, "loss": 0.0101, "step": 207650 }, { "epoch": 1.05, "learning_rate": 0.00014284928687106164, "loss": 0.01, "step": 207660 }, { "epoch": 1.05, "learning_rate": 0.00014284171917804762, "loss": 0.0081, "step": 207670 }, { "epoch": 1.05, "learning_rate": 0.00014283415148503363, "loss": 0.009, "step": 207680 }, { "epoch": 1.05, "learning_rate": 0.0001428265837920196, "loss": 0.0099, "step": 207690 }, { "epoch": 1.05, "learning_rate": 0.0001428190160990056, "loss": 0.009, "step": 207700 }, { "epoch": 1.05, "learning_rate": 0.00014281144840599158, "loss": 0.0096, "step": 207710 }, { "epoch": 1.05, "learning_rate": 0.00014280388071297756, "loss": 0.0084, "step": 207720 }, { "epoch": 1.05, "learning_rate": 0.00014279631301996357, "loss": 0.0094, "step": 207730 }, { "epoch": 1.05, "learning_rate": 0.00014278874532694955, "loss": 0.0126, "step": 207740 }, { "epoch": 1.05, "learning_rate": 0.00014278117763393553, "loss": 0.0098, "step": 207750 }, { "epoch": 1.05, "learning_rate": 0.0001427736099409215, "loss": 0.0103, "step": 207760 }, { "epoch": 1.05, "learning_rate": 0.00014276604224790752, "loss": 0.0098, "step": 207770 }, { "epoch": 1.05, "learning_rate": 0.0001427584745548935, "loss": 0.01, "step": 207780 }, { "epoch": 1.05, "learning_rate": 0.00014275090686187948, "loss": 0.0107, "step": 207790 }, { "epoch": 1.05, "learning_rate": 0.0001427433391688655, "loss": 0.007, "step": 207800 }, { "epoch": 1.05, "learning_rate": 0.00014273577147585147, "loss": 0.0092, "step": 207810 }, { "epoch": 1.05, "learning_rate": 0.00014272820378283745, "loss": 0.0093, "step": 207820 }, { "epoch": 1.05, "learning_rate": 0.00014272063608982346, "loss": 0.0121, "step": 207830 }, { "epoch": 1.05, "learning_rate": 0.00014271306839680944, "loss": 0.0121, "step": 207840 }, { "epoch": 1.05, "learning_rate": 0.00014270550070379542, "loss": 0.0093, "step": 207850 }, { "epoch": 1.05, "learning_rate": 0.00014269793301078143, "loss": 0.0107, "step": 207860 }, { "epoch": 1.05, "learning_rate": 0.00014269036531776741, "loss": 0.0096, "step": 207870 }, { "epoch": 1.05, "learning_rate": 0.0001426827976247534, "loss": 0.0085, "step": 207880 }, { "epoch": 1.05, "learning_rate": 0.0001426752299317394, "loss": 0.009, "step": 207890 }, { "epoch": 1.05, "learning_rate": 0.00014266766223872539, "loss": 0.0108, "step": 207900 }, { "epoch": 1.05, "learning_rate": 0.00014266009454571137, "loss": 0.0105, "step": 207910 }, { "epoch": 1.05, "learning_rate": 0.00014265252685269738, "loss": 0.0087, "step": 207920 }, { "epoch": 1.05, "learning_rate": 0.00014264495915968336, "loss": 0.01, "step": 207930 }, { "epoch": 1.05, "learning_rate": 0.00014263739146666934, "loss": 0.0094, "step": 207940 }, { "epoch": 1.05, "learning_rate": 0.00014262982377365532, "loss": 0.0067, "step": 207950 }, { "epoch": 1.05, "learning_rate": 0.00014262225608064133, "loss": 0.0103, "step": 207960 }, { "epoch": 1.05, "learning_rate": 0.0001426146883876273, "loss": 0.0124, "step": 207970 }, { "epoch": 1.05, "learning_rate": 0.0001426071206946133, "loss": 0.0103, "step": 207980 }, { "epoch": 1.05, "learning_rate": 0.0001425995530015993, "loss": 0.0123, "step": 207990 }, { "epoch": 1.05, "learning_rate": 0.00014259198530858528, "loss": 0.0099, "step": 208000 }, { "epoch": 1.05, "eval_cer": 0.914462492734159, "eval_loss": 0.007478554733097553, "eval_runtime": 116.5491, "eval_samples_per_second": 17.16, "eval_steps_per_second": 4.29, "step": 208000 }, { "epoch": 1.05, "learning_rate": 0.00014258441761557126, "loss": 0.0089, "step": 208010 }, { "epoch": 1.05, "learning_rate": 0.00014257684992255727, "loss": 0.0091, "step": 208020 }, { "epoch": 1.05, "learning_rate": 0.00014256928222954325, "loss": 0.0102, "step": 208030 }, { "epoch": 1.05, "learning_rate": 0.00014256171453652923, "loss": 0.0124, "step": 208040 }, { "epoch": 1.05, "learning_rate": 0.00014255414684351524, "loss": 0.0094, "step": 208050 }, { "epoch": 1.05, "learning_rate": 0.00014254657915050122, "loss": 0.0114, "step": 208060 }, { "epoch": 1.05, "learning_rate": 0.0001425390114574872, "loss": 0.0101, "step": 208070 }, { "epoch": 1.05, "learning_rate": 0.00014253144376447321, "loss": 0.0103, "step": 208080 }, { "epoch": 1.05, "learning_rate": 0.0001425238760714592, "loss": 0.0097, "step": 208090 }, { "epoch": 1.05, "learning_rate": 0.00014251630837844518, "loss": 0.0104, "step": 208100 }, { "epoch": 1.05, "learning_rate": 0.00014250874068543116, "loss": 0.0063, "step": 208110 }, { "epoch": 1.05, "learning_rate": 0.00014250117299241717, "loss": 0.0083, "step": 208120 }, { "epoch": 1.05, "learning_rate": 0.00014249360529940315, "loss": 0.0105, "step": 208130 }, { "epoch": 1.05, "learning_rate": 0.00014248603760638913, "loss": 0.0079, "step": 208140 }, { "epoch": 1.05, "learning_rate": 0.00014247846991337514, "loss": 0.0078, "step": 208150 }, { "epoch": 1.05, "learning_rate": 0.00014247090222036112, "loss": 0.0098, "step": 208160 }, { "epoch": 1.05, "learning_rate": 0.0001424633345273471, "loss": 0.0111, "step": 208170 }, { "epoch": 1.05, "learning_rate": 0.0001424557668343331, "loss": 0.0083, "step": 208180 }, { "epoch": 1.05, "learning_rate": 0.0001424481991413191, "loss": 0.012, "step": 208190 }, { "epoch": 1.05, "learning_rate": 0.00014244063144830507, "loss": 0.0108, "step": 208200 }, { "epoch": 1.05, "learning_rate": 0.00014243306375529108, "loss": 0.009, "step": 208210 }, { "epoch": 1.05, "learning_rate": 0.00014242549606227706, "loss": 0.0089, "step": 208220 }, { "epoch": 1.05, "learning_rate": 0.00014241792836926304, "loss": 0.0125, "step": 208230 }, { "epoch": 1.05, "learning_rate": 0.00014241036067624905, "loss": 0.0098, "step": 208240 }, { "epoch": 1.05, "learning_rate": 0.00014240279298323503, "loss": 0.009, "step": 208250 }, { "epoch": 1.05, "learning_rate": 0.00014239522529022102, "loss": 0.0093, "step": 208260 }, { "epoch": 1.05, "learning_rate": 0.000142387657597207, "loss": 0.013, "step": 208270 }, { "epoch": 1.05, "learning_rate": 0.000142380089904193, "loss": 0.0104, "step": 208280 }, { "epoch": 1.05, "learning_rate": 0.000142372522211179, "loss": 0.0098, "step": 208290 }, { "epoch": 1.05, "learning_rate": 0.00014236495451816497, "loss": 0.0077, "step": 208300 }, { "epoch": 1.05, "learning_rate": 0.00014235738682515098, "loss": 0.0093, "step": 208310 }, { "epoch": 1.05, "learning_rate": 0.00014234981913213696, "loss": 0.0101, "step": 208320 }, { "epoch": 1.05, "learning_rate": 0.00014234225143912294, "loss": 0.0102, "step": 208330 }, { "epoch": 1.05, "learning_rate": 0.00014233468374610892, "loss": 0.0098, "step": 208340 }, { "epoch": 1.05, "learning_rate": 0.0001423271160530949, "loss": 0.0086, "step": 208350 }, { "epoch": 1.05, "learning_rate": 0.0001423195483600809, "loss": 0.0099, "step": 208360 }, { "epoch": 1.05, "learning_rate": 0.0001423119806670669, "loss": 0.0088, "step": 208370 }, { "epoch": 1.05, "learning_rate": 0.00014230441297405287, "loss": 0.0103, "step": 208380 }, { "epoch": 1.05, "learning_rate": 0.00014229684528103888, "loss": 0.0084, "step": 208390 }, { "epoch": 1.05, "learning_rate": 0.00014228927758802486, "loss": 0.008, "step": 208400 }, { "epoch": 1.05, "learning_rate": 0.00014228170989501085, "loss": 0.0097, "step": 208410 }, { "epoch": 1.05, "learning_rate": 0.00014227414220199685, "loss": 0.0105, "step": 208420 }, { "epoch": 1.05, "learning_rate": 0.00014226657450898284, "loss": 0.0115, "step": 208430 }, { "epoch": 1.05, "learning_rate": 0.00014225900681596882, "loss": 0.0103, "step": 208440 }, { "epoch": 1.05, "learning_rate": 0.00014225143912295483, "loss": 0.0077, "step": 208450 }, { "epoch": 1.05, "learning_rate": 0.0001422438714299408, "loss": 0.0081, "step": 208460 }, { "epoch": 1.05, "learning_rate": 0.0001422363037369268, "loss": 0.0084, "step": 208470 }, { "epoch": 1.05, "learning_rate": 0.00014222873604391277, "loss": 0.0094, "step": 208480 }, { "epoch": 1.05, "learning_rate": 0.00014222116835089878, "loss": 0.0106, "step": 208490 }, { "epoch": 1.05, "learning_rate": 0.00014221360065788476, "loss": 0.011, "step": 208500 }, { "epoch": 1.05, "learning_rate": 0.00014220603296487074, "loss": 0.0101, "step": 208510 }, { "epoch": 1.05, "learning_rate": 0.00014219846527185675, "loss": 0.0084, "step": 208520 }, { "epoch": 1.05, "learning_rate": 0.00014219089757884273, "loss": 0.0089, "step": 208530 }, { "epoch": 1.05, "learning_rate": 0.00014218332988582871, "loss": 0.0106, "step": 208540 }, { "epoch": 1.05, "learning_rate": 0.00014217576219281472, "loss": 0.0099, "step": 208550 }, { "epoch": 1.05, "learning_rate": 0.0001421681944998007, "loss": 0.0105, "step": 208560 }, { "epoch": 1.05, "learning_rate": 0.00014216062680678668, "loss": 0.0086, "step": 208570 }, { "epoch": 1.05, "learning_rate": 0.0001421530591137727, "loss": 0.0098, "step": 208580 }, { "epoch": 1.05, "learning_rate": 0.00014214549142075867, "loss": 0.0095, "step": 208590 }, { "epoch": 1.05, "learning_rate": 0.00014213792372774466, "loss": 0.0087, "step": 208600 }, { "epoch": 1.05, "learning_rate": 0.00014213035603473066, "loss": 0.0097, "step": 208610 }, { "epoch": 1.05, "learning_rate": 0.00014212278834171665, "loss": 0.0065, "step": 208620 }, { "epoch": 1.05, "learning_rate": 0.00014211522064870263, "loss": 0.0101, "step": 208630 }, { "epoch": 1.05, "learning_rate": 0.0001421076529556886, "loss": 0.009, "step": 208640 }, { "epoch": 1.05, "learning_rate": 0.00014210008526267462, "loss": 0.0104, "step": 208650 }, { "epoch": 1.05, "learning_rate": 0.0001420925175696606, "loss": 0.0093, "step": 208660 }, { "epoch": 1.05, "learning_rate": 0.00014208494987664658, "loss": 0.0093, "step": 208670 }, { "epoch": 1.05, "learning_rate": 0.0001420773821836326, "loss": 0.0112, "step": 208680 }, { "epoch": 1.05, "learning_rate": 0.00014206981449061857, "loss": 0.013, "step": 208690 }, { "epoch": 1.05, "learning_rate": 0.00014206224679760455, "loss": 0.0088, "step": 208700 }, { "epoch": 1.05, "learning_rate": 0.00014205467910459056, "loss": 0.0131, "step": 208710 }, { "epoch": 1.05, "learning_rate": 0.00014204711141157654, "loss": 0.0113, "step": 208720 }, { "epoch": 1.05, "learning_rate": 0.00014203954371856252, "loss": 0.0116, "step": 208730 }, { "epoch": 1.05, "learning_rate": 0.00014203197602554853, "loss": 0.0124, "step": 208740 }, { "epoch": 1.05, "learning_rate": 0.00014202440833253451, "loss": 0.0093, "step": 208750 }, { "epoch": 1.05, "learning_rate": 0.0001420168406395205, "loss": 0.0103, "step": 208760 }, { "epoch": 1.05, "learning_rate": 0.0001420092729465065, "loss": 0.0074, "step": 208770 }, { "epoch": 1.05, "learning_rate": 0.00014200170525349249, "loss": 0.0122, "step": 208780 }, { "epoch": 1.05, "learning_rate": 0.00014199413756047847, "loss": 0.0095, "step": 208790 }, { "epoch": 1.05, "learning_rate": 0.00014198656986746445, "loss": 0.0081, "step": 208800 }, { "epoch": 1.05, "learning_rate": 0.00014197900217445046, "loss": 0.0091, "step": 208810 }, { "epoch": 1.05, "learning_rate": 0.00014197143448143644, "loss": 0.0103, "step": 208820 }, { "epoch": 1.05, "learning_rate": 0.00014196386678842242, "loss": 0.0089, "step": 208830 }, { "epoch": 1.05, "learning_rate": 0.00014195629909540843, "loss": 0.0094, "step": 208840 }, { "epoch": 1.05, "learning_rate": 0.0001419487314023944, "loss": 0.0091, "step": 208850 }, { "epoch": 1.05, "learning_rate": 0.0001419411637093804, "loss": 0.0089, "step": 208860 }, { "epoch": 1.05, "learning_rate": 0.0001419335960163664, "loss": 0.0081, "step": 208870 }, { "epoch": 1.05, "learning_rate": 0.00014192602832335238, "loss": 0.0148, "step": 208880 }, { "epoch": 1.05, "learning_rate": 0.00014191846063033836, "loss": 0.0094, "step": 208890 }, { "epoch": 1.05, "learning_rate": 0.00014191089293732437, "loss": 0.0084, "step": 208900 }, { "epoch": 1.05, "learning_rate": 0.00014190332524431035, "loss": 0.0106, "step": 208910 }, { "epoch": 1.05, "learning_rate": 0.00014189575755129633, "loss": 0.0091, "step": 208920 }, { "epoch": 1.05, "learning_rate": 0.00014188818985828234, "loss": 0.0083, "step": 208930 }, { "epoch": 1.05, "learning_rate": 0.00014188062216526832, "loss": 0.0083, "step": 208940 }, { "epoch": 1.05, "learning_rate": 0.0001418730544722543, "loss": 0.01, "step": 208950 }, { "epoch": 1.05, "learning_rate": 0.0001418654867792403, "loss": 0.0115, "step": 208960 }, { "epoch": 1.05, "learning_rate": 0.00014185791908622627, "loss": 0.008, "step": 208970 }, { "epoch": 1.05, "learning_rate": 0.00014185035139321228, "loss": 0.0119, "step": 208980 }, { "epoch": 1.05, "learning_rate": 0.00014184278370019826, "loss": 0.0087, "step": 208990 }, { "epoch": 1.05, "learning_rate": 0.00014183521600718424, "loss": 0.0099, "step": 209000 }, { "epoch": 1.05, "eval_cer": 0.9144392032271493, "eval_loss": 0.007373651955276728, "eval_runtime": 116.5945, "eval_samples_per_second": 17.153, "eval_steps_per_second": 4.288, "step": 209000 }, { "epoch": 1.05, "learning_rate": 0.00014182764831417022, "loss": 0.0091, "step": 209010 }, { "epoch": 1.05, "learning_rate": 0.00014182008062115623, "loss": 0.0088, "step": 209020 }, { "epoch": 1.05, "learning_rate": 0.0001418125129281422, "loss": 0.0083, "step": 209030 }, { "epoch": 1.05, "learning_rate": 0.0001418049452351282, "loss": 0.0102, "step": 209040 }, { "epoch": 1.05, "learning_rate": 0.0001417973775421142, "loss": 0.0074, "step": 209050 }, { "epoch": 1.05, "learning_rate": 0.00014178980984910018, "loss": 0.009, "step": 209060 }, { "epoch": 1.05, "learning_rate": 0.00014178224215608616, "loss": 0.009, "step": 209070 }, { "epoch": 1.05, "learning_rate": 0.00014177467446307217, "loss": 0.013, "step": 209080 }, { "epoch": 1.05, "learning_rate": 0.00014176710677005815, "loss": 0.0084, "step": 209090 }, { "epoch": 1.05, "learning_rate": 0.00014175953907704414, "loss": 0.011, "step": 209100 }, { "epoch": 1.05, "learning_rate": 0.00014175197138403014, "loss": 0.0112, "step": 209110 }, { "epoch": 1.06, "learning_rate": 0.00014174440369101613, "loss": 0.0117, "step": 209120 }, { "epoch": 1.06, "learning_rate": 0.0001417368359980021, "loss": 0.0101, "step": 209130 }, { "epoch": 1.06, "learning_rate": 0.00014172926830498812, "loss": 0.0091, "step": 209140 }, { "epoch": 1.06, "learning_rate": 0.0001417217006119741, "loss": 0.0108, "step": 209150 }, { "epoch": 1.06, "learning_rate": 0.00014171413291896008, "loss": 0.0111, "step": 209160 }, { "epoch": 1.06, "learning_rate": 0.00014170656522594606, "loss": 0.0086, "step": 209170 }, { "epoch": 1.06, "learning_rate": 0.00014169899753293207, "loss": 0.0101, "step": 209180 }, { "epoch": 1.06, "learning_rate": 0.00014169142983991805, "loss": 0.0112, "step": 209190 }, { "epoch": 1.06, "learning_rate": 0.00014168386214690403, "loss": 0.009, "step": 209200 }, { "epoch": 1.06, "learning_rate": 0.00014167629445389004, "loss": 0.0101, "step": 209210 }, { "epoch": 1.06, "learning_rate": 0.00014166872676087602, "loss": 0.0079, "step": 209220 }, { "epoch": 1.06, "learning_rate": 0.000141661159067862, "loss": 0.0108, "step": 209230 }, { "epoch": 1.06, "learning_rate": 0.000141653591374848, "loss": 0.0091, "step": 209240 }, { "epoch": 1.06, "learning_rate": 0.000141646023681834, "loss": 0.0077, "step": 209250 }, { "epoch": 1.06, "learning_rate": 0.00014163845598881997, "loss": 0.0073, "step": 209260 }, { "epoch": 1.06, "learning_rate": 0.00014163088829580598, "loss": 0.0113, "step": 209270 }, { "epoch": 1.06, "learning_rate": 0.00014162332060279196, "loss": 0.0108, "step": 209280 }, { "epoch": 1.06, "learning_rate": 0.00014161575290977795, "loss": 0.0126, "step": 209290 }, { "epoch": 1.06, "learning_rate": 0.00014160818521676395, "loss": 0.0086, "step": 209300 }, { "epoch": 1.06, "learning_rate": 0.00014160061752374994, "loss": 0.0106, "step": 209310 }, { "epoch": 1.06, "learning_rate": 0.00014159304983073592, "loss": 0.0108, "step": 209320 }, { "epoch": 1.06, "learning_rate": 0.00014158548213772193, "loss": 0.0098, "step": 209330 }, { "epoch": 1.06, "learning_rate": 0.0001415779144447079, "loss": 0.0079, "step": 209340 }, { "epoch": 1.06, "learning_rate": 0.0001415703467516939, "loss": 0.0123, "step": 209350 }, { "epoch": 1.06, "learning_rate": 0.00014156277905867987, "loss": 0.0092, "step": 209360 }, { "epoch": 1.06, "learning_rate": 0.00014155521136566588, "loss": 0.009, "step": 209370 }, { "epoch": 1.06, "learning_rate": 0.00014154764367265186, "loss": 0.0084, "step": 209380 }, { "epoch": 1.06, "learning_rate": 0.00014154007597963784, "loss": 0.0098, "step": 209390 }, { "epoch": 1.06, "learning_rate": 0.00014153250828662385, "loss": 0.0075, "step": 209400 }, { "epoch": 1.06, "learning_rate": 0.00014152494059360983, "loss": 0.0126, "step": 209410 }, { "epoch": 1.06, "learning_rate": 0.0001415173729005958, "loss": 0.0083, "step": 209420 }, { "epoch": 1.06, "learning_rate": 0.00014150980520758182, "loss": 0.0083, "step": 209430 }, { "epoch": 1.06, "learning_rate": 0.0001415022375145678, "loss": 0.0101, "step": 209440 }, { "epoch": 1.06, "learning_rate": 0.00014149466982155378, "loss": 0.0079, "step": 209450 }, { "epoch": 1.06, "learning_rate": 0.0001414871021285398, "loss": 0.0138, "step": 209460 }, { "epoch": 1.06, "learning_rate": 0.00014147953443552577, "loss": 0.0088, "step": 209470 }, { "epoch": 1.06, "learning_rate": 0.00014147196674251176, "loss": 0.0156, "step": 209480 }, { "epoch": 1.06, "learning_rate": 0.00014146439904949776, "loss": 0.0086, "step": 209490 }, { "epoch": 1.06, "learning_rate": 0.00014145683135648375, "loss": 0.0108, "step": 209500 }, { "epoch": 1.06, "learning_rate": 0.00014144926366346973, "loss": 0.009, "step": 209510 }, { "epoch": 1.06, "learning_rate": 0.0001414416959704557, "loss": 0.0106, "step": 209520 }, { "epoch": 1.06, "learning_rate": 0.00014143412827744172, "loss": 0.0093, "step": 209530 }, { "epoch": 1.06, "learning_rate": 0.0001414265605844277, "loss": 0.0105, "step": 209540 }, { "epoch": 1.06, "learning_rate": 0.00014141899289141368, "loss": 0.0113, "step": 209550 }, { "epoch": 1.06, "learning_rate": 0.0001414114251983997, "loss": 0.0101, "step": 209560 }, { "epoch": 1.06, "learning_rate": 0.00014140385750538567, "loss": 0.0099, "step": 209570 }, { "epoch": 1.06, "learning_rate": 0.00014139628981237165, "loss": 0.0094, "step": 209580 }, { "epoch": 1.06, "learning_rate": 0.00014138872211935763, "loss": 0.0097, "step": 209590 }, { "epoch": 1.06, "learning_rate": 0.00014138115442634361, "loss": 0.0095, "step": 209600 }, { "epoch": 1.06, "learning_rate": 0.00014137358673332962, "loss": 0.0104, "step": 209610 }, { "epoch": 1.06, "learning_rate": 0.0001413660190403156, "loss": 0.0102, "step": 209620 }, { "epoch": 1.06, "learning_rate": 0.00014135845134730159, "loss": 0.009, "step": 209630 }, { "epoch": 1.06, "learning_rate": 0.0001413508836542876, "loss": 0.0112, "step": 209640 }, { "epoch": 1.06, "learning_rate": 0.00014134331596127358, "loss": 0.0083, "step": 209650 }, { "epoch": 1.06, "learning_rate": 0.00014133574826825956, "loss": 0.0105, "step": 209660 }, { "epoch": 1.06, "learning_rate": 0.00014132818057524557, "loss": 0.0095, "step": 209670 }, { "epoch": 1.06, "learning_rate": 0.00014132061288223155, "loss": 0.0081, "step": 209680 }, { "epoch": 1.06, "learning_rate": 0.00014131304518921753, "loss": 0.0107, "step": 209690 }, { "epoch": 1.06, "learning_rate": 0.0001413054774962035, "loss": 0.0095, "step": 209700 }, { "epoch": 1.06, "learning_rate": 0.00014129790980318952, "loss": 0.0076, "step": 209710 }, { "epoch": 1.06, "learning_rate": 0.0001412903421101755, "loss": 0.0125, "step": 209720 }, { "epoch": 1.06, "learning_rate": 0.00014128277441716148, "loss": 0.0078, "step": 209730 }, { "epoch": 1.06, "learning_rate": 0.0001412752067241475, "loss": 0.0087, "step": 209740 }, { "epoch": 1.06, "learning_rate": 0.00014126763903113347, "loss": 0.0124, "step": 209750 }, { "epoch": 1.06, "learning_rate": 0.00014126007133811945, "loss": 0.0092, "step": 209760 }, { "epoch": 1.06, "learning_rate": 0.00014125250364510546, "loss": 0.0086, "step": 209770 }, { "epoch": 1.06, "learning_rate": 0.00014124493595209144, "loss": 0.01, "step": 209780 }, { "epoch": 1.06, "learning_rate": 0.00014123736825907742, "loss": 0.0099, "step": 209790 }, { "epoch": 1.06, "learning_rate": 0.00014122980056606343, "loss": 0.0079, "step": 209800 }, { "epoch": 1.06, "learning_rate": 0.00014122223287304941, "loss": 0.0103, "step": 209810 }, { "epoch": 1.06, "learning_rate": 0.0001412146651800354, "loss": 0.0087, "step": 209820 }, { "epoch": 1.06, "learning_rate": 0.0001412070974870214, "loss": 0.0104, "step": 209830 }, { "epoch": 1.06, "learning_rate": 0.00014119952979400739, "loss": 0.0092, "step": 209840 }, { "epoch": 1.06, "learning_rate": 0.00014119196210099337, "loss": 0.0096, "step": 209850 }, { "epoch": 1.06, "learning_rate": 0.00014118439440797938, "loss": 0.0099, "step": 209860 }, { "epoch": 1.06, "learning_rate": 0.00014117682671496536, "loss": 0.0093, "step": 209870 }, { "epoch": 1.06, "learning_rate": 0.00014116925902195134, "loss": 0.0096, "step": 209880 }, { "epoch": 1.06, "learning_rate": 0.00014116169132893732, "loss": 0.0094, "step": 209890 }, { "epoch": 1.06, "learning_rate": 0.00014115412363592333, "loss": 0.0088, "step": 209900 }, { "epoch": 1.06, "learning_rate": 0.0001411465559429093, "loss": 0.0095, "step": 209910 }, { "epoch": 1.06, "learning_rate": 0.0001411389882498953, "loss": 0.0077, "step": 209920 }, { "epoch": 1.06, "learning_rate": 0.0001411314205568813, "loss": 0.0087, "step": 209930 }, { "epoch": 1.06, "learning_rate": 0.00014112385286386728, "loss": 0.0095, "step": 209940 }, { "epoch": 1.06, "learning_rate": 0.00014111628517085326, "loss": 0.0092, "step": 209950 }, { "epoch": 1.06, "learning_rate": 0.00014110871747783927, "loss": 0.0087, "step": 209960 }, { "epoch": 1.06, "learning_rate": 0.00014110114978482525, "loss": 0.0097, "step": 209970 }, { "epoch": 1.06, "learning_rate": 0.00014109358209181123, "loss": 0.01, "step": 209980 }, { "epoch": 1.06, "learning_rate": 0.00014108601439879724, "loss": 0.0225, "step": 209990 }, { "epoch": 1.06, "learning_rate": 0.00014107844670578322, "loss": 0.0091, "step": 210000 }, { "epoch": 1.06, "eval_cer": 0.9144906342217957, "eval_loss": 0.007647486869245768, "eval_runtime": 116.648, "eval_samples_per_second": 17.146, "eval_steps_per_second": 4.286, "step": 210000 }, { "epoch": 1.06, "learning_rate": 0.0001410708790127692, "loss": 0.0109, "step": 210010 }, { "epoch": 1.06, "learning_rate": 0.00014106331131975521, "loss": 0.0083, "step": 210020 }, { "epoch": 1.06, "learning_rate": 0.0001410557436267412, "loss": 0.0113, "step": 210030 }, { "epoch": 1.06, "learning_rate": 0.00014104817593372718, "loss": 0.0092, "step": 210040 }, { "epoch": 1.06, "learning_rate": 0.00014104060824071316, "loss": 0.0101, "step": 210050 }, { "epoch": 1.06, "learning_rate": 0.00014103304054769917, "loss": 0.0109, "step": 210060 }, { "epoch": 1.06, "learning_rate": 0.00014102547285468515, "loss": 0.0098, "step": 210070 }, { "epoch": 1.06, "learning_rate": 0.00014101790516167113, "loss": 0.0081, "step": 210080 }, { "epoch": 1.06, "learning_rate": 0.00014101033746865714, "loss": 0.0111, "step": 210090 }, { "epoch": 1.06, "learning_rate": 0.00014100276977564312, "loss": 0.0109, "step": 210100 }, { "epoch": 1.06, "learning_rate": 0.0001409952020826291, "loss": 0.0108, "step": 210110 }, { "epoch": 1.06, "learning_rate": 0.0001409876343896151, "loss": 0.0102, "step": 210120 }, { "epoch": 1.06, "learning_rate": 0.0001409800666966011, "loss": 0.0094, "step": 210130 }, { "epoch": 1.06, "learning_rate": 0.00014097249900358707, "loss": 0.0098, "step": 210140 }, { "epoch": 1.06, "learning_rate": 0.00014096493131057308, "loss": 0.0104, "step": 210150 }, { "epoch": 1.06, "learning_rate": 0.00014095736361755906, "loss": 0.01, "step": 210160 }, { "epoch": 1.06, "learning_rate": 0.00014094979592454504, "loss": 0.0112, "step": 210170 }, { "epoch": 1.06, "learning_rate": 0.00014094222823153105, "loss": 0.0093, "step": 210180 }, { "epoch": 1.06, "learning_rate": 0.00014093466053851703, "loss": 0.0105, "step": 210190 }, { "epoch": 1.06, "learning_rate": 0.00014092709284550302, "loss": 0.0095, "step": 210200 }, { "epoch": 1.06, "learning_rate": 0.000140919525152489, "loss": 0.0093, "step": 210210 }, { "epoch": 1.06, "learning_rate": 0.00014091195745947498, "loss": 0.0089, "step": 210220 }, { "epoch": 1.06, "learning_rate": 0.000140904389766461, "loss": 0.0156, "step": 210230 }, { "epoch": 1.06, "learning_rate": 0.00014089682207344697, "loss": 0.0098, "step": 210240 }, { "epoch": 1.06, "learning_rate": 0.00014088925438043295, "loss": 0.01, "step": 210250 }, { "epoch": 1.06, "learning_rate": 0.00014088168668741893, "loss": 0.0125, "step": 210260 }, { "epoch": 1.06, "learning_rate": 0.00014087411899440494, "loss": 0.0105, "step": 210270 }, { "epoch": 1.06, "learning_rate": 0.00014086655130139092, "loss": 0.0102, "step": 210280 }, { "epoch": 1.06, "learning_rate": 0.0001408589836083769, "loss": 0.01, "step": 210290 }, { "epoch": 1.06, "learning_rate": 0.0001408514159153629, "loss": 0.0079, "step": 210300 }, { "epoch": 1.06, "learning_rate": 0.0001408438482223489, "loss": 0.0105, "step": 210310 }, { "epoch": 1.06, "learning_rate": 0.00014083628052933487, "loss": 0.009, "step": 210320 }, { "epoch": 1.06, "learning_rate": 0.00014082871283632088, "loss": 0.0118, "step": 210330 }, { "epoch": 1.06, "learning_rate": 0.00014082114514330686, "loss": 0.0084, "step": 210340 }, { "epoch": 1.06, "learning_rate": 0.00014081357745029285, "loss": 0.0083, "step": 210350 }, { "epoch": 1.06, "learning_rate": 0.00014080600975727885, "loss": 0.0102, "step": 210360 }, { "epoch": 1.06, "learning_rate": 0.00014079844206426484, "loss": 0.0113, "step": 210370 }, { "epoch": 1.06, "learning_rate": 0.00014079087437125082, "loss": 0.0101, "step": 210380 }, { "epoch": 1.06, "learning_rate": 0.00014078330667823683, "loss": 0.0134, "step": 210390 }, { "epoch": 1.06, "learning_rate": 0.0001407757389852228, "loss": 0.011, "step": 210400 }, { "epoch": 1.06, "learning_rate": 0.0001407681712922088, "loss": 0.0121, "step": 210410 }, { "epoch": 1.06, "learning_rate": 0.00014076060359919477, "loss": 0.0101, "step": 210420 }, { "epoch": 1.06, "learning_rate": 0.00014075303590618078, "loss": 0.0126, "step": 210430 }, { "epoch": 1.06, "learning_rate": 0.00014074546821316676, "loss": 0.0097, "step": 210440 }, { "epoch": 1.06, "learning_rate": 0.00014073790052015274, "loss": 0.0095, "step": 210450 }, { "epoch": 1.06, "learning_rate": 0.00014073033282713875, "loss": 0.0101, "step": 210460 }, { "epoch": 1.06, "learning_rate": 0.00014072276513412473, "loss": 0.01, "step": 210470 }, { "epoch": 1.06, "learning_rate": 0.0001407151974411107, "loss": 0.0102, "step": 210480 }, { "epoch": 1.06, "learning_rate": 0.00014070762974809672, "loss": 0.0087, "step": 210490 }, { "epoch": 1.06, "learning_rate": 0.0001407000620550827, "loss": 0.0109, "step": 210500 }, { "epoch": 1.06, "learning_rate": 0.00014069249436206868, "loss": 0.0092, "step": 210510 }, { "epoch": 1.06, "learning_rate": 0.0001406849266690547, "loss": 0.0097, "step": 210520 }, { "epoch": 1.06, "learning_rate": 0.00014067735897604067, "loss": 0.013, "step": 210530 }, { "epoch": 1.06, "learning_rate": 0.00014066979128302666, "loss": 0.0165, "step": 210540 }, { "epoch": 1.06, "learning_rate": 0.00014066222359001266, "loss": 0.0072, "step": 210550 }, { "epoch": 1.06, "learning_rate": 0.00014065465589699865, "loss": 0.0083, "step": 210560 }, { "epoch": 1.06, "learning_rate": 0.00014064708820398463, "loss": 0.0121, "step": 210570 }, { "epoch": 1.06, "learning_rate": 0.0001406395205109706, "loss": 0.015, "step": 210580 }, { "epoch": 1.06, "learning_rate": 0.00014063195281795662, "loss": 0.0078, "step": 210590 }, { "epoch": 1.06, "learning_rate": 0.0001406243851249426, "loss": 0.0099, "step": 210600 }, { "epoch": 1.06, "learning_rate": 0.00014061681743192858, "loss": 0.0099, "step": 210610 }, { "epoch": 1.06, "learning_rate": 0.0001406092497389146, "loss": 0.014, "step": 210620 }, { "epoch": 1.06, "learning_rate": 0.00014060168204590057, "loss": 0.0131, "step": 210630 }, { "epoch": 1.06, "learning_rate": 0.00014059411435288655, "loss": 0.0093, "step": 210640 }, { "epoch": 1.06, "learning_rate": 0.00014058654665987256, "loss": 0.0087, "step": 210650 }, { "epoch": 1.06, "learning_rate": 0.00014057897896685854, "loss": 0.0119, "step": 210660 }, { "epoch": 1.06, "learning_rate": 0.00014057141127384452, "loss": 0.0101, "step": 210670 }, { "epoch": 1.06, "learning_rate": 0.00014056384358083053, "loss": 0.0075, "step": 210680 }, { "epoch": 1.06, "learning_rate": 0.0001405562758878165, "loss": 0.0092, "step": 210690 }, { "epoch": 1.06, "learning_rate": 0.0001405487081948025, "loss": 0.0096, "step": 210700 }, { "epoch": 1.06, "learning_rate": 0.0001405411405017885, "loss": 0.0082, "step": 210710 }, { "epoch": 1.06, "learning_rate": 0.00014053357280877448, "loss": 0.0101, "step": 210720 }, { "epoch": 1.06, "learning_rate": 0.00014052600511576047, "loss": 0.0101, "step": 210730 }, { "epoch": 1.06, "learning_rate": 0.00014051843742274645, "loss": 0.0113, "step": 210740 }, { "epoch": 1.06, "learning_rate": 0.00014051086972973246, "loss": 0.0096, "step": 210750 }, { "epoch": 1.06, "learning_rate": 0.00014050330203671844, "loss": 0.0093, "step": 210760 }, { "epoch": 1.06, "learning_rate": 0.00014049573434370442, "loss": 0.0104, "step": 210770 }, { "epoch": 1.06, "learning_rate": 0.00014048816665069043, "loss": 0.0125, "step": 210780 }, { "epoch": 1.06, "learning_rate": 0.0001404805989576764, "loss": 0.0119, "step": 210790 }, { "epoch": 1.06, "learning_rate": 0.0001404730312646624, "loss": 0.0085, "step": 210800 }, { "epoch": 1.06, "learning_rate": 0.0001404654635716484, "loss": 0.0099, "step": 210810 }, { "epoch": 1.06, "learning_rate": 0.00014045789587863438, "loss": 0.0119, "step": 210820 }, { "epoch": 1.06, "learning_rate": 0.00014045032818562036, "loss": 0.0098, "step": 210830 }, { "epoch": 1.06, "learning_rate": 0.00014044276049260637, "loss": 0.0094, "step": 210840 }, { "epoch": 1.06, "learning_rate": 0.00014043519279959232, "loss": 0.01, "step": 210850 }, { "epoch": 1.06, "learning_rate": 0.00014042762510657833, "loss": 0.0094, "step": 210860 }, { "epoch": 1.06, "learning_rate": 0.00014042005741356431, "loss": 0.0128, "step": 210870 }, { "epoch": 1.06, "learning_rate": 0.0001404124897205503, "loss": 0.0098, "step": 210880 }, { "epoch": 1.06, "learning_rate": 0.0001404049220275363, "loss": 0.0099, "step": 210890 }, { "epoch": 1.06, "learning_rate": 0.00014039735433452229, "loss": 0.0095, "step": 210900 }, { "epoch": 1.06, "learning_rate": 0.00014038978664150827, "loss": 0.0107, "step": 210910 }, { "epoch": 1.06, "learning_rate": 0.00014038221894849428, "loss": 0.0099, "step": 210920 }, { "epoch": 1.06, "learning_rate": 0.00014037465125548026, "loss": 0.0076, "step": 210930 }, { "epoch": 1.06, "learning_rate": 0.00014036708356246624, "loss": 0.0091, "step": 210940 }, { "epoch": 1.06, "learning_rate": 0.00014035951586945222, "loss": 0.0105, "step": 210950 }, { "epoch": 1.06, "learning_rate": 0.00014035194817643823, "loss": 0.0111, "step": 210960 }, { "epoch": 1.06, "learning_rate": 0.0001403443804834242, "loss": 0.009, "step": 210970 }, { "epoch": 1.06, "learning_rate": 0.0001403368127904102, "loss": 0.0084, "step": 210980 }, { "epoch": 1.06, "learning_rate": 0.0001403292450973962, "loss": 0.0102, "step": 210990 }, { "epoch": 1.06, "learning_rate": 0.00014032167740438218, "loss": 0.0079, "step": 211000 }, { "epoch": 1.06, "eval_cer": 0.9144489071884033, "eval_loss": 0.007559832185506821, "eval_runtime": 116.7132, "eval_samples_per_second": 17.136, "eval_steps_per_second": 4.284, "step": 211000 }, { "epoch": 1.06, "learning_rate": 0.00014031410971136816, "loss": 0.0094, "step": 211010 }, { "epoch": 1.06, "learning_rate": 0.00014030654201835417, "loss": 0.007, "step": 211020 }, { "epoch": 1.06, "learning_rate": 0.00014029897432534015, "loss": 0.0098, "step": 211030 }, { "epoch": 1.06, "learning_rate": 0.00014029140663232613, "loss": 0.0085, "step": 211040 }, { "epoch": 1.06, "learning_rate": 0.00014028383893931214, "loss": 0.0104, "step": 211050 }, { "epoch": 1.06, "learning_rate": 0.00014027627124629812, "loss": 0.0095, "step": 211060 }, { "epoch": 1.06, "learning_rate": 0.0001402687035532841, "loss": 0.0108, "step": 211070 }, { "epoch": 1.06, "learning_rate": 0.00014026113586027011, "loss": 0.0105, "step": 211080 }, { "epoch": 1.06, "learning_rate": 0.0001402535681672561, "loss": 0.0102, "step": 211090 }, { "epoch": 1.07, "learning_rate": 0.00014024600047424208, "loss": 0.0092, "step": 211100 }, { "epoch": 1.07, "learning_rate": 0.00014023843278122806, "loss": 0.0088, "step": 211110 }, { "epoch": 1.07, "learning_rate": 0.00014023086508821407, "loss": 0.0097, "step": 211120 }, { "epoch": 1.07, "learning_rate": 0.00014022329739520005, "loss": 0.0097, "step": 211130 }, { "epoch": 1.07, "learning_rate": 0.00014021572970218603, "loss": 0.0087, "step": 211140 }, { "epoch": 1.07, "learning_rate": 0.00014020816200917204, "loss": 0.0081, "step": 211150 }, { "epoch": 1.07, "learning_rate": 0.00014020059431615802, "loss": 0.0103, "step": 211160 }, { "epoch": 1.07, "learning_rate": 0.000140193026623144, "loss": 0.0095, "step": 211170 }, { "epoch": 1.07, "learning_rate": 0.00014018545893013, "loss": 0.0075, "step": 211180 }, { "epoch": 1.07, "learning_rate": 0.000140177891237116, "loss": 0.0091, "step": 211190 }, { "epoch": 1.07, "learning_rate": 0.00014017032354410197, "loss": 0.0087, "step": 211200 }, { "epoch": 1.07, "learning_rate": 0.00014016275585108798, "loss": 0.0076, "step": 211210 }, { "epoch": 1.07, "learning_rate": 0.00014015518815807396, "loss": 0.0115, "step": 211220 }, { "epoch": 1.07, "learning_rate": 0.00014014762046505994, "loss": 0.0077, "step": 211230 }, { "epoch": 1.07, "learning_rate": 0.00014014005277204595, "loss": 0.0172, "step": 211240 }, { "epoch": 1.07, "learning_rate": 0.00014013248507903193, "loss": 0.0111, "step": 211250 }, { "epoch": 1.07, "learning_rate": 0.00014012491738601792, "loss": 0.0101, "step": 211260 }, { "epoch": 1.07, "learning_rate": 0.00014011734969300392, "loss": 0.009, "step": 211270 }, { "epoch": 1.07, "learning_rate": 0.0001401097819999899, "loss": 0.0107, "step": 211280 }, { "epoch": 1.07, "learning_rate": 0.0001401022143069759, "loss": 0.0101, "step": 211290 }, { "epoch": 1.07, "learning_rate": 0.00014009464661396187, "loss": 0.013, "step": 211300 }, { "epoch": 1.07, "learning_rate": 0.00014008707892094788, "loss": 0.0092, "step": 211310 }, { "epoch": 1.07, "learning_rate": 0.00014007951122793386, "loss": 0.0118, "step": 211320 }, { "epoch": 1.07, "learning_rate": 0.00014007194353491984, "loss": 0.0099, "step": 211330 }, { "epoch": 1.07, "learning_rate": 0.00014006437584190585, "loss": 0.0117, "step": 211340 }, { "epoch": 1.07, "learning_rate": 0.00014005680814889183, "loss": 0.0106, "step": 211350 }, { "epoch": 1.07, "learning_rate": 0.0001400492404558778, "loss": 0.0111, "step": 211360 }, { "epoch": 1.07, "learning_rate": 0.00014004167276286382, "loss": 0.0088, "step": 211370 }, { "epoch": 1.07, "learning_rate": 0.0001400341050698498, "loss": 0.0115, "step": 211380 }, { "epoch": 1.07, "learning_rate": 0.00014002653737683578, "loss": 0.007, "step": 211390 }, { "epoch": 1.07, "learning_rate": 0.0001400189696838218, "loss": 0.0085, "step": 211400 }, { "epoch": 1.07, "learning_rate": 0.00014001140199080777, "loss": 0.0162, "step": 211410 }, { "epoch": 1.07, "learning_rate": 0.00014000383429779375, "loss": 0.0088, "step": 211420 }, { "epoch": 1.07, "learning_rate": 0.00013999626660477976, "loss": 0.0105, "step": 211430 }, { "epoch": 1.07, "learning_rate": 0.00013998869891176574, "loss": 0.0104, "step": 211440 }, { "epoch": 1.07, "learning_rate": 0.00013998113121875173, "loss": 0.0086, "step": 211450 }, { "epoch": 1.07, "learning_rate": 0.0001399735635257377, "loss": 0.0093, "step": 211460 }, { "epoch": 1.07, "learning_rate": 0.00013996599583272372, "loss": 0.0095, "step": 211470 }, { "epoch": 1.07, "learning_rate": 0.00013995842813970967, "loss": 0.0097, "step": 211480 }, { "epoch": 1.07, "learning_rate": 0.00013995086044669568, "loss": 0.0084, "step": 211490 }, { "epoch": 1.07, "learning_rate": 0.00013994329275368166, "loss": 0.0121, "step": 211500 }, { "epoch": 1.07, "learning_rate": 0.00013993572506066764, "loss": 0.0091, "step": 211510 }, { "epoch": 1.07, "learning_rate": 0.00013992815736765365, "loss": 0.0091, "step": 211520 }, { "epoch": 1.07, "learning_rate": 0.00013992058967463963, "loss": 0.0084, "step": 211530 }, { "epoch": 1.07, "learning_rate": 0.0001399130219816256, "loss": 0.0105, "step": 211540 }, { "epoch": 1.07, "learning_rate": 0.00013990545428861162, "loss": 0.0091, "step": 211550 }, { "epoch": 1.07, "learning_rate": 0.0001398978865955976, "loss": 0.0082, "step": 211560 }, { "epoch": 1.07, "learning_rate": 0.00013989031890258358, "loss": 0.0087, "step": 211570 }, { "epoch": 1.07, "learning_rate": 0.0001398827512095696, "loss": 0.0094, "step": 211580 }, { "epoch": 1.07, "learning_rate": 0.00013987518351655557, "loss": 0.0098, "step": 211590 }, { "epoch": 1.07, "learning_rate": 0.00013986761582354156, "loss": 0.0127, "step": 211600 }, { "epoch": 1.07, "learning_rate": 0.00013986004813052756, "loss": 0.0097, "step": 211610 }, { "epoch": 1.07, "learning_rate": 0.00013985248043751355, "loss": 0.0116, "step": 211620 }, { "epoch": 1.07, "learning_rate": 0.00013984491274449953, "loss": 0.0083, "step": 211630 }, { "epoch": 1.07, "learning_rate": 0.0001398373450514855, "loss": 0.0101, "step": 211640 }, { "epoch": 1.07, "learning_rate": 0.00013982977735847152, "loss": 0.0079, "step": 211650 }, { "epoch": 1.07, "learning_rate": 0.0001398222096654575, "loss": 0.0109, "step": 211660 }, { "epoch": 1.07, "learning_rate": 0.00013981464197244348, "loss": 0.0093, "step": 211670 }, { "epoch": 1.07, "learning_rate": 0.0001398070742794295, "loss": 0.0078, "step": 211680 }, { "epoch": 1.07, "learning_rate": 0.00013979950658641547, "loss": 0.0087, "step": 211690 }, { "epoch": 1.07, "learning_rate": 0.00013979193889340145, "loss": 0.0092, "step": 211700 }, { "epoch": 1.07, "learning_rate": 0.00013978437120038746, "loss": 0.0094, "step": 211710 }, { "epoch": 1.07, "learning_rate": 0.00013977680350737344, "loss": 0.0116, "step": 211720 }, { "epoch": 1.07, "learning_rate": 0.00013976923581435942, "loss": 0.0111, "step": 211730 }, { "epoch": 1.07, "learning_rate": 0.00013976166812134543, "loss": 0.0111, "step": 211740 }, { "epoch": 1.07, "learning_rate": 0.0001397541004283314, "loss": 0.0112, "step": 211750 }, { "epoch": 1.07, "learning_rate": 0.0001397465327353174, "loss": 0.0094, "step": 211760 }, { "epoch": 1.07, "learning_rate": 0.0001397389650423034, "loss": 0.0097, "step": 211770 }, { "epoch": 1.07, "learning_rate": 0.00013973139734928938, "loss": 0.0104, "step": 211780 }, { "epoch": 1.07, "learning_rate": 0.00013972382965627537, "loss": 0.0141, "step": 211790 }, { "epoch": 1.07, "learning_rate": 0.00013971626196326137, "loss": 0.0092, "step": 211800 }, { "epoch": 1.07, "learning_rate": 0.00013970869427024736, "loss": 0.0089, "step": 211810 }, { "epoch": 1.07, "learning_rate": 0.00013970112657723334, "loss": 0.0092, "step": 211820 }, { "epoch": 1.07, "learning_rate": 0.00013969355888421932, "loss": 0.0103, "step": 211830 }, { "epoch": 1.07, "learning_rate": 0.00013968599119120533, "loss": 0.011, "step": 211840 }, { "epoch": 1.07, "learning_rate": 0.0001396784234981913, "loss": 0.0109, "step": 211850 }, { "epoch": 1.07, "learning_rate": 0.0001396708558051773, "loss": 0.0123, "step": 211860 }, { "epoch": 1.07, "learning_rate": 0.0001396632881121633, "loss": 0.0113, "step": 211870 }, { "epoch": 1.07, "learning_rate": 0.00013965572041914928, "loss": 0.0112, "step": 211880 }, { "epoch": 1.07, "learning_rate": 0.00013964815272613526, "loss": 0.0076, "step": 211890 }, { "epoch": 1.07, "learning_rate": 0.00013964058503312127, "loss": 0.0117, "step": 211900 }, { "epoch": 1.07, "learning_rate": 0.00013963301734010725, "loss": 0.0105, "step": 211910 }, { "epoch": 1.07, "learning_rate": 0.00013962544964709323, "loss": 0.0103, "step": 211920 }, { "epoch": 1.07, "learning_rate": 0.00013961788195407924, "loss": 0.0105, "step": 211930 }, { "epoch": 1.07, "learning_rate": 0.00013961031426106522, "loss": 0.0103, "step": 211940 }, { "epoch": 1.07, "learning_rate": 0.0001396027465680512, "loss": 0.0091, "step": 211950 }, { "epoch": 1.07, "learning_rate": 0.0001395951788750372, "loss": 0.0099, "step": 211960 }, { "epoch": 1.07, "learning_rate": 0.0001395876111820232, "loss": 0.0086, "step": 211970 }, { "epoch": 1.07, "learning_rate": 0.00013958004348900918, "loss": 0.0117, "step": 211980 }, { "epoch": 1.07, "learning_rate": 0.00013957247579599516, "loss": 0.0097, "step": 211990 }, { "epoch": 1.07, "learning_rate": 0.00013956490810298117, "loss": 0.009, "step": 212000 }, { "epoch": 1.07, "eval_cer": 0.9144615223380336, "eval_loss": 0.007792965974658728, "eval_runtime": 116.6797, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 212000 }, { "epoch": 1.07, "learning_rate": 0.00013955734040996715, "loss": 0.01, "step": 212010 }, { "epoch": 1.07, "learning_rate": 0.00013954977271695313, "loss": 0.0111, "step": 212020 }, { "epoch": 1.07, "learning_rate": 0.00013954220502393914, "loss": 0.0078, "step": 212030 }, { "epoch": 1.07, "learning_rate": 0.00013953463733092512, "loss": 0.0154, "step": 212040 }, { "epoch": 1.07, "learning_rate": 0.0001395270696379111, "loss": 0.009, "step": 212050 }, { "epoch": 1.07, "learning_rate": 0.0001395195019448971, "loss": 0.0109, "step": 212060 }, { "epoch": 1.07, "learning_rate": 0.0001395119342518831, "loss": 0.0071, "step": 212070 }, { "epoch": 1.07, "learning_rate": 0.00013950436655886907, "loss": 0.0102, "step": 212080 }, { "epoch": 1.07, "learning_rate": 0.00013949679886585508, "loss": 0.0083, "step": 212090 }, { "epoch": 1.07, "learning_rate": 0.00013948923117284103, "loss": 0.0074, "step": 212100 }, { "epoch": 1.07, "learning_rate": 0.00013948166347982704, "loss": 0.0102, "step": 212110 }, { "epoch": 1.07, "learning_rate": 0.00013947409578681302, "loss": 0.0092, "step": 212120 }, { "epoch": 1.07, "learning_rate": 0.000139466528093799, "loss": 0.0087, "step": 212130 }, { "epoch": 1.07, "learning_rate": 0.00013945896040078501, "loss": 0.0122, "step": 212140 }, { "epoch": 1.07, "learning_rate": 0.000139451392707771, "loss": 0.0086, "step": 212150 }, { "epoch": 1.07, "learning_rate": 0.00013944382501475698, "loss": 0.0102, "step": 212160 }, { "epoch": 1.07, "learning_rate": 0.00013943625732174299, "loss": 0.0089, "step": 212170 }, { "epoch": 1.07, "learning_rate": 0.00013942868962872897, "loss": 0.0081, "step": 212180 }, { "epoch": 1.07, "learning_rate": 0.00013942112193571495, "loss": 0.0097, "step": 212190 }, { "epoch": 1.07, "learning_rate": 0.00013941355424270093, "loss": 0.0098, "step": 212200 }, { "epoch": 1.07, "learning_rate": 0.00013940598654968694, "loss": 0.0124, "step": 212210 }, { "epoch": 1.07, "learning_rate": 0.00013939841885667292, "loss": 0.011, "step": 212220 }, { "epoch": 1.07, "learning_rate": 0.0001393908511636589, "loss": 0.0101, "step": 212230 }, { "epoch": 1.07, "learning_rate": 0.0001393832834706449, "loss": 0.0108, "step": 212240 }, { "epoch": 1.07, "learning_rate": 0.0001393757157776309, "loss": 0.0095, "step": 212250 }, { "epoch": 1.07, "learning_rate": 0.00013936814808461687, "loss": 0.0105, "step": 212260 }, { "epoch": 1.07, "learning_rate": 0.00013936058039160288, "loss": 0.0098, "step": 212270 }, { "epoch": 1.07, "learning_rate": 0.00013935301269858886, "loss": 0.0075, "step": 212280 }, { "epoch": 1.07, "learning_rate": 0.00013934544500557484, "loss": 0.0106, "step": 212290 }, { "epoch": 1.07, "learning_rate": 0.00013933787731256085, "loss": 0.0093, "step": 212300 }, { "epoch": 1.07, "learning_rate": 0.00013933030961954683, "loss": 0.008, "step": 212310 }, { "epoch": 1.07, "learning_rate": 0.00013932274192653282, "loss": 0.0113, "step": 212320 }, { "epoch": 1.07, "learning_rate": 0.00013931517423351882, "loss": 0.0079, "step": 212330 }, { "epoch": 1.07, "learning_rate": 0.0001393076065405048, "loss": 0.0082, "step": 212340 }, { "epoch": 1.07, "learning_rate": 0.0001393000388474908, "loss": 0.0122, "step": 212350 }, { "epoch": 1.07, "learning_rate": 0.00013929247115447677, "loss": 0.0092, "step": 212360 }, { "epoch": 1.07, "learning_rate": 0.00013928490346146278, "loss": 0.0092, "step": 212370 }, { "epoch": 1.07, "learning_rate": 0.00013927733576844876, "loss": 0.0103, "step": 212380 }, { "epoch": 1.07, "learning_rate": 0.00013926976807543474, "loss": 0.0097, "step": 212390 }, { "epoch": 1.07, "learning_rate": 0.00013926220038242075, "loss": 0.0068, "step": 212400 }, { "epoch": 1.07, "learning_rate": 0.00013925463268940673, "loss": 0.0106, "step": 212410 }, { "epoch": 1.07, "learning_rate": 0.0001392470649963927, "loss": 0.0112, "step": 212420 }, { "epoch": 1.07, "learning_rate": 0.00013923949730337872, "loss": 0.0102, "step": 212430 }, { "epoch": 1.07, "learning_rate": 0.0001392319296103647, "loss": 0.0103, "step": 212440 }, { "epoch": 1.07, "learning_rate": 0.00013922436191735068, "loss": 0.0139, "step": 212450 }, { "epoch": 1.07, "learning_rate": 0.0001392167942243367, "loss": 0.0087, "step": 212460 }, { "epoch": 1.07, "learning_rate": 0.00013920922653132267, "loss": 0.0097, "step": 212470 }, { "epoch": 1.07, "learning_rate": 0.00013920165883830865, "loss": 0.0112, "step": 212480 }, { "epoch": 1.07, "learning_rate": 0.00013919409114529466, "loss": 0.01, "step": 212490 }, { "epoch": 1.07, "learning_rate": 0.00013918652345228064, "loss": 0.0118, "step": 212500 }, { "epoch": 1.07, "learning_rate": 0.00013917895575926663, "loss": 0.0118, "step": 212510 }, { "epoch": 1.07, "learning_rate": 0.0001391713880662526, "loss": 0.0086, "step": 212520 }, { "epoch": 1.07, "learning_rate": 0.00013916382037323862, "loss": 0.0085, "step": 212530 }, { "epoch": 1.07, "learning_rate": 0.0001391562526802246, "loss": 0.011, "step": 212540 }, { "epoch": 1.07, "learning_rate": 0.00013914868498721058, "loss": 0.0089, "step": 212550 }, { "epoch": 1.07, "learning_rate": 0.0001391411172941966, "loss": 0.01, "step": 212560 }, { "epoch": 1.07, "learning_rate": 0.00013913354960118257, "loss": 0.0079, "step": 212570 }, { "epoch": 1.07, "learning_rate": 0.00013912598190816855, "loss": 0.0084, "step": 212580 }, { "epoch": 1.07, "learning_rate": 0.00013911841421515456, "loss": 0.0101, "step": 212590 }, { "epoch": 1.07, "learning_rate": 0.00013911084652214054, "loss": 0.0097, "step": 212600 }, { "epoch": 1.07, "learning_rate": 0.00013910327882912652, "loss": 0.0119, "step": 212610 }, { "epoch": 1.07, "learning_rate": 0.00013909571113611253, "loss": 0.0095, "step": 212620 }, { "epoch": 1.07, "learning_rate": 0.0001390881434430985, "loss": 0.0101, "step": 212630 }, { "epoch": 1.07, "learning_rate": 0.0001390805757500845, "loss": 0.0093, "step": 212640 }, { "epoch": 1.07, "learning_rate": 0.0001390730080570705, "loss": 0.0093, "step": 212650 }, { "epoch": 1.07, "learning_rate": 0.00013906544036405648, "loss": 0.0098, "step": 212660 }, { "epoch": 1.07, "learning_rate": 0.00013905787267104246, "loss": 0.0101, "step": 212670 }, { "epoch": 1.07, "learning_rate": 0.00013905030497802845, "loss": 0.011, "step": 212680 }, { "epoch": 1.07, "learning_rate": 0.00013904273728501445, "loss": 0.0094, "step": 212690 }, { "epoch": 1.07, "learning_rate": 0.00013903516959200044, "loss": 0.0106, "step": 212700 }, { "epoch": 1.07, "learning_rate": 0.00013902760189898642, "loss": 0.0072, "step": 212710 }, { "epoch": 1.07, "learning_rate": 0.00013902003420597243, "loss": 0.0092, "step": 212720 }, { "epoch": 1.07, "learning_rate": 0.00013901246651295838, "loss": 0.0094, "step": 212730 }, { "epoch": 1.07, "learning_rate": 0.0001390048988199444, "loss": 0.0127, "step": 212740 }, { "epoch": 1.07, "learning_rate": 0.00013899733112693037, "loss": 0.0099, "step": 212750 }, { "epoch": 1.07, "learning_rate": 0.00013898976343391635, "loss": 0.009, "step": 212760 }, { "epoch": 1.07, "learning_rate": 0.00013898219574090236, "loss": 0.0123, "step": 212770 }, { "epoch": 1.07, "learning_rate": 0.00013897462804788834, "loss": 0.0099, "step": 212780 }, { "epoch": 1.07, "learning_rate": 0.00013896706035487432, "loss": 0.0091, "step": 212790 }, { "epoch": 1.07, "learning_rate": 0.00013895949266186033, "loss": 0.011, "step": 212800 }, { "epoch": 1.07, "learning_rate": 0.0001389519249688463, "loss": 0.0112, "step": 212810 }, { "epoch": 1.07, "learning_rate": 0.0001389443572758323, "loss": 0.0082, "step": 212820 }, { "epoch": 1.07, "learning_rate": 0.0001389367895828183, "loss": 0.0075, "step": 212830 }, { "epoch": 1.07, "learning_rate": 0.00013892922188980428, "loss": 0.0085, "step": 212840 }, { "epoch": 1.07, "learning_rate": 0.00013892165419679027, "loss": 0.0108, "step": 212850 }, { "epoch": 1.07, "learning_rate": 0.00013891408650377627, "loss": 0.0089, "step": 212860 }, { "epoch": 1.07, "learning_rate": 0.00013890651881076226, "loss": 0.0096, "step": 212870 }, { "epoch": 1.07, "learning_rate": 0.00013889895111774824, "loss": 0.0092, "step": 212880 }, { "epoch": 1.07, "learning_rate": 0.00013889138342473422, "loss": 0.0083, "step": 212890 }, { "epoch": 1.07, "learning_rate": 0.00013888381573172023, "loss": 0.0085, "step": 212900 }, { "epoch": 1.07, "learning_rate": 0.0001388762480387062, "loss": 0.011, "step": 212910 }, { "epoch": 1.07, "learning_rate": 0.0001388686803456922, "loss": 0.0089, "step": 212920 }, { "epoch": 1.07, "learning_rate": 0.0001388611126526782, "loss": 0.0129, "step": 212930 }, { "epoch": 1.07, "learning_rate": 0.00013885354495966418, "loss": 0.0093, "step": 212940 }, { "epoch": 1.07, "learning_rate": 0.00013884597726665016, "loss": 0.0101, "step": 212950 }, { "epoch": 1.07, "learning_rate": 0.00013883840957363617, "loss": 0.0133, "step": 212960 }, { "epoch": 1.07, "learning_rate": 0.00013883084188062215, "loss": 0.0119, "step": 212970 }, { "epoch": 1.07, "learning_rate": 0.00013882327418760813, "loss": 0.0106, "step": 212980 }, { "epoch": 1.07, "learning_rate": 0.00013881570649459414, "loss": 0.0077, "step": 212990 }, { "epoch": 1.07, "learning_rate": 0.00013880813880158012, "loss": 0.0184, "step": 213000 }, { "epoch": 1.07, "eval_cer": 0.914481900656667, "eval_loss": 0.007489955984055996, "eval_runtime": 116.6491, "eval_samples_per_second": 17.145, "eval_steps_per_second": 4.286, "step": 213000 }, { "epoch": 1.07, "learning_rate": 0.0001388005711085661, "loss": 0.011, "step": 213010 }, { "epoch": 1.07, "learning_rate": 0.0001387930034155521, "loss": 0.0117, "step": 213020 }, { "epoch": 1.07, "learning_rate": 0.0001387854357225381, "loss": 0.0105, "step": 213030 }, { "epoch": 1.07, "learning_rate": 0.00013877786802952408, "loss": 0.0092, "step": 213040 }, { "epoch": 1.07, "learning_rate": 0.00013877030033651006, "loss": 0.0097, "step": 213050 }, { "epoch": 1.07, "learning_rate": 0.00013876273264349607, "loss": 0.0091, "step": 213060 }, { "epoch": 1.07, "learning_rate": 0.00013875516495048205, "loss": 0.0091, "step": 213070 }, { "epoch": 1.08, "learning_rate": 0.00013874759725746803, "loss": 0.0087, "step": 213080 }, { "epoch": 1.08, "learning_rate": 0.00013874002956445404, "loss": 0.0087, "step": 213090 }, { "epoch": 1.08, "learning_rate": 0.00013873246187144002, "loss": 0.0103, "step": 213100 }, { "epoch": 1.08, "learning_rate": 0.000138724894178426, "loss": 0.0094, "step": 213110 }, { "epoch": 1.08, "learning_rate": 0.000138717326485412, "loss": 0.0111, "step": 213120 }, { "epoch": 1.08, "learning_rate": 0.000138709758792398, "loss": 0.0108, "step": 213130 }, { "epoch": 1.08, "learning_rate": 0.00013870219109938397, "loss": 0.0071, "step": 213140 }, { "epoch": 1.08, "learning_rate": 0.00013869462340636998, "loss": 0.0082, "step": 213150 }, { "epoch": 1.08, "learning_rate": 0.00013868705571335596, "loss": 0.0103, "step": 213160 }, { "epoch": 1.08, "learning_rate": 0.00013867948802034194, "loss": 0.0134, "step": 213170 }, { "epoch": 1.08, "learning_rate": 0.00013867192032732795, "loss": 0.0127, "step": 213180 }, { "epoch": 1.08, "learning_rate": 0.00013866435263431393, "loss": 0.0096, "step": 213190 }, { "epoch": 1.08, "learning_rate": 0.00013865678494129991, "loss": 0.0091, "step": 213200 }, { "epoch": 1.08, "learning_rate": 0.00013864921724828592, "loss": 0.0071, "step": 213210 }, { "epoch": 1.08, "learning_rate": 0.0001386416495552719, "loss": 0.0107, "step": 213220 }, { "epoch": 1.08, "learning_rate": 0.00013863408186225789, "loss": 0.0083, "step": 213230 }, { "epoch": 1.08, "learning_rate": 0.00013862651416924387, "loss": 0.0122, "step": 213240 }, { "epoch": 1.08, "learning_rate": 0.00013861894647622988, "loss": 0.0085, "step": 213250 }, { "epoch": 1.08, "learning_rate": 0.00013861137878321586, "loss": 0.0061, "step": 213260 }, { "epoch": 1.08, "learning_rate": 0.00013860381109020184, "loss": 0.0101, "step": 213270 }, { "epoch": 1.08, "learning_rate": 0.00013859624339718785, "loss": 0.0075, "step": 213280 }, { "epoch": 1.08, "learning_rate": 0.00013858867570417383, "loss": 0.0109, "step": 213290 }, { "epoch": 1.08, "learning_rate": 0.0001385811080111598, "loss": 0.0111, "step": 213300 }, { "epoch": 1.08, "learning_rate": 0.00013857354031814582, "loss": 0.0097, "step": 213310 }, { "epoch": 1.08, "learning_rate": 0.0001385659726251318, "loss": 0.0098, "step": 213320 }, { "epoch": 1.08, "learning_rate": 0.00013855840493211778, "loss": 0.0103, "step": 213330 }, { "epoch": 1.08, "learning_rate": 0.0001385508372391038, "loss": 0.0092, "step": 213340 }, { "epoch": 1.08, "learning_rate": 0.00013854326954608977, "loss": 0.0097, "step": 213350 }, { "epoch": 1.08, "learning_rate": 0.00013853570185307575, "loss": 0.0083, "step": 213360 }, { "epoch": 1.08, "learning_rate": 0.00013852813416006173, "loss": 0.0097, "step": 213370 }, { "epoch": 1.08, "learning_rate": 0.00013852056646704772, "loss": 0.0107, "step": 213380 }, { "epoch": 1.08, "learning_rate": 0.00013851299877403372, "loss": 0.0112, "step": 213390 }, { "epoch": 1.08, "learning_rate": 0.0001385054310810197, "loss": 0.0116, "step": 213400 }, { "epoch": 1.08, "learning_rate": 0.0001384978633880057, "loss": 0.0087, "step": 213410 }, { "epoch": 1.08, "learning_rate": 0.00013849029569499167, "loss": 0.0097, "step": 213420 }, { "epoch": 1.08, "learning_rate": 0.00013848272800197768, "loss": 0.0118, "step": 213430 }, { "epoch": 1.08, "learning_rate": 0.00013847516030896366, "loss": 0.0093, "step": 213440 }, { "epoch": 1.08, "learning_rate": 0.00013846759261594964, "loss": 0.0105, "step": 213450 }, { "epoch": 1.08, "learning_rate": 0.00013846002492293565, "loss": 0.0084, "step": 213460 }, { "epoch": 1.08, "learning_rate": 0.00013845245722992163, "loss": 0.0083, "step": 213470 }, { "epoch": 1.08, "learning_rate": 0.0001384448895369076, "loss": 0.0076, "step": 213480 }, { "epoch": 1.08, "learning_rate": 0.00013843732184389362, "loss": 0.0096, "step": 213490 }, { "epoch": 1.08, "learning_rate": 0.0001384297541508796, "loss": 0.0099, "step": 213500 }, { "epoch": 1.08, "learning_rate": 0.00013842218645786558, "loss": 0.0102, "step": 213510 }, { "epoch": 1.08, "learning_rate": 0.0001384146187648516, "loss": 0.0087, "step": 213520 }, { "epoch": 1.08, "learning_rate": 0.00013840705107183757, "loss": 0.0092, "step": 213530 }, { "epoch": 1.08, "learning_rate": 0.00013839948337882355, "loss": 0.0075, "step": 213540 }, { "epoch": 1.08, "learning_rate": 0.00013839191568580956, "loss": 0.0081, "step": 213550 }, { "epoch": 1.08, "learning_rate": 0.00013838434799279554, "loss": 0.0093, "step": 213560 }, { "epoch": 1.08, "learning_rate": 0.00013837678029978153, "loss": 0.01, "step": 213570 }, { "epoch": 1.08, "learning_rate": 0.0001383692126067675, "loss": 0.01, "step": 213580 }, { "epoch": 1.08, "learning_rate": 0.00013836164491375352, "loss": 0.011, "step": 213590 }, { "epoch": 1.08, "learning_rate": 0.0001383540772207395, "loss": 0.0079, "step": 213600 }, { "epoch": 1.08, "learning_rate": 0.00013834650952772548, "loss": 0.0096, "step": 213610 }, { "epoch": 1.08, "learning_rate": 0.0001383389418347115, "loss": 0.0082, "step": 213620 }, { "epoch": 1.08, "learning_rate": 0.00013833137414169747, "loss": 0.0092, "step": 213630 }, { "epoch": 1.08, "learning_rate": 0.00013832380644868345, "loss": 0.008, "step": 213640 }, { "epoch": 1.08, "learning_rate": 0.00013831623875566946, "loss": 0.0092, "step": 213650 }, { "epoch": 1.08, "learning_rate": 0.00013830867106265544, "loss": 0.0097, "step": 213660 }, { "epoch": 1.08, "learning_rate": 0.00013830110336964142, "loss": 0.0099, "step": 213670 }, { "epoch": 1.08, "learning_rate": 0.00013829353567662743, "loss": 0.0108, "step": 213680 }, { "epoch": 1.08, "learning_rate": 0.0001382859679836134, "loss": 0.0082, "step": 213690 }, { "epoch": 1.08, "learning_rate": 0.0001382784002905994, "loss": 0.0095, "step": 213700 }, { "epoch": 1.08, "learning_rate": 0.0001382708325975854, "loss": 0.0093, "step": 213710 }, { "epoch": 1.08, "learning_rate": 0.00013826326490457138, "loss": 0.009, "step": 213720 }, { "epoch": 1.08, "learning_rate": 0.00013825569721155736, "loss": 0.0087, "step": 213730 }, { "epoch": 1.08, "learning_rate": 0.00013824812951854337, "loss": 0.0094, "step": 213740 }, { "epoch": 1.08, "learning_rate": 0.00013824056182552935, "loss": 0.0098, "step": 213750 }, { "epoch": 1.08, "learning_rate": 0.00013823299413251534, "loss": 0.0118, "step": 213760 }, { "epoch": 1.08, "learning_rate": 0.00013822542643950132, "loss": 0.0106, "step": 213770 }, { "epoch": 1.08, "learning_rate": 0.00013821785874648733, "loss": 0.0091, "step": 213780 }, { "epoch": 1.08, "learning_rate": 0.0001382102910534733, "loss": 0.01, "step": 213790 }, { "epoch": 1.08, "learning_rate": 0.0001382027233604593, "loss": 0.0074, "step": 213800 }, { "epoch": 1.08, "learning_rate": 0.0001381951556674453, "loss": 0.0104, "step": 213810 }, { "epoch": 1.08, "learning_rate": 0.00013818758797443128, "loss": 0.0124, "step": 213820 }, { "epoch": 1.08, "learning_rate": 0.00013818002028141726, "loss": 0.0092, "step": 213830 }, { "epoch": 1.08, "learning_rate": 0.00013817245258840327, "loss": 0.0077, "step": 213840 }, { "epoch": 1.08, "learning_rate": 0.00013816488489538925, "loss": 0.0114, "step": 213850 }, { "epoch": 1.08, "learning_rate": 0.00013815731720237523, "loss": 0.0116, "step": 213860 }, { "epoch": 1.08, "learning_rate": 0.00013814974950936124, "loss": 0.0092, "step": 213870 }, { "epoch": 1.08, "learning_rate": 0.00013814218181634722, "loss": 0.0102, "step": 213880 }, { "epoch": 1.08, "learning_rate": 0.0001381346141233332, "loss": 0.0085, "step": 213890 }, { "epoch": 1.08, "learning_rate": 0.0001381270464303192, "loss": 0.0094, "step": 213900 }, { "epoch": 1.08, "learning_rate": 0.0001381194787373052, "loss": 0.0079, "step": 213910 }, { "epoch": 1.08, "learning_rate": 0.00013811191104429117, "loss": 0.011, "step": 213920 }, { "epoch": 1.08, "learning_rate": 0.00013810434335127716, "loss": 0.0097, "step": 213930 }, { "epoch": 1.08, "learning_rate": 0.00013809677565826316, "loss": 0.009, "step": 213940 }, { "epoch": 1.08, "learning_rate": 0.00013808920796524915, "loss": 0.0091, "step": 213950 }, { "epoch": 1.08, "learning_rate": 0.00013808164027223513, "loss": 0.0104, "step": 213960 }, { "epoch": 1.08, "learning_rate": 0.00013807407257922114, "loss": 0.0152, "step": 213970 }, { "epoch": 1.08, "learning_rate": 0.00013806650488620712, "loss": 0.0104, "step": 213980 }, { "epoch": 1.08, "learning_rate": 0.0001380589371931931, "loss": 0.0146, "step": 213990 }, { "epoch": 1.08, "learning_rate": 0.00013805136950017908, "loss": 0.0098, "step": 214000 }, { "epoch": 1.08, "eval_cer": 0.9144392032271493, "eval_loss": 0.0074865869246423244, "eval_runtime": 116.6822, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 214000 }, { "epoch": 1.08, "learning_rate": 0.00013804380180716506, "loss": 0.0103, "step": 214010 }, { "epoch": 1.08, "learning_rate": 0.00013803623411415107, "loss": 0.0094, "step": 214020 }, { "epoch": 1.08, "learning_rate": 0.00013802866642113705, "loss": 0.0128, "step": 214030 }, { "epoch": 1.08, "learning_rate": 0.00013802109872812303, "loss": 0.011, "step": 214040 }, { "epoch": 1.08, "learning_rate": 0.00013801353103510904, "loss": 0.0086, "step": 214050 }, { "epoch": 1.08, "learning_rate": 0.00013800596334209502, "loss": 0.01, "step": 214060 }, { "epoch": 1.08, "learning_rate": 0.000137998395649081, "loss": 0.0124, "step": 214070 }, { "epoch": 1.08, "learning_rate": 0.000137990827956067, "loss": 0.0109, "step": 214080 }, { "epoch": 1.08, "learning_rate": 0.000137983260263053, "loss": 0.0105, "step": 214090 }, { "epoch": 1.08, "learning_rate": 0.00013797569257003898, "loss": 0.0111, "step": 214100 }, { "epoch": 1.08, "learning_rate": 0.00013796812487702498, "loss": 0.0144, "step": 214110 }, { "epoch": 1.08, "learning_rate": 0.00013796055718401097, "loss": 0.0105, "step": 214120 }, { "epoch": 1.08, "learning_rate": 0.00013795298949099695, "loss": 0.008, "step": 214130 }, { "epoch": 1.08, "learning_rate": 0.00013794542179798293, "loss": 0.0092, "step": 214140 }, { "epoch": 1.08, "learning_rate": 0.00013793785410496894, "loss": 0.0135, "step": 214150 }, { "epoch": 1.08, "learning_rate": 0.00013793028641195492, "loss": 0.0098, "step": 214160 }, { "epoch": 1.08, "learning_rate": 0.0001379227187189409, "loss": 0.0086, "step": 214170 }, { "epoch": 1.08, "learning_rate": 0.0001379151510259269, "loss": 0.0082, "step": 214180 }, { "epoch": 1.08, "learning_rate": 0.0001379075833329129, "loss": 0.0113, "step": 214190 }, { "epoch": 1.08, "learning_rate": 0.00013790001563989887, "loss": 0.0094, "step": 214200 }, { "epoch": 1.08, "learning_rate": 0.00013789244794688488, "loss": 0.0099, "step": 214210 }, { "epoch": 1.08, "learning_rate": 0.00013788488025387086, "loss": 0.0116, "step": 214220 }, { "epoch": 1.08, "learning_rate": 0.00013787731256085684, "loss": 0.0084, "step": 214230 }, { "epoch": 1.08, "learning_rate": 0.00013786974486784285, "loss": 0.0087, "step": 214240 }, { "epoch": 1.08, "learning_rate": 0.00013786217717482883, "loss": 0.0097, "step": 214250 }, { "epoch": 1.08, "learning_rate": 0.00013785460948181481, "loss": 0.0086, "step": 214260 }, { "epoch": 1.08, "learning_rate": 0.00013784704178880082, "loss": 0.0096, "step": 214270 }, { "epoch": 1.08, "learning_rate": 0.0001378394740957868, "loss": 0.0099, "step": 214280 }, { "epoch": 1.08, "learning_rate": 0.00013783190640277279, "loss": 0.007, "step": 214290 }, { "epoch": 1.08, "learning_rate": 0.00013782433870975877, "loss": 0.0097, "step": 214300 }, { "epoch": 1.08, "learning_rate": 0.00013781677101674478, "loss": 0.0114, "step": 214310 }, { "epoch": 1.08, "learning_rate": 0.00013780920332373076, "loss": 0.01, "step": 214320 }, { "epoch": 1.08, "learning_rate": 0.00013780163563071674, "loss": 0.0089, "step": 214330 }, { "epoch": 1.08, "learning_rate": 0.00013779406793770275, "loss": 0.009, "step": 214340 }, { "epoch": 1.08, "learning_rate": 0.00013778650024468873, "loss": 0.0087, "step": 214350 }, { "epoch": 1.08, "learning_rate": 0.0001377789325516747, "loss": 0.0122, "step": 214360 }, { "epoch": 1.08, "learning_rate": 0.00013777136485866072, "loss": 0.0096, "step": 214370 }, { "epoch": 1.08, "learning_rate": 0.0001377637971656467, "loss": 0.0093, "step": 214380 }, { "epoch": 1.08, "learning_rate": 0.00013775622947263268, "loss": 0.0081, "step": 214390 }, { "epoch": 1.08, "learning_rate": 0.0001377486617796187, "loss": 0.0103, "step": 214400 }, { "epoch": 1.08, "learning_rate": 0.00013774109408660467, "loss": 0.0087, "step": 214410 }, { "epoch": 1.08, "learning_rate": 0.00013773352639359065, "loss": 0.0113, "step": 214420 }, { "epoch": 1.08, "learning_rate": 0.00013772595870057666, "loss": 0.0092, "step": 214430 }, { "epoch": 1.08, "learning_rate": 0.00013771839100756264, "loss": 0.008, "step": 214440 }, { "epoch": 1.08, "learning_rate": 0.00013771082331454862, "loss": 0.0075, "step": 214450 }, { "epoch": 1.08, "learning_rate": 0.0001377032556215346, "loss": 0.01, "step": 214460 }, { "epoch": 1.08, "learning_rate": 0.00013769568792852061, "loss": 0.0104, "step": 214470 }, { "epoch": 1.08, "learning_rate": 0.0001376881202355066, "loss": 0.0086, "step": 214480 }, { "epoch": 1.08, "learning_rate": 0.00013768055254249258, "loss": 0.0102, "step": 214490 }, { "epoch": 1.08, "learning_rate": 0.00013767298484947859, "loss": 0.014, "step": 214500 }, { "epoch": 1.08, "learning_rate": 0.00013766541715646457, "loss": 0.0109, "step": 214510 }, { "epoch": 1.08, "learning_rate": 0.00013765784946345055, "loss": 0.0106, "step": 214520 }, { "epoch": 1.08, "learning_rate": 0.00013765028177043656, "loss": 0.009, "step": 214530 }, { "epoch": 1.08, "learning_rate": 0.00013764271407742254, "loss": 0.0089, "step": 214540 }, { "epoch": 1.08, "learning_rate": 0.00013763514638440852, "loss": 0.0108, "step": 214550 }, { "epoch": 1.08, "learning_rate": 0.00013762757869139453, "loss": 0.0069, "step": 214560 }, { "epoch": 1.08, "learning_rate": 0.0001376200109983805, "loss": 0.009, "step": 214570 }, { "epoch": 1.08, "learning_rate": 0.0001376124433053665, "loss": 0.0082, "step": 214580 }, { "epoch": 1.08, "learning_rate": 0.0001376048756123525, "loss": 0.011, "step": 214590 }, { "epoch": 1.08, "learning_rate": 0.00013759730791933848, "loss": 0.0095, "step": 214600 }, { "epoch": 1.08, "learning_rate": 0.00013758974022632446, "loss": 0.0083, "step": 214610 }, { "epoch": 1.08, "learning_rate": 0.00013758217253331045, "loss": 0.0088, "step": 214620 }, { "epoch": 1.08, "learning_rate": 0.00013757460484029643, "loss": 0.0087, "step": 214630 }, { "epoch": 1.08, "learning_rate": 0.00013756703714728244, "loss": 0.0103, "step": 214640 }, { "epoch": 1.08, "learning_rate": 0.00013755946945426842, "loss": 0.0119, "step": 214650 }, { "epoch": 1.08, "learning_rate": 0.0001375519017612544, "loss": 0.0121, "step": 214660 }, { "epoch": 1.08, "learning_rate": 0.00013754433406824038, "loss": 0.0101, "step": 214670 }, { "epoch": 1.08, "learning_rate": 0.0001375367663752264, "loss": 0.0107, "step": 214680 }, { "epoch": 1.08, "learning_rate": 0.00013752919868221237, "loss": 0.0103, "step": 214690 }, { "epoch": 1.08, "learning_rate": 0.00013752163098919835, "loss": 0.0136, "step": 214700 }, { "epoch": 1.08, "learning_rate": 0.00013751406329618436, "loss": 0.009, "step": 214710 }, { "epoch": 1.08, "learning_rate": 0.00013750649560317034, "loss": 0.0119, "step": 214720 }, { "epoch": 1.08, "learning_rate": 0.00013749892791015632, "loss": 0.0089, "step": 214730 }, { "epoch": 1.08, "learning_rate": 0.00013749136021714233, "loss": 0.0116, "step": 214740 }, { "epoch": 1.08, "learning_rate": 0.0001374837925241283, "loss": 0.0084, "step": 214750 }, { "epoch": 1.08, "learning_rate": 0.0001374762248311143, "loss": 0.0111, "step": 214760 }, { "epoch": 1.08, "learning_rate": 0.0001374686571381003, "loss": 0.0124, "step": 214770 }, { "epoch": 1.08, "learning_rate": 0.00013746108944508628, "loss": 0.0078, "step": 214780 }, { "epoch": 1.08, "learning_rate": 0.00013745352175207227, "loss": 0.0073, "step": 214790 }, { "epoch": 1.08, "learning_rate": 0.00013744595405905827, "loss": 0.0096, "step": 214800 }, { "epoch": 1.08, "learning_rate": 0.00013743838636604426, "loss": 0.0097, "step": 214810 }, { "epoch": 1.08, "learning_rate": 0.00013743081867303024, "loss": 0.0107, "step": 214820 }, { "epoch": 1.08, "learning_rate": 0.00013742325098001622, "loss": 0.0073, "step": 214830 }, { "epoch": 1.08, "learning_rate": 0.00013741568328700223, "loss": 0.0113, "step": 214840 }, { "epoch": 1.08, "learning_rate": 0.0001374081155939882, "loss": 0.0089, "step": 214850 }, { "epoch": 1.08, "learning_rate": 0.0001374005479009742, "loss": 0.0104, "step": 214860 }, { "epoch": 1.08, "learning_rate": 0.0001373929802079602, "loss": 0.0089, "step": 214870 }, { "epoch": 1.08, "learning_rate": 0.00013738541251494618, "loss": 0.0081, "step": 214880 }, { "epoch": 1.08, "learning_rate": 0.00013737784482193216, "loss": 0.0087, "step": 214890 }, { "epoch": 1.08, "learning_rate": 0.00013737027712891817, "loss": 0.0083, "step": 214900 }, { "epoch": 1.08, "learning_rate": 0.00013736270943590415, "loss": 0.0077, "step": 214910 }, { "epoch": 1.08, "learning_rate": 0.00013735514174289013, "loss": 0.0095, "step": 214920 }, { "epoch": 1.08, "learning_rate": 0.00013734757404987614, "loss": 0.0098, "step": 214930 }, { "epoch": 1.08, "learning_rate": 0.00013734000635686212, "loss": 0.0137, "step": 214940 }, { "epoch": 1.08, "learning_rate": 0.0001373324386638481, "loss": 0.0117, "step": 214950 }, { "epoch": 1.08, "learning_rate": 0.0001373248709708341, "loss": 0.0105, "step": 214960 }, { "epoch": 1.08, "learning_rate": 0.0001373173032778201, "loss": 0.0105, "step": 214970 }, { "epoch": 1.08, "learning_rate": 0.00013730973558480608, "loss": 0.0104, "step": 214980 }, { "epoch": 1.08, "learning_rate": 0.00013730216789179206, "loss": 0.0088, "step": 214990 }, { "epoch": 1.08, "learning_rate": 0.00013729460019877807, "loss": 0.0132, "step": 215000 }, { "epoch": 1.08, "eval_cer": 0.9144809302605417, "eval_loss": 0.0071860929019749165, "eval_runtime": 116.5447, "eval_samples_per_second": 17.161, "eval_steps_per_second": 4.29, "step": 215000 }, { "epoch": 1.08, "learning_rate": 0.00013728703250576405, "loss": 0.013, "step": 215010 }, { "epoch": 1.08, "learning_rate": 0.00013727946481275003, "loss": 0.011, "step": 215020 }, { "epoch": 1.08, "learning_rate": 0.00013727189711973604, "loss": 0.0118, "step": 215030 }, { "epoch": 1.08, "learning_rate": 0.00013726432942672202, "loss": 0.0071, "step": 215040 }, { "epoch": 1.08, "learning_rate": 0.000137256761733708, "loss": 0.009, "step": 215050 }, { "epoch": 1.09, "learning_rate": 0.000137249194040694, "loss": 0.0086, "step": 215060 }, { "epoch": 1.09, "learning_rate": 0.00013724162634768, "loss": 0.0097, "step": 215070 }, { "epoch": 1.09, "learning_rate": 0.00013723405865466597, "loss": 0.0097, "step": 215080 }, { "epoch": 1.09, "learning_rate": 0.00013722649096165198, "loss": 0.0091, "step": 215090 }, { "epoch": 1.09, "learning_rate": 0.00013721892326863796, "loss": 0.0101, "step": 215100 }, { "epoch": 1.09, "learning_rate": 0.00013721135557562394, "loss": 0.009, "step": 215110 }, { "epoch": 1.09, "learning_rate": 0.00013720378788260995, "loss": 0.0098, "step": 215120 }, { "epoch": 1.09, "learning_rate": 0.00013719622018959593, "loss": 0.0091, "step": 215130 }, { "epoch": 1.09, "learning_rate": 0.00013718865249658191, "loss": 0.0101, "step": 215140 }, { "epoch": 1.09, "learning_rate": 0.00013718108480356792, "loss": 0.0105, "step": 215150 }, { "epoch": 1.09, "learning_rate": 0.0001371735171105539, "loss": 0.0113, "step": 215160 }, { "epoch": 1.09, "learning_rate": 0.00013716594941753989, "loss": 0.0086, "step": 215170 }, { "epoch": 1.09, "learning_rate": 0.00013715838172452587, "loss": 0.0079, "step": 215180 }, { "epoch": 1.09, "learning_rate": 0.00013715081403151188, "loss": 0.0093, "step": 215190 }, { "epoch": 1.09, "learning_rate": 0.00013714324633849786, "loss": 0.0104, "step": 215200 }, { "epoch": 1.09, "learning_rate": 0.00013713567864548384, "loss": 0.0091, "step": 215210 }, { "epoch": 1.09, "learning_rate": 0.00013712811095246985, "loss": 0.0082, "step": 215220 }, { "epoch": 1.09, "learning_rate": 0.00013712054325945583, "loss": 0.0078, "step": 215230 }, { "epoch": 1.09, "learning_rate": 0.0001371129755664418, "loss": 0.0113, "step": 215240 }, { "epoch": 1.09, "learning_rate": 0.0001371054078734278, "loss": 0.0091, "step": 215250 }, { "epoch": 1.09, "learning_rate": 0.00013709784018041377, "loss": 0.0109, "step": 215260 }, { "epoch": 1.09, "learning_rate": 0.00013709027248739978, "loss": 0.0121, "step": 215270 }, { "epoch": 1.09, "learning_rate": 0.00013708270479438576, "loss": 0.0096, "step": 215280 }, { "epoch": 1.09, "learning_rate": 0.00013707513710137174, "loss": 0.0102, "step": 215290 }, { "epoch": 1.09, "learning_rate": 0.00013706756940835775, "loss": 0.0075, "step": 215300 }, { "epoch": 1.09, "learning_rate": 0.00013706000171534373, "loss": 0.0089, "step": 215310 }, { "epoch": 1.09, "learning_rate": 0.00013705243402232972, "loss": 0.009, "step": 215320 }, { "epoch": 1.09, "learning_rate": 0.00013704486632931572, "loss": 0.0069, "step": 215330 }, { "epoch": 1.09, "learning_rate": 0.0001370372986363017, "loss": 0.0092, "step": 215340 }, { "epoch": 1.09, "learning_rate": 0.0001370297309432877, "loss": 0.0125, "step": 215350 }, { "epoch": 1.09, "learning_rate": 0.00013702216325027367, "loss": 0.0107, "step": 215360 }, { "epoch": 1.09, "learning_rate": 0.00013701459555725968, "loss": 0.0099, "step": 215370 }, { "epoch": 1.09, "learning_rate": 0.00013700702786424566, "loss": 0.0116, "step": 215380 }, { "epoch": 1.09, "learning_rate": 0.00013699946017123164, "loss": 0.0101, "step": 215390 }, { "epoch": 1.09, "learning_rate": 0.00013699189247821765, "loss": 0.009, "step": 215400 }, { "epoch": 1.09, "learning_rate": 0.00013698432478520363, "loss": 0.0079, "step": 215410 }, { "epoch": 1.09, "learning_rate": 0.0001369767570921896, "loss": 0.014, "step": 215420 }, { "epoch": 1.09, "learning_rate": 0.00013696918939917562, "loss": 0.0104, "step": 215430 }, { "epoch": 1.09, "learning_rate": 0.0001369616217061616, "loss": 0.0123, "step": 215440 }, { "epoch": 1.09, "learning_rate": 0.00013695405401314758, "loss": 0.0127, "step": 215450 }, { "epoch": 1.09, "learning_rate": 0.0001369464863201336, "loss": 0.0098, "step": 215460 }, { "epoch": 1.09, "learning_rate": 0.00013693891862711957, "loss": 0.0119, "step": 215470 }, { "epoch": 1.09, "learning_rate": 0.00013693135093410555, "loss": 0.0069, "step": 215480 }, { "epoch": 1.09, "learning_rate": 0.00013692378324109156, "loss": 0.0138, "step": 215490 }, { "epoch": 1.09, "learning_rate": 0.00013691621554807754, "loss": 0.0085, "step": 215500 }, { "epoch": 1.09, "learning_rate": 0.00013690864785506353, "loss": 0.0105, "step": 215510 }, { "epoch": 1.09, "learning_rate": 0.0001369010801620495, "loss": 0.0083, "step": 215520 }, { "epoch": 1.09, "learning_rate": 0.00013689351246903552, "loss": 0.0092, "step": 215530 }, { "epoch": 1.09, "learning_rate": 0.0001368859447760215, "loss": 0.0088, "step": 215540 }, { "epoch": 1.09, "learning_rate": 0.00013687837708300748, "loss": 0.0083, "step": 215550 }, { "epoch": 1.09, "learning_rate": 0.0001368708093899935, "loss": 0.0084, "step": 215560 }, { "epoch": 1.09, "learning_rate": 0.00013686324169697947, "loss": 0.0087, "step": 215570 }, { "epoch": 1.09, "learning_rate": 0.00013685567400396545, "loss": 0.0096, "step": 215580 }, { "epoch": 1.09, "learning_rate": 0.00013684810631095146, "loss": 0.0116, "step": 215590 }, { "epoch": 1.09, "learning_rate": 0.00013684053861793744, "loss": 0.0082, "step": 215600 }, { "epoch": 1.09, "learning_rate": 0.00013683297092492342, "loss": 0.0095, "step": 215610 }, { "epoch": 1.09, "learning_rate": 0.00013682540323190943, "loss": 0.009, "step": 215620 }, { "epoch": 1.09, "learning_rate": 0.0001368178355388954, "loss": 0.0098, "step": 215630 }, { "epoch": 1.09, "learning_rate": 0.0001368102678458814, "loss": 0.0116, "step": 215640 }, { "epoch": 1.09, "learning_rate": 0.0001368027001528674, "loss": 0.0128, "step": 215650 }, { "epoch": 1.09, "learning_rate": 0.00013679513245985338, "loss": 0.0094, "step": 215660 }, { "epoch": 1.09, "learning_rate": 0.00013678756476683936, "loss": 0.0093, "step": 215670 }, { "epoch": 1.09, "learning_rate": 0.00013677999707382537, "loss": 0.0112, "step": 215680 }, { "epoch": 1.09, "learning_rate": 0.00013677242938081135, "loss": 0.0098, "step": 215690 }, { "epoch": 1.09, "learning_rate": 0.00013676486168779734, "loss": 0.0089, "step": 215700 }, { "epoch": 1.09, "learning_rate": 0.00013675729399478332, "loss": 0.0084, "step": 215710 }, { "epoch": 1.09, "learning_rate": 0.00013674972630176933, "loss": 0.0109, "step": 215720 }, { "epoch": 1.09, "learning_rate": 0.0001367421586087553, "loss": 0.012, "step": 215730 }, { "epoch": 1.09, "learning_rate": 0.0001367345909157413, "loss": 0.0104, "step": 215740 }, { "epoch": 1.09, "learning_rate": 0.0001367270232227273, "loss": 0.0097, "step": 215750 }, { "epoch": 1.09, "learning_rate": 0.00013671945552971328, "loss": 0.0086, "step": 215760 }, { "epoch": 1.09, "learning_rate": 0.00013671188783669926, "loss": 0.0112, "step": 215770 }, { "epoch": 1.09, "learning_rate": 0.00013670432014368527, "loss": 0.0066, "step": 215780 }, { "epoch": 1.09, "learning_rate": 0.00013669675245067125, "loss": 0.0102, "step": 215790 }, { "epoch": 1.09, "learning_rate": 0.00013668918475765723, "loss": 0.0091, "step": 215800 }, { "epoch": 1.09, "learning_rate": 0.00013668161706464324, "loss": 0.0097, "step": 215810 }, { "epoch": 1.09, "learning_rate": 0.00013667404937162922, "loss": 0.0108, "step": 215820 }, { "epoch": 1.09, "learning_rate": 0.0001366664816786152, "loss": 0.0092, "step": 215830 }, { "epoch": 1.09, "learning_rate": 0.0001366589139856012, "loss": 0.0093, "step": 215840 }, { "epoch": 1.09, "learning_rate": 0.0001366513462925872, "loss": 0.0085, "step": 215850 }, { "epoch": 1.09, "learning_rate": 0.00013664377859957317, "loss": 0.0086, "step": 215860 }, { "epoch": 1.09, "learning_rate": 0.00013663621090655916, "loss": 0.0104, "step": 215870 }, { "epoch": 1.09, "learning_rate": 0.00013662864321354514, "loss": 0.0084, "step": 215880 }, { "epoch": 1.09, "learning_rate": 0.00013662107552053112, "loss": 0.0091, "step": 215890 }, { "epoch": 1.09, "learning_rate": 0.00013661350782751713, "loss": 0.0086, "step": 215900 }, { "epoch": 1.09, "learning_rate": 0.0001366059401345031, "loss": 0.0145, "step": 215910 }, { "epoch": 1.09, "learning_rate": 0.0001365983724414891, "loss": 0.0091, "step": 215920 }, { "epoch": 1.09, "learning_rate": 0.0001365908047484751, "loss": 0.0084, "step": 215930 }, { "epoch": 1.09, "learning_rate": 0.00013658323705546108, "loss": 0.0079, "step": 215940 }, { "epoch": 1.09, "learning_rate": 0.00013657566936244706, "loss": 0.0074, "step": 215950 }, { "epoch": 1.09, "learning_rate": 0.00013656810166943307, "loss": 0.009, "step": 215960 }, { "epoch": 1.09, "learning_rate": 0.00013656053397641905, "loss": 0.0076, "step": 215970 }, { "epoch": 1.09, "learning_rate": 0.00013655296628340503, "loss": 0.0079, "step": 215980 }, { "epoch": 1.09, "learning_rate": 0.00013654539859039104, "loss": 0.0081, "step": 215990 }, { "epoch": 1.09, "learning_rate": 0.00013653783089737702, "loss": 0.0104, "step": 216000 }, { "epoch": 1.09, "eval_cer": 0.9144760782799146, "eval_loss": 0.0073201656341552734, "eval_runtime": 116.5986, "eval_samples_per_second": 17.153, "eval_steps_per_second": 4.288, "step": 216000 }, { "epoch": 1.09, "learning_rate": 0.000136530263204363, "loss": 0.0089, "step": 216010 }, { "epoch": 1.09, "learning_rate": 0.000136522695511349, "loss": 0.0088, "step": 216020 }, { "epoch": 1.09, "learning_rate": 0.000136515127818335, "loss": 0.0064, "step": 216030 }, { "epoch": 1.09, "learning_rate": 0.00013650756012532098, "loss": 0.008, "step": 216040 }, { "epoch": 1.09, "learning_rate": 0.00013649999243230698, "loss": 0.0087, "step": 216050 }, { "epoch": 1.09, "learning_rate": 0.00013649242473929297, "loss": 0.0104, "step": 216060 }, { "epoch": 1.09, "learning_rate": 0.00013648485704627895, "loss": 0.0128, "step": 216070 }, { "epoch": 1.09, "learning_rate": 0.00013647728935326493, "loss": 0.012, "step": 216080 }, { "epoch": 1.09, "learning_rate": 0.00013646972166025094, "loss": 0.0097, "step": 216090 }, { "epoch": 1.09, "learning_rate": 0.00013646215396723692, "loss": 0.0101, "step": 216100 }, { "epoch": 1.09, "learning_rate": 0.0001364545862742229, "loss": 0.008, "step": 216110 }, { "epoch": 1.09, "learning_rate": 0.0001364470185812089, "loss": 0.0097, "step": 216120 }, { "epoch": 1.09, "learning_rate": 0.0001364394508881949, "loss": 0.0081, "step": 216130 }, { "epoch": 1.09, "learning_rate": 0.00013643188319518087, "loss": 0.0068, "step": 216140 }, { "epoch": 1.09, "learning_rate": 0.00013642431550216688, "loss": 0.012, "step": 216150 }, { "epoch": 1.09, "learning_rate": 0.00013641674780915286, "loss": 0.0083, "step": 216160 }, { "epoch": 1.09, "learning_rate": 0.00013640918011613884, "loss": 0.0109, "step": 216170 }, { "epoch": 1.09, "learning_rate": 0.00013640161242312485, "loss": 0.0092, "step": 216180 }, { "epoch": 1.09, "learning_rate": 0.00013639404473011083, "loss": 0.0109, "step": 216190 }, { "epoch": 1.09, "learning_rate": 0.00013638647703709681, "loss": 0.0068, "step": 216200 }, { "epoch": 1.09, "learning_rate": 0.00013637890934408282, "loss": 0.0082, "step": 216210 }, { "epoch": 1.09, "learning_rate": 0.0001363713416510688, "loss": 0.0089, "step": 216220 }, { "epoch": 1.09, "learning_rate": 0.00013636377395805479, "loss": 0.0087, "step": 216230 }, { "epoch": 1.09, "learning_rate": 0.00013635620626504077, "loss": 0.0083, "step": 216240 }, { "epoch": 1.09, "learning_rate": 0.00013634863857202678, "loss": 0.0084, "step": 216250 }, { "epoch": 1.09, "learning_rate": 0.00013634107087901276, "loss": 0.0103, "step": 216260 }, { "epoch": 1.09, "learning_rate": 0.00013633350318599874, "loss": 0.0107, "step": 216270 }, { "epoch": 1.09, "learning_rate": 0.00013632593549298475, "loss": 0.0097, "step": 216280 }, { "epoch": 1.09, "learning_rate": 0.00013631836779997073, "loss": 0.0096, "step": 216290 }, { "epoch": 1.09, "learning_rate": 0.0001363108001069567, "loss": 0.0129, "step": 216300 }, { "epoch": 1.09, "learning_rate": 0.00013630323241394272, "loss": 0.0097, "step": 216310 }, { "epoch": 1.09, "learning_rate": 0.0001362956647209287, "loss": 0.0076, "step": 216320 }, { "epoch": 1.09, "learning_rate": 0.00013628809702791468, "loss": 0.0112, "step": 216330 }, { "epoch": 1.09, "learning_rate": 0.0001362805293349007, "loss": 0.0075, "step": 216340 }, { "epoch": 1.09, "learning_rate": 0.00013627296164188667, "loss": 0.0076, "step": 216350 }, { "epoch": 1.09, "learning_rate": 0.00013626539394887265, "loss": 0.0081, "step": 216360 }, { "epoch": 1.09, "learning_rate": 0.00013625782625585866, "loss": 0.0106, "step": 216370 }, { "epoch": 1.09, "learning_rate": 0.00013625025856284464, "loss": 0.0091, "step": 216380 }, { "epoch": 1.09, "learning_rate": 0.00013624269086983062, "loss": 0.0091, "step": 216390 }, { "epoch": 1.09, "learning_rate": 0.0001362351231768166, "loss": 0.011, "step": 216400 }, { "epoch": 1.09, "learning_rate": 0.00013622755548380261, "loss": 0.0085, "step": 216410 }, { "epoch": 1.09, "learning_rate": 0.0001362199877907886, "loss": 0.0091, "step": 216420 }, { "epoch": 1.09, "learning_rate": 0.00013621242009777458, "loss": 0.0099, "step": 216430 }, { "epoch": 1.09, "learning_rate": 0.00013620485240476059, "loss": 0.0086, "step": 216440 }, { "epoch": 1.09, "learning_rate": 0.00013619728471174657, "loss": 0.0095, "step": 216450 }, { "epoch": 1.09, "learning_rate": 0.00013618971701873255, "loss": 0.0067, "step": 216460 }, { "epoch": 1.09, "learning_rate": 0.00013618214932571856, "loss": 0.0089, "step": 216470 }, { "epoch": 1.09, "learning_rate": 0.00013617458163270454, "loss": 0.0074, "step": 216480 }, { "epoch": 1.09, "learning_rate": 0.00013616701393969052, "loss": 0.0127, "step": 216490 }, { "epoch": 1.09, "learning_rate": 0.0001361594462466765, "loss": 0.0083, "step": 216500 }, { "epoch": 1.09, "learning_rate": 0.00013615187855366248, "loss": 0.01, "step": 216510 }, { "epoch": 1.09, "learning_rate": 0.0001361443108606485, "loss": 0.0095, "step": 216520 }, { "epoch": 1.09, "learning_rate": 0.00013613674316763447, "loss": 0.0108, "step": 216530 }, { "epoch": 1.09, "learning_rate": 0.00013612917547462045, "loss": 0.008, "step": 216540 }, { "epoch": 1.09, "learning_rate": 0.00013612160778160646, "loss": 0.0097, "step": 216550 }, { "epoch": 1.09, "learning_rate": 0.00013611404008859244, "loss": 0.0084, "step": 216560 }, { "epoch": 1.09, "learning_rate": 0.00013610647239557843, "loss": 0.007, "step": 216570 }, { "epoch": 1.09, "learning_rate": 0.00013609890470256443, "loss": 0.0082, "step": 216580 }, { "epoch": 1.09, "learning_rate": 0.00013609133700955042, "loss": 0.0122, "step": 216590 }, { "epoch": 1.09, "learning_rate": 0.0001360837693165364, "loss": 0.0085, "step": 216600 }, { "epoch": 1.09, "learning_rate": 0.00013607620162352238, "loss": 0.0103, "step": 216610 }, { "epoch": 1.09, "learning_rate": 0.0001360686339305084, "loss": 0.0084, "step": 216620 }, { "epoch": 1.09, "learning_rate": 0.00013606106623749437, "loss": 0.0075, "step": 216630 }, { "epoch": 1.09, "learning_rate": 0.00013605349854448035, "loss": 0.0124, "step": 216640 }, { "epoch": 1.09, "learning_rate": 0.00013604593085146636, "loss": 0.0092, "step": 216650 }, { "epoch": 1.09, "learning_rate": 0.00013603836315845234, "loss": 0.0107, "step": 216660 }, { "epoch": 1.09, "learning_rate": 0.00013603079546543832, "loss": 0.0087, "step": 216670 }, { "epoch": 1.09, "learning_rate": 0.00013602322777242433, "loss": 0.0093, "step": 216680 }, { "epoch": 1.09, "learning_rate": 0.0001360156600794103, "loss": 0.0093, "step": 216690 }, { "epoch": 1.09, "learning_rate": 0.0001360080923863963, "loss": 0.0127, "step": 216700 }, { "epoch": 1.09, "learning_rate": 0.0001360005246933823, "loss": 0.0101, "step": 216710 }, { "epoch": 1.09, "learning_rate": 0.00013599295700036828, "loss": 0.0108, "step": 216720 }, { "epoch": 1.09, "learning_rate": 0.00013598538930735426, "loss": 0.0153, "step": 216730 }, { "epoch": 1.09, "learning_rate": 0.00013597782161434027, "loss": 0.0084, "step": 216740 }, { "epoch": 1.09, "learning_rate": 0.00013597025392132625, "loss": 0.0112, "step": 216750 }, { "epoch": 1.09, "learning_rate": 0.00013596268622831224, "loss": 0.0092, "step": 216760 }, { "epoch": 1.09, "learning_rate": 0.00013595511853529822, "loss": 0.0076, "step": 216770 }, { "epoch": 1.09, "learning_rate": 0.00013594755084228423, "loss": 0.0112, "step": 216780 }, { "epoch": 1.09, "learning_rate": 0.0001359399831492702, "loss": 0.009, "step": 216790 }, { "epoch": 1.09, "learning_rate": 0.0001359324154562562, "loss": 0.0123, "step": 216800 }, { "epoch": 1.09, "learning_rate": 0.0001359248477632422, "loss": 0.0071, "step": 216810 }, { "epoch": 1.09, "learning_rate": 0.00013591728007022818, "loss": 0.0074, "step": 216820 }, { "epoch": 1.09, "learning_rate": 0.00013590971237721416, "loss": 0.0093, "step": 216830 }, { "epoch": 1.09, "learning_rate": 0.00013590214468420017, "loss": 0.0099, "step": 216840 }, { "epoch": 1.09, "learning_rate": 0.00013589457699118615, "loss": 0.0078, "step": 216850 }, { "epoch": 1.09, "learning_rate": 0.00013588700929817213, "loss": 0.0086, "step": 216860 }, { "epoch": 1.09, "learning_rate": 0.00013587944160515814, "loss": 0.012, "step": 216870 }, { "epoch": 1.09, "learning_rate": 0.00013587187391214412, "loss": 0.0089, "step": 216880 }, { "epoch": 1.09, "learning_rate": 0.0001358643062191301, "loss": 0.0098, "step": 216890 }, { "epoch": 1.09, "learning_rate": 0.0001358567385261161, "loss": 0.0094, "step": 216900 }, { "epoch": 1.09, "learning_rate": 0.0001358491708331021, "loss": 0.0097, "step": 216910 }, { "epoch": 1.09, "learning_rate": 0.00013584160314008807, "loss": 0.0092, "step": 216920 }, { "epoch": 1.09, "learning_rate": 0.00013583403544707406, "loss": 0.0104, "step": 216930 }, { "epoch": 1.09, "learning_rate": 0.00013582646775406006, "loss": 0.0083, "step": 216940 }, { "epoch": 1.09, "learning_rate": 0.00013581890006104605, "loss": 0.011, "step": 216950 }, { "epoch": 1.09, "learning_rate": 0.00013581133236803203, "loss": 0.008, "step": 216960 }, { "epoch": 1.09, "learning_rate": 0.00013580376467501804, "loss": 0.01, "step": 216970 }, { "epoch": 1.09, "learning_rate": 0.00013579619698200402, "loss": 0.0111, "step": 216980 }, { "epoch": 1.09, "learning_rate": 0.00013578862928899, "loss": 0.0122, "step": 216990 }, { "epoch": 1.09, "learning_rate": 0.000135781061595976, "loss": 0.0094, "step": 217000 }, { "epoch": 1.09, "eval_cer": 0.9144741374876638, "eval_loss": 0.007423856761306524, "eval_runtime": 116.6037, "eval_samples_per_second": 17.152, "eval_steps_per_second": 4.288, "step": 217000 }, { "epoch": 1.09, "learning_rate": 0.000135773493902962, "loss": 0.0097, "step": 217010 }, { "epoch": 1.09, "learning_rate": 0.00013576592620994797, "loss": 0.0098, "step": 217020 }, { "epoch": 1.09, "learning_rate": 0.00013575835851693398, "loss": 0.0105, "step": 217030 }, { "epoch": 1.09, "learning_rate": 0.00013575079082391996, "loss": 0.0095, "step": 217040 }, { "epoch": 1.1, "learning_rate": 0.00013574322313090594, "loss": 0.0086, "step": 217050 }, { "epoch": 1.1, "learning_rate": 0.00013573565543789195, "loss": 0.0081, "step": 217060 }, { "epoch": 1.1, "learning_rate": 0.00013572808774487793, "loss": 0.0093, "step": 217070 }, { "epoch": 1.1, "learning_rate": 0.0001357205200518639, "loss": 0.0081, "step": 217080 }, { "epoch": 1.1, "learning_rate": 0.00013571295235884992, "loss": 0.0072, "step": 217090 }, { "epoch": 1.1, "learning_rate": 0.0001357053846658359, "loss": 0.0104, "step": 217100 }, { "epoch": 1.1, "learning_rate": 0.00013569781697282188, "loss": 0.0097, "step": 217110 }, { "epoch": 1.1, "learning_rate": 0.00013569024927980787, "loss": 0.0078, "step": 217120 }, { "epoch": 1.1, "learning_rate": 0.00013568268158679385, "loss": 0.0118, "step": 217130 }, { "epoch": 1.1, "learning_rate": 0.00013567511389377983, "loss": 0.0099, "step": 217140 }, { "epoch": 1.1, "learning_rate": 0.00013566754620076584, "loss": 0.0103, "step": 217150 }, { "epoch": 1.1, "learning_rate": 0.00013565997850775182, "loss": 0.0102, "step": 217160 }, { "epoch": 1.1, "learning_rate": 0.0001356524108147378, "loss": 0.0114, "step": 217170 }, { "epoch": 1.1, "learning_rate": 0.0001356448431217238, "loss": 0.0079, "step": 217180 }, { "epoch": 1.1, "learning_rate": 0.0001356372754287098, "loss": 0.0094, "step": 217190 }, { "epoch": 1.1, "learning_rate": 0.00013562970773569577, "loss": 0.0087, "step": 217200 }, { "epoch": 1.1, "learning_rate": 0.00013562214004268178, "loss": 0.0098, "step": 217210 }, { "epoch": 1.1, "learning_rate": 0.00013561457234966776, "loss": 0.0094, "step": 217220 }, { "epoch": 1.1, "learning_rate": 0.00013560700465665374, "loss": 0.0133, "step": 217230 }, { "epoch": 1.1, "learning_rate": 0.00013559943696363975, "loss": 0.0093, "step": 217240 }, { "epoch": 1.1, "learning_rate": 0.00013559186927062573, "loss": 0.0103, "step": 217250 }, { "epoch": 1.1, "learning_rate": 0.00013558430157761171, "loss": 0.0103, "step": 217260 }, { "epoch": 1.1, "learning_rate": 0.00013557673388459772, "loss": 0.0091, "step": 217270 }, { "epoch": 1.1, "learning_rate": 0.0001355691661915837, "loss": 0.0085, "step": 217280 }, { "epoch": 1.1, "learning_rate": 0.00013556159849856969, "loss": 0.0069, "step": 217290 }, { "epoch": 1.1, "learning_rate": 0.00013555403080555567, "loss": 0.0086, "step": 217300 }, { "epoch": 1.1, "learning_rate": 0.00013554646311254168, "loss": 0.0092, "step": 217310 }, { "epoch": 1.1, "learning_rate": 0.00013553889541952766, "loss": 0.0106, "step": 217320 }, { "epoch": 1.1, "learning_rate": 0.00013553132772651364, "loss": 0.0092, "step": 217330 }, { "epoch": 1.1, "learning_rate": 0.00013552376003349965, "loss": 0.0103, "step": 217340 }, { "epoch": 1.1, "learning_rate": 0.00013551619234048563, "loss": 0.0091, "step": 217350 }, { "epoch": 1.1, "learning_rate": 0.0001355086246474716, "loss": 0.0086, "step": 217360 }, { "epoch": 1.1, "learning_rate": 0.00013550105695445762, "loss": 0.0098, "step": 217370 }, { "epoch": 1.1, "learning_rate": 0.0001354934892614436, "loss": 0.0083, "step": 217380 }, { "epoch": 1.1, "learning_rate": 0.00013548592156842958, "loss": 0.007, "step": 217390 }, { "epoch": 1.1, "learning_rate": 0.0001354783538754156, "loss": 0.0106, "step": 217400 }, { "epoch": 1.1, "learning_rate": 0.00013547078618240157, "loss": 0.0085, "step": 217410 }, { "epoch": 1.1, "learning_rate": 0.00013546321848938755, "loss": 0.0073, "step": 217420 }, { "epoch": 1.1, "learning_rate": 0.00013545565079637356, "loss": 0.0098, "step": 217430 }, { "epoch": 1.1, "learning_rate": 0.00013544808310335954, "loss": 0.0106, "step": 217440 }, { "epoch": 1.1, "learning_rate": 0.00013544051541034552, "loss": 0.0093, "step": 217450 }, { "epoch": 1.1, "learning_rate": 0.0001354329477173315, "loss": 0.0114, "step": 217460 }, { "epoch": 1.1, "learning_rate": 0.00013542538002431751, "loss": 0.0099, "step": 217470 }, { "epoch": 1.1, "learning_rate": 0.0001354178123313035, "loss": 0.0094, "step": 217480 }, { "epoch": 1.1, "learning_rate": 0.00013541024463828948, "loss": 0.008, "step": 217490 }, { "epoch": 1.1, "learning_rate": 0.00013540267694527549, "loss": 0.0104, "step": 217500 }, { "epoch": 1.1, "learning_rate": 0.00013539510925226147, "loss": 0.0103, "step": 217510 }, { "epoch": 1.1, "learning_rate": 0.00013538754155924745, "loss": 0.0081, "step": 217520 }, { "epoch": 1.1, "learning_rate": 0.00013537997386623346, "loss": 0.0128, "step": 217530 }, { "epoch": 1.1, "learning_rate": 0.00013537240617321944, "loss": 0.0082, "step": 217540 }, { "epoch": 1.1, "learning_rate": 0.00013536483848020542, "loss": 0.008, "step": 217550 }, { "epoch": 1.1, "learning_rate": 0.00013535727078719143, "loss": 0.0124, "step": 217560 }, { "epoch": 1.1, "learning_rate": 0.0001353497030941774, "loss": 0.0071, "step": 217570 }, { "epoch": 1.1, "learning_rate": 0.0001353421354011634, "loss": 0.0103, "step": 217580 }, { "epoch": 1.1, "learning_rate": 0.0001353345677081494, "loss": 0.0128, "step": 217590 }, { "epoch": 1.1, "learning_rate": 0.00013532700001513538, "loss": 0.0081, "step": 217600 }, { "epoch": 1.1, "learning_rate": 0.00013531943232212136, "loss": 0.0111, "step": 217610 }, { "epoch": 1.1, "learning_rate": 0.00013531186462910737, "loss": 0.0084, "step": 217620 }, { "epoch": 1.1, "learning_rate": 0.00013530429693609335, "loss": 0.0103, "step": 217630 }, { "epoch": 1.1, "learning_rate": 0.00013529672924307933, "loss": 0.0095, "step": 217640 }, { "epoch": 1.1, "learning_rate": 0.00013528916155006532, "loss": 0.0091, "step": 217650 }, { "epoch": 1.1, "learning_rate": 0.00013528159385705132, "loss": 0.0094, "step": 217660 }, { "epoch": 1.1, "learning_rate": 0.0001352740261640373, "loss": 0.0109, "step": 217670 }, { "epoch": 1.1, "learning_rate": 0.0001352664584710233, "loss": 0.0111, "step": 217680 }, { "epoch": 1.1, "learning_rate": 0.0001352588907780093, "loss": 0.01, "step": 217690 }, { "epoch": 1.1, "learning_rate": 0.00013525132308499528, "loss": 0.009, "step": 217700 }, { "epoch": 1.1, "learning_rate": 0.00013524375539198126, "loss": 0.0098, "step": 217710 }, { "epoch": 1.1, "learning_rate": 0.00013523618769896727, "loss": 0.0101, "step": 217720 }, { "epoch": 1.1, "learning_rate": 0.00013522862000595325, "loss": 0.0089, "step": 217730 }, { "epoch": 1.1, "learning_rate": 0.00013522105231293923, "loss": 0.0077, "step": 217740 }, { "epoch": 1.1, "learning_rate": 0.00013521348461992524, "loss": 0.0105, "step": 217750 }, { "epoch": 1.1, "learning_rate": 0.0001352059169269112, "loss": 0.0074, "step": 217760 }, { "epoch": 1.1, "learning_rate": 0.0001351983492338972, "loss": 0.0105, "step": 217770 }, { "epoch": 1.1, "learning_rate": 0.00013519078154088318, "loss": 0.0108, "step": 217780 }, { "epoch": 1.1, "learning_rate": 0.00013518321384786916, "loss": 0.0096, "step": 217790 }, { "epoch": 1.1, "learning_rate": 0.00013517564615485517, "loss": 0.0089, "step": 217800 }, { "epoch": 1.1, "learning_rate": 0.00013516807846184115, "loss": 0.0099, "step": 217810 }, { "epoch": 1.1, "learning_rate": 0.00013516051076882714, "loss": 0.0099, "step": 217820 }, { "epoch": 1.1, "learning_rate": 0.00013515294307581312, "loss": 0.0188, "step": 217830 }, { "epoch": 1.1, "learning_rate": 0.00013514537538279913, "loss": 0.0099, "step": 217840 }, { "epoch": 1.1, "learning_rate": 0.0001351378076897851, "loss": 0.0119, "step": 217850 }, { "epoch": 1.1, "learning_rate": 0.0001351302399967711, "loss": 0.0089, "step": 217860 }, { "epoch": 1.1, "learning_rate": 0.0001351226723037571, "loss": 0.0105, "step": 217870 }, { "epoch": 1.1, "learning_rate": 0.00013511510461074308, "loss": 0.0073, "step": 217880 }, { "epoch": 1.1, "learning_rate": 0.00013510753691772906, "loss": 0.0088, "step": 217890 }, { "epoch": 1.1, "learning_rate": 0.00013509996922471507, "loss": 0.011, "step": 217900 }, { "epoch": 1.1, "learning_rate": 0.00013509240153170105, "loss": 0.0088, "step": 217910 }, { "epoch": 1.1, "learning_rate": 0.00013508483383868703, "loss": 0.0103, "step": 217920 }, { "epoch": 1.1, "learning_rate": 0.00013507726614567304, "loss": 0.008, "step": 217930 }, { "epoch": 1.1, "learning_rate": 0.00013506969845265902, "loss": 0.0104, "step": 217940 }, { "epoch": 1.1, "learning_rate": 0.000135062130759645, "loss": 0.0087, "step": 217950 }, { "epoch": 1.1, "learning_rate": 0.000135054563066631, "loss": 0.0111, "step": 217960 }, { "epoch": 1.1, "learning_rate": 0.000135046995373617, "loss": 0.0104, "step": 217970 }, { "epoch": 1.1, "learning_rate": 0.00013503942768060297, "loss": 0.0133, "step": 217980 }, { "epoch": 1.1, "learning_rate": 0.00013503185998758898, "loss": 0.011, "step": 217990 }, { "epoch": 1.1, "learning_rate": 0.00013502429229457496, "loss": 0.0077, "step": 218000 }, { "epoch": 1.1, "eval_cer": 0.9144867526372941, "eval_loss": 0.006999760400503874, "eval_runtime": 116.2125, "eval_samples_per_second": 17.21, "eval_steps_per_second": 4.302, "step": 218000 }, { "epoch": 1.1, "learning_rate": 0.00013501672460156095, "loss": 0.0123, "step": 218010 }, { "epoch": 1.1, "learning_rate": 0.00013500915690854693, "loss": 0.0082, "step": 218020 }, { "epoch": 1.1, "learning_rate": 0.00013500158921553294, "loss": 0.0101, "step": 218030 }, { "epoch": 1.1, "learning_rate": 0.00013499402152251892, "loss": 0.0102, "step": 218040 }, { "epoch": 1.1, "learning_rate": 0.0001349864538295049, "loss": 0.0086, "step": 218050 }, { "epoch": 1.1, "learning_rate": 0.0001349788861364909, "loss": 0.0095, "step": 218060 }, { "epoch": 1.1, "learning_rate": 0.0001349713184434769, "loss": 0.0087, "step": 218070 }, { "epoch": 1.1, "learning_rate": 0.00013496375075046287, "loss": 0.0114, "step": 218080 }, { "epoch": 1.1, "learning_rate": 0.00013495618305744888, "loss": 0.0101, "step": 218090 }, { "epoch": 1.1, "learning_rate": 0.00013494861536443486, "loss": 0.0098, "step": 218100 }, { "epoch": 1.1, "learning_rate": 0.00013494104767142084, "loss": 0.0096, "step": 218110 }, { "epoch": 1.1, "learning_rate": 0.00013493347997840685, "loss": 0.0094, "step": 218120 }, { "epoch": 1.1, "learning_rate": 0.00013492591228539283, "loss": 0.0113, "step": 218130 }, { "epoch": 1.1, "learning_rate": 0.0001349183445923788, "loss": 0.0129, "step": 218140 }, { "epoch": 1.1, "learning_rate": 0.00013491077689936482, "loss": 0.0101, "step": 218150 }, { "epoch": 1.1, "learning_rate": 0.0001349032092063508, "loss": 0.0094, "step": 218160 }, { "epoch": 1.1, "learning_rate": 0.00013489564151333678, "loss": 0.0102, "step": 218170 }, { "epoch": 1.1, "learning_rate": 0.00013488807382032277, "loss": 0.0104, "step": 218180 }, { "epoch": 1.1, "learning_rate": 0.00013488050612730877, "loss": 0.0099, "step": 218190 }, { "epoch": 1.1, "learning_rate": 0.00013487293843429476, "loss": 0.0096, "step": 218200 }, { "epoch": 1.1, "learning_rate": 0.00013486537074128074, "loss": 0.0102, "step": 218210 }, { "epoch": 1.1, "learning_rate": 0.00013485780304826675, "loss": 0.008, "step": 218220 }, { "epoch": 1.1, "learning_rate": 0.00013485023535525273, "loss": 0.0105, "step": 218230 }, { "epoch": 1.1, "learning_rate": 0.0001348426676622387, "loss": 0.0093, "step": 218240 }, { "epoch": 1.1, "learning_rate": 0.00013483509996922472, "loss": 0.0104, "step": 218250 }, { "epoch": 1.1, "learning_rate": 0.0001348275322762107, "loss": 0.0102, "step": 218260 }, { "epoch": 1.1, "learning_rate": 0.00013481996458319668, "loss": 0.0083, "step": 218270 }, { "epoch": 1.1, "learning_rate": 0.0001348123968901827, "loss": 0.0104, "step": 218280 }, { "epoch": 1.1, "learning_rate": 0.00013480482919716867, "loss": 0.0097, "step": 218290 }, { "epoch": 1.1, "learning_rate": 0.00013479726150415465, "loss": 0.009, "step": 218300 }, { "epoch": 1.1, "learning_rate": 0.00013478969381114066, "loss": 0.0086, "step": 218310 }, { "epoch": 1.1, "learning_rate": 0.00013478212611812664, "loss": 0.0106, "step": 218320 }, { "epoch": 1.1, "learning_rate": 0.00013477455842511262, "loss": 0.0099, "step": 218330 }, { "epoch": 1.1, "learning_rate": 0.0001347669907320986, "loss": 0.0108, "step": 218340 }, { "epoch": 1.1, "learning_rate": 0.0001347594230390846, "loss": 0.0112, "step": 218350 }, { "epoch": 1.1, "learning_rate": 0.0001347518553460706, "loss": 0.0106, "step": 218360 }, { "epoch": 1.1, "learning_rate": 0.00013474428765305658, "loss": 0.0077, "step": 218370 }, { "epoch": 1.1, "learning_rate": 0.00013473671996004258, "loss": 0.014, "step": 218380 }, { "epoch": 1.1, "learning_rate": 0.00013472915226702854, "loss": 0.0105, "step": 218390 }, { "epoch": 1.1, "learning_rate": 0.00013472158457401455, "loss": 0.0139, "step": 218400 }, { "epoch": 1.1, "learning_rate": 0.00013471401688100053, "loss": 0.0107, "step": 218410 }, { "epoch": 1.1, "learning_rate": 0.0001347064491879865, "loss": 0.0074, "step": 218420 }, { "epoch": 1.1, "learning_rate": 0.00013469888149497252, "loss": 0.0088, "step": 218430 }, { "epoch": 1.1, "learning_rate": 0.0001346913138019585, "loss": 0.0103, "step": 218440 }, { "epoch": 1.1, "learning_rate": 0.00013468374610894448, "loss": 0.0088, "step": 218450 }, { "epoch": 1.1, "learning_rate": 0.0001346761784159305, "loss": 0.009, "step": 218460 }, { "epoch": 1.1, "learning_rate": 0.00013466861072291647, "loss": 0.0099, "step": 218470 }, { "epoch": 1.1, "learning_rate": 0.00013466104302990245, "loss": 0.0084, "step": 218480 }, { "epoch": 1.1, "learning_rate": 0.00013465347533688846, "loss": 0.0127, "step": 218490 }, { "epoch": 1.1, "learning_rate": 0.00013464590764387444, "loss": 0.0092, "step": 218500 }, { "epoch": 1.1, "learning_rate": 0.00013463833995086042, "loss": 0.0089, "step": 218510 }, { "epoch": 1.1, "learning_rate": 0.00013463077225784643, "loss": 0.0079, "step": 218520 }, { "epoch": 1.1, "learning_rate": 0.00013462320456483241, "loss": 0.0104, "step": 218530 }, { "epoch": 1.1, "learning_rate": 0.0001346156368718184, "loss": 0.0113, "step": 218540 }, { "epoch": 1.1, "learning_rate": 0.00013460806917880438, "loss": 0.0096, "step": 218550 }, { "epoch": 1.1, "learning_rate": 0.00013460050148579039, "loss": 0.0077, "step": 218560 }, { "epoch": 1.1, "learning_rate": 0.00013459293379277637, "loss": 0.0077, "step": 218570 }, { "epoch": 1.1, "learning_rate": 0.00013458536609976235, "loss": 0.0096, "step": 218580 }, { "epoch": 1.1, "learning_rate": 0.00013457779840674836, "loss": 0.009, "step": 218590 }, { "epoch": 1.1, "learning_rate": 0.00013457023071373434, "loss": 0.0087, "step": 218600 }, { "epoch": 1.1, "learning_rate": 0.00013456266302072032, "loss": 0.0112, "step": 218610 }, { "epoch": 1.1, "learning_rate": 0.00013455509532770633, "loss": 0.0089, "step": 218620 }, { "epoch": 1.1, "learning_rate": 0.0001345475276346923, "loss": 0.0107, "step": 218630 }, { "epoch": 1.1, "learning_rate": 0.0001345399599416783, "loss": 0.0085, "step": 218640 }, { "epoch": 1.1, "learning_rate": 0.0001345323922486643, "loss": 0.0083, "step": 218650 }, { "epoch": 1.1, "learning_rate": 0.00013452482455565028, "loss": 0.009, "step": 218660 }, { "epoch": 1.1, "learning_rate": 0.00013451725686263626, "loss": 0.0094, "step": 218670 }, { "epoch": 1.1, "learning_rate": 0.00013450968916962227, "loss": 0.01, "step": 218680 }, { "epoch": 1.1, "learning_rate": 0.00013450212147660825, "loss": 0.0082, "step": 218690 }, { "epoch": 1.1, "learning_rate": 0.00013449455378359423, "loss": 0.0097, "step": 218700 }, { "epoch": 1.1, "learning_rate": 0.00013448698609058022, "loss": 0.0128, "step": 218710 }, { "epoch": 1.1, "learning_rate": 0.00013447941839756622, "loss": 0.0085, "step": 218720 }, { "epoch": 1.1, "learning_rate": 0.0001344718507045522, "loss": 0.009, "step": 218730 }, { "epoch": 1.1, "learning_rate": 0.0001344642830115382, "loss": 0.009, "step": 218740 }, { "epoch": 1.1, "learning_rate": 0.0001344567153185242, "loss": 0.009, "step": 218750 }, { "epoch": 1.1, "learning_rate": 0.00013444914762551018, "loss": 0.0075, "step": 218760 }, { "epoch": 1.1, "learning_rate": 0.00013444157993249616, "loss": 0.0114, "step": 218770 }, { "epoch": 1.1, "learning_rate": 0.00013443401223948217, "loss": 0.01, "step": 218780 }, { "epoch": 1.1, "learning_rate": 0.00013442644454646815, "loss": 0.01, "step": 218790 }, { "epoch": 1.1, "learning_rate": 0.00013441887685345413, "loss": 0.0095, "step": 218800 }, { "epoch": 1.1, "learning_rate": 0.00013441130916044014, "loss": 0.01, "step": 218810 }, { "epoch": 1.1, "learning_rate": 0.00013440374146742612, "loss": 0.0119, "step": 218820 }, { "epoch": 1.1, "learning_rate": 0.0001343961737744121, "loss": 0.0094, "step": 218830 }, { "epoch": 1.1, "learning_rate": 0.0001343886060813981, "loss": 0.0081, "step": 218840 }, { "epoch": 1.1, "learning_rate": 0.0001343810383883841, "loss": 0.0083, "step": 218850 }, { "epoch": 1.1, "learning_rate": 0.00013437347069537007, "loss": 0.0105, "step": 218860 }, { "epoch": 1.1, "learning_rate": 0.00013436590300235605, "loss": 0.0095, "step": 218870 }, { "epoch": 1.1, "learning_rate": 0.00013435833530934206, "loss": 0.0111, "step": 218880 }, { "epoch": 1.1, "learning_rate": 0.00013435076761632804, "loss": 0.0072, "step": 218890 }, { "epoch": 1.1, "learning_rate": 0.00013434319992331403, "loss": 0.0123, "step": 218900 }, { "epoch": 1.1, "learning_rate": 0.00013433563223030003, "loss": 0.0066, "step": 218910 }, { "epoch": 1.1, "learning_rate": 0.00013432806453728602, "loss": 0.0082, "step": 218920 }, { "epoch": 1.1, "learning_rate": 0.000134320496844272, "loss": 0.0085, "step": 218930 }, { "epoch": 1.1, "learning_rate": 0.000134312929151258, "loss": 0.0088, "step": 218940 }, { "epoch": 1.1, "learning_rate": 0.000134305361458244, "loss": 0.0115, "step": 218950 }, { "epoch": 1.1, "learning_rate": 0.00013429779376522997, "loss": 0.0093, "step": 218960 }, { "epoch": 1.1, "learning_rate": 0.00013429022607221598, "loss": 0.0127, "step": 218970 }, { "epoch": 1.1, "learning_rate": 0.00013428265837920196, "loss": 0.0107, "step": 218980 }, { "epoch": 1.1, "learning_rate": 0.00013427509068618794, "loss": 0.0085, "step": 218990 }, { "epoch": 1.1, "learning_rate": 0.00013426752299317395, "loss": 0.0087, "step": 219000 }, { "epoch": 1.1, "eval_cer": 0.9144799598644162, "eval_loss": 0.007354082074016333, "eval_runtime": 116.3343, "eval_samples_per_second": 17.192, "eval_steps_per_second": 4.298, "step": 219000 }, { "epoch": 1.1, "learning_rate": 0.00013425995530015993, "loss": 0.0105, "step": 219010 }, { "epoch": 1.1, "learning_rate": 0.0001342523876071459, "loss": 0.0091, "step": 219020 }, { "epoch": 1.11, "learning_rate": 0.0001342448199141319, "loss": 0.0087, "step": 219030 }, { "epoch": 1.11, "learning_rate": 0.00013423725222111787, "loss": 0.0103, "step": 219040 }, { "epoch": 1.11, "learning_rate": 0.00013422968452810388, "loss": 0.0114, "step": 219050 }, { "epoch": 1.11, "learning_rate": 0.00013422211683508986, "loss": 0.0088, "step": 219060 }, { "epoch": 1.11, "learning_rate": 0.00013421454914207585, "loss": 0.0107, "step": 219070 }, { "epoch": 1.11, "learning_rate": 0.00013420698144906183, "loss": 0.0094, "step": 219080 }, { "epoch": 1.11, "learning_rate": 0.00013419941375604784, "loss": 0.0085, "step": 219090 }, { "epoch": 1.11, "learning_rate": 0.00013419184606303382, "loss": 0.0095, "step": 219100 }, { "epoch": 1.11, "learning_rate": 0.0001341842783700198, "loss": 0.0109, "step": 219110 }, { "epoch": 1.11, "learning_rate": 0.0001341767106770058, "loss": 0.0102, "step": 219120 }, { "epoch": 1.11, "learning_rate": 0.0001341691429839918, "loss": 0.0099, "step": 219130 }, { "epoch": 1.11, "learning_rate": 0.00013416157529097777, "loss": 0.0104, "step": 219140 }, { "epoch": 1.11, "learning_rate": 0.00013415400759796378, "loss": 0.0083, "step": 219150 }, { "epoch": 1.11, "learning_rate": 0.00013414643990494976, "loss": 0.0103, "step": 219160 }, { "epoch": 1.11, "learning_rate": 0.00013413887221193574, "loss": 0.0093, "step": 219170 }, { "epoch": 1.11, "learning_rate": 0.00013413130451892175, "loss": 0.0116, "step": 219180 }, { "epoch": 1.11, "learning_rate": 0.00013412373682590773, "loss": 0.0088, "step": 219190 }, { "epoch": 1.11, "learning_rate": 0.0001341161691328937, "loss": 0.01, "step": 219200 }, { "epoch": 1.11, "learning_rate": 0.00013410860143987972, "loss": 0.0094, "step": 219210 }, { "epoch": 1.11, "learning_rate": 0.0001341010337468657, "loss": 0.0103, "step": 219220 }, { "epoch": 1.11, "learning_rate": 0.00013409346605385168, "loss": 0.009, "step": 219230 }, { "epoch": 1.11, "learning_rate": 0.00013408589836083767, "loss": 0.0087, "step": 219240 }, { "epoch": 1.11, "learning_rate": 0.00013407833066782367, "loss": 0.0076, "step": 219250 }, { "epoch": 1.11, "learning_rate": 0.00013407076297480966, "loss": 0.012, "step": 219260 }, { "epoch": 1.11, "learning_rate": 0.00013406319528179564, "loss": 0.0097, "step": 219270 }, { "epoch": 1.11, "learning_rate": 0.00013405562758878165, "loss": 0.0075, "step": 219280 }, { "epoch": 1.11, "learning_rate": 0.00013404805989576763, "loss": 0.0094, "step": 219290 }, { "epoch": 1.11, "learning_rate": 0.0001340404922027536, "loss": 0.0104, "step": 219300 }, { "epoch": 1.11, "learning_rate": 0.00013403292450973962, "loss": 0.0083, "step": 219310 }, { "epoch": 1.11, "learning_rate": 0.0001340253568167256, "loss": 0.0069, "step": 219320 }, { "epoch": 1.11, "learning_rate": 0.00013401778912371158, "loss": 0.0084, "step": 219330 }, { "epoch": 1.11, "learning_rate": 0.0001340102214306976, "loss": 0.0097, "step": 219340 }, { "epoch": 1.11, "learning_rate": 0.00013400265373768357, "loss": 0.0106, "step": 219350 }, { "epoch": 1.11, "learning_rate": 0.00013399508604466955, "loss": 0.0071, "step": 219360 }, { "epoch": 1.11, "learning_rate": 0.00013398751835165556, "loss": 0.0117, "step": 219370 }, { "epoch": 1.11, "learning_rate": 0.00013397995065864154, "loss": 0.0129, "step": 219380 }, { "epoch": 1.11, "learning_rate": 0.00013397238296562752, "loss": 0.0094, "step": 219390 }, { "epoch": 1.11, "learning_rate": 0.0001339648152726135, "loss": 0.0109, "step": 219400 }, { "epoch": 1.11, "learning_rate": 0.0001339572475795995, "loss": 0.0082, "step": 219410 }, { "epoch": 1.11, "learning_rate": 0.0001339496798865855, "loss": 0.0105, "step": 219420 }, { "epoch": 1.11, "learning_rate": 0.00013394211219357148, "loss": 0.0107, "step": 219430 }, { "epoch": 1.11, "learning_rate": 0.00013393454450055748, "loss": 0.0119, "step": 219440 }, { "epoch": 1.11, "learning_rate": 0.00013392697680754347, "loss": 0.0087, "step": 219450 }, { "epoch": 1.11, "learning_rate": 0.00013391940911452945, "loss": 0.0096, "step": 219460 }, { "epoch": 1.11, "learning_rate": 0.00013391184142151546, "loss": 0.0096, "step": 219470 }, { "epoch": 1.11, "learning_rate": 0.00013390427372850144, "loss": 0.009, "step": 219480 }, { "epoch": 1.11, "learning_rate": 0.00013389670603548742, "loss": 0.0097, "step": 219490 }, { "epoch": 1.11, "learning_rate": 0.00013388913834247343, "loss": 0.0098, "step": 219500 }, { "epoch": 1.11, "learning_rate": 0.0001338815706494594, "loss": 0.0128, "step": 219510 }, { "epoch": 1.11, "learning_rate": 0.0001338740029564454, "loss": 0.0071, "step": 219520 }, { "epoch": 1.11, "learning_rate": 0.0001338664352634314, "loss": 0.0075, "step": 219530 }, { "epoch": 1.11, "learning_rate": 0.00013385886757041738, "loss": 0.0092, "step": 219540 }, { "epoch": 1.11, "learning_rate": 0.00013385129987740336, "loss": 0.0089, "step": 219550 }, { "epoch": 1.11, "learning_rate": 0.00013384373218438937, "loss": 0.007, "step": 219560 }, { "epoch": 1.11, "learning_rate": 0.00013383616449137535, "loss": 0.0099, "step": 219570 }, { "epoch": 1.11, "learning_rate": 0.00013382859679836133, "loss": 0.0118, "step": 219580 }, { "epoch": 1.11, "learning_rate": 0.00013382102910534731, "loss": 0.0098, "step": 219590 }, { "epoch": 1.11, "learning_rate": 0.00013381346141233332, "loss": 0.0089, "step": 219600 }, { "epoch": 1.11, "learning_rate": 0.0001338058937193193, "loss": 0.0128, "step": 219610 }, { "epoch": 1.11, "learning_rate": 0.00013379832602630529, "loss": 0.0091, "step": 219620 }, { "epoch": 1.11, "learning_rate": 0.0001337907583332913, "loss": 0.0083, "step": 219630 }, { "epoch": 1.11, "learning_rate": 0.00013378319064027728, "loss": 0.0102, "step": 219640 }, { "epoch": 1.11, "learning_rate": 0.00013377562294726326, "loss": 0.0078, "step": 219650 }, { "epoch": 1.11, "learning_rate": 0.00013376805525424924, "loss": 0.0108, "step": 219660 }, { "epoch": 1.11, "learning_rate": 0.00013376048756123522, "loss": 0.0106, "step": 219670 }, { "epoch": 1.11, "learning_rate": 0.00013375291986822123, "loss": 0.0112, "step": 219680 }, { "epoch": 1.11, "learning_rate": 0.0001337453521752072, "loss": 0.0094, "step": 219690 }, { "epoch": 1.11, "learning_rate": 0.0001337377844821932, "loss": 0.012, "step": 219700 }, { "epoch": 1.11, "learning_rate": 0.0001337302167891792, "loss": 0.009, "step": 219710 }, { "epoch": 1.11, "learning_rate": 0.00013372264909616518, "loss": 0.0107, "step": 219720 }, { "epoch": 1.11, "learning_rate": 0.00013371508140315116, "loss": 0.0093, "step": 219730 }, { "epoch": 1.11, "learning_rate": 0.00013370751371013717, "loss": 0.0103, "step": 219740 }, { "epoch": 1.11, "learning_rate": 0.00013369994601712315, "loss": 0.0088, "step": 219750 }, { "epoch": 1.11, "learning_rate": 0.00013369237832410913, "loss": 0.0083, "step": 219760 }, { "epoch": 1.11, "learning_rate": 0.00013368481063109512, "loss": 0.0103, "step": 219770 }, { "epoch": 1.11, "learning_rate": 0.00013367724293808112, "loss": 0.0084, "step": 219780 }, { "epoch": 1.11, "learning_rate": 0.0001336696752450671, "loss": 0.0073, "step": 219790 }, { "epoch": 1.11, "learning_rate": 0.0001336621075520531, "loss": 0.0089, "step": 219800 }, { "epoch": 1.11, "learning_rate": 0.0001336545398590391, "loss": 0.0086, "step": 219810 }, { "epoch": 1.11, "learning_rate": 0.00013364697216602508, "loss": 0.0094, "step": 219820 }, { "epoch": 1.11, "learning_rate": 0.00013363940447301106, "loss": 0.0112, "step": 219830 }, { "epoch": 1.11, "learning_rate": 0.00013363183677999707, "loss": 0.0078, "step": 219840 }, { "epoch": 1.11, "learning_rate": 0.00013362426908698305, "loss": 0.0078, "step": 219850 }, { "epoch": 1.11, "learning_rate": 0.00013361670139396903, "loss": 0.0094, "step": 219860 }, { "epoch": 1.11, "learning_rate": 0.00013360913370095504, "loss": 0.0101, "step": 219870 }, { "epoch": 1.11, "learning_rate": 0.00013360156600794102, "loss": 0.0114, "step": 219880 }, { "epoch": 1.11, "learning_rate": 0.000133593998314927, "loss": 0.0088, "step": 219890 }, { "epoch": 1.11, "learning_rate": 0.000133586430621913, "loss": 0.0088, "step": 219900 }, { "epoch": 1.11, "learning_rate": 0.000133578862928899, "loss": 0.0094, "step": 219910 }, { "epoch": 1.11, "learning_rate": 0.00013357129523588497, "loss": 0.0079, "step": 219920 }, { "epoch": 1.11, "learning_rate": 0.00013356372754287098, "loss": 0.0105, "step": 219930 }, { "epoch": 1.11, "learning_rate": 0.00013355615984985696, "loss": 0.0113, "step": 219940 }, { "epoch": 1.11, "learning_rate": 0.00013354859215684294, "loss": 0.0113, "step": 219950 }, { "epoch": 1.11, "learning_rate": 0.00013354102446382893, "loss": 0.0084, "step": 219960 }, { "epoch": 1.11, "learning_rate": 0.00013353345677081493, "loss": 0.0104, "step": 219970 }, { "epoch": 1.11, "learning_rate": 0.00013352588907780092, "loss": 0.0082, "step": 219980 }, { "epoch": 1.11, "learning_rate": 0.0001335183213847869, "loss": 0.0096, "step": 219990 }, { "epoch": 1.11, "learning_rate": 0.0001335107536917729, "loss": 0.0092, "step": 220000 }, { "epoch": 1.11, "eval_cer": 0.9144450256039017, "eval_loss": 0.007259270641952753, "eval_runtime": 116.3674, "eval_samples_per_second": 17.187, "eval_steps_per_second": 4.297, "step": 220000 }, { "epoch": 1.11, "learning_rate": 0.0001335031859987589, "loss": 0.0095, "step": 220010 }, { "epoch": 1.11, "learning_rate": 0.00013349561830574487, "loss": 0.0124, "step": 220020 }, { "epoch": 1.11, "learning_rate": 0.00013348805061273088, "loss": 0.0093, "step": 220030 }, { "epoch": 1.11, "learning_rate": 0.00013348048291971686, "loss": 0.0102, "step": 220040 }, { "epoch": 1.11, "learning_rate": 0.00013347291522670284, "loss": 0.0096, "step": 220050 }, { "epoch": 1.11, "learning_rate": 0.00013346534753368885, "loss": 0.0121, "step": 220060 }, { "epoch": 1.11, "learning_rate": 0.00013345777984067483, "loss": 0.0112, "step": 220070 }, { "epoch": 1.11, "learning_rate": 0.0001334502121476608, "loss": 0.0094, "step": 220080 }, { "epoch": 1.11, "learning_rate": 0.00013344264445464682, "loss": 0.0098, "step": 220090 }, { "epoch": 1.11, "learning_rate": 0.0001334350767616328, "loss": 0.0092, "step": 220100 }, { "epoch": 1.11, "learning_rate": 0.00013342750906861878, "loss": 0.0078, "step": 220110 }, { "epoch": 1.11, "learning_rate": 0.00013341994137560476, "loss": 0.0092, "step": 220120 }, { "epoch": 1.11, "learning_rate": 0.00013341237368259077, "loss": 0.0097, "step": 220130 }, { "epoch": 1.11, "learning_rate": 0.00013340480598957675, "loss": 0.0094, "step": 220140 }, { "epoch": 1.11, "learning_rate": 0.00013339723829656274, "loss": 0.0084, "step": 220150 }, { "epoch": 1.11, "learning_rate": 0.00013338967060354874, "loss": 0.0096, "step": 220160 }, { "epoch": 1.11, "learning_rate": 0.00013338210291053473, "loss": 0.0096, "step": 220170 }, { "epoch": 1.11, "learning_rate": 0.0001333745352175207, "loss": 0.0081, "step": 220180 }, { "epoch": 1.11, "learning_rate": 0.00013336696752450672, "loss": 0.0096, "step": 220190 }, { "epoch": 1.11, "learning_rate": 0.0001333593998314927, "loss": 0.0102, "step": 220200 }, { "epoch": 1.11, "learning_rate": 0.00013335183213847868, "loss": 0.0093, "step": 220210 }, { "epoch": 1.11, "learning_rate": 0.0001333442644454647, "loss": 0.0077, "step": 220220 }, { "epoch": 1.11, "learning_rate": 0.00013333669675245067, "loss": 0.0108, "step": 220230 }, { "epoch": 1.11, "learning_rate": 0.00013332912905943665, "loss": 0.011, "step": 220240 }, { "epoch": 1.11, "learning_rate": 0.00013332156136642266, "loss": 0.009, "step": 220250 }, { "epoch": 1.11, "learning_rate": 0.00013331399367340864, "loss": 0.007, "step": 220260 }, { "epoch": 1.11, "learning_rate": 0.00013330642598039462, "loss": 0.013, "step": 220270 }, { "epoch": 1.11, "learning_rate": 0.0001332988582873806, "loss": 0.0085, "step": 220280 }, { "epoch": 1.11, "learning_rate": 0.00013329129059436659, "loss": 0.0093, "step": 220290 }, { "epoch": 1.11, "learning_rate": 0.00013328372290135257, "loss": 0.0092, "step": 220300 }, { "epoch": 1.11, "learning_rate": 0.00013327615520833858, "loss": 0.0104, "step": 220310 }, { "epoch": 1.11, "learning_rate": 0.00013326858751532456, "loss": 0.0087, "step": 220320 }, { "epoch": 1.11, "learning_rate": 0.00013326101982231054, "loss": 0.0099, "step": 220330 }, { "epoch": 1.11, "learning_rate": 0.00013325345212929655, "loss": 0.0113, "step": 220340 }, { "epoch": 1.11, "learning_rate": 0.00013324588443628253, "loss": 0.0104, "step": 220350 }, { "epoch": 1.11, "learning_rate": 0.0001332383167432685, "loss": 0.0099, "step": 220360 }, { "epoch": 1.11, "learning_rate": 0.00013323074905025452, "loss": 0.01, "step": 220370 }, { "epoch": 1.11, "learning_rate": 0.0001332231813572405, "loss": 0.008, "step": 220380 }, { "epoch": 1.11, "learning_rate": 0.00013321561366422648, "loss": 0.0114, "step": 220390 }, { "epoch": 1.11, "learning_rate": 0.0001332080459712125, "loss": 0.0097, "step": 220400 }, { "epoch": 1.11, "learning_rate": 0.00013320047827819847, "loss": 0.0095, "step": 220410 }, { "epoch": 1.11, "learning_rate": 0.00013319291058518445, "loss": 0.0094, "step": 220420 }, { "epoch": 1.11, "learning_rate": 0.00013318534289217046, "loss": 0.011, "step": 220430 }, { "epoch": 1.11, "learning_rate": 0.00013317777519915644, "loss": 0.0086, "step": 220440 }, { "epoch": 1.11, "learning_rate": 0.00013317020750614242, "loss": 0.009, "step": 220450 }, { "epoch": 1.11, "learning_rate": 0.00013316263981312843, "loss": 0.0088, "step": 220460 }, { "epoch": 1.11, "learning_rate": 0.00013315507212011441, "loss": 0.0078, "step": 220470 }, { "epoch": 1.11, "learning_rate": 0.0001331475044271004, "loss": 0.0084, "step": 220480 }, { "epoch": 1.11, "learning_rate": 0.00013313993673408638, "loss": 0.0082, "step": 220490 }, { "epoch": 1.11, "learning_rate": 0.00013313236904107239, "loss": 0.0111, "step": 220500 }, { "epoch": 1.11, "learning_rate": 0.00013312480134805837, "loss": 0.0086, "step": 220510 }, { "epoch": 1.11, "learning_rate": 0.00013311723365504435, "loss": 0.0101, "step": 220520 }, { "epoch": 1.11, "learning_rate": 0.00013310966596203036, "loss": 0.008, "step": 220530 }, { "epoch": 1.11, "learning_rate": 0.00013310209826901634, "loss": 0.0089, "step": 220540 }, { "epoch": 1.11, "learning_rate": 0.00013309453057600232, "loss": 0.0103, "step": 220550 }, { "epoch": 1.11, "learning_rate": 0.00013308696288298833, "loss": 0.0094, "step": 220560 }, { "epoch": 1.11, "learning_rate": 0.0001330793951899743, "loss": 0.0106, "step": 220570 }, { "epoch": 1.11, "learning_rate": 0.0001330718274969603, "loss": 0.0099, "step": 220580 }, { "epoch": 1.11, "learning_rate": 0.0001330642598039463, "loss": 0.0099, "step": 220590 }, { "epoch": 1.11, "learning_rate": 0.00013305669211093228, "loss": 0.0103, "step": 220600 }, { "epoch": 1.11, "learning_rate": 0.00013304912441791826, "loss": 0.0095, "step": 220610 }, { "epoch": 1.11, "learning_rate": 0.00013304155672490427, "loss": 0.0079, "step": 220620 }, { "epoch": 1.11, "learning_rate": 0.00013303398903189025, "loss": 0.0076, "step": 220630 }, { "epoch": 1.11, "learning_rate": 0.00013302642133887623, "loss": 0.0089, "step": 220640 }, { "epoch": 1.11, "learning_rate": 0.00013301885364586222, "loss": 0.0085, "step": 220650 }, { "epoch": 1.11, "learning_rate": 0.00013301128595284822, "loss": 0.0098, "step": 220660 }, { "epoch": 1.11, "learning_rate": 0.0001330037182598342, "loss": 0.0098, "step": 220670 }, { "epoch": 1.11, "learning_rate": 0.0001329961505668202, "loss": 0.0089, "step": 220680 }, { "epoch": 1.11, "learning_rate": 0.0001329885828738062, "loss": 0.0122, "step": 220690 }, { "epoch": 1.11, "learning_rate": 0.00013298101518079218, "loss": 0.01, "step": 220700 }, { "epoch": 1.11, "learning_rate": 0.00013297344748777816, "loss": 0.0098, "step": 220710 }, { "epoch": 1.11, "learning_rate": 0.00013296587979476417, "loss": 0.0101, "step": 220720 }, { "epoch": 1.11, "learning_rate": 0.00013295831210175015, "loss": 0.009, "step": 220730 }, { "epoch": 1.11, "learning_rate": 0.00013295074440873613, "loss": 0.009, "step": 220740 }, { "epoch": 1.11, "learning_rate": 0.00013294317671572214, "loss": 0.009, "step": 220750 }, { "epoch": 1.11, "learning_rate": 0.00013293560902270812, "loss": 0.0099, "step": 220760 }, { "epoch": 1.11, "learning_rate": 0.0001329280413296941, "loss": 0.011, "step": 220770 }, { "epoch": 1.11, "learning_rate": 0.0001329204736366801, "loss": 0.0127, "step": 220780 }, { "epoch": 1.11, "learning_rate": 0.0001329129059436661, "loss": 0.0095, "step": 220790 }, { "epoch": 1.11, "learning_rate": 0.00013290533825065207, "loss": 0.0071, "step": 220800 }, { "epoch": 1.11, "learning_rate": 0.00013289777055763805, "loss": 0.0084, "step": 220810 }, { "epoch": 1.11, "learning_rate": 0.00013289020286462406, "loss": 0.0088, "step": 220820 }, { "epoch": 1.11, "learning_rate": 0.00013288263517161004, "loss": 0.0083, "step": 220830 }, { "epoch": 1.11, "learning_rate": 0.00013287506747859603, "loss": 0.0131, "step": 220840 }, { "epoch": 1.11, "learning_rate": 0.00013286749978558203, "loss": 0.0084, "step": 220850 }, { "epoch": 1.11, "learning_rate": 0.00013285993209256802, "loss": 0.0099, "step": 220860 }, { "epoch": 1.11, "learning_rate": 0.000132852364399554, "loss": 0.0098, "step": 220870 }, { "epoch": 1.11, "learning_rate": 0.00013284479670654, "loss": 0.0118, "step": 220880 }, { "epoch": 1.11, "learning_rate": 0.000132837229013526, "loss": 0.0085, "step": 220890 }, { "epoch": 1.11, "learning_rate": 0.00013282966132051197, "loss": 0.0095, "step": 220900 }, { "epoch": 1.11, "learning_rate": 0.00013282209362749795, "loss": 0.0106, "step": 220910 }, { "epoch": 1.11, "learning_rate": 0.00013281452593448393, "loss": 0.0097, "step": 220920 }, { "epoch": 1.11, "learning_rate": 0.00013280695824146994, "loss": 0.0087, "step": 220930 }, { "epoch": 1.11, "learning_rate": 0.00013279939054845592, "loss": 0.008, "step": 220940 }, { "epoch": 1.11, "learning_rate": 0.0001327918228554419, "loss": 0.0089, "step": 220950 }, { "epoch": 1.11, "learning_rate": 0.0001327842551624279, "loss": 0.008, "step": 220960 }, { "epoch": 1.11, "learning_rate": 0.0001327766874694139, "loss": 0.0092, "step": 220970 }, { "epoch": 1.11, "learning_rate": 0.00013276911977639987, "loss": 0.0084, "step": 220980 }, { "epoch": 1.11, "learning_rate": 0.00013276155208338588, "loss": 0.0084, "step": 220990 }, { "epoch": 1.11, "learning_rate": 0.00013275398439037186, "loss": 0.0098, "step": 221000 }, { "epoch": 1.11, "eval_cer": 0.9144712262992877, "eval_loss": 0.007316153962165117, "eval_runtime": 116.2409, "eval_samples_per_second": 17.206, "eval_steps_per_second": 4.301, "step": 221000 }, { "epoch": 1.12, "learning_rate": 0.00013274641669735785, "loss": 0.0087, "step": 221010 }, { "epoch": 1.12, "learning_rate": 0.00013273884900434383, "loss": 0.0087, "step": 221020 }, { "epoch": 1.12, "learning_rate": 0.00013273128131132984, "loss": 0.0086, "step": 221030 }, { "epoch": 1.12, "learning_rate": 0.00013272371361831582, "loss": 0.0081, "step": 221040 }, { "epoch": 1.12, "learning_rate": 0.0001327161459253018, "loss": 0.0073, "step": 221050 }, { "epoch": 1.12, "learning_rate": 0.0001327085782322878, "loss": 0.0095, "step": 221060 }, { "epoch": 1.12, "learning_rate": 0.0001327010105392738, "loss": 0.0076, "step": 221070 }, { "epoch": 1.12, "learning_rate": 0.00013269344284625977, "loss": 0.0102, "step": 221080 }, { "epoch": 1.12, "learning_rate": 0.00013268587515324578, "loss": 0.007, "step": 221090 }, { "epoch": 1.12, "learning_rate": 0.00013267830746023176, "loss": 0.0085, "step": 221100 }, { "epoch": 1.12, "learning_rate": 0.00013267073976721774, "loss": 0.0145, "step": 221110 }, { "epoch": 1.12, "learning_rate": 0.00013266317207420375, "loss": 0.0096, "step": 221120 }, { "epoch": 1.12, "learning_rate": 0.00013265560438118973, "loss": 0.0093, "step": 221130 }, { "epoch": 1.12, "learning_rate": 0.0001326480366881757, "loss": 0.0106, "step": 221140 }, { "epoch": 1.12, "learning_rate": 0.00013264046899516172, "loss": 0.0105, "step": 221150 }, { "epoch": 1.12, "learning_rate": 0.0001326329013021477, "loss": 0.0187, "step": 221160 }, { "epoch": 1.12, "learning_rate": 0.00013262533360913368, "loss": 0.013, "step": 221170 }, { "epoch": 1.12, "learning_rate": 0.00013261776591611967, "loss": 0.0105, "step": 221180 }, { "epoch": 1.12, "learning_rate": 0.00013261019822310567, "loss": 0.0121, "step": 221190 }, { "epoch": 1.12, "learning_rate": 0.00013260263053009166, "loss": 0.0089, "step": 221200 }, { "epoch": 1.12, "learning_rate": 0.00013259506283707764, "loss": 0.0107, "step": 221210 }, { "epoch": 1.12, "learning_rate": 0.00013258749514406365, "loss": 0.0065, "step": 221220 }, { "epoch": 1.12, "learning_rate": 0.00013257992745104963, "loss": 0.0099, "step": 221230 }, { "epoch": 1.12, "learning_rate": 0.0001325723597580356, "loss": 0.0102, "step": 221240 }, { "epoch": 1.12, "learning_rate": 0.00013256479206502162, "loss": 0.0107, "step": 221250 }, { "epoch": 1.12, "learning_rate": 0.0001325572243720076, "loss": 0.0095, "step": 221260 }, { "epoch": 1.12, "learning_rate": 0.00013254965667899358, "loss": 0.0091, "step": 221270 }, { "epoch": 1.12, "learning_rate": 0.0001325420889859796, "loss": 0.0111, "step": 221280 }, { "epoch": 1.12, "learning_rate": 0.00013253452129296557, "loss": 0.009, "step": 221290 }, { "epoch": 1.12, "learning_rate": 0.00013252695359995155, "loss": 0.0087, "step": 221300 }, { "epoch": 1.12, "learning_rate": 0.00013251938590693756, "loss": 0.0098, "step": 221310 }, { "epoch": 1.12, "learning_rate": 0.00013251181821392354, "loss": 0.0087, "step": 221320 }, { "epoch": 1.12, "learning_rate": 0.00013250425052090952, "loss": 0.0082, "step": 221330 }, { "epoch": 1.12, "learning_rate": 0.0001324966828278955, "loss": 0.0081, "step": 221340 }, { "epoch": 1.12, "learning_rate": 0.0001324891151348815, "loss": 0.008, "step": 221350 }, { "epoch": 1.12, "learning_rate": 0.0001324815474418675, "loss": 0.0102, "step": 221360 }, { "epoch": 1.12, "learning_rate": 0.00013247397974885348, "loss": 0.0129, "step": 221370 }, { "epoch": 1.12, "learning_rate": 0.00013246641205583948, "loss": 0.0084, "step": 221380 }, { "epoch": 1.12, "learning_rate": 0.00013245884436282547, "loss": 0.0082, "step": 221390 }, { "epoch": 1.12, "learning_rate": 0.00013245127666981145, "loss": 0.0102, "step": 221400 }, { "epoch": 1.12, "learning_rate": 0.00013244370897679746, "loss": 0.01, "step": 221410 }, { "epoch": 1.12, "learning_rate": 0.00013243614128378344, "loss": 0.0097, "step": 221420 }, { "epoch": 1.12, "learning_rate": 0.00013242857359076942, "loss": 0.0104, "step": 221430 }, { "epoch": 1.12, "learning_rate": 0.00013242100589775543, "loss": 0.0088, "step": 221440 }, { "epoch": 1.12, "learning_rate": 0.0001324134382047414, "loss": 0.0119, "step": 221450 }, { "epoch": 1.12, "learning_rate": 0.0001324058705117274, "loss": 0.0087, "step": 221460 }, { "epoch": 1.12, "learning_rate": 0.0001323983028187134, "loss": 0.0078, "step": 221470 }, { "epoch": 1.12, "learning_rate": 0.00013239073512569938, "loss": 0.0089, "step": 221480 }, { "epoch": 1.12, "learning_rate": 0.00013238316743268536, "loss": 0.0096, "step": 221490 }, { "epoch": 1.12, "learning_rate": 0.00013237559973967137, "loss": 0.0075, "step": 221500 }, { "epoch": 1.12, "learning_rate": 0.00013236803204665735, "loss": 0.0108, "step": 221510 }, { "epoch": 1.12, "learning_rate": 0.00013236046435364333, "loss": 0.0104, "step": 221520 }, { "epoch": 1.12, "learning_rate": 0.00013235289666062931, "loss": 0.0085, "step": 221530 }, { "epoch": 1.12, "learning_rate": 0.0001323453289676153, "loss": 0.0081, "step": 221540 }, { "epoch": 1.12, "learning_rate": 0.00013233776127460128, "loss": 0.0098, "step": 221550 }, { "epoch": 1.12, "learning_rate": 0.00013233019358158729, "loss": 0.0075, "step": 221560 }, { "epoch": 1.12, "learning_rate": 0.00013232262588857327, "loss": 0.0104, "step": 221570 }, { "epoch": 1.12, "learning_rate": 0.00013231505819555925, "loss": 0.0073, "step": 221580 }, { "epoch": 1.12, "learning_rate": 0.00013230749050254526, "loss": 0.0135, "step": 221590 }, { "epoch": 1.12, "learning_rate": 0.00013229992280953124, "loss": 0.009, "step": 221600 }, { "epoch": 1.12, "learning_rate": 0.00013229235511651722, "loss": 0.0072, "step": 221610 }, { "epoch": 1.12, "learning_rate": 0.00013228478742350323, "loss": 0.0124, "step": 221620 }, { "epoch": 1.12, "learning_rate": 0.0001322772197304892, "loss": 0.0096, "step": 221630 }, { "epoch": 1.12, "learning_rate": 0.0001322696520374752, "loss": 0.0099, "step": 221640 }, { "epoch": 1.12, "learning_rate": 0.0001322620843444612, "loss": 0.0104, "step": 221650 }, { "epoch": 1.12, "learning_rate": 0.00013225451665144718, "loss": 0.0086, "step": 221660 }, { "epoch": 1.12, "learning_rate": 0.00013224694895843316, "loss": 0.0111, "step": 221670 }, { "epoch": 1.12, "learning_rate": 0.00013223938126541917, "loss": 0.009, "step": 221680 }, { "epoch": 1.12, "learning_rate": 0.00013223181357240515, "loss": 0.0112, "step": 221690 }, { "epoch": 1.12, "learning_rate": 0.00013222424587939113, "loss": 0.0302, "step": 221700 }, { "epoch": 1.12, "learning_rate": 0.00013221667818637712, "loss": 0.0137, "step": 221710 }, { "epoch": 1.12, "learning_rate": 0.00013220911049336312, "loss": 0.0125, "step": 221720 }, { "epoch": 1.12, "learning_rate": 0.0001322015428003491, "loss": 0.0086, "step": 221730 }, { "epoch": 1.12, "learning_rate": 0.0001321939751073351, "loss": 0.0094, "step": 221740 }, { "epoch": 1.12, "learning_rate": 0.0001321864074143211, "loss": 0.0084, "step": 221750 }, { "epoch": 1.12, "learning_rate": 0.00013217883972130708, "loss": 0.0071, "step": 221760 }, { "epoch": 1.12, "learning_rate": 0.00013217127202829306, "loss": 0.0095, "step": 221770 }, { "epoch": 1.12, "learning_rate": 0.00013216370433527907, "loss": 0.0073, "step": 221780 }, { "epoch": 1.12, "learning_rate": 0.00013215613664226505, "loss": 0.0099, "step": 221790 }, { "epoch": 1.12, "learning_rate": 0.00013214856894925103, "loss": 0.011, "step": 221800 }, { "epoch": 1.12, "learning_rate": 0.00013214100125623704, "loss": 0.009, "step": 221810 }, { "epoch": 1.12, "learning_rate": 0.00013213343356322302, "loss": 0.0075, "step": 221820 }, { "epoch": 1.12, "learning_rate": 0.000132125865870209, "loss": 0.0103, "step": 221830 }, { "epoch": 1.12, "learning_rate": 0.000132118298177195, "loss": 0.0093, "step": 221840 }, { "epoch": 1.12, "learning_rate": 0.000132110730484181, "loss": 0.0083, "step": 221850 }, { "epoch": 1.12, "learning_rate": 0.00013210316279116697, "loss": 0.0093, "step": 221860 }, { "epoch": 1.12, "learning_rate": 0.00013209559509815298, "loss": 0.0126, "step": 221870 }, { "epoch": 1.12, "learning_rate": 0.00013208802740513896, "loss": 0.0078, "step": 221880 }, { "epoch": 1.12, "learning_rate": 0.00013208045971212494, "loss": 0.0089, "step": 221890 }, { "epoch": 1.12, "learning_rate": 0.00013207289201911093, "loss": 0.0084, "step": 221900 }, { "epoch": 1.12, "learning_rate": 0.00013206532432609693, "loss": 0.0099, "step": 221910 }, { "epoch": 1.12, "learning_rate": 0.00013205775663308292, "loss": 0.0114, "step": 221920 }, { "epoch": 1.12, "learning_rate": 0.0001320501889400689, "loss": 0.0092, "step": 221930 }, { "epoch": 1.12, "learning_rate": 0.0001320426212470549, "loss": 0.0119, "step": 221940 }, { "epoch": 1.12, "learning_rate": 0.0001320350535540409, "loss": 0.0091, "step": 221950 }, { "epoch": 1.12, "learning_rate": 0.00013202748586102687, "loss": 0.0094, "step": 221960 }, { "epoch": 1.12, "learning_rate": 0.00013201991816801288, "loss": 0.012, "step": 221970 }, { "epoch": 1.12, "learning_rate": 0.00013201235047499886, "loss": 0.0083, "step": 221980 }, { "epoch": 1.12, "learning_rate": 0.00013200478278198484, "loss": 0.0094, "step": 221990 }, { "epoch": 1.12, "learning_rate": 0.00013199721508897085, "loss": 0.0103, "step": 222000 }, { "epoch": 1.12, "eval_cer": 0.9144731670915385, "eval_loss": 0.007101530209183693, "eval_runtime": 116.3424, "eval_samples_per_second": 17.191, "eval_steps_per_second": 4.298, "step": 222000 }, { "epoch": 1.12, "learning_rate": 0.00013198964739595683, "loss": 0.0095, "step": 222010 }, { "epoch": 1.12, "learning_rate": 0.0001319820797029428, "loss": 0.0094, "step": 222020 }, { "epoch": 1.12, "learning_rate": 0.00013197451200992882, "loss": 0.0088, "step": 222030 }, { "epoch": 1.12, "learning_rate": 0.0001319669443169148, "loss": 0.0095, "step": 222040 }, { "epoch": 1.12, "learning_rate": 0.00013195937662390078, "loss": 0.0087, "step": 222050 }, { "epoch": 1.12, "learning_rate": 0.00013195180893088676, "loss": 0.0114, "step": 222060 }, { "epoch": 1.12, "learning_rate": 0.00013194424123787277, "loss": 0.0078, "step": 222070 }, { "epoch": 1.12, "learning_rate": 0.00013193667354485875, "loss": 0.0081, "step": 222080 }, { "epoch": 1.12, "learning_rate": 0.00013192910585184474, "loss": 0.0105, "step": 222090 }, { "epoch": 1.12, "learning_rate": 0.00013192153815883074, "loss": 0.0084, "step": 222100 }, { "epoch": 1.12, "learning_rate": 0.00013191397046581673, "loss": 0.01, "step": 222110 }, { "epoch": 1.12, "learning_rate": 0.0001319064027728027, "loss": 0.0105, "step": 222120 }, { "epoch": 1.12, "learning_rate": 0.00013189883507978872, "loss": 0.0105, "step": 222130 }, { "epoch": 1.12, "learning_rate": 0.0001318912673867747, "loss": 0.0071, "step": 222140 }, { "epoch": 1.12, "learning_rate": 0.00013188369969376068, "loss": 0.0094, "step": 222150 }, { "epoch": 1.12, "learning_rate": 0.00013187613200074666, "loss": 0.0093, "step": 222160 }, { "epoch": 1.12, "learning_rate": 0.00013186856430773264, "loss": 0.0089, "step": 222170 }, { "epoch": 1.12, "learning_rate": 0.00013186099661471865, "loss": 0.0107, "step": 222180 }, { "epoch": 1.12, "learning_rate": 0.00013185342892170463, "loss": 0.0089, "step": 222190 }, { "epoch": 1.12, "learning_rate": 0.0001318458612286906, "loss": 0.0093, "step": 222200 }, { "epoch": 1.12, "learning_rate": 0.00013183829353567662, "loss": 0.0074, "step": 222210 }, { "epoch": 1.12, "learning_rate": 0.0001318307258426626, "loss": 0.0089, "step": 222220 }, { "epoch": 1.12, "learning_rate": 0.00013182315814964858, "loss": 0.0118, "step": 222230 }, { "epoch": 1.12, "learning_rate": 0.00013181559045663457, "loss": 0.0085, "step": 222240 }, { "epoch": 1.12, "learning_rate": 0.00013180802276362057, "loss": 0.0081, "step": 222250 }, { "epoch": 1.12, "learning_rate": 0.00013180045507060656, "loss": 0.009, "step": 222260 }, { "epoch": 1.12, "learning_rate": 0.00013179288737759254, "loss": 0.0072, "step": 222270 }, { "epoch": 1.12, "learning_rate": 0.00013178531968457855, "loss": 0.0102, "step": 222280 }, { "epoch": 1.12, "learning_rate": 0.00013177775199156453, "loss": 0.0092, "step": 222290 }, { "epoch": 1.12, "learning_rate": 0.0001317701842985505, "loss": 0.0082, "step": 222300 }, { "epoch": 1.12, "learning_rate": 0.00013176261660553652, "loss": 0.0091, "step": 222310 }, { "epoch": 1.12, "learning_rate": 0.0001317550489125225, "loss": 0.0101, "step": 222320 }, { "epoch": 1.12, "learning_rate": 0.00013174748121950848, "loss": 0.0113, "step": 222330 }, { "epoch": 1.12, "learning_rate": 0.0001317399135264945, "loss": 0.0099, "step": 222340 }, { "epoch": 1.12, "learning_rate": 0.00013173234583348047, "loss": 0.0085, "step": 222350 }, { "epoch": 1.12, "learning_rate": 0.00013172477814046645, "loss": 0.0106, "step": 222360 }, { "epoch": 1.12, "learning_rate": 0.00013171721044745246, "loss": 0.0095, "step": 222370 }, { "epoch": 1.12, "learning_rate": 0.00013170964275443844, "loss": 0.0089, "step": 222380 }, { "epoch": 1.12, "learning_rate": 0.00013170207506142442, "loss": 0.0093, "step": 222390 }, { "epoch": 1.12, "learning_rate": 0.00013169450736841043, "loss": 0.0096, "step": 222400 }, { "epoch": 1.12, "learning_rate": 0.0001316869396753964, "loss": 0.0082, "step": 222410 }, { "epoch": 1.12, "learning_rate": 0.0001316793719823824, "loss": 0.0072, "step": 222420 }, { "epoch": 1.12, "learning_rate": 0.00013167180428936838, "loss": 0.0077, "step": 222430 }, { "epoch": 1.12, "learning_rate": 0.00013166423659635438, "loss": 0.0091, "step": 222440 }, { "epoch": 1.12, "learning_rate": 0.00013165666890334037, "loss": 0.0082, "step": 222450 }, { "epoch": 1.12, "learning_rate": 0.00013164910121032635, "loss": 0.0086, "step": 222460 }, { "epoch": 1.12, "learning_rate": 0.00013164153351731236, "loss": 0.0079, "step": 222470 }, { "epoch": 1.12, "learning_rate": 0.00013163396582429834, "loss": 0.0102, "step": 222480 }, { "epoch": 1.12, "learning_rate": 0.00013162639813128432, "loss": 0.0084, "step": 222490 }, { "epoch": 1.12, "learning_rate": 0.00013161883043827033, "loss": 0.0121, "step": 222500 }, { "epoch": 1.12, "learning_rate": 0.0001316112627452563, "loss": 0.0152, "step": 222510 }, { "epoch": 1.12, "learning_rate": 0.0001316036950522423, "loss": 0.0075, "step": 222520 }, { "epoch": 1.12, "learning_rate": 0.0001315961273592283, "loss": 0.0107, "step": 222530 }, { "epoch": 1.12, "learning_rate": 0.00013158855966621428, "loss": 0.0099, "step": 222540 }, { "epoch": 1.12, "learning_rate": 0.00013158099197320026, "loss": 0.0087, "step": 222550 }, { "epoch": 1.12, "learning_rate": 0.00013157342428018627, "loss": 0.0084, "step": 222560 }, { "epoch": 1.12, "learning_rate": 0.00013156585658717225, "loss": 0.0113, "step": 222570 }, { "epoch": 1.12, "learning_rate": 0.00013155828889415823, "loss": 0.0103, "step": 222580 }, { "epoch": 1.12, "learning_rate": 0.00013155072120114421, "loss": 0.0104, "step": 222590 }, { "epoch": 1.12, "learning_rate": 0.00013154315350813022, "loss": 0.0076, "step": 222600 }, { "epoch": 1.12, "learning_rate": 0.0001315355858151162, "loss": 0.0112, "step": 222610 }, { "epoch": 1.12, "learning_rate": 0.00013152801812210219, "loss": 0.0108, "step": 222620 }, { "epoch": 1.12, "learning_rate": 0.0001315204504290882, "loss": 0.0074, "step": 222630 }, { "epoch": 1.12, "learning_rate": 0.00013151288273607418, "loss": 0.0091, "step": 222640 }, { "epoch": 1.12, "learning_rate": 0.00013150531504306016, "loss": 0.0092, "step": 222650 }, { "epoch": 1.12, "learning_rate": 0.00013149774735004617, "loss": 0.009, "step": 222660 }, { "epoch": 1.12, "learning_rate": 0.00013149017965703215, "loss": 0.009, "step": 222670 }, { "epoch": 1.12, "learning_rate": 0.00013148261196401813, "loss": 0.0082, "step": 222680 }, { "epoch": 1.12, "learning_rate": 0.00013147504427100414, "loss": 0.0082, "step": 222690 }, { "epoch": 1.12, "learning_rate": 0.00013146747657799012, "loss": 0.0085, "step": 222700 }, { "epoch": 1.12, "learning_rate": 0.0001314599088849761, "loss": 0.0082, "step": 222710 }, { "epoch": 1.12, "learning_rate": 0.0001314523411919621, "loss": 0.0091, "step": 222720 }, { "epoch": 1.12, "learning_rate": 0.0001314447734989481, "loss": 0.0064, "step": 222730 }, { "epoch": 1.12, "learning_rate": 0.00013143720580593407, "loss": 0.01, "step": 222740 }, { "epoch": 1.12, "learning_rate": 0.00013142963811292005, "loss": 0.0119, "step": 222750 }, { "epoch": 1.12, "learning_rate": 0.00013142207041990606, "loss": 0.0101, "step": 222760 }, { "epoch": 1.12, "learning_rate": 0.00013141450272689204, "loss": 0.0104, "step": 222770 }, { "epoch": 1.12, "learning_rate": 0.00013140693503387802, "loss": 0.0101, "step": 222780 }, { "epoch": 1.12, "learning_rate": 0.000131399367340864, "loss": 0.0091, "step": 222790 }, { "epoch": 1.12, "learning_rate": 0.00013139179964785, "loss": 0.0079, "step": 222800 }, { "epoch": 1.12, "learning_rate": 0.000131384231954836, "loss": 0.009, "step": 222810 }, { "epoch": 1.12, "learning_rate": 0.00013137666426182198, "loss": 0.0082, "step": 222820 }, { "epoch": 1.12, "learning_rate": 0.00013136909656880796, "loss": 0.0085, "step": 222830 }, { "epoch": 1.12, "learning_rate": 0.00013136152887579397, "loss": 0.0119, "step": 222840 }, { "epoch": 1.12, "learning_rate": 0.00013135396118277995, "loss": 0.0116, "step": 222850 }, { "epoch": 1.12, "learning_rate": 0.00013134639348976593, "loss": 0.0094, "step": 222860 }, { "epoch": 1.12, "learning_rate": 0.00013133882579675194, "loss": 0.0086, "step": 222870 }, { "epoch": 1.12, "learning_rate": 0.00013133125810373792, "loss": 0.0081, "step": 222880 }, { "epoch": 1.12, "learning_rate": 0.0001313236904107239, "loss": 0.0104, "step": 222890 }, { "epoch": 1.12, "learning_rate": 0.0001313161227177099, "loss": 0.009, "step": 222900 }, { "epoch": 1.12, "learning_rate": 0.0001313085550246959, "loss": 0.0121, "step": 222910 }, { "epoch": 1.12, "learning_rate": 0.00013130098733168187, "loss": 0.0112, "step": 222920 }, { "epoch": 1.12, "learning_rate": 0.00013129341963866788, "loss": 0.0097, "step": 222930 }, { "epoch": 1.12, "learning_rate": 0.00013128585194565386, "loss": 0.0086, "step": 222940 }, { "epoch": 1.12, "learning_rate": 0.00013127828425263984, "loss": 0.0101, "step": 222950 }, { "epoch": 1.12, "learning_rate": 0.00013127071655962583, "loss": 0.0072, "step": 222960 }, { "epoch": 1.12, "learning_rate": 0.00013126314886661183, "loss": 0.0111, "step": 222970 }, { "epoch": 1.12, "learning_rate": 0.00013125558117359782, "loss": 0.0117, "step": 222980 }, { "epoch": 1.13, "learning_rate": 0.0001312480134805838, "loss": 0.0076, "step": 222990 }, { "epoch": 1.13, "learning_rate": 0.0001312404457875698, "loss": 0.0088, "step": 223000 }, { "epoch": 1.13, "eval_cer": 0.9144547295651558, "eval_loss": 0.006930416449904442, "eval_runtime": 115.5739, "eval_samples_per_second": 17.305, "eval_steps_per_second": 4.326, "step": 223000 }, { "epoch": 1.13, "learning_rate": 0.0001312328780945558, "loss": 0.009, "step": 223010 }, { "epoch": 1.13, "learning_rate": 0.00013122531040154177, "loss": 0.0118, "step": 223020 }, { "epoch": 1.13, "learning_rate": 0.00013121774270852778, "loss": 0.0107, "step": 223030 }, { "epoch": 1.13, "learning_rate": 0.00013121017501551376, "loss": 0.0117, "step": 223040 }, { "epoch": 1.13, "learning_rate": 0.00013120260732249974, "loss": 0.0103, "step": 223050 }, { "epoch": 1.13, "learning_rate": 0.00013119503962948575, "loss": 0.0108, "step": 223060 }, { "epoch": 1.13, "learning_rate": 0.00013118747193647173, "loss": 0.0086, "step": 223070 }, { "epoch": 1.13, "learning_rate": 0.0001311799042434577, "loss": 0.0081, "step": 223080 }, { "epoch": 1.13, "learning_rate": 0.00013117233655044372, "loss": 0.0077, "step": 223090 }, { "epoch": 1.13, "learning_rate": 0.0001311647688574297, "loss": 0.0115, "step": 223100 }, { "epoch": 1.13, "learning_rate": 0.00013115720116441568, "loss": 0.0079, "step": 223110 }, { "epoch": 1.13, "learning_rate": 0.00013114963347140166, "loss": 0.0118, "step": 223120 }, { "epoch": 1.13, "learning_rate": 0.00013114206577838767, "loss": 0.0116, "step": 223130 }, { "epoch": 1.13, "learning_rate": 0.00013113449808537365, "loss": 0.01, "step": 223140 }, { "epoch": 1.13, "learning_rate": 0.00013112693039235964, "loss": 0.0072, "step": 223150 }, { "epoch": 1.13, "learning_rate": 0.00013111936269934564, "loss": 0.012, "step": 223160 }, { "epoch": 1.13, "learning_rate": 0.00013111179500633163, "loss": 0.0078, "step": 223170 }, { "epoch": 1.13, "learning_rate": 0.0001311042273133176, "loss": 0.0077, "step": 223180 }, { "epoch": 1.13, "learning_rate": 0.00013109665962030362, "loss": 0.009, "step": 223190 }, { "epoch": 1.13, "learning_rate": 0.0001310890919272896, "loss": 0.0083, "step": 223200 }, { "epoch": 1.13, "learning_rate": 0.00013108152423427558, "loss": 0.0121, "step": 223210 }, { "epoch": 1.13, "learning_rate": 0.0001310739565412616, "loss": 0.0085, "step": 223220 }, { "epoch": 1.13, "learning_rate": 0.00013106638884824757, "loss": 0.009, "step": 223230 }, { "epoch": 1.13, "learning_rate": 0.00013105882115523355, "loss": 0.0099, "step": 223240 }, { "epoch": 1.13, "learning_rate": 0.00013105125346221956, "loss": 0.0082, "step": 223250 }, { "epoch": 1.13, "learning_rate": 0.00013104368576920554, "loss": 0.0086, "step": 223260 }, { "epoch": 1.13, "learning_rate": 0.00013103611807619152, "loss": 0.0098, "step": 223270 }, { "epoch": 1.13, "learning_rate": 0.0001310285503831775, "loss": 0.0096, "step": 223280 }, { "epoch": 1.13, "learning_rate": 0.0001310209826901635, "loss": 0.0103, "step": 223290 }, { "epoch": 1.13, "learning_rate": 0.0001310134149971495, "loss": 0.011, "step": 223300 }, { "epoch": 1.13, "learning_rate": 0.00013100584730413547, "loss": 0.0114, "step": 223310 }, { "epoch": 1.13, "learning_rate": 0.00013099827961112148, "loss": 0.0086, "step": 223320 }, { "epoch": 1.13, "learning_rate": 0.00013099071191810746, "loss": 0.0088, "step": 223330 }, { "epoch": 1.13, "learning_rate": 0.00013098314422509345, "loss": 0.0116, "step": 223340 }, { "epoch": 1.13, "learning_rate": 0.00013097557653207945, "loss": 0.0083, "step": 223350 }, { "epoch": 1.13, "learning_rate": 0.00013096800883906544, "loss": 0.0092, "step": 223360 }, { "epoch": 1.13, "learning_rate": 0.00013096044114605142, "loss": 0.012, "step": 223370 }, { "epoch": 1.13, "learning_rate": 0.00013095287345303743, "loss": 0.0089, "step": 223380 }, { "epoch": 1.13, "learning_rate": 0.0001309453057600234, "loss": 0.0112, "step": 223390 }, { "epoch": 1.13, "learning_rate": 0.0001309377380670094, "loss": 0.0111, "step": 223400 }, { "epoch": 1.13, "learning_rate": 0.0001309301703739954, "loss": 0.0077, "step": 223410 }, { "epoch": 1.13, "learning_rate": 0.00013092260268098135, "loss": 0.0126, "step": 223420 }, { "epoch": 1.13, "learning_rate": 0.00013091503498796736, "loss": 0.0121, "step": 223430 }, { "epoch": 1.13, "learning_rate": 0.00013090746729495334, "loss": 0.0072, "step": 223440 }, { "epoch": 1.13, "learning_rate": 0.00013089989960193932, "loss": 0.0083, "step": 223450 }, { "epoch": 1.13, "learning_rate": 0.00013089233190892533, "loss": 0.0126, "step": 223460 }, { "epoch": 1.13, "learning_rate": 0.0001308847642159113, "loss": 0.0103, "step": 223470 }, { "epoch": 1.13, "learning_rate": 0.0001308771965228973, "loss": 0.0099, "step": 223480 }, { "epoch": 1.13, "learning_rate": 0.00013086962882988328, "loss": 0.0099, "step": 223490 }, { "epoch": 1.13, "learning_rate": 0.00013086206113686928, "loss": 0.009, "step": 223500 }, { "epoch": 1.13, "learning_rate": 0.00013085449344385527, "loss": 0.0093, "step": 223510 }, { "epoch": 1.13, "learning_rate": 0.00013084692575084125, "loss": 0.01, "step": 223520 }, { "epoch": 1.13, "learning_rate": 0.00013083935805782726, "loss": 0.0125, "step": 223530 }, { "epoch": 1.13, "learning_rate": 0.00013083179036481324, "loss": 0.0083, "step": 223540 }, { "epoch": 1.13, "learning_rate": 0.00013082422267179922, "loss": 0.0111, "step": 223550 }, { "epoch": 1.13, "learning_rate": 0.00013081665497878523, "loss": 0.0122, "step": 223560 }, { "epoch": 1.13, "learning_rate": 0.0001308090872857712, "loss": 0.0079, "step": 223570 }, { "epoch": 1.13, "learning_rate": 0.0001308015195927572, "loss": 0.0098, "step": 223580 }, { "epoch": 1.13, "learning_rate": 0.0001307939518997432, "loss": 0.0146, "step": 223590 }, { "epoch": 1.13, "learning_rate": 0.00013078638420672918, "loss": 0.0137, "step": 223600 }, { "epoch": 1.13, "learning_rate": 0.00013077881651371516, "loss": 0.0081, "step": 223610 }, { "epoch": 1.13, "learning_rate": 0.00013077124882070117, "loss": 0.0081, "step": 223620 }, { "epoch": 1.13, "learning_rate": 0.00013076368112768715, "loss": 0.0092, "step": 223630 }, { "epoch": 1.13, "learning_rate": 0.00013075611343467313, "loss": 0.0093, "step": 223640 }, { "epoch": 1.13, "learning_rate": 0.00013074854574165911, "loss": 0.0117, "step": 223650 }, { "epoch": 1.13, "learning_rate": 0.00013074097804864512, "loss": 0.0087, "step": 223660 }, { "epoch": 1.13, "learning_rate": 0.0001307334103556311, "loss": 0.0096, "step": 223670 }, { "epoch": 1.13, "learning_rate": 0.00013072584266261709, "loss": 0.0091, "step": 223680 }, { "epoch": 1.13, "learning_rate": 0.0001307182749696031, "loss": 0.0078, "step": 223690 }, { "epoch": 1.13, "learning_rate": 0.00013071070727658908, "loss": 0.0094, "step": 223700 }, { "epoch": 1.13, "learning_rate": 0.00013070313958357506, "loss": 0.0096, "step": 223710 }, { "epoch": 1.13, "learning_rate": 0.00013069557189056107, "loss": 0.0084, "step": 223720 }, { "epoch": 1.13, "learning_rate": 0.00013068800419754705, "loss": 0.0095, "step": 223730 }, { "epoch": 1.13, "learning_rate": 0.00013068043650453303, "loss": 0.0259, "step": 223740 }, { "epoch": 1.13, "learning_rate": 0.00013067286881151904, "loss": 0.011, "step": 223750 }, { "epoch": 1.13, "learning_rate": 0.00013066530111850502, "loss": 0.0127, "step": 223760 }, { "epoch": 1.13, "learning_rate": 0.000130657733425491, "loss": 0.012, "step": 223770 }, { "epoch": 1.13, "learning_rate": 0.000130650165732477, "loss": 0.0083, "step": 223780 }, { "epoch": 1.13, "learning_rate": 0.000130642598039463, "loss": 0.0106, "step": 223790 }, { "epoch": 1.13, "learning_rate": 0.00013063503034644897, "loss": 0.0088, "step": 223800 }, { "epoch": 1.13, "learning_rate": 0.00013062746265343498, "loss": 0.0082, "step": 223810 }, { "epoch": 1.13, "learning_rate": 0.00013061989496042096, "loss": 0.012, "step": 223820 }, { "epoch": 1.13, "learning_rate": 0.00013061232726740694, "loss": 0.0106, "step": 223830 }, { "epoch": 1.13, "learning_rate": 0.00013060475957439292, "loss": 0.0098, "step": 223840 }, { "epoch": 1.13, "learning_rate": 0.00013059719188137893, "loss": 0.0101, "step": 223850 }, { "epoch": 1.13, "learning_rate": 0.00013058962418836491, "loss": 0.0092, "step": 223860 }, { "epoch": 1.13, "learning_rate": 0.0001305820564953509, "loss": 0.0091, "step": 223870 }, { "epoch": 1.13, "learning_rate": 0.0001305744888023369, "loss": 0.0098, "step": 223880 }, { "epoch": 1.13, "learning_rate": 0.00013056692110932289, "loss": 0.0071, "step": 223890 }, { "epoch": 1.13, "learning_rate": 0.00013055935341630887, "loss": 0.0095, "step": 223900 }, { "epoch": 1.13, "learning_rate": 0.00013055178572329488, "loss": 0.007, "step": 223910 }, { "epoch": 1.13, "learning_rate": 0.00013054421803028086, "loss": 0.0089, "step": 223920 }, { "epoch": 1.13, "learning_rate": 0.00013053665033726684, "loss": 0.009, "step": 223930 }, { "epoch": 1.13, "learning_rate": 0.00013052908264425285, "loss": 0.0078, "step": 223940 }, { "epoch": 1.13, "learning_rate": 0.00013052151495123883, "loss": 0.0081, "step": 223950 }, { "epoch": 1.13, "learning_rate": 0.0001305139472582248, "loss": 0.0079, "step": 223960 }, { "epoch": 1.13, "learning_rate": 0.00013050637956521082, "loss": 0.0088, "step": 223970 }, { "epoch": 1.13, "learning_rate": 0.0001304988118721968, "loss": 0.0096, "step": 223980 }, { "epoch": 1.13, "learning_rate": 0.00013049124417918278, "loss": 0.0079, "step": 223990 }, { "epoch": 1.13, "learning_rate": 0.00013048367648616876, "loss": 0.0089, "step": 224000 }, { "epoch": 1.13, "eval_cer": 0.9144683151109114, "eval_loss": 0.007022760342806578, "eval_runtime": 115.4845, "eval_samples_per_second": 17.318, "eval_steps_per_second": 4.33, "step": 224000 }, { "epoch": 1.13, "learning_rate": 0.00013047610879315477, "loss": 0.0131, "step": 224010 }, { "epoch": 1.13, "learning_rate": 0.00013046854110014075, "loss": 0.0086, "step": 224020 }, { "epoch": 1.13, "learning_rate": 0.00013046097340712673, "loss": 0.0072, "step": 224030 }, { "epoch": 1.13, "learning_rate": 0.00013045340571411274, "loss": 0.0101, "step": 224040 }, { "epoch": 1.13, "learning_rate": 0.0001304458380210987, "loss": 0.0081, "step": 224050 }, { "epoch": 1.13, "learning_rate": 0.0001304382703280847, "loss": 0.0085, "step": 224060 }, { "epoch": 1.13, "learning_rate": 0.0001304307026350707, "loss": 0.0097, "step": 224070 }, { "epoch": 1.13, "learning_rate": 0.00013042313494205667, "loss": 0.0085, "step": 224080 }, { "epoch": 1.13, "learning_rate": 0.00013041556724904268, "loss": 0.0082, "step": 224090 }, { "epoch": 1.13, "learning_rate": 0.00013040799955602866, "loss": 0.0082, "step": 224100 }, { "epoch": 1.13, "learning_rate": 0.00013040043186301464, "loss": 0.0101, "step": 224110 }, { "epoch": 1.13, "learning_rate": 0.00013039286417000065, "loss": 0.0106, "step": 224120 }, { "epoch": 1.13, "learning_rate": 0.00013038529647698663, "loss": 0.0105, "step": 224130 }, { "epoch": 1.13, "learning_rate": 0.0001303777287839726, "loss": 0.0115, "step": 224140 }, { "epoch": 1.13, "learning_rate": 0.00013037016109095862, "loss": 0.013, "step": 224150 }, { "epoch": 1.13, "learning_rate": 0.0001303625933979446, "loss": 0.0121, "step": 224160 }, { "epoch": 1.13, "learning_rate": 0.00013035502570493058, "loss": 0.0091, "step": 224170 }, { "epoch": 1.13, "learning_rate": 0.00013034745801191656, "loss": 0.008, "step": 224180 }, { "epoch": 1.13, "learning_rate": 0.00013033989031890257, "loss": 0.0067, "step": 224190 }, { "epoch": 1.13, "learning_rate": 0.00013033232262588855, "loss": 0.0079, "step": 224200 }, { "epoch": 1.13, "learning_rate": 0.00013032475493287454, "loss": 0.0096, "step": 224210 }, { "epoch": 1.13, "learning_rate": 0.00013031718723986054, "loss": 0.0095, "step": 224220 }, { "epoch": 1.13, "learning_rate": 0.00013030961954684653, "loss": 0.0086, "step": 224230 }, { "epoch": 1.13, "learning_rate": 0.0001303020518538325, "loss": 0.009, "step": 224240 }, { "epoch": 1.13, "learning_rate": 0.00013029448416081852, "loss": 0.0074, "step": 224250 }, { "epoch": 1.13, "learning_rate": 0.0001302869164678045, "loss": 0.0104, "step": 224260 }, { "epoch": 1.13, "learning_rate": 0.00013027934877479048, "loss": 0.0072, "step": 224270 }, { "epoch": 1.13, "learning_rate": 0.0001302717810817765, "loss": 0.0088, "step": 224280 }, { "epoch": 1.13, "learning_rate": 0.00013026421338876247, "loss": 0.0122, "step": 224290 }, { "epoch": 1.13, "learning_rate": 0.00013025664569574845, "loss": 0.011, "step": 224300 }, { "epoch": 1.13, "learning_rate": 0.00013024907800273446, "loss": 0.0093, "step": 224310 }, { "epoch": 1.13, "learning_rate": 0.00013024151030972044, "loss": 0.0076, "step": 224320 }, { "epoch": 1.13, "learning_rate": 0.00013023394261670642, "loss": 0.0088, "step": 224330 }, { "epoch": 1.13, "learning_rate": 0.00013022637492369243, "loss": 0.009, "step": 224340 }, { "epoch": 1.13, "learning_rate": 0.0001302188072306784, "loss": 0.0111, "step": 224350 }, { "epoch": 1.13, "learning_rate": 0.0001302112395376644, "loss": 0.0088, "step": 224360 }, { "epoch": 1.13, "learning_rate": 0.00013020367184465037, "loss": 0.0117, "step": 224370 }, { "epoch": 1.13, "learning_rate": 0.00013019610415163638, "loss": 0.0087, "step": 224380 }, { "epoch": 1.13, "learning_rate": 0.00013018853645862236, "loss": 0.0086, "step": 224390 }, { "epoch": 1.13, "learning_rate": 0.00013018096876560835, "loss": 0.013, "step": 224400 }, { "epoch": 1.13, "learning_rate": 0.00013017340107259435, "loss": 0.008, "step": 224410 }, { "epoch": 1.13, "learning_rate": 0.00013016583337958034, "loss": 0.0078, "step": 224420 }, { "epoch": 1.13, "learning_rate": 0.00013015826568656632, "loss": 0.0096, "step": 224430 }, { "epoch": 1.13, "learning_rate": 0.00013015069799355233, "loss": 0.0102, "step": 224440 }, { "epoch": 1.13, "learning_rate": 0.0001301431303005383, "loss": 0.0078, "step": 224450 }, { "epoch": 1.13, "learning_rate": 0.0001301355626075243, "loss": 0.0093, "step": 224460 }, { "epoch": 1.13, "learning_rate": 0.0001301279949145103, "loss": 0.0104, "step": 224470 }, { "epoch": 1.13, "learning_rate": 0.00013012042722149628, "loss": 0.01, "step": 224480 }, { "epoch": 1.13, "learning_rate": 0.00013011285952848226, "loss": 0.0085, "step": 224490 }, { "epoch": 1.13, "learning_rate": 0.00013010529183546827, "loss": 0.009, "step": 224500 }, { "epoch": 1.13, "learning_rate": 0.00013009772414245425, "loss": 0.0089, "step": 224510 }, { "epoch": 1.13, "learning_rate": 0.00013009015644944023, "loss": 0.0078, "step": 224520 }, { "epoch": 1.13, "learning_rate": 0.0001300825887564262, "loss": 0.0086, "step": 224530 }, { "epoch": 1.13, "learning_rate": 0.00013007502106341222, "loss": 0.0079, "step": 224540 }, { "epoch": 1.13, "learning_rate": 0.0001300674533703982, "loss": 0.0083, "step": 224550 }, { "epoch": 1.13, "learning_rate": 0.00013005988567738418, "loss": 0.0106, "step": 224560 }, { "epoch": 1.13, "learning_rate": 0.0001300523179843702, "loss": 0.0106, "step": 224570 }, { "epoch": 1.13, "learning_rate": 0.00013004475029135617, "loss": 0.009, "step": 224580 }, { "epoch": 1.13, "learning_rate": 0.00013003718259834216, "loss": 0.0079, "step": 224590 }, { "epoch": 1.13, "learning_rate": 0.00013002961490532816, "loss": 0.0089, "step": 224600 }, { "epoch": 1.13, "learning_rate": 0.00013002204721231415, "loss": 0.0081, "step": 224610 }, { "epoch": 1.13, "learning_rate": 0.00013001447951930013, "loss": 0.0082, "step": 224620 }, { "epoch": 1.13, "learning_rate": 0.00013000691182628614, "loss": 0.0067, "step": 224630 }, { "epoch": 1.13, "learning_rate": 0.00012999934413327212, "loss": 0.0099, "step": 224640 }, { "epoch": 1.13, "learning_rate": 0.0001299917764402581, "loss": 0.0121, "step": 224650 }, { "epoch": 1.13, "learning_rate": 0.0001299842087472441, "loss": 0.0113, "step": 224660 }, { "epoch": 1.13, "learning_rate": 0.00012997664105423006, "loss": 0.0089, "step": 224670 }, { "epoch": 1.13, "learning_rate": 0.00012996907336121607, "loss": 0.009, "step": 224680 }, { "epoch": 1.13, "learning_rate": 0.00012996150566820205, "loss": 0.0098, "step": 224690 }, { "epoch": 1.13, "learning_rate": 0.00012995393797518803, "loss": 0.0091, "step": 224700 }, { "epoch": 1.13, "learning_rate": 0.00012994637028217404, "loss": 0.0101, "step": 224710 }, { "epoch": 1.13, "learning_rate": 0.00012993880258916002, "loss": 0.0115, "step": 224720 }, { "epoch": 1.13, "learning_rate": 0.000129931234896146, "loss": 0.0072, "step": 224730 }, { "epoch": 1.13, "learning_rate": 0.00012992366720313199, "loss": 0.0087, "step": 224740 }, { "epoch": 1.13, "learning_rate": 0.000129916099510118, "loss": 0.0091, "step": 224750 }, { "epoch": 1.13, "learning_rate": 0.00012990853181710398, "loss": 0.0079, "step": 224760 }, { "epoch": 1.13, "learning_rate": 0.00012990096412408996, "loss": 0.0114, "step": 224770 }, { "epoch": 1.13, "learning_rate": 0.00012989339643107597, "loss": 0.0084, "step": 224780 }, { "epoch": 1.13, "learning_rate": 0.00012988582873806195, "loss": 0.007, "step": 224790 }, { "epoch": 1.13, "learning_rate": 0.00012987826104504793, "loss": 0.008, "step": 224800 }, { "epoch": 1.13, "learning_rate": 0.00012987069335203394, "loss": 0.0068, "step": 224810 }, { "epoch": 1.13, "learning_rate": 0.00012986312565901992, "loss": 0.0076, "step": 224820 }, { "epoch": 1.13, "learning_rate": 0.0001298555579660059, "loss": 0.009, "step": 224830 }, { "epoch": 1.13, "learning_rate": 0.0001298479902729919, "loss": 0.0108, "step": 224840 }, { "epoch": 1.13, "learning_rate": 0.0001298404225799779, "loss": 0.0086, "step": 224850 }, { "epoch": 1.13, "learning_rate": 0.00012983285488696387, "loss": 0.0129, "step": 224860 }, { "epoch": 1.13, "learning_rate": 0.00012982528719394988, "loss": 0.0081, "step": 224870 }, { "epoch": 1.13, "learning_rate": 0.00012981771950093586, "loss": 0.009, "step": 224880 }, { "epoch": 1.13, "learning_rate": 0.00012981015180792184, "loss": 0.0093, "step": 224890 }, { "epoch": 1.13, "learning_rate": 0.00012980258411490782, "loss": 0.0103, "step": 224900 }, { "epoch": 1.13, "learning_rate": 0.00012979501642189383, "loss": 0.0129, "step": 224910 }, { "epoch": 1.13, "learning_rate": 0.00012978744872887981, "loss": 0.0069, "step": 224920 }, { "epoch": 1.13, "learning_rate": 0.0001297798810358658, "loss": 0.0105, "step": 224930 }, { "epoch": 1.13, "learning_rate": 0.0001297723133428518, "loss": 0.008, "step": 224940 }, { "epoch": 1.13, "learning_rate": 0.00012976474564983779, "loss": 0.0154, "step": 224950 }, { "epoch": 1.13, "learning_rate": 0.00012975717795682377, "loss": 0.0076, "step": 224960 }, { "epoch": 1.13, "learning_rate": 0.00012974961026380978, "loss": 0.0084, "step": 224970 }, { "epoch": 1.14, "learning_rate": 0.00012974204257079576, "loss": 0.011, "step": 224980 }, { "epoch": 1.14, "learning_rate": 0.00012973447487778174, "loss": 0.0082, "step": 224990 }, { "epoch": 1.14, "learning_rate": 0.00012972690718476775, "loss": 0.0074, "step": 225000 }, { "epoch": 1.14, "eval_cer": 0.9144644335264098, "eval_loss": 0.007108866702765226, "eval_runtime": 116.0265, "eval_samples_per_second": 17.237, "eval_steps_per_second": 4.309, "step": 225000 }, { "epoch": 1.14, "learning_rate": 0.00012971933949175373, "loss": 0.0077, "step": 225010 }, { "epoch": 1.14, "learning_rate": 0.0001297117717987397, "loss": 0.009, "step": 225020 }, { "epoch": 1.14, "learning_rate": 0.00012970420410572572, "loss": 0.0086, "step": 225030 }, { "epoch": 1.14, "learning_rate": 0.0001296966364127117, "loss": 0.0085, "step": 225040 }, { "epoch": 1.14, "learning_rate": 0.00012968906871969768, "loss": 0.0083, "step": 225050 }, { "epoch": 1.14, "learning_rate": 0.00012968150102668366, "loss": 0.0086, "step": 225060 }, { "epoch": 1.14, "learning_rate": 0.00012967393333366967, "loss": 0.0077, "step": 225070 }, { "epoch": 1.14, "learning_rate": 0.00012966636564065565, "loss": 0.0087, "step": 225080 }, { "epoch": 1.14, "learning_rate": 0.00012965879794764163, "loss": 0.0076, "step": 225090 }, { "epoch": 1.14, "learning_rate": 0.00012965123025462764, "loss": 0.0082, "step": 225100 }, { "epoch": 1.14, "learning_rate": 0.00012964366256161362, "loss": 0.0099, "step": 225110 }, { "epoch": 1.14, "learning_rate": 0.0001296360948685996, "loss": 0.0135, "step": 225120 }, { "epoch": 1.14, "learning_rate": 0.00012962852717558561, "loss": 0.012, "step": 225130 }, { "epoch": 1.14, "learning_rate": 0.0001296209594825716, "loss": 0.0091, "step": 225140 }, { "epoch": 1.14, "learning_rate": 0.00012961339178955758, "loss": 0.0111, "step": 225150 }, { "epoch": 1.14, "learning_rate": 0.00012960582409654359, "loss": 0.0098, "step": 225160 }, { "epoch": 1.14, "learning_rate": 0.00012959825640352957, "loss": 0.0105, "step": 225170 }, { "epoch": 1.14, "learning_rate": 0.00012959068871051555, "loss": 0.0087, "step": 225180 }, { "epoch": 1.14, "learning_rate": 0.00012958312101750156, "loss": 0.0121, "step": 225190 }, { "epoch": 1.14, "learning_rate": 0.00012957555332448754, "loss": 0.0088, "step": 225200 }, { "epoch": 1.14, "learning_rate": 0.00012956798563147352, "loss": 0.0115, "step": 225210 }, { "epoch": 1.14, "learning_rate": 0.0001295604179384595, "loss": 0.0086, "step": 225220 }, { "epoch": 1.14, "learning_rate": 0.0001295528502454455, "loss": 0.0118, "step": 225230 }, { "epoch": 1.14, "learning_rate": 0.0001295452825524315, "loss": 0.0105, "step": 225240 }, { "epoch": 1.14, "learning_rate": 0.00012953771485941747, "loss": 0.0082, "step": 225250 }, { "epoch": 1.14, "learning_rate": 0.00012953014716640348, "loss": 0.008, "step": 225260 }, { "epoch": 1.14, "learning_rate": 0.00012952257947338946, "loss": 0.0093, "step": 225270 }, { "epoch": 1.14, "learning_rate": 0.00012951501178037544, "loss": 0.0091, "step": 225280 }, { "epoch": 1.14, "learning_rate": 0.00012950744408736145, "loss": 0.0122, "step": 225290 }, { "epoch": 1.14, "learning_rate": 0.0001294998763943474, "loss": 0.01, "step": 225300 }, { "epoch": 1.14, "learning_rate": 0.00012949230870133342, "loss": 0.0081, "step": 225310 }, { "epoch": 1.14, "learning_rate": 0.0001294847410083194, "loss": 0.0091, "step": 225320 }, { "epoch": 1.14, "learning_rate": 0.00012947717331530538, "loss": 0.0101, "step": 225330 }, { "epoch": 1.14, "learning_rate": 0.0001294696056222914, "loss": 0.0096, "step": 225340 }, { "epoch": 1.14, "learning_rate": 0.00012946203792927737, "loss": 0.0116, "step": 225350 }, { "epoch": 1.14, "learning_rate": 0.00012945447023626335, "loss": 0.0079, "step": 225360 }, { "epoch": 1.14, "learning_rate": 0.00012944690254324936, "loss": 0.0092, "step": 225370 }, { "epoch": 1.14, "learning_rate": 0.00012943933485023534, "loss": 0.0092, "step": 225380 }, { "epoch": 1.14, "learning_rate": 0.00012943176715722132, "loss": 0.0096, "step": 225390 }, { "epoch": 1.14, "learning_rate": 0.00012942419946420733, "loss": 0.0118, "step": 225400 }, { "epoch": 1.14, "learning_rate": 0.0001294166317711933, "loss": 0.0089, "step": 225410 }, { "epoch": 1.14, "learning_rate": 0.0001294090640781793, "loss": 0.0092, "step": 225420 }, { "epoch": 1.14, "learning_rate": 0.00012940149638516527, "loss": 0.009, "step": 225430 }, { "epoch": 1.14, "learning_rate": 0.00012939392869215128, "loss": 0.0094, "step": 225440 }, { "epoch": 1.14, "learning_rate": 0.00012938636099913726, "loss": 0.0091, "step": 225450 }, { "epoch": 1.14, "learning_rate": 0.00012937879330612325, "loss": 0.0091, "step": 225460 }, { "epoch": 1.14, "learning_rate": 0.00012937122561310925, "loss": 0.0101, "step": 225470 }, { "epoch": 1.14, "learning_rate": 0.00012936365792009524, "loss": 0.0081, "step": 225480 }, { "epoch": 1.14, "learning_rate": 0.00012935609022708122, "loss": 0.0083, "step": 225490 }, { "epoch": 1.14, "learning_rate": 0.00012934852253406723, "loss": 0.0105, "step": 225500 }, { "epoch": 1.14, "learning_rate": 0.0001293409548410532, "loss": 0.0084, "step": 225510 }, { "epoch": 1.14, "learning_rate": 0.0001293333871480392, "loss": 0.0075, "step": 225520 }, { "epoch": 1.14, "learning_rate": 0.0001293258194550252, "loss": 0.0081, "step": 225530 }, { "epoch": 1.14, "learning_rate": 0.00012931825176201118, "loss": 0.0094, "step": 225540 }, { "epoch": 1.14, "learning_rate": 0.00012931068406899716, "loss": 0.0112, "step": 225550 }, { "epoch": 1.14, "learning_rate": 0.00012930311637598317, "loss": 0.0153, "step": 225560 }, { "epoch": 1.14, "learning_rate": 0.00012929554868296915, "loss": 0.0082, "step": 225570 }, { "epoch": 1.14, "learning_rate": 0.00012928798098995513, "loss": 0.0086, "step": 225580 }, { "epoch": 1.14, "learning_rate": 0.0001292804132969411, "loss": 0.0088, "step": 225590 }, { "epoch": 1.14, "learning_rate": 0.00012927284560392712, "loss": 0.0086, "step": 225600 }, { "epoch": 1.14, "learning_rate": 0.0001292652779109131, "loss": 0.0094, "step": 225610 }, { "epoch": 1.14, "learning_rate": 0.00012925771021789908, "loss": 0.0094, "step": 225620 }, { "epoch": 1.14, "learning_rate": 0.0001292501425248851, "loss": 0.0077, "step": 225630 }, { "epoch": 1.14, "learning_rate": 0.00012924257483187107, "loss": 0.0112, "step": 225640 }, { "epoch": 1.14, "learning_rate": 0.00012923500713885706, "loss": 0.0068, "step": 225650 }, { "epoch": 1.14, "learning_rate": 0.00012922743944584306, "loss": 0.0075, "step": 225660 }, { "epoch": 1.14, "learning_rate": 0.00012921987175282905, "loss": 0.0083, "step": 225670 }, { "epoch": 1.14, "learning_rate": 0.00012921230405981503, "loss": 0.011, "step": 225680 }, { "epoch": 1.14, "learning_rate": 0.00012920473636680104, "loss": 0.0087, "step": 225690 }, { "epoch": 1.14, "learning_rate": 0.00012919716867378702, "loss": 0.01, "step": 225700 }, { "epoch": 1.14, "learning_rate": 0.000129189600980773, "loss": 0.0077, "step": 225710 }, { "epoch": 1.14, "learning_rate": 0.000129182033287759, "loss": 0.0101, "step": 225720 }, { "epoch": 1.14, "learning_rate": 0.000129174465594745, "loss": 0.0098, "step": 225730 }, { "epoch": 1.14, "learning_rate": 0.00012916689790173097, "loss": 0.0105, "step": 225740 }, { "epoch": 1.14, "learning_rate": 0.00012915933020871698, "loss": 0.0081, "step": 225750 }, { "epoch": 1.14, "learning_rate": 0.00012915176251570296, "loss": 0.0075, "step": 225760 }, { "epoch": 1.14, "learning_rate": 0.00012914419482268894, "loss": 0.0094, "step": 225770 }, { "epoch": 1.14, "learning_rate": 0.00012913662712967492, "loss": 0.0095, "step": 225780 }, { "epoch": 1.14, "learning_rate": 0.00012912905943666093, "loss": 0.0097, "step": 225790 }, { "epoch": 1.14, "learning_rate": 0.0001291214917436469, "loss": 0.0092, "step": 225800 }, { "epoch": 1.14, "learning_rate": 0.0001291139240506329, "loss": 0.0091, "step": 225810 }, { "epoch": 1.14, "learning_rate": 0.0001291063563576189, "loss": 0.0093, "step": 225820 }, { "epoch": 1.14, "learning_rate": 0.00012909878866460488, "loss": 0.0086, "step": 225830 }, { "epoch": 1.14, "learning_rate": 0.00012909122097159087, "loss": 0.0094, "step": 225840 }, { "epoch": 1.14, "learning_rate": 0.00012908365327857687, "loss": 0.0072, "step": 225850 }, { "epoch": 1.14, "learning_rate": 0.00012907608558556286, "loss": 0.0085, "step": 225860 }, { "epoch": 1.14, "learning_rate": 0.00012906851789254884, "loss": 0.0095, "step": 225870 }, { "epoch": 1.14, "learning_rate": 0.00012906095019953485, "loss": 0.0098, "step": 225880 }, { "epoch": 1.14, "learning_rate": 0.00012905338250652083, "loss": 0.0067, "step": 225890 }, { "epoch": 1.14, "learning_rate": 0.0001290458148135068, "loss": 0.0075, "step": 225900 }, { "epoch": 1.14, "learning_rate": 0.00012903824712049282, "loss": 0.0074, "step": 225910 }, { "epoch": 1.14, "learning_rate": 0.0001290306794274788, "loss": 0.0108, "step": 225920 }, { "epoch": 1.14, "learning_rate": 0.00012902311173446478, "loss": 0.008, "step": 225930 }, { "epoch": 1.14, "learning_rate": 0.00012901554404145076, "loss": 0.0089, "step": 225940 }, { "epoch": 1.14, "learning_rate": 0.00012900797634843674, "loss": 0.0117, "step": 225950 }, { "epoch": 1.14, "learning_rate": 0.00012900040865542272, "loss": 0.0077, "step": 225960 }, { "epoch": 1.14, "learning_rate": 0.00012899284096240873, "loss": 0.0078, "step": 225970 }, { "epoch": 1.14, "learning_rate": 0.00012898527326939471, "loss": 0.0114, "step": 225980 }, { "epoch": 1.14, "learning_rate": 0.0001289777055763807, "loss": 0.0074, "step": 225990 }, { "epoch": 1.14, "learning_rate": 0.0001289701378833667, "loss": 0.0092, "step": 226000 }, { "epoch": 1.14, "eval_cer": 0.9144498775845288, "eval_loss": 0.007178218103945255, "eval_runtime": 116.0384, "eval_samples_per_second": 17.236, "eval_steps_per_second": 4.309, "step": 226000 }, { "epoch": 1.14, "learning_rate": 0.00012896257019035269, "loss": 0.006, "step": 226010 }, { "epoch": 1.14, "learning_rate": 0.00012895500249733867, "loss": 0.0088, "step": 226020 }, { "epoch": 1.14, "learning_rate": 0.00012894743480432468, "loss": 0.0089, "step": 226030 }, { "epoch": 1.14, "learning_rate": 0.00012893986711131066, "loss": 0.0095, "step": 226040 }, { "epoch": 1.14, "learning_rate": 0.00012893229941829664, "loss": 0.0088, "step": 226050 }, { "epoch": 1.14, "learning_rate": 0.00012892473172528265, "loss": 0.0087, "step": 226060 }, { "epoch": 1.14, "learning_rate": 0.00012891716403226863, "loss": 0.0116, "step": 226070 }, { "epoch": 1.14, "learning_rate": 0.0001289095963392546, "loss": 0.0094, "step": 226080 }, { "epoch": 1.14, "learning_rate": 0.00012890202864624062, "loss": 0.0082, "step": 226090 }, { "epoch": 1.14, "learning_rate": 0.0001288944609532266, "loss": 0.0103, "step": 226100 }, { "epoch": 1.14, "learning_rate": 0.00012888689326021258, "loss": 0.0094, "step": 226110 }, { "epoch": 1.14, "learning_rate": 0.00012887932556719856, "loss": 0.0097, "step": 226120 }, { "epoch": 1.14, "learning_rate": 0.00012887175787418457, "loss": 0.0091, "step": 226130 }, { "epoch": 1.14, "learning_rate": 0.00012886419018117055, "loss": 0.0082, "step": 226140 }, { "epoch": 1.14, "learning_rate": 0.00012885662248815654, "loss": 0.011, "step": 226150 }, { "epoch": 1.14, "learning_rate": 0.00012884905479514254, "loss": 0.0077, "step": 226160 }, { "epoch": 1.14, "learning_rate": 0.00012884148710212853, "loss": 0.0134, "step": 226170 }, { "epoch": 1.14, "learning_rate": 0.0001288339194091145, "loss": 0.007, "step": 226180 }, { "epoch": 1.14, "learning_rate": 0.00012882635171610052, "loss": 0.0082, "step": 226190 }, { "epoch": 1.14, "learning_rate": 0.0001288187840230865, "loss": 0.0114, "step": 226200 }, { "epoch": 1.14, "learning_rate": 0.00012881121633007248, "loss": 0.009, "step": 226210 }, { "epoch": 1.14, "learning_rate": 0.00012880364863705849, "loss": 0.0069, "step": 226220 }, { "epoch": 1.14, "learning_rate": 0.00012879608094404447, "loss": 0.0091, "step": 226230 }, { "epoch": 1.14, "learning_rate": 0.00012878851325103045, "loss": 0.0078, "step": 226240 }, { "epoch": 1.14, "learning_rate": 0.00012878094555801646, "loss": 0.012, "step": 226250 }, { "epoch": 1.14, "learning_rate": 0.00012877337786500244, "loss": 0.0071, "step": 226260 }, { "epoch": 1.14, "learning_rate": 0.00012876581017198842, "loss": 0.0089, "step": 226270 }, { "epoch": 1.14, "learning_rate": 0.00012875824247897443, "loss": 0.0102, "step": 226280 }, { "epoch": 1.14, "learning_rate": 0.0001287506747859604, "loss": 0.0094, "step": 226290 }, { "epoch": 1.14, "learning_rate": 0.0001287431070929464, "loss": 0.0088, "step": 226300 }, { "epoch": 1.14, "learning_rate": 0.00012873553939993237, "loss": 0.0113, "step": 226310 }, { "epoch": 1.14, "learning_rate": 0.00012872797170691838, "loss": 0.0083, "step": 226320 }, { "epoch": 1.14, "learning_rate": 0.00012872040401390436, "loss": 0.0103, "step": 226330 }, { "epoch": 1.14, "learning_rate": 0.00012871283632089035, "loss": 0.01, "step": 226340 }, { "epoch": 1.14, "learning_rate": 0.00012870526862787635, "loss": 0.0095, "step": 226350 }, { "epoch": 1.14, "learning_rate": 0.00012869770093486234, "loss": 0.0085, "step": 226360 }, { "epoch": 1.14, "learning_rate": 0.00012869013324184832, "loss": 0.0115, "step": 226370 }, { "epoch": 1.14, "learning_rate": 0.00012868256554883433, "loss": 0.0099, "step": 226380 }, { "epoch": 1.14, "learning_rate": 0.0001286749978558203, "loss": 0.0094, "step": 226390 }, { "epoch": 1.14, "learning_rate": 0.0001286674301628063, "loss": 0.0069, "step": 226400 }, { "epoch": 1.14, "learning_rate": 0.0001286598624697923, "loss": 0.0081, "step": 226410 }, { "epoch": 1.14, "learning_rate": 0.00012865229477677828, "loss": 0.0096, "step": 226420 }, { "epoch": 1.14, "learning_rate": 0.00012864472708376426, "loss": 0.0083, "step": 226430 }, { "epoch": 1.14, "learning_rate": 0.00012863715939075027, "loss": 0.0077, "step": 226440 }, { "epoch": 1.14, "learning_rate": 0.00012862959169773625, "loss": 0.0088, "step": 226450 }, { "epoch": 1.14, "learning_rate": 0.00012862202400472223, "loss": 0.0088, "step": 226460 }, { "epoch": 1.14, "learning_rate": 0.0001286144563117082, "loss": 0.0068, "step": 226470 }, { "epoch": 1.14, "learning_rate": 0.00012860688861869422, "loss": 0.0081, "step": 226480 }, { "epoch": 1.14, "learning_rate": 0.0001285993209256802, "loss": 0.0078, "step": 226490 }, { "epoch": 1.14, "learning_rate": 0.00012859175323266618, "loss": 0.0094, "step": 226500 }, { "epoch": 1.14, "learning_rate": 0.0001285841855396522, "loss": 0.0092, "step": 226510 }, { "epoch": 1.14, "learning_rate": 0.00012857661784663817, "loss": 0.0079, "step": 226520 }, { "epoch": 1.14, "learning_rate": 0.00012856905015362416, "loss": 0.008, "step": 226530 }, { "epoch": 1.14, "learning_rate": 0.00012856148246061016, "loss": 0.0087, "step": 226540 }, { "epoch": 1.14, "learning_rate": 0.00012855391476759615, "loss": 0.008, "step": 226550 }, { "epoch": 1.14, "learning_rate": 0.00012854634707458213, "loss": 0.009, "step": 226560 }, { "epoch": 1.14, "learning_rate": 0.0001285387793815681, "loss": 0.0106, "step": 226570 }, { "epoch": 1.14, "learning_rate": 0.0001285312116885541, "loss": 0.0087, "step": 226580 }, { "epoch": 1.14, "learning_rate": 0.0001285236439955401, "loss": 0.0092, "step": 226590 }, { "epoch": 1.14, "learning_rate": 0.00012851607630252608, "loss": 0.0093, "step": 226600 }, { "epoch": 1.14, "learning_rate": 0.00012850850860951206, "loss": 0.0084, "step": 226610 }, { "epoch": 1.14, "learning_rate": 0.00012850094091649807, "loss": 0.0093, "step": 226620 }, { "epoch": 1.14, "learning_rate": 0.00012849337322348405, "loss": 0.0081, "step": 226630 }, { "epoch": 1.14, "learning_rate": 0.00012848580553047003, "loss": 0.0101, "step": 226640 }, { "epoch": 1.14, "learning_rate": 0.00012847823783745601, "loss": 0.0121, "step": 226650 }, { "epoch": 1.14, "learning_rate": 0.00012847067014444202, "loss": 0.0102, "step": 226660 }, { "epoch": 1.14, "learning_rate": 0.000128463102451428, "loss": 0.0096, "step": 226670 }, { "epoch": 1.14, "learning_rate": 0.00012845553475841399, "loss": 0.0103, "step": 226680 }, { "epoch": 1.14, "learning_rate": 0.0001284479670654, "loss": 0.0079, "step": 226690 }, { "epoch": 1.14, "learning_rate": 0.00012844039937238598, "loss": 0.0078, "step": 226700 }, { "epoch": 1.14, "learning_rate": 0.00012843283167937196, "loss": 0.0084, "step": 226710 }, { "epoch": 1.14, "learning_rate": 0.00012842526398635797, "loss": 0.009, "step": 226720 }, { "epoch": 1.14, "learning_rate": 0.00012841769629334395, "loss": 0.0095, "step": 226730 }, { "epoch": 1.14, "learning_rate": 0.00012841012860032993, "loss": 0.0099, "step": 226740 }, { "epoch": 1.14, "learning_rate": 0.00012840256090731594, "loss": 0.0079, "step": 226750 }, { "epoch": 1.14, "learning_rate": 0.00012839499321430192, "loss": 0.0107, "step": 226760 }, { "epoch": 1.14, "learning_rate": 0.0001283874255212879, "loss": 0.0114, "step": 226770 }, { "epoch": 1.14, "learning_rate": 0.0001283798578282739, "loss": 0.0083, "step": 226780 }, { "epoch": 1.14, "learning_rate": 0.0001283722901352599, "loss": 0.0077, "step": 226790 }, { "epoch": 1.14, "learning_rate": 0.00012836472244224587, "loss": 0.0083, "step": 226800 }, { "epoch": 1.14, "learning_rate": 0.00012835715474923188, "loss": 0.0076, "step": 226810 }, { "epoch": 1.14, "learning_rate": 0.00012834958705621786, "loss": 0.01, "step": 226820 }, { "epoch": 1.14, "learning_rate": 0.00012834201936320384, "loss": 0.0064, "step": 226830 }, { "epoch": 1.14, "learning_rate": 0.00012833445167018982, "loss": 0.0086, "step": 226840 }, { "epoch": 1.14, "learning_rate": 0.00012832688397717583, "loss": 0.0109, "step": 226850 }, { "epoch": 1.14, "learning_rate": 0.00012831931628416181, "loss": 0.0107, "step": 226860 }, { "epoch": 1.14, "learning_rate": 0.0001283117485911478, "loss": 0.0101, "step": 226870 }, { "epoch": 1.14, "learning_rate": 0.0001283041808981338, "loss": 0.0068, "step": 226880 }, { "epoch": 1.14, "learning_rate": 0.00012829661320511979, "loss": 0.0079, "step": 226890 }, { "epoch": 1.14, "learning_rate": 0.00012828904551210577, "loss": 0.0086, "step": 226900 }, { "epoch": 1.14, "learning_rate": 0.00012828147781909178, "loss": 0.0079, "step": 226910 }, { "epoch": 1.14, "learning_rate": 0.00012827391012607776, "loss": 0.0089, "step": 226920 }, { "epoch": 1.14, "learning_rate": 0.00012826634243306374, "loss": 0.0103, "step": 226930 }, { "epoch": 1.14, "learning_rate": 0.00012825877474004975, "loss": 0.0083, "step": 226940 }, { "epoch": 1.14, "learning_rate": 0.00012825120704703573, "loss": 0.0097, "step": 226950 }, { "epoch": 1.15, "learning_rate": 0.0001282436393540217, "loss": 0.008, "step": 226960 }, { "epoch": 1.15, "learning_rate": 0.00012823607166100772, "loss": 0.0086, "step": 226970 }, { "epoch": 1.15, "learning_rate": 0.0001282285039679937, "loss": 0.0114, "step": 226980 }, { "epoch": 1.15, "learning_rate": 0.00012822093627497968, "loss": 0.0095, "step": 226990 }, { "epoch": 1.15, "learning_rate": 0.00012821336858196566, "loss": 0.0074, "step": 227000 }, { "epoch": 1.15, "eval_cer": 0.9144663743186606, "eval_loss": 0.006952292751520872, "eval_runtime": 116.2021, "eval_samples_per_second": 17.211, "eval_steps_per_second": 4.303, "step": 227000 }, { "epoch": 1.15, "learning_rate": 0.00012820580088895167, "loss": 0.0068, "step": 227010 }, { "epoch": 1.15, "learning_rate": 0.00012819823319593765, "loss": 0.0086, "step": 227020 }, { "epoch": 1.15, "learning_rate": 0.00012819066550292363, "loss": 0.0077, "step": 227030 }, { "epoch": 1.15, "learning_rate": 0.00012818309780990964, "loss": 0.0083, "step": 227040 }, { "epoch": 1.15, "learning_rate": 0.00012817553011689562, "loss": 0.0087, "step": 227050 }, { "epoch": 1.15, "learning_rate": 0.0001281679624238816, "loss": 0.0063, "step": 227060 }, { "epoch": 1.15, "learning_rate": 0.00012816039473086761, "loss": 0.0083, "step": 227070 }, { "epoch": 1.15, "learning_rate": 0.0001281528270378536, "loss": 0.0101, "step": 227080 }, { "epoch": 1.15, "learning_rate": 0.00012814525934483958, "loss": 0.01, "step": 227090 }, { "epoch": 1.15, "learning_rate": 0.00012813769165182559, "loss": 0.0098, "step": 227100 }, { "epoch": 1.15, "learning_rate": 0.00012813012395881157, "loss": 0.0088, "step": 227110 }, { "epoch": 1.15, "learning_rate": 0.00012812255626579755, "loss": 0.0124, "step": 227120 }, { "epoch": 1.15, "learning_rate": 0.00012811498857278356, "loss": 0.0077, "step": 227130 }, { "epoch": 1.15, "learning_rate": 0.00012810742087976954, "loss": 0.0105, "step": 227140 }, { "epoch": 1.15, "learning_rate": 0.00012809985318675552, "loss": 0.0085, "step": 227150 }, { "epoch": 1.15, "learning_rate": 0.0001280922854937415, "loss": 0.0082, "step": 227160 }, { "epoch": 1.15, "learning_rate": 0.0001280847178007275, "loss": 0.0095, "step": 227170 }, { "epoch": 1.15, "learning_rate": 0.0001280771501077135, "loss": 0.0094, "step": 227180 }, { "epoch": 1.15, "learning_rate": 0.00012806958241469947, "loss": 0.0075, "step": 227190 }, { "epoch": 1.15, "learning_rate": 0.00012806201472168545, "loss": 0.0111, "step": 227200 }, { "epoch": 1.15, "learning_rate": 0.00012805444702867144, "loss": 0.0101, "step": 227210 }, { "epoch": 1.15, "learning_rate": 0.00012804687933565744, "loss": 0.01, "step": 227220 }, { "epoch": 1.15, "learning_rate": 0.00012803931164264343, "loss": 0.0095, "step": 227230 }, { "epoch": 1.15, "learning_rate": 0.0001280317439496294, "loss": 0.0096, "step": 227240 }, { "epoch": 1.15, "learning_rate": 0.00012802417625661542, "loss": 0.0091, "step": 227250 }, { "epoch": 1.15, "learning_rate": 0.0001280166085636014, "loss": 0.0092, "step": 227260 }, { "epoch": 1.15, "learning_rate": 0.00012800904087058738, "loss": 0.0089, "step": 227270 }, { "epoch": 1.15, "learning_rate": 0.0001280014731775734, "loss": 0.0103, "step": 227280 }, { "epoch": 1.15, "learning_rate": 0.00012799390548455937, "loss": 0.0104, "step": 227290 }, { "epoch": 1.15, "learning_rate": 0.00012798633779154535, "loss": 0.0072, "step": 227300 }, { "epoch": 1.15, "learning_rate": 0.00012797877009853136, "loss": 0.0116, "step": 227310 }, { "epoch": 1.15, "learning_rate": 0.00012797120240551734, "loss": 0.0076, "step": 227320 }, { "epoch": 1.15, "learning_rate": 0.00012796363471250332, "loss": 0.0103, "step": 227330 }, { "epoch": 1.15, "learning_rate": 0.00012795606701948933, "loss": 0.0084, "step": 227340 }, { "epoch": 1.15, "learning_rate": 0.0001279484993264753, "loss": 0.0089, "step": 227350 }, { "epoch": 1.15, "learning_rate": 0.0001279409316334613, "loss": 0.0075, "step": 227360 }, { "epoch": 1.15, "learning_rate": 0.00012793336394044727, "loss": 0.0091, "step": 227370 }, { "epoch": 1.15, "learning_rate": 0.00012792579624743328, "loss": 0.0087, "step": 227380 }, { "epoch": 1.15, "learning_rate": 0.00012791822855441926, "loss": 0.0073, "step": 227390 }, { "epoch": 1.15, "learning_rate": 0.00012791066086140525, "loss": 0.007, "step": 227400 }, { "epoch": 1.15, "learning_rate": 0.00012790309316839125, "loss": 0.0067, "step": 227410 }, { "epoch": 1.15, "learning_rate": 0.00012789552547537724, "loss": 0.0072, "step": 227420 }, { "epoch": 1.15, "learning_rate": 0.00012788795778236322, "loss": 0.0095, "step": 227430 }, { "epoch": 1.15, "learning_rate": 0.00012788039008934923, "loss": 0.0097, "step": 227440 }, { "epoch": 1.15, "learning_rate": 0.0001278728223963352, "loss": 0.0094, "step": 227450 }, { "epoch": 1.15, "learning_rate": 0.0001278652547033212, "loss": 0.0094, "step": 227460 }, { "epoch": 1.15, "learning_rate": 0.0001278576870103072, "loss": 0.0078, "step": 227470 }, { "epoch": 1.15, "learning_rate": 0.00012785011931729318, "loss": 0.0113, "step": 227480 }, { "epoch": 1.15, "learning_rate": 0.00012784255162427916, "loss": 0.0086, "step": 227490 }, { "epoch": 1.15, "learning_rate": 0.00012783498393126517, "loss": 0.0073, "step": 227500 }, { "epoch": 1.15, "learning_rate": 0.00012782741623825115, "loss": 0.0085, "step": 227510 }, { "epoch": 1.15, "learning_rate": 0.00012781984854523713, "loss": 0.0104, "step": 227520 }, { "epoch": 1.15, "learning_rate": 0.0001278122808522231, "loss": 0.011, "step": 227530 }, { "epoch": 1.15, "learning_rate": 0.00012780471315920912, "loss": 0.011, "step": 227540 }, { "epoch": 1.15, "learning_rate": 0.0001277971454661951, "loss": 0.008, "step": 227550 }, { "epoch": 1.15, "learning_rate": 0.00012778957777318108, "loss": 0.009, "step": 227560 }, { "epoch": 1.15, "learning_rate": 0.0001277820100801671, "loss": 0.0086, "step": 227570 }, { "epoch": 1.15, "learning_rate": 0.00012777444238715307, "loss": 0.0079, "step": 227580 }, { "epoch": 1.15, "learning_rate": 0.00012776687469413906, "loss": 0.0089, "step": 227590 }, { "epoch": 1.15, "learning_rate": 0.00012775930700112506, "loss": 0.0087, "step": 227600 }, { "epoch": 1.15, "learning_rate": 0.00012775173930811105, "loss": 0.0076, "step": 227610 }, { "epoch": 1.15, "learning_rate": 0.00012774417161509703, "loss": 0.0092, "step": 227620 }, { "epoch": 1.15, "learning_rate": 0.00012773660392208304, "loss": 0.0105, "step": 227630 }, { "epoch": 1.15, "learning_rate": 0.00012772903622906902, "loss": 0.0095, "step": 227640 }, { "epoch": 1.15, "learning_rate": 0.000127721468536055, "loss": 0.011, "step": 227650 }, { "epoch": 1.15, "learning_rate": 0.000127713900843041, "loss": 0.007, "step": 227660 }, { "epoch": 1.15, "learning_rate": 0.000127706333150027, "loss": 0.0082, "step": 227670 }, { "epoch": 1.15, "learning_rate": 0.00012769876545701297, "loss": 0.0079, "step": 227680 }, { "epoch": 1.15, "learning_rate": 0.00012769119776399898, "loss": 0.0091, "step": 227690 }, { "epoch": 1.15, "learning_rate": 0.00012768363007098496, "loss": 0.0096, "step": 227700 }, { "epoch": 1.15, "learning_rate": 0.00012767606237797094, "loss": 0.0094, "step": 227710 }, { "epoch": 1.15, "learning_rate": 0.00012766849468495692, "loss": 0.0096, "step": 227720 }, { "epoch": 1.15, "learning_rate": 0.00012766092699194293, "loss": 0.0127, "step": 227730 }, { "epoch": 1.15, "learning_rate": 0.0001276533592989289, "loss": 0.0061, "step": 227740 }, { "epoch": 1.15, "learning_rate": 0.0001276457916059149, "loss": 0.0086, "step": 227750 }, { "epoch": 1.15, "learning_rate": 0.0001276382239129009, "loss": 0.0079, "step": 227760 }, { "epoch": 1.15, "learning_rate": 0.00012763065621988688, "loss": 0.0089, "step": 227770 }, { "epoch": 1.15, "learning_rate": 0.00012762308852687287, "loss": 0.0094, "step": 227780 }, { "epoch": 1.15, "learning_rate": 0.00012761552083385887, "loss": 0.0085, "step": 227790 }, { "epoch": 1.15, "learning_rate": 0.00012760795314084486, "loss": 0.0083, "step": 227800 }, { "epoch": 1.15, "learning_rate": 0.00012760038544783084, "loss": 0.009, "step": 227810 }, { "epoch": 1.15, "learning_rate": 0.00012759281775481682, "loss": 0.0076, "step": 227820 }, { "epoch": 1.15, "learning_rate": 0.0001275852500618028, "loss": 0.0082, "step": 227830 }, { "epoch": 1.15, "learning_rate": 0.0001275776823687888, "loss": 0.0093, "step": 227840 }, { "epoch": 1.15, "learning_rate": 0.0001275701146757748, "loss": 0.0074, "step": 227850 }, { "epoch": 1.15, "learning_rate": 0.00012756254698276077, "loss": 0.0084, "step": 227860 }, { "epoch": 1.15, "learning_rate": 0.00012755497928974678, "loss": 0.0079, "step": 227870 }, { "epoch": 1.15, "learning_rate": 0.00012754741159673276, "loss": 0.012, "step": 227880 }, { "epoch": 1.15, "learning_rate": 0.00012753984390371874, "loss": 0.0094, "step": 227890 }, { "epoch": 1.15, "learning_rate": 0.00012753227621070472, "loss": 0.011, "step": 227900 }, { "epoch": 1.15, "learning_rate": 0.00012752470851769073, "loss": 0.0079, "step": 227910 }, { "epoch": 1.15, "learning_rate": 0.00012751714082467671, "loss": 0.0091, "step": 227920 }, { "epoch": 1.15, "learning_rate": 0.0001275095731316627, "loss": 0.0087, "step": 227930 }, { "epoch": 1.15, "learning_rate": 0.0001275020054386487, "loss": 0.0082, "step": 227940 }, { "epoch": 1.15, "learning_rate": 0.00012749443774563469, "loss": 0.011, "step": 227950 }, { "epoch": 1.15, "learning_rate": 0.00012748687005262067, "loss": 0.009, "step": 227960 }, { "epoch": 1.15, "learning_rate": 0.00012747930235960668, "loss": 0.0077, "step": 227970 }, { "epoch": 1.15, "learning_rate": 0.00012747173466659266, "loss": 0.0086, "step": 227980 }, { "epoch": 1.15, "learning_rate": 0.00012746416697357864, "loss": 0.0083, "step": 227990 }, { "epoch": 1.15, "learning_rate": 0.00012745659928056465, "loss": 0.01, "step": 228000 }, { "epoch": 1.15, "eval_cer": 0.9144615223380336, "eval_loss": 0.006729237735271454, "eval_runtime": 116.2506, "eval_samples_per_second": 17.204, "eval_steps_per_second": 4.301, "step": 228000 }, { "epoch": 1.15, "learning_rate": 0.00012744903158755063, "loss": 0.0105, "step": 228010 }, { "epoch": 1.15, "learning_rate": 0.0001274414638945366, "loss": 0.0093, "step": 228020 }, { "epoch": 1.15, "learning_rate": 0.00012743389620152262, "loss": 0.0093, "step": 228030 }, { "epoch": 1.15, "learning_rate": 0.0001274263285085086, "loss": 0.0105, "step": 228040 }, { "epoch": 1.15, "learning_rate": 0.00012741876081549458, "loss": 0.0092, "step": 228050 }, { "epoch": 1.15, "learning_rate": 0.00012741119312248056, "loss": 0.0112, "step": 228060 }, { "epoch": 1.15, "learning_rate": 0.00012740362542946657, "loss": 0.0099, "step": 228070 }, { "epoch": 1.15, "learning_rate": 0.00012739605773645255, "loss": 0.0103, "step": 228080 }, { "epoch": 1.15, "learning_rate": 0.00012738849004343853, "loss": 0.0118, "step": 228090 }, { "epoch": 1.15, "learning_rate": 0.00012738092235042454, "loss": 0.0098, "step": 228100 }, { "epoch": 1.15, "learning_rate": 0.00012737335465741052, "loss": 0.0103, "step": 228110 }, { "epoch": 1.15, "learning_rate": 0.0001273657869643965, "loss": 0.0094, "step": 228120 }, { "epoch": 1.15, "learning_rate": 0.00012735821927138251, "loss": 0.0074, "step": 228130 }, { "epoch": 1.15, "learning_rate": 0.0001273506515783685, "loss": 0.0091, "step": 228140 }, { "epoch": 1.15, "learning_rate": 0.00012734308388535448, "loss": 0.0078, "step": 228150 }, { "epoch": 1.15, "learning_rate": 0.00012733551619234049, "loss": 0.0086, "step": 228160 }, { "epoch": 1.15, "learning_rate": 0.00012732794849932647, "loss": 0.0077, "step": 228170 }, { "epoch": 1.15, "learning_rate": 0.00012732038080631245, "loss": 0.0083, "step": 228180 }, { "epoch": 1.15, "learning_rate": 0.00012731281311329846, "loss": 0.0091, "step": 228190 }, { "epoch": 1.15, "learning_rate": 0.00012730524542028444, "loss": 0.0107, "step": 228200 }, { "epoch": 1.15, "learning_rate": 0.00012729767772727042, "loss": 0.0082, "step": 228210 }, { "epoch": 1.15, "learning_rate": 0.00012729011003425643, "loss": 0.0076, "step": 228220 }, { "epoch": 1.15, "learning_rate": 0.0001272825423412424, "loss": 0.0093, "step": 228230 }, { "epoch": 1.15, "learning_rate": 0.0001272749746482284, "loss": 0.0085, "step": 228240 }, { "epoch": 1.15, "learning_rate": 0.00012726740695521437, "loss": 0.0081, "step": 228250 }, { "epoch": 1.15, "learning_rate": 0.00012725983926220038, "loss": 0.0083, "step": 228260 }, { "epoch": 1.15, "learning_rate": 0.00012725227156918636, "loss": 0.0116, "step": 228270 }, { "epoch": 1.15, "learning_rate": 0.00012724470387617234, "loss": 0.011, "step": 228280 }, { "epoch": 1.15, "learning_rate": 0.00012723713618315835, "loss": 0.0086, "step": 228290 }, { "epoch": 1.15, "learning_rate": 0.00012722956849014433, "loss": 0.0093, "step": 228300 }, { "epoch": 1.15, "learning_rate": 0.00012722200079713032, "loss": 0.0098, "step": 228310 }, { "epoch": 1.15, "learning_rate": 0.00012721443310411632, "loss": 0.0075, "step": 228320 }, { "epoch": 1.15, "learning_rate": 0.0001272068654111023, "loss": 0.0087, "step": 228330 }, { "epoch": 1.15, "learning_rate": 0.0001271992977180883, "loss": 0.009, "step": 228340 }, { "epoch": 1.15, "learning_rate": 0.0001271917300250743, "loss": 0.0091, "step": 228350 }, { "epoch": 1.15, "learning_rate": 0.00012718416233206028, "loss": 0.0102, "step": 228360 }, { "epoch": 1.15, "learning_rate": 0.00012717659463904626, "loss": 0.0104, "step": 228370 }, { "epoch": 1.15, "learning_rate": 0.00012716902694603227, "loss": 0.0101, "step": 228380 }, { "epoch": 1.15, "learning_rate": 0.00012716145925301825, "loss": 0.0098, "step": 228390 }, { "epoch": 1.15, "learning_rate": 0.00012715389156000423, "loss": 0.0093, "step": 228400 }, { "epoch": 1.15, "learning_rate": 0.0001271463238669902, "loss": 0.0094, "step": 228410 }, { "epoch": 1.15, "learning_rate": 0.00012713875617397622, "loss": 0.0075, "step": 228420 }, { "epoch": 1.15, "learning_rate": 0.0001271311884809622, "loss": 0.0095, "step": 228430 }, { "epoch": 1.15, "learning_rate": 0.00012712362078794818, "loss": 0.0075, "step": 228440 }, { "epoch": 1.15, "learning_rate": 0.00012711605309493416, "loss": 0.0139, "step": 228450 }, { "epoch": 1.15, "learning_rate": 0.00012710848540192015, "loss": 0.0092, "step": 228460 }, { "epoch": 1.15, "learning_rate": 0.00012710091770890615, "loss": 0.0095, "step": 228470 }, { "epoch": 1.15, "learning_rate": 0.00012709335001589214, "loss": 0.0104, "step": 228480 }, { "epoch": 1.15, "learning_rate": 0.00012708578232287812, "loss": 0.0096, "step": 228490 }, { "epoch": 1.15, "learning_rate": 0.00012707821462986413, "loss": 0.008, "step": 228500 }, { "epoch": 1.15, "learning_rate": 0.0001270706469368501, "loss": 0.0101, "step": 228510 }, { "epoch": 1.15, "learning_rate": 0.0001270630792438361, "loss": 0.0122, "step": 228520 }, { "epoch": 1.15, "learning_rate": 0.0001270555115508221, "loss": 0.0087, "step": 228530 }, { "epoch": 1.15, "learning_rate": 0.00012704794385780808, "loss": 0.012, "step": 228540 }, { "epoch": 1.15, "learning_rate": 0.00012704037616479406, "loss": 0.0111, "step": 228550 }, { "epoch": 1.15, "learning_rate": 0.00012703280847178007, "loss": 0.0089, "step": 228560 }, { "epoch": 1.15, "learning_rate": 0.00012702524077876605, "loss": 0.0123, "step": 228570 }, { "epoch": 1.15, "learning_rate": 0.00012701767308575203, "loss": 0.0096, "step": 228580 }, { "epoch": 1.15, "learning_rate": 0.000127010105392738, "loss": 0.0085, "step": 228590 }, { "epoch": 1.15, "learning_rate": 0.00012700253769972402, "loss": 0.0111, "step": 228600 }, { "epoch": 1.15, "learning_rate": 0.00012699497000671, "loss": 0.0111, "step": 228610 }, { "epoch": 1.15, "learning_rate": 0.00012698740231369598, "loss": 0.0104, "step": 228620 }, { "epoch": 1.15, "learning_rate": 0.000126979834620682, "loss": 0.0139, "step": 228630 }, { "epoch": 1.15, "learning_rate": 0.00012697226692766797, "loss": 0.0102, "step": 228640 }, { "epoch": 1.15, "learning_rate": 0.00012696469923465396, "loss": 0.0087, "step": 228650 }, { "epoch": 1.15, "learning_rate": 0.00012695713154163996, "loss": 0.0096, "step": 228660 }, { "epoch": 1.15, "learning_rate": 0.00012694956384862595, "loss": 0.0107, "step": 228670 }, { "epoch": 1.15, "learning_rate": 0.00012694199615561193, "loss": 0.0118, "step": 228680 }, { "epoch": 1.15, "learning_rate": 0.00012693442846259794, "loss": 0.0087, "step": 228690 }, { "epoch": 1.15, "learning_rate": 0.00012692686076958392, "loss": 0.0079, "step": 228700 }, { "epoch": 1.15, "learning_rate": 0.0001269192930765699, "loss": 0.0089, "step": 228710 }, { "epoch": 1.15, "learning_rate": 0.0001269117253835559, "loss": 0.0096, "step": 228720 }, { "epoch": 1.15, "learning_rate": 0.0001269041576905419, "loss": 0.0091, "step": 228730 }, { "epoch": 1.15, "learning_rate": 0.00012689658999752787, "loss": 0.0082, "step": 228740 }, { "epoch": 1.15, "learning_rate": 0.00012688902230451388, "loss": 0.0101, "step": 228750 }, { "epoch": 1.15, "learning_rate": 0.00012688145461149986, "loss": 0.0091, "step": 228760 }, { "epoch": 1.15, "learning_rate": 0.00012687388691848584, "loss": 0.0097, "step": 228770 }, { "epoch": 1.15, "learning_rate": 0.00012686631922547182, "loss": 0.0088, "step": 228780 }, { "epoch": 1.15, "learning_rate": 0.00012685875153245783, "loss": 0.0108, "step": 228790 }, { "epoch": 1.15, "learning_rate": 0.0001268511838394438, "loss": 0.0119, "step": 228800 }, { "epoch": 1.15, "learning_rate": 0.0001268436161464298, "loss": 0.0088, "step": 228810 }, { "epoch": 1.15, "learning_rate": 0.0001268360484534158, "loss": 0.0076, "step": 228820 }, { "epoch": 1.15, "learning_rate": 0.00012682848076040178, "loss": 0.0075, "step": 228830 }, { "epoch": 1.15, "learning_rate": 0.00012682091306738777, "loss": 0.0106, "step": 228840 }, { "epoch": 1.15, "learning_rate": 0.00012681334537437377, "loss": 0.0087, "step": 228850 }, { "epoch": 1.15, "learning_rate": 0.00012680577768135976, "loss": 0.0092, "step": 228860 }, { "epoch": 1.15, "learning_rate": 0.00012679820998834574, "loss": 0.0083, "step": 228870 }, { "epoch": 1.15, "learning_rate": 0.00012679064229533175, "loss": 0.0073, "step": 228880 }, { "epoch": 1.15, "learning_rate": 0.00012678307460231773, "loss": 0.0096, "step": 228890 }, { "epoch": 1.15, "learning_rate": 0.0001267755069093037, "loss": 0.009, "step": 228900 }, { "epoch": 1.15, "learning_rate": 0.00012676793921628972, "loss": 0.0089, "step": 228910 }, { "epoch": 1.15, "learning_rate": 0.0001267603715232757, "loss": 0.0073, "step": 228920 }, { "epoch": 1.15, "learning_rate": 0.00012675280383026168, "loss": 0.0102, "step": 228930 }, { "epoch": 1.16, "learning_rate": 0.00012674523613724766, "loss": 0.0092, "step": 228940 }, { "epoch": 1.16, "learning_rate": 0.00012673766844423367, "loss": 0.0095, "step": 228950 }, { "epoch": 1.16, "learning_rate": 0.00012673010075121965, "loss": 0.0089, "step": 228960 }, { "epoch": 1.16, "learning_rate": 0.00012672253305820563, "loss": 0.0099, "step": 228970 }, { "epoch": 1.16, "learning_rate": 0.00012671496536519164, "loss": 0.0077, "step": 228980 }, { "epoch": 1.16, "learning_rate": 0.00012670739767217762, "loss": 0.0103, "step": 228990 }, { "epoch": 1.16, "learning_rate": 0.0001266998299791636, "loss": 0.0086, "step": 229000 }, { "epoch": 1.16, "eval_cer": 0.9144634631302844, "eval_loss": 0.006603468209505081, "eval_runtime": 116.4012, "eval_samples_per_second": 17.182, "eval_steps_per_second": 4.295, "step": 229000 }, { "epoch": 1.16, "learning_rate": 0.0001266922622861496, "loss": 0.0089, "step": 229010 }, { "epoch": 1.16, "learning_rate": 0.0001266846945931356, "loss": 0.0089, "step": 229020 }, { "epoch": 1.16, "learning_rate": 0.00012667712690012158, "loss": 0.0081, "step": 229030 }, { "epoch": 1.16, "learning_rate": 0.00012666955920710758, "loss": 0.0099, "step": 229040 }, { "epoch": 1.16, "learning_rate": 0.00012666199151409357, "loss": 0.0112, "step": 229050 }, { "epoch": 1.16, "learning_rate": 0.00012665442382107955, "loss": 0.0097, "step": 229060 }, { "epoch": 1.16, "learning_rate": 0.00012664685612806553, "loss": 0.0077, "step": 229070 }, { "epoch": 1.16, "learning_rate": 0.0001266392884350515, "loss": 0.0085, "step": 229080 }, { "epoch": 1.16, "learning_rate": 0.00012663172074203752, "loss": 0.0088, "step": 229090 }, { "epoch": 1.16, "learning_rate": 0.0001266241530490235, "loss": 0.0101, "step": 229100 }, { "epoch": 1.16, "learning_rate": 0.00012661658535600948, "loss": 0.0067, "step": 229110 }, { "epoch": 1.16, "learning_rate": 0.0001266090176629955, "loss": 0.008, "step": 229120 }, { "epoch": 1.16, "learning_rate": 0.00012660144996998147, "loss": 0.0105, "step": 229130 }, { "epoch": 1.16, "learning_rate": 0.00012659388227696745, "loss": 0.01, "step": 229140 }, { "epoch": 1.16, "learning_rate": 0.00012658631458395343, "loss": 0.0112, "step": 229150 }, { "epoch": 1.16, "learning_rate": 0.00012657874689093944, "loss": 0.0082, "step": 229160 }, { "epoch": 1.16, "learning_rate": 0.00012657117919792542, "loss": 0.0089, "step": 229170 }, { "epoch": 1.16, "learning_rate": 0.0001265636115049114, "loss": 0.0076, "step": 229180 }, { "epoch": 1.16, "learning_rate": 0.00012655604381189741, "loss": 0.0096, "step": 229190 }, { "epoch": 1.16, "learning_rate": 0.0001265484761188834, "loss": 0.0082, "step": 229200 }, { "epoch": 1.16, "learning_rate": 0.00012654090842586938, "loss": 0.0065, "step": 229210 }, { "epoch": 1.16, "learning_rate": 0.00012653334073285539, "loss": 0.008, "step": 229220 }, { "epoch": 1.16, "learning_rate": 0.00012652577303984137, "loss": 0.0093, "step": 229230 }, { "epoch": 1.16, "learning_rate": 0.00012651820534682735, "loss": 0.0096, "step": 229240 }, { "epoch": 1.16, "learning_rate": 0.00012651063765381336, "loss": 0.0096, "step": 229250 }, { "epoch": 1.16, "learning_rate": 0.00012650306996079934, "loss": 0.0091, "step": 229260 }, { "epoch": 1.16, "learning_rate": 0.00012649550226778532, "loss": 0.0103, "step": 229270 }, { "epoch": 1.16, "learning_rate": 0.00012648793457477133, "loss": 0.0085, "step": 229280 }, { "epoch": 1.16, "learning_rate": 0.0001264803668817573, "loss": 0.0099, "step": 229290 }, { "epoch": 1.16, "learning_rate": 0.0001264727991887433, "loss": 0.0084, "step": 229300 }, { "epoch": 1.16, "learning_rate": 0.00012646523149572927, "loss": 0.0087, "step": 229310 }, { "epoch": 1.16, "learning_rate": 0.00012645766380271528, "loss": 0.0095, "step": 229320 }, { "epoch": 1.16, "learning_rate": 0.00012645009610970126, "loss": 0.0078, "step": 229330 }, { "epoch": 1.16, "learning_rate": 0.00012644252841668724, "loss": 0.0091, "step": 229340 }, { "epoch": 1.16, "learning_rate": 0.00012643496072367325, "loss": 0.0093, "step": 229350 }, { "epoch": 1.16, "learning_rate": 0.00012642739303065923, "loss": 0.0098, "step": 229360 }, { "epoch": 1.16, "learning_rate": 0.00012641982533764522, "loss": 0.0091, "step": 229370 }, { "epoch": 1.16, "learning_rate": 0.00012641225764463122, "loss": 0.01, "step": 229380 }, { "epoch": 1.16, "learning_rate": 0.0001264046899516172, "loss": 0.0087, "step": 229390 }, { "epoch": 1.16, "learning_rate": 0.0001263971222586032, "loss": 0.0095, "step": 229400 }, { "epoch": 1.16, "learning_rate": 0.0001263895545655892, "loss": 0.0086, "step": 229410 }, { "epoch": 1.16, "learning_rate": 0.00012638198687257518, "loss": 0.0078, "step": 229420 }, { "epoch": 1.16, "learning_rate": 0.00012637441917956116, "loss": 0.0087, "step": 229430 }, { "epoch": 1.16, "learning_rate": 0.00012636685148654717, "loss": 0.0092, "step": 229440 }, { "epoch": 1.16, "learning_rate": 0.00012635928379353315, "loss": 0.0091, "step": 229450 }, { "epoch": 1.16, "learning_rate": 0.00012635171610051913, "loss": 0.01, "step": 229460 }, { "epoch": 1.16, "learning_rate": 0.0001263441484075051, "loss": 0.0087, "step": 229470 }, { "epoch": 1.16, "learning_rate": 0.00012633658071449112, "loss": 0.009, "step": 229480 }, { "epoch": 1.16, "learning_rate": 0.0001263290130214771, "loss": 0.0101, "step": 229490 }, { "epoch": 1.16, "learning_rate": 0.00012632144532846308, "loss": 0.0087, "step": 229500 }, { "epoch": 1.16, "learning_rate": 0.0001263138776354491, "loss": 0.0084, "step": 229510 }, { "epoch": 1.16, "learning_rate": 0.00012630630994243507, "loss": 0.011, "step": 229520 }, { "epoch": 1.16, "learning_rate": 0.00012629874224942105, "loss": 0.0068, "step": 229530 }, { "epoch": 1.16, "learning_rate": 0.00012629117455640706, "loss": 0.0084, "step": 229540 }, { "epoch": 1.16, "learning_rate": 0.00012628360686339304, "loss": 0.0082, "step": 229550 }, { "epoch": 1.16, "learning_rate": 0.00012627603917037903, "loss": 0.011, "step": 229560 }, { "epoch": 1.16, "learning_rate": 0.00012626847147736503, "loss": 0.0095, "step": 229570 }, { "epoch": 1.16, "learning_rate": 0.00012626090378435102, "loss": 0.0086, "step": 229580 }, { "epoch": 1.16, "learning_rate": 0.000126253336091337, "loss": 0.009, "step": 229590 }, { "epoch": 1.16, "learning_rate": 0.000126245768398323, "loss": 0.0087, "step": 229600 }, { "epoch": 1.16, "learning_rate": 0.000126238200705309, "loss": 0.0083, "step": 229610 }, { "epoch": 1.16, "learning_rate": 0.00012623063301229497, "loss": 0.0085, "step": 229620 }, { "epoch": 1.16, "learning_rate": 0.00012622306531928098, "loss": 0.0097, "step": 229630 }, { "epoch": 1.16, "learning_rate": 0.00012621549762626696, "loss": 0.0085, "step": 229640 }, { "epoch": 1.16, "learning_rate": 0.00012620792993325294, "loss": 0.0085, "step": 229650 }, { "epoch": 1.16, "learning_rate": 0.00012620036224023892, "loss": 0.0098, "step": 229660 }, { "epoch": 1.16, "learning_rate": 0.00012619279454722493, "loss": 0.008, "step": 229670 }, { "epoch": 1.16, "learning_rate": 0.0001261852268542109, "loss": 0.0111, "step": 229680 }, { "epoch": 1.16, "learning_rate": 0.0001261776591611969, "loss": 0.0098, "step": 229690 }, { "epoch": 1.16, "learning_rate": 0.00012617009146818287, "loss": 0.0089, "step": 229700 }, { "epoch": 1.16, "learning_rate": 0.00012616252377516886, "loss": 0.01, "step": 229710 }, { "epoch": 1.16, "learning_rate": 0.00012615495608215486, "loss": 0.009, "step": 229720 }, { "epoch": 1.16, "learning_rate": 0.00012614738838914085, "loss": 0.009, "step": 229730 }, { "epoch": 1.16, "learning_rate": 0.00012613982069612683, "loss": 0.0105, "step": 229740 }, { "epoch": 1.16, "learning_rate": 0.00012613225300311284, "loss": 0.0089, "step": 229750 }, { "epoch": 1.16, "learning_rate": 0.00012612468531009882, "loss": 0.0082, "step": 229760 }, { "epoch": 1.16, "learning_rate": 0.0001261171176170848, "loss": 0.0098, "step": 229770 }, { "epoch": 1.16, "learning_rate": 0.0001261095499240708, "loss": 0.0083, "step": 229780 }, { "epoch": 1.16, "learning_rate": 0.0001261019822310568, "loss": 0.0099, "step": 229790 }, { "epoch": 1.16, "learning_rate": 0.00012609441453804277, "loss": 0.0088, "step": 229800 }, { "epoch": 1.16, "learning_rate": 0.00012608684684502878, "loss": 0.009, "step": 229810 }, { "epoch": 1.16, "learning_rate": 0.00012607927915201476, "loss": 0.0074, "step": 229820 }, { "epoch": 1.16, "learning_rate": 0.00012607171145900074, "loss": 0.0109, "step": 229830 }, { "epoch": 1.16, "learning_rate": 0.00012606414376598672, "loss": 0.0135, "step": 229840 }, { "epoch": 1.16, "learning_rate": 0.00012605657607297273, "loss": 0.008, "step": 229850 }, { "epoch": 1.16, "learning_rate": 0.0001260490083799587, "loss": 0.0105, "step": 229860 }, { "epoch": 1.16, "learning_rate": 0.0001260414406869447, "loss": 0.0221, "step": 229870 }, { "epoch": 1.16, "learning_rate": 0.0001260338729939307, "loss": 0.0097, "step": 229880 }, { "epoch": 1.16, "learning_rate": 0.00012602630530091668, "loss": 0.0112, "step": 229890 }, { "epoch": 1.16, "learning_rate": 0.00012601873760790267, "loss": 0.0123, "step": 229900 }, { "epoch": 1.16, "learning_rate": 0.00012601116991488867, "loss": 0.0098, "step": 229910 }, { "epoch": 1.16, "learning_rate": 0.00012600360222187466, "loss": 0.0086, "step": 229920 }, { "epoch": 1.16, "learning_rate": 0.00012599603452886064, "loss": 0.0069, "step": 229930 }, { "epoch": 1.16, "learning_rate": 0.00012598846683584665, "loss": 0.0107, "step": 229940 }, { "epoch": 1.16, "learning_rate": 0.00012598089914283263, "loss": 0.0074, "step": 229950 }, { "epoch": 1.16, "learning_rate": 0.0001259733314498186, "loss": 0.0074, "step": 229960 }, { "epoch": 1.16, "learning_rate": 0.00012596576375680462, "loss": 0.0097, "step": 229970 }, { "epoch": 1.16, "learning_rate": 0.0001259581960637906, "loss": 0.0084, "step": 229980 }, { "epoch": 1.16, "learning_rate": 0.00012595062837077658, "loss": 0.0106, "step": 229990 }, { "epoch": 1.16, "learning_rate": 0.00012594306067776256, "loss": 0.0113, "step": 230000 }, { "epoch": 1.16, "eval_cer": 0.9144556999612812, "eval_loss": 0.006792085710912943, "eval_runtime": 116.2077, "eval_samples_per_second": 17.211, "eval_steps_per_second": 4.303, "step": 230000 }, { "epoch": 1.16, "learning_rate": 0.00012593549298474857, "loss": 0.0083, "step": 230010 }, { "epoch": 1.16, "learning_rate": 0.00012592792529173455, "loss": 0.0075, "step": 230020 }, { "epoch": 1.16, "learning_rate": 0.00012592035759872053, "loss": 0.0076, "step": 230030 }, { "epoch": 1.16, "learning_rate": 0.00012591278990570654, "loss": 0.0087, "step": 230040 }, { "epoch": 1.16, "learning_rate": 0.00012590522221269252, "loss": 0.01, "step": 230050 }, { "epoch": 1.16, "learning_rate": 0.0001258976545196785, "loss": 0.0086, "step": 230060 }, { "epoch": 1.16, "learning_rate": 0.0001258900868266645, "loss": 0.0101, "step": 230070 }, { "epoch": 1.16, "learning_rate": 0.0001258825191336505, "loss": 0.0084, "step": 230080 }, { "epoch": 1.16, "learning_rate": 0.00012587495144063648, "loss": 0.0099, "step": 230090 }, { "epoch": 1.16, "learning_rate": 0.00012586738374762248, "loss": 0.0115, "step": 230100 }, { "epoch": 1.16, "learning_rate": 0.00012585981605460847, "loss": 0.0099, "step": 230110 }, { "epoch": 1.16, "learning_rate": 0.00012585224836159445, "loss": 0.0105, "step": 230120 }, { "epoch": 1.16, "learning_rate": 0.00012584468066858046, "loss": 0.0122, "step": 230130 }, { "epoch": 1.16, "learning_rate": 0.00012583711297556644, "loss": 0.0108, "step": 230140 }, { "epoch": 1.16, "learning_rate": 0.00012582954528255242, "loss": 0.0096, "step": 230150 }, { "epoch": 1.16, "learning_rate": 0.00012582197758953843, "loss": 0.0129, "step": 230160 }, { "epoch": 1.16, "learning_rate": 0.0001258144098965244, "loss": 0.0109, "step": 230170 }, { "epoch": 1.16, "learning_rate": 0.0001258068422035104, "loss": 0.0096, "step": 230180 }, { "epoch": 1.16, "learning_rate": 0.00012579927451049637, "loss": 0.0087, "step": 230190 }, { "epoch": 1.16, "learning_rate": 0.00012579170681748238, "loss": 0.0108, "step": 230200 }, { "epoch": 1.16, "learning_rate": 0.00012578413912446836, "loss": 0.0094, "step": 230210 }, { "epoch": 1.16, "learning_rate": 0.00012577657143145434, "loss": 0.0093, "step": 230220 }, { "epoch": 1.16, "learning_rate": 0.00012576900373844035, "loss": 0.0077, "step": 230230 }, { "epoch": 1.16, "learning_rate": 0.00012576143604542633, "loss": 0.0082, "step": 230240 }, { "epoch": 1.16, "learning_rate": 0.00012575386835241231, "loss": 0.0085, "step": 230250 }, { "epoch": 1.16, "learning_rate": 0.00012574630065939832, "loss": 0.0093, "step": 230260 }, { "epoch": 1.16, "learning_rate": 0.0001257387329663843, "loss": 0.0091, "step": 230270 }, { "epoch": 1.16, "learning_rate": 0.00012573116527337029, "loss": 0.0075, "step": 230280 }, { "epoch": 1.16, "learning_rate": 0.0001257235975803563, "loss": 0.0077, "step": 230290 }, { "epoch": 1.16, "learning_rate": 0.00012571602988734228, "loss": 0.011, "step": 230300 }, { "epoch": 1.16, "learning_rate": 0.00012570846219432826, "loss": 0.0095, "step": 230310 }, { "epoch": 1.16, "learning_rate": 0.00012570089450131427, "loss": 0.0092, "step": 230320 }, { "epoch": 1.16, "learning_rate": 0.00012569332680830022, "loss": 0.0094, "step": 230330 }, { "epoch": 1.16, "learning_rate": 0.00012568575911528623, "loss": 0.0081, "step": 230340 }, { "epoch": 1.16, "learning_rate": 0.0001256781914222722, "loss": 0.0111, "step": 230350 }, { "epoch": 1.16, "learning_rate": 0.0001256706237292582, "loss": 0.0098, "step": 230360 }, { "epoch": 1.16, "learning_rate": 0.00012566305603624417, "loss": 0.0103, "step": 230370 }, { "epoch": 1.16, "learning_rate": 0.00012565548834323018, "loss": 0.008, "step": 230380 }, { "epoch": 1.16, "learning_rate": 0.00012564792065021616, "loss": 0.0081, "step": 230390 }, { "epoch": 1.16, "learning_rate": 0.00012564035295720214, "loss": 0.0104, "step": 230400 }, { "epoch": 1.16, "learning_rate": 0.00012563278526418815, "loss": 0.0068, "step": 230410 }, { "epoch": 1.16, "learning_rate": 0.00012562521757117413, "loss": 0.0089, "step": 230420 }, { "epoch": 1.16, "learning_rate": 0.00012561764987816012, "loss": 0.0094, "step": 230430 }, { "epoch": 1.16, "learning_rate": 0.00012561008218514612, "loss": 0.0086, "step": 230440 }, { "epoch": 1.16, "learning_rate": 0.0001256025144921321, "loss": 0.0087, "step": 230450 }, { "epoch": 1.16, "learning_rate": 0.0001255949467991181, "loss": 0.008, "step": 230460 }, { "epoch": 1.16, "learning_rate": 0.0001255873791061041, "loss": 0.0102, "step": 230470 }, { "epoch": 1.16, "learning_rate": 0.00012557981141309008, "loss": 0.0112, "step": 230480 }, { "epoch": 1.16, "learning_rate": 0.00012557224372007606, "loss": 0.0086, "step": 230490 }, { "epoch": 1.16, "learning_rate": 0.00012556467602706207, "loss": 0.0109, "step": 230500 }, { "epoch": 1.16, "learning_rate": 0.00012555710833404805, "loss": 0.0084, "step": 230510 }, { "epoch": 1.16, "learning_rate": 0.00012554954064103403, "loss": 0.0119, "step": 230520 }, { "epoch": 1.16, "learning_rate": 0.00012554197294802, "loss": 0.0083, "step": 230530 }, { "epoch": 1.16, "learning_rate": 0.00012553440525500602, "loss": 0.0087, "step": 230540 }, { "epoch": 1.16, "learning_rate": 0.000125526837561992, "loss": 0.0077, "step": 230550 }, { "epoch": 1.16, "learning_rate": 0.00012551926986897798, "loss": 0.0076, "step": 230560 }, { "epoch": 1.16, "learning_rate": 0.000125511702175964, "loss": 0.0078, "step": 230570 }, { "epoch": 1.16, "learning_rate": 0.00012550413448294997, "loss": 0.0095, "step": 230580 }, { "epoch": 1.16, "learning_rate": 0.00012549656678993595, "loss": 0.0087, "step": 230590 }, { "epoch": 1.16, "learning_rate": 0.00012548899909692196, "loss": 0.0073, "step": 230600 }, { "epoch": 1.16, "learning_rate": 0.00012548143140390794, "loss": 0.0111, "step": 230610 }, { "epoch": 1.16, "learning_rate": 0.00012547386371089393, "loss": 0.0086, "step": 230620 }, { "epoch": 1.16, "learning_rate": 0.00012546629601787993, "loss": 0.0093, "step": 230630 }, { "epoch": 1.16, "learning_rate": 0.00012545872832486592, "loss": 0.0071, "step": 230640 }, { "epoch": 1.16, "learning_rate": 0.0001254511606318519, "loss": 0.0083, "step": 230650 }, { "epoch": 1.16, "learning_rate": 0.0001254435929388379, "loss": 0.008, "step": 230660 }, { "epoch": 1.16, "learning_rate": 0.0001254360252458239, "loss": 0.0096, "step": 230670 }, { "epoch": 1.16, "learning_rate": 0.00012542845755280987, "loss": 0.0096, "step": 230680 }, { "epoch": 1.16, "learning_rate": 0.00012542088985979588, "loss": 0.0103, "step": 230690 }, { "epoch": 1.16, "learning_rate": 0.00012541332216678186, "loss": 0.0094, "step": 230700 }, { "epoch": 1.16, "learning_rate": 0.00012540575447376784, "loss": 0.0089, "step": 230710 }, { "epoch": 1.16, "learning_rate": 0.00012539818678075382, "loss": 0.0085, "step": 230720 }, { "epoch": 1.16, "learning_rate": 0.00012539061908773983, "loss": 0.0097, "step": 230730 }, { "epoch": 1.16, "learning_rate": 0.0001253830513947258, "loss": 0.0086, "step": 230740 }, { "epoch": 1.16, "learning_rate": 0.0001253754837017118, "loss": 0.0119, "step": 230750 }, { "epoch": 1.16, "learning_rate": 0.0001253679160086978, "loss": 0.0081, "step": 230760 }, { "epoch": 1.16, "learning_rate": 0.00012536034831568378, "loss": 0.009, "step": 230770 }, { "epoch": 1.16, "learning_rate": 0.00012535278062266976, "loss": 0.0098, "step": 230780 }, { "epoch": 1.16, "learning_rate": 0.00012534521292965577, "loss": 0.0086, "step": 230790 }, { "epoch": 1.16, "learning_rate": 0.00012533764523664175, "loss": 0.01, "step": 230800 }, { "epoch": 1.16, "learning_rate": 0.00012533007754362774, "loss": 0.0098, "step": 230810 }, { "epoch": 1.16, "learning_rate": 0.00012532250985061374, "loss": 0.0077, "step": 230820 }, { "epoch": 1.16, "learning_rate": 0.00012531494215759973, "loss": 0.0089, "step": 230830 }, { "epoch": 1.16, "learning_rate": 0.0001253073744645857, "loss": 0.0085, "step": 230840 }, { "epoch": 1.16, "learning_rate": 0.00012529980677157172, "loss": 0.0081, "step": 230850 }, { "epoch": 1.16, "learning_rate": 0.0001252922390785577, "loss": 0.0079, "step": 230860 }, { "epoch": 1.16, "learning_rate": 0.00012528467138554368, "loss": 0.0089, "step": 230870 }, { "epoch": 1.16, "learning_rate": 0.00012527710369252966, "loss": 0.0089, "step": 230880 }, { "epoch": 1.16, "learning_rate": 0.00012526953599951567, "loss": 0.0092, "step": 230890 }, { "epoch": 1.16, "learning_rate": 0.00012526196830650165, "loss": 0.0082, "step": 230900 }, { "epoch": 1.16, "learning_rate": 0.00012525440061348763, "loss": 0.0087, "step": 230910 }, { "epoch": 1.17, "learning_rate": 0.00012524683292047364, "loss": 0.0097, "step": 230920 }, { "epoch": 1.17, "learning_rate": 0.00012523926522745962, "loss": 0.012, "step": 230930 }, { "epoch": 1.17, "learning_rate": 0.0001252316975344456, "loss": 0.0091, "step": 230940 }, { "epoch": 1.17, "learning_rate": 0.0001252241298414316, "loss": 0.0108, "step": 230950 }, { "epoch": 1.17, "learning_rate": 0.00012521656214841757, "loss": 0.0088, "step": 230960 }, { "epoch": 1.17, "learning_rate": 0.00012520899445540357, "loss": 0.0124, "step": 230970 }, { "epoch": 1.17, "learning_rate": 0.00012520142676238956, "loss": 0.0096, "step": 230980 }, { "epoch": 1.17, "learning_rate": 0.00012519385906937554, "loss": 0.011, "step": 230990 }, { "epoch": 1.17, "learning_rate": 0.00012518629137636155, "loss": 0.0086, "step": 231000 }, { "epoch": 1.17, "eval_cer": 0.9144353216426477, "eval_loss": 0.006772263906896114, "eval_runtime": 116.0719, "eval_samples_per_second": 17.231, "eval_steps_per_second": 4.308, "step": 231000 }, { "epoch": 1.17, "learning_rate": 0.00012517872368334753, "loss": 0.0083, "step": 231010 }, { "epoch": 1.17, "learning_rate": 0.0001251711559903335, "loss": 0.008, "step": 231020 }, { "epoch": 1.17, "learning_rate": 0.00012516358829731952, "loss": 0.0109, "step": 231030 }, { "epoch": 1.17, "learning_rate": 0.0001251560206043055, "loss": 0.01, "step": 231040 }, { "epoch": 1.17, "learning_rate": 0.00012514845291129148, "loss": 0.0098, "step": 231050 }, { "epoch": 1.17, "learning_rate": 0.0001251408852182775, "loss": 0.0091, "step": 231060 }, { "epoch": 1.17, "learning_rate": 0.00012513331752526347, "loss": 0.0108, "step": 231070 }, { "epoch": 1.17, "learning_rate": 0.00012512574983224945, "loss": 0.009, "step": 231080 }, { "epoch": 1.17, "learning_rate": 0.00012511818213923543, "loss": 0.0086, "step": 231090 }, { "epoch": 1.17, "learning_rate": 0.00012511061444622144, "loss": 0.0091, "step": 231100 }, { "epoch": 1.17, "learning_rate": 0.00012510304675320742, "loss": 0.0078, "step": 231110 }, { "epoch": 1.17, "learning_rate": 0.0001250954790601934, "loss": 0.0135, "step": 231120 }, { "epoch": 1.17, "learning_rate": 0.0001250879113671794, "loss": 0.0079, "step": 231130 }, { "epoch": 1.17, "learning_rate": 0.0001250803436741654, "loss": 0.0119, "step": 231140 }, { "epoch": 1.17, "learning_rate": 0.00012507277598115138, "loss": 0.0098, "step": 231150 }, { "epoch": 1.17, "learning_rate": 0.00012506520828813738, "loss": 0.0115, "step": 231160 }, { "epoch": 1.17, "learning_rate": 0.00012505764059512337, "loss": 0.009, "step": 231170 }, { "epoch": 1.17, "learning_rate": 0.00012505007290210935, "loss": 0.0071, "step": 231180 }, { "epoch": 1.17, "learning_rate": 0.00012504250520909536, "loss": 0.0081, "step": 231190 }, { "epoch": 1.17, "learning_rate": 0.00012503493751608134, "loss": 0.0099, "step": 231200 }, { "epoch": 1.17, "learning_rate": 0.00012502736982306732, "loss": 0.0095, "step": 231210 }, { "epoch": 1.17, "learning_rate": 0.00012501980213005333, "loss": 0.0116, "step": 231220 }, { "epoch": 1.17, "learning_rate": 0.0001250122344370393, "loss": 0.01, "step": 231230 }, { "epoch": 1.17, "learning_rate": 0.0001250046667440253, "loss": 0.0102, "step": 231240 }, { "epoch": 1.17, "learning_rate": 0.00012499709905101127, "loss": 0.0093, "step": 231250 }, { "epoch": 1.17, "learning_rate": 0.00012498953135799728, "loss": 0.0079, "step": 231260 }, { "epoch": 1.17, "learning_rate": 0.00012498196366498326, "loss": 0.0094, "step": 231270 }, { "epoch": 1.17, "learning_rate": 0.00012497439597196924, "loss": 0.0112, "step": 231280 }, { "epoch": 1.17, "learning_rate": 0.00012496682827895525, "loss": 0.0115, "step": 231290 }, { "epoch": 1.17, "learning_rate": 0.00012495926058594123, "loss": 0.0113, "step": 231300 }, { "epoch": 1.17, "learning_rate": 0.00012495169289292721, "loss": 0.0109, "step": 231310 }, { "epoch": 1.17, "learning_rate": 0.00012494412519991322, "loss": 0.013, "step": 231320 }, { "epoch": 1.17, "learning_rate": 0.0001249365575068992, "loss": 0.0074, "step": 231330 }, { "epoch": 1.17, "learning_rate": 0.00012492898981388519, "loss": 0.0101, "step": 231340 }, { "epoch": 1.17, "learning_rate": 0.0001249214221208712, "loss": 0.0109, "step": 231350 }, { "epoch": 1.17, "learning_rate": 0.00012491385442785718, "loss": 0.0095, "step": 231360 }, { "epoch": 1.17, "learning_rate": 0.00012490628673484316, "loss": 0.0136, "step": 231370 }, { "epoch": 1.17, "learning_rate": 0.00012489871904182917, "loss": 0.0108, "step": 231380 }, { "epoch": 1.17, "learning_rate": 0.00012489115134881515, "loss": 0.0081, "step": 231390 }, { "epoch": 1.17, "learning_rate": 0.00012488358365580113, "loss": 0.0073, "step": 231400 }, { "epoch": 1.17, "learning_rate": 0.0001248760159627871, "loss": 0.008, "step": 231410 }, { "epoch": 1.17, "learning_rate": 0.00012486844826977312, "loss": 0.0077, "step": 231420 }, { "epoch": 1.17, "learning_rate": 0.0001248608805767591, "loss": 0.0097, "step": 231430 }, { "epoch": 1.17, "learning_rate": 0.00012485331288374508, "loss": 0.0078, "step": 231440 }, { "epoch": 1.17, "learning_rate": 0.0001248457451907311, "loss": 0.0106, "step": 231450 }, { "epoch": 1.17, "learning_rate": 0.00012483817749771707, "loss": 0.0092, "step": 231460 }, { "epoch": 1.17, "learning_rate": 0.00012483060980470305, "loss": 0.008, "step": 231470 }, { "epoch": 1.17, "learning_rate": 0.00012482304211168906, "loss": 0.0072, "step": 231480 }, { "epoch": 1.17, "learning_rate": 0.00012481547441867504, "loss": 0.0098, "step": 231490 }, { "epoch": 1.17, "learning_rate": 0.00012480790672566102, "loss": 0.0118, "step": 231500 }, { "epoch": 1.17, "learning_rate": 0.00012480033903264703, "loss": 0.0113, "step": 231510 }, { "epoch": 1.17, "learning_rate": 0.00012479277133963301, "loss": 0.0099, "step": 231520 }, { "epoch": 1.17, "learning_rate": 0.000124785203646619, "loss": 0.0086, "step": 231530 }, { "epoch": 1.17, "learning_rate": 0.000124777635953605, "loss": 0.007, "step": 231540 }, { "epoch": 1.17, "learning_rate": 0.00012477006826059099, "loss": 0.0115, "step": 231550 }, { "epoch": 1.17, "learning_rate": 0.00012476250056757697, "loss": 0.0116, "step": 231560 }, { "epoch": 1.17, "learning_rate": 0.00012475493287456298, "loss": 0.0101, "step": 231570 }, { "epoch": 1.17, "learning_rate": 0.00012474736518154896, "loss": 0.0103, "step": 231580 }, { "epoch": 1.17, "learning_rate": 0.00012473979748853494, "loss": 0.0077, "step": 231590 }, { "epoch": 1.17, "learning_rate": 0.00012473222979552092, "loss": 0.008, "step": 231600 }, { "epoch": 1.17, "learning_rate": 0.0001247246621025069, "loss": 0.0131, "step": 231610 }, { "epoch": 1.17, "learning_rate": 0.00012471709440949288, "loss": 0.0092, "step": 231620 }, { "epoch": 1.17, "learning_rate": 0.0001247095267164789, "loss": 0.0094, "step": 231630 }, { "epoch": 1.17, "learning_rate": 0.00012470195902346487, "loss": 0.0097, "step": 231640 }, { "epoch": 1.17, "learning_rate": 0.00012469439133045085, "loss": 0.0077, "step": 231650 }, { "epoch": 1.17, "learning_rate": 0.00012468682363743686, "loss": 0.0087, "step": 231660 }, { "epoch": 1.17, "learning_rate": 0.00012467925594442284, "loss": 0.0095, "step": 231670 }, { "epoch": 1.17, "learning_rate": 0.00012467168825140883, "loss": 0.009, "step": 231680 }, { "epoch": 1.17, "learning_rate": 0.00012466412055839483, "loss": 0.0098, "step": 231690 }, { "epoch": 1.17, "learning_rate": 0.00012465655286538082, "loss": 0.011, "step": 231700 }, { "epoch": 1.17, "learning_rate": 0.0001246489851723668, "loss": 0.0084, "step": 231710 }, { "epoch": 1.17, "learning_rate": 0.0001246414174793528, "loss": 0.0109, "step": 231720 }, { "epoch": 1.17, "learning_rate": 0.0001246338497863388, "loss": 0.009, "step": 231730 }, { "epoch": 1.17, "learning_rate": 0.00012462628209332477, "loss": 0.0078, "step": 231740 }, { "epoch": 1.17, "learning_rate": 0.00012461871440031078, "loss": 0.0093, "step": 231750 }, { "epoch": 1.17, "learning_rate": 0.00012461114670729676, "loss": 0.0083, "step": 231760 }, { "epoch": 1.17, "learning_rate": 0.00012460357901428274, "loss": 0.0066, "step": 231770 }, { "epoch": 1.17, "learning_rate": 0.00012459601132126872, "loss": 0.0083, "step": 231780 }, { "epoch": 1.17, "learning_rate": 0.00012458844362825473, "loss": 0.0077, "step": 231790 }, { "epoch": 1.17, "learning_rate": 0.0001245808759352407, "loss": 0.0098, "step": 231800 }, { "epoch": 1.17, "learning_rate": 0.0001245733082422267, "loss": 0.0115, "step": 231810 }, { "epoch": 1.17, "learning_rate": 0.0001245657405492127, "loss": 0.0085, "step": 231820 }, { "epoch": 1.17, "learning_rate": 0.00012455817285619868, "loss": 0.0106, "step": 231830 }, { "epoch": 1.17, "learning_rate": 0.00012455060516318466, "loss": 0.0094, "step": 231840 }, { "epoch": 1.17, "learning_rate": 0.00012454303747017067, "loss": 0.0102, "step": 231850 }, { "epoch": 1.17, "learning_rate": 0.00012453546977715665, "loss": 0.0094, "step": 231860 }, { "epoch": 1.17, "learning_rate": 0.00012452790208414264, "loss": 0.0113, "step": 231870 }, { "epoch": 1.17, "learning_rate": 0.00012452033439112864, "loss": 0.0081, "step": 231880 }, { "epoch": 1.17, "learning_rate": 0.00012451276669811463, "loss": 0.0124, "step": 231890 }, { "epoch": 1.17, "learning_rate": 0.0001245051990051006, "loss": 0.0078, "step": 231900 }, { "epoch": 1.17, "learning_rate": 0.00012449763131208662, "loss": 0.0112, "step": 231910 }, { "epoch": 1.17, "learning_rate": 0.0001244900636190726, "loss": 0.01, "step": 231920 }, { "epoch": 1.17, "learning_rate": 0.00012448249592605858, "loss": 0.0075, "step": 231930 }, { "epoch": 1.17, "learning_rate": 0.00012447492823304456, "loss": 0.0094, "step": 231940 }, { "epoch": 1.17, "learning_rate": 0.00012446736054003057, "loss": 0.0077, "step": 231950 }, { "epoch": 1.17, "learning_rate": 0.00012445979284701655, "loss": 0.0089, "step": 231960 }, { "epoch": 1.17, "learning_rate": 0.00012445222515400253, "loss": 0.0072, "step": 231970 }, { "epoch": 1.17, "learning_rate": 0.00012444465746098854, "loss": 0.0095, "step": 231980 }, { "epoch": 1.17, "learning_rate": 0.00012443708976797452, "loss": 0.0108, "step": 231990 }, { "epoch": 1.17, "learning_rate": 0.0001244295220749605, "loss": 0.0075, "step": 232000 }, { "epoch": 1.17, "eval_cer": 0.9144654039225352, "eval_loss": 0.006733159068971872, "eval_runtime": 115.9285, "eval_samples_per_second": 17.252, "eval_steps_per_second": 4.313, "step": 232000 }, { "epoch": 1.17, "learning_rate": 0.0001244219543819465, "loss": 0.0108, "step": 232010 }, { "epoch": 1.17, "learning_rate": 0.0001244143866889325, "loss": 0.0096, "step": 232020 }, { "epoch": 1.17, "learning_rate": 0.00012440681899591848, "loss": 0.0086, "step": 232030 }, { "epoch": 1.17, "learning_rate": 0.00012439925130290448, "loss": 0.0088, "step": 232040 }, { "epoch": 1.17, "learning_rate": 0.00012439168360989047, "loss": 0.0111, "step": 232050 }, { "epoch": 1.17, "learning_rate": 0.00012438411591687645, "loss": 0.0079, "step": 232060 }, { "epoch": 1.17, "learning_rate": 0.00012437654822386246, "loss": 0.0072, "step": 232070 }, { "epoch": 1.17, "learning_rate": 0.00012436898053084844, "loss": 0.0086, "step": 232080 }, { "epoch": 1.17, "learning_rate": 0.00012436141283783442, "loss": 0.0098, "step": 232090 }, { "epoch": 1.17, "learning_rate": 0.00012435384514482043, "loss": 0.0129, "step": 232100 }, { "epoch": 1.17, "learning_rate": 0.0001243462774518064, "loss": 0.0102, "step": 232110 }, { "epoch": 1.17, "learning_rate": 0.0001243387097587924, "loss": 0.0102, "step": 232120 }, { "epoch": 1.17, "learning_rate": 0.00012433114206577837, "loss": 0.0117, "step": 232130 }, { "epoch": 1.17, "learning_rate": 0.00012432357437276438, "loss": 0.0085, "step": 232140 }, { "epoch": 1.17, "learning_rate": 0.00012431600667975036, "loss": 0.008, "step": 232150 }, { "epoch": 1.17, "learning_rate": 0.00012430843898673634, "loss": 0.0075, "step": 232160 }, { "epoch": 1.17, "learning_rate": 0.00012430087129372235, "loss": 0.0131, "step": 232170 }, { "epoch": 1.17, "learning_rate": 0.00012429330360070833, "loss": 0.0105, "step": 232180 }, { "epoch": 1.17, "learning_rate": 0.00012428573590769431, "loss": 0.0098, "step": 232190 }, { "epoch": 1.17, "learning_rate": 0.00012427816821468032, "loss": 0.0091, "step": 232200 }, { "epoch": 1.17, "learning_rate": 0.00012427060052166628, "loss": 0.01, "step": 232210 }, { "epoch": 1.17, "learning_rate": 0.00012426303282865229, "loss": 0.009, "step": 232220 }, { "epoch": 1.17, "learning_rate": 0.00012425546513563827, "loss": 0.0077, "step": 232230 }, { "epoch": 1.17, "learning_rate": 0.00012424789744262425, "loss": 0.0123, "step": 232240 }, { "epoch": 1.17, "learning_rate": 0.00012424032974961026, "loss": 0.0099, "step": 232250 }, { "epoch": 1.17, "learning_rate": 0.00012423276205659624, "loss": 0.0069, "step": 232260 }, { "epoch": 1.17, "learning_rate": 0.00012422519436358222, "loss": 0.0075, "step": 232270 }, { "epoch": 1.17, "learning_rate": 0.00012421762667056823, "loss": 0.01, "step": 232280 }, { "epoch": 1.17, "learning_rate": 0.0001242100589775542, "loss": 0.0097, "step": 232290 }, { "epoch": 1.17, "learning_rate": 0.0001242024912845402, "loss": 0.0102, "step": 232300 }, { "epoch": 1.17, "learning_rate": 0.00012419492359152617, "loss": 0.0093, "step": 232310 }, { "epoch": 1.17, "learning_rate": 0.00012418735589851218, "loss": 0.0102, "step": 232320 }, { "epoch": 1.17, "learning_rate": 0.00012417978820549816, "loss": 0.0076, "step": 232330 }, { "epoch": 1.17, "learning_rate": 0.00012417222051248414, "loss": 0.0083, "step": 232340 }, { "epoch": 1.17, "learning_rate": 0.00012416465281947015, "loss": 0.0071, "step": 232350 }, { "epoch": 1.17, "learning_rate": 0.00012415708512645613, "loss": 0.0106, "step": 232360 }, { "epoch": 1.17, "learning_rate": 0.00012414951743344212, "loss": 0.0083, "step": 232370 }, { "epoch": 1.17, "learning_rate": 0.00012414194974042812, "loss": 0.0116, "step": 232380 }, { "epoch": 1.17, "learning_rate": 0.0001241343820474141, "loss": 0.0091, "step": 232390 }, { "epoch": 1.17, "learning_rate": 0.0001241268143544001, "loss": 0.0075, "step": 232400 }, { "epoch": 1.17, "learning_rate": 0.0001241192466613861, "loss": 0.01, "step": 232410 }, { "epoch": 1.17, "learning_rate": 0.00012411167896837208, "loss": 0.0083, "step": 232420 }, { "epoch": 1.17, "learning_rate": 0.00012410411127535806, "loss": 0.0091, "step": 232430 }, { "epoch": 1.17, "learning_rate": 0.00012409654358234407, "loss": 0.0104, "step": 232440 }, { "epoch": 1.17, "learning_rate": 0.00012408897588933005, "loss": 0.0101, "step": 232450 }, { "epoch": 1.17, "learning_rate": 0.00012408140819631603, "loss": 0.0155, "step": 232460 }, { "epoch": 1.17, "learning_rate": 0.000124073840503302, "loss": 0.0083, "step": 232470 }, { "epoch": 1.17, "learning_rate": 0.00012406627281028802, "loss": 0.0081, "step": 232480 }, { "epoch": 1.17, "learning_rate": 0.000124058705117274, "loss": 0.0088, "step": 232490 }, { "epoch": 1.17, "learning_rate": 0.00012405113742425998, "loss": 0.0083, "step": 232500 }, { "epoch": 1.17, "learning_rate": 0.000124043569731246, "loss": 0.0065, "step": 232510 }, { "epoch": 1.17, "learning_rate": 0.00012403600203823197, "loss": 0.0081, "step": 232520 }, { "epoch": 1.17, "learning_rate": 0.00012402843434521795, "loss": 0.0096, "step": 232530 }, { "epoch": 1.17, "learning_rate": 0.00012402086665220396, "loss": 0.0096, "step": 232540 }, { "epoch": 1.17, "learning_rate": 0.00012401329895918994, "loss": 0.0118, "step": 232550 }, { "epoch": 1.17, "learning_rate": 0.00012400573126617593, "loss": 0.007, "step": 232560 }, { "epoch": 1.17, "learning_rate": 0.00012399816357316193, "loss": 0.0097, "step": 232570 }, { "epoch": 1.17, "learning_rate": 0.00012399059588014792, "loss": 0.0088, "step": 232580 }, { "epoch": 1.17, "learning_rate": 0.0001239830281871339, "loss": 0.0119, "step": 232590 }, { "epoch": 1.17, "learning_rate": 0.0001239754604941199, "loss": 0.0099, "step": 232600 }, { "epoch": 1.17, "learning_rate": 0.0001239678928011059, "loss": 0.0138, "step": 232610 }, { "epoch": 1.17, "learning_rate": 0.00012396032510809187, "loss": 0.0096, "step": 232620 }, { "epoch": 1.17, "learning_rate": 0.00012395275741507788, "loss": 0.0088, "step": 232630 }, { "epoch": 1.17, "learning_rate": 0.00012394518972206386, "loss": 0.0091, "step": 232640 }, { "epoch": 1.17, "learning_rate": 0.00012393762202904984, "loss": 0.0081, "step": 232650 }, { "epoch": 1.17, "learning_rate": 0.00012393005433603582, "loss": 0.0071, "step": 232660 }, { "epoch": 1.17, "learning_rate": 0.00012392248664302183, "loss": 0.0077, "step": 232670 }, { "epoch": 1.17, "learning_rate": 0.0001239149189500078, "loss": 0.0078, "step": 232680 }, { "epoch": 1.17, "learning_rate": 0.0001239073512569938, "loss": 0.0119, "step": 232690 }, { "epoch": 1.17, "learning_rate": 0.0001238997835639798, "loss": 0.0099, "step": 232700 }, { "epoch": 1.17, "learning_rate": 0.00012389221587096578, "loss": 0.0098, "step": 232710 }, { "epoch": 1.17, "learning_rate": 0.00012388464817795176, "loss": 0.0084, "step": 232720 }, { "epoch": 1.17, "learning_rate": 0.00012387708048493777, "loss": 0.0117, "step": 232730 }, { "epoch": 1.17, "learning_rate": 0.00012386951279192375, "loss": 0.0083, "step": 232740 }, { "epoch": 1.17, "learning_rate": 0.00012386194509890974, "loss": 0.0105, "step": 232750 }, { "epoch": 1.17, "learning_rate": 0.00012385437740589574, "loss": 0.0077, "step": 232760 }, { "epoch": 1.17, "learning_rate": 0.00012384680971288173, "loss": 0.0089, "step": 232770 }, { "epoch": 1.17, "learning_rate": 0.0001238392420198677, "loss": 0.0071, "step": 232780 }, { "epoch": 1.17, "learning_rate": 0.00012383167432685372, "loss": 0.0096, "step": 232790 }, { "epoch": 1.17, "learning_rate": 0.0001238241066338397, "loss": 0.0089, "step": 232800 }, { "epoch": 1.17, "learning_rate": 0.00012381653894082568, "loss": 0.0087, "step": 232810 }, { "epoch": 1.17, "learning_rate": 0.00012380897124781166, "loss": 0.0079, "step": 232820 }, { "epoch": 1.17, "learning_rate": 0.00012380140355479767, "loss": 0.0089, "step": 232830 }, { "epoch": 1.17, "learning_rate": 0.00012379383586178362, "loss": 0.0102, "step": 232840 }, { "epoch": 1.17, "learning_rate": 0.00012378626816876963, "loss": 0.0088, "step": 232850 }, { "epoch": 1.17, "learning_rate": 0.0001237787004757556, "loss": 0.0096, "step": 232860 }, { "epoch": 1.17, "learning_rate": 0.0001237711327827416, "loss": 0.0117, "step": 232870 }, { "epoch": 1.17, "learning_rate": 0.0001237635650897276, "loss": 0.009, "step": 232880 }, { "epoch": 1.17, "learning_rate": 0.00012375599739671358, "loss": 0.01, "step": 232890 }, { "epoch": 1.18, "learning_rate": 0.00012374842970369957, "loss": 0.0089, "step": 232900 }, { "epoch": 1.18, "learning_rate": 0.00012374086201068557, "loss": 0.0085, "step": 232910 }, { "epoch": 1.18, "learning_rate": 0.00012373329431767156, "loss": 0.0087, "step": 232920 }, { "epoch": 1.18, "learning_rate": 0.00012372572662465754, "loss": 0.0088, "step": 232930 }, { "epoch": 1.18, "learning_rate": 0.00012371815893164355, "loss": 0.0067, "step": 232940 }, { "epoch": 1.18, "learning_rate": 0.00012371059123862953, "loss": 0.0092, "step": 232950 }, { "epoch": 1.18, "learning_rate": 0.0001237030235456155, "loss": 0.0101, "step": 232960 }, { "epoch": 1.18, "learning_rate": 0.00012369545585260152, "loss": 0.0097, "step": 232970 }, { "epoch": 1.18, "learning_rate": 0.0001236878881595875, "loss": 0.008, "step": 232980 }, { "epoch": 1.18, "learning_rate": 0.00012368032046657348, "loss": 0.0083, "step": 232990 }, { "epoch": 1.18, "learning_rate": 0.0001236727527735595, "loss": 0.0077, "step": 233000 }, { "epoch": 1.18, "eval_cer": 0.914438232831024, "eval_loss": 0.006864336784929037, "eval_runtime": 115.9429, "eval_samples_per_second": 17.25, "eval_steps_per_second": 4.312, "step": 233000 }, { "epoch": 1.18, "learning_rate": 0.00012366518508054547, "loss": 0.0094, "step": 233010 }, { "epoch": 1.18, "learning_rate": 0.00012365761738753145, "loss": 0.0101, "step": 233020 }, { "epoch": 1.18, "learning_rate": 0.00012365004969451743, "loss": 0.0131, "step": 233030 }, { "epoch": 1.18, "learning_rate": 0.00012364248200150344, "loss": 0.0068, "step": 233040 }, { "epoch": 1.18, "learning_rate": 0.00012363491430848942, "loss": 0.0107, "step": 233050 }, { "epoch": 1.18, "learning_rate": 0.0001236273466154754, "loss": 0.0104, "step": 233060 }, { "epoch": 1.18, "learning_rate": 0.0001236197789224614, "loss": 0.0077, "step": 233070 }, { "epoch": 1.18, "learning_rate": 0.0001236122112294474, "loss": 0.0091, "step": 233080 }, { "epoch": 1.18, "learning_rate": 0.00012360464353643338, "loss": 0.0111, "step": 233090 }, { "epoch": 1.18, "learning_rate": 0.00012359707584341938, "loss": 0.0103, "step": 233100 }, { "epoch": 1.18, "learning_rate": 0.00012358950815040537, "loss": 0.0088, "step": 233110 }, { "epoch": 1.18, "learning_rate": 0.00012358194045739135, "loss": 0.0085, "step": 233120 }, { "epoch": 1.18, "learning_rate": 0.00012357437276437736, "loss": 0.0122, "step": 233130 }, { "epoch": 1.18, "learning_rate": 0.00012356680507136334, "loss": 0.0069, "step": 233140 }, { "epoch": 1.18, "learning_rate": 0.00012355923737834932, "loss": 0.0143, "step": 233150 }, { "epoch": 1.18, "learning_rate": 0.00012355166968533533, "loss": 0.0093, "step": 233160 }, { "epoch": 1.18, "learning_rate": 0.0001235441019923213, "loss": 0.0086, "step": 233170 }, { "epoch": 1.18, "learning_rate": 0.0001235365342993073, "loss": 0.0092, "step": 233180 }, { "epoch": 1.18, "learning_rate": 0.00012352896660629327, "loss": 0.0102, "step": 233190 }, { "epoch": 1.18, "learning_rate": 0.00012352139891327928, "loss": 0.0094, "step": 233200 }, { "epoch": 1.18, "learning_rate": 0.00012351383122026526, "loss": 0.0069, "step": 233210 }, { "epoch": 1.18, "learning_rate": 0.00012350626352725124, "loss": 0.0081, "step": 233220 }, { "epoch": 1.18, "learning_rate": 0.00012349869583423725, "loss": 0.0083, "step": 233230 }, { "epoch": 1.18, "learning_rate": 0.00012349112814122323, "loss": 0.0092, "step": 233240 }, { "epoch": 1.18, "learning_rate": 0.00012348356044820921, "loss": 0.0086, "step": 233250 }, { "epoch": 1.18, "learning_rate": 0.00012347599275519522, "loss": 0.0086, "step": 233260 }, { "epoch": 1.18, "learning_rate": 0.0001234684250621812, "loss": 0.0103, "step": 233270 }, { "epoch": 1.18, "learning_rate": 0.00012346085736916719, "loss": 0.0078, "step": 233280 }, { "epoch": 1.18, "learning_rate": 0.0001234532896761532, "loss": 0.0102, "step": 233290 }, { "epoch": 1.18, "learning_rate": 0.00012344572198313918, "loss": 0.0083, "step": 233300 }, { "epoch": 1.18, "learning_rate": 0.00012343815429012516, "loss": 0.0099, "step": 233310 }, { "epoch": 1.18, "learning_rate": 0.00012343058659711117, "loss": 0.0102, "step": 233320 }, { "epoch": 1.18, "learning_rate": 0.00012342301890409715, "loss": 0.0102, "step": 233330 }, { "epoch": 1.18, "learning_rate": 0.00012341545121108313, "loss": 0.0088, "step": 233340 }, { "epoch": 1.18, "learning_rate": 0.0001234078835180691, "loss": 0.0065, "step": 233350 }, { "epoch": 1.18, "learning_rate": 0.00012340031582505512, "loss": 0.0068, "step": 233360 }, { "epoch": 1.18, "learning_rate": 0.0001233927481320411, "loss": 0.0084, "step": 233370 }, { "epoch": 1.18, "learning_rate": 0.00012338518043902708, "loss": 0.0079, "step": 233380 }, { "epoch": 1.18, "learning_rate": 0.0001233776127460131, "loss": 0.0106, "step": 233390 }, { "epoch": 1.18, "learning_rate": 0.00012337004505299907, "loss": 0.0103, "step": 233400 }, { "epoch": 1.18, "learning_rate": 0.00012336247735998505, "loss": 0.0073, "step": 233410 }, { "epoch": 1.18, "learning_rate": 0.00012335490966697106, "loss": 0.0097, "step": 233420 }, { "epoch": 1.18, "learning_rate": 0.00012334734197395704, "loss": 0.0101, "step": 233430 }, { "epoch": 1.18, "learning_rate": 0.00012333977428094302, "loss": 0.0087, "step": 233440 }, { "epoch": 1.18, "learning_rate": 0.00012333220658792903, "loss": 0.01, "step": 233450 }, { "epoch": 1.18, "learning_rate": 0.00012332463889491501, "loss": 0.0091, "step": 233460 }, { "epoch": 1.18, "learning_rate": 0.000123317071201901, "loss": 0.0092, "step": 233470 }, { "epoch": 1.18, "learning_rate": 0.00012330950350888698, "loss": 0.0069, "step": 233480 }, { "epoch": 1.18, "learning_rate": 0.00012330193581587296, "loss": 0.0102, "step": 233490 }, { "epoch": 1.18, "learning_rate": 0.00012329436812285897, "loss": 0.0082, "step": 233500 }, { "epoch": 1.18, "learning_rate": 0.00012328680042984495, "loss": 0.0092, "step": 233510 }, { "epoch": 1.18, "learning_rate": 0.00012327923273683093, "loss": 0.0103, "step": 233520 }, { "epoch": 1.18, "learning_rate": 0.00012327166504381694, "loss": 0.0081, "step": 233530 }, { "epoch": 1.18, "learning_rate": 0.00012326409735080292, "loss": 0.0075, "step": 233540 }, { "epoch": 1.18, "learning_rate": 0.0001232565296577889, "loss": 0.0106, "step": 233550 }, { "epoch": 1.18, "learning_rate": 0.00012324896196477488, "loss": 0.0075, "step": 233560 }, { "epoch": 1.18, "learning_rate": 0.0001232413942717609, "loss": 0.0087, "step": 233570 }, { "epoch": 1.18, "learning_rate": 0.00012323382657874687, "loss": 0.0078, "step": 233580 }, { "epoch": 1.18, "learning_rate": 0.00012322625888573285, "loss": 0.0083, "step": 233590 }, { "epoch": 1.18, "learning_rate": 0.00012321869119271886, "loss": 0.0081, "step": 233600 }, { "epoch": 1.18, "learning_rate": 0.00012321112349970484, "loss": 0.0126, "step": 233610 }, { "epoch": 1.18, "learning_rate": 0.00012320355580669083, "loss": 0.008, "step": 233620 }, { "epoch": 1.18, "learning_rate": 0.00012319598811367683, "loss": 0.0086, "step": 233630 }, { "epoch": 1.18, "learning_rate": 0.00012318842042066282, "loss": 0.0078, "step": 233640 }, { "epoch": 1.18, "learning_rate": 0.0001231808527276488, "loss": 0.0081, "step": 233650 }, { "epoch": 1.18, "learning_rate": 0.0001231732850346348, "loss": 0.0112, "step": 233660 }, { "epoch": 1.18, "learning_rate": 0.0001231657173416208, "loss": 0.0114, "step": 233670 }, { "epoch": 1.18, "learning_rate": 0.00012315814964860677, "loss": 0.011, "step": 233680 }, { "epoch": 1.18, "learning_rate": 0.00012315058195559278, "loss": 0.0083, "step": 233690 }, { "epoch": 1.18, "learning_rate": 0.00012314301426257876, "loss": 0.0157, "step": 233700 }, { "epoch": 1.18, "learning_rate": 0.00012313544656956474, "loss": 0.011, "step": 233710 }, { "epoch": 1.18, "learning_rate": 0.00012312787887655072, "loss": 0.0084, "step": 233720 }, { "epoch": 1.18, "learning_rate": 0.00012312031118353673, "loss": 0.0101, "step": 233730 }, { "epoch": 1.18, "learning_rate": 0.0001231127434905227, "loss": 0.0101, "step": 233740 }, { "epoch": 1.18, "learning_rate": 0.0001231051757975087, "loss": 0.0087, "step": 233750 }, { "epoch": 1.18, "learning_rate": 0.0001230976081044947, "loss": 0.0082, "step": 233760 }, { "epoch": 1.18, "learning_rate": 0.00012309004041148068, "loss": 0.0092, "step": 233770 }, { "epoch": 1.18, "learning_rate": 0.00012308247271846666, "loss": 0.0129, "step": 233780 }, { "epoch": 1.18, "learning_rate": 0.00012307490502545267, "loss": 0.0113, "step": 233790 }, { "epoch": 1.18, "learning_rate": 0.00012306733733243865, "loss": 0.0075, "step": 233800 }, { "epoch": 1.18, "learning_rate": 0.00012305976963942464, "loss": 0.0084, "step": 233810 }, { "epoch": 1.18, "learning_rate": 0.00012305220194641064, "loss": 0.0087, "step": 233820 }, { "epoch": 1.18, "learning_rate": 0.00012304463425339663, "loss": 0.0063, "step": 233830 }, { "epoch": 1.18, "learning_rate": 0.0001230370665603826, "loss": 0.0061, "step": 233840 }, { "epoch": 1.18, "learning_rate": 0.00012302949886736862, "loss": 0.0081, "step": 233850 }, { "epoch": 1.18, "learning_rate": 0.0001230219311743546, "loss": 0.0119, "step": 233860 }, { "epoch": 1.18, "learning_rate": 0.00012301436348134058, "loss": 0.009, "step": 233870 }, { "epoch": 1.18, "learning_rate": 0.00012300679578832656, "loss": 0.0106, "step": 233880 }, { "epoch": 1.18, "learning_rate": 0.00012299922809531257, "loss": 0.0084, "step": 233890 }, { "epoch": 1.18, "learning_rate": 0.00012299166040229855, "loss": 0.0093, "step": 233900 }, { "epoch": 1.18, "learning_rate": 0.00012298409270928453, "loss": 0.0103, "step": 233910 }, { "epoch": 1.18, "learning_rate": 0.00012297652501627054, "loss": 0.0079, "step": 233920 }, { "epoch": 1.18, "learning_rate": 0.00012296895732325652, "loss": 0.0086, "step": 233930 }, { "epoch": 1.18, "learning_rate": 0.0001229613896302425, "loss": 0.0098, "step": 233940 }, { "epoch": 1.18, "learning_rate": 0.0001229538219372285, "loss": 0.0079, "step": 233950 }, { "epoch": 1.18, "learning_rate": 0.0001229462542442145, "loss": 0.0089, "step": 233960 }, { "epoch": 1.18, "learning_rate": 0.00012293868655120047, "loss": 0.0115, "step": 233970 }, { "epoch": 1.18, "learning_rate": 0.00012293111885818648, "loss": 0.0069, "step": 233980 }, { "epoch": 1.18, "learning_rate": 0.00012292355116517246, "loss": 0.0086, "step": 233990 }, { "epoch": 1.18, "learning_rate": 0.00012291598347215845, "loss": 0.0082, "step": 234000 }, { "epoch": 1.18, "eval_cer": 0.9144275584736445, "eval_loss": 0.0069518680684268475, "eval_runtime": 115.6903, "eval_samples_per_second": 17.288, "eval_steps_per_second": 4.322, "step": 234000 }, { "epoch": 1.18, "learning_rate": 0.00012290841577914445, "loss": 0.008, "step": 234010 }, { "epoch": 1.18, "learning_rate": 0.00012290084808613044, "loss": 0.0114, "step": 234020 }, { "epoch": 1.18, "learning_rate": 0.00012289328039311642, "loss": 0.0118, "step": 234030 }, { "epoch": 1.18, "learning_rate": 0.00012288571270010243, "loss": 0.0087, "step": 234040 }, { "epoch": 1.18, "learning_rate": 0.0001228781450070884, "loss": 0.0121, "step": 234050 }, { "epoch": 1.18, "learning_rate": 0.0001228705773140744, "loss": 0.0133, "step": 234060 }, { "epoch": 1.18, "learning_rate": 0.00012286300962106037, "loss": 0.0101, "step": 234070 }, { "epoch": 1.18, "learning_rate": 0.00012285544192804638, "loss": 0.0087, "step": 234080 }, { "epoch": 1.18, "learning_rate": 0.00012284787423503236, "loss": 0.0087, "step": 234090 }, { "epoch": 1.18, "learning_rate": 0.00012284030654201834, "loss": 0.009, "step": 234100 }, { "epoch": 1.18, "learning_rate": 0.00012283273884900432, "loss": 0.0122, "step": 234110 }, { "epoch": 1.18, "learning_rate": 0.0001228251711559903, "loss": 0.0091, "step": 234120 }, { "epoch": 1.18, "learning_rate": 0.0001228176034629763, "loss": 0.0075, "step": 234130 }, { "epoch": 1.18, "learning_rate": 0.0001228100357699623, "loss": 0.0132, "step": 234140 }, { "epoch": 1.18, "learning_rate": 0.00012280246807694828, "loss": 0.0093, "step": 234150 }, { "epoch": 1.18, "learning_rate": 0.00012279490038393428, "loss": 0.0114, "step": 234160 }, { "epoch": 1.18, "learning_rate": 0.00012278733269092027, "loss": 0.0084, "step": 234170 }, { "epoch": 1.18, "learning_rate": 0.00012277976499790625, "loss": 0.0076, "step": 234180 }, { "epoch": 1.18, "learning_rate": 0.00012277219730489226, "loss": 0.008, "step": 234190 }, { "epoch": 1.18, "learning_rate": 0.00012276462961187824, "loss": 0.0101, "step": 234200 }, { "epoch": 1.18, "learning_rate": 0.00012275706191886422, "loss": 0.0094, "step": 234210 }, { "epoch": 1.18, "learning_rate": 0.00012274949422585023, "loss": 0.0091, "step": 234220 }, { "epoch": 1.18, "learning_rate": 0.0001227419265328362, "loss": 0.0084, "step": 234230 }, { "epoch": 1.18, "learning_rate": 0.0001227343588398222, "loss": 0.009, "step": 234240 }, { "epoch": 1.18, "learning_rate": 0.00012272679114680817, "loss": 0.0096, "step": 234250 }, { "epoch": 1.18, "learning_rate": 0.00012271922345379418, "loss": 0.0084, "step": 234260 }, { "epoch": 1.18, "learning_rate": 0.00012271165576078016, "loss": 0.0093, "step": 234270 }, { "epoch": 1.18, "learning_rate": 0.00012270408806776614, "loss": 0.009, "step": 234280 }, { "epoch": 1.18, "learning_rate": 0.00012269652037475215, "loss": 0.0104, "step": 234290 }, { "epoch": 1.18, "learning_rate": 0.00012268895268173813, "loss": 0.012, "step": 234300 }, { "epoch": 1.18, "learning_rate": 0.00012268138498872411, "loss": 0.008, "step": 234310 }, { "epoch": 1.18, "learning_rate": 0.00012267381729571012, "loss": 0.0097, "step": 234320 }, { "epoch": 1.18, "learning_rate": 0.0001226662496026961, "loss": 0.0094, "step": 234330 }, { "epoch": 1.18, "learning_rate": 0.00012265868190968209, "loss": 0.0074, "step": 234340 }, { "epoch": 1.18, "learning_rate": 0.0001226511142166681, "loss": 0.0083, "step": 234350 }, { "epoch": 1.18, "learning_rate": 0.00012264354652365408, "loss": 0.0084, "step": 234360 }, { "epoch": 1.18, "learning_rate": 0.00012263597883064006, "loss": 0.0073, "step": 234370 }, { "epoch": 1.18, "learning_rate": 0.00012262841113762607, "loss": 0.0081, "step": 234380 }, { "epoch": 1.18, "learning_rate": 0.00012262084344461205, "loss": 0.0145, "step": 234390 }, { "epoch": 1.18, "learning_rate": 0.00012261327575159803, "loss": 0.008, "step": 234400 }, { "epoch": 1.18, "learning_rate": 0.000122605708058584, "loss": 0.0093, "step": 234410 }, { "epoch": 1.18, "learning_rate": 0.00012259814036557002, "loss": 0.0098, "step": 234420 }, { "epoch": 1.18, "learning_rate": 0.000122590572672556, "loss": 0.0073, "step": 234430 }, { "epoch": 1.18, "learning_rate": 0.00012258300497954198, "loss": 0.0078, "step": 234440 }, { "epoch": 1.18, "learning_rate": 0.000122575437286528, "loss": 0.0088, "step": 234450 }, { "epoch": 1.18, "learning_rate": 0.00012256786959351397, "loss": 0.0077, "step": 234460 }, { "epoch": 1.18, "learning_rate": 0.00012256030190049995, "loss": 0.0106, "step": 234470 }, { "epoch": 1.18, "learning_rate": 0.00012255273420748596, "loss": 0.0096, "step": 234480 }, { "epoch": 1.18, "learning_rate": 0.00012254516651447194, "loss": 0.0084, "step": 234490 }, { "epoch": 1.18, "learning_rate": 0.00012253759882145792, "loss": 0.0068, "step": 234500 }, { "epoch": 1.18, "learning_rate": 0.00012253003112844393, "loss": 0.0092, "step": 234510 }, { "epoch": 1.18, "learning_rate": 0.00012252246343542991, "loss": 0.0098, "step": 234520 }, { "epoch": 1.18, "learning_rate": 0.0001225148957424159, "loss": 0.009, "step": 234530 }, { "epoch": 1.18, "learning_rate": 0.0001225073280494019, "loss": 0.0088, "step": 234540 }, { "epoch": 1.18, "learning_rate": 0.00012249976035638789, "loss": 0.0087, "step": 234550 }, { "epoch": 1.18, "learning_rate": 0.00012249219266337387, "loss": 0.0109, "step": 234560 }, { "epoch": 1.18, "learning_rate": 0.00012248462497035988, "loss": 0.0095, "step": 234570 }, { "epoch": 1.18, "learning_rate": 0.00012247705727734586, "loss": 0.0097, "step": 234580 }, { "epoch": 1.18, "learning_rate": 0.00012246948958433184, "loss": 0.0087, "step": 234590 }, { "epoch": 1.18, "learning_rate": 0.00012246192189131782, "loss": 0.0073, "step": 234600 }, { "epoch": 1.18, "learning_rate": 0.00012245435419830383, "loss": 0.0079, "step": 234610 }, { "epoch": 1.18, "learning_rate": 0.0001224467865052898, "loss": 0.0123, "step": 234620 }, { "epoch": 1.18, "learning_rate": 0.0001224392188122758, "loss": 0.008, "step": 234630 }, { "epoch": 1.18, "learning_rate": 0.0001224316511192618, "loss": 0.0096, "step": 234640 }, { "epoch": 1.18, "learning_rate": 0.00012242408342624778, "loss": 0.0111, "step": 234650 }, { "epoch": 1.18, "learning_rate": 0.00012241651573323376, "loss": 0.0072, "step": 234660 }, { "epoch": 1.18, "learning_rate": 0.00012240894804021977, "loss": 0.0067, "step": 234670 }, { "epoch": 1.18, "learning_rate": 0.00012240138034720575, "loss": 0.0083, "step": 234680 }, { "epoch": 1.18, "learning_rate": 0.00012239381265419173, "loss": 0.0082, "step": 234690 }, { "epoch": 1.18, "learning_rate": 0.00012238624496117774, "loss": 0.0092, "step": 234700 }, { "epoch": 1.18, "learning_rate": 0.00012237867726816372, "loss": 0.0081, "step": 234710 }, { "epoch": 1.18, "learning_rate": 0.0001223711095751497, "loss": 0.0094, "step": 234720 }, { "epoch": 1.18, "learning_rate": 0.0001223635418821357, "loss": 0.0126, "step": 234730 }, { "epoch": 1.18, "learning_rate": 0.00012235597418912167, "loss": 0.0092, "step": 234740 }, { "epoch": 1.18, "learning_rate": 0.00012234840649610768, "loss": 0.0095, "step": 234750 }, { "epoch": 1.18, "learning_rate": 0.00012234083880309366, "loss": 0.009, "step": 234760 }, { "epoch": 1.18, "learning_rate": 0.00012233327111007964, "loss": 0.0077, "step": 234770 }, { "epoch": 1.18, "learning_rate": 0.00012232570341706562, "loss": 0.0098, "step": 234780 }, { "epoch": 1.18, "learning_rate": 0.00012231813572405163, "loss": 0.0104, "step": 234790 }, { "epoch": 1.18, "learning_rate": 0.0001223105680310376, "loss": 0.0077, "step": 234800 }, { "epoch": 1.18, "learning_rate": 0.0001223030003380236, "loss": 0.0093, "step": 234810 }, { "epoch": 1.18, "learning_rate": 0.0001222954326450096, "loss": 0.009, "step": 234820 }, { "epoch": 1.18, "learning_rate": 0.00012228786495199558, "loss": 0.0072, "step": 234830 }, { "epoch": 1.18, "learning_rate": 0.00012228029725898156, "loss": 0.0075, "step": 234840 }, { "epoch": 1.18, "learning_rate": 0.00012227272956596757, "loss": 0.0096, "step": 234850 }, { "epoch": 1.18, "learning_rate": 0.00012226516187295355, "loss": 0.0091, "step": 234860 }, { "epoch": 1.18, "learning_rate": 0.00012225759417993954, "loss": 0.0098, "step": 234870 }, { "epoch": 1.18, "learning_rate": 0.00012225002648692554, "loss": 0.0073, "step": 234880 }, { "epoch": 1.19, "learning_rate": 0.00012224245879391153, "loss": 0.009, "step": 234890 }, { "epoch": 1.19, "learning_rate": 0.0001222348911008975, "loss": 0.01, "step": 234900 }, { "epoch": 1.19, "learning_rate": 0.00012222732340788352, "loss": 0.0075, "step": 234910 }, { "epoch": 1.19, "learning_rate": 0.0001222197557148695, "loss": 0.0084, "step": 234920 }, { "epoch": 1.19, "learning_rate": 0.00012221218802185548, "loss": 0.0083, "step": 234930 }, { "epoch": 1.19, "learning_rate": 0.0001222046203288415, "loss": 0.0104, "step": 234940 }, { "epoch": 1.19, "learning_rate": 0.00012219705263582747, "loss": 0.011, "step": 234950 }, { "epoch": 1.19, "learning_rate": 0.00012218948494281345, "loss": 0.0108, "step": 234960 }, { "epoch": 1.19, "learning_rate": 0.00012218191724979943, "loss": 0.0099, "step": 234970 }, { "epoch": 1.19, "learning_rate": 0.00012217434955678544, "loss": 0.0071, "step": 234980 }, { "epoch": 1.19, "learning_rate": 0.00012216678186377142, "loss": 0.0084, "step": 234990 }, { "epoch": 1.19, "learning_rate": 0.0001221592141707574, "loss": 0.0086, "step": 235000 }, { "epoch": 1.19, "eval_cer": 0.9144362920387732, "eval_loss": 0.0068534985184669495, "eval_runtime": 115.6303, "eval_samples_per_second": 17.297, "eval_steps_per_second": 4.324, "step": 235000 }, { "epoch": 1.19, "learning_rate": 0.0001221516464777434, "loss": 0.008, "step": 235010 }, { "epoch": 1.19, "learning_rate": 0.0001221440787847294, "loss": 0.0096, "step": 235020 }, { "epoch": 1.19, "learning_rate": 0.00012213651109171537, "loss": 0.0084, "step": 235030 }, { "epoch": 1.19, "learning_rate": 0.00012212894339870138, "loss": 0.0104, "step": 235040 }, { "epoch": 1.19, "learning_rate": 0.00012212137570568736, "loss": 0.011, "step": 235050 }, { "epoch": 1.19, "learning_rate": 0.00012211380801267335, "loss": 0.0076, "step": 235060 }, { "epoch": 1.19, "learning_rate": 0.00012210624031965935, "loss": 0.0067, "step": 235070 }, { "epoch": 1.19, "learning_rate": 0.00012209867262664534, "loss": 0.0076, "step": 235080 }, { "epoch": 1.19, "learning_rate": 0.00012209110493363132, "loss": 0.0078, "step": 235090 }, { "epoch": 1.19, "learning_rate": 0.00012208353724061733, "loss": 0.0137, "step": 235100 }, { "epoch": 1.19, "learning_rate": 0.0001220759695476033, "loss": 0.01, "step": 235110 }, { "epoch": 1.19, "learning_rate": 0.00012206840185458929, "loss": 0.0119, "step": 235120 }, { "epoch": 1.19, "learning_rate": 0.00012206083416157528, "loss": 0.0062, "step": 235130 }, { "epoch": 1.19, "learning_rate": 0.00012205326646856128, "loss": 0.007, "step": 235140 }, { "epoch": 1.19, "learning_rate": 0.00012204569877554726, "loss": 0.0088, "step": 235150 }, { "epoch": 1.19, "learning_rate": 0.00012203813108253326, "loss": 0.0084, "step": 235160 }, { "epoch": 1.19, "learning_rate": 0.00012203056338951924, "loss": 0.0076, "step": 235170 }, { "epoch": 1.19, "learning_rate": 0.00012202299569650523, "loss": 0.0117, "step": 235180 }, { "epoch": 1.19, "learning_rate": 0.00012201542800349123, "loss": 0.0087, "step": 235190 }, { "epoch": 1.19, "learning_rate": 0.00012200786031047721, "loss": 0.009, "step": 235200 }, { "epoch": 1.19, "learning_rate": 0.0001220002926174632, "loss": 0.0074, "step": 235210 }, { "epoch": 1.19, "learning_rate": 0.0001219927249244492, "loss": 0.0066, "step": 235220 }, { "epoch": 1.19, "learning_rate": 0.00012198515723143518, "loss": 0.0079, "step": 235230 }, { "epoch": 1.19, "learning_rate": 0.00012197758953842117, "loss": 0.0104, "step": 235240 }, { "epoch": 1.19, "learning_rate": 0.00012197002184540716, "loss": 0.0083, "step": 235250 }, { "epoch": 1.19, "learning_rate": 0.00012196245415239315, "loss": 0.0091, "step": 235260 }, { "epoch": 1.19, "learning_rate": 0.00012195488645937915, "loss": 0.0093, "step": 235270 }, { "epoch": 1.19, "learning_rate": 0.00012194731876636513, "loss": 0.0099, "step": 235280 }, { "epoch": 1.19, "learning_rate": 0.00012193975107335112, "loss": 0.0095, "step": 235290 }, { "epoch": 1.19, "learning_rate": 0.00012193218338033712, "loss": 0.0069, "step": 235300 }, { "epoch": 1.19, "learning_rate": 0.0001219246156873231, "loss": 0.0073, "step": 235310 }, { "epoch": 1.19, "learning_rate": 0.0001219170479943091, "loss": 0.0073, "step": 235320 }, { "epoch": 1.19, "learning_rate": 0.00012190948030129508, "loss": 0.0078, "step": 235330 }, { "epoch": 1.19, "learning_rate": 0.00012190191260828107, "loss": 0.0085, "step": 235340 }, { "epoch": 1.19, "learning_rate": 0.00012189434491526707, "loss": 0.0103, "step": 235350 }, { "epoch": 1.19, "learning_rate": 0.00012188677722225303, "loss": 0.008, "step": 235360 }, { "epoch": 1.19, "learning_rate": 0.00012187920952923903, "loss": 0.0074, "step": 235370 }, { "epoch": 1.19, "learning_rate": 0.00012187164183622501, "loss": 0.0074, "step": 235380 }, { "epoch": 1.19, "learning_rate": 0.000121864074143211, "loss": 0.0115, "step": 235390 }, { "epoch": 1.19, "learning_rate": 0.000121856506450197, "loss": 0.01, "step": 235400 }, { "epoch": 1.19, "learning_rate": 0.00012184893875718298, "loss": 0.008, "step": 235410 }, { "epoch": 1.19, "learning_rate": 0.00012184137106416898, "loss": 0.0076, "step": 235420 }, { "epoch": 1.19, "learning_rate": 0.00012183380337115497, "loss": 0.0083, "step": 235430 }, { "epoch": 1.19, "learning_rate": 0.00012182623567814095, "loss": 0.0069, "step": 235440 }, { "epoch": 1.19, "learning_rate": 0.00012181866798512695, "loss": 0.0111, "step": 235450 }, { "epoch": 1.19, "learning_rate": 0.00012181110029211293, "loss": 0.0087, "step": 235460 }, { "epoch": 1.19, "learning_rate": 0.00012180353259909892, "loss": 0.0099, "step": 235470 }, { "epoch": 1.19, "learning_rate": 0.00012179596490608492, "loss": 0.0103, "step": 235480 }, { "epoch": 1.19, "learning_rate": 0.0001217883972130709, "loss": 0.0076, "step": 235490 }, { "epoch": 1.19, "learning_rate": 0.0001217808295200569, "loss": 0.011, "step": 235500 }, { "epoch": 1.19, "learning_rate": 0.00012177326182704289, "loss": 0.0087, "step": 235510 }, { "epoch": 1.19, "learning_rate": 0.00012176569413402887, "loss": 0.01, "step": 235520 }, { "epoch": 1.19, "learning_rate": 0.00012175812644101487, "loss": 0.0119, "step": 235530 }, { "epoch": 1.19, "learning_rate": 0.00012175055874800085, "loss": 0.0106, "step": 235540 }, { "epoch": 1.19, "learning_rate": 0.00012174299105498684, "loss": 0.0085, "step": 235550 }, { "epoch": 1.19, "learning_rate": 0.00012173542336197284, "loss": 0.0083, "step": 235560 }, { "epoch": 1.19, "learning_rate": 0.00012172785566895882, "loss": 0.0087, "step": 235570 }, { "epoch": 1.19, "learning_rate": 0.00012172028797594481, "loss": 0.0065, "step": 235580 }, { "epoch": 1.19, "learning_rate": 0.00012171272028293081, "loss": 0.0102, "step": 235590 }, { "epoch": 1.19, "learning_rate": 0.00012170515258991679, "loss": 0.0092, "step": 235600 }, { "epoch": 1.19, "learning_rate": 0.00012169758489690279, "loss": 0.0089, "step": 235610 }, { "epoch": 1.19, "learning_rate": 0.00012169001720388877, "loss": 0.0097, "step": 235620 }, { "epoch": 1.19, "learning_rate": 0.00012168244951087476, "loss": 0.0092, "step": 235630 }, { "epoch": 1.19, "learning_rate": 0.00012167488181786076, "loss": 0.0095, "step": 235640 }, { "epoch": 1.19, "learning_rate": 0.00012166731412484674, "loss": 0.0089, "step": 235650 }, { "epoch": 1.19, "learning_rate": 0.00012165974643183273, "loss": 0.0076, "step": 235660 }, { "epoch": 1.19, "learning_rate": 0.00012165217873881873, "loss": 0.0089, "step": 235670 }, { "epoch": 1.19, "learning_rate": 0.00012164461104580471, "loss": 0.0101, "step": 235680 }, { "epoch": 1.19, "learning_rate": 0.0001216370433527907, "loss": 0.0102, "step": 235690 }, { "epoch": 1.19, "learning_rate": 0.00012162947565977669, "loss": 0.0073, "step": 235700 }, { "epoch": 1.19, "learning_rate": 0.00012162190796676268, "loss": 0.0111, "step": 235710 }, { "epoch": 1.19, "learning_rate": 0.00012161434027374868, "loss": 0.0104, "step": 235720 }, { "epoch": 1.19, "learning_rate": 0.00012160677258073466, "loss": 0.0076, "step": 235730 }, { "epoch": 1.19, "learning_rate": 0.00012159920488772065, "loss": 0.0099, "step": 235740 }, { "epoch": 1.19, "learning_rate": 0.00012159163719470665, "loss": 0.0097, "step": 235750 }, { "epoch": 1.19, "learning_rate": 0.00012158406950169263, "loss": 0.0108, "step": 235760 }, { "epoch": 1.19, "learning_rate": 0.00012157650180867862, "loss": 0.0102, "step": 235770 }, { "epoch": 1.19, "learning_rate": 0.0001215689341156646, "loss": 0.0076, "step": 235780 }, { "epoch": 1.19, "learning_rate": 0.0001215613664226506, "loss": 0.0079, "step": 235790 }, { "epoch": 1.19, "learning_rate": 0.0001215537987296366, "loss": 0.0084, "step": 235800 }, { "epoch": 1.19, "learning_rate": 0.00012154623103662258, "loss": 0.0086, "step": 235810 }, { "epoch": 1.19, "learning_rate": 0.00012153866334360857, "loss": 0.0099, "step": 235820 }, { "epoch": 1.19, "learning_rate": 0.00012153109565059457, "loss": 0.0096, "step": 235830 }, { "epoch": 1.19, "learning_rate": 0.00012152352795758055, "loss": 0.0077, "step": 235840 }, { "epoch": 1.19, "learning_rate": 0.00012151596026456654, "loss": 0.0094, "step": 235850 }, { "epoch": 1.19, "learning_rate": 0.00012150839257155253, "loss": 0.0099, "step": 235860 }, { "epoch": 1.19, "learning_rate": 0.00012150082487853852, "loss": 0.0109, "step": 235870 }, { "epoch": 1.19, "learning_rate": 0.00012149325718552452, "loss": 0.0102, "step": 235880 }, { "epoch": 1.19, "learning_rate": 0.0001214856894925105, "loss": 0.0093, "step": 235890 }, { "epoch": 1.19, "learning_rate": 0.00012147812179949649, "loss": 0.0101, "step": 235900 }, { "epoch": 1.19, "learning_rate": 0.00012147055410648249, "loss": 0.0096, "step": 235910 }, { "epoch": 1.19, "learning_rate": 0.00012146298641346847, "loss": 0.0116, "step": 235920 }, { "epoch": 1.19, "learning_rate": 0.00012145541872045446, "loss": 0.008, "step": 235930 }, { "epoch": 1.19, "learning_rate": 0.00012144785102744046, "loss": 0.0091, "step": 235940 }, { "epoch": 1.19, "learning_rate": 0.00012144028333442644, "loss": 0.0081, "step": 235950 }, { "epoch": 1.19, "learning_rate": 0.00012143271564141243, "loss": 0.0084, "step": 235960 }, { "epoch": 1.19, "learning_rate": 0.00012142514794839842, "loss": 0.0083, "step": 235970 }, { "epoch": 1.19, "learning_rate": 0.00012141758025538441, "loss": 0.0092, "step": 235980 }, { "epoch": 1.19, "learning_rate": 0.00012141001256237038, "loss": 0.0095, "step": 235990 }, { "epoch": 1.19, "learning_rate": 0.00012140244486935637, "loss": 0.0086, "step": 236000 }, { "epoch": 1.19, "eval_cer": 0.9144469663961525, "eval_loss": 0.0067824204452335835, "eval_runtime": 116.0471, "eval_samples_per_second": 17.234, "eval_steps_per_second": 4.309, "step": 236000 }, { "epoch": 1.19, "learning_rate": 0.00012139487717634237, "loss": 0.0095, "step": 236010 }, { "epoch": 1.19, "learning_rate": 0.00012138730948332835, "loss": 0.0084, "step": 236020 }, { "epoch": 1.19, "learning_rate": 0.00012137974179031435, "loss": 0.0092, "step": 236030 }, { "epoch": 1.19, "learning_rate": 0.00012137217409730034, "loss": 0.0083, "step": 236040 }, { "epoch": 1.19, "learning_rate": 0.00012136460640428632, "loss": 0.0062, "step": 236050 }, { "epoch": 1.19, "learning_rate": 0.00012135703871127232, "loss": 0.0106, "step": 236060 }, { "epoch": 1.19, "learning_rate": 0.0001213494710182583, "loss": 0.0077, "step": 236070 }, { "epoch": 1.19, "learning_rate": 0.00012134190332524429, "loss": 0.008, "step": 236080 }, { "epoch": 1.19, "learning_rate": 0.00012133433563223029, "loss": 0.0079, "step": 236090 }, { "epoch": 1.19, "learning_rate": 0.00012132676793921627, "loss": 0.0077, "step": 236100 }, { "epoch": 1.19, "learning_rate": 0.00012131920024620226, "loss": 0.008, "step": 236110 }, { "epoch": 1.19, "learning_rate": 0.00012131163255318826, "loss": 0.0112, "step": 236120 }, { "epoch": 1.19, "learning_rate": 0.00012130406486017424, "loss": 0.0098, "step": 236130 }, { "epoch": 1.19, "learning_rate": 0.00012129649716716024, "loss": 0.0091, "step": 236140 }, { "epoch": 1.19, "learning_rate": 0.00012128892947414622, "loss": 0.0088, "step": 236150 }, { "epoch": 1.19, "learning_rate": 0.00012128136178113221, "loss": 0.0092, "step": 236160 }, { "epoch": 1.19, "learning_rate": 0.00012127379408811821, "loss": 0.0089, "step": 236170 }, { "epoch": 1.19, "learning_rate": 0.00012126622639510419, "loss": 0.009, "step": 236180 }, { "epoch": 1.19, "learning_rate": 0.00012125865870209018, "loss": 0.0077, "step": 236190 }, { "epoch": 1.19, "learning_rate": 0.00012125109100907618, "loss": 0.0105, "step": 236200 }, { "epoch": 1.19, "learning_rate": 0.00012124352331606216, "loss": 0.0112, "step": 236210 }, { "epoch": 1.19, "learning_rate": 0.00012123595562304816, "loss": 0.0075, "step": 236220 }, { "epoch": 1.19, "learning_rate": 0.00012122838793003414, "loss": 0.0082, "step": 236230 }, { "epoch": 1.19, "learning_rate": 0.00012122082023702013, "loss": 0.0091, "step": 236240 }, { "epoch": 1.19, "learning_rate": 0.00012121325254400613, "loss": 0.009, "step": 236250 }, { "epoch": 1.19, "learning_rate": 0.00012120568485099211, "loss": 0.0099, "step": 236260 }, { "epoch": 1.19, "learning_rate": 0.0001211981171579781, "loss": 0.0083, "step": 236270 }, { "epoch": 1.19, "learning_rate": 0.0001211905494649641, "loss": 0.0066, "step": 236280 }, { "epoch": 1.19, "learning_rate": 0.00012118298177195008, "loss": 0.0072, "step": 236290 }, { "epoch": 1.19, "learning_rate": 0.00012117541407893607, "loss": 0.0096, "step": 236300 }, { "epoch": 1.19, "learning_rate": 0.00012116784638592206, "loss": 0.0085, "step": 236310 }, { "epoch": 1.19, "learning_rate": 0.00012116027869290805, "loss": 0.0092, "step": 236320 }, { "epoch": 1.19, "learning_rate": 0.00012115271099989405, "loss": 0.0091, "step": 236330 }, { "epoch": 1.19, "learning_rate": 0.00012114514330688003, "loss": 0.0081, "step": 236340 }, { "epoch": 1.19, "learning_rate": 0.00012113757561386602, "loss": 0.0088, "step": 236350 }, { "epoch": 1.19, "learning_rate": 0.00012113000792085202, "loss": 0.0112, "step": 236360 }, { "epoch": 1.19, "learning_rate": 0.000121122440227838, "loss": 0.0093, "step": 236370 }, { "epoch": 1.19, "learning_rate": 0.000121114872534824, "loss": 0.0099, "step": 236380 }, { "epoch": 1.19, "learning_rate": 0.00012110730484180999, "loss": 0.008, "step": 236390 }, { "epoch": 1.19, "learning_rate": 0.00012109973714879597, "loss": 0.0097, "step": 236400 }, { "epoch": 1.19, "learning_rate": 0.00012109216945578197, "loss": 0.01, "step": 236410 }, { "epoch": 1.19, "learning_rate": 0.00012108460176276795, "loss": 0.0091, "step": 236420 }, { "epoch": 1.19, "learning_rate": 0.00012107703406975394, "loss": 0.0103, "step": 236430 }, { "epoch": 1.19, "learning_rate": 0.00012106946637673994, "loss": 0.0086, "step": 236440 }, { "epoch": 1.19, "learning_rate": 0.00012106189868372592, "loss": 0.01, "step": 236450 }, { "epoch": 1.19, "learning_rate": 0.00012105433099071191, "loss": 0.0099, "step": 236460 }, { "epoch": 1.19, "learning_rate": 0.00012104676329769791, "loss": 0.0085, "step": 236470 }, { "epoch": 1.19, "learning_rate": 0.00012103919560468389, "loss": 0.0087, "step": 236480 }, { "epoch": 1.19, "learning_rate": 0.00012103162791166988, "loss": 0.0097, "step": 236490 }, { "epoch": 1.19, "learning_rate": 0.00012102406021865587, "loss": 0.0094, "step": 236500 }, { "epoch": 1.19, "learning_rate": 0.00012101649252564186, "loss": 0.0103, "step": 236510 }, { "epoch": 1.19, "learning_rate": 0.00012100892483262786, "loss": 0.0099, "step": 236520 }, { "epoch": 1.19, "learning_rate": 0.00012100135713961384, "loss": 0.0103, "step": 236530 }, { "epoch": 1.19, "learning_rate": 0.00012099378944659983, "loss": 0.0081, "step": 236540 }, { "epoch": 1.19, "learning_rate": 0.00012098622175358583, "loss": 0.0068, "step": 236550 }, { "epoch": 1.19, "learning_rate": 0.00012097865406057181, "loss": 0.0097, "step": 236560 }, { "epoch": 1.19, "learning_rate": 0.0001209710863675578, "loss": 0.0074, "step": 236570 }, { "epoch": 1.19, "learning_rate": 0.00012096351867454379, "loss": 0.0062, "step": 236580 }, { "epoch": 1.19, "learning_rate": 0.00012095595098152978, "loss": 0.0097, "step": 236590 }, { "epoch": 1.19, "learning_rate": 0.00012094838328851578, "loss": 0.0089, "step": 236600 }, { "epoch": 1.19, "learning_rate": 0.00012094081559550174, "loss": 0.0083, "step": 236610 }, { "epoch": 1.19, "learning_rate": 0.00012093324790248774, "loss": 0.0087, "step": 236620 }, { "epoch": 1.19, "learning_rate": 0.00012092568020947372, "loss": 0.0095, "step": 236630 }, { "epoch": 1.19, "learning_rate": 0.00012091811251645971, "loss": 0.0083, "step": 236640 }, { "epoch": 1.19, "learning_rate": 0.00012091054482344571, "loss": 0.0109, "step": 236650 }, { "epoch": 1.19, "learning_rate": 0.00012090297713043169, "loss": 0.008, "step": 236660 }, { "epoch": 1.19, "learning_rate": 0.00012089540943741769, "loss": 0.0095, "step": 236670 }, { "epoch": 1.19, "learning_rate": 0.00012088784174440367, "loss": 0.0082, "step": 236680 }, { "epoch": 1.19, "learning_rate": 0.00012088027405138966, "loss": 0.0108, "step": 236690 }, { "epoch": 1.19, "learning_rate": 0.00012087270635837566, "loss": 0.0072, "step": 236700 }, { "epoch": 1.19, "learning_rate": 0.00012086513866536164, "loss": 0.0085, "step": 236710 }, { "epoch": 1.19, "learning_rate": 0.00012085757097234763, "loss": 0.0084, "step": 236720 }, { "epoch": 1.19, "learning_rate": 0.00012085000327933363, "loss": 0.0116, "step": 236730 }, { "epoch": 1.19, "learning_rate": 0.00012084243558631961, "loss": 0.0098, "step": 236740 }, { "epoch": 1.19, "learning_rate": 0.0001208348678933056, "loss": 0.0089, "step": 236750 }, { "epoch": 1.19, "learning_rate": 0.00012082730020029159, "loss": 0.0076, "step": 236760 }, { "epoch": 1.19, "learning_rate": 0.00012081973250727758, "loss": 0.009, "step": 236770 }, { "epoch": 1.19, "learning_rate": 0.00012081216481426358, "loss": 0.0076, "step": 236780 }, { "epoch": 1.19, "learning_rate": 0.00012080459712124956, "loss": 0.0076, "step": 236790 }, { "epoch": 1.19, "learning_rate": 0.00012079702942823555, "loss": 0.0078, "step": 236800 }, { "epoch": 1.19, "learning_rate": 0.00012078946173522155, "loss": 0.0102, "step": 236810 }, { "epoch": 1.19, "learning_rate": 0.00012078189404220753, "loss": 0.0106, "step": 236820 }, { "epoch": 1.19, "learning_rate": 0.00012077432634919352, "loss": 0.0089, "step": 236830 }, { "epoch": 1.19, "learning_rate": 0.00012076675865617952, "loss": 0.0093, "step": 236840 }, { "epoch": 1.19, "learning_rate": 0.0001207591909631655, "loss": 0.0079, "step": 236850 }, { "epoch": 1.19, "learning_rate": 0.0001207516232701515, "loss": 0.0105, "step": 236860 }, { "epoch": 1.2, "learning_rate": 0.00012074405557713748, "loss": 0.0109, "step": 236870 }, { "epoch": 1.2, "learning_rate": 0.00012073648788412347, "loss": 0.0144, "step": 236880 }, { "epoch": 1.2, "learning_rate": 0.00012072892019110947, "loss": 0.0087, "step": 236890 }, { "epoch": 1.2, "learning_rate": 0.00012072135249809545, "loss": 0.0086, "step": 236900 }, { "epoch": 1.2, "learning_rate": 0.00012071378480508144, "loss": 0.0076, "step": 236910 }, { "epoch": 1.2, "learning_rate": 0.00012070621711206744, "loss": 0.0099, "step": 236920 }, { "epoch": 1.2, "learning_rate": 0.00012069864941905342, "loss": 0.0101, "step": 236930 }, { "epoch": 1.2, "learning_rate": 0.00012069108172603942, "loss": 0.008, "step": 236940 }, { "epoch": 1.2, "learning_rate": 0.0001206835140330254, "loss": 0.0107, "step": 236950 }, { "epoch": 1.2, "learning_rate": 0.00012067594634001139, "loss": 0.009, "step": 236960 }, { "epoch": 1.2, "learning_rate": 0.00012066837864699739, "loss": 0.0087, "step": 236970 }, { "epoch": 1.2, "learning_rate": 0.00012066081095398337, "loss": 0.009, "step": 236980 }, { "epoch": 1.2, "learning_rate": 0.00012065324326096936, "loss": 0.008, "step": 236990 }, { "epoch": 1.2, "learning_rate": 0.00012064567556795536, "loss": 0.0089, "step": 237000 }, { "epoch": 1.2, "eval_cer": 0.9144498775845288, "eval_loss": 0.006527193821966648, "eval_runtime": 116.0102, "eval_samples_per_second": 17.24, "eval_steps_per_second": 4.31, "step": 237000 }, { "epoch": 1.2, "learning_rate": 0.00012063810787494134, "loss": 0.0077, "step": 237010 }, { "epoch": 1.2, "learning_rate": 0.00012063054018192733, "loss": 0.0088, "step": 237020 }, { "epoch": 1.2, "learning_rate": 0.00012062297248891332, "loss": 0.0082, "step": 237030 }, { "epoch": 1.2, "learning_rate": 0.00012061540479589931, "loss": 0.0078, "step": 237040 }, { "epoch": 1.2, "learning_rate": 0.0001206078371028853, "loss": 0.0085, "step": 237050 }, { "epoch": 1.2, "learning_rate": 0.00012060026940987129, "loss": 0.0078, "step": 237060 }, { "epoch": 1.2, "learning_rate": 0.00012059270171685728, "loss": 0.0082, "step": 237070 }, { "epoch": 1.2, "learning_rate": 0.00012058513402384328, "loss": 0.009, "step": 237080 }, { "epoch": 1.2, "learning_rate": 0.00012057756633082926, "loss": 0.0074, "step": 237090 }, { "epoch": 1.2, "learning_rate": 0.00012056999863781525, "loss": 0.0083, "step": 237100 }, { "epoch": 1.2, "learning_rate": 0.00012056243094480124, "loss": 0.0088, "step": 237110 }, { "epoch": 1.2, "learning_rate": 0.00012055486325178723, "loss": 0.0087, "step": 237120 }, { "epoch": 1.2, "learning_rate": 0.00012054729555877323, "loss": 0.0056, "step": 237130 }, { "epoch": 1.2, "learning_rate": 0.00012053972786575921, "loss": 0.0098, "step": 237140 }, { "epoch": 1.2, "learning_rate": 0.0001205321601727452, "loss": 0.0074, "step": 237150 }, { "epoch": 1.2, "learning_rate": 0.0001205245924797312, "loss": 0.01, "step": 237160 }, { "epoch": 1.2, "learning_rate": 0.00012051702478671718, "loss": 0.0059, "step": 237170 }, { "epoch": 1.2, "learning_rate": 0.00012050945709370317, "loss": 0.0088, "step": 237180 }, { "epoch": 1.2, "learning_rate": 0.00012050188940068915, "loss": 0.0105, "step": 237190 }, { "epoch": 1.2, "learning_rate": 0.00012049432170767515, "loss": 0.0096, "step": 237200 }, { "epoch": 1.2, "learning_rate": 0.00012048675401466114, "loss": 0.0077, "step": 237210 }, { "epoch": 1.2, "learning_rate": 0.00012047918632164713, "loss": 0.0107, "step": 237220 }, { "epoch": 1.2, "learning_rate": 0.00012047161862863312, "loss": 0.0078, "step": 237230 }, { "epoch": 1.2, "learning_rate": 0.00012046405093561909, "loss": 0.0099, "step": 237240 }, { "epoch": 1.2, "learning_rate": 0.00012045648324260508, "loss": 0.0119, "step": 237250 }, { "epoch": 1.2, "learning_rate": 0.00012044891554959108, "loss": 0.0108, "step": 237260 }, { "epoch": 1.2, "learning_rate": 0.00012044134785657706, "loss": 0.0089, "step": 237270 }, { "epoch": 1.2, "learning_rate": 0.00012043378016356306, "loss": 0.0096, "step": 237280 }, { "epoch": 1.2, "learning_rate": 0.00012042621247054905, "loss": 0.0081, "step": 237290 }, { "epoch": 1.2, "learning_rate": 0.00012041864477753503, "loss": 0.0121, "step": 237300 }, { "epoch": 1.2, "learning_rate": 0.00012041107708452103, "loss": 0.0133, "step": 237310 }, { "epoch": 1.2, "learning_rate": 0.00012040350939150701, "loss": 0.0095, "step": 237320 }, { "epoch": 1.2, "learning_rate": 0.000120395941698493, "loss": 0.0087, "step": 237330 }, { "epoch": 1.2, "learning_rate": 0.000120388374005479, "loss": 0.0082, "step": 237340 }, { "epoch": 1.2, "learning_rate": 0.00012038080631246498, "loss": 0.0112, "step": 237350 }, { "epoch": 1.2, "learning_rate": 0.00012037323861945097, "loss": 0.0075, "step": 237360 }, { "epoch": 1.2, "learning_rate": 0.00012036567092643697, "loss": 0.0113, "step": 237370 }, { "epoch": 1.2, "learning_rate": 0.00012035810323342295, "loss": 0.0089, "step": 237380 }, { "epoch": 1.2, "learning_rate": 0.00012035053554040895, "loss": 0.0094, "step": 237390 }, { "epoch": 1.2, "learning_rate": 0.00012034296784739493, "loss": 0.0082, "step": 237400 }, { "epoch": 1.2, "learning_rate": 0.00012033540015438092, "loss": 0.0079, "step": 237410 }, { "epoch": 1.2, "learning_rate": 0.00012032783246136692, "loss": 0.0073, "step": 237420 }, { "epoch": 1.2, "learning_rate": 0.0001203202647683529, "loss": 0.0091, "step": 237430 }, { "epoch": 1.2, "learning_rate": 0.0001203126970753389, "loss": 0.0102, "step": 237440 }, { "epoch": 1.2, "learning_rate": 0.00012030512938232489, "loss": 0.0109, "step": 237450 }, { "epoch": 1.2, "learning_rate": 0.00012029756168931087, "loss": 0.0104, "step": 237460 }, { "epoch": 1.2, "learning_rate": 0.00012028999399629687, "loss": 0.0095, "step": 237470 }, { "epoch": 1.2, "learning_rate": 0.00012028242630328285, "loss": 0.0079, "step": 237480 }, { "epoch": 1.2, "learning_rate": 0.00012027485861026884, "loss": 0.0082, "step": 237490 }, { "epoch": 1.2, "learning_rate": 0.00012026729091725484, "loss": 0.0116, "step": 237500 }, { "epoch": 1.2, "learning_rate": 0.00012025972322424082, "loss": 0.008, "step": 237510 }, { "epoch": 1.2, "learning_rate": 0.00012025215553122681, "loss": 0.0079, "step": 237520 }, { "epoch": 1.2, "learning_rate": 0.00012024458783821281, "loss": 0.0075, "step": 237530 }, { "epoch": 1.2, "learning_rate": 0.00012023702014519879, "loss": 0.0077, "step": 237540 }, { "epoch": 1.2, "learning_rate": 0.00012022945245218478, "loss": 0.0101, "step": 237550 }, { "epoch": 1.2, "learning_rate": 0.00012022188475917077, "loss": 0.0086, "step": 237560 }, { "epoch": 1.2, "learning_rate": 0.00012021431706615676, "loss": 0.0096, "step": 237570 }, { "epoch": 1.2, "learning_rate": 0.00012020674937314276, "loss": 0.0081, "step": 237580 }, { "epoch": 1.2, "learning_rate": 0.00012019918168012874, "loss": 0.008, "step": 237590 }, { "epoch": 1.2, "learning_rate": 0.00012019161398711473, "loss": 0.0087, "step": 237600 }, { "epoch": 1.2, "learning_rate": 0.00012018404629410073, "loss": 0.0089, "step": 237610 }, { "epoch": 1.2, "learning_rate": 0.00012017647860108671, "loss": 0.0107, "step": 237620 }, { "epoch": 1.2, "learning_rate": 0.0001201689109080727, "loss": 0.0099, "step": 237630 }, { "epoch": 1.2, "learning_rate": 0.00012016134321505869, "loss": 0.0073, "step": 237640 }, { "epoch": 1.2, "learning_rate": 0.00012015377552204468, "loss": 0.0076, "step": 237650 }, { "epoch": 1.2, "learning_rate": 0.00012014620782903068, "loss": 0.0096, "step": 237660 }, { "epoch": 1.2, "learning_rate": 0.00012013864013601666, "loss": 0.0088, "step": 237670 }, { "epoch": 1.2, "learning_rate": 0.00012013107244300265, "loss": 0.0068, "step": 237680 }, { "epoch": 1.2, "learning_rate": 0.00012012350474998865, "loss": 0.0092, "step": 237690 }, { "epoch": 1.2, "learning_rate": 0.00012011593705697463, "loss": 0.0114, "step": 237700 }, { "epoch": 1.2, "learning_rate": 0.00012010836936396062, "loss": 0.0086, "step": 237710 }, { "epoch": 1.2, "learning_rate": 0.0001201008016709466, "loss": 0.0068, "step": 237720 }, { "epoch": 1.2, "learning_rate": 0.0001200932339779326, "loss": 0.0136, "step": 237730 }, { "epoch": 1.2, "learning_rate": 0.0001200856662849186, "loss": 0.0099, "step": 237740 }, { "epoch": 1.2, "learning_rate": 0.00012007809859190458, "loss": 0.0104, "step": 237750 }, { "epoch": 1.2, "learning_rate": 0.00012007053089889057, "loss": 0.0075, "step": 237760 }, { "epoch": 1.2, "learning_rate": 0.00012006296320587657, "loss": 0.0079, "step": 237770 }, { "epoch": 1.2, "learning_rate": 0.00012005539551286255, "loss": 0.01, "step": 237780 }, { "epoch": 1.2, "learning_rate": 0.00012004782781984854, "loss": 0.0095, "step": 237790 }, { "epoch": 1.2, "learning_rate": 0.00012004026012683452, "loss": 0.0083, "step": 237800 }, { "epoch": 1.2, "learning_rate": 0.00012003269243382052, "loss": 0.0081, "step": 237810 }, { "epoch": 1.2, "learning_rate": 0.00012002512474080651, "loss": 0.009, "step": 237820 }, { "epoch": 1.2, "learning_rate": 0.0001200175570477925, "loss": 0.0106, "step": 237830 }, { "epoch": 1.2, "learning_rate": 0.00012000998935477849, "loss": 0.0073, "step": 237840 }, { "epoch": 1.2, "learning_rate": 0.00012000242166176449, "loss": 0.0096, "step": 237850 }, { "epoch": 1.2, "learning_rate": 0.00011999485396875047, "loss": 0.0091, "step": 237860 }, { "epoch": 1.2, "learning_rate": 0.00011998728627573645, "loss": 0.0076, "step": 237870 }, { "epoch": 1.2, "learning_rate": 0.00011997971858272243, "loss": 0.0106, "step": 237880 }, { "epoch": 1.2, "learning_rate": 0.00011997215088970843, "loss": 0.0086, "step": 237890 }, { "epoch": 1.2, "learning_rate": 0.00011996458319669442, "loss": 0.0106, "step": 237900 }, { "epoch": 1.2, "learning_rate": 0.0001199570155036804, "loss": 0.0089, "step": 237910 }, { "epoch": 1.2, "learning_rate": 0.0001199494478106664, "loss": 0.0094, "step": 237920 }, { "epoch": 1.2, "learning_rate": 0.00011994188011765238, "loss": 0.0085, "step": 237930 }, { "epoch": 1.2, "learning_rate": 0.00011993431242463837, "loss": 0.0084, "step": 237940 }, { "epoch": 1.2, "learning_rate": 0.00011992674473162437, "loss": 0.0087, "step": 237950 }, { "epoch": 1.2, "learning_rate": 0.00011991917703861035, "loss": 0.0086, "step": 237960 }, { "epoch": 1.2, "learning_rate": 0.00011991160934559634, "loss": 0.0083, "step": 237970 }, { "epoch": 1.2, "learning_rate": 0.00011990404165258234, "loss": 0.0088, "step": 237980 }, { "epoch": 1.2, "learning_rate": 0.00011989647395956832, "loss": 0.0099, "step": 237990 }, { "epoch": 1.2, "learning_rate": 0.00011988890626655432, "loss": 0.0077, "step": 238000 }, { "epoch": 1.2, "eval_cer": 0.9144586111496574, "eval_loss": 0.006760002113878727, "eval_runtime": 116.0385, "eval_samples_per_second": 17.236, "eval_steps_per_second": 4.309, "step": 238000 }, { "epoch": 1.2, "learning_rate": 0.0001198813385735403, "loss": 0.0085, "step": 238010 }, { "epoch": 1.2, "learning_rate": 0.00011987377088052629, "loss": 0.0084, "step": 238020 }, { "epoch": 1.2, "learning_rate": 0.00011986620318751229, "loss": 0.0085, "step": 238030 }, { "epoch": 1.2, "learning_rate": 0.00011985863549449827, "loss": 0.0106, "step": 238040 }, { "epoch": 1.2, "learning_rate": 0.00011985106780148426, "loss": 0.0088, "step": 238050 }, { "epoch": 1.2, "learning_rate": 0.00011984350010847026, "loss": 0.0071, "step": 238060 }, { "epoch": 1.2, "learning_rate": 0.00011983593241545624, "loss": 0.0094, "step": 238070 }, { "epoch": 1.2, "learning_rate": 0.00011982836472244224, "loss": 0.0105, "step": 238080 }, { "epoch": 1.2, "learning_rate": 0.00011982079702942822, "loss": 0.0102, "step": 238090 }, { "epoch": 1.2, "learning_rate": 0.00011981322933641421, "loss": 0.0075, "step": 238100 }, { "epoch": 1.2, "learning_rate": 0.0001198056616434002, "loss": 0.0087, "step": 238110 }, { "epoch": 1.2, "learning_rate": 0.00011979809395038619, "loss": 0.009, "step": 238120 }, { "epoch": 1.2, "learning_rate": 0.00011979052625737218, "loss": 0.0088, "step": 238130 }, { "epoch": 1.2, "learning_rate": 0.00011978295856435818, "loss": 0.0101, "step": 238140 }, { "epoch": 1.2, "learning_rate": 0.00011977539087134416, "loss": 0.0115, "step": 238150 }, { "epoch": 1.2, "learning_rate": 0.00011976782317833015, "loss": 0.0093, "step": 238160 }, { "epoch": 1.2, "learning_rate": 0.00011976025548531614, "loss": 0.0112, "step": 238170 }, { "epoch": 1.2, "learning_rate": 0.00011975268779230213, "loss": 0.0084, "step": 238180 }, { "epoch": 1.2, "learning_rate": 0.00011974512009928813, "loss": 0.0089, "step": 238190 }, { "epoch": 1.2, "learning_rate": 0.00011973755240627411, "loss": 0.0079, "step": 238200 }, { "epoch": 1.2, "learning_rate": 0.0001197299847132601, "loss": 0.0084, "step": 238210 }, { "epoch": 1.2, "learning_rate": 0.0001197224170202461, "loss": 0.0092, "step": 238220 }, { "epoch": 1.2, "learning_rate": 0.00011971484932723208, "loss": 0.0074, "step": 238230 }, { "epoch": 1.2, "learning_rate": 0.00011970728163421807, "loss": 0.0086, "step": 238240 }, { "epoch": 1.2, "learning_rate": 0.00011969971394120406, "loss": 0.0086, "step": 238250 }, { "epoch": 1.2, "learning_rate": 0.00011969214624819005, "loss": 0.0078, "step": 238260 }, { "epoch": 1.2, "learning_rate": 0.00011968457855517605, "loss": 0.0092, "step": 238270 }, { "epoch": 1.2, "learning_rate": 0.00011967701086216203, "loss": 0.0085, "step": 238280 }, { "epoch": 1.2, "learning_rate": 0.00011966944316914802, "loss": 0.0106, "step": 238290 }, { "epoch": 1.2, "learning_rate": 0.00011966187547613402, "loss": 0.0075, "step": 238300 }, { "epoch": 1.2, "learning_rate": 0.00011965430778312, "loss": 0.0098, "step": 238310 }, { "epoch": 1.2, "learning_rate": 0.00011964674009010599, "loss": 0.0083, "step": 238320 }, { "epoch": 1.2, "learning_rate": 0.00011963917239709199, "loss": 0.0078, "step": 238330 }, { "epoch": 1.2, "learning_rate": 0.00011963160470407797, "loss": 0.0074, "step": 238340 }, { "epoch": 1.2, "learning_rate": 0.00011962403701106396, "loss": 0.0089, "step": 238350 }, { "epoch": 1.2, "learning_rate": 0.00011961646931804995, "loss": 0.0101, "step": 238360 }, { "epoch": 1.2, "learning_rate": 0.00011960890162503594, "loss": 0.0079, "step": 238370 }, { "epoch": 1.2, "learning_rate": 0.00011960133393202194, "loss": 0.0082, "step": 238380 }, { "epoch": 1.2, "learning_rate": 0.00011959376623900792, "loss": 0.0094, "step": 238390 }, { "epoch": 1.2, "learning_rate": 0.00011958619854599391, "loss": 0.009, "step": 238400 }, { "epoch": 1.2, "learning_rate": 0.00011957863085297991, "loss": 0.01, "step": 238410 }, { "epoch": 1.2, "learning_rate": 0.00011957106315996589, "loss": 0.0107, "step": 238420 }, { "epoch": 1.2, "learning_rate": 0.00011956349546695188, "loss": 0.0081, "step": 238430 }, { "epoch": 1.2, "learning_rate": 0.00011955592777393787, "loss": 0.0084, "step": 238440 }, { "epoch": 1.2, "learning_rate": 0.00011954836008092386, "loss": 0.0084, "step": 238450 }, { "epoch": 1.2, "learning_rate": 0.00011954079238790986, "loss": 0.0076, "step": 238460 }, { "epoch": 1.2, "learning_rate": 0.00011953322469489584, "loss": 0.0066, "step": 238470 }, { "epoch": 1.2, "learning_rate": 0.00011952565700188183, "loss": 0.0095, "step": 238480 }, { "epoch": 1.2, "learning_rate": 0.00011951808930886783, "loss": 0.0117, "step": 238490 }, { "epoch": 1.2, "learning_rate": 0.0001195105216158538, "loss": 0.0088, "step": 238500 }, { "epoch": 1.2, "learning_rate": 0.00011950295392283979, "loss": 0.0094, "step": 238510 }, { "epoch": 1.2, "learning_rate": 0.00011949538622982577, "loss": 0.008, "step": 238520 }, { "epoch": 1.2, "learning_rate": 0.00011948781853681177, "loss": 0.0072, "step": 238530 }, { "epoch": 1.2, "learning_rate": 0.00011948025084379775, "loss": 0.0093, "step": 238540 }, { "epoch": 1.2, "learning_rate": 0.00011947268315078374, "loss": 0.0105, "step": 238550 }, { "epoch": 1.2, "learning_rate": 0.00011946511545776974, "loss": 0.0082, "step": 238560 }, { "epoch": 1.2, "learning_rate": 0.00011945754776475572, "loss": 0.0087, "step": 238570 }, { "epoch": 1.2, "learning_rate": 0.00011944998007174171, "loss": 0.0079, "step": 238580 }, { "epoch": 1.2, "learning_rate": 0.00011944241237872771, "loss": 0.0105, "step": 238590 }, { "epoch": 1.2, "learning_rate": 0.00011943484468571369, "loss": 0.0134, "step": 238600 }, { "epoch": 1.2, "learning_rate": 0.00011942727699269969, "loss": 0.0087, "step": 238610 }, { "epoch": 1.2, "learning_rate": 0.00011941970929968567, "loss": 0.0089, "step": 238620 }, { "epoch": 1.2, "learning_rate": 0.00011941214160667166, "loss": 0.0089, "step": 238630 }, { "epoch": 1.2, "learning_rate": 0.00011940457391365766, "loss": 0.008, "step": 238640 }, { "epoch": 1.2, "learning_rate": 0.00011939700622064364, "loss": 0.0086, "step": 238650 }, { "epoch": 1.2, "learning_rate": 0.00011938943852762963, "loss": 0.006, "step": 238660 }, { "epoch": 1.2, "learning_rate": 0.00011938187083461563, "loss": 0.008, "step": 238670 }, { "epoch": 1.2, "learning_rate": 0.00011937430314160161, "loss": 0.0102, "step": 238680 }, { "epoch": 1.2, "learning_rate": 0.0001193667354485876, "loss": 0.0093, "step": 238690 }, { "epoch": 1.2, "learning_rate": 0.00011935916775557359, "loss": 0.0068, "step": 238700 }, { "epoch": 1.2, "learning_rate": 0.00011935160006255958, "loss": 0.0154, "step": 238710 }, { "epoch": 1.2, "learning_rate": 0.00011934403236954558, "loss": 0.01, "step": 238720 }, { "epoch": 1.2, "learning_rate": 0.00011933646467653156, "loss": 0.011, "step": 238730 }, { "epoch": 1.2, "learning_rate": 0.00011932889698351755, "loss": 0.014, "step": 238740 }, { "epoch": 1.2, "learning_rate": 0.00011932132929050355, "loss": 0.0096, "step": 238750 }, { "epoch": 1.2, "learning_rate": 0.00011931376159748953, "loss": 0.0136, "step": 238760 }, { "epoch": 1.2, "learning_rate": 0.00011930619390447552, "loss": 0.0114, "step": 238770 }, { "epoch": 1.2, "learning_rate": 0.00011929862621146152, "loss": 0.0117, "step": 238780 }, { "epoch": 1.2, "learning_rate": 0.0001192910585184475, "loss": 0.0094, "step": 238790 }, { "epoch": 1.2, "learning_rate": 0.0001192834908254335, "loss": 0.0101, "step": 238800 }, { "epoch": 1.2, "learning_rate": 0.00011927592313241948, "loss": 0.0109, "step": 238810 }, { "epoch": 1.2, "learning_rate": 0.00011926835543940547, "loss": 0.008, "step": 238820 }, { "epoch": 1.2, "learning_rate": 0.00011926078774639147, "loss": 0.0087, "step": 238830 }, { "epoch": 1.2, "learning_rate": 0.00011925322005337745, "loss": 0.0087, "step": 238840 }, { "epoch": 1.21, "learning_rate": 0.00011924565236036344, "loss": 0.0089, "step": 238850 }, { "epoch": 1.21, "learning_rate": 0.00011923808466734944, "loss": 0.0085, "step": 238860 }, { "epoch": 1.21, "learning_rate": 0.00011923051697433542, "loss": 0.008, "step": 238870 }, { "epoch": 1.21, "learning_rate": 0.00011922294928132141, "loss": 0.0104, "step": 238880 }, { "epoch": 1.21, "learning_rate": 0.0001192153815883074, "loss": 0.01, "step": 238890 }, { "epoch": 1.21, "learning_rate": 0.00011920781389529339, "loss": 0.0075, "step": 238900 }, { "epoch": 1.21, "learning_rate": 0.00011920024620227939, "loss": 0.0132, "step": 238910 }, { "epoch": 1.21, "learning_rate": 0.00011919267850926537, "loss": 0.0115, "step": 238920 }, { "epoch": 1.21, "learning_rate": 0.00011918511081625136, "loss": 0.0073, "step": 238930 }, { "epoch": 1.21, "learning_rate": 0.00011917754312323736, "loss": 0.0087, "step": 238940 }, { "epoch": 1.21, "learning_rate": 0.00011916997543022334, "loss": 0.0086, "step": 238950 }, { "epoch": 1.21, "learning_rate": 0.00011916240773720933, "loss": 0.0075, "step": 238960 }, { "epoch": 1.21, "learning_rate": 0.00011915484004419532, "loss": 0.01, "step": 238970 }, { "epoch": 1.21, "learning_rate": 0.00011914727235118131, "loss": 0.0095, "step": 238980 }, { "epoch": 1.21, "learning_rate": 0.0001191397046581673, "loss": 0.0074, "step": 238990 }, { "epoch": 1.21, "learning_rate": 0.00011913213696515329, "loss": 0.0104, "step": 239000 }, { "epoch": 1.21, "eval_cer": 0.914452788772905, "eval_loss": 0.006802674382925034, "eval_runtime": 116.1446, "eval_samples_per_second": 17.22, "eval_steps_per_second": 4.305, "step": 239000 }, { "epoch": 1.21, "learning_rate": 0.00011912456927213928, "loss": 0.0092, "step": 239010 }, { "epoch": 1.21, "learning_rate": 0.00011911700157912528, "loss": 0.0083, "step": 239020 }, { "epoch": 1.21, "learning_rate": 0.00011910943388611126, "loss": 0.0094, "step": 239030 }, { "epoch": 1.21, "learning_rate": 0.00011910186619309725, "loss": 0.0085, "step": 239040 }, { "epoch": 1.21, "learning_rate": 0.00011909429850008323, "loss": 0.0076, "step": 239050 }, { "epoch": 1.21, "learning_rate": 0.00011908673080706923, "loss": 0.0081, "step": 239060 }, { "epoch": 1.21, "learning_rate": 0.00011907916311405522, "loss": 0.0099, "step": 239070 }, { "epoch": 1.21, "learning_rate": 0.0001190715954210412, "loss": 0.0075, "step": 239080 }, { "epoch": 1.21, "learning_rate": 0.0001190640277280272, "loss": 0.008, "step": 239090 }, { "epoch": 1.21, "learning_rate": 0.0001190564600350132, "loss": 0.007, "step": 239100 }, { "epoch": 1.21, "learning_rate": 0.00011904889234199918, "loss": 0.008, "step": 239110 }, { "epoch": 1.21, "learning_rate": 0.00011904132464898517, "loss": 0.008, "step": 239120 }, { "epoch": 1.21, "learning_rate": 0.00011903375695597114, "loss": 0.0085, "step": 239130 }, { "epoch": 1.21, "learning_rate": 0.00011902618926295714, "loss": 0.0094, "step": 239140 }, { "epoch": 1.21, "learning_rate": 0.00011901862156994312, "loss": 0.0086, "step": 239150 }, { "epoch": 1.21, "learning_rate": 0.00011901105387692911, "loss": 0.0069, "step": 239160 }, { "epoch": 1.21, "learning_rate": 0.00011900348618391511, "loss": 0.0095, "step": 239170 }, { "epoch": 1.21, "learning_rate": 0.00011899591849090109, "loss": 0.0115, "step": 239180 }, { "epoch": 1.21, "learning_rate": 0.00011898835079788708, "loss": 0.0105, "step": 239190 }, { "epoch": 1.21, "learning_rate": 0.00011898078310487308, "loss": 0.0095, "step": 239200 }, { "epoch": 1.21, "learning_rate": 0.00011897321541185906, "loss": 0.009, "step": 239210 }, { "epoch": 1.21, "learning_rate": 0.00011896564771884505, "loss": 0.0087, "step": 239220 }, { "epoch": 1.21, "learning_rate": 0.00011895808002583105, "loss": 0.0114, "step": 239230 }, { "epoch": 1.21, "learning_rate": 0.00011895051233281703, "loss": 0.0121, "step": 239240 }, { "epoch": 1.21, "learning_rate": 0.00011894294463980303, "loss": 0.0107, "step": 239250 }, { "epoch": 1.21, "learning_rate": 0.00011893537694678901, "loss": 0.0095, "step": 239260 }, { "epoch": 1.21, "learning_rate": 0.000118927809253775, "loss": 0.01, "step": 239270 }, { "epoch": 1.21, "learning_rate": 0.000118920241560761, "loss": 0.0069, "step": 239280 }, { "epoch": 1.21, "learning_rate": 0.00011891267386774698, "loss": 0.0089, "step": 239290 }, { "epoch": 1.21, "learning_rate": 0.00011890510617473297, "loss": 0.0079, "step": 239300 }, { "epoch": 1.21, "learning_rate": 0.00011889753848171897, "loss": 0.0109, "step": 239310 }, { "epoch": 1.21, "learning_rate": 0.00011888997078870495, "loss": 0.0067, "step": 239320 }, { "epoch": 1.21, "learning_rate": 0.00011888240309569095, "loss": 0.0119, "step": 239330 }, { "epoch": 1.21, "learning_rate": 0.00011887483540267693, "loss": 0.0096, "step": 239340 }, { "epoch": 1.21, "learning_rate": 0.00011886726770966292, "loss": 0.009, "step": 239350 }, { "epoch": 1.21, "learning_rate": 0.00011885970001664892, "loss": 0.0089, "step": 239360 }, { "epoch": 1.21, "learning_rate": 0.0001188521323236349, "loss": 0.0122, "step": 239370 }, { "epoch": 1.21, "learning_rate": 0.0001188445646306209, "loss": 0.0085, "step": 239380 }, { "epoch": 1.21, "learning_rate": 0.00011883699693760689, "loss": 0.0121, "step": 239390 }, { "epoch": 1.21, "learning_rate": 0.00011882942924459287, "loss": 0.0157, "step": 239400 }, { "epoch": 1.21, "learning_rate": 0.00011882186155157886, "loss": 0.0116, "step": 239410 }, { "epoch": 1.21, "learning_rate": 0.00011881429385856485, "loss": 0.009, "step": 239420 }, { "epoch": 1.21, "learning_rate": 0.00011880672616555084, "loss": 0.008, "step": 239430 }, { "epoch": 1.21, "learning_rate": 0.00011879915847253684, "loss": 0.0129, "step": 239440 }, { "epoch": 1.21, "learning_rate": 0.00011879159077952282, "loss": 0.0101, "step": 239450 }, { "epoch": 1.21, "learning_rate": 0.00011878402308650881, "loss": 0.0082, "step": 239460 }, { "epoch": 1.21, "learning_rate": 0.00011877645539349481, "loss": 0.0088, "step": 239470 }, { "epoch": 1.21, "learning_rate": 0.00011876888770048079, "loss": 0.0076, "step": 239480 }, { "epoch": 1.21, "learning_rate": 0.00011876132000746678, "loss": 0.0095, "step": 239490 }, { "epoch": 1.21, "learning_rate": 0.00011875375231445277, "loss": 0.008, "step": 239500 }, { "epoch": 1.21, "learning_rate": 0.00011874618462143876, "loss": 0.0095, "step": 239510 }, { "epoch": 1.21, "learning_rate": 0.00011873861692842476, "loss": 0.0069, "step": 239520 }, { "epoch": 1.21, "learning_rate": 0.00011873104923541074, "loss": 0.0066, "step": 239530 }, { "epoch": 1.21, "learning_rate": 0.00011872348154239673, "loss": 0.0062, "step": 239540 }, { "epoch": 1.21, "learning_rate": 0.00011871591384938273, "loss": 0.0083, "step": 239550 }, { "epoch": 1.21, "learning_rate": 0.00011870834615636871, "loss": 0.0108, "step": 239560 }, { "epoch": 1.21, "learning_rate": 0.0001187007784633547, "loss": 0.007, "step": 239570 }, { "epoch": 1.21, "learning_rate": 0.00011869321077034068, "loss": 0.0102, "step": 239580 }, { "epoch": 1.21, "learning_rate": 0.00011868564307732668, "loss": 0.011, "step": 239590 }, { "epoch": 1.21, "learning_rate": 0.00011867807538431267, "loss": 0.0107, "step": 239600 }, { "epoch": 1.21, "learning_rate": 0.00011867050769129866, "loss": 0.0106, "step": 239610 }, { "epoch": 1.21, "learning_rate": 0.00011866293999828465, "loss": 0.0095, "step": 239620 }, { "epoch": 1.21, "learning_rate": 0.00011865537230527065, "loss": 0.0095, "step": 239630 }, { "epoch": 1.21, "learning_rate": 0.00011864780461225663, "loss": 0.0091, "step": 239640 }, { "epoch": 1.21, "learning_rate": 0.00011864023691924262, "loss": 0.0085, "step": 239650 }, { "epoch": 1.21, "learning_rate": 0.0001186326692262286, "loss": 0.0107, "step": 239660 }, { "epoch": 1.21, "learning_rate": 0.0001186251015332146, "loss": 0.0118, "step": 239670 }, { "epoch": 1.21, "learning_rate": 0.0001186175338402006, "loss": 0.009, "step": 239680 }, { "epoch": 1.21, "learning_rate": 0.00011860996614718658, "loss": 0.0103, "step": 239690 }, { "epoch": 1.21, "learning_rate": 0.00011860239845417257, "loss": 0.0054, "step": 239700 }, { "epoch": 1.21, "learning_rate": 0.00011859483076115857, "loss": 0.0111, "step": 239710 }, { "epoch": 1.21, "learning_rate": 0.00011858726306814455, "loss": 0.0119, "step": 239720 }, { "epoch": 1.21, "learning_rate": 0.00011857969537513054, "loss": 0.0082, "step": 239730 }, { "epoch": 1.21, "learning_rate": 0.00011857212768211652, "loss": 0.0077, "step": 239740 }, { "epoch": 1.21, "learning_rate": 0.00011856455998910252, "loss": 0.0077, "step": 239750 }, { "epoch": 1.21, "learning_rate": 0.0001185569922960885, "loss": 0.0089, "step": 239760 }, { "epoch": 1.21, "learning_rate": 0.00011854942460307448, "loss": 0.008, "step": 239770 }, { "epoch": 1.21, "learning_rate": 0.00011854185691006048, "loss": 0.0062, "step": 239780 }, { "epoch": 1.21, "learning_rate": 0.00011853428921704646, "loss": 0.0078, "step": 239790 }, { "epoch": 1.21, "learning_rate": 0.00011852672152403245, "loss": 0.0077, "step": 239800 }, { "epoch": 1.21, "learning_rate": 0.00011851915383101845, "loss": 0.008, "step": 239810 }, { "epoch": 1.21, "learning_rate": 0.00011851158613800443, "loss": 0.009, "step": 239820 }, { "epoch": 1.21, "learning_rate": 0.00011850401844499042, "loss": 0.0081, "step": 239830 }, { "epoch": 1.21, "learning_rate": 0.00011849645075197642, "loss": 0.0091, "step": 239840 }, { "epoch": 1.21, "learning_rate": 0.0001184888830589624, "loss": 0.0097, "step": 239850 }, { "epoch": 1.21, "learning_rate": 0.0001184813153659484, "loss": 0.0075, "step": 239860 }, { "epoch": 1.21, "learning_rate": 0.00011847374767293438, "loss": 0.0067, "step": 239870 }, { "epoch": 1.21, "learning_rate": 0.00011846617997992037, "loss": 0.0084, "step": 239880 }, { "epoch": 1.21, "learning_rate": 0.00011845861228690637, "loss": 0.0079, "step": 239890 }, { "epoch": 1.21, "learning_rate": 0.00011845104459389235, "loss": 0.0075, "step": 239900 }, { "epoch": 1.21, "learning_rate": 0.00011844347690087834, "loss": 0.0079, "step": 239910 }, { "epoch": 1.21, "learning_rate": 0.00011843590920786434, "loss": 0.0084, "step": 239920 }, { "epoch": 1.21, "learning_rate": 0.00011842834151485032, "loss": 0.0077, "step": 239930 }, { "epoch": 1.21, "learning_rate": 0.00011842077382183631, "loss": 0.0082, "step": 239940 }, { "epoch": 1.21, "learning_rate": 0.0001184132061288223, "loss": 0.009, "step": 239950 }, { "epoch": 1.21, "learning_rate": 0.00011840563843580829, "loss": 0.0076, "step": 239960 }, { "epoch": 1.21, "learning_rate": 0.00011839807074279429, "loss": 0.0085, "step": 239970 }, { "epoch": 1.21, "learning_rate": 0.00011839050304978027, "loss": 0.0076, "step": 239980 }, { "epoch": 1.21, "learning_rate": 0.00011838293535676626, "loss": 0.0097, "step": 239990 }, { "epoch": 1.21, "learning_rate": 0.00011837536766375226, "loss": 0.0094, "step": 240000 }, { "epoch": 1.21, "eval_cer": 0.9144537591690304, "eval_loss": 0.006650357041507959, "eval_runtime": 116.0541, "eval_samples_per_second": 17.233, "eval_steps_per_second": 4.308, "step": 240000 }, { "epoch": 1.21, "learning_rate": 0.00011836779997073824, "loss": 0.0113, "step": 240010 }, { "epoch": 1.21, "learning_rate": 0.00011836023227772423, "loss": 0.0091, "step": 240020 }, { "epoch": 1.21, "learning_rate": 0.00011835266458471022, "loss": 0.0129, "step": 240030 }, { "epoch": 1.21, "learning_rate": 0.00011834509689169621, "loss": 0.0065, "step": 240040 }, { "epoch": 1.21, "learning_rate": 0.0001183375291986822, "loss": 0.0102, "step": 240050 }, { "epoch": 1.21, "learning_rate": 0.00011832996150566819, "loss": 0.0102, "step": 240060 }, { "epoch": 1.21, "learning_rate": 0.00011832239381265418, "loss": 0.0093, "step": 240070 }, { "epoch": 1.21, "learning_rate": 0.00011831482611964018, "loss": 0.0099, "step": 240080 }, { "epoch": 1.21, "learning_rate": 0.00011830725842662616, "loss": 0.0091, "step": 240090 }, { "epoch": 1.21, "learning_rate": 0.00011829969073361215, "loss": 0.0108, "step": 240100 }, { "epoch": 1.21, "learning_rate": 0.00011829212304059813, "loss": 0.0067, "step": 240110 }, { "epoch": 1.21, "learning_rate": 0.00011828455534758413, "loss": 0.0085, "step": 240120 }, { "epoch": 1.21, "learning_rate": 0.00011827698765457012, "loss": 0.0086, "step": 240130 }, { "epoch": 1.21, "learning_rate": 0.0001182694199615561, "loss": 0.0085, "step": 240140 }, { "epoch": 1.21, "learning_rate": 0.0001182618522685421, "loss": 0.0077, "step": 240150 }, { "epoch": 1.21, "learning_rate": 0.0001182542845755281, "loss": 0.0075, "step": 240160 }, { "epoch": 1.21, "learning_rate": 0.00011824671688251408, "loss": 0.0091, "step": 240170 }, { "epoch": 1.21, "learning_rate": 0.00011823914918950007, "loss": 0.0082, "step": 240180 }, { "epoch": 1.21, "learning_rate": 0.00011823158149648605, "loss": 0.0077, "step": 240190 }, { "epoch": 1.21, "learning_rate": 0.00011822401380347205, "loss": 0.009, "step": 240200 }, { "epoch": 1.21, "learning_rate": 0.00011821644611045804, "loss": 0.0085, "step": 240210 }, { "epoch": 1.21, "learning_rate": 0.00011820887841744403, "loss": 0.0086, "step": 240220 }, { "epoch": 1.21, "learning_rate": 0.00011820131072443002, "loss": 0.0077, "step": 240230 }, { "epoch": 1.21, "learning_rate": 0.00011819374303141602, "loss": 0.009, "step": 240240 }, { "epoch": 1.21, "learning_rate": 0.000118186175338402, "loss": 0.0079, "step": 240250 }, { "epoch": 1.21, "learning_rate": 0.00011817860764538799, "loss": 0.0118, "step": 240260 }, { "epoch": 1.21, "learning_rate": 0.00011817103995237399, "loss": 0.008, "step": 240270 }, { "epoch": 1.21, "learning_rate": 0.00011816347225935997, "loss": 0.0072, "step": 240280 }, { "epoch": 1.21, "learning_rate": 0.00011815590456634596, "loss": 0.0075, "step": 240290 }, { "epoch": 1.21, "learning_rate": 0.00011814833687333194, "loss": 0.008, "step": 240300 }, { "epoch": 1.21, "learning_rate": 0.00011814076918031794, "loss": 0.008, "step": 240310 }, { "epoch": 1.21, "learning_rate": 0.00011813320148730393, "loss": 0.0086, "step": 240320 }, { "epoch": 1.21, "learning_rate": 0.00011812563379428992, "loss": 0.0074, "step": 240330 }, { "epoch": 1.21, "learning_rate": 0.00011811806610127591, "loss": 0.0094, "step": 240340 }, { "epoch": 1.21, "learning_rate": 0.0001181104984082619, "loss": 0.0072, "step": 240350 }, { "epoch": 1.21, "learning_rate": 0.00011810293071524789, "loss": 0.009, "step": 240360 }, { "epoch": 1.21, "learning_rate": 0.00011809536302223388, "loss": 0.0111, "step": 240370 }, { "epoch": 1.21, "learning_rate": 0.00011808779532921985, "loss": 0.0085, "step": 240380 }, { "epoch": 1.21, "learning_rate": 0.00011808022763620585, "loss": 0.0093, "step": 240390 }, { "epoch": 1.21, "learning_rate": 0.00011807265994319183, "loss": 0.0099, "step": 240400 }, { "epoch": 1.21, "learning_rate": 0.00011806509225017782, "loss": 0.0093, "step": 240410 }, { "epoch": 1.21, "learning_rate": 0.00011805752455716382, "loss": 0.0074, "step": 240420 }, { "epoch": 1.21, "learning_rate": 0.0001180499568641498, "loss": 0.0078, "step": 240430 }, { "epoch": 1.21, "learning_rate": 0.0001180423891711358, "loss": 0.0111, "step": 240440 }, { "epoch": 1.21, "learning_rate": 0.00011803482147812179, "loss": 0.0108, "step": 240450 }, { "epoch": 1.21, "learning_rate": 0.00011802725378510777, "loss": 0.0064, "step": 240460 }, { "epoch": 1.21, "learning_rate": 0.00011801968609209376, "loss": 0.0073, "step": 240470 }, { "epoch": 1.21, "learning_rate": 0.00011801211839907975, "loss": 0.0078, "step": 240480 }, { "epoch": 1.21, "learning_rate": 0.00011800455070606574, "loss": 0.0115, "step": 240490 }, { "epoch": 1.21, "learning_rate": 0.00011799698301305174, "loss": 0.0078, "step": 240500 }, { "epoch": 1.21, "learning_rate": 0.00011798941532003772, "loss": 0.009, "step": 240510 }, { "epoch": 1.21, "learning_rate": 0.00011798184762702371, "loss": 0.0067, "step": 240520 }, { "epoch": 1.21, "learning_rate": 0.00011797427993400971, "loss": 0.0092, "step": 240530 }, { "epoch": 1.21, "learning_rate": 0.00011796671224099569, "loss": 0.0081, "step": 240540 }, { "epoch": 1.21, "learning_rate": 0.00011795914454798168, "loss": 0.0083, "step": 240550 }, { "epoch": 1.21, "learning_rate": 0.00011795157685496767, "loss": 0.0081, "step": 240560 }, { "epoch": 1.21, "learning_rate": 0.00011794400916195366, "loss": 0.0073, "step": 240570 }, { "epoch": 1.21, "learning_rate": 0.00011793644146893966, "loss": 0.0076, "step": 240580 }, { "epoch": 1.21, "learning_rate": 0.00011792887377592564, "loss": 0.0071, "step": 240590 }, { "epoch": 1.21, "learning_rate": 0.00011792130608291163, "loss": 0.0091, "step": 240600 }, { "epoch": 1.21, "learning_rate": 0.00011791373838989763, "loss": 0.0074, "step": 240610 }, { "epoch": 1.21, "learning_rate": 0.00011790617069688361, "loss": 0.0104, "step": 240620 }, { "epoch": 1.21, "learning_rate": 0.0001178986030038696, "loss": 0.0088, "step": 240630 }, { "epoch": 1.21, "learning_rate": 0.00011789103531085559, "loss": 0.0082, "step": 240640 }, { "epoch": 1.21, "learning_rate": 0.00011788346761784158, "loss": 0.0143, "step": 240650 }, { "epoch": 1.21, "learning_rate": 0.00011787589992482758, "loss": 0.0065, "step": 240660 }, { "epoch": 1.21, "learning_rate": 0.00011786833223181356, "loss": 0.0099, "step": 240670 }, { "epoch": 1.21, "learning_rate": 0.00011786076453879955, "loss": 0.0077, "step": 240680 }, { "epoch": 1.21, "learning_rate": 0.00011785319684578555, "loss": 0.0119, "step": 240690 }, { "epoch": 1.21, "learning_rate": 0.00011784562915277153, "loss": 0.008, "step": 240700 }, { "epoch": 1.21, "learning_rate": 0.00011783806145975752, "loss": 0.0092, "step": 240710 }, { "epoch": 1.21, "learning_rate": 0.00011783049376674352, "loss": 0.0078, "step": 240720 }, { "epoch": 1.21, "learning_rate": 0.0001178229260737295, "loss": 0.0086, "step": 240730 }, { "epoch": 1.21, "learning_rate": 0.0001178153583807155, "loss": 0.0084, "step": 240740 }, { "epoch": 1.21, "learning_rate": 0.00011780779068770148, "loss": 0.0095, "step": 240750 }, { "epoch": 1.21, "learning_rate": 0.00011780022299468747, "loss": 0.0092, "step": 240760 }, { "epoch": 1.21, "learning_rate": 0.00011779265530167347, "loss": 0.0088, "step": 240770 }, { "epoch": 1.21, "learning_rate": 0.00011778508760865945, "loss": 0.01, "step": 240780 }, { "epoch": 1.21, "learning_rate": 0.00011777751991564544, "loss": 0.0105, "step": 240790 }, { "epoch": 1.21, "learning_rate": 0.00011776995222263144, "loss": 0.0083, "step": 240800 }, { "epoch": 1.21, "learning_rate": 0.00011776238452961742, "loss": 0.0094, "step": 240810 }, { "epoch": 1.21, "learning_rate": 0.00011775481683660341, "loss": 0.0067, "step": 240820 }, { "epoch": 1.22, "learning_rate": 0.0001177472491435894, "loss": 0.0084, "step": 240830 }, { "epoch": 1.22, "learning_rate": 0.00011773968145057539, "loss": 0.0106, "step": 240840 }, { "epoch": 1.22, "learning_rate": 0.00011773211375756139, "loss": 0.0092, "step": 240850 }, { "epoch": 1.22, "learning_rate": 0.00011772454606454737, "loss": 0.0089, "step": 240860 }, { "epoch": 1.22, "learning_rate": 0.00011771697837153336, "loss": 0.0101, "step": 240870 }, { "epoch": 1.22, "learning_rate": 0.00011770941067851936, "loss": 0.0092, "step": 240880 }, { "epoch": 1.22, "learning_rate": 0.00011770184298550534, "loss": 0.0093, "step": 240890 }, { "epoch": 1.22, "learning_rate": 0.00011769427529249133, "loss": 0.0081, "step": 240900 }, { "epoch": 1.22, "learning_rate": 0.00011768670759947731, "loss": 0.0071, "step": 240910 }, { "epoch": 1.22, "learning_rate": 0.00011767913990646331, "loss": 0.0068, "step": 240920 }, { "epoch": 1.22, "learning_rate": 0.0001176715722134493, "loss": 0.0152, "step": 240930 }, { "epoch": 1.22, "learning_rate": 0.00011766400452043529, "loss": 0.0089, "step": 240940 }, { "epoch": 1.22, "learning_rate": 0.00011765643682742128, "loss": 0.01, "step": 240950 }, { "epoch": 1.22, "learning_rate": 0.00011764886913440728, "loss": 0.0083, "step": 240960 }, { "epoch": 1.22, "learning_rate": 0.00011764130144139326, "loss": 0.0104, "step": 240970 }, { "epoch": 1.22, "learning_rate": 0.00011763373374837925, "loss": 0.01, "step": 240980 }, { "epoch": 1.22, "learning_rate": 0.00011762616605536523, "loss": 0.0068, "step": 240990 }, { "epoch": 1.22, "learning_rate": 0.00011761859836235123, "loss": 0.0096, "step": 241000 }, { "epoch": 1.22, "eval_cer": 0.9144644335264098, "eval_loss": 0.00682118721306324, "eval_runtime": 115.8371, "eval_samples_per_second": 17.266, "eval_steps_per_second": 4.316, "step": 241000 }, { "epoch": 1.22, "learning_rate": 0.0001176110306693372, "loss": 0.009, "step": 241010 }, { "epoch": 1.22, "learning_rate": 0.00011760346297632319, "loss": 0.0076, "step": 241020 }, { "epoch": 1.22, "learning_rate": 0.00011759589528330919, "loss": 0.0101, "step": 241030 }, { "epoch": 1.22, "learning_rate": 0.00011758832759029517, "loss": 0.008, "step": 241040 }, { "epoch": 1.22, "learning_rate": 0.00011758075989728116, "loss": 0.0074, "step": 241050 }, { "epoch": 1.22, "learning_rate": 0.00011757319220426716, "loss": 0.0099, "step": 241060 }, { "epoch": 1.22, "learning_rate": 0.00011756562451125314, "loss": 0.0094, "step": 241070 }, { "epoch": 1.22, "learning_rate": 0.00011755805681823913, "loss": 0.0089, "step": 241080 }, { "epoch": 1.22, "learning_rate": 0.00011755048912522512, "loss": 0.0091, "step": 241090 }, { "epoch": 1.22, "learning_rate": 0.00011754292143221111, "loss": 0.0092, "step": 241100 }, { "epoch": 1.22, "learning_rate": 0.0001175353537391971, "loss": 0.0076, "step": 241110 }, { "epoch": 1.22, "learning_rate": 0.00011752778604618309, "loss": 0.0101, "step": 241120 }, { "epoch": 1.22, "learning_rate": 0.00011752021835316908, "loss": 0.008, "step": 241130 }, { "epoch": 1.22, "learning_rate": 0.00011751265066015508, "loss": 0.0094, "step": 241140 }, { "epoch": 1.22, "learning_rate": 0.00011750508296714106, "loss": 0.0082, "step": 241150 }, { "epoch": 1.22, "learning_rate": 0.00011749751527412705, "loss": 0.0109, "step": 241160 }, { "epoch": 1.22, "learning_rate": 0.00011748994758111305, "loss": 0.007, "step": 241170 }, { "epoch": 1.22, "learning_rate": 0.00011748237988809903, "loss": 0.0094, "step": 241180 }, { "epoch": 1.22, "learning_rate": 0.00011747481219508503, "loss": 0.012, "step": 241190 }, { "epoch": 1.22, "learning_rate": 0.000117467244502071, "loss": 0.0086, "step": 241200 }, { "epoch": 1.22, "learning_rate": 0.000117459676809057, "loss": 0.0098, "step": 241210 }, { "epoch": 1.22, "learning_rate": 0.000117452109116043, "loss": 0.0079, "step": 241220 }, { "epoch": 1.22, "learning_rate": 0.00011744454142302898, "loss": 0.0094, "step": 241230 }, { "epoch": 1.22, "learning_rate": 0.00011743697373001497, "loss": 0.0072, "step": 241240 }, { "epoch": 1.22, "learning_rate": 0.00011742940603700097, "loss": 0.0093, "step": 241250 }, { "epoch": 1.22, "learning_rate": 0.00011742183834398695, "loss": 0.0075, "step": 241260 }, { "epoch": 1.22, "learning_rate": 0.00011741427065097294, "loss": 0.0064, "step": 241270 }, { "epoch": 1.22, "learning_rate": 0.00011740670295795893, "loss": 0.0112, "step": 241280 }, { "epoch": 1.22, "learning_rate": 0.00011739913526494492, "loss": 0.008, "step": 241290 }, { "epoch": 1.22, "learning_rate": 0.00011739156757193092, "loss": 0.0069, "step": 241300 }, { "epoch": 1.22, "learning_rate": 0.0001173839998789169, "loss": 0.0092, "step": 241310 }, { "epoch": 1.22, "learning_rate": 0.00011737643218590289, "loss": 0.0076, "step": 241320 }, { "epoch": 1.22, "learning_rate": 0.00011736886449288889, "loss": 0.0095, "step": 241330 }, { "epoch": 1.22, "learning_rate": 0.00011736129679987487, "loss": 0.0076, "step": 241340 }, { "epoch": 1.22, "learning_rate": 0.00011735372910686086, "loss": 0.0086, "step": 241350 }, { "epoch": 1.22, "learning_rate": 0.00011734616141384685, "loss": 0.0082, "step": 241360 }, { "epoch": 1.22, "learning_rate": 0.00011733859372083284, "loss": 0.0092, "step": 241370 }, { "epoch": 1.22, "learning_rate": 0.00011733102602781884, "loss": 0.0105, "step": 241380 }, { "epoch": 1.22, "learning_rate": 0.00011732345833480482, "loss": 0.008, "step": 241390 }, { "epoch": 1.22, "learning_rate": 0.00011731589064179081, "loss": 0.0086, "step": 241400 }, { "epoch": 1.22, "learning_rate": 0.0001173083229487768, "loss": 0.0106, "step": 241410 }, { "epoch": 1.22, "learning_rate": 0.00011730075525576279, "loss": 0.0089, "step": 241420 }, { "epoch": 1.22, "learning_rate": 0.00011729318756274878, "loss": 0.0082, "step": 241430 }, { "epoch": 1.22, "learning_rate": 0.00011728561986973476, "loss": 0.0106, "step": 241440 }, { "epoch": 1.22, "learning_rate": 0.00011727805217672076, "loss": 0.0094, "step": 241450 }, { "epoch": 1.22, "learning_rate": 0.00011727048448370675, "loss": 0.0086, "step": 241460 }, { "epoch": 1.22, "learning_rate": 0.00011726291679069274, "loss": 0.0089, "step": 241470 }, { "epoch": 1.22, "learning_rate": 0.00011725534909767873, "loss": 0.0072, "step": 241480 }, { "epoch": 1.22, "learning_rate": 0.00011724778140466473, "loss": 0.0098, "step": 241490 }, { "epoch": 1.22, "learning_rate": 0.00011724021371165071, "loss": 0.0069, "step": 241500 }, { "epoch": 1.22, "learning_rate": 0.0001172326460186367, "loss": 0.0082, "step": 241510 }, { "epoch": 1.22, "learning_rate": 0.00011722507832562268, "loss": 0.0103, "step": 241520 }, { "epoch": 1.22, "learning_rate": 0.00011721751063260868, "loss": 0.0091, "step": 241530 }, { "epoch": 1.22, "learning_rate": 0.00011720994293959467, "loss": 0.0061, "step": 241540 }, { "epoch": 1.22, "learning_rate": 0.00011720237524658066, "loss": 0.0092, "step": 241550 }, { "epoch": 1.22, "learning_rate": 0.00011719480755356665, "loss": 0.0088, "step": 241560 }, { "epoch": 1.22, "learning_rate": 0.00011718723986055265, "loss": 0.0072, "step": 241570 }, { "epoch": 1.22, "learning_rate": 0.00011717967216753863, "loss": 0.0063, "step": 241580 }, { "epoch": 1.22, "learning_rate": 0.00011717210447452462, "loss": 0.0099, "step": 241590 }, { "epoch": 1.22, "learning_rate": 0.0001171645367815106, "loss": 0.0075, "step": 241600 }, { "epoch": 1.22, "learning_rate": 0.0001171569690884966, "loss": 0.01, "step": 241610 }, { "epoch": 1.22, "learning_rate": 0.00011714940139548259, "loss": 0.007, "step": 241620 }, { "epoch": 1.22, "learning_rate": 0.00011714183370246857, "loss": 0.0139, "step": 241630 }, { "epoch": 1.22, "learning_rate": 0.00011713426600945456, "loss": 0.0063, "step": 241640 }, { "epoch": 1.22, "learning_rate": 0.00011712669831644054, "loss": 0.0064, "step": 241650 }, { "epoch": 1.22, "learning_rate": 0.00011711913062342653, "loss": 0.0109, "step": 241660 }, { "epoch": 1.22, "learning_rate": 0.00011711156293041253, "loss": 0.0095, "step": 241670 }, { "epoch": 1.22, "learning_rate": 0.00011710399523739851, "loss": 0.0121, "step": 241680 }, { "epoch": 1.22, "learning_rate": 0.0001170964275443845, "loss": 0.0091, "step": 241690 }, { "epoch": 1.22, "learning_rate": 0.0001170888598513705, "loss": 0.0068, "step": 241700 }, { "epoch": 1.22, "learning_rate": 0.00011708129215835648, "loss": 0.0092, "step": 241710 }, { "epoch": 1.22, "learning_rate": 0.00011707372446534248, "loss": 0.0075, "step": 241720 }, { "epoch": 1.22, "learning_rate": 0.00011706615677232846, "loss": 0.009, "step": 241730 }, { "epoch": 1.22, "learning_rate": 0.00011705858907931445, "loss": 0.0067, "step": 241740 }, { "epoch": 1.22, "learning_rate": 0.00011705102138630045, "loss": 0.0087, "step": 241750 }, { "epoch": 1.22, "learning_rate": 0.00011704345369328643, "loss": 0.0099, "step": 241760 }, { "epoch": 1.22, "learning_rate": 0.00011703588600027242, "loss": 0.0085, "step": 241770 }, { "epoch": 1.22, "learning_rate": 0.00011702831830725842, "loss": 0.0084, "step": 241780 }, { "epoch": 1.22, "learning_rate": 0.0001170207506142444, "loss": 0.0078, "step": 241790 }, { "epoch": 1.22, "learning_rate": 0.0001170131829212304, "loss": 0.0106, "step": 241800 }, { "epoch": 1.22, "learning_rate": 0.00011700561522821638, "loss": 0.0083, "step": 241810 }, { "epoch": 1.22, "learning_rate": 0.00011699804753520237, "loss": 0.0099, "step": 241820 }, { "epoch": 1.22, "learning_rate": 0.00011699047984218837, "loss": 0.0091, "step": 241830 }, { "epoch": 1.22, "learning_rate": 0.00011698291214917435, "loss": 0.0086, "step": 241840 }, { "epoch": 1.22, "learning_rate": 0.00011697534445616034, "loss": 0.0081, "step": 241850 }, { "epoch": 1.22, "learning_rate": 0.00011696777676314634, "loss": 0.0075, "step": 241860 }, { "epoch": 1.22, "learning_rate": 0.00011696020907013232, "loss": 0.0075, "step": 241870 }, { "epoch": 1.22, "learning_rate": 0.00011695264137711831, "loss": 0.0098, "step": 241880 }, { "epoch": 1.22, "learning_rate": 0.0001169450736841043, "loss": 0.0075, "step": 241890 }, { "epoch": 1.22, "learning_rate": 0.00011693750599109029, "loss": 0.0063, "step": 241900 }, { "epoch": 1.22, "learning_rate": 0.00011692993829807629, "loss": 0.0092, "step": 241910 }, { "epoch": 1.22, "learning_rate": 0.00011692237060506227, "loss": 0.0076, "step": 241920 }, { "epoch": 1.22, "learning_rate": 0.00011691480291204826, "loss": 0.0099, "step": 241930 }, { "epoch": 1.22, "learning_rate": 0.00011690723521903426, "loss": 0.0111, "step": 241940 }, { "epoch": 1.22, "learning_rate": 0.00011689966752602024, "loss": 0.01, "step": 241950 }, { "epoch": 1.22, "learning_rate": 0.00011689209983300623, "loss": 0.0082, "step": 241960 }, { "epoch": 1.22, "learning_rate": 0.00011688453213999221, "loss": 0.0092, "step": 241970 }, { "epoch": 1.22, "learning_rate": 0.00011687696444697821, "loss": 0.0101, "step": 241980 }, { "epoch": 1.22, "learning_rate": 0.0001168693967539642, "loss": 0.0077, "step": 241990 }, { "epoch": 1.22, "learning_rate": 0.00011686182906095019, "loss": 0.0066, "step": 242000 }, { "epoch": 1.22, "eval_cer": 0.914452788772905, "eval_loss": 0.006828702986240387, "eval_runtime": 115.9715, "eval_samples_per_second": 17.246, "eval_steps_per_second": 4.311, "step": 242000 }, { "epoch": 1.22, "learning_rate": 0.00011685426136793618, "loss": 0.0095, "step": 242010 }, { "epoch": 1.22, "learning_rate": 0.00011684669367492218, "loss": 0.0078, "step": 242020 }, { "epoch": 1.22, "learning_rate": 0.00011683912598190816, "loss": 0.0118, "step": 242030 }, { "epoch": 1.22, "learning_rate": 0.00011683155828889415, "loss": 0.0077, "step": 242040 }, { "epoch": 1.22, "learning_rate": 0.00011682399059588013, "loss": 0.0069, "step": 242050 }, { "epoch": 1.22, "learning_rate": 0.00011681642290286613, "loss": 0.0081, "step": 242060 }, { "epoch": 1.22, "learning_rate": 0.00011680885520985212, "loss": 0.0084, "step": 242070 }, { "epoch": 1.22, "learning_rate": 0.0001168012875168381, "loss": 0.0099, "step": 242080 }, { "epoch": 1.22, "learning_rate": 0.0001167937198238241, "loss": 0.0099, "step": 242090 }, { "epoch": 1.22, "learning_rate": 0.0001167861521308101, "loss": 0.0084, "step": 242100 }, { "epoch": 1.22, "learning_rate": 0.00011677858443779608, "loss": 0.0108, "step": 242110 }, { "epoch": 1.22, "learning_rate": 0.00011677101674478207, "loss": 0.0062, "step": 242120 }, { "epoch": 1.22, "learning_rate": 0.00011676344905176805, "loss": 0.0079, "step": 242130 }, { "epoch": 1.22, "learning_rate": 0.00011675588135875405, "loss": 0.0175, "step": 242140 }, { "epoch": 1.22, "learning_rate": 0.00011674831366574004, "loss": 0.0095, "step": 242150 }, { "epoch": 1.22, "learning_rate": 0.00011674074597272602, "loss": 0.007, "step": 242160 }, { "epoch": 1.22, "learning_rate": 0.00011673317827971202, "loss": 0.0118, "step": 242170 }, { "epoch": 1.22, "learning_rate": 0.00011672561058669801, "loss": 0.0104, "step": 242180 }, { "epoch": 1.22, "learning_rate": 0.000116718042893684, "loss": 0.0086, "step": 242190 }, { "epoch": 1.22, "learning_rate": 0.00011671047520066999, "loss": 0.0094, "step": 242200 }, { "epoch": 1.22, "learning_rate": 0.00011670290750765599, "loss": 0.0085, "step": 242210 }, { "epoch": 1.22, "learning_rate": 0.00011669533981464197, "loss": 0.0105, "step": 242220 }, { "epoch": 1.22, "learning_rate": 0.00011668777212162796, "loss": 0.0074, "step": 242230 }, { "epoch": 1.22, "learning_rate": 0.00011668020442861394, "loss": 0.0078, "step": 242240 }, { "epoch": 1.22, "learning_rate": 0.00011667263673559994, "loss": 0.0091, "step": 242250 }, { "epoch": 1.22, "learning_rate": 0.00011666506904258593, "loss": 0.0106, "step": 242260 }, { "epoch": 1.22, "learning_rate": 0.0001166575013495719, "loss": 0.0089, "step": 242270 }, { "epoch": 1.22, "learning_rate": 0.0001166499336565579, "loss": 0.0077, "step": 242280 }, { "epoch": 1.22, "learning_rate": 0.00011664236596354388, "loss": 0.0124, "step": 242290 }, { "epoch": 1.22, "learning_rate": 0.00011663479827052987, "loss": 0.0078, "step": 242300 }, { "epoch": 1.22, "learning_rate": 0.00011662723057751587, "loss": 0.0122, "step": 242310 }, { "epoch": 1.22, "learning_rate": 0.00011661966288450185, "loss": 0.008, "step": 242320 }, { "epoch": 1.22, "learning_rate": 0.00011661209519148784, "loss": 0.0117, "step": 242330 }, { "epoch": 1.22, "learning_rate": 0.00011660452749847383, "loss": 0.0086, "step": 242340 }, { "epoch": 1.22, "learning_rate": 0.00011659695980545982, "loss": 0.0096, "step": 242350 }, { "epoch": 1.22, "learning_rate": 0.00011658939211244582, "loss": 0.0084, "step": 242360 }, { "epoch": 1.22, "learning_rate": 0.0001165818244194318, "loss": 0.012, "step": 242370 }, { "epoch": 1.22, "learning_rate": 0.00011657425672641779, "loss": 0.0099, "step": 242380 }, { "epoch": 1.22, "learning_rate": 0.00011656668903340379, "loss": 0.0084, "step": 242390 }, { "epoch": 1.22, "learning_rate": 0.00011655912134038977, "loss": 0.0101, "step": 242400 }, { "epoch": 1.22, "learning_rate": 0.00011655155364737576, "loss": 0.0102, "step": 242410 }, { "epoch": 1.22, "learning_rate": 0.00011654398595436175, "loss": 0.0097, "step": 242420 }, { "epoch": 1.22, "learning_rate": 0.00011653641826134774, "loss": 0.0113, "step": 242430 }, { "epoch": 1.22, "learning_rate": 0.00011652885056833374, "loss": 0.0103, "step": 242440 }, { "epoch": 1.22, "learning_rate": 0.00011652128287531972, "loss": 0.0093, "step": 242450 }, { "epoch": 1.22, "learning_rate": 0.00011651371518230571, "loss": 0.0087, "step": 242460 }, { "epoch": 1.22, "learning_rate": 0.00011650614748929171, "loss": 0.0088, "step": 242470 }, { "epoch": 1.22, "learning_rate": 0.00011649857979627769, "loss": 0.011, "step": 242480 }, { "epoch": 1.22, "learning_rate": 0.00011649101210326368, "loss": 0.0075, "step": 242490 }, { "epoch": 1.22, "learning_rate": 0.00011648344441024966, "loss": 0.0078, "step": 242500 }, { "epoch": 1.22, "learning_rate": 0.00011647587671723566, "loss": 0.0076, "step": 242510 }, { "epoch": 1.22, "learning_rate": 0.00011646830902422165, "loss": 0.0074, "step": 242520 }, { "epoch": 1.22, "learning_rate": 0.00011646074133120764, "loss": 0.0097, "step": 242530 }, { "epoch": 1.22, "learning_rate": 0.00011645317363819363, "loss": 0.0106, "step": 242540 }, { "epoch": 1.22, "learning_rate": 0.00011644560594517963, "loss": 0.0096, "step": 242550 }, { "epoch": 1.22, "learning_rate": 0.00011643803825216561, "loss": 0.0083, "step": 242560 }, { "epoch": 1.22, "learning_rate": 0.0001164304705591516, "loss": 0.008, "step": 242570 }, { "epoch": 1.22, "learning_rate": 0.00011642290286613758, "loss": 0.0097, "step": 242580 }, { "epoch": 1.22, "learning_rate": 0.00011641533517312358, "loss": 0.0077, "step": 242590 }, { "epoch": 1.22, "learning_rate": 0.00011640776748010957, "loss": 0.0096, "step": 242600 }, { "epoch": 1.22, "learning_rate": 0.00011640019978709556, "loss": 0.0104, "step": 242610 }, { "epoch": 1.22, "learning_rate": 0.00011639263209408155, "loss": 0.0094, "step": 242620 }, { "epoch": 1.22, "learning_rate": 0.00011638506440106755, "loss": 0.0079, "step": 242630 }, { "epoch": 1.22, "learning_rate": 0.00011637749670805353, "loss": 0.0072, "step": 242640 }, { "epoch": 1.22, "learning_rate": 0.00011636992901503952, "loss": 0.0078, "step": 242650 }, { "epoch": 1.22, "learning_rate": 0.00011636236132202552, "loss": 0.0078, "step": 242660 }, { "epoch": 1.22, "learning_rate": 0.0001163547936290115, "loss": 0.0083, "step": 242670 }, { "epoch": 1.22, "learning_rate": 0.0001163472259359975, "loss": 0.007, "step": 242680 }, { "epoch": 1.22, "learning_rate": 0.00011633965824298347, "loss": 0.0072, "step": 242690 }, { "epoch": 1.22, "learning_rate": 0.00011633209054996947, "loss": 0.0079, "step": 242700 }, { "epoch": 1.22, "learning_rate": 0.00011632452285695546, "loss": 0.0102, "step": 242710 }, { "epoch": 1.22, "learning_rate": 0.00011631695516394145, "loss": 0.0082, "step": 242720 }, { "epoch": 1.22, "learning_rate": 0.00011630938747092744, "loss": 0.0093, "step": 242730 }, { "epoch": 1.22, "learning_rate": 0.00011630181977791344, "loss": 0.0074, "step": 242740 }, { "epoch": 1.22, "learning_rate": 0.00011629425208489942, "loss": 0.0108, "step": 242750 }, { "epoch": 1.22, "learning_rate": 0.00011628668439188541, "loss": 0.0086, "step": 242760 }, { "epoch": 1.22, "learning_rate": 0.0001162791166988714, "loss": 0.0104, "step": 242770 }, { "epoch": 1.22, "learning_rate": 0.00011627154900585739, "loss": 0.0114, "step": 242780 }, { "epoch": 1.22, "learning_rate": 0.00011626398131284338, "loss": 0.0087, "step": 242790 }, { "epoch": 1.22, "learning_rate": 0.00011625641361982937, "loss": 0.0087, "step": 242800 }, { "epoch": 1.23, "learning_rate": 0.00011624884592681536, "loss": 0.0112, "step": 242810 }, { "epoch": 1.23, "learning_rate": 0.00011624127823380136, "loss": 0.0091, "step": 242820 }, { "epoch": 1.23, "learning_rate": 0.00011623371054078734, "loss": 0.0068, "step": 242830 }, { "epoch": 1.23, "learning_rate": 0.00011622614284777333, "loss": 0.0089, "step": 242840 }, { "epoch": 1.23, "learning_rate": 0.00011621857515475931, "loss": 0.0091, "step": 242850 }, { "epoch": 1.23, "learning_rate": 0.00011621100746174531, "loss": 0.0098, "step": 242860 }, { "epoch": 1.23, "learning_rate": 0.0001162034397687313, "loss": 0.008, "step": 242870 }, { "epoch": 1.23, "learning_rate": 0.00011619587207571728, "loss": 0.0095, "step": 242880 }, { "epoch": 1.23, "learning_rate": 0.00011618830438270328, "loss": 0.0126, "step": 242890 }, { "epoch": 1.23, "learning_rate": 0.00011618073668968925, "loss": 0.0092, "step": 242900 }, { "epoch": 1.23, "learning_rate": 0.00011617316899667524, "loss": 0.0085, "step": 242910 }, { "epoch": 1.23, "learning_rate": 0.00011616560130366124, "loss": 0.01, "step": 242920 }, { "epoch": 1.23, "learning_rate": 0.00011615803361064722, "loss": 0.0084, "step": 242930 }, { "epoch": 1.23, "learning_rate": 0.00011615046591763321, "loss": 0.008, "step": 242940 }, { "epoch": 1.23, "learning_rate": 0.0001161428982246192, "loss": 0.0072, "step": 242950 }, { "epoch": 1.23, "learning_rate": 0.00011613533053160519, "loss": 0.0086, "step": 242960 }, { "epoch": 1.23, "learning_rate": 0.00011612776283859119, "loss": 0.007, "step": 242970 }, { "epoch": 1.23, "learning_rate": 0.00011612019514557717, "loss": 0.0097, "step": 242980 }, { "epoch": 1.23, "learning_rate": 0.00011611262745256316, "loss": 0.0086, "step": 242990 }, { "epoch": 1.23, "learning_rate": 0.00011610505975954916, "loss": 0.0072, "step": 243000 }, { "epoch": 1.23, "eval_cer": 0.9144401736232748, "eval_loss": 0.006801496725529432, "eval_runtime": 115.8442, "eval_samples_per_second": 17.265, "eval_steps_per_second": 4.316, "step": 243000 }, { "epoch": 1.23, "learning_rate": 0.00011609749206653514, "loss": 0.008, "step": 243010 }, { "epoch": 1.23, "learning_rate": 0.00011608992437352113, "loss": 0.0087, "step": 243020 }, { "epoch": 1.23, "learning_rate": 0.00011608235668050711, "loss": 0.008, "step": 243030 }, { "epoch": 1.23, "learning_rate": 0.00011607478898749311, "loss": 0.0099, "step": 243040 }, { "epoch": 1.23, "learning_rate": 0.0001160672212944791, "loss": 0.0075, "step": 243050 }, { "epoch": 1.23, "learning_rate": 0.00011605965360146509, "loss": 0.0095, "step": 243060 }, { "epoch": 1.23, "learning_rate": 0.00011605208590845108, "loss": 0.0066, "step": 243070 }, { "epoch": 1.23, "learning_rate": 0.00011604451821543708, "loss": 0.0085, "step": 243080 }, { "epoch": 1.23, "learning_rate": 0.00011603695052242306, "loss": 0.0087, "step": 243090 }, { "epoch": 1.23, "learning_rate": 0.00011602938282940905, "loss": 0.0074, "step": 243100 }, { "epoch": 1.23, "learning_rate": 0.00011602181513639505, "loss": 0.0061, "step": 243110 }, { "epoch": 1.23, "learning_rate": 0.00011601424744338103, "loss": 0.0112, "step": 243120 }, { "epoch": 1.23, "learning_rate": 0.00011600667975036702, "loss": 0.0095, "step": 243130 }, { "epoch": 1.23, "learning_rate": 0.000115999112057353, "loss": 0.0083, "step": 243140 }, { "epoch": 1.23, "learning_rate": 0.000115991544364339, "loss": 0.0089, "step": 243150 }, { "epoch": 1.23, "learning_rate": 0.000115983976671325, "loss": 0.0105, "step": 243160 }, { "epoch": 1.23, "learning_rate": 0.00011597640897831098, "loss": 0.0081, "step": 243170 }, { "epoch": 1.23, "learning_rate": 0.00011596884128529697, "loss": 0.0112, "step": 243180 }, { "epoch": 1.23, "learning_rate": 0.00011596127359228297, "loss": 0.0081, "step": 243190 }, { "epoch": 1.23, "learning_rate": 0.00011595370589926895, "loss": 0.0083, "step": 243200 }, { "epoch": 1.23, "learning_rate": 0.00011594613820625494, "loss": 0.0116, "step": 243210 }, { "epoch": 1.23, "learning_rate": 0.00011593857051324092, "loss": 0.0099, "step": 243220 }, { "epoch": 1.23, "learning_rate": 0.00011593100282022692, "loss": 0.0075, "step": 243230 }, { "epoch": 1.23, "learning_rate": 0.00011592343512721291, "loss": 0.0065, "step": 243240 }, { "epoch": 1.23, "learning_rate": 0.0001159158674341989, "loss": 0.0084, "step": 243250 }, { "epoch": 1.23, "learning_rate": 0.00011590829974118489, "loss": 0.0082, "step": 243260 }, { "epoch": 1.23, "learning_rate": 0.00011590073204817089, "loss": 0.0113, "step": 243270 }, { "epoch": 1.23, "learning_rate": 0.00011589316435515687, "loss": 0.0084, "step": 243280 }, { "epoch": 1.23, "learning_rate": 0.00011588559666214286, "loss": 0.008, "step": 243290 }, { "epoch": 1.23, "learning_rate": 0.00011587802896912884, "loss": 0.009, "step": 243300 }, { "epoch": 1.23, "learning_rate": 0.00011587046127611484, "loss": 0.0114, "step": 243310 }, { "epoch": 1.23, "learning_rate": 0.00011586289358310083, "loss": 0.0094, "step": 243320 }, { "epoch": 1.23, "learning_rate": 0.00011585532589008682, "loss": 0.0073, "step": 243330 }, { "epoch": 1.23, "learning_rate": 0.00011584775819707281, "loss": 0.0095, "step": 243340 }, { "epoch": 1.23, "learning_rate": 0.0001158401905040588, "loss": 0.0098, "step": 243350 }, { "epoch": 1.23, "learning_rate": 0.00011583262281104479, "loss": 0.0084, "step": 243360 }, { "epoch": 1.23, "learning_rate": 0.00011582505511803078, "loss": 0.0064, "step": 243370 }, { "epoch": 1.23, "learning_rate": 0.00011581748742501676, "loss": 0.0093, "step": 243380 }, { "epoch": 1.23, "learning_rate": 0.00011580991973200276, "loss": 0.0094, "step": 243390 }, { "epoch": 1.23, "learning_rate": 0.00011580235203898875, "loss": 0.0099, "step": 243400 }, { "epoch": 1.23, "learning_rate": 0.00011579478434597473, "loss": 0.0103, "step": 243410 }, { "epoch": 1.23, "learning_rate": 0.00011578721665296073, "loss": 0.0087, "step": 243420 }, { "epoch": 1.23, "learning_rate": 0.00011577964895994672, "loss": 0.0092, "step": 243430 }, { "epoch": 1.23, "learning_rate": 0.0001157720812669327, "loss": 0.0077, "step": 243440 }, { "epoch": 1.23, "learning_rate": 0.0001157645135739187, "loss": 0.0105, "step": 243450 }, { "epoch": 1.23, "learning_rate": 0.00011575694588090468, "loss": 0.0064, "step": 243460 }, { "epoch": 1.23, "learning_rate": 0.00011574937818789068, "loss": 0.0084, "step": 243470 }, { "epoch": 1.23, "learning_rate": 0.00011574181049487667, "loss": 0.0086, "step": 243480 }, { "epoch": 1.23, "learning_rate": 0.00011573424280186265, "loss": 0.0076, "step": 243490 }, { "epoch": 1.23, "learning_rate": 0.00011572667510884865, "loss": 0.0082, "step": 243500 }, { "epoch": 1.23, "learning_rate": 0.00011571910741583464, "loss": 0.0068, "step": 243510 }, { "epoch": 1.23, "learning_rate": 0.00011571153972282063, "loss": 0.01, "step": 243520 }, { "epoch": 1.23, "learning_rate": 0.00011570397202980661, "loss": 0.0089, "step": 243530 }, { "epoch": 1.23, "learning_rate": 0.00011569640433679259, "loss": 0.0078, "step": 243540 }, { "epoch": 1.23, "learning_rate": 0.00011568883664377858, "loss": 0.007, "step": 243550 }, { "epoch": 1.23, "learning_rate": 0.00011568126895076458, "loss": 0.0085, "step": 243560 }, { "epoch": 1.23, "learning_rate": 0.00011567370125775056, "loss": 0.0097, "step": 243570 }, { "epoch": 1.23, "learning_rate": 0.00011566613356473656, "loss": 0.0106, "step": 243580 }, { "epoch": 1.23, "learning_rate": 0.00011565856587172254, "loss": 0.0081, "step": 243590 }, { "epoch": 1.23, "learning_rate": 0.00011565099817870853, "loss": 0.0091, "step": 243600 }, { "epoch": 1.23, "learning_rate": 0.00011564343048569453, "loss": 0.0128, "step": 243610 }, { "epoch": 1.23, "learning_rate": 0.00011563586279268051, "loss": 0.0085, "step": 243620 }, { "epoch": 1.23, "learning_rate": 0.0001156282950996665, "loss": 0.0087, "step": 243630 }, { "epoch": 1.23, "learning_rate": 0.0001156207274066525, "loss": 0.0089, "step": 243640 }, { "epoch": 1.23, "learning_rate": 0.00011561315971363848, "loss": 0.0075, "step": 243650 }, { "epoch": 1.23, "learning_rate": 0.00011560559202062447, "loss": 0.0074, "step": 243660 }, { "epoch": 1.23, "learning_rate": 0.00011559802432761046, "loss": 0.0089, "step": 243670 }, { "epoch": 1.23, "learning_rate": 0.00011559045663459645, "loss": 0.0084, "step": 243680 }, { "epoch": 1.23, "learning_rate": 0.00011558288894158245, "loss": 0.0083, "step": 243690 }, { "epoch": 1.23, "learning_rate": 0.00011557532124856843, "loss": 0.008, "step": 243700 }, { "epoch": 1.23, "learning_rate": 0.00011556775355555442, "loss": 0.0082, "step": 243710 }, { "epoch": 1.23, "learning_rate": 0.00011556018586254042, "loss": 0.0079, "step": 243720 }, { "epoch": 1.23, "learning_rate": 0.0001155526181695264, "loss": 0.0062, "step": 243730 }, { "epoch": 1.23, "learning_rate": 0.0001155450504765124, "loss": 0.0079, "step": 243740 }, { "epoch": 1.23, "learning_rate": 0.00011553748278349838, "loss": 0.0086, "step": 243750 }, { "epoch": 1.23, "learning_rate": 0.00011552991509048437, "loss": 0.0108, "step": 243760 }, { "epoch": 1.23, "learning_rate": 0.00011552234739747037, "loss": 0.0095, "step": 243770 }, { "epoch": 1.23, "learning_rate": 0.00011551477970445635, "loss": 0.0083, "step": 243780 }, { "epoch": 1.23, "learning_rate": 0.00011550721201144234, "loss": 0.0077, "step": 243790 }, { "epoch": 1.23, "learning_rate": 0.00011549964431842834, "loss": 0.0078, "step": 243800 }, { "epoch": 1.23, "learning_rate": 0.00011549207662541432, "loss": 0.0095, "step": 243810 }, { "epoch": 1.23, "learning_rate": 0.00011548450893240031, "loss": 0.0108, "step": 243820 }, { "epoch": 1.23, "learning_rate": 0.0001154769412393863, "loss": 0.0075, "step": 243830 }, { "epoch": 1.23, "learning_rate": 0.00011546937354637229, "loss": 0.007, "step": 243840 }, { "epoch": 1.23, "learning_rate": 0.00011546180585335828, "loss": 0.0094, "step": 243850 }, { "epoch": 1.23, "learning_rate": 0.00011545423816034427, "loss": 0.0087, "step": 243860 }, { "epoch": 1.23, "learning_rate": 0.00011544667046733026, "loss": 0.0076, "step": 243870 }, { "epoch": 1.23, "learning_rate": 0.00011543910277431626, "loss": 0.0091, "step": 243880 }, { "epoch": 1.23, "learning_rate": 0.00011543153508130224, "loss": 0.0088, "step": 243890 }, { "epoch": 1.23, "learning_rate": 0.00011542396738828823, "loss": 0.0078, "step": 243900 }, { "epoch": 1.23, "learning_rate": 0.00011541639969527421, "loss": 0.0072, "step": 243910 }, { "epoch": 1.23, "learning_rate": 0.00011540883200226021, "loss": 0.0076, "step": 243920 }, { "epoch": 1.23, "learning_rate": 0.0001154012643092462, "loss": 0.0079, "step": 243930 }, { "epoch": 1.23, "learning_rate": 0.00011539369661623219, "loss": 0.0091, "step": 243940 }, { "epoch": 1.23, "learning_rate": 0.00011538612892321818, "loss": 0.0087, "step": 243950 }, { "epoch": 1.23, "learning_rate": 0.00011537856123020418, "loss": 0.008, "step": 243960 }, { "epoch": 1.23, "learning_rate": 0.00011537099353719016, "loss": 0.006, "step": 243970 }, { "epoch": 1.23, "learning_rate": 0.00011536342584417615, "loss": 0.0075, "step": 243980 }, { "epoch": 1.23, "learning_rate": 0.00011535585815116213, "loss": 0.0075, "step": 243990 }, { "epoch": 1.23, "learning_rate": 0.00011534829045814813, "loss": 0.0077, "step": 244000 }, { "epoch": 1.23, "eval_cer": 0.9144731670915385, "eval_loss": 0.00690747844055295, "eval_runtime": 116.0173, "eval_samples_per_second": 17.239, "eval_steps_per_second": 4.31, "step": 244000 }, { "epoch": 1.23, "learning_rate": 0.00011534072276513412, "loss": 0.007, "step": 244010 }, { "epoch": 1.23, "learning_rate": 0.0001153331550721201, "loss": 0.0058, "step": 244020 }, { "epoch": 1.23, "learning_rate": 0.0001153255873791061, "loss": 0.0058, "step": 244030 }, { "epoch": 1.23, "learning_rate": 0.0001153180196860921, "loss": 0.0135, "step": 244040 }, { "epoch": 1.23, "learning_rate": 0.00011531045199307808, "loss": 0.009, "step": 244050 }, { "epoch": 1.23, "learning_rate": 0.00011530288430006407, "loss": 0.0083, "step": 244060 }, { "epoch": 1.23, "learning_rate": 0.00011529531660705005, "loss": 0.0095, "step": 244070 }, { "epoch": 1.23, "learning_rate": 0.00011528774891403605, "loss": 0.0074, "step": 244080 }, { "epoch": 1.23, "learning_rate": 0.00011528018122102204, "loss": 0.0089, "step": 244090 }, { "epoch": 1.23, "learning_rate": 0.00011527261352800802, "loss": 0.0083, "step": 244100 }, { "epoch": 1.23, "learning_rate": 0.00011526504583499402, "loss": 0.0085, "step": 244110 }, { "epoch": 1.23, "learning_rate": 0.00011525747814198001, "loss": 0.0083, "step": 244120 }, { "epoch": 1.23, "learning_rate": 0.000115249910448966, "loss": 0.0076, "step": 244130 }, { "epoch": 1.23, "learning_rate": 0.00011524234275595199, "loss": 0.0103, "step": 244140 }, { "epoch": 1.23, "learning_rate": 0.00011523477506293799, "loss": 0.0077, "step": 244150 }, { "epoch": 1.23, "learning_rate": 0.00011522720736992395, "loss": 0.0104, "step": 244160 }, { "epoch": 1.23, "learning_rate": 0.00011521963967690995, "loss": 0.0092, "step": 244170 }, { "epoch": 1.23, "learning_rate": 0.00011521207198389593, "loss": 0.0099, "step": 244180 }, { "epoch": 1.23, "learning_rate": 0.00011520450429088192, "loss": 0.0099, "step": 244190 }, { "epoch": 1.23, "learning_rate": 0.0001151969365978679, "loss": 0.0085, "step": 244200 }, { "epoch": 1.23, "learning_rate": 0.0001151893689048539, "loss": 0.0087, "step": 244210 }, { "epoch": 1.23, "learning_rate": 0.0001151818012118399, "loss": 0.0111, "step": 244220 }, { "epoch": 1.23, "learning_rate": 0.00011517423351882588, "loss": 0.0085, "step": 244230 }, { "epoch": 1.23, "learning_rate": 0.00011516666582581187, "loss": 0.0106, "step": 244240 }, { "epoch": 1.23, "learning_rate": 0.00011515909813279787, "loss": 0.0089, "step": 244250 }, { "epoch": 1.23, "learning_rate": 0.00011515153043978385, "loss": 0.0116, "step": 244260 }, { "epoch": 1.23, "learning_rate": 0.00011514396274676984, "loss": 0.009, "step": 244270 }, { "epoch": 1.23, "learning_rate": 0.00011513639505375583, "loss": 0.0083, "step": 244280 }, { "epoch": 1.23, "learning_rate": 0.00011512882736074182, "loss": 0.0093, "step": 244290 }, { "epoch": 1.23, "learning_rate": 0.00011512125966772782, "loss": 0.0078, "step": 244300 }, { "epoch": 1.23, "learning_rate": 0.0001151136919747138, "loss": 0.0082, "step": 244310 }, { "epoch": 1.23, "learning_rate": 0.00011510612428169979, "loss": 0.0081, "step": 244320 }, { "epoch": 1.23, "learning_rate": 0.00011509855658868579, "loss": 0.0124, "step": 244330 }, { "epoch": 1.23, "learning_rate": 0.00011509098889567177, "loss": 0.0068, "step": 244340 }, { "epoch": 1.23, "learning_rate": 0.00011508342120265776, "loss": 0.01, "step": 244350 }, { "epoch": 1.23, "learning_rate": 0.00011507585350964374, "loss": 0.0093, "step": 244360 }, { "epoch": 1.23, "learning_rate": 0.00011506828581662974, "loss": 0.0085, "step": 244370 }, { "epoch": 1.23, "learning_rate": 0.00011506071812361573, "loss": 0.0086, "step": 244380 }, { "epoch": 1.23, "learning_rate": 0.00011505315043060172, "loss": 0.009, "step": 244390 }, { "epoch": 1.23, "learning_rate": 0.00011504558273758771, "loss": 0.0076, "step": 244400 }, { "epoch": 1.23, "learning_rate": 0.0001150380150445737, "loss": 0.0076, "step": 244410 }, { "epoch": 1.23, "learning_rate": 0.00011503044735155969, "loss": 0.0121, "step": 244420 }, { "epoch": 1.23, "learning_rate": 0.00011502287965854568, "loss": 0.0088, "step": 244430 }, { "epoch": 1.23, "learning_rate": 0.00011501531196553166, "loss": 0.0085, "step": 244440 }, { "epoch": 1.23, "learning_rate": 0.00011500774427251766, "loss": 0.0091, "step": 244450 }, { "epoch": 1.23, "learning_rate": 0.00011500017657950365, "loss": 0.0089, "step": 244460 }, { "epoch": 1.23, "learning_rate": 0.00011499260888648964, "loss": 0.0087, "step": 244470 }, { "epoch": 1.23, "learning_rate": 0.00011498504119347563, "loss": 0.0099, "step": 244480 }, { "epoch": 1.23, "learning_rate": 0.00011497747350046163, "loss": 0.0102, "step": 244490 }, { "epoch": 1.23, "learning_rate": 0.0001149699058074476, "loss": 0.0073, "step": 244500 }, { "epoch": 1.23, "learning_rate": 0.0001149623381144336, "loss": 0.013, "step": 244510 }, { "epoch": 1.23, "learning_rate": 0.00011495477042141958, "loss": 0.0087, "step": 244520 }, { "epoch": 1.23, "learning_rate": 0.00011494720272840558, "loss": 0.0093, "step": 244530 }, { "epoch": 1.23, "learning_rate": 0.00011493963503539157, "loss": 0.0091, "step": 244540 }, { "epoch": 1.23, "learning_rate": 0.00011493206734237755, "loss": 0.0103, "step": 244550 }, { "epoch": 1.23, "learning_rate": 0.00011492449964936355, "loss": 0.0096, "step": 244560 }, { "epoch": 1.23, "learning_rate": 0.00011491693195634954, "loss": 0.0086, "step": 244570 }, { "epoch": 1.23, "learning_rate": 0.00011490936426333553, "loss": 0.0098, "step": 244580 }, { "epoch": 1.23, "learning_rate": 0.00011490179657032152, "loss": 0.0086, "step": 244590 }, { "epoch": 1.23, "learning_rate": 0.00011489422887730752, "loss": 0.0095, "step": 244600 }, { "epoch": 1.23, "learning_rate": 0.0001148866611842935, "loss": 0.0092, "step": 244610 }, { "epoch": 1.23, "learning_rate": 0.00011487909349127949, "loss": 0.0092, "step": 244620 }, { "epoch": 1.23, "learning_rate": 0.00011487152579826547, "loss": 0.0105, "step": 244630 }, { "epoch": 1.23, "learning_rate": 0.00011486395810525147, "loss": 0.009, "step": 244640 }, { "epoch": 1.23, "learning_rate": 0.00011485639041223746, "loss": 0.0071, "step": 244650 }, { "epoch": 1.23, "learning_rate": 0.00011484882271922345, "loss": 0.0095, "step": 244660 }, { "epoch": 1.23, "learning_rate": 0.00011484125502620944, "loss": 0.0117, "step": 244670 }, { "epoch": 1.23, "learning_rate": 0.00011483368733319544, "loss": 0.0106, "step": 244680 }, { "epoch": 1.23, "learning_rate": 0.00011482611964018142, "loss": 0.0073, "step": 244690 }, { "epoch": 1.23, "learning_rate": 0.00011481855194716741, "loss": 0.0073, "step": 244700 }, { "epoch": 1.23, "learning_rate": 0.00011481098425415339, "loss": 0.0147, "step": 244710 }, { "epoch": 1.23, "learning_rate": 0.00011480341656113939, "loss": 0.01, "step": 244720 }, { "epoch": 1.23, "learning_rate": 0.00011479584886812538, "loss": 0.0083, "step": 244730 }, { "epoch": 1.23, "learning_rate": 0.00011478828117511136, "loss": 0.0085, "step": 244740 }, { "epoch": 1.23, "learning_rate": 0.00011478071348209736, "loss": 0.0076, "step": 244750 }, { "epoch": 1.23, "learning_rate": 0.00011477314578908335, "loss": 0.0077, "step": 244760 }, { "epoch": 1.23, "learning_rate": 0.00011476557809606934, "loss": 0.0118, "step": 244770 }, { "epoch": 1.23, "learning_rate": 0.00011475801040305532, "loss": 0.0099, "step": 244780 }, { "epoch": 1.23, "learning_rate": 0.0001147504427100413, "loss": 0.0101, "step": 244790 }, { "epoch": 1.24, "learning_rate": 0.0001147428750170273, "loss": 0.0093, "step": 244800 }, { "epoch": 1.24, "learning_rate": 0.00011473530732401328, "loss": 0.0073, "step": 244810 }, { "epoch": 1.24, "learning_rate": 0.00011472773963099927, "loss": 0.0087, "step": 244820 }, { "epoch": 1.24, "learning_rate": 0.00011472017193798527, "loss": 0.009, "step": 244830 }, { "epoch": 1.24, "learning_rate": 0.00011471260424497125, "loss": 0.0075, "step": 244840 }, { "epoch": 1.24, "learning_rate": 0.00011470503655195724, "loss": 0.0085, "step": 244850 }, { "epoch": 1.24, "learning_rate": 0.00011469746885894324, "loss": 0.0088, "step": 244860 }, { "epoch": 1.24, "learning_rate": 0.00011468990116592922, "loss": 0.0071, "step": 244870 }, { "epoch": 1.24, "learning_rate": 0.00011468233347291521, "loss": 0.0079, "step": 244880 }, { "epoch": 1.24, "learning_rate": 0.0001146747657799012, "loss": 0.0101, "step": 244890 }, { "epoch": 1.24, "learning_rate": 0.00011466719808688719, "loss": 0.0074, "step": 244900 }, { "epoch": 1.24, "learning_rate": 0.00011465963039387318, "loss": 0.0117, "step": 244910 }, { "epoch": 1.24, "learning_rate": 0.00011465206270085917, "loss": 0.0089, "step": 244920 }, { "epoch": 1.24, "learning_rate": 0.00011464449500784516, "loss": 0.0079, "step": 244930 }, { "epoch": 1.24, "learning_rate": 0.00011463692731483116, "loss": 0.0119, "step": 244940 }, { "epoch": 1.24, "learning_rate": 0.00011462935962181714, "loss": 0.0103, "step": 244950 }, { "epoch": 1.24, "learning_rate": 0.00011462179192880313, "loss": 0.0083, "step": 244960 }, { "epoch": 1.24, "learning_rate": 0.00011461422423578911, "loss": 0.0081, "step": 244970 }, { "epoch": 1.24, "learning_rate": 0.00011460665654277511, "loss": 0.0092, "step": 244980 }, { "epoch": 1.24, "learning_rate": 0.0001145990888497611, "loss": 0.0088, "step": 244990 }, { "epoch": 1.24, "learning_rate": 0.00011459152115674709, "loss": 0.0093, "step": 245000 }, { "epoch": 1.24, "eval_cer": 0.9144741374876638, "eval_loss": 0.006758058909326792, "eval_runtime": 115.9822, "eval_samples_per_second": 17.244, "eval_steps_per_second": 4.311, "step": 245000 }, { "epoch": 1.24, "learning_rate": 0.00011458395346373308, "loss": 0.0081, "step": 245010 }, { "epoch": 1.24, "learning_rate": 0.00011457638577071908, "loss": 0.0073, "step": 245020 }, { "epoch": 1.24, "learning_rate": 0.00011456881807770506, "loss": 0.0077, "step": 245030 }, { "epoch": 1.24, "learning_rate": 0.00011456125038469105, "loss": 0.0079, "step": 245040 }, { "epoch": 1.24, "learning_rate": 0.00011455368269167705, "loss": 0.007, "step": 245050 }, { "epoch": 1.24, "learning_rate": 0.00011454611499866303, "loss": 0.0085, "step": 245060 }, { "epoch": 1.24, "learning_rate": 0.00011453854730564902, "loss": 0.0083, "step": 245070 }, { "epoch": 1.24, "learning_rate": 0.000114530979612635, "loss": 0.0075, "step": 245080 }, { "epoch": 1.24, "learning_rate": 0.000114523411919621, "loss": 0.0091, "step": 245090 }, { "epoch": 1.24, "learning_rate": 0.000114515844226607, "loss": 0.011, "step": 245100 }, { "epoch": 1.24, "learning_rate": 0.00011450827653359298, "loss": 0.008, "step": 245110 }, { "epoch": 1.24, "learning_rate": 0.00011450070884057897, "loss": 0.0092, "step": 245120 }, { "epoch": 1.24, "learning_rate": 0.00011449314114756497, "loss": 0.0094, "step": 245130 }, { "epoch": 1.24, "learning_rate": 0.00011448557345455095, "loss": 0.0102, "step": 245140 }, { "epoch": 1.24, "learning_rate": 0.00011447800576153694, "loss": 0.0085, "step": 245150 }, { "epoch": 1.24, "learning_rate": 0.00011447043806852292, "loss": 0.0099, "step": 245160 }, { "epoch": 1.24, "learning_rate": 0.00011446287037550892, "loss": 0.0073, "step": 245170 }, { "epoch": 1.24, "learning_rate": 0.00011445530268249491, "loss": 0.0094, "step": 245180 }, { "epoch": 1.24, "learning_rate": 0.0001144477349894809, "loss": 0.0084, "step": 245190 }, { "epoch": 1.24, "learning_rate": 0.00011444016729646689, "loss": 0.0087, "step": 245200 }, { "epoch": 1.24, "learning_rate": 0.00011443259960345289, "loss": 0.0093, "step": 245210 }, { "epoch": 1.24, "learning_rate": 0.00011442503191043887, "loss": 0.0103, "step": 245220 }, { "epoch": 1.24, "learning_rate": 0.00011441746421742486, "loss": 0.0085, "step": 245230 }, { "epoch": 1.24, "learning_rate": 0.00011440989652441084, "loss": 0.0087, "step": 245240 }, { "epoch": 1.24, "learning_rate": 0.00011440232883139684, "loss": 0.0089, "step": 245250 }, { "epoch": 1.24, "learning_rate": 0.00011439476113838283, "loss": 0.0092, "step": 245260 }, { "epoch": 1.24, "learning_rate": 0.00011438719344536881, "loss": 0.0082, "step": 245270 }, { "epoch": 1.24, "learning_rate": 0.00011437962575235481, "loss": 0.0095, "step": 245280 }, { "epoch": 1.24, "learning_rate": 0.0001143720580593408, "loss": 0.0092, "step": 245290 }, { "epoch": 1.24, "learning_rate": 0.00011436449036632679, "loss": 0.0118, "step": 245300 }, { "epoch": 1.24, "learning_rate": 0.00011435692267331278, "loss": 0.0076, "step": 245310 }, { "epoch": 1.24, "learning_rate": 0.00011434935498029876, "loss": 0.0085, "step": 245320 }, { "epoch": 1.24, "learning_rate": 0.00011434178728728476, "loss": 0.0175, "step": 245330 }, { "epoch": 1.24, "learning_rate": 0.00011433421959427075, "loss": 0.0096, "step": 245340 }, { "epoch": 1.24, "learning_rate": 0.00011432665190125673, "loss": 0.009, "step": 245350 }, { "epoch": 1.24, "learning_rate": 0.00011431908420824273, "loss": 0.0069, "step": 245360 }, { "epoch": 1.24, "learning_rate": 0.00011431151651522872, "loss": 0.0088, "step": 245370 }, { "epoch": 1.24, "learning_rate": 0.0001143039488222147, "loss": 0.0099, "step": 245380 }, { "epoch": 1.24, "learning_rate": 0.0001142963811292007, "loss": 0.0097, "step": 245390 }, { "epoch": 1.24, "learning_rate": 0.00011428881343618668, "loss": 0.007, "step": 245400 }, { "epoch": 1.24, "learning_rate": 0.00011428124574317266, "loss": 0.0089, "step": 245410 }, { "epoch": 1.24, "learning_rate": 0.00011427367805015864, "loss": 0.0078, "step": 245420 }, { "epoch": 1.24, "learning_rate": 0.00011426611035714464, "loss": 0.0098, "step": 245430 }, { "epoch": 1.24, "learning_rate": 0.00011425854266413063, "loss": 0.0104, "step": 245440 }, { "epoch": 1.24, "learning_rate": 0.00011425097497111662, "loss": 0.008, "step": 245450 }, { "epoch": 1.24, "learning_rate": 0.00011424340727810261, "loss": 0.0094, "step": 245460 }, { "epoch": 1.24, "learning_rate": 0.0001142358395850886, "loss": 0.0083, "step": 245470 }, { "epoch": 1.24, "learning_rate": 0.00011422827189207459, "loss": 0.0099, "step": 245480 }, { "epoch": 1.24, "learning_rate": 0.00011422070419906058, "loss": 0.0099, "step": 245490 }, { "epoch": 1.24, "learning_rate": 0.00011421313650604658, "loss": 0.0114, "step": 245500 }, { "epoch": 1.24, "learning_rate": 0.00011420556881303256, "loss": 0.0087, "step": 245510 }, { "epoch": 1.24, "learning_rate": 0.00011419800112001855, "loss": 0.0078, "step": 245520 }, { "epoch": 1.24, "learning_rate": 0.00011419043342700454, "loss": 0.0087, "step": 245530 }, { "epoch": 1.24, "learning_rate": 0.00011418286573399053, "loss": 0.0088, "step": 245540 }, { "epoch": 1.24, "learning_rate": 0.00011417529804097653, "loss": 0.0097, "step": 245550 }, { "epoch": 1.24, "learning_rate": 0.00011416773034796251, "loss": 0.0084, "step": 245560 }, { "epoch": 1.24, "learning_rate": 0.0001141601626549485, "loss": 0.009, "step": 245570 }, { "epoch": 1.24, "learning_rate": 0.0001141525949619345, "loss": 0.009, "step": 245580 }, { "epoch": 1.24, "learning_rate": 0.00011414502726892048, "loss": 0.0068, "step": 245590 }, { "epoch": 1.24, "learning_rate": 0.00011413745957590647, "loss": 0.0081, "step": 245600 }, { "epoch": 1.24, "learning_rate": 0.00011412989188289245, "loss": 0.0078, "step": 245610 }, { "epoch": 1.24, "learning_rate": 0.00011412232418987845, "loss": 0.0099, "step": 245620 }, { "epoch": 1.24, "learning_rate": 0.00011411475649686444, "loss": 0.0121, "step": 245630 }, { "epoch": 1.24, "learning_rate": 0.00011410718880385043, "loss": 0.0116, "step": 245640 }, { "epoch": 1.24, "learning_rate": 0.00011409962111083642, "loss": 0.0088, "step": 245650 }, { "epoch": 1.24, "learning_rate": 0.00011409205341782242, "loss": 0.0087, "step": 245660 }, { "epoch": 1.24, "learning_rate": 0.0001140844857248084, "loss": 0.0069, "step": 245670 }, { "epoch": 1.24, "learning_rate": 0.00011407691803179439, "loss": 0.0077, "step": 245680 }, { "epoch": 1.24, "learning_rate": 0.00011406935033878037, "loss": 0.0086, "step": 245690 }, { "epoch": 1.24, "learning_rate": 0.00011406178264576637, "loss": 0.008, "step": 245700 }, { "epoch": 1.24, "learning_rate": 0.00011405421495275236, "loss": 0.0081, "step": 245710 }, { "epoch": 1.24, "learning_rate": 0.00011404664725973835, "loss": 0.0077, "step": 245720 }, { "epoch": 1.24, "learning_rate": 0.00011403907956672434, "loss": 0.0108, "step": 245730 }, { "epoch": 1.24, "learning_rate": 0.00011403151187371034, "loss": 0.0085, "step": 245740 }, { "epoch": 1.24, "learning_rate": 0.00011402394418069632, "loss": 0.0094, "step": 245750 }, { "epoch": 1.24, "learning_rate": 0.00011401637648768231, "loss": 0.0082, "step": 245760 }, { "epoch": 1.24, "learning_rate": 0.0001140088087946683, "loss": 0.0068, "step": 245770 }, { "epoch": 1.24, "learning_rate": 0.00011400124110165429, "loss": 0.0072, "step": 245780 }, { "epoch": 1.24, "learning_rate": 0.00011399367340864028, "loss": 0.008, "step": 245790 }, { "epoch": 1.24, "learning_rate": 0.00011398610571562626, "loss": 0.0109, "step": 245800 }, { "epoch": 1.24, "learning_rate": 0.00011397853802261226, "loss": 0.0073, "step": 245810 }, { "epoch": 1.24, "learning_rate": 0.00011397097032959825, "loss": 0.0092, "step": 245820 }, { "epoch": 1.24, "learning_rate": 0.00011396340263658424, "loss": 0.0086, "step": 245830 }, { "epoch": 1.24, "learning_rate": 0.00011395583494357023, "loss": 0.0068, "step": 245840 }, { "epoch": 1.24, "learning_rate": 0.00011394826725055621, "loss": 0.0118, "step": 245850 }, { "epoch": 1.24, "learning_rate": 0.00011394069955754221, "loss": 0.0098, "step": 245860 }, { "epoch": 1.24, "learning_rate": 0.0001139331318645282, "loss": 0.0093, "step": 245870 }, { "epoch": 1.24, "learning_rate": 0.00011392556417151418, "loss": 0.0087, "step": 245880 }, { "epoch": 1.24, "learning_rate": 0.00011391799647850018, "loss": 0.0084, "step": 245890 }, { "epoch": 1.24, "learning_rate": 0.00011391042878548617, "loss": 0.0091, "step": 245900 }, { "epoch": 1.24, "learning_rate": 0.00011390286109247216, "loss": 0.0074, "step": 245910 }, { "epoch": 1.24, "learning_rate": 0.00011389529339945815, "loss": 0.0078, "step": 245920 }, { "epoch": 1.24, "learning_rate": 0.00011388772570644413, "loss": 0.0077, "step": 245930 }, { "epoch": 1.24, "learning_rate": 0.00011388015801343013, "loss": 0.0085, "step": 245940 }, { "epoch": 1.24, "learning_rate": 0.00011387259032041612, "loss": 0.0089, "step": 245950 }, { "epoch": 1.24, "learning_rate": 0.0001138650226274021, "loss": 0.0082, "step": 245960 }, { "epoch": 1.24, "learning_rate": 0.0001138574549343881, "loss": 0.0077, "step": 245970 }, { "epoch": 1.24, "learning_rate": 0.0001138498872413741, "loss": 0.0091, "step": 245980 }, { "epoch": 1.24, "learning_rate": 0.00011384231954836007, "loss": 0.0083, "step": 245990 }, { "epoch": 1.24, "learning_rate": 0.00011383475185534607, "loss": 0.0084, "step": 246000 }, { "epoch": 1.24, "eval_cer": 0.9144343512465224, "eval_loss": 0.006622600369155407, "eval_runtime": 115.7041, "eval_samples_per_second": 17.285, "eval_steps_per_second": 4.321, "step": 246000 }, { "epoch": 1.24, "learning_rate": 0.00011382718416233205, "loss": 0.0117, "step": 246010 }, { "epoch": 1.24, "learning_rate": 0.00011381961646931805, "loss": 0.011, "step": 246020 }, { "epoch": 1.24, "learning_rate": 0.00011381204877630404, "loss": 0.009, "step": 246030 }, { "epoch": 1.24, "learning_rate": 0.00011380448108329001, "loss": 0.009, "step": 246040 }, { "epoch": 1.24, "learning_rate": 0.000113796913390276, "loss": 0.0117, "step": 246050 }, { "epoch": 1.24, "learning_rate": 0.00011378934569726199, "loss": 0.0121, "step": 246060 }, { "epoch": 1.24, "learning_rate": 0.00011378177800424798, "loss": 0.0087, "step": 246070 }, { "epoch": 1.24, "learning_rate": 0.00011377421031123398, "loss": 0.0069, "step": 246080 }, { "epoch": 1.24, "learning_rate": 0.00011376664261821996, "loss": 0.0072, "step": 246090 }, { "epoch": 1.24, "learning_rate": 0.00011375907492520595, "loss": 0.009, "step": 246100 }, { "epoch": 1.24, "learning_rate": 0.00011375150723219195, "loss": 0.0082, "step": 246110 }, { "epoch": 1.24, "learning_rate": 0.00011374393953917793, "loss": 0.0083, "step": 246120 }, { "epoch": 1.24, "learning_rate": 0.00011373637184616392, "loss": 0.0108, "step": 246130 }, { "epoch": 1.24, "learning_rate": 0.0001137288041531499, "loss": 0.0092, "step": 246140 }, { "epoch": 1.24, "learning_rate": 0.0001137212364601359, "loss": 0.0074, "step": 246150 }, { "epoch": 1.24, "learning_rate": 0.0001137136687671219, "loss": 0.0091, "step": 246160 }, { "epoch": 1.24, "learning_rate": 0.00011370610107410788, "loss": 0.0083, "step": 246170 }, { "epoch": 1.24, "learning_rate": 0.00011369853338109387, "loss": 0.0102, "step": 246180 }, { "epoch": 1.24, "learning_rate": 0.00011369096568807987, "loss": 0.0095, "step": 246190 }, { "epoch": 1.24, "learning_rate": 0.00011368339799506585, "loss": 0.0086, "step": 246200 }, { "epoch": 1.24, "learning_rate": 0.00011367583030205184, "loss": 0.0094, "step": 246210 }, { "epoch": 1.24, "learning_rate": 0.00011366826260903782, "loss": 0.0091, "step": 246220 }, { "epoch": 1.24, "learning_rate": 0.00011366069491602382, "loss": 0.0078, "step": 246230 }, { "epoch": 1.24, "learning_rate": 0.00011365312722300981, "loss": 0.0105, "step": 246240 }, { "epoch": 1.24, "learning_rate": 0.0001136455595299958, "loss": 0.0097, "step": 246250 }, { "epoch": 1.24, "learning_rate": 0.00011363799183698179, "loss": 0.0107, "step": 246260 }, { "epoch": 1.24, "learning_rate": 0.00011363042414396779, "loss": 0.0089, "step": 246270 }, { "epoch": 1.24, "learning_rate": 0.00011362285645095377, "loss": 0.0098, "step": 246280 }, { "epoch": 1.24, "learning_rate": 0.00011361528875793976, "loss": 0.012, "step": 246290 }, { "epoch": 1.24, "learning_rate": 0.00011360772106492574, "loss": 0.0097, "step": 246300 }, { "epoch": 1.24, "learning_rate": 0.00011360015337191174, "loss": 0.0083, "step": 246310 }, { "epoch": 1.24, "learning_rate": 0.00011359258567889773, "loss": 0.0079, "step": 246320 }, { "epoch": 1.24, "learning_rate": 0.00011358501798588371, "loss": 0.0103, "step": 246330 }, { "epoch": 1.24, "learning_rate": 0.00011357745029286971, "loss": 0.0075, "step": 246340 }, { "epoch": 1.24, "learning_rate": 0.0001135698825998557, "loss": 0.007, "step": 246350 }, { "epoch": 1.24, "learning_rate": 0.00011356231490684169, "loss": 0.0092, "step": 246360 }, { "epoch": 1.24, "learning_rate": 0.00011355474721382768, "loss": 0.01, "step": 246370 }, { "epoch": 1.24, "learning_rate": 0.00011354717952081366, "loss": 0.0113, "step": 246380 }, { "epoch": 1.24, "learning_rate": 0.00011353961182779966, "loss": 0.0075, "step": 246390 }, { "epoch": 1.24, "learning_rate": 0.00011353204413478565, "loss": 0.0083, "step": 246400 }, { "epoch": 1.24, "learning_rate": 0.00011352447644177163, "loss": 0.0071, "step": 246410 }, { "epoch": 1.24, "learning_rate": 0.00011351690874875763, "loss": 0.0095, "step": 246420 }, { "epoch": 1.24, "learning_rate": 0.00011350934105574362, "loss": 0.0113, "step": 246430 }, { "epoch": 1.24, "learning_rate": 0.0001135017733627296, "loss": 0.0079, "step": 246440 }, { "epoch": 1.24, "learning_rate": 0.0001134942056697156, "loss": 0.01, "step": 246450 }, { "epoch": 1.24, "learning_rate": 0.00011348663797670158, "loss": 0.0087, "step": 246460 }, { "epoch": 1.24, "learning_rate": 0.00011347907028368758, "loss": 0.0081, "step": 246470 }, { "epoch": 1.24, "learning_rate": 0.00011347150259067357, "loss": 0.0097, "step": 246480 }, { "epoch": 1.24, "learning_rate": 0.00011346393489765955, "loss": 0.0094, "step": 246490 }, { "epoch": 1.24, "learning_rate": 0.00011345636720464555, "loss": 0.0087, "step": 246500 }, { "epoch": 1.24, "learning_rate": 0.00011344879951163154, "loss": 0.0078, "step": 246510 }, { "epoch": 1.24, "learning_rate": 0.00011344123181861753, "loss": 0.0095, "step": 246520 }, { "epoch": 1.24, "learning_rate": 0.00011343366412560352, "loss": 0.0107, "step": 246530 }, { "epoch": 1.24, "learning_rate": 0.00011342609643258952, "loss": 0.0082, "step": 246540 }, { "epoch": 1.24, "learning_rate": 0.0001134185287395755, "loss": 0.0086, "step": 246550 }, { "epoch": 1.24, "learning_rate": 0.00011341096104656149, "loss": 0.0064, "step": 246560 }, { "epoch": 1.24, "learning_rate": 0.00011340339335354747, "loss": 0.0116, "step": 246570 }, { "epoch": 1.24, "learning_rate": 0.00011339582566053347, "loss": 0.0077, "step": 246580 }, { "epoch": 1.24, "learning_rate": 0.00011338825796751946, "loss": 0.0114, "step": 246590 }, { "epoch": 1.24, "learning_rate": 0.00011338069027450544, "loss": 0.0078, "step": 246600 }, { "epoch": 1.24, "learning_rate": 0.00011337312258149144, "loss": 0.0086, "step": 246610 }, { "epoch": 1.24, "learning_rate": 0.00011336555488847743, "loss": 0.0109, "step": 246620 }, { "epoch": 1.24, "learning_rate": 0.00011335798719546342, "loss": 0.0097, "step": 246630 }, { "epoch": 1.24, "learning_rate": 0.00011335041950244941, "loss": 0.0087, "step": 246640 }, { "epoch": 1.24, "learning_rate": 0.00011334285180943539, "loss": 0.0085, "step": 246650 }, { "epoch": 1.24, "learning_rate": 0.00011333528411642139, "loss": 0.0071, "step": 246660 }, { "epoch": 1.24, "learning_rate": 0.00011332771642340736, "loss": 0.0083, "step": 246670 }, { "epoch": 1.24, "learning_rate": 0.00011332014873039335, "loss": 0.0093, "step": 246680 }, { "epoch": 1.24, "learning_rate": 0.00011331258103737935, "loss": 0.0078, "step": 246690 }, { "epoch": 1.24, "learning_rate": 0.00011330501334436533, "loss": 0.0088, "step": 246700 }, { "epoch": 1.24, "learning_rate": 0.00011329744565135132, "loss": 0.0079, "step": 246710 }, { "epoch": 1.24, "learning_rate": 0.00011328987795833732, "loss": 0.0111, "step": 246720 }, { "epoch": 1.24, "learning_rate": 0.0001132823102653233, "loss": 0.0111, "step": 246730 }, { "epoch": 1.24, "learning_rate": 0.00011327474257230929, "loss": 0.0091, "step": 246740 }, { "epoch": 1.24, "learning_rate": 0.00011326717487929527, "loss": 0.0078, "step": 246750 }, { "epoch": 1.24, "learning_rate": 0.00011325960718628127, "loss": 0.0083, "step": 246760 }, { "epoch": 1.24, "learning_rate": 0.00011325203949326726, "loss": 0.0069, "step": 246770 }, { "epoch": 1.25, "learning_rate": 0.00011324447180025325, "loss": 0.0077, "step": 246780 }, { "epoch": 1.25, "learning_rate": 0.00011323690410723924, "loss": 0.0096, "step": 246790 }, { "epoch": 1.25, "learning_rate": 0.00011322933641422524, "loss": 0.0079, "step": 246800 }, { "epoch": 1.25, "learning_rate": 0.00011322176872121122, "loss": 0.0104, "step": 246810 }, { "epoch": 1.25, "learning_rate": 0.00011321420102819721, "loss": 0.0072, "step": 246820 }, { "epoch": 1.25, "learning_rate": 0.0001132066333351832, "loss": 0.0076, "step": 246830 }, { "epoch": 1.25, "learning_rate": 0.00011319906564216919, "loss": 0.0087, "step": 246840 }, { "epoch": 1.25, "learning_rate": 0.00011319149794915518, "loss": 0.0078, "step": 246850 }, { "epoch": 1.25, "learning_rate": 0.00011318393025614117, "loss": 0.0085, "step": 246860 }, { "epoch": 1.25, "learning_rate": 0.00011317636256312716, "loss": 0.008, "step": 246870 }, { "epoch": 1.25, "learning_rate": 0.00011316879487011316, "loss": 0.0088, "step": 246880 }, { "epoch": 1.25, "learning_rate": 0.00011316122717709914, "loss": 0.0074, "step": 246890 }, { "epoch": 1.25, "learning_rate": 0.00011315365948408513, "loss": 0.0087, "step": 246900 }, { "epoch": 1.25, "learning_rate": 0.00011314609179107111, "loss": 0.0078, "step": 246910 }, { "epoch": 1.25, "learning_rate": 0.00011313852409805711, "loss": 0.0114, "step": 246920 }, { "epoch": 1.25, "learning_rate": 0.0001131309564050431, "loss": 0.0079, "step": 246930 }, { "epoch": 1.25, "learning_rate": 0.00011312338871202908, "loss": 0.0084, "step": 246940 }, { "epoch": 1.25, "learning_rate": 0.00011311582101901508, "loss": 0.0083, "step": 246950 }, { "epoch": 1.25, "learning_rate": 0.00011310825332600107, "loss": 0.0092, "step": 246960 }, { "epoch": 1.25, "learning_rate": 0.00011310068563298706, "loss": 0.0094, "step": 246970 }, { "epoch": 1.25, "learning_rate": 0.00011309311793997305, "loss": 0.0071, "step": 246980 }, { "epoch": 1.25, "learning_rate": 0.00011308555024695905, "loss": 0.0085, "step": 246990 }, { "epoch": 1.25, "learning_rate": 0.00011307798255394503, "loss": 0.0074, "step": 247000 }, { "epoch": 1.25, "eval_cer": 0.914457640753532, "eval_loss": 0.0065944562666118145, "eval_runtime": 115.9058, "eval_samples_per_second": 17.255, "eval_steps_per_second": 4.314, "step": 247000 }, { "epoch": 1.25, "learning_rate": 0.00011307041486093102, "loss": 0.0071, "step": 247010 }, { "epoch": 1.25, "learning_rate": 0.000113062847167917, "loss": 0.0072, "step": 247020 }, { "epoch": 1.25, "learning_rate": 0.000113055279474903, "loss": 0.0116, "step": 247030 }, { "epoch": 1.25, "learning_rate": 0.000113047711781889, "loss": 0.0117, "step": 247040 }, { "epoch": 1.25, "learning_rate": 0.00011304014408887498, "loss": 0.0084, "step": 247050 }, { "epoch": 1.25, "learning_rate": 0.00011303257639586097, "loss": 0.0063, "step": 247060 }, { "epoch": 1.25, "learning_rate": 0.00011302500870284697, "loss": 0.0082, "step": 247070 }, { "epoch": 1.25, "learning_rate": 0.00011301744100983295, "loss": 0.0065, "step": 247080 }, { "epoch": 1.25, "learning_rate": 0.00011300987331681894, "loss": 0.0079, "step": 247090 }, { "epoch": 1.25, "learning_rate": 0.00011300230562380492, "loss": 0.0095, "step": 247100 }, { "epoch": 1.25, "learning_rate": 0.00011299473793079092, "loss": 0.0101, "step": 247110 }, { "epoch": 1.25, "learning_rate": 0.00011298717023777691, "loss": 0.0083, "step": 247120 }, { "epoch": 1.25, "learning_rate": 0.0001129796025447629, "loss": 0.0125, "step": 247130 }, { "epoch": 1.25, "learning_rate": 0.00011297203485174889, "loss": 0.0077, "step": 247140 }, { "epoch": 1.25, "learning_rate": 0.00011296446715873488, "loss": 0.013, "step": 247150 }, { "epoch": 1.25, "learning_rate": 0.00011295689946572087, "loss": 0.0101, "step": 247160 }, { "epoch": 1.25, "learning_rate": 0.00011294933177270686, "loss": 0.0075, "step": 247170 }, { "epoch": 1.25, "learning_rate": 0.00011294176407969284, "loss": 0.0093, "step": 247180 }, { "epoch": 1.25, "learning_rate": 0.00011293419638667884, "loss": 0.0076, "step": 247190 }, { "epoch": 1.25, "learning_rate": 0.00011292662869366483, "loss": 0.0078, "step": 247200 }, { "epoch": 1.25, "learning_rate": 0.00011291906100065081, "loss": 0.0093, "step": 247210 }, { "epoch": 1.25, "learning_rate": 0.00011291149330763681, "loss": 0.0114, "step": 247220 }, { "epoch": 1.25, "learning_rate": 0.0001129039256146228, "loss": 0.0104, "step": 247230 }, { "epoch": 1.25, "learning_rate": 0.00011289635792160879, "loss": 0.0094, "step": 247240 }, { "epoch": 1.25, "learning_rate": 0.00011288879022859478, "loss": 0.0088, "step": 247250 }, { "epoch": 1.25, "learning_rate": 0.00011288122253558076, "loss": 0.0096, "step": 247260 }, { "epoch": 1.25, "learning_rate": 0.00011287365484256676, "loss": 0.0067, "step": 247270 }, { "epoch": 1.25, "learning_rate": 0.00011286608714955275, "loss": 0.0094, "step": 247280 }, { "epoch": 1.25, "learning_rate": 0.00011285851945653873, "loss": 0.0072, "step": 247290 }, { "epoch": 1.25, "learning_rate": 0.00011285095176352471, "loss": 0.0096, "step": 247300 }, { "epoch": 1.25, "learning_rate": 0.0001128433840705107, "loss": 0.0096, "step": 247310 }, { "epoch": 1.25, "learning_rate": 0.00011283581637749669, "loss": 0.0072, "step": 247320 }, { "epoch": 1.25, "learning_rate": 0.00011282824868448269, "loss": 0.0112, "step": 247330 }, { "epoch": 1.25, "learning_rate": 0.00011282068099146867, "loss": 0.0096, "step": 247340 }, { "epoch": 1.25, "learning_rate": 0.00011281311329845466, "loss": 0.0078, "step": 247350 }, { "epoch": 1.25, "learning_rate": 0.00011280554560544064, "loss": 0.0086, "step": 247360 }, { "epoch": 1.25, "learning_rate": 0.00011279797791242664, "loss": 0.007, "step": 247370 }, { "epoch": 1.25, "learning_rate": 0.00011279041021941263, "loss": 0.0093, "step": 247380 }, { "epoch": 1.25, "learning_rate": 0.00011278284252639862, "loss": 0.0105, "step": 247390 }, { "epoch": 1.25, "learning_rate": 0.00011277527483338461, "loss": 0.0089, "step": 247400 }, { "epoch": 1.25, "learning_rate": 0.0001127677071403706, "loss": 0.0075, "step": 247410 }, { "epoch": 1.25, "learning_rate": 0.00011276013944735659, "loss": 0.0084, "step": 247420 }, { "epoch": 1.25, "learning_rate": 0.00011275257175434258, "loss": 0.0072, "step": 247430 }, { "epoch": 1.25, "learning_rate": 0.00011274500406132858, "loss": 0.0094, "step": 247440 }, { "epoch": 1.25, "learning_rate": 0.00011273743636831456, "loss": 0.0073, "step": 247450 }, { "epoch": 1.25, "learning_rate": 0.00011272986867530055, "loss": 0.0092, "step": 247460 }, { "epoch": 1.25, "learning_rate": 0.00011272230098228653, "loss": 0.0097, "step": 247470 }, { "epoch": 1.25, "learning_rate": 0.00011271473328927253, "loss": 0.0089, "step": 247480 }, { "epoch": 1.25, "learning_rate": 0.00011270716559625852, "loss": 0.0069, "step": 247490 }, { "epoch": 1.25, "learning_rate": 0.0001126995979032445, "loss": 0.0071, "step": 247500 }, { "epoch": 1.25, "learning_rate": 0.0001126920302102305, "loss": 0.0077, "step": 247510 }, { "epoch": 1.25, "learning_rate": 0.0001126844625172165, "loss": 0.0071, "step": 247520 }, { "epoch": 1.25, "learning_rate": 0.00011267689482420248, "loss": 0.013, "step": 247530 }, { "epoch": 1.25, "learning_rate": 0.00011266932713118847, "loss": 0.008, "step": 247540 }, { "epoch": 1.25, "learning_rate": 0.00011266175943817445, "loss": 0.0083, "step": 247550 }, { "epoch": 1.25, "learning_rate": 0.00011265419174516045, "loss": 0.009, "step": 247560 }, { "epoch": 1.25, "learning_rate": 0.00011264662405214644, "loss": 0.007, "step": 247570 }, { "epoch": 1.25, "learning_rate": 0.00011263905635913243, "loss": 0.0116, "step": 247580 }, { "epoch": 1.25, "learning_rate": 0.00011263148866611842, "loss": 0.0071, "step": 247590 }, { "epoch": 1.25, "learning_rate": 0.00011262392097310442, "loss": 0.0104, "step": 247600 }, { "epoch": 1.25, "learning_rate": 0.0001126163532800904, "loss": 0.0109, "step": 247610 }, { "epoch": 1.25, "learning_rate": 0.00011260878558707639, "loss": 0.0094, "step": 247620 }, { "epoch": 1.25, "learning_rate": 0.00011260121789406237, "loss": 0.0095, "step": 247630 }, { "epoch": 1.25, "learning_rate": 0.00011259365020104837, "loss": 0.0079, "step": 247640 }, { "epoch": 1.25, "learning_rate": 0.00011258608250803436, "loss": 0.0097, "step": 247650 }, { "epoch": 1.25, "learning_rate": 0.00011257851481502034, "loss": 0.0113, "step": 247660 }, { "epoch": 1.25, "learning_rate": 0.00011257094712200634, "loss": 0.0082, "step": 247670 }, { "epoch": 1.25, "learning_rate": 0.00011256337942899233, "loss": 0.0112, "step": 247680 }, { "epoch": 1.25, "learning_rate": 0.00011255581173597832, "loss": 0.0082, "step": 247690 }, { "epoch": 1.25, "learning_rate": 0.00011254824404296431, "loss": 0.0065, "step": 247700 }, { "epoch": 1.25, "learning_rate": 0.00011254067634995029, "loss": 0.0094, "step": 247710 }, { "epoch": 1.25, "learning_rate": 0.00011253310865693629, "loss": 0.0067, "step": 247720 }, { "epoch": 1.25, "learning_rate": 0.00011252554096392228, "loss": 0.0091, "step": 247730 }, { "epoch": 1.25, "learning_rate": 0.00011251797327090826, "loss": 0.0085, "step": 247740 }, { "epoch": 1.25, "learning_rate": 0.00011251040557789426, "loss": 0.007, "step": 247750 }, { "epoch": 1.25, "learning_rate": 0.00011250283788488025, "loss": 0.009, "step": 247760 }, { "epoch": 1.25, "learning_rate": 0.00011249527019186624, "loss": 0.008, "step": 247770 }, { "epoch": 1.25, "learning_rate": 0.00011248770249885223, "loss": 0.0084, "step": 247780 }, { "epoch": 1.25, "learning_rate": 0.00011248013480583821, "loss": 0.0093, "step": 247790 }, { "epoch": 1.25, "learning_rate": 0.0001124725671128242, "loss": 0.0076, "step": 247800 }, { "epoch": 1.25, "learning_rate": 0.0001124649994198102, "loss": 0.009, "step": 247810 }, { "epoch": 1.25, "learning_rate": 0.00011245743172679618, "loss": 0.0098, "step": 247820 }, { "epoch": 1.25, "learning_rate": 0.00011244986403378218, "loss": 0.0107, "step": 247830 }, { "epoch": 1.25, "learning_rate": 0.00011244229634076817, "loss": 0.009, "step": 247840 }, { "epoch": 1.25, "learning_rate": 0.00011243472864775415, "loss": 0.0113, "step": 247850 }, { "epoch": 1.25, "learning_rate": 0.00011242716095474015, "loss": 0.0066, "step": 247860 }, { "epoch": 1.25, "learning_rate": 0.00011241959326172613, "loss": 0.0096, "step": 247870 }, { "epoch": 1.25, "learning_rate": 0.00011241202556871213, "loss": 0.0104, "step": 247880 }, { "epoch": 1.25, "learning_rate": 0.00011240445787569812, "loss": 0.0082, "step": 247890 }, { "epoch": 1.25, "learning_rate": 0.0001123968901826841, "loss": 0.0103, "step": 247900 }, { "epoch": 1.25, "learning_rate": 0.0001123893224896701, "loss": 0.0089, "step": 247910 }, { "epoch": 1.25, "learning_rate": 0.00011238175479665609, "loss": 0.0091, "step": 247920 }, { "epoch": 1.25, "learning_rate": 0.00011237418710364206, "loss": 0.007, "step": 247930 }, { "epoch": 1.25, "learning_rate": 0.00011236661941062806, "loss": 0.0096, "step": 247940 }, { "epoch": 1.25, "learning_rate": 0.00011235905171761404, "loss": 0.0075, "step": 247950 }, { "epoch": 1.25, "learning_rate": 0.00011235148402460003, "loss": 0.0092, "step": 247960 }, { "epoch": 1.25, "learning_rate": 0.00011234391633158603, "loss": 0.0093, "step": 247970 }, { "epoch": 1.25, "learning_rate": 0.00011233634863857201, "loss": 0.0112, "step": 247980 }, { "epoch": 1.25, "learning_rate": 0.000112328780945558, "loss": 0.0092, "step": 247990 }, { "epoch": 1.25, "learning_rate": 0.00011232121325254398, "loss": 0.0083, "step": 248000 }, { "epoch": 1.25, "eval_cer": 0.914462492734159, "eval_loss": 0.006537660490721464, "eval_runtime": 115.8787, "eval_samples_per_second": 17.259, "eval_steps_per_second": 4.315, "step": 248000 }, { "epoch": 1.25, "learning_rate": 0.00011231364555952998, "loss": 0.0089, "step": 248010 }, { "epoch": 1.25, "learning_rate": 0.00011230607786651597, "loss": 0.01, "step": 248020 }, { "epoch": 1.25, "learning_rate": 0.00011229851017350196, "loss": 0.01, "step": 248030 }, { "epoch": 1.25, "learning_rate": 0.00011229094248048795, "loss": 0.0116, "step": 248040 }, { "epoch": 1.25, "learning_rate": 0.00011228337478747395, "loss": 0.0099, "step": 248050 }, { "epoch": 1.25, "learning_rate": 0.00011227580709445993, "loss": 0.0073, "step": 248060 }, { "epoch": 1.25, "learning_rate": 0.00011226823940144592, "loss": 0.0092, "step": 248070 }, { "epoch": 1.25, "learning_rate": 0.0001122606717084319, "loss": 0.0095, "step": 248080 }, { "epoch": 1.25, "learning_rate": 0.0001122531040154179, "loss": 0.0082, "step": 248090 }, { "epoch": 1.25, "learning_rate": 0.0001122455363224039, "loss": 0.0089, "step": 248100 }, { "epoch": 1.25, "learning_rate": 0.00011223796862938988, "loss": 0.0087, "step": 248110 }, { "epoch": 1.25, "learning_rate": 0.00011223040093637587, "loss": 0.0082, "step": 248120 }, { "epoch": 1.25, "learning_rate": 0.00011222283324336187, "loss": 0.0067, "step": 248130 }, { "epoch": 1.25, "learning_rate": 0.00011221526555034785, "loss": 0.0081, "step": 248140 }, { "epoch": 1.25, "learning_rate": 0.00011220769785733384, "loss": 0.0053, "step": 248150 }, { "epoch": 1.25, "learning_rate": 0.00011220013016431982, "loss": 0.0078, "step": 248160 }, { "epoch": 1.25, "learning_rate": 0.00011219256247130582, "loss": 0.0096, "step": 248170 }, { "epoch": 1.25, "learning_rate": 0.00011218499477829181, "loss": 0.0102, "step": 248180 }, { "epoch": 1.25, "learning_rate": 0.0001121774270852778, "loss": 0.007, "step": 248190 }, { "epoch": 1.25, "learning_rate": 0.00011216985939226379, "loss": 0.0075, "step": 248200 }, { "epoch": 1.25, "learning_rate": 0.00011216229169924978, "loss": 0.0106, "step": 248210 }, { "epoch": 1.25, "learning_rate": 0.00011215472400623577, "loss": 0.0094, "step": 248220 }, { "epoch": 1.25, "learning_rate": 0.00011214715631322176, "loss": 0.0096, "step": 248230 }, { "epoch": 1.25, "learning_rate": 0.00011213958862020774, "loss": 0.0081, "step": 248240 }, { "epoch": 1.25, "learning_rate": 0.00011213202092719374, "loss": 0.0086, "step": 248250 }, { "epoch": 1.25, "learning_rate": 0.00011212445323417973, "loss": 0.0088, "step": 248260 }, { "epoch": 1.25, "learning_rate": 0.00011211688554116571, "loss": 0.0069, "step": 248270 }, { "epoch": 1.25, "learning_rate": 0.00011210931784815171, "loss": 0.0086, "step": 248280 }, { "epoch": 1.25, "learning_rate": 0.0001121017501551377, "loss": 0.0112, "step": 248290 }, { "epoch": 1.25, "learning_rate": 0.00011209418246212369, "loss": 0.0103, "step": 248300 }, { "epoch": 1.25, "learning_rate": 0.00011208661476910968, "loss": 0.0074, "step": 248310 }, { "epoch": 1.25, "learning_rate": 0.00011207904707609566, "loss": 0.0073, "step": 248320 }, { "epoch": 1.25, "learning_rate": 0.00011207147938308166, "loss": 0.0095, "step": 248330 }, { "epoch": 1.25, "learning_rate": 0.00011206391169006765, "loss": 0.009, "step": 248340 }, { "epoch": 1.25, "learning_rate": 0.00011205634399705363, "loss": 0.0157, "step": 248350 }, { "epoch": 1.25, "learning_rate": 0.00011204877630403963, "loss": 0.0075, "step": 248360 }, { "epoch": 1.25, "learning_rate": 0.00011204120861102562, "loss": 0.0073, "step": 248370 }, { "epoch": 1.25, "learning_rate": 0.0001120336409180116, "loss": 0.0082, "step": 248380 }, { "epoch": 1.25, "learning_rate": 0.0001120260732249976, "loss": 0.0088, "step": 248390 }, { "epoch": 1.25, "learning_rate": 0.00011201850553198358, "loss": 0.0128, "step": 248400 }, { "epoch": 1.25, "learning_rate": 0.00011201093783896958, "loss": 0.0089, "step": 248410 }, { "epoch": 1.25, "learning_rate": 0.00011200337014595557, "loss": 0.0084, "step": 248420 }, { "epoch": 1.25, "learning_rate": 0.00011199580245294155, "loss": 0.0087, "step": 248430 }, { "epoch": 1.25, "learning_rate": 0.00011198823475992755, "loss": 0.0077, "step": 248440 }, { "epoch": 1.25, "learning_rate": 0.00011198066706691354, "loss": 0.0079, "step": 248450 }, { "epoch": 1.25, "learning_rate": 0.00011197309937389952, "loss": 0.0082, "step": 248460 }, { "epoch": 1.25, "learning_rate": 0.00011196553168088552, "loss": 0.01, "step": 248470 }, { "epoch": 1.25, "learning_rate": 0.00011195796398787151, "loss": 0.007, "step": 248480 }, { "epoch": 1.25, "learning_rate": 0.0001119503962948575, "loss": 0.009, "step": 248490 }, { "epoch": 1.25, "learning_rate": 0.00011194282860184349, "loss": 0.0088, "step": 248500 }, { "epoch": 1.25, "learning_rate": 0.00011193526090882947, "loss": 0.0075, "step": 248510 }, { "epoch": 1.25, "learning_rate": 0.00011192769321581547, "loss": 0.0085, "step": 248520 }, { "epoch": 1.25, "learning_rate": 0.00011192012552280146, "loss": 0.0073, "step": 248530 }, { "epoch": 1.25, "learning_rate": 0.00011191255782978744, "loss": 0.0085, "step": 248540 }, { "epoch": 1.25, "learning_rate": 0.00011190499013677342, "loss": 0.0078, "step": 248550 }, { "epoch": 1.25, "learning_rate": 0.0001118974224437594, "loss": 0.0087, "step": 248560 }, { "epoch": 1.25, "learning_rate": 0.0001118898547507454, "loss": 0.0085, "step": 248570 }, { "epoch": 1.25, "learning_rate": 0.0001118822870577314, "loss": 0.0071, "step": 248580 }, { "epoch": 1.25, "learning_rate": 0.00011187471936471738, "loss": 0.0055, "step": 248590 }, { "epoch": 1.25, "learning_rate": 0.00011186715167170337, "loss": 0.0078, "step": 248600 }, { "epoch": 1.25, "learning_rate": 0.00011185958397868935, "loss": 0.0079, "step": 248610 }, { "epoch": 1.25, "learning_rate": 0.00011185201628567535, "loss": 0.0065, "step": 248620 }, { "epoch": 1.25, "learning_rate": 0.00011184444859266134, "loss": 0.0103, "step": 248630 }, { "epoch": 1.25, "learning_rate": 0.00011183688089964733, "loss": 0.0068, "step": 248640 }, { "epoch": 1.25, "learning_rate": 0.00011182931320663332, "loss": 0.0089, "step": 248650 }, { "epoch": 1.25, "learning_rate": 0.00011182174551361932, "loss": 0.0082, "step": 248660 }, { "epoch": 1.25, "learning_rate": 0.0001118141778206053, "loss": 0.0066, "step": 248670 }, { "epoch": 1.25, "learning_rate": 0.00011180661012759129, "loss": 0.0079, "step": 248680 }, { "epoch": 1.25, "learning_rate": 0.00011179904243457727, "loss": 0.0108, "step": 248690 }, { "epoch": 1.25, "learning_rate": 0.00011179147474156327, "loss": 0.0074, "step": 248700 }, { "epoch": 1.25, "learning_rate": 0.00011178390704854926, "loss": 0.0099, "step": 248710 }, { "epoch": 1.25, "learning_rate": 0.00011177633935553524, "loss": 0.0077, "step": 248720 }, { "epoch": 1.25, "learning_rate": 0.00011176877166252124, "loss": 0.0081, "step": 248730 }, { "epoch": 1.25, "learning_rate": 0.00011176120396950723, "loss": 0.0074, "step": 248740 }, { "epoch": 1.25, "learning_rate": 0.00011175363627649322, "loss": 0.0082, "step": 248750 }, { "epoch": 1.26, "learning_rate": 0.00011174606858347921, "loss": 0.0082, "step": 248760 }, { "epoch": 1.26, "learning_rate": 0.00011173850089046519, "loss": 0.0071, "step": 248770 }, { "epoch": 1.26, "learning_rate": 0.00011173093319745119, "loss": 0.0117, "step": 248780 }, { "epoch": 1.26, "learning_rate": 0.00011172336550443718, "loss": 0.0085, "step": 248790 }, { "epoch": 1.26, "learning_rate": 0.00011171579781142316, "loss": 0.0081, "step": 248800 }, { "epoch": 1.26, "learning_rate": 0.00011170823011840916, "loss": 0.011, "step": 248810 }, { "epoch": 1.26, "learning_rate": 0.00011170066242539515, "loss": 0.0055, "step": 248820 }, { "epoch": 1.26, "learning_rate": 0.00011169309473238114, "loss": 0.014, "step": 248830 }, { "epoch": 1.26, "learning_rate": 0.00011168552703936713, "loss": 0.0116, "step": 248840 }, { "epoch": 1.26, "learning_rate": 0.00011167795934635311, "loss": 0.0121, "step": 248850 }, { "epoch": 1.26, "learning_rate": 0.00011167039165333911, "loss": 0.0106, "step": 248860 }, { "epoch": 1.26, "learning_rate": 0.0001116628239603251, "loss": 0.0061, "step": 248870 }, { "epoch": 1.26, "learning_rate": 0.00011165525626731108, "loss": 0.008, "step": 248880 }, { "epoch": 1.26, "learning_rate": 0.00011164768857429708, "loss": 0.009, "step": 248890 }, { "epoch": 1.26, "learning_rate": 0.00011164012088128307, "loss": 0.0073, "step": 248900 }, { "epoch": 1.26, "learning_rate": 0.00011163255318826905, "loss": 0.0091, "step": 248910 }, { "epoch": 1.26, "learning_rate": 0.00011162498549525505, "loss": 0.0079, "step": 248920 }, { "epoch": 1.26, "learning_rate": 0.00011161741780224104, "loss": 0.0079, "step": 248930 }, { "epoch": 1.26, "learning_rate": 0.00011160985010922703, "loss": 0.0073, "step": 248940 }, { "epoch": 1.26, "learning_rate": 0.00011160228241621302, "loss": 0.0081, "step": 248950 }, { "epoch": 1.26, "learning_rate": 0.000111594714723199, "loss": 0.0071, "step": 248960 }, { "epoch": 1.26, "learning_rate": 0.000111587147030185, "loss": 0.0081, "step": 248970 }, { "epoch": 1.26, "learning_rate": 0.00011157957933717099, "loss": 0.0072, "step": 248980 }, { "epoch": 1.26, "learning_rate": 0.00011157201164415697, "loss": 0.0082, "step": 248990 }, { "epoch": 1.26, "learning_rate": 0.00011156444395114297, "loss": 0.0098, "step": 249000 }, { "epoch": 1.26, "eval_cer": 0.9144459960000272, "eval_loss": 0.0065380726009607315, "eval_runtime": 116.0227, "eval_samples_per_second": 17.238, "eval_steps_per_second": 4.31, "step": 249000 }, { "epoch": 1.26, "learning_rate": 0.00011155687625812896, "loss": 0.0078, "step": 249010 }, { "epoch": 1.26, "learning_rate": 0.00011154930856511495, "loss": 0.0102, "step": 249020 }, { "epoch": 1.26, "learning_rate": 0.00011154174087210094, "loss": 0.0087, "step": 249030 }, { "epoch": 1.26, "learning_rate": 0.00011153417317908692, "loss": 0.0088, "step": 249040 }, { "epoch": 1.26, "learning_rate": 0.00011152660548607292, "loss": 0.0087, "step": 249050 }, { "epoch": 1.26, "learning_rate": 0.00011151903779305891, "loss": 0.0083, "step": 249060 }, { "epoch": 1.26, "learning_rate": 0.0001115114701000449, "loss": 0.0094, "step": 249070 }, { "epoch": 1.26, "learning_rate": 0.00011150390240703089, "loss": 0.0092, "step": 249080 }, { "epoch": 1.26, "learning_rate": 0.00011149633471401688, "loss": 0.0103, "step": 249090 }, { "epoch": 1.26, "learning_rate": 0.00011148876702100286, "loss": 0.0098, "step": 249100 }, { "epoch": 1.26, "learning_rate": 0.00011148119932798886, "loss": 0.0088, "step": 249110 }, { "epoch": 1.26, "learning_rate": 0.00011147363163497484, "loss": 0.0103, "step": 249120 }, { "epoch": 1.26, "learning_rate": 0.00011146606394196084, "loss": 0.0086, "step": 249130 }, { "epoch": 1.26, "learning_rate": 0.00011145849624894683, "loss": 0.0074, "step": 249140 }, { "epoch": 1.26, "learning_rate": 0.00011145092855593281, "loss": 0.0073, "step": 249150 }, { "epoch": 1.26, "learning_rate": 0.00011144336086291881, "loss": 0.0089, "step": 249160 }, { "epoch": 1.26, "learning_rate": 0.0001114357931699048, "loss": 0.0086, "step": 249170 }, { "epoch": 1.26, "learning_rate": 0.00011142822547689077, "loss": 0.0079, "step": 249180 }, { "epoch": 1.26, "learning_rate": 0.00011142065778387677, "loss": 0.0073, "step": 249190 }, { "epoch": 1.26, "learning_rate": 0.00011141309009086275, "loss": 0.01, "step": 249200 }, { "epoch": 1.26, "learning_rate": 0.00011140552239784874, "loss": 0.0088, "step": 249210 }, { "epoch": 1.26, "learning_rate": 0.00011139795470483472, "loss": 0.0086, "step": 249220 }, { "epoch": 1.26, "learning_rate": 0.00011139038701182072, "loss": 0.0081, "step": 249230 }, { "epoch": 1.26, "learning_rate": 0.00011138281931880671, "loss": 0.0085, "step": 249240 }, { "epoch": 1.26, "learning_rate": 0.0001113752516257927, "loss": 0.0093, "step": 249250 }, { "epoch": 1.26, "learning_rate": 0.00011136768393277869, "loss": 0.0072, "step": 249260 }, { "epoch": 1.26, "learning_rate": 0.00011136011623976468, "loss": 0.0131, "step": 249270 }, { "epoch": 1.26, "learning_rate": 0.00011135254854675067, "loss": 0.0073, "step": 249280 }, { "epoch": 1.26, "learning_rate": 0.00011134498085373666, "loss": 0.0081, "step": 249290 }, { "epoch": 1.26, "learning_rate": 0.00011133741316072264, "loss": 0.008, "step": 249300 }, { "epoch": 1.26, "learning_rate": 0.00011132984546770864, "loss": 0.0079, "step": 249310 }, { "epoch": 1.26, "learning_rate": 0.00011132227777469463, "loss": 0.0091, "step": 249320 }, { "epoch": 1.26, "learning_rate": 0.00011131471008168061, "loss": 0.0098, "step": 249330 }, { "epoch": 1.26, "learning_rate": 0.00011130714238866661, "loss": 0.0087, "step": 249340 }, { "epoch": 1.26, "learning_rate": 0.0001112995746956526, "loss": 0.0099, "step": 249350 }, { "epoch": 1.26, "learning_rate": 0.00011129200700263859, "loss": 0.0089, "step": 249360 }, { "epoch": 1.26, "learning_rate": 0.00011128443930962458, "loss": 0.009, "step": 249370 }, { "epoch": 1.26, "learning_rate": 0.00011127687161661056, "loss": 0.0063, "step": 249380 }, { "epoch": 1.26, "learning_rate": 0.00011126930392359656, "loss": 0.0089, "step": 249390 }, { "epoch": 1.26, "learning_rate": 0.00011126173623058255, "loss": 0.0098, "step": 249400 }, { "epoch": 1.26, "learning_rate": 0.00011125416853756853, "loss": 0.0076, "step": 249410 }, { "epoch": 1.26, "learning_rate": 0.00011124660084455453, "loss": 0.01, "step": 249420 }, { "epoch": 1.26, "learning_rate": 0.00011123903315154052, "loss": 0.0076, "step": 249430 }, { "epoch": 1.26, "learning_rate": 0.0001112314654585265, "loss": 0.0069, "step": 249440 }, { "epoch": 1.26, "learning_rate": 0.0001112238977655125, "loss": 0.0082, "step": 249450 }, { "epoch": 1.26, "learning_rate": 0.0001112163300724985, "loss": 0.0091, "step": 249460 }, { "epoch": 1.26, "learning_rate": 0.00011120876237948448, "loss": 0.0102, "step": 249470 }, { "epoch": 1.26, "learning_rate": 0.00011120119468647047, "loss": 0.0084, "step": 249480 }, { "epoch": 1.26, "learning_rate": 0.00011119362699345645, "loss": 0.0075, "step": 249490 }, { "epoch": 1.26, "learning_rate": 0.00011118605930044245, "loss": 0.0081, "step": 249500 }, { "epoch": 1.26, "learning_rate": 0.00011117849160742844, "loss": 0.0085, "step": 249510 }, { "epoch": 1.26, "learning_rate": 0.00011117092391441442, "loss": 0.0091, "step": 249520 }, { "epoch": 1.26, "learning_rate": 0.00011116335622140042, "loss": 0.0071, "step": 249530 }, { "epoch": 1.26, "learning_rate": 0.00011115578852838641, "loss": 0.0082, "step": 249540 }, { "epoch": 1.26, "learning_rate": 0.0001111482208353724, "loss": 0.0078, "step": 249550 }, { "epoch": 1.26, "learning_rate": 0.00011114065314235839, "loss": 0.011, "step": 249560 }, { "epoch": 1.26, "learning_rate": 0.00011113308544934437, "loss": 0.0076, "step": 249570 }, { "epoch": 1.26, "learning_rate": 0.00011112551775633037, "loss": 0.0072, "step": 249580 }, { "epoch": 1.26, "learning_rate": 0.00011111795006331636, "loss": 0.0099, "step": 249590 }, { "epoch": 1.26, "learning_rate": 0.00011111038237030234, "loss": 0.0096, "step": 249600 }, { "epoch": 1.26, "learning_rate": 0.00011110281467728834, "loss": 0.0088, "step": 249610 }, { "epoch": 1.26, "learning_rate": 0.00011109524698427433, "loss": 0.0079, "step": 249620 }, { "epoch": 1.26, "learning_rate": 0.00011108767929126032, "loss": 0.0093, "step": 249630 }, { "epoch": 1.26, "learning_rate": 0.00011108011159824631, "loss": 0.0095, "step": 249640 }, { "epoch": 1.26, "learning_rate": 0.00011107254390523229, "loss": 0.0076, "step": 249650 }, { "epoch": 1.26, "learning_rate": 0.00011106497621221829, "loss": 0.0132, "step": 249660 }, { "epoch": 1.26, "learning_rate": 0.00011105740851920428, "loss": 0.011, "step": 249670 }, { "epoch": 1.26, "learning_rate": 0.00011104984082619026, "loss": 0.0128, "step": 249680 }, { "epoch": 1.26, "learning_rate": 0.00011104227313317626, "loss": 0.0088, "step": 249690 }, { "epoch": 1.26, "learning_rate": 0.00011103470544016225, "loss": 0.0089, "step": 249700 }, { "epoch": 1.26, "learning_rate": 0.00011102713774714823, "loss": 0.0087, "step": 249710 }, { "epoch": 1.26, "learning_rate": 0.00011101957005413423, "loss": 0.0105, "step": 249720 }, { "epoch": 1.26, "learning_rate": 0.00011101200236112021, "loss": 0.0078, "step": 249730 }, { "epoch": 1.26, "learning_rate": 0.0001110044346681062, "loss": 0.01, "step": 249740 }, { "epoch": 1.26, "learning_rate": 0.0001109968669750922, "loss": 0.0086, "step": 249750 }, { "epoch": 1.26, "learning_rate": 0.00011098929928207818, "loss": 0.0102, "step": 249760 }, { "epoch": 1.26, "learning_rate": 0.00011098173158906418, "loss": 0.0095, "step": 249770 }, { "epoch": 1.26, "learning_rate": 0.00011097416389605017, "loss": 0.0066, "step": 249780 }, { "epoch": 1.26, "learning_rate": 0.00011096659620303615, "loss": 0.0099, "step": 249790 }, { "epoch": 1.26, "learning_rate": 0.00011095902851002215, "loss": 0.0086, "step": 249800 }, { "epoch": 1.26, "learning_rate": 0.00011095146081700812, "loss": 0.0089, "step": 249810 }, { "epoch": 1.26, "learning_rate": 0.00011094389312399411, "loss": 0.0072, "step": 249820 }, { "epoch": 1.26, "learning_rate": 0.00011093632543098009, "loss": 0.0065, "step": 249830 }, { "epoch": 1.26, "learning_rate": 0.00011092875773796609, "loss": 0.0085, "step": 249840 }, { "epoch": 1.26, "learning_rate": 0.00011092119004495208, "loss": 0.0074, "step": 249850 }, { "epoch": 1.26, "learning_rate": 0.00011091362235193806, "loss": 0.0085, "step": 249860 }, { "epoch": 1.26, "learning_rate": 0.00011090605465892406, "loss": 0.0113, "step": 249870 }, { "epoch": 1.26, "learning_rate": 0.00011089848696591005, "loss": 0.0093, "step": 249880 }, { "epoch": 1.26, "learning_rate": 0.00011089091927289604, "loss": 0.0078, "step": 249890 }, { "epoch": 1.26, "learning_rate": 0.00011088335157988203, "loss": 0.0072, "step": 249900 }, { "epoch": 1.26, "learning_rate": 0.00011087578388686803, "loss": 0.0131, "step": 249910 }, { "epoch": 1.26, "learning_rate": 0.00011086821619385401, "loss": 0.0095, "step": 249920 }, { "epoch": 1.26, "learning_rate": 0.00011086064850084, "loss": 0.009, "step": 249930 }, { "epoch": 1.26, "learning_rate": 0.00011085308080782598, "loss": 0.008, "step": 249940 }, { "epoch": 1.26, "learning_rate": 0.00011084551311481198, "loss": 0.0107, "step": 249950 }, { "epoch": 1.26, "learning_rate": 0.00011083794542179797, "loss": 0.0086, "step": 249960 }, { "epoch": 1.26, "learning_rate": 0.00011083037772878396, "loss": 0.0092, "step": 249970 }, { "epoch": 1.26, "learning_rate": 0.00011082281003576995, "loss": 0.0072, "step": 249980 }, { "epoch": 1.26, "learning_rate": 0.00011081524234275595, "loss": 0.0098, "step": 249990 }, { "epoch": 1.26, "learning_rate": 0.00011080767464974193, "loss": 0.0082, "step": 250000 }, { "epoch": 1.26, "eval_cer": 0.9144537591690304, "eval_loss": 0.0067350054159760475, "eval_runtime": 115.9925, "eval_samples_per_second": 17.243, "eval_steps_per_second": 4.311, "step": 250000 }, { "epoch": 1.26, "learning_rate": 0.00011080010695672792, "loss": 0.0085, "step": 250010 }, { "epoch": 1.26, "learning_rate": 0.0001107925392637139, "loss": 0.0154, "step": 250020 }, { "epoch": 1.26, "learning_rate": 0.0001107849715706999, "loss": 0.0071, "step": 250030 }, { "epoch": 1.26, "learning_rate": 0.00011077740387768589, "loss": 0.0072, "step": 250040 }, { "epoch": 1.26, "learning_rate": 0.00011076983618467187, "loss": 0.0067, "step": 250050 }, { "epoch": 1.26, "learning_rate": 0.00011076226849165787, "loss": 0.0066, "step": 250060 }, { "epoch": 1.26, "learning_rate": 0.00011075470079864386, "loss": 0.0121, "step": 250070 }, { "epoch": 1.26, "learning_rate": 0.00011074713310562985, "loss": 0.0063, "step": 250080 }, { "epoch": 1.26, "learning_rate": 0.00011073956541261584, "loss": 0.0088, "step": 250090 }, { "epoch": 1.26, "learning_rate": 0.00011073199771960182, "loss": 0.0071, "step": 250100 }, { "epoch": 1.26, "learning_rate": 0.00011072443002658782, "loss": 0.0084, "step": 250110 }, { "epoch": 1.26, "learning_rate": 0.00011071686233357381, "loss": 0.0107, "step": 250120 }, { "epoch": 1.26, "learning_rate": 0.0001107092946405598, "loss": 0.0104, "step": 250130 }, { "epoch": 1.26, "learning_rate": 0.00011070172694754579, "loss": 0.008, "step": 250140 }, { "epoch": 1.26, "learning_rate": 0.00011069415925453178, "loss": 0.0079, "step": 250150 }, { "epoch": 1.26, "learning_rate": 0.00011068659156151777, "loss": 0.0079, "step": 250160 }, { "epoch": 1.26, "learning_rate": 0.00011067902386850376, "loss": 0.007, "step": 250170 }, { "epoch": 1.26, "learning_rate": 0.00011067145617548974, "loss": 0.0088, "step": 250180 }, { "epoch": 1.26, "learning_rate": 0.00011066388848247574, "loss": 0.0085, "step": 250190 }, { "epoch": 1.26, "learning_rate": 0.00011065632078946173, "loss": 0.0106, "step": 250200 }, { "epoch": 1.26, "learning_rate": 0.00011064875309644771, "loss": 0.0085, "step": 250210 }, { "epoch": 1.26, "learning_rate": 0.00011064118540343371, "loss": 0.0104, "step": 250220 }, { "epoch": 1.26, "learning_rate": 0.0001106336177104197, "loss": 0.007, "step": 250230 }, { "epoch": 1.26, "learning_rate": 0.00011062605001740568, "loss": 0.0087, "step": 250240 }, { "epoch": 1.26, "learning_rate": 0.00011061848232439168, "loss": 0.0104, "step": 250250 }, { "epoch": 1.26, "learning_rate": 0.00011061091463137766, "loss": 0.0107, "step": 250260 }, { "epoch": 1.26, "learning_rate": 0.00011060334693836366, "loss": 0.0108, "step": 250270 }, { "epoch": 1.26, "learning_rate": 0.00011059577924534965, "loss": 0.0069, "step": 250280 }, { "epoch": 1.26, "learning_rate": 0.00011058821155233563, "loss": 0.0086, "step": 250290 }, { "epoch": 1.26, "learning_rate": 0.00011058064385932163, "loss": 0.0125, "step": 250300 }, { "epoch": 1.26, "learning_rate": 0.00011057307616630762, "loss": 0.006, "step": 250310 }, { "epoch": 1.26, "learning_rate": 0.0001105655084732936, "loss": 0.0094, "step": 250320 }, { "epoch": 1.26, "learning_rate": 0.0001105579407802796, "loss": 0.0072, "step": 250330 }, { "epoch": 1.26, "learning_rate": 0.00011055037308726558, "loss": 0.0094, "step": 250340 }, { "epoch": 1.26, "learning_rate": 0.00011054280539425158, "loss": 0.0074, "step": 250350 }, { "epoch": 1.26, "learning_rate": 0.00011053523770123757, "loss": 0.0099, "step": 250360 }, { "epoch": 1.26, "learning_rate": 0.00011052767000822355, "loss": 0.0101, "step": 250370 }, { "epoch": 1.26, "learning_rate": 0.00011052010231520955, "loss": 0.0101, "step": 250380 }, { "epoch": 1.26, "learning_rate": 0.00011051253462219554, "loss": 0.0078, "step": 250390 }, { "epoch": 1.26, "learning_rate": 0.00011050496692918152, "loss": 0.013, "step": 250400 }, { "epoch": 1.26, "learning_rate": 0.00011049739923616752, "loss": 0.0104, "step": 250410 }, { "epoch": 1.26, "learning_rate": 0.00011048983154315351, "loss": 0.0068, "step": 250420 }, { "epoch": 1.26, "learning_rate": 0.0001104822638501395, "loss": 0.0083, "step": 250430 }, { "epoch": 1.26, "learning_rate": 0.00011047469615712548, "loss": 0.009, "step": 250440 }, { "epoch": 1.26, "learning_rate": 0.00011046712846411146, "loss": 0.0075, "step": 250450 }, { "epoch": 1.26, "learning_rate": 0.00011045956077109745, "loss": 0.0087, "step": 250460 }, { "epoch": 1.26, "learning_rate": 0.00011045199307808343, "loss": 0.0065, "step": 250470 }, { "epoch": 1.26, "learning_rate": 0.00011044442538506943, "loss": 0.0091, "step": 250480 }, { "epoch": 1.26, "learning_rate": 0.00011043685769205542, "loss": 0.0077, "step": 250490 }, { "epoch": 1.26, "learning_rate": 0.0001104292899990414, "loss": 0.0068, "step": 250500 }, { "epoch": 1.26, "learning_rate": 0.0001104217223060274, "loss": 0.0067, "step": 250510 }, { "epoch": 1.26, "learning_rate": 0.0001104141546130134, "loss": 0.0116, "step": 250520 }, { "epoch": 1.26, "learning_rate": 0.00011040658691999938, "loss": 0.0096, "step": 250530 }, { "epoch": 1.26, "learning_rate": 0.00011039901922698537, "loss": 0.0068, "step": 250540 }, { "epoch": 1.26, "learning_rate": 0.00011039145153397135, "loss": 0.0066, "step": 250550 }, { "epoch": 1.26, "learning_rate": 0.00011038388384095735, "loss": 0.0085, "step": 250560 }, { "epoch": 1.26, "learning_rate": 0.00011037631614794334, "loss": 0.0078, "step": 250570 }, { "epoch": 1.26, "learning_rate": 0.00011036874845492932, "loss": 0.0086, "step": 250580 }, { "epoch": 1.26, "learning_rate": 0.00011036118076191532, "loss": 0.0092, "step": 250590 }, { "epoch": 1.26, "learning_rate": 0.00011035361306890131, "loss": 0.0072, "step": 250600 }, { "epoch": 1.26, "learning_rate": 0.0001103460453758873, "loss": 0.0147, "step": 250610 }, { "epoch": 1.26, "learning_rate": 0.00011033847768287329, "loss": 0.0101, "step": 250620 }, { "epoch": 1.26, "learning_rate": 0.00011033090998985927, "loss": 0.0103, "step": 250630 }, { "epoch": 1.26, "learning_rate": 0.00011032334229684527, "loss": 0.0112, "step": 250640 }, { "epoch": 1.26, "learning_rate": 0.00011031577460383126, "loss": 0.007, "step": 250650 }, { "epoch": 1.26, "learning_rate": 0.00011030820691081724, "loss": 0.009, "step": 250660 }, { "epoch": 1.26, "learning_rate": 0.00011030063921780324, "loss": 0.0072, "step": 250670 }, { "epoch": 1.26, "learning_rate": 0.00011029307152478923, "loss": 0.0099, "step": 250680 }, { "epoch": 1.26, "learning_rate": 0.00011028550383177522, "loss": 0.0082, "step": 250690 }, { "epoch": 1.26, "learning_rate": 0.00011027793613876121, "loss": 0.0091, "step": 250700 }, { "epoch": 1.26, "learning_rate": 0.00011027036844574719, "loss": 0.0071, "step": 250710 }, { "epoch": 1.26, "learning_rate": 0.00011026280075273319, "loss": 0.0089, "step": 250720 }, { "epoch": 1.26, "learning_rate": 0.00011025523305971918, "loss": 0.0071, "step": 250730 }, { "epoch": 1.27, "learning_rate": 0.00011024766536670516, "loss": 0.0068, "step": 250740 }, { "epoch": 1.27, "learning_rate": 0.00011024009767369116, "loss": 0.0087, "step": 250750 }, { "epoch": 1.27, "learning_rate": 0.00011023252998067715, "loss": 0.0115, "step": 250760 }, { "epoch": 1.27, "learning_rate": 0.00011022496228766313, "loss": 0.0079, "step": 250770 }, { "epoch": 1.27, "learning_rate": 0.00011021739459464913, "loss": 0.013, "step": 250780 }, { "epoch": 1.27, "learning_rate": 0.00011020982690163511, "loss": 0.0095, "step": 250790 }, { "epoch": 1.27, "learning_rate": 0.0001102022592086211, "loss": 0.0059, "step": 250800 }, { "epoch": 1.27, "learning_rate": 0.0001101946915156071, "loss": 0.0074, "step": 250810 }, { "epoch": 1.27, "learning_rate": 0.00011018712382259308, "loss": 0.0091, "step": 250820 }, { "epoch": 1.27, "learning_rate": 0.00011017955612957908, "loss": 0.0113, "step": 250830 }, { "epoch": 1.27, "learning_rate": 0.00011017198843656507, "loss": 0.0089, "step": 250840 }, { "epoch": 1.27, "learning_rate": 0.00011016442074355105, "loss": 0.0103, "step": 250850 }, { "epoch": 1.27, "learning_rate": 0.00011015685305053705, "loss": 0.0079, "step": 250860 }, { "epoch": 1.27, "learning_rate": 0.00011014928535752304, "loss": 0.0082, "step": 250870 }, { "epoch": 1.27, "learning_rate": 0.00011014171766450903, "loss": 0.0073, "step": 250880 }, { "epoch": 1.27, "learning_rate": 0.00011013414997149502, "loss": 0.0103, "step": 250890 }, { "epoch": 1.27, "learning_rate": 0.000110126582278481, "loss": 0.0083, "step": 250900 }, { "epoch": 1.27, "learning_rate": 0.000110119014585467, "loss": 0.009, "step": 250910 }, { "epoch": 1.27, "learning_rate": 0.00011011144689245299, "loss": 0.0092, "step": 250920 }, { "epoch": 1.27, "learning_rate": 0.00011010387919943897, "loss": 0.0134, "step": 250930 }, { "epoch": 1.27, "learning_rate": 0.00011009631150642497, "loss": 0.008, "step": 250940 }, { "epoch": 1.27, "learning_rate": 0.00011008874381341096, "loss": 0.0071, "step": 250950 }, { "epoch": 1.27, "learning_rate": 0.00011008117612039694, "loss": 0.0106, "step": 250960 }, { "epoch": 1.27, "learning_rate": 0.00011007360842738294, "loss": 0.0072, "step": 250970 }, { "epoch": 1.27, "learning_rate": 0.00011006604073436892, "loss": 0.0057, "step": 250980 }, { "epoch": 1.27, "learning_rate": 0.00011005847304135492, "loss": 0.0099, "step": 250990 }, { "epoch": 1.27, "learning_rate": 0.00011005090534834091, "loss": 0.01, "step": 251000 }, { "epoch": 1.27, "eval_cer": 0.9144605519419082, "eval_loss": 0.0065511371940374374, "eval_runtime": 116.1225, "eval_samples_per_second": 17.223, "eval_steps_per_second": 4.306, "step": 251000 }, { "epoch": 1.27, "learning_rate": 0.00011004333765532689, "loss": 0.008, "step": 251010 }, { "epoch": 1.27, "learning_rate": 0.00011003576996231289, "loss": 0.0103, "step": 251020 }, { "epoch": 1.27, "learning_rate": 0.00011002820226929888, "loss": 0.0099, "step": 251030 }, { "epoch": 1.27, "learning_rate": 0.00011002063457628486, "loss": 0.0089, "step": 251040 }, { "epoch": 1.27, "learning_rate": 0.00011001306688327086, "loss": 0.0064, "step": 251050 }, { "epoch": 1.27, "learning_rate": 0.00011000549919025684, "loss": 0.0073, "step": 251060 }, { "epoch": 1.27, "learning_rate": 0.00010999793149724282, "loss": 0.0122, "step": 251070 }, { "epoch": 1.27, "learning_rate": 0.0001099903638042288, "loss": 0.0112, "step": 251080 }, { "epoch": 1.27, "learning_rate": 0.0001099827961112148, "loss": 0.0081, "step": 251090 }, { "epoch": 1.27, "learning_rate": 0.0001099752284182008, "loss": 0.0078, "step": 251100 }, { "epoch": 1.27, "learning_rate": 0.00010996766072518677, "loss": 0.0107, "step": 251110 }, { "epoch": 1.27, "learning_rate": 0.00010996009303217277, "loss": 0.0084, "step": 251120 }, { "epoch": 1.27, "learning_rate": 0.00010995252533915876, "loss": 0.0076, "step": 251130 }, { "epoch": 1.27, "learning_rate": 0.00010994495764614475, "loss": 0.009, "step": 251140 }, { "epoch": 1.27, "learning_rate": 0.00010993738995313074, "loss": 0.0084, "step": 251150 }, { "epoch": 1.27, "learning_rate": 0.00010992982226011672, "loss": 0.0088, "step": 251160 }, { "epoch": 1.27, "learning_rate": 0.00010992225456710272, "loss": 0.0078, "step": 251170 }, { "epoch": 1.27, "learning_rate": 0.00010991468687408871, "loss": 0.0075, "step": 251180 }, { "epoch": 1.27, "learning_rate": 0.0001099071191810747, "loss": 0.0084, "step": 251190 }, { "epoch": 1.27, "learning_rate": 0.00010989955148806069, "loss": 0.007, "step": 251200 }, { "epoch": 1.27, "learning_rate": 0.00010989198379504668, "loss": 0.0082, "step": 251210 }, { "epoch": 1.27, "learning_rate": 0.00010988441610203267, "loss": 0.0088, "step": 251220 }, { "epoch": 1.27, "learning_rate": 0.00010987684840901866, "loss": 0.008, "step": 251230 }, { "epoch": 1.27, "learning_rate": 0.00010986928071600464, "loss": 0.0102, "step": 251240 }, { "epoch": 1.27, "learning_rate": 0.00010986171302299064, "loss": 0.0115, "step": 251250 }, { "epoch": 1.27, "learning_rate": 0.00010985414532997663, "loss": 0.009, "step": 251260 }, { "epoch": 1.27, "learning_rate": 0.00010984657763696261, "loss": 0.0064, "step": 251270 }, { "epoch": 1.27, "learning_rate": 0.00010983900994394861, "loss": 0.0101, "step": 251280 }, { "epoch": 1.27, "learning_rate": 0.0001098314422509346, "loss": 0.0092, "step": 251290 }, { "epoch": 1.27, "learning_rate": 0.00010982387455792058, "loss": 0.008, "step": 251300 }, { "epoch": 1.27, "learning_rate": 0.00010981630686490658, "loss": 0.0094, "step": 251310 }, { "epoch": 1.27, "learning_rate": 0.00010980873917189256, "loss": 0.0088, "step": 251320 }, { "epoch": 1.27, "learning_rate": 0.00010980117147887856, "loss": 0.0083, "step": 251330 }, { "epoch": 1.27, "learning_rate": 0.00010979360378586455, "loss": 0.0069, "step": 251340 }, { "epoch": 1.27, "learning_rate": 0.00010978603609285053, "loss": 0.0097, "step": 251350 }, { "epoch": 1.27, "learning_rate": 0.00010977846839983653, "loss": 0.0093, "step": 251360 }, { "epoch": 1.27, "learning_rate": 0.00010977090070682252, "loss": 0.0067, "step": 251370 }, { "epoch": 1.27, "learning_rate": 0.0001097633330138085, "loss": 0.0083, "step": 251380 }, { "epoch": 1.27, "learning_rate": 0.0001097557653207945, "loss": 0.0096, "step": 251390 }, { "epoch": 1.27, "learning_rate": 0.0001097481976277805, "loss": 0.0085, "step": 251400 }, { "epoch": 1.27, "learning_rate": 0.00010974062993476648, "loss": 0.0088, "step": 251410 }, { "epoch": 1.27, "learning_rate": 0.00010973306224175247, "loss": 0.0075, "step": 251420 }, { "epoch": 1.27, "learning_rate": 0.00010972549454873845, "loss": 0.0082, "step": 251430 }, { "epoch": 1.27, "learning_rate": 0.00010971792685572445, "loss": 0.01, "step": 251440 }, { "epoch": 1.27, "learning_rate": 0.00010971035916271044, "loss": 0.0093, "step": 251450 }, { "epoch": 1.27, "learning_rate": 0.00010970279146969642, "loss": 0.0108, "step": 251460 }, { "epoch": 1.27, "learning_rate": 0.00010969522377668242, "loss": 0.0089, "step": 251470 }, { "epoch": 1.27, "learning_rate": 0.00010968765608366841, "loss": 0.0074, "step": 251480 }, { "epoch": 1.27, "learning_rate": 0.0001096800883906544, "loss": 0.0113, "step": 251490 }, { "epoch": 1.27, "learning_rate": 0.00010967252069764039, "loss": 0.0082, "step": 251500 }, { "epoch": 1.27, "learning_rate": 0.00010966495300462637, "loss": 0.0085, "step": 251510 }, { "epoch": 1.27, "learning_rate": 0.00010965738531161237, "loss": 0.0115, "step": 251520 }, { "epoch": 1.27, "learning_rate": 0.00010964981761859836, "loss": 0.0091, "step": 251530 }, { "epoch": 1.27, "learning_rate": 0.00010964224992558434, "loss": 0.0076, "step": 251540 }, { "epoch": 1.27, "learning_rate": 0.00010963468223257034, "loss": 0.0101, "step": 251550 }, { "epoch": 1.27, "learning_rate": 0.00010962711453955633, "loss": 0.0086, "step": 251560 }, { "epoch": 1.27, "learning_rate": 0.00010961954684654231, "loss": 0.0072, "step": 251570 }, { "epoch": 1.27, "learning_rate": 0.00010961197915352831, "loss": 0.0104, "step": 251580 }, { "epoch": 1.27, "learning_rate": 0.00010960441146051429, "loss": 0.0085, "step": 251590 }, { "epoch": 1.27, "learning_rate": 0.00010959684376750029, "loss": 0.0097, "step": 251600 }, { "epoch": 1.27, "learning_rate": 0.00010958927607448628, "loss": 0.0101, "step": 251610 }, { "epoch": 1.27, "learning_rate": 0.00010958170838147226, "loss": 0.0098, "step": 251620 }, { "epoch": 1.27, "learning_rate": 0.00010957414068845826, "loss": 0.0068, "step": 251630 }, { "epoch": 1.27, "learning_rate": 0.00010956657299544425, "loss": 0.0095, "step": 251640 }, { "epoch": 1.27, "learning_rate": 0.00010955900530243023, "loss": 0.009, "step": 251650 }, { "epoch": 1.27, "learning_rate": 0.00010955143760941623, "loss": 0.0099, "step": 251660 }, { "epoch": 1.27, "learning_rate": 0.00010954386991640221, "loss": 0.0068, "step": 251670 }, { "epoch": 1.27, "learning_rate": 0.0001095363022233882, "loss": 0.008, "step": 251680 }, { "epoch": 1.27, "learning_rate": 0.0001095287345303742, "loss": 0.0092, "step": 251690 }, { "epoch": 1.27, "learning_rate": 0.00010952116683736017, "loss": 0.0072, "step": 251700 }, { "epoch": 1.27, "learning_rate": 0.00010951359914434616, "loss": 0.0091, "step": 251710 }, { "epoch": 1.27, "learning_rate": 0.00010950603145133214, "loss": 0.0075, "step": 251720 }, { "epoch": 1.27, "learning_rate": 0.00010949846375831814, "loss": 0.0081, "step": 251730 }, { "epoch": 1.27, "learning_rate": 0.00010949089606530413, "loss": 0.009, "step": 251740 }, { "epoch": 1.27, "learning_rate": 0.00010948332837229012, "loss": 0.0122, "step": 251750 }, { "epoch": 1.27, "learning_rate": 0.00010947576067927611, "loss": 0.0083, "step": 251760 }, { "epoch": 1.27, "learning_rate": 0.00010946819298626209, "loss": 0.0077, "step": 251770 }, { "epoch": 1.27, "learning_rate": 0.00010946062529324809, "loss": 0.0097, "step": 251780 }, { "epoch": 1.27, "learning_rate": 0.00010945305760023408, "loss": 0.0082, "step": 251790 }, { "epoch": 1.27, "learning_rate": 0.00010944548990722006, "loss": 0.0094, "step": 251800 }, { "epoch": 1.27, "learning_rate": 0.00010943792221420606, "loss": 0.0111, "step": 251810 }, { "epoch": 1.27, "learning_rate": 0.00010943035452119205, "loss": 0.0094, "step": 251820 }, { "epoch": 1.27, "learning_rate": 0.00010942278682817803, "loss": 0.0086, "step": 251830 }, { "epoch": 1.27, "learning_rate": 0.00010941521913516403, "loss": 0.0095, "step": 251840 }, { "epoch": 1.27, "learning_rate": 0.00010940765144215002, "loss": 0.0117, "step": 251850 }, { "epoch": 1.27, "learning_rate": 0.000109400083749136, "loss": 0.011, "step": 251860 }, { "epoch": 1.27, "learning_rate": 0.000109392516056122, "loss": 0.0084, "step": 251870 }, { "epoch": 1.27, "learning_rate": 0.00010938494836310798, "loss": 0.0079, "step": 251880 }, { "epoch": 1.27, "learning_rate": 0.00010937738067009398, "loss": 0.0087, "step": 251890 }, { "epoch": 1.27, "learning_rate": 0.00010936981297707997, "loss": 0.0064, "step": 251900 }, { "epoch": 1.27, "learning_rate": 0.00010936224528406595, "loss": 0.0084, "step": 251910 }, { "epoch": 1.27, "learning_rate": 0.00010935467759105195, "loss": 0.0076, "step": 251920 }, { "epoch": 1.27, "learning_rate": 0.00010934710989803794, "loss": 0.0084, "step": 251930 }, { "epoch": 1.27, "learning_rate": 0.00010933954220502393, "loss": 0.0093, "step": 251940 }, { "epoch": 1.27, "learning_rate": 0.00010933197451200992, "loss": 0.0097, "step": 251950 }, { "epoch": 1.27, "learning_rate": 0.0001093244068189959, "loss": 0.0075, "step": 251960 }, { "epoch": 1.27, "learning_rate": 0.0001093168391259819, "loss": 0.0095, "step": 251970 }, { "epoch": 1.27, "learning_rate": 0.00010930927143296789, "loss": 0.0093, "step": 251980 }, { "epoch": 1.27, "learning_rate": 0.00010930170373995387, "loss": 0.0078, "step": 251990 }, { "epoch": 1.27, "learning_rate": 0.00010929413604693987, "loss": 0.0073, "step": 252000 }, { "epoch": 1.27, "eval_cer": 0.9144789894682909, "eval_loss": 0.006821473129093647, "eval_runtime": 116.1992, "eval_samples_per_second": 17.212, "eval_steps_per_second": 4.303, "step": 252000 }, { "epoch": 1.27, "learning_rate": 0.00010928656835392586, "loss": 0.0073, "step": 252010 }, { "epoch": 1.27, "learning_rate": 0.00010927900066091184, "loss": 0.008, "step": 252020 }, { "epoch": 1.27, "learning_rate": 0.00010927143296789784, "loss": 0.008, "step": 252030 }, { "epoch": 1.27, "learning_rate": 0.00010926386527488382, "loss": 0.0102, "step": 252040 }, { "epoch": 1.27, "learning_rate": 0.00010925629758186982, "loss": 0.0111, "step": 252050 }, { "epoch": 1.27, "learning_rate": 0.00010924872988885581, "loss": 0.0092, "step": 252060 }, { "epoch": 1.27, "learning_rate": 0.00010924116219584179, "loss": 0.0105, "step": 252070 }, { "epoch": 1.27, "learning_rate": 0.00010923359450282779, "loss": 0.0085, "step": 252080 }, { "epoch": 1.27, "learning_rate": 0.00010922602680981378, "loss": 0.0093, "step": 252090 }, { "epoch": 1.27, "learning_rate": 0.00010921845911679976, "loss": 0.0074, "step": 252100 }, { "epoch": 1.27, "learning_rate": 0.00010921089142378576, "loss": 0.008, "step": 252110 }, { "epoch": 1.27, "learning_rate": 0.00010920332373077174, "loss": 0.0098, "step": 252120 }, { "epoch": 1.27, "learning_rate": 0.00010919575603775774, "loss": 0.0109, "step": 252130 }, { "epoch": 1.27, "learning_rate": 0.00010918818834474373, "loss": 0.0083, "step": 252140 }, { "epoch": 1.27, "learning_rate": 0.00010918062065172971, "loss": 0.0078, "step": 252150 }, { "epoch": 1.27, "learning_rate": 0.00010917305295871571, "loss": 0.0095, "step": 252160 }, { "epoch": 1.27, "learning_rate": 0.0001091654852657017, "loss": 0.0081, "step": 252170 }, { "epoch": 1.27, "learning_rate": 0.00010915791757268768, "loss": 0.0083, "step": 252180 }, { "epoch": 1.27, "learning_rate": 0.00010915034987967368, "loss": 0.0097, "step": 252190 }, { "epoch": 1.27, "learning_rate": 0.00010914278218665966, "loss": 0.0115, "step": 252200 }, { "epoch": 1.27, "learning_rate": 0.00010913521449364565, "loss": 0.0086, "step": 252210 }, { "epoch": 1.27, "learning_rate": 0.00010912764680063165, "loss": 0.0091, "step": 252220 }, { "epoch": 1.27, "learning_rate": 0.00010912007910761763, "loss": 0.0093, "step": 252230 }, { "epoch": 1.27, "learning_rate": 0.00010911251141460363, "loss": 0.0101, "step": 252240 }, { "epoch": 1.27, "learning_rate": 0.00010910494372158962, "loss": 0.0114, "step": 252250 }, { "epoch": 1.27, "learning_rate": 0.0001090973760285756, "loss": 0.0113, "step": 252260 }, { "epoch": 1.27, "learning_rate": 0.0001090898083355616, "loss": 0.0083, "step": 252270 }, { "epoch": 1.27, "learning_rate": 0.00010908224064254758, "loss": 0.0098, "step": 252280 }, { "epoch": 1.27, "learning_rate": 0.00010907467294953357, "loss": 0.0095, "step": 252290 }, { "epoch": 1.27, "learning_rate": 0.00010906710525651957, "loss": 0.0058, "step": 252300 }, { "epoch": 1.27, "learning_rate": 0.00010905953756350555, "loss": 0.0095, "step": 252310 }, { "epoch": 1.27, "learning_rate": 0.00010905196987049153, "loss": 0.0078, "step": 252320 }, { "epoch": 1.27, "learning_rate": 0.00010904440217747751, "loss": 0.0087, "step": 252330 }, { "epoch": 1.27, "learning_rate": 0.00010903683448446351, "loss": 0.0099, "step": 252340 }, { "epoch": 1.27, "learning_rate": 0.0001090292667914495, "loss": 0.013, "step": 252350 }, { "epoch": 1.27, "learning_rate": 0.00010902169909843549, "loss": 0.0082, "step": 252360 }, { "epoch": 1.27, "learning_rate": 0.00010901413140542148, "loss": 0.0077, "step": 252370 }, { "epoch": 1.27, "learning_rate": 0.00010900656371240748, "loss": 0.0088, "step": 252380 }, { "epoch": 1.27, "learning_rate": 0.00010899899601939346, "loss": 0.0075, "step": 252390 }, { "epoch": 1.27, "learning_rate": 0.00010899142832637945, "loss": 0.0079, "step": 252400 }, { "epoch": 1.27, "learning_rate": 0.00010898386063336543, "loss": 0.0111, "step": 252410 }, { "epoch": 1.27, "learning_rate": 0.00010897629294035143, "loss": 0.009, "step": 252420 }, { "epoch": 1.27, "learning_rate": 0.00010896872524733742, "loss": 0.0089, "step": 252430 }, { "epoch": 1.27, "learning_rate": 0.0001089611575543234, "loss": 0.0071, "step": 252440 }, { "epoch": 1.27, "learning_rate": 0.0001089535898613094, "loss": 0.01, "step": 252450 }, { "epoch": 1.27, "learning_rate": 0.0001089460221682954, "loss": 0.007, "step": 252460 }, { "epoch": 1.27, "learning_rate": 0.00010893845447528138, "loss": 0.0075, "step": 252470 }, { "epoch": 1.27, "learning_rate": 0.00010893088678226737, "loss": 0.0082, "step": 252480 }, { "epoch": 1.27, "learning_rate": 0.00010892331908925335, "loss": 0.0066, "step": 252490 }, { "epoch": 1.27, "learning_rate": 0.00010891575139623935, "loss": 0.0091, "step": 252500 }, { "epoch": 1.27, "learning_rate": 0.00010890818370322534, "loss": 0.0088, "step": 252510 }, { "epoch": 1.27, "learning_rate": 0.00010890061601021132, "loss": 0.0069, "step": 252520 }, { "epoch": 1.27, "learning_rate": 0.00010889304831719732, "loss": 0.0084, "step": 252530 }, { "epoch": 1.27, "learning_rate": 0.00010888548062418331, "loss": 0.0076, "step": 252540 }, { "epoch": 1.27, "learning_rate": 0.0001088779129311693, "loss": 0.0093, "step": 252550 }, { "epoch": 1.27, "learning_rate": 0.00010887034523815529, "loss": 0.01, "step": 252560 }, { "epoch": 1.27, "learning_rate": 0.00010886277754514127, "loss": 0.0071, "step": 252570 }, { "epoch": 1.27, "learning_rate": 0.00010885520985212727, "loss": 0.0075, "step": 252580 }, { "epoch": 1.27, "learning_rate": 0.00010884764215911326, "loss": 0.0073, "step": 252590 }, { "epoch": 1.27, "learning_rate": 0.00010884007446609924, "loss": 0.0089, "step": 252600 }, { "epoch": 1.27, "learning_rate": 0.00010883250677308524, "loss": 0.0086, "step": 252610 }, { "epoch": 1.27, "learning_rate": 0.00010882493908007123, "loss": 0.0087, "step": 252620 }, { "epoch": 1.27, "learning_rate": 0.00010881737138705721, "loss": 0.0078, "step": 252630 }, { "epoch": 1.27, "learning_rate": 0.00010880980369404321, "loss": 0.0086, "step": 252640 }, { "epoch": 1.27, "learning_rate": 0.00010880223600102919, "loss": 0.0088, "step": 252650 }, { "epoch": 1.27, "learning_rate": 0.00010879466830801519, "loss": 0.01, "step": 252660 }, { "epoch": 1.27, "learning_rate": 0.00010878710061500118, "loss": 0.0066, "step": 252670 }, { "epoch": 1.27, "learning_rate": 0.00010877953292198716, "loss": 0.0095, "step": 252680 }, { "epoch": 1.27, "learning_rate": 0.00010877196522897316, "loss": 0.0091, "step": 252690 }, { "epoch": 1.27, "learning_rate": 0.00010876439753595915, "loss": 0.0073, "step": 252700 }, { "epoch": 1.27, "learning_rate": 0.00010875682984294513, "loss": 0.007, "step": 252710 }, { "epoch": 1.27, "learning_rate": 0.00010874926214993113, "loss": 0.0081, "step": 252720 }, { "epoch": 1.28, "learning_rate": 0.00010874169445691711, "loss": 0.0079, "step": 252730 }, { "epoch": 1.28, "learning_rate": 0.0001087341267639031, "loss": 0.0083, "step": 252740 }, { "epoch": 1.28, "learning_rate": 0.0001087265590708891, "loss": 0.0078, "step": 252750 }, { "epoch": 1.28, "learning_rate": 0.00010871899137787508, "loss": 0.008, "step": 252760 }, { "epoch": 1.28, "learning_rate": 0.00010871142368486108, "loss": 0.0079, "step": 252770 }, { "epoch": 1.28, "learning_rate": 0.00010870385599184707, "loss": 0.0082, "step": 252780 }, { "epoch": 1.28, "learning_rate": 0.00010869628829883305, "loss": 0.0076, "step": 252790 }, { "epoch": 1.28, "learning_rate": 0.00010868872060581905, "loss": 0.007, "step": 252800 }, { "epoch": 1.28, "learning_rate": 0.00010868115291280504, "loss": 0.0071, "step": 252810 }, { "epoch": 1.28, "learning_rate": 0.00010867358521979102, "loss": 0.0149, "step": 252820 }, { "epoch": 1.28, "learning_rate": 0.00010866601752677702, "loss": 0.0081, "step": 252830 }, { "epoch": 1.28, "learning_rate": 0.000108658449833763, "loss": 0.0081, "step": 252840 }, { "epoch": 1.28, "learning_rate": 0.000108650882140749, "loss": 0.0087, "step": 252850 }, { "epoch": 1.28, "learning_rate": 0.00010864331444773499, "loss": 0.0088, "step": 252860 }, { "epoch": 1.28, "learning_rate": 0.00010863574675472097, "loss": 0.0068, "step": 252870 }, { "epoch": 1.28, "learning_rate": 0.00010862817906170697, "loss": 0.0077, "step": 252880 }, { "epoch": 1.28, "learning_rate": 0.00010862061136869296, "loss": 0.0066, "step": 252890 }, { "epoch": 1.28, "learning_rate": 0.00010861304367567894, "loss": 0.0096, "step": 252900 }, { "epoch": 1.28, "learning_rate": 0.00010860547598266494, "loss": 0.006, "step": 252910 }, { "epoch": 1.28, "learning_rate": 0.00010859790828965092, "loss": 0.0083, "step": 252920 }, { "epoch": 1.28, "learning_rate": 0.00010859034059663692, "loss": 0.0099, "step": 252930 }, { "epoch": 1.28, "learning_rate": 0.00010858277290362291, "loss": 0.0076, "step": 252940 }, { "epoch": 1.28, "learning_rate": 0.00010857520521060888, "loss": 0.0091, "step": 252950 }, { "epoch": 1.28, "learning_rate": 0.00010856763751759487, "loss": 0.0137, "step": 252960 }, { "epoch": 1.28, "learning_rate": 0.00010856006982458085, "loss": 0.008, "step": 252970 }, { "epoch": 1.28, "learning_rate": 0.00010855250213156685, "loss": 0.0133, "step": 252980 }, { "epoch": 1.28, "learning_rate": 0.00010854493443855284, "loss": 0.009, "step": 252990 }, { "epoch": 1.28, "learning_rate": 0.00010853736674553883, "loss": 0.0104, "step": 253000 }, { "epoch": 1.28, "eval_cer": 0.914462492734159, "eval_loss": 0.006441994570195675, "eval_runtime": 116.0386, "eval_samples_per_second": 17.236, "eval_steps_per_second": 4.309, "step": 253000 }, { "epoch": 1.28, "learning_rate": 0.00010852979905252482, "loss": 0.0092, "step": 253010 }, { "epoch": 1.28, "learning_rate": 0.0001085222313595108, "loss": 0.0089, "step": 253020 }, { "epoch": 1.28, "learning_rate": 0.0001085146636664968, "loss": 0.0102, "step": 253030 }, { "epoch": 1.28, "learning_rate": 0.00010850709597348279, "loss": 0.0077, "step": 253040 }, { "epoch": 1.28, "learning_rate": 0.00010849952828046877, "loss": 0.0061, "step": 253050 }, { "epoch": 1.28, "learning_rate": 0.00010849196058745477, "loss": 0.0063, "step": 253060 }, { "epoch": 1.28, "learning_rate": 0.00010848439289444076, "loss": 0.0087, "step": 253070 }, { "epoch": 1.28, "learning_rate": 0.00010847682520142675, "loss": 0.0101, "step": 253080 }, { "epoch": 1.28, "learning_rate": 0.00010846925750841274, "loss": 0.0072, "step": 253090 }, { "epoch": 1.28, "learning_rate": 0.00010846168981539872, "loss": 0.0116, "step": 253100 }, { "epoch": 1.28, "learning_rate": 0.00010845412212238472, "loss": 0.0094, "step": 253110 }, { "epoch": 1.28, "learning_rate": 0.00010844655442937071, "loss": 0.0119, "step": 253120 }, { "epoch": 1.28, "learning_rate": 0.00010843898673635669, "loss": 0.0078, "step": 253130 }, { "epoch": 1.28, "learning_rate": 0.00010843141904334269, "loss": 0.0098, "step": 253140 }, { "epoch": 1.28, "learning_rate": 0.00010842385135032868, "loss": 0.0076, "step": 253150 }, { "epoch": 1.28, "learning_rate": 0.00010841628365731466, "loss": 0.0073, "step": 253160 }, { "epoch": 1.28, "learning_rate": 0.00010840871596430066, "loss": 0.0101, "step": 253170 }, { "epoch": 1.28, "learning_rate": 0.00010840114827128664, "loss": 0.0056, "step": 253180 }, { "epoch": 1.28, "learning_rate": 0.00010839358057827264, "loss": 0.0105, "step": 253190 }, { "epoch": 1.28, "learning_rate": 0.00010838601288525863, "loss": 0.0076, "step": 253200 }, { "epoch": 1.28, "learning_rate": 0.00010837844519224461, "loss": 0.0093, "step": 253210 }, { "epoch": 1.28, "learning_rate": 0.00010837087749923061, "loss": 0.0098, "step": 253220 }, { "epoch": 1.28, "learning_rate": 0.0001083633098062166, "loss": 0.0087, "step": 253230 }, { "epoch": 1.28, "learning_rate": 0.00010835574211320258, "loss": 0.0076, "step": 253240 }, { "epoch": 1.28, "learning_rate": 0.00010834817442018858, "loss": 0.0082, "step": 253250 }, { "epoch": 1.28, "learning_rate": 0.00010834060672717456, "loss": 0.0101, "step": 253260 }, { "epoch": 1.28, "learning_rate": 0.00010833303903416056, "loss": 0.0087, "step": 253270 }, { "epoch": 1.28, "learning_rate": 0.00010832547134114655, "loss": 0.0085, "step": 253280 }, { "epoch": 1.28, "learning_rate": 0.00010831790364813253, "loss": 0.0092, "step": 253290 }, { "epoch": 1.28, "learning_rate": 0.00010831033595511853, "loss": 0.0082, "step": 253300 }, { "epoch": 1.28, "learning_rate": 0.00010830276826210452, "loss": 0.0058, "step": 253310 }, { "epoch": 1.28, "learning_rate": 0.0001082952005690905, "loss": 0.0075, "step": 253320 }, { "epoch": 1.28, "learning_rate": 0.0001082876328760765, "loss": 0.008, "step": 253330 }, { "epoch": 1.28, "learning_rate": 0.00010828006518306249, "loss": 0.008, "step": 253340 }, { "epoch": 1.28, "learning_rate": 0.00010827249749004847, "loss": 0.0085, "step": 253350 }, { "epoch": 1.28, "learning_rate": 0.00010826492979703447, "loss": 0.0099, "step": 253360 }, { "epoch": 1.28, "learning_rate": 0.00010825736210402045, "loss": 0.0093, "step": 253370 }, { "epoch": 1.28, "learning_rate": 0.00010824979441100645, "loss": 0.0081, "step": 253380 }, { "epoch": 1.28, "learning_rate": 0.00010824222671799244, "loss": 0.0081, "step": 253390 }, { "epoch": 1.28, "learning_rate": 0.00010823465902497842, "loss": 0.0096, "step": 253400 }, { "epoch": 1.28, "learning_rate": 0.00010822709133196442, "loss": 0.0087, "step": 253410 }, { "epoch": 1.28, "learning_rate": 0.00010821952363895041, "loss": 0.0083, "step": 253420 }, { "epoch": 1.28, "learning_rate": 0.0001082119559459364, "loss": 0.0083, "step": 253430 }, { "epoch": 1.28, "learning_rate": 0.00010820438825292239, "loss": 0.008, "step": 253440 }, { "epoch": 1.28, "learning_rate": 0.00010819682055990837, "loss": 0.0079, "step": 253450 }, { "epoch": 1.28, "learning_rate": 0.00010818925286689437, "loss": 0.0076, "step": 253460 }, { "epoch": 1.28, "learning_rate": 0.00010818168517388036, "loss": 0.0065, "step": 253470 }, { "epoch": 1.28, "learning_rate": 0.00010817411748086634, "loss": 0.0085, "step": 253480 }, { "epoch": 1.28, "learning_rate": 0.00010816654978785234, "loss": 0.0091, "step": 253490 }, { "epoch": 1.28, "learning_rate": 0.00010815898209483833, "loss": 0.0084, "step": 253500 }, { "epoch": 1.28, "learning_rate": 0.00010815141440182431, "loss": 0.0096, "step": 253510 }, { "epoch": 1.28, "learning_rate": 0.00010814384670881031, "loss": 0.0078, "step": 253520 }, { "epoch": 1.28, "learning_rate": 0.00010813627901579629, "loss": 0.0063, "step": 253530 }, { "epoch": 1.28, "learning_rate": 0.00010812871132278228, "loss": 0.0098, "step": 253540 }, { "epoch": 1.28, "learning_rate": 0.00010812114362976828, "loss": 0.0076, "step": 253550 }, { "epoch": 1.28, "learning_rate": 0.00010811357593675426, "loss": 0.0078, "step": 253560 }, { "epoch": 1.28, "learning_rate": 0.00010810600824374026, "loss": 0.0088, "step": 253570 }, { "epoch": 1.28, "learning_rate": 0.00010809844055072622, "loss": 0.0088, "step": 253580 }, { "epoch": 1.28, "learning_rate": 0.00010809087285771222, "loss": 0.0081, "step": 253590 }, { "epoch": 1.28, "learning_rate": 0.00010808330516469821, "loss": 0.0106, "step": 253600 }, { "epoch": 1.28, "learning_rate": 0.0001080757374716842, "loss": 0.0098, "step": 253610 }, { "epoch": 1.28, "learning_rate": 0.00010806816977867019, "loss": 0.0077, "step": 253620 }, { "epoch": 1.28, "learning_rate": 0.00010806060208565617, "loss": 0.0113, "step": 253630 }, { "epoch": 1.28, "learning_rate": 0.00010805303439264217, "loss": 0.0108, "step": 253640 }, { "epoch": 1.28, "learning_rate": 0.00010804546669962816, "loss": 0.0066, "step": 253650 }, { "epoch": 1.28, "learning_rate": 0.00010803789900661414, "loss": 0.0083, "step": 253660 }, { "epoch": 1.28, "learning_rate": 0.00010803033131360014, "loss": 0.0077, "step": 253670 }, { "epoch": 1.28, "learning_rate": 0.00010802276362058613, "loss": 0.0091, "step": 253680 }, { "epoch": 1.28, "learning_rate": 0.00010801519592757211, "loss": 0.0111, "step": 253690 }, { "epoch": 1.28, "learning_rate": 0.00010800762823455811, "loss": 0.0066, "step": 253700 }, { "epoch": 1.28, "learning_rate": 0.00010800006054154409, "loss": 0.0086, "step": 253710 }, { "epoch": 1.28, "learning_rate": 0.00010799249284853009, "loss": 0.0077, "step": 253720 }, { "epoch": 1.28, "learning_rate": 0.00010798492515551608, "loss": 0.0101, "step": 253730 }, { "epoch": 1.28, "learning_rate": 0.00010797735746250206, "loss": 0.0064, "step": 253740 }, { "epoch": 1.28, "learning_rate": 0.00010796978976948806, "loss": 0.0095, "step": 253750 }, { "epoch": 1.28, "learning_rate": 0.00010796222207647405, "loss": 0.0089, "step": 253760 }, { "epoch": 1.28, "learning_rate": 0.00010795465438346003, "loss": 0.0085, "step": 253770 }, { "epoch": 1.28, "learning_rate": 0.00010794708669044603, "loss": 0.0114, "step": 253780 }, { "epoch": 1.28, "learning_rate": 0.00010793951899743202, "loss": 0.0083, "step": 253790 }, { "epoch": 1.28, "learning_rate": 0.000107931951304418, "loss": 0.0082, "step": 253800 }, { "epoch": 1.28, "learning_rate": 0.000107924383611404, "loss": 0.0098, "step": 253810 }, { "epoch": 1.28, "learning_rate": 0.00010791681591838998, "loss": 0.0109, "step": 253820 }, { "epoch": 1.28, "learning_rate": 0.00010790924822537598, "loss": 0.0069, "step": 253830 }, { "epoch": 1.28, "learning_rate": 0.00010790168053236197, "loss": 0.0092, "step": 253840 }, { "epoch": 1.28, "learning_rate": 0.00010789411283934795, "loss": 0.0066, "step": 253850 }, { "epoch": 1.28, "learning_rate": 0.00010788654514633395, "loss": 0.0077, "step": 253860 }, { "epoch": 1.28, "learning_rate": 0.00010787897745331994, "loss": 0.0086, "step": 253870 }, { "epoch": 1.28, "learning_rate": 0.00010787140976030592, "loss": 0.008, "step": 253880 }, { "epoch": 1.28, "learning_rate": 0.00010786384206729192, "loss": 0.0077, "step": 253890 }, { "epoch": 1.28, "learning_rate": 0.0001078562743742779, "loss": 0.0068, "step": 253900 }, { "epoch": 1.28, "learning_rate": 0.0001078487066812639, "loss": 0.0079, "step": 253910 }, { "epoch": 1.28, "learning_rate": 0.00010784113898824989, "loss": 0.0103, "step": 253920 }, { "epoch": 1.28, "learning_rate": 0.00010783357129523587, "loss": 0.0084, "step": 253930 }, { "epoch": 1.28, "learning_rate": 0.00010782600360222187, "loss": 0.0103, "step": 253940 }, { "epoch": 1.28, "learning_rate": 0.00010781843590920786, "loss": 0.0072, "step": 253950 }, { "epoch": 1.28, "learning_rate": 0.00010781086821619384, "loss": 0.0081, "step": 253960 }, { "epoch": 1.28, "learning_rate": 0.00010780330052317984, "loss": 0.0073, "step": 253970 }, { "epoch": 1.28, "learning_rate": 0.00010779573283016582, "loss": 0.0068, "step": 253980 }, { "epoch": 1.28, "learning_rate": 0.00010778816513715182, "loss": 0.0079, "step": 253990 }, { "epoch": 1.28, "learning_rate": 0.00010778059744413781, "loss": 0.0083, "step": 254000 }, { "epoch": 1.28, "eval_cer": 0.9144450256039017, "eval_loss": 0.00646965904161334, "eval_runtime": 116.1648, "eval_samples_per_second": 17.217, "eval_steps_per_second": 4.304, "step": 254000 }, { "epoch": 1.28, "learning_rate": 0.00010777302975112379, "loss": 0.0087, "step": 254010 }, { "epoch": 1.28, "learning_rate": 0.00010776546205810979, "loss": 0.0091, "step": 254020 }, { "epoch": 1.28, "learning_rate": 0.00010775789436509578, "loss": 0.0086, "step": 254030 }, { "epoch": 1.28, "learning_rate": 0.00010775032667208176, "loss": 0.007, "step": 254040 }, { "epoch": 1.28, "learning_rate": 0.00010774275897906776, "loss": 0.0056, "step": 254050 }, { "epoch": 1.28, "learning_rate": 0.00010773519128605374, "loss": 0.0102, "step": 254060 }, { "epoch": 1.28, "learning_rate": 0.00010772762359303973, "loss": 0.0067, "step": 254070 }, { "epoch": 1.28, "learning_rate": 0.00010772005590002573, "loss": 0.0117, "step": 254080 }, { "epoch": 1.28, "learning_rate": 0.00010771248820701171, "loss": 0.0115, "step": 254090 }, { "epoch": 1.28, "learning_rate": 0.0001077049205139977, "loss": 0.0086, "step": 254100 }, { "epoch": 1.28, "learning_rate": 0.0001076973528209837, "loss": 0.0099, "step": 254110 }, { "epoch": 1.28, "learning_rate": 0.00010768978512796968, "loss": 0.0091, "step": 254120 }, { "epoch": 1.28, "learning_rate": 0.00010768221743495568, "loss": 0.0071, "step": 254130 }, { "epoch": 1.28, "learning_rate": 0.00010767464974194166, "loss": 0.0087, "step": 254140 }, { "epoch": 1.28, "learning_rate": 0.00010766708204892765, "loss": 0.0093, "step": 254150 }, { "epoch": 1.28, "learning_rate": 0.00010765951435591365, "loss": 0.0119, "step": 254160 }, { "epoch": 1.28, "learning_rate": 0.00010765194666289963, "loss": 0.0076, "step": 254170 }, { "epoch": 1.28, "learning_rate": 0.00010764437896988563, "loss": 0.0086, "step": 254180 }, { "epoch": 1.28, "learning_rate": 0.00010763681127687162, "loss": 0.007, "step": 254190 }, { "epoch": 1.28, "learning_rate": 0.0001076292435838576, "loss": 0.0095, "step": 254200 }, { "epoch": 1.28, "learning_rate": 0.00010762167589084358, "loss": 0.0099, "step": 254210 }, { "epoch": 1.28, "learning_rate": 0.00010761410819782956, "loss": 0.0076, "step": 254220 }, { "epoch": 1.28, "learning_rate": 0.00010760654050481556, "loss": 0.0084, "step": 254230 }, { "epoch": 1.28, "learning_rate": 0.00010759897281180155, "loss": 0.0107, "step": 254240 }, { "epoch": 1.28, "learning_rate": 0.00010759140511878754, "loss": 0.0091, "step": 254250 }, { "epoch": 1.28, "learning_rate": 0.00010758383742577353, "loss": 0.0097, "step": 254260 }, { "epoch": 1.28, "learning_rate": 0.00010757626973275951, "loss": 0.0082, "step": 254270 }, { "epoch": 1.28, "learning_rate": 0.00010756870203974551, "loss": 0.0086, "step": 254280 }, { "epoch": 1.28, "learning_rate": 0.0001075611343467315, "loss": 0.0054, "step": 254290 }, { "epoch": 1.28, "learning_rate": 0.00010755356665371748, "loss": 0.0101, "step": 254300 }, { "epoch": 1.28, "learning_rate": 0.00010754599896070348, "loss": 0.0087, "step": 254310 }, { "epoch": 1.28, "learning_rate": 0.00010753843126768947, "loss": 0.008, "step": 254320 }, { "epoch": 1.28, "learning_rate": 0.00010753086357467546, "loss": 0.0066, "step": 254330 }, { "epoch": 1.28, "learning_rate": 0.00010752329588166145, "loss": 0.0086, "step": 254340 }, { "epoch": 1.28, "learning_rate": 0.00010751572818864743, "loss": 0.0067, "step": 254350 }, { "epoch": 1.28, "learning_rate": 0.00010750816049563343, "loss": 0.0075, "step": 254360 }, { "epoch": 1.28, "learning_rate": 0.00010750059280261942, "loss": 0.0091, "step": 254370 }, { "epoch": 1.28, "learning_rate": 0.0001074930251096054, "loss": 0.0079, "step": 254380 }, { "epoch": 1.28, "learning_rate": 0.0001074854574165914, "loss": 0.0082, "step": 254390 }, { "epoch": 1.28, "learning_rate": 0.0001074778897235774, "loss": 0.0079, "step": 254400 }, { "epoch": 1.28, "learning_rate": 0.00010747032203056337, "loss": 0.0081, "step": 254410 }, { "epoch": 1.28, "learning_rate": 0.00010746275433754937, "loss": 0.0174, "step": 254420 }, { "epoch": 1.28, "learning_rate": 0.00010745518664453535, "loss": 0.0067, "step": 254430 }, { "epoch": 1.28, "learning_rate": 0.00010744761895152135, "loss": 0.0102, "step": 254440 }, { "epoch": 1.28, "learning_rate": 0.00010744005125850734, "loss": 0.0054, "step": 254450 }, { "epoch": 1.28, "learning_rate": 0.00010743248356549332, "loss": 0.0075, "step": 254460 }, { "epoch": 1.28, "learning_rate": 0.00010742491587247932, "loss": 0.0085, "step": 254470 }, { "epoch": 1.28, "learning_rate": 0.00010741734817946531, "loss": 0.0096, "step": 254480 }, { "epoch": 1.28, "learning_rate": 0.0001074097804864513, "loss": 0.0095, "step": 254490 }, { "epoch": 1.28, "learning_rate": 0.00010740221279343729, "loss": 0.0095, "step": 254500 }, { "epoch": 1.28, "learning_rate": 0.00010739464510042327, "loss": 0.0093, "step": 254510 }, { "epoch": 1.28, "learning_rate": 0.00010738707740740927, "loss": 0.011, "step": 254520 }, { "epoch": 1.28, "learning_rate": 0.00010737950971439526, "loss": 0.0073, "step": 254530 }, { "epoch": 1.28, "learning_rate": 0.00010737194202138124, "loss": 0.0104, "step": 254540 }, { "epoch": 1.28, "learning_rate": 0.00010736437432836724, "loss": 0.0081, "step": 254550 }, { "epoch": 1.28, "learning_rate": 0.00010735680663535323, "loss": 0.0097, "step": 254560 }, { "epoch": 1.28, "learning_rate": 0.00010734923894233921, "loss": 0.0077, "step": 254570 }, { "epoch": 1.28, "learning_rate": 0.00010734167124932521, "loss": 0.0076, "step": 254580 }, { "epoch": 1.28, "learning_rate": 0.00010733410355631119, "loss": 0.0079, "step": 254590 }, { "epoch": 1.28, "learning_rate": 0.00010732653586329718, "loss": 0.0133, "step": 254600 }, { "epoch": 1.28, "learning_rate": 0.00010731896817028318, "loss": 0.0108, "step": 254610 }, { "epoch": 1.28, "learning_rate": 0.00010731140047726916, "loss": 0.0079, "step": 254620 }, { "epoch": 1.28, "learning_rate": 0.00010730383278425516, "loss": 0.0094, "step": 254630 }, { "epoch": 1.28, "learning_rate": 0.00010729626509124115, "loss": 0.0073, "step": 254640 }, { "epoch": 1.28, "learning_rate": 0.00010728869739822713, "loss": 0.0094, "step": 254650 }, { "epoch": 1.28, "learning_rate": 0.00010728112970521313, "loss": 0.0096, "step": 254660 }, { "epoch": 1.28, "learning_rate": 0.00010727356201219911, "loss": 0.0085, "step": 254670 }, { "epoch": 1.28, "learning_rate": 0.0001072659943191851, "loss": 0.0091, "step": 254680 }, { "epoch": 1.28, "learning_rate": 0.0001072584266261711, "loss": 0.0088, "step": 254690 }, { "epoch": 1.28, "learning_rate": 0.00010725085893315708, "loss": 0.0103, "step": 254700 }, { "epoch": 1.29, "learning_rate": 0.00010724329124014308, "loss": 0.0095, "step": 254710 }, { "epoch": 1.29, "learning_rate": 0.00010723572354712907, "loss": 0.0085, "step": 254720 }, { "epoch": 1.29, "learning_rate": 0.00010722815585411505, "loss": 0.0077, "step": 254730 }, { "epoch": 1.29, "learning_rate": 0.00010722058816110105, "loss": 0.0079, "step": 254740 }, { "epoch": 1.29, "learning_rate": 0.00010721302046808704, "loss": 0.0082, "step": 254750 }, { "epoch": 1.29, "learning_rate": 0.00010720545277507302, "loss": 0.0093, "step": 254760 }, { "epoch": 1.29, "learning_rate": 0.00010719788508205902, "loss": 0.0098, "step": 254770 }, { "epoch": 1.29, "learning_rate": 0.000107190317389045, "loss": 0.0109, "step": 254780 }, { "epoch": 1.29, "learning_rate": 0.000107182749696031, "loss": 0.0098, "step": 254790 }, { "epoch": 1.29, "learning_rate": 0.00010717518200301699, "loss": 0.0088, "step": 254800 }, { "epoch": 1.29, "learning_rate": 0.00010716761431000297, "loss": 0.0068, "step": 254810 }, { "epoch": 1.29, "learning_rate": 0.00010716004661698897, "loss": 0.0066, "step": 254820 }, { "epoch": 1.29, "learning_rate": 0.00010715247892397496, "loss": 0.0084, "step": 254830 }, { "epoch": 1.29, "learning_rate": 0.00010714491123096093, "loss": 0.0066, "step": 254840 }, { "epoch": 1.29, "learning_rate": 0.00010713734353794692, "loss": 0.0097, "step": 254850 }, { "epoch": 1.29, "learning_rate": 0.0001071297758449329, "loss": 0.0091, "step": 254860 }, { "epoch": 1.29, "learning_rate": 0.0001071222081519189, "loss": 0.0077, "step": 254870 }, { "epoch": 1.29, "learning_rate": 0.00010711464045890488, "loss": 0.0077, "step": 254880 }, { "epoch": 1.29, "learning_rate": 0.00010710707276589088, "loss": 0.0065, "step": 254890 }, { "epoch": 1.29, "learning_rate": 0.00010709950507287687, "loss": 0.0063, "step": 254900 }, { "epoch": 1.29, "learning_rate": 0.00010709193737986285, "loss": 0.0095, "step": 254910 }, { "epoch": 1.29, "learning_rate": 0.00010708436968684885, "loss": 0.0085, "step": 254920 }, { "epoch": 1.29, "learning_rate": 0.00010707680199383484, "loss": 0.0083, "step": 254930 }, { "epoch": 1.29, "learning_rate": 0.00010706923430082082, "loss": 0.0083, "step": 254940 }, { "epoch": 1.29, "learning_rate": 0.00010706166660780682, "loss": 0.0091, "step": 254950 }, { "epoch": 1.29, "learning_rate": 0.0001070540989147928, "loss": 0.0081, "step": 254960 }, { "epoch": 1.29, "learning_rate": 0.0001070465312217788, "loss": 0.0079, "step": 254970 }, { "epoch": 1.29, "learning_rate": 0.00010703896352876479, "loss": 0.0076, "step": 254980 }, { "epoch": 1.29, "learning_rate": 0.00010703139583575077, "loss": 0.0068, "step": 254990 }, { "epoch": 1.29, "learning_rate": 0.00010702382814273677, "loss": 0.0085, "step": 255000 }, { "epoch": 1.29, "eval_cer": 0.9144411440194001, "eval_loss": 0.006503617390990257, "eval_runtime": 116.441, "eval_samples_per_second": 17.176, "eval_steps_per_second": 4.294, "step": 255000 }, { "epoch": 1.29, "learning_rate": 0.00010701626044972276, "loss": 0.0077, "step": 255010 }, { "epoch": 1.29, "learning_rate": 0.00010700869275670874, "loss": 0.0102, "step": 255020 }, { "epoch": 1.29, "learning_rate": 0.00010700112506369474, "loss": 0.01, "step": 255030 }, { "epoch": 1.29, "learning_rate": 0.00010699355737068072, "loss": 0.0079, "step": 255040 }, { "epoch": 1.29, "learning_rate": 0.00010698598967766672, "loss": 0.0077, "step": 255050 }, { "epoch": 1.29, "learning_rate": 0.00010697842198465271, "loss": 0.0095, "step": 255060 }, { "epoch": 1.29, "learning_rate": 0.00010697085429163869, "loss": 0.0066, "step": 255070 }, { "epoch": 1.29, "learning_rate": 0.00010696328659862469, "loss": 0.0077, "step": 255080 }, { "epoch": 1.29, "learning_rate": 0.00010695571890561068, "loss": 0.0085, "step": 255090 }, { "epoch": 1.29, "learning_rate": 0.00010694815121259666, "loss": 0.0082, "step": 255100 }, { "epoch": 1.29, "learning_rate": 0.00010694058351958266, "loss": 0.0094, "step": 255110 }, { "epoch": 1.29, "learning_rate": 0.00010693301582656864, "loss": 0.0108, "step": 255120 }, { "epoch": 1.29, "learning_rate": 0.00010692544813355463, "loss": 0.0079, "step": 255130 }, { "epoch": 1.29, "learning_rate": 0.00010691788044054063, "loss": 0.0101, "step": 255140 }, { "epoch": 1.29, "learning_rate": 0.00010691031274752661, "loss": 0.0099, "step": 255150 }, { "epoch": 1.29, "learning_rate": 0.0001069027450545126, "loss": 0.0064, "step": 255160 }, { "epoch": 1.29, "learning_rate": 0.0001068951773614986, "loss": 0.0099, "step": 255170 }, { "epoch": 1.29, "learning_rate": 0.00010688760966848458, "loss": 0.0072, "step": 255180 }, { "epoch": 1.29, "learning_rate": 0.00010688004197547058, "loss": 0.0076, "step": 255190 }, { "epoch": 1.29, "learning_rate": 0.00010687247428245656, "loss": 0.0069, "step": 255200 }, { "epoch": 1.29, "learning_rate": 0.00010686490658944255, "loss": 0.0071, "step": 255210 }, { "epoch": 1.29, "learning_rate": 0.00010685733889642855, "loss": 0.0081, "step": 255220 }, { "epoch": 1.29, "learning_rate": 0.00010684977120341453, "loss": 0.0077, "step": 255230 }, { "epoch": 1.29, "learning_rate": 0.00010684220351040053, "loss": 0.0082, "step": 255240 }, { "epoch": 1.29, "learning_rate": 0.00010683463581738652, "loss": 0.0086, "step": 255250 }, { "epoch": 1.29, "learning_rate": 0.0001068270681243725, "loss": 0.0077, "step": 255260 }, { "epoch": 1.29, "learning_rate": 0.0001068195004313585, "loss": 0.0067, "step": 255270 }, { "epoch": 1.29, "learning_rate": 0.00010681193273834449, "loss": 0.0075, "step": 255280 }, { "epoch": 1.29, "learning_rate": 0.00010680436504533047, "loss": 0.0084, "step": 255290 }, { "epoch": 1.29, "learning_rate": 0.00010679679735231647, "loss": 0.009, "step": 255300 }, { "epoch": 1.29, "learning_rate": 0.00010678922965930245, "loss": 0.0091, "step": 255310 }, { "epoch": 1.29, "learning_rate": 0.00010678166196628845, "loss": 0.0089, "step": 255320 }, { "epoch": 1.29, "learning_rate": 0.00010677409427327444, "loss": 0.0099, "step": 255330 }, { "epoch": 1.29, "learning_rate": 0.00010676652658026042, "loss": 0.0086, "step": 255340 }, { "epoch": 1.29, "learning_rate": 0.00010675895888724642, "loss": 0.0082, "step": 255350 }, { "epoch": 1.29, "learning_rate": 0.00010675139119423241, "loss": 0.0066, "step": 255360 }, { "epoch": 1.29, "learning_rate": 0.00010674382350121839, "loss": 0.0111, "step": 255370 }, { "epoch": 1.29, "learning_rate": 0.00010673625580820439, "loss": 0.0081, "step": 255380 }, { "epoch": 1.29, "learning_rate": 0.00010672868811519037, "loss": 0.0074, "step": 255390 }, { "epoch": 1.29, "learning_rate": 0.00010672112042217636, "loss": 0.0077, "step": 255400 }, { "epoch": 1.29, "learning_rate": 0.00010671355272916236, "loss": 0.0106, "step": 255410 }, { "epoch": 1.29, "learning_rate": 0.00010670598503614834, "loss": 0.0102, "step": 255420 }, { "epoch": 1.29, "learning_rate": 0.00010669841734313434, "loss": 0.0095, "step": 255430 }, { "epoch": 1.29, "learning_rate": 0.00010669084965012033, "loss": 0.0085, "step": 255440 }, { "epoch": 1.29, "learning_rate": 0.00010668328195710631, "loss": 0.0077, "step": 255450 }, { "epoch": 1.29, "learning_rate": 0.00010667571426409231, "loss": 0.007, "step": 255460 }, { "epoch": 1.29, "learning_rate": 0.00010666814657107828, "loss": 0.0067, "step": 255470 }, { "epoch": 1.29, "learning_rate": 0.00010666057887806427, "loss": 0.0087, "step": 255480 }, { "epoch": 1.29, "learning_rate": 0.00010665301118505025, "loss": 0.0079, "step": 255490 }, { "epoch": 1.29, "learning_rate": 0.00010664544349203625, "loss": 0.0123, "step": 255500 }, { "epoch": 1.29, "learning_rate": 0.00010663787579902224, "loss": 0.0079, "step": 255510 }, { "epoch": 1.29, "learning_rate": 0.00010663030810600822, "loss": 0.0073, "step": 255520 }, { "epoch": 1.29, "learning_rate": 0.00010662274041299422, "loss": 0.0078, "step": 255530 }, { "epoch": 1.29, "learning_rate": 0.00010661517271998021, "loss": 0.0081, "step": 255540 }, { "epoch": 1.29, "learning_rate": 0.0001066076050269662, "loss": 0.0059, "step": 255550 }, { "epoch": 1.29, "learning_rate": 0.00010660003733395219, "loss": 0.0078, "step": 255560 }, { "epoch": 1.29, "learning_rate": 0.00010659246964093817, "loss": 0.0106, "step": 255570 }, { "epoch": 1.29, "learning_rate": 0.00010658490194792417, "loss": 0.0103, "step": 255580 }, { "epoch": 1.29, "learning_rate": 0.00010657733425491016, "loss": 0.0072, "step": 255590 }, { "epoch": 1.29, "learning_rate": 0.00010656976656189614, "loss": 0.0102, "step": 255600 }, { "epoch": 1.29, "learning_rate": 0.00010656219886888214, "loss": 0.0095, "step": 255610 }, { "epoch": 1.29, "learning_rate": 0.00010655463117586813, "loss": 0.01, "step": 255620 }, { "epoch": 1.29, "learning_rate": 0.00010654706348285411, "loss": 0.0071, "step": 255630 }, { "epoch": 1.29, "learning_rate": 0.00010653949578984011, "loss": 0.0072, "step": 255640 }, { "epoch": 1.29, "learning_rate": 0.00010653192809682609, "loss": 0.0082, "step": 255650 }, { "epoch": 1.29, "learning_rate": 0.00010652436040381209, "loss": 0.0116, "step": 255660 }, { "epoch": 1.29, "learning_rate": 0.00010651679271079808, "loss": 0.0079, "step": 255670 }, { "epoch": 1.29, "learning_rate": 0.00010650922501778406, "loss": 0.0082, "step": 255680 }, { "epoch": 1.29, "learning_rate": 0.00010650165732477006, "loss": 0.0076, "step": 255690 }, { "epoch": 1.29, "learning_rate": 0.00010649408963175605, "loss": 0.0062, "step": 255700 }, { "epoch": 1.29, "learning_rate": 0.00010648652193874203, "loss": 0.0081, "step": 255710 }, { "epoch": 1.29, "learning_rate": 0.00010647895424572803, "loss": 0.006, "step": 255720 }, { "epoch": 1.29, "learning_rate": 0.00010647138655271402, "loss": 0.0097, "step": 255730 }, { "epoch": 1.29, "learning_rate": 0.0001064638188597, "loss": 0.009, "step": 255740 }, { "epoch": 1.29, "learning_rate": 0.000106456251166686, "loss": 0.007, "step": 255750 }, { "epoch": 1.29, "learning_rate": 0.00010644868347367198, "loss": 0.0082, "step": 255760 }, { "epoch": 1.29, "learning_rate": 0.00010644111578065798, "loss": 0.0082, "step": 255770 }, { "epoch": 1.29, "learning_rate": 0.00010643354808764397, "loss": 0.0096, "step": 255780 }, { "epoch": 1.29, "learning_rate": 0.00010642598039462995, "loss": 0.0097, "step": 255790 }, { "epoch": 1.29, "learning_rate": 0.00010641841270161595, "loss": 0.0076, "step": 255800 }, { "epoch": 1.29, "learning_rate": 0.00010641084500860194, "loss": 0.0061, "step": 255810 }, { "epoch": 1.29, "learning_rate": 0.00010640327731558792, "loss": 0.0092, "step": 255820 }, { "epoch": 1.29, "learning_rate": 0.00010639570962257392, "loss": 0.0111, "step": 255830 }, { "epoch": 1.29, "learning_rate": 0.0001063881419295599, "loss": 0.0082, "step": 255840 }, { "epoch": 1.29, "learning_rate": 0.0001063805742365459, "loss": 0.0073, "step": 255850 }, { "epoch": 1.29, "learning_rate": 0.00010637300654353189, "loss": 0.01, "step": 255860 }, { "epoch": 1.29, "learning_rate": 0.00010636543885051787, "loss": 0.0084, "step": 255870 }, { "epoch": 1.29, "learning_rate": 0.00010635787115750387, "loss": 0.0084, "step": 255880 }, { "epoch": 1.29, "learning_rate": 0.00010635030346448986, "loss": 0.0101, "step": 255890 }, { "epoch": 1.29, "learning_rate": 0.00010634273577147584, "loss": 0.0082, "step": 255900 }, { "epoch": 1.29, "learning_rate": 0.00010633516807846184, "loss": 0.0078, "step": 255910 }, { "epoch": 1.29, "learning_rate": 0.00010632760038544782, "loss": 0.008, "step": 255920 }, { "epoch": 1.29, "learning_rate": 0.00010632003269243381, "loss": 0.0119, "step": 255930 }, { "epoch": 1.29, "learning_rate": 0.00010631246499941981, "loss": 0.0065, "step": 255940 }, { "epoch": 1.29, "learning_rate": 0.00010630489730640579, "loss": 0.0079, "step": 255950 }, { "epoch": 1.29, "learning_rate": 0.00010629732961339179, "loss": 0.0069, "step": 255960 }, { "epoch": 1.29, "learning_rate": 0.00010628976192037778, "loss": 0.0073, "step": 255970 }, { "epoch": 1.29, "learning_rate": 0.00010628219422736376, "loss": 0.01, "step": 255980 }, { "epoch": 1.29, "learning_rate": 0.00010627462653434976, "loss": 0.0083, "step": 255990 }, { "epoch": 1.29, "learning_rate": 0.00010626705884133574, "loss": 0.0072, "step": 256000 }, { "epoch": 1.29, "eval_cer": 0.9144615223380336, "eval_loss": 0.00655102264136076, "eval_runtime": 116.4546, "eval_samples_per_second": 17.174, "eval_steps_per_second": 4.294, "step": 256000 }, { "epoch": 1.29, "learning_rate": 0.00010625949114832173, "loss": 0.0075, "step": 256010 }, { "epoch": 1.29, "learning_rate": 0.00010625192345530773, "loss": 0.007, "step": 256020 }, { "epoch": 1.29, "learning_rate": 0.00010624435576229371, "loss": 0.01, "step": 256030 }, { "epoch": 1.29, "learning_rate": 0.0001062367880692797, "loss": 0.0083, "step": 256040 }, { "epoch": 1.29, "learning_rate": 0.0001062292203762657, "loss": 0.0073, "step": 256050 }, { "epoch": 1.29, "learning_rate": 0.00010622165268325168, "loss": 0.0081, "step": 256060 }, { "epoch": 1.29, "learning_rate": 0.00010621408499023768, "loss": 0.0099, "step": 256070 }, { "epoch": 1.29, "learning_rate": 0.00010620651729722366, "loss": 0.0083, "step": 256080 }, { "epoch": 1.29, "learning_rate": 0.00010619894960420965, "loss": 0.0073, "step": 256090 }, { "epoch": 1.29, "learning_rate": 0.00010619138191119562, "loss": 0.0084, "step": 256100 }, { "epoch": 1.29, "learning_rate": 0.00010618381421818162, "loss": 0.0085, "step": 256110 }, { "epoch": 1.29, "learning_rate": 0.00010617624652516761, "loss": 0.008, "step": 256120 }, { "epoch": 1.29, "learning_rate": 0.00010616867883215359, "loss": 0.0109, "step": 256130 }, { "epoch": 1.29, "learning_rate": 0.00010616111113913959, "loss": 0.0098, "step": 256140 }, { "epoch": 1.29, "learning_rate": 0.00010615354344612558, "loss": 0.0094, "step": 256150 }, { "epoch": 1.29, "learning_rate": 0.00010614597575311156, "loss": 0.0076, "step": 256160 }, { "epoch": 1.29, "learning_rate": 0.00010613840806009756, "loss": 0.0082, "step": 256170 }, { "epoch": 1.29, "learning_rate": 0.00010613084036708355, "loss": 0.0084, "step": 256180 }, { "epoch": 1.29, "learning_rate": 0.00010612327267406954, "loss": 0.0103, "step": 256190 }, { "epoch": 1.29, "learning_rate": 0.00010611570498105553, "loss": 0.0092, "step": 256200 }, { "epoch": 1.29, "learning_rate": 0.00010610813728804151, "loss": 0.0091, "step": 256210 }, { "epoch": 1.29, "learning_rate": 0.0001061005695950275, "loss": 0.0086, "step": 256220 }, { "epoch": 1.29, "learning_rate": 0.0001060930019020135, "loss": 0.0085, "step": 256230 }, { "epoch": 1.29, "learning_rate": 0.00010608543420899948, "loss": 0.0095, "step": 256240 }, { "epoch": 1.29, "learning_rate": 0.00010607786651598548, "loss": 0.0098, "step": 256250 }, { "epoch": 1.29, "learning_rate": 0.00010607029882297147, "loss": 0.0072, "step": 256260 }, { "epoch": 1.29, "learning_rate": 0.00010606273112995745, "loss": 0.0059, "step": 256270 }, { "epoch": 1.29, "learning_rate": 0.00010605516343694345, "loss": 0.0112, "step": 256280 }, { "epoch": 1.29, "learning_rate": 0.00010604759574392943, "loss": 0.0104, "step": 256290 }, { "epoch": 1.29, "learning_rate": 0.00010604002805091543, "loss": 0.0111, "step": 256300 }, { "epoch": 1.29, "learning_rate": 0.00010603246035790142, "loss": 0.0069, "step": 256310 }, { "epoch": 1.29, "learning_rate": 0.0001060248926648874, "loss": 0.0092, "step": 256320 }, { "epoch": 1.29, "learning_rate": 0.0001060173249718734, "loss": 0.0073, "step": 256330 }, { "epoch": 1.29, "learning_rate": 0.00010600975727885939, "loss": 0.0066, "step": 256340 }, { "epoch": 1.29, "learning_rate": 0.00010600218958584537, "loss": 0.0065, "step": 256350 }, { "epoch": 1.29, "learning_rate": 0.00010599462189283137, "loss": 0.0083, "step": 256360 }, { "epoch": 1.29, "learning_rate": 0.00010598705419981735, "loss": 0.0079, "step": 256370 }, { "epoch": 1.29, "learning_rate": 0.00010597948650680335, "loss": 0.0065, "step": 256380 }, { "epoch": 1.29, "learning_rate": 0.00010597191881378934, "loss": 0.0103, "step": 256390 }, { "epoch": 1.29, "learning_rate": 0.00010596435112077532, "loss": 0.0078, "step": 256400 }, { "epoch": 1.29, "learning_rate": 0.00010595678342776132, "loss": 0.0073, "step": 256410 }, { "epoch": 1.29, "learning_rate": 0.00010594921573474731, "loss": 0.0068, "step": 256420 }, { "epoch": 1.29, "learning_rate": 0.00010594164804173329, "loss": 0.0089, "step": 256430 }, { "epoch": 1.29, "learning_rate": 0.00010593408034871929, "loss": 0.0068, "step": 256440 }, { "epoch": 1.29, "learning_rate": 0.00010592651265570527, "loss": 0.0098, "step": 256450 }, { "epoch": 1.29, "learning_rate": 0.00010591894496269126, "loss": 0.0068, "step": 256460 }, { "epoch": 1.29, "learning_rate": 0.00010591137726967726, "loss": 0.0096, "step": 256470 }, { "epoch": 1.29, "learning_rate": 0.00010590380957666324, "loss": 0.0087, "step": 256480 }, { "epoch": 1.29, "learning_rate": 0.00010589624188364924, "loss": 0.0102, "step": 256490 }, { "epoch": 1.29, "learning_rate": 0.00010588867419063523, "loss": 0.0071, "step": 256500 }, { "epoch": 1.29, "learning_rate": 0.00010588110649762121, "loss": 0.0083, "step": 256510 }, { "epoch": 1.29, "learning_rate": 0.00010587353880460721, "loss": 0.0073, "step": 256520 }, { "epoch": 1.29, "learning_rate": 0.00010586597111159319, "loss": 0.0082, "step": 256530 }, { "epoch": 1.29, "learning_rate": 0.00010585840341857918, "loss": 0.0058, "step": 256540 }, { "epoch": 1.29, "learning_rate": 0.00010585083572556518, "loss": 0.0082, "step": 256550 }, { "epoch": 1.29, "learning_rate": 0.00010584326803255116, "loss": 0.0075, "step": 256560 }, { "epoch": 1.29, "learning_rate": 0.00010583570033953716, "loss": 0.0111, "step": 256570 }, { "epoch": 1.29, "learning_rate": 0.00010582813264652315, "loss": 0.0122, "step": 256580 }, { "epoch": 1.29, "learning_rate": 0.00010582056495350913, "loss": 0.0064, "step": 256590 }, { "epoch": 1.29, "learning_rate": 0.00010581299726049513, "loss": 0.007, "step": 256600 }, { "epoch": 1.29, "learning_rate": 0.00010580542956748111, "loss": 0.0099, "step": 256610 }, { "epoch": 1.29, "learning_rate": 0.0001057978618744671, "loss": 0.0096, "step": 256620 }, { "epoch": 1.29, "learning_rate": 0.0001057902941814531, "loss": 0.0086, "step": 256630 }, { "epoch": 1.29, "learning_rate": 0.00010578272648843908, "loss": 0.0067, "step": 256640 }, { "epoch": 1.29, "learning_rate": 0.00010577515879542507, "loss": 0.0092, "step": 256650 }, { "epoch": 1.29, "learning_rate": 0.00010576759110241107, "loss": 0.0104, "step": 256660 }, { "epoch": 1.29, "learning_rate": 0.00010576002340939705, "loss": 0.0091, "step": 256670 }, { "epoch": 1.29, "learning_rate": 0.00010575245571638305, "loss": 0.0085, "step": 256680 }, { "epoch": 1.3, "learning_rate": 0.00010574488802336904, "loss": 0.0091, "step": 256690 }, { "epoch": 1.3, "learning_rate": 0.00010573732033035502, "loss": 0.0096, "step": 256700 }, { "epoch": 1.3, "learning_rate": 0.00010572975263734102, "loss": 0.0076, "step": 256710 }, { "epoch": 1.3, "learning_rate": 0.00010572218494432699, "loss": 0.0088, "step": 256720 }, { "epoch": 1.3, "learning_rate": 0.00010571461725131298, "loss": 0.0076, "step": 256730 }, { "epoch": 1.3, "learning_rate": 0.00010570704955829896, "loss": 0.0076, "step": 256740 }, { "epoch": 1.3, "learning_rate": 0.00010569948186528496, "loss": 0.007, "step": 256750 }, { "epoch": 1.3, "learning_rate": 0.00010569191417227095, "loss": 0.0103, "step": 256760 }, { "epoch": 1.3, "learning_rate": 0.00010568434647925693, "loss": 0.0113, "step": 256770 }, { "epoch": 1.3, "learning_rate": 0.00010567677878624293, "loss": 0.0086, "step": 256780 }, { "epoch": 1.3, "learning_rate": 0.00010566921109322892, "loss": 0.0086, "step": 256790 }, { "epoch": 1.3, "learning_rate": 0.0001056616434002149, "loss": 0.0076, "step": 256800 }, { "epoch": 1.3, "learning_rate": 0.0001056540757072009, "loss": 0.0071, "step": 256810 }, { "epoch": 1.3, "learning_rate": 0.00010564650801418688, "loss": 0.0076, "step": 256820 }, { "epoch": 1.3, "learning_rate": 0.00010563894032117288, "loss": 0.0079, "step": 256830 }, { "epoch": 1.3, "learning_rate": 0.00010563137262815887, "loss": 0.0084, "step": 256840 }, { "epoch": 1.3, "learning_rate": 0.00010562380493514485, "loss": 0.0096, "step": 256850 }, { "epoch": 1.3, "learning_rate": 0.00010561623724213085, "loss": 0.0077, "step": 256860 }, { "epoch": 1.3, "learning_rate": 0.00010560866954911684, "loss": 0.0073, "step": 256870 }, { "epoch": 1.3, "learning_rate": 0.00010560110185610282, "loss": 0.0058, "step": 256880 }, { "epoch": 1.3, "learning_rate": 0.00010559353416308882, "loss": 0.0077, "step": 256890 }, { "epoch": 1.3, "learning_rate": 0.0001055859664700748, "loss": 0.009, "step": 256900 }, { "epoch": 1.3, "learning_rate": 0.0001055783987770608, "loss": 0.0109, "step": 256910 }, { "epoch": 1.3, "learning_rate": 0.00010557083108404679, "loss": 0.0076, "step": 256920 }, { "epoch": 1.3, "learning_rate": 0.00010556326339103277, "loss": 0.0121, "step": 256930 }, { "epoch": 1.3, "learning_rate": 0.00010555569569801877, "loss": 0.0067, "step": 256940 }, { "epoch": 1.3, "learning_rate": 0.00010554812800500476, "loss": 0.0082, "step": 256950 }, { "epoch": 1.3, "learning_rate": 0.00010554056031199074, "loss": 0.0062, "step": 256960 }, { "epoch": 1.3, "learning_rate": 0.00010553299261897674, "loss": 0.0082, "step": 256970 }, { "epoch": 1.3, "learning_rate": 0.00010552542492596272, "loss": 0.007, "step": 256980 }, { "epoch": 1.3, "learning_rate": 0.00010551785723294871, "loss": 0.0085, "step": 256990 }, { "epoch": 1.3, "learning_rate": 0.00010551028953993471, "loss": 0.0071, "step": 257000 }, { "epoch": 1.3, "eval_cer": 0.914467344714786, "eval_loss": 0.006512925960123539, "eval_runtime": 116.5432, "eval_samples_per_second": 17.161, "eval_steps_per_second": 4.29, "step": 257000 }, { "epoch": 1.3, "learning_rate": 0.00010550272184692069, "loss": 0.0082, "step": 257010 }, { "epoch": 1.3, "learning_rate": 0.00010549515415390669, "loss": 0.0078, "step": 257020 }, { "epoch": 1.3, "learning_rate": 0.00010548758646089268, "loss": 0.0088, "step": 257030 }, { "epoch": 1.3, "learning_rate": 0.00010548001876787866, "loss": 0.0096, "step": 257040 }, { "epoch": 1.3, "learning_rate": 0.00010547245107486466, "loss": 0.0073, "step": 257050 }, { "epoch": 1.3, "learning_rate": 0.00010546488338185064, "loss": 0.0076, "step": 257060 }, { "epoch": 1.3, "learning_rate": 0.00010545731568883663, "loss": 0.0102, "step": 257070 }, { "epoch": 1.3, "learning_rate": 0.00010544974799582263, "loss": 0.009, "step": 257080 }, { "epoch": 1.3, "learning_rate": 0.00010544218030280861, "loss": 0.0085, "step": 257090 }, { "epoch": 1.3, "learning_rate": 0.0001054346126097946, "loss": 0.011, "step": 257100 }, { "epoch": 1.3, "learning_rate": 0.0001054270449167806, "loss": 0.0064, "step": 257110 }, { "epoch": 1.3, "learning_rate": 0.00010541947722376658, "loss": 0.0097, "step": 257120 }, { "epoch": 1.3, "learning_rate": 0.00010541190953075258, "loss": 0.0094, "step": 257130 }, { "epoch": 1.3, "learning_rate": 0.00010540434183773856, "loss": 0.0082, "step": 257140 }, { "epoch": 1.3, "learning_rate": 0.00010539677414472455, "loss": 0.0079, "step": 257150 }, { "epoch": 1.3, "learning_rate": 0.00010538920645171055, "loss": 0.0079, "step": 257160 }, { "epoch": 1.3, "learning_rate": 0.00010538163875869653, "loss": 0.0105, "step": 257170 }, { "epoch": 1.3, "learning_rate": 0.00010537407106568252, "loss": 0.0108, "step": 257180 }, { "epoch": 1.3, "learning_rate": 0.00010536650337266852, "loss": 0.0124, "step": 257190 }, { "epoch": 1.3, "learning_rate": 0.0001053589356796545, "loss": 0.0101, "step": 257200 }, { "epoch": 1.3, "learning_rate": 0.0001053513679866405, "loss": 0.0067, "step": 257210 }, { "epoch": 1.3, "learning_rate": 0.00010534380029362649, "loss": 0.0089, "step": 257220 }, { "epoch": 1.3, "learning_rate": 0.00010533623260061247, "loss": 0.0073, "step": 257230 }, { "epoch": 1.3, "learning_rate": 0.00010532866490759847, "loss": 0.01, "step": 257240 }, { "epoch": 1.3, "learning_rate": 0.00010532109721458445, "loss": 0.0087, "step": 257250 }, { "epoch": 1.3, "learning_rate": 0.00010531352952157044, "loss": 0.0102, "step": 257260 }, { "epoch": 1.3, "learning_rate": 0.00010530596182855644, "loss": 0.0081, "step": 257270 }, { "epoch": 1.3, "learning_rate": 0.00010529839413554242, "loss": 0.0079, "step": 257280 }, { "epoch": 1.3, "learning_rate": 0.00010529082644252842, "loss": 0.0071, "step": 257290 }, { "epoch": 1.3, "learning_rate": 0.00010528325874951441, "loss": 0.0066, "step": 257300 }, { "epoch": 1.3, "learning_rate": 0.00010527569105650039, "loss": 0.0088, "step": 257310 }, { "epoch": 1.3, "learning_rate": 0.00010526812336348639, "loss": 0.0085, "step": 257320 }, { "epoch": 1.3, "learning_rate": 0.00010526055567047237, "loss": 0.0074, "step": 257330 }, { "epoch": 1.3, "learning_rate": 0.00010525298797745836, "loss": 0.0088, "step": 257340 }, { "epoch": 1.3, "learning_rate": 0.00010524542028444433, "loss": 0.0078, "step": 257350 }, { "epoch": 1.3, "learning_rate": 0.00010523785259143033, "loss": 0.0096, "step": 257360 }, { "epoch": 1.3, "learning_rate": 0.00010523028489841632, "loss": 0.0087, "step": 257370 }, { "epoch": 1.3, "learning_rate": 0.0001052227172054023, "loss": 0.0079, "step": 257380 }, { "epoch": 1.3, "learning_rate": 0.0001052151495123883, "loss": 0.0085, "step": 257390 }, { "epoch": 1.3, "learning_rate": 0.00010520758181937429, "loss": 0.0082, "step": 257400 }, { "epoch": 1.3, "learning_rate": 0.00010520001412636027, "loss": 0.0067, "step": 257410 }, { "epoch": 1.3, "learning_rate": 0.00010519244643334627, "loss": 0.0085, "step": 257420 }, { "epoch": 1.3, "learning_rate": 0.00010518487874033225, "loss": 0.0092, "step": 257430 }, { "epoch": 1.3, "learning_rate": 0.00010517731104731825, "loss": 0.0061, "step": 257440 }, { "epoch": 1.3, "learning_rate": 0.00010516974335430424, "loss": 0.0104, "step": 257450 }, { "epoch": 1.3, "learning_rate": 0.00010516217566129022, "loss": 0.0088, "step": 257460 }, { "epoch": 1.3, "learning_rate": 0.00010515460796827622, "loss": 0.0077, "step": 257470 }, { "epoch": 1.3, "learning_rate": 0.00010514704027526221, "loss": 0.007, "step": 257480 }, { "epoch": 1.3, "learning_rate": 0.0001051394725822482, "loss": 0.008, "step": 257490 }, { "epoch": 1.3, "learning_rate": 0.00010513190488923419, "loss": 0.0072, "step": 257500 }, { "epoch": 1.3, "learning_rate": 0.00010512433719622017, "loss": 0.0091, "step": 257510 }, { "epoch": 1.3, "learning_rate": 0.00010511676950320616, "loss": 0.0077, "step": 257520 }, { "epoch": 1.3, "learning_rate": 0.00010510920181019216, "loss": 0.007, "step": 257530 }, { "epoch": 1.3, "learning_rate": 0.00010510163411717814, "loss": 0.0059, "step": 257540 }, { "epoch": 1.3, "learning_rate": 0.00010509406642416414, "loss": 0.009, "step": 257550 }, { "epoch": 1.3, "learning_rate": 0.00010508649873115013, "loss": 0.0077, "step": 257560 }, { "epoch": 1.3, "learning_rate": 0.00010507893103813611, "loss": 0.009, "step": 257570 }, { "epoch": 1.3, "learning_rate": 0.00010507136334512211, "loss": 0.0083, "step": 257580 }, { "epoch": 1.3, "learning_rate": 0.00010506379565210809, "loss": 0.008, "step": 257590 }, { "epoch": 1.3, "learning_rate": 0.00010505622795909408, "loss": 0.008, "step": 257600 }, { "epoch": 1.3, "learning_rate": 0.00010504866026608008, "loss": 0.0073, "step": 257610 }, { "epoch": 1.3, "learning_rate": 0.00010504109257306606, "loss": 0.0072, "step": 257620 }, { "epoch": 1.3, "learning_rate": 0.00010503352488005206, "loss": 0.008, "step": 257630 }, { "epoch": 1.3, "learning_rate": 0.00010502595718703805, "loss": 0.009, "step": 257640 }, { "epoch": 1.3, "learning_rate": 0.00010501838949402403, "loss": 0.0075, "step": 257650 }, { "epoch": 1.3, "learning_rate": 0.00010501082180101003, "loss": 0.0096, "step": 257660 }, { "epoch": 1.3, "learning_rate": 0.00010500325410799602, "loss": 0.0074, "step": 257670 }, { "epoch": 1.3, "learning_rate": 0.000104995686414982, "loss": 0.0097, "step": 257680 }, { "epoch": 1.3, "learning_rate": 0.000104988118721968, "loss": 0.0064, "step": 257690 }, { "epoch": 1.3, "learning_rate": 0.00010498055102895398, "loss": 0.0084, "step": 257700 }, { "epoch": 1.3, "learning_rate": 0.00010497298333593997, "loss": 0.0089, "step": 257710 }, { "epoch": 1.3, "learning_rate": 0.00010496541564292597, "loss": 0.0076, "step": 257720 }, { "epoch": 1.3, "learning_rate": 0.00010495784794991195, "loss": 0.0089, "step": 257730 }, { "epoch": 1.3, "learning_rate": 0.00010495028025689795, "loss": 0.0091, "step": 257740 }, { "epoch": 1.3, "learning_rate": 0.00010494271256388394, "loss": 0.0084, "step": 257750 }, { "epoch": 1.3, "learning_rate": 0.00010493514487086992, "loss": 0.0105, "step": 257760 }, { "epoch": 1.3, "learning_rate": 0.00010492757717785592, "loss": 0.0098, "step": 257770 }, { "epoch": 1.3, "learning_rate": 0.0001049200094848419, "loss": 0.0094, "step": 257780 }, { "epoch": 1.3, "learning_rate": 0.0001049124417918279, "loss": 0.0105, "step": 257790 }, { "epoch": 1.3, "learning_rate": 0.00010490487409881389, "loss": 0.0093, "step": 257800 }, { "epoch": 1.3, "learning_rate": 0.00010489730640579987, "loss": 0.0108, "step": 257810 }, { "epoch": 1.3, "learning_rate": 0.00010488973871278587, "loss": 0.008, "step": 257820 }, { "epoch": 1.3, "learning_rate": 0.00010488217101977186, "loss": 0.0075, "step": 257830 }, { "epoch": 1.3, "learning_rate": 0.00010487460332675784, "loss": 0.0106, "step": 257840 }, { "epoch": 1.3, "learning_rate": 0.00010486703563374384, "loss": 0.0066, "step": 257850 }, { "epoch": 1.3, "learning_rate": 0.00010485946794072982, "loss": 0.0099, "step": 257860 }, { "epoch": 1.3, "learning_rate": 0.00010485190024771581, "loss": 0.0085, "step": 257870 }, { "epoch": 1.3, "learning_rate": 0.00010484433255470181, "loss": 0.0074, "step": 257880 }, { "epoch": 1.3, "learning_rate": 0.00010483676486168779, "loss": 0.0097, "step": 257890 }, { "epoch": 1.3, "learning_rate": 0.00010482919716867378, "loss": 0.0063, "step": 257900 }, { "epoch": 1.3, "learning_rate": 0.00010482162947565978, "loss": 0.0108, "step": 257910 }, { "epoch": 1.3, "learning_rate": 0.00010481406178264576, "loss": 0.0082, "step": 257920 }, { "epoch": 1.3, "learning_rate": 0.00010480649408963176, "loss": 0.011, "step": 257930 }, { "epoch": 1.3, "learning_rate": 0.00010479892639661774, "loss": 0.0069, "step": 257940 }, { "epoch": 1.3, "learning_rate": 0.00010479135870360373, "loss": 0.0096, "step": 257950 }, { "epoch": 1.3, "learning_rate": 0.00010478379101058973, "loss": 0.0081, "step": 257960 }, { "epoch": 1.3, "learning_rate": 0.00010477622331757571, "loss": 0.0073, "step": 257970 }, { "epoch": 1.3, "learning_rate": 0.00010476865562456169, "loss": 0.0075, "step": 257980 }, { "epoch": 1.3, "learning_rate": 0.00010476108793154767, "loss": 0.0078, "step": 257990 }, { "epoch": 1.3, "learning_rate": 0.00010475352023853367, "loss": 0.007, "step": 258000 }, { "epoch": 1.3, "eval_cer": 0.9144421144155256, "eval_loss": 0.006312798708677292, "eval_runtime": 116.232, "eval_samples_per_second": 17.207, "eval_steps_per_second": 4.302, "step": 258000 }, { "epoch": 1.3, "learning_rate": 0.00010474595254551966, "loss": 0.0089, "step": 258010 }, { "epoch": 1.3, "learning_rate": 0.00010473838485250564, "loss": 0.0082, "step": 258020 }, { "epoch": 1.3, "learning_rate": 0.00010473081715949164, "loss": 0.0086, "step": 258030 }, { "epoch": 1.3, "learning_rate": 0.00010472324946647762, "loss": 0.0103, "step": 258040 }, { "epoch": 1.3, "learning_rate": 0.00010471568177346362, "loss": 0.0107, "step": 258050 }, { "epoch": 1.3, "learning_rate": 0.00010470811408044961, "loss": 0.0083, "step": 258060 }, { "epoch": 1.3, "learning_rate": 0.00010470054638743559, "loss": 0.0068, "step": 258070 }, { "epoch": 1.3, "learning_rate": 0.00010469297869442159, "loss": 0.0113, "step": 258080 }, { "epoch": 1.3, "learning_rate": 0.00010468541100140758, "loss": 0.0092, "step": 258090 }, { "epoch": 1.3, "learning_rate": 0.00010467784330839356, "loss": 0.0082, "step": 258100 }, { "epoch": 1.3, "learning_rate": 0.00010467027561537956, "loss": 0.0086, "step": 258110 }, { "epoch": 1.3, "learning_rate": 0.00010466270792236555, "loss": 0.007, "step": 258120 }, { "epoch": 1.3, "learning_rate": 0.00010465514022935153, "loss": 0.0097, "step": 258130 }, { "epoch": 1.3, "learning_rate": 0.00010464757253633753, "loss": 0.0092, "step": 258140 }, { "epoch": 1.3, "learning_rate": 0.00010464000484332351, "loss": 0.0081, "step": 258150 }, { "epoch": 1.3, "learning_rate": 0.0001046324371503095, "loss": 0.0077, "step": 258160 }, { "epoch": 1.3, "learning_rate": 0.0001046248694572955, "loss": 0.0097, "step": 258170 }, { "epoch": 1.3, "learning_rate": 0.00010461730176428148, "loss": 0.0071, "step": 258180 }, { "epoch": 1.3, "learning_rate": 0.00010460973407126748, "loss": 0.009, "step": 258190 }, { "epoch": 1.3, "learning_rate": 0.00010460216637825347, "loss": 0.0083, "step": 258200 }, { "epoch": 1.3, "learning_rate": 0.00010459459868523945, "loss": 0.0077, "step": 258210 }, { "epoch": 1.3, "learning_rate": 0.00010458703099222545, "loss": 0.0066, "step": 258220 }, { "epoch": 1.3, "learning_rate": 0.00010457946329921143, "loss": 0.0066, "step": 258230 }, { "epoch": 1.3, "learning_rate": 0.00010457189560619743, "loss": 0.011, "step": 258240 }, { "epoch": 1.3, "learning_rate": 0.00010456432791318342, "loss": 0.0082, "step": 258250 }, { "epoch": 1.3, "learning_rate": 0.0001045567602201694, "loss": 0.0067, "step": 258260 }, { "epoch": 1.3, "learning_rate": 0.0001045491925271554, "loss": 0.0081, "step": 258270 }, { "epoch": 1.3, "learning_rate": 0.00010454162483414139, "loss": 0.0085, "step": 258280 }, { "epoch": 1.3, "learning_rate": 0.00010453405714112737, "loss": 0.007, "step": 258290 }, { "epoch": 1.3, "learning_rate": 0.00010452648944811337, "loss": 0.0118, "step": 258300 }, { "epoch": 1.3, "learning_rate": 0.00010451892175509935, "loss": 0.0094, "step": 258310 }, { "epoch": 1.3, "learning_rate": 0.00010451135406208534, "loss": 0.008, "step": 258320 }, { "epoch": 1.3, "learning_rate": 0.00010450378636907134, "loss": 0.0089, "step": 258330 }, { "epoch": 1.3, "learning_rate": 0.00010449621867605732, "loss": 0.006, "step": 258340 }, { "epoch": 1.3, "learning_rate": 0.00010448865098304332, "loss": 0.0077, "step": 258350 }, { "epoch": 1.3, "learning_rate": 0.00010448108329002931, "loss": 0.0082, "step": 258360 }, { "epoch": 1.3, "learning_rate": 0.00010447351559701529, "loss": 0.0083, "step": 258370 }, { "epoch": 1.3, "learning_rate": 0.00010446594790400129, "loss": 0.0097, "step": 258380 }, { "epoch": 1.3, "learning_rate": 0.00010445838021098727, "loss": 0.0065, "step": 258390 }, { "epoch": 1.3, "learning_rate": 0.00010445081251797326, "loss": 0.0105, "step": 258400 }, { "epoch": 1.3, "learning_rate": 0.00010444324482495926, "loss": 0.0073, "step": 258410 }, { "epoch": 1.3, "learning_rate": 0.00010443567713194524, "loss": 0.0108, "step": 258420 }, { "epoch": 1.3, "learning_rate": 0.00010442810943893124, "loss": 0.0085, "step": 258430 }, { "epoch": 1.3, "learning_rate": 0.00010442054174591723, "loss": 0.0084, "step": 258440 }, { "epoch": 1.3, "learning_rate": 0.00010441297405290321, "loss": 0.0084, "step": 258450 }, { "epoch": 1.3, "learning_rate": 0.0001044054063598892, "loss": 0.0079, "step": 258460 }, { "epoch": 1.3, "learning_rate": 0.00010439783866687519, "loss": 0.0085, "step": 258470 }, { "epoch": 1.3, "learning_rate": 0.00010439027097386118, "loss": 0.0098, "step": 258480 }, { "epoch": 1.3, "learning_rate": 0.00010438270328084718, "loss": 0.008, "step": 258490 }, { "epoch": 1.3, "learning_rate": 0.00010437513558783316, "loss": 0.0082, "step": 258500 }, { "epoch": 1.3, "learning_rate": 0.00010436756789481915, "loss": 0.0082, "step": 258510 }, { "epoch": 1.3, "learning_rate": 0.00010436000020180515, "loss": 0.0095, "step": 258520 }, { "epoch": 1.3, "learning_rate": 0.00010435243250879113, "loss": 0.0095, "step": 258530 }, { "epoch": 1.3, "learning_rate": 0.00010434486481577713, "loss": 0.0096, "step": 258540 }, { "epoch": 1.3, "learning_rate": 0.00010433729712276311, "loss": 0.007, "step": 258550 }, { "epoch": 1.3, "learning_rate": 0.0001043297294297491, "loss": 0.0083, "step": 258560 }, { "epoch": 1.3, "learning_rate": 0.0001043221617367351, "loss": 0.0082, "step": 258570 }, { "epoch": 1.3, "learning_rate": 0.00010431459404372108, "loss": 0.01, "step": 258580 }, { "epoch": 1.3, "learning_rate": 0.00010430702635070707, "loss": 0.0061, "step": 258590 }, { "epoch": 1.3, "learning_rate": 0.00010429945865769307, "loss": 0.0076, "step": 258600 }, { "epoch": 1.3, "learning_rate": 0.00010429189096467904, "loss": 0.0081, "step": 258610 }, { "epoch": 1.3, "learning_rate": 0.00010428432327166503, "loss": 0.0086, "step": 258620 }, { "epoch": 1.3, "learning_rate": 0.00010427675557865101, "loss": 0.0075, "step": 258630 }, { "epoch": 1.3, "learning_rate": 0.00010426918788563701, "loss": 0.0092, "step": 258640 }, { "epoch": 1.3, "learning_rate": 0.000104261620192623, "loss": 0.0064, "step": 258650 }, { "epoch": 1.3, "learning_rate": 0.00010425405249960898, "loss": 0.0091, "step": 258660 }, { "epoch": 1.31, "learning_rate": 0.00010424648480659498, "loss": 0.007, "step": 258670 }, { "epoch": 1.31, "learning_rate": 0.00010423891711358096, "loss": 0.0089, "step": 258680 }, { "epoch": 1.31, "learning_rate": 0.00010423134942056696, "loss": 0.0069, "step": 258690 }, { "epoch": 1.31, "learning_rate": 0.00010422378172755295, "loss": 0.0081, "step": 258700 }, { "epoch": 1.31, "learning_rate": 0.00010421621403453893, "loss": 0.0078, "step": 258710 }, { "epoch": 1.31, "learning_rate": 0.00010420864634152493, "loss": 0.0069, "step": 258720 }, { "epoch": 1.31, "learning_rate": 0.00010420107864851092, "loss": 0.0089, "step": 258730 }, { "epoch": 1.31, "learning_rate": 0.0001041935109554969, "loss": 0.0078, "step": 258740 }, { "epoch": 1.31, "learning_rate": 0.0001041859432624829, "loss": 0.0086, "step": 258750 }, { "epoch": 1.31, "learning_rate": 0.00010417837556946888, "loss": 0.0085, "step": 258760 }, { "epoch": 1.31, "learning_rate": 0.00010417080787645488, "loss": 0.0093, "step": 258770 }, { "epoch": 1.31, "learning_rate": 0.00010416324018344087, "loss": 0.0079, "step": 258780 }, { "epoch": 1.31, "learning_rate": 0.00010415567249042685, "loss": 0.0091, "step": 258790 }, { "epoch": 1.31, "learning_rate": 0.00010414810479741285, "loss": 0.0072, "step": 258800 }, { "epoch": 1.31, "learning_rate": 0.00010414053710439884, "loss": 0.0086, "step": 258810 }, { "epoch": 1.31, "learning_rate": 0.00010413296941138482, "loss": 0.011, "step": 258820 }, { "epoch": 1.31, "learning_rate": 0.00010412540171837082, "loss": 0.0079, "step": 258830 }, { "epoch": 1.31, "learning_rate": 0.0001041178340253568, "loss": 0.0096, "step": 258840 }, { "epoch": 1.31, "learning_rate": 0.0001041102663323428, "loss": 0.0082, "step": 258850 }, { "epoch": 1.31, "learning_rate": 0.00010410269863932879, "loss": 0.0087, "step": 258860 }, { "epoch": 1.31, "learning_rate": 0.00010409513094631477, "loss": 0.0074, "step": 258870 }, { "epoch": 1.31, "learning_rate": 0.00010408756325330077, "loss": 0.0072, "step": 258880 }, { "epoch": 1.31, "learning_rate": 0.00010407999556028676, "loss": 0.01, "step": 258890 }, { "epoch": 1.31, "learning_rate": 0.00010407242786727274, "loss": 0.0152, "step": 258900 }, { "epoch": 1.31, "learning_rate": 0.00010406486017425874, "loss": 0.0074, "step": 258910 }, { "epoch": 1.31, "learning_rate": 0.00010405729248124472, "loss": 0.0074, "step": 258920 }, { "epoch": 1.31, "learning_rate": 0.00010404972478823071, "loss": 0.0082, "step": 258930 }, { "epoch": 1.31, "learning_rate": 0.00010404215709521671, "loss": 0.0058, "step": 258940 }, { "epoch": 1.31, "learning_rate": 0.00010403458940220269, "loss": 0.007, "step": 258950 }, { "epoch": 1.31, "learning_rate": 0.00010402702170918869, "loss": 0.0074, "step": 258960 }, { "epoch": 1.31, "learning_rate": 0.00010401945401617468, "loss": 0.0096, "step": 258970 }, { "epoch": 1.31, "learning_rate": 0.00010401188632316066, "loss": 0.0112, "step": 258980 }, { "epoch": 1.31, "learning_rate": 0.00010400431863014666, "loss": 0.0079, "step": 258990 }, { "epoch": 1.31, "learning_rate": 0.00010399675093713264, "loss": 0.0105, "step": 259000 }, { "epoch": 1.31, "eval_cer": 0.914452788772905, "eval_loss": 0.006329988595098257, "eval_runtime": 116.6658, "eval_samples_per_second": 17.143, "eval_steps_per_second": 4.286, "step": 259000 }, { "epoch": 1.31, "learning_rate": 0.00010398918324411863, "loss": 0.0085, "step": 259010 }, { "epoch": 1.31, "learning_rate": 0.00010398161555110463, "loss": 0.0072, "step": 259020 }, { "epoch": 1.31, "learning_rate": 0.00010397404785809061, "loss": 0.0092, "step": 259030 }, { "epoch": 1.31, "learning_rate": 0.0001039664801650766, "loss": 0.0097, "step": 259040 }, { "epoch": 1.31, "learning_rate": 0.0001039589124720626, "loss": 0.0078, "step": 259050 }, { "epoch": 1.31, "learning_rate": 0.00010395134477904858, "loss": 0.0083, "step": 259060 }, { "epoch": 1.31, "learning_rate": 0.00010394377708603458, "loss": 0.0086, "step": 259070 }, { "epoch": 1.31, "learning_rate": 0.00010393620939302056, "loss": 0.009, "step": 259080 }, { "epoch": 1.31, "learning_rate": 0.00010392864170000655, "loss": 0.0076, "step": 259090 }, { "epoch": 1.31, "learning_rate": 0.00010392107400699255, "loss": 0.0084, "step": 259100 }, { "epoch": 1.31, "learning_rate": 0.00010391350631397853, "loss": 0.0069, "step": 259110 }, { "epoch": 1.31, "learning_rate": 0.00010390593862096452, "loss": 0.0081, "step": 259120 }, { "epoch": 1.31, "learning_rate": 0.00010389837092795052, "loss": 0.0088, "step": 259130 }, { "epoch": 1.31, "learning_rate": 0.0001038908032349365, "loss": 0.0083, "step": 259140 }, { "epoch": 1.31, "learning_rate": 0.0001038832355419225, "loss": 0.0065, "step": 259150 }, { "epoch": 1.31, "learning_rate": 0.00010387566784890849, "loss": 0.007, "step": 259160 }, { "epoch": 1.31, "learning_rate": 0.00010386810015589447, "loss": 0.0096, "step": 259170 }, { "epoch": 1.31, "learning_rate": 0.00010386053246288047, "loss": 0.0081, "step": 259180 }, { "epoch": 1.31, "learning_rate": 0.00010385296476986645, "loss": 0.0085, "step": 259190 }, { "epoch": 1.31, "learning_rate": 0.00010384539707685244, "loss": 0.0118, "step": 259200 }, { "epoch": 1.31, "learning_rate": 0.00010383782938383844, "loss": 0.0087, "step": 259210 }, { "epoch": 1.31, "learning_rate": 0.00010383026169082442, "loss": 0.0084, "step": 259220 }, { "epoch": 1.31, "learning_rate": 0.00010382269399781041, "loss": 0.0109, "step": 259230 }, { "epoch": 1.31, "learning_rate": 0.00010381512630479638, "loss": 0.0094, "step": 259240 }, { "epoch": 1.31, "learning_rate": 0.00010380755861178238, "loss": 0.007, "step": 259250 }, { "epoch": 1.31, "learning_rate": 0.00010379999091876837, "loss": 0.007, "step": 259260 }, { "epoch": 1.31, "learning_rate": 0.00010379242322575435, "loss": 0.0124, "step": 259270 }, { "epoch": 1.31, "learning_rate": 0.00010378485553274035, "loss": 0.0077, "step": 259280 }, { "epoch": 1.31, "learning_rate": 0.00010377728783972633, "loss": 0.0089, "step": 259290 }, { "epoch": 1.31, "learning_rate": 0.00010376972014671233, "loss": 0.0106, "step": 259300 }, { "epoch": 1.31, "learning_rate": 0.00010376215245369832, "loss": 0.0071, "step": 259310 }, { "epoch": 1.31, "learning_rate": 0.0001037545847606843, "loss": 0.0108, "step": 259320 }, { "epoch": 1.31, "learning_rate": 0.0001037470170676703, "loss": 0.0091, "step": 259330 }, { "epoch": 1.31, "learning_rate": 0.00010373944937465629, "loss": 0.0085, "step": 259340 }, { "epoch": 1.31, "learning_rate": 0.00010373188168164227, "loss": 0.0084, "step": 259350 }, { "epoch": 1.31, "learning_rate": 0.00010372431398862827, "loss": 0.0087, "step": 259360 }, { "epoch": 1.31, "learning_rate": 0.00010371674629561425, "loss": 0.0107, "step": 259370 }, { "epoch": 1.31, "learning_rate": 0.00010370917860260024, "loss": 0.0077, "step": 259380 }, { "epoch": 1.31, "learning_rate": 0.00010370161090958624, "loss": 0.0072, "step": 259390 }, { "epoch": 1.31, "learning_rate": 0.00010369404321657222, "loss": 0.009, "step": 259400 }, { "epoch": 1.31, "learning_rate": 0.00010368647552355822, "loss": 0.0103, "step": 259410 }, { "epoch": 1.31, "learning_rate": 0.00010367890783054421, "loss": 0.0078, "step": 259420 }, { "epoch": 1.31, "learning_rate": 0.00010367134013753019, "loss": 0.0077, "step": 259430 }, { "epoch": 1.31, "learning_rate": 0.00010366377244451619, "loss": 0.0069, "step": 259440 }, { "epoch": 1.31, "learning_rate": 0.00010365620475150217, "loss": 0.0096, "step": 259450 }, { "epoch": 1.31, "learning_rate": 0.00010364863705848816, "loss": 0.0117, "step": 259460 }, { "epoch": 1.31, "learning_rate": 0.00010364106936547416, "loss": 0.0069, "step": 259470 }, { "epoch": 1.31, "learning_rate": 0.00010363350167246014, "loss": 0.0068, "step": 259480 }, { "epoch": 1.31, "learning_rate": 0.00010362593397944614, "loss": 0.008, "step": 259490 }, { "epoch": 1.31, "learning_rate": 0.00010361836628643213, "loss": 0.0072, "step": 259500 }, { "epoch": 1.31, "learning_rate": 0.00010361079859341811, "loss": 0.0092, "step": 259510 }, { "epoch": 1.31, "learning_rate": 0.00010360323090040411, "loss": 0.0104, "step": 259520 }, { "epoch": 1.31, "learning_rate": 0.00010359566320739009, "loss": 0.0086, "step": 259530 }, { "epoch": 1.31, "learning_rate": 0.00010358809551437608, "loss": 0.0081, "step": 259540 }, { "epoch": 1.31, "learning_rate": 0.00010358052782136208, "loss": 0.0067, "step": 259550 }, { "epoch": 1.31, "learning_rate": 0.00010357296012834806, "loss": 0.0122, "step": 259560 }, { "epoch": 1.31, "learning_rate": 0.00010356539243533405, "loss": 0.0065, "step": 259570 }, { "epoch": 1.31, "learning_rate": 0.00010355782474232005, "loss": 0.0083, "step": 259580 }, { "epoch": 1.31, "learning_rate": 0.00010355025704930603, "loss": 0.012, "step": 259590 }, { "epoch": 1.31, "learning_rate": 0.00010354268935629203, "loss": 0.0089, "step": 259600 }, { "epoch": 1.31, "learning_rate": 0.00010353512166327802, "loss": 0.0074, "step": 259610 }, { "epoch": 1.31, "learning_rate": 0.000103527553970264, "loss": 0.0066, "step": 259620 }, { "epoch": 1.31, "learning_rate": 0.00010351998627725, "loss": 0.0082, "step": 259630 }, { "epoch": 1.31, "learning_rate": 0.00010351241858423598, "loss": 0.0114, "step": 259640 }, { "epoch": 1.31, "learning_rate": 0.00010350485089122197, "loss": 0.0073, "step": 259650 }, { "epoch": 1.31, "learning_rate": 0.00010349728319820797, "loss": 0.0078, "step": 259660 }, { "epoch": 1.31, "learning_rate": 0.00010348971550519395, "loss": 0.01, "step": 259670 }, { "epoch": 1.31, "learning_rate": 0.00010348214781217995, "loss": 0.0067, "step": 259680 }, { "epoch": 1.31, "learning_rate": 0.00010347458011916594, "loss": 0.0074, "step": 259690 }, { "epoch": 1.31, "learning_rate": 0.00010346701242615192, "loss": 0.0085, "step": 259700 }, { "epoch": 1.31, "learning_rate": 0.00010345944473313792, "loss": 0.0106, "step": 259710 }, { "epoch": 1.31, "learning_rate": 0.0001034518770401239, "loss": 0.0067, "step": 259720 }, { "epoch": 1.31, "learning_rate": 0.0001034443093471099, "loss": 0.0073, "step": 259730 }, { "epoch": 1.31, "learning_rate": 0.00010343674165409589, "loss": 0.0093, "step": 259740 }, { "epoch": 1.31, "learning_rate": 0.00010342917396108187, "loss": 0.0085, "step": 259750 }, { "epoch": 1.31, "learning_rate": 0.00010342160626806786, "loss": 0.0067, "step": 259760 }, { "epoch": 1.31, "learning_rate": 0.00010341403857505386, "loss": 0.0078, "step": 259770 }, { "epoch": 1.31, "learning_rate": 0.00010340647088203984, "loss": 0.0062, "step": 259780 }, { "epoch": 1.31, "learning_rate": 0.00010339890318902584, "loss": 0.0058, "step": 259790 }, { "epoch": 1.31, "learning_rate": 0.00010339133549601182, "loss": 0.0069, "step": 259800 }, { "epoch": 1.31, "learning_rate": 0.00010338376780299781, "loss": 0.0057, "step": 259810 }, { "epoch": 1.31, "learning_rate": 0.00010337620010998381, "loss": 0.0074, "step": 259820 }, { "epoch": 1.31, "learning_rate": 0.00010336863241696979, "loss": 0.0066, "step": 259830 }, { "epoch": 1.31, "learning_rate": 0.00010336106472395578, "loss": 0.0107, "step": 259840 }, { "epoch": 1.31, "learning_rate": 0.00010335349703094178, "loss": 0.0097, "step": 259850 }, { "epoch": 1.31, "learning_rate": 0.00010334592933792776, "loss": 0.0076, "step": 259860 }, { "epoch": 1.31, "learning_rate": 0.00010333836164491374, "loss": 0.0074, "step": 259870 }, { "epoch": 1.31, "learning_rate": 0.00010333079395189972, "loss": 0.008, "step": 259880 }, { "epoch": 1.31, "learning_rate": 0.00010332322625888572, "loss": 0.0097, "step": 259890 }, { "epoch": 1.31, "learning_rate": 0.0001033156585658717, "loss": 0.0079, "step": 259900 }, { "epoch": 1.31, "learning_rate": 0.0001033080908728577, "loss": 0.01, "step": 259910 }, { "epoch": 1.31, "learning_rate": 0.00010330052317984369, "loss": 0.0061, "step": 259920 }, { "epoch": 1.31, "learning_rate": 0.00010329295548682967, "loss": 0.0081, "step": 259930 }, { "epoch": 1.31, "learning_rate": 0.00010328538779381567, "loss": 0.0092, "step": 259940 }, { "epoch": 1.31, "learning_rate": 0.00010327782010080166, "loss": 0.0076, "step": 259950 }, { "epoch": 1.31, "learning_rate": 0.00010327025240778764, "loss": 0.0087, "step": 259960 }, { "epoch": 1.31, "learning_rate": 0.00010326268471477364, "loss": 0.0088, "step": 259970 }, { "epoch": 1.31, "learning_rate": 0.00010325511702175962, "loss": 0.008, "step": 259980 }, { "epoch": 1.31, "learning_rate": 0.00010324754932874561, "loss": 0.0084, "step": 259990 }, { "epoch": 1.31, "learning_rate": 0.00010323998163573161, "loss": 0.0089, "step": 260000 }, { "epoch": 1.31, "eval_cer": 0.9144333808503969, "eval_loss": 0.006425743922591209, "eval_runtime": 116.2948, "eval_samples_per_second": 17.198, "eval_steps_per_second": 4.299, "step": 260000 }, { "epoch": 1.31, "learning_rate": 0.00010323241394271759, "loss": 0.0065, "step": 260010 }, { "epoch": 1.31, "learning_rate": 0.00010322484624970359, "loss": 0.0073, "step": 260020 }, { "epoch": 1.31, "learning_rate": 0.00010321727855668958, "loss": 0.0094, "step": 260030 }, { "epoch": 1.31, "learning_rate": 0.00010320971086367556, "loss": 0.0076, "step": 260040 }, { "epoch": 1.31, "learning_rate": 0.00010320214317066156, "loss": 0.0106, "step": 260050 }, { "epoch": 1.31, "learning_rate": 0.00010319457547764755, "loss": 0.0063, "step": 260060 }, { "epoch": 1.31, "learning_rate": 0.00010318700778463353, "loss": 0.0092, "step": 260070 }, { "epoch": 1.31, "learning_rate": 0.00010317944009161953, "loss": 0.0087, "step": 260080 }, { "epoch": 1.31, "learning_rate": 0.00010317187239860551, "loss": 0.0069, "step": 260090 }, { "epoch": 1.31, "learning_rate": 0.0001031643047055915, "loss": 0.0072, "step": 260100 }, { "epoch": 1.31, "learning_rate": 0.0001031567370125775, "loss": 0.0109, "step": 260110 }, { "epoch": 1.31, "learning_rate": 0.00010314916931956348, "loss": 0.0062, "step": 260120 }, { "epoch": 1.31, "learning_rate": 0.00010314160162654948, "loss": 0.0117, "step": 260130 }, { "epoch": 1.31, "learning_rate": 0.00010313403393353547, "loss": 0.0076, "step": 260140 }, { "epoch": 1.31, "learning_rate": 0.00010312646624052145, "loss": 0.0078, "step": 260150 }, { "epoch": 1.31, "learning_rate": 0.00010311889854750745, "loss": 0.0064, "step": 260160 }, { "epoch": 1.31, "learning_rate": 0.00010311133085449343, "loss": 0.0069, "step": 260170 }, { "epoch": 1.31, "learning_rate": 0.00010310376316147942, "loss": 0.0074, "step": 260180 }, { "epoch": 1.31, "learning_rate": 0.00010309619546846542, "loss": 0.006, "step": 260190 }, { "epoch": 1.31, "learning_rate": 0.0001030886277754514, "loss": 0.0077, "step": 260200 }, { "epoch": 1.31, "learning_rate": 0.0001030810600824374, "loss": 0.0125, "step": 260210 }, { "epoch": 1.31, "learning_rate": 0.00010307349238942339, "loss": 0.0064, "step": 260220 }, { "epoch": 1.31, "learning_rate": 0.00010306592469640937, "loss": 0.0095, "step": 260230 }, { "epoch": 1.31, "learning_rate": 0.00010305835700339537, "loss": 0.0073, "step": 260240 }, { "epoch": 1.31, "learning_rate": 0.00010305078931038135, "loss": 0.009, "step": 260250 }, { "epoch": 1.31, "learning_rate": 0.00010304322161736734, "loss": 0.0082, "step": 260260 }, { "epoch": 1.31, "learning_rate": 0.00010303565392435334, "loss": 0.0101, "step": 260270 }, { "epoch": 1.31, "learning_rate": 0.00010302808623133932, "loss": 0.0089, "step": 260280 }, { "epoch": 1.31, "learning_rate": 0.00010302051853832531, "loss": 0.0112, "step": 260290 }, { "epoch": 1.31, "learning_rate": 0.00010301295084531131, "loss": 0.01, "step": 260300 }, { "epoch": 1.31, "learning_rate": 0.00010300538315229729, "loss": 0.0062, "step": 260310 }, { "epoch": 1.31, "learning_rate": 0.00010299781545928329, "loss": 0.0077, "step": 260320 }, { "epoch": 1.31, "learning_rate": 0.00010299024776626927, "loss": 0.0075, "step": 260330 }, { "epoch": 1.31, "learning_rate": 0.00010298268007325526, "loss": 0.0063, "step": 260340 }, { "epoch": 1.31, "learning_rate": 0.00010297511238024126, "loss": 0.0087, "step": 260350 }, { "epoch": 1.31, "learning_rate": 0.00010296754468722724, "loss": 0.0087, "step": 260360 }, { "epoch": 1.31, "learning_rate": 0.00010295997699421323, "loss": 0.0085, "step": 260370 }, { "epoch": 1.31, "learning_rate": 0.00010295240930119923, "loss": 0.0076, "step": 260380 }, { "epoch": 1.31, "learning_rate": 0.00010294484160818521, "loss": 0.0075, "step": 260390 }, { "epoch": 1.31, "learning_rate": 0.0001029372739151712, "loss": 0.0074, "step": 260400 }, { "epoch": 1.31, "learning_rate": 0.00010292970622215719, "loss": 0.0087, "step": 260410 }, { "epoch": 1.31, "learning_rate": 0.00010292213852914318, "loss": 0.0075, "step": 260420 }, { "epoch": 1.31, "learning_rate": 0.00010291457083612918, "loss": 0.0067, "step": 260430 }, { "epoch": 1.31, "learning_rate": 0.00010290700314311516, "loss": 0.0107, "step": 260440 }, { "epoch": 1.31, "learning_rate": 0.00010289943545010115, "loss": 0.0068, "step": 260450 }, { "epoch": 1.31, "learning_rate": 0.00010289186775708715, "loss": 0.0061, "step": 260460 }, { "epoch": 1.31, "learning_rate": 0.00010288430006407313, "loss": 0.0101, "step": 260470 }, { "epoch": 1.31, "learning_rate": 0.00010287673237105912, "loss": 0.0093, "step": 260480 }, { "epoch": 1.31, "learning_rate": 0.00010286916467804509, "loss": 0.0081, "step": 260490 }, { "epoch": 1.31, "learning_rate": 0.00010286159698503109, "loss": 0.011, "step": 260500 }, { "epoch": 1.31, "learning_rate": 0.00010285402929201708, "loss": 0.0083, "step": 260510 }, { "epoch": 1.31, "learning_rate": 0.00010284646159900306, "loss": 0.0073, "step": 260520 }, { "epoch": 1.31, "learning_rate": 0.00010283889390598906, "loss": 0.0084, "step": 260530 }, { "epoch": 1.31, "learning_rate": 0.00010283132621297504, "loss": 0.0086, "step": 260540 }, { "epoch": 1.31, "learning_rate": 0.00010282375851996104, "loss": 0.0084, "step": 260550 }, { "epoch": 1.31, "learning_rate": 0.00010281619082694703, "loss": 0.0097, "step": 260560 }, { "epoch": 1.31, "learning_rate": 0.00010280862313393301, "loss": 0.0073, "step": 260570 }, { "epoch": 1.31, "learning_rate": 0.00010280105544091901, "loss": 0.0073, "step": 260580 }, { "epoch": 1.31, "learning_rate": 0.000102793487747905, "loss": 0.0073, "step": 260590 }, { "epoch": 1.31, "learning_rate": 0.00010278592005489098, "loss": 0.0068, "step": 260600 }, { "epoch": 1.31, "learning_rate": 0.00010277835236187698, "loss": 0.0064, "step": 260610 }, { "epoch": 1.31, "learning_rate": 0.00010277078466886296, "loss": 0.0071, "step": 260620 }, { "epoch": 1.31, "learning_rate": 0.00010276321697584895, "loss": 0.0072, "step": 260630 }, { "epoch": 1.31, "learning_rate": 0.00010275564928283495, "loss": 0.0082, "step": 260640 }, { "epoch": 1.32, "learning_rate": 0.00010274808158982093, "loss": 0.0089, "step": 260650 }, { "epoch": 1.32, "learning_rate": 0.00010274051389680693, "loss": 0.0098, "step": 260660 }, { "epoch": 1.32, "learning_rate": 0.00010273294620379292, "loss": 0.0093, "step": 260670 }, { "epoch": 1.32, "learning_rate": 0.0001027253785107789, "loss": 0.0083, "step": 260680 }, { "epoch": 1.32, "learning_rate": 0.0001027178108177649, "loss": 0.0086, "step": 260690 }, { "epoch": 1.32, "learning_rate": 0.00010271024312475088, "loss": 0.0069, "step": 260700 }, { "epoch": 1.32, "learning_rate": 0.00010270267543173687, "loss": 0.0085, "step": 260710 }, { "epoch": 1.32, "learning_rate": 0.00010269510773872287, "loss": 0.0072, "step": 260720 }, { "epoch": 1.32, "learning_rate": 0.00010268754004570885, "loss": 0.008, "step": 260730 }, { "epoch": 1.32, "learning_rate": 0.00010267997235269485, "loss": 0.0065, "step": 260740 }, { "epoch": 1.32, "learning_rate": 0.00010267240465968084, "loss": 0.0075, "step": 260750 }, { "epoch": 1.32, "learning_rate": 0.00010266483696666682, "loss": 0.0094, "step": 260760 }, { "epoch": 1.32, "learning_rate": 0.00010265726927365282, "loss": 0.007, "step": 260770 }, { "epoch": 1.32, "learning_rate": 0.0001026497015806388, "loss": 0.0085, "step": 260780 }, { "epoch": 1.32, "learning_rate": 0.0001026421338876248, "loss": 0.0086, "step": 260790 }, { "epoch": 1.32, "learning_rate": 0.00010263456619461079, "loss": 0.0075, "step": 260800 }, { "epoch": 1.32, "learning_rate": 0.00010262699850159677, "loss": 0.0073, "step": 260810 }, { "epoch": 1.32, "learning_rate": 0.00010261943080858276, "loss": 0.0094, "step": 260820 }, { "epoch": 1.32, "learning_rate": 0.00010261186311556876, "loss": 0.0094, "step": 260830 }, { "epoch": 1.32, "learning_rate": 0.00010260429542255474, "loss": 0.0098, "step": 260840 }, { "epoch": 1.32, "learning_rate": 0.00010259672772954074, "loss": 0.0075, "step": 260850 }, { "epoch": 1.32, "learning_rate": 0.00010258916003652672, "loss": 0.0079, "step": 260860 }, { "epoch": 1.32, "learning_rate": 0.00010258159234351271, "loss": 0.0075, "step": 260870 }, { "epoch": 1.32, "learning_rate": 0.00010257402465049871, "loss": 0.0052, "step": 260880 }, { "epoch": 1.32, "learning_rate": 0.00010256645695748469, "loss": 0.007, "step": 260890 }, { "epoch": 1.32, "learning_rate": 0.00010255888926447068, "loss": 0.007, "step": 260900 }, { "epoch": 1.32, "learning_rate": 0.00010255132157145668, "loss": 0.0083, "step": 260910 }, { "epoch": 1.32, "learning_rate": 0.00010254375387844266, "loss": 0.0072, "step": 260920 }, { "epoch": 1.32, "learning_rate": 0.00010253618618542866, "loss": 0.0082, "step": 260930 }, { "epoch": 1.32, "learning_rate": 0.00010252861849241464, "loss": 0.0076, "step": 260940 }, { "epoch": 1.32, "learning_rate": 0.00010252105079940063, "loss": 0.0086, "step": 260950 }, { "epoch": 1.32, "learning_rate": 0.00010251348310638663, "loss": 0.0079, "step": 260960 }, { "epoch": 1.32, "learning_rate": 0.00010250591541337261, "loss": 0.0087, "step": 260970 }, { "epoch": 1.32, "learning_rate": 0.0001024983477203586, "loss": 0.0076, "step": 260980 }, { "epoch": 1.32, "learning_rate": 0.0001024907800273446, "loss": 0.0073, "step": 260990 }, { "epoch": 1.32, "learning_rate": 0.00010248321233433058, "loss": 0.008, "step": 261000 }, { "epoch": 1.32, "eval_cer": 0.9144343512465224, "eval_loss": 0.006257697008550167, "eval_runtime": 116.3265, "eval_samples_per_second": 17.193, "eval_steps_per_second": 4.298, "step": 261000 }, { "epoch": 1.32, "learning_rate": 0.00010247564464131657, "loss": 0.0073, "step": 261010 }, { "epoch": 1.32, "learning_rate": 0.00010246807694830256, "loss": 0.006, "step": 261020 }, { "epoch": 1.32, "learning_rate": 0.00010246050925528855, "loss": 0.0093, "step": 261030 }, { "epoch": 1.32, "learning_rate": 0.00010245294156227455, "loss": 0.0065, "step": 261040 }, { "epoch": 1.32, "learning_rate": 0.00010244537386926053, "loss": 0.007, "step": 261050 }, { "epoch": 1.32, "learning_rate": 0.00010243780617624652, "loss": 0.0078, "step": 261060 }, { "epoch": 1.32, "learning_rate": 0.00010243023848323252, "loss": 0.0096, "step": 261070 }, { "epoch": 1.32, "learning_rate": 0.0001024226707902185, "loss": 0.0081, "step": 261080 }, { "epoch": 1.32, "learning_rate": 0.0001024151030972045, "loss": 0.0085, "step": 261090 }, { "epoch": 1.32, "learning_rate": 0.00010240753540419049, "loss": 0.007, "step": 261100 }, { "epoch": 1.32, "learning_rate": 0.00010239996771117647, "loss": 0.0109, "step": 261110 }, { "epoch": 1.32, "learning_rate": 0.00010239240001816245, "loss": 0.008, "step": 261120 }, { "epoch": 1.32, "learning_rate": 0.00010238483232514843, "loss": 0.0087, "step": 261130 }, { "epoch": 1.32, "learning_rate": 0.00010237726463213443, "loss": 0.0107, "step": 261140 }, { "epoch": 1.32, "learning_rate": 0.00010236969693912041, "loss": 0.0088, "step": 261150 }, { "epoch": 1.32, "learning_rate": 0.0001023621292461064, "loss": 0.0075, "step": 261160 }, { "epoch": 1.32, "learning_rate": 0.0001023545615530924, "loss": 0.0109, "step": 261170 }, { "epoch": 1.32, "learning_rate": 0.00010234699386007838, "loss": 0.0081, "step": 261180 }, { "epoch": 1.32, "learning_rate": 0.00010233942616706438, "loss": 0.0108, "step": 261190 }, { "epoch": 1.32, "learning_rate": 0.00010233185847405037, "loss": 0.0106, "step": 261200 }, { "epoch": 1.32, "learning_rate": 0.00010232429078103635, "loss": 0.0068, "step": 261210 }, { "epoch": 1.32, "learning_rate": 0.00010231672308802235, "loss": 0.0084, "step": 261220 }, { "epoch": 1.32, "learning_rate": 0.00010230915539500833, "loss": 0.0085, "step": 261230 }, { "epoch": 1.32, "learning_rate": 0.00010230158770199432, "loss": 0.0077, "step": 261240 }, { "epoch": 1.32, "learning_rate": 0.00010229402000898032, "loss": 0.0085, "step": 261250 }, { "epoch": 1.32, "learning_rate": 0.0001022864523159663, "loss": 0.0076, "step": 261260 }, { "epoch": 1.32, "learning_rate": 0.0001022788846229523, "loss": 0.0069, "step": 261270 }, { "epoch": 1.32, "learning_rate": 0.00010227131692993829, "loss": 0.0076, "step": 261280 }, { "epoch": 1.32, "learning_rate": 0.00010226374923692427, "loss": 0.0106, "step": 261290 }, { "epoch": 1.32, "learning_rate": 0.00010225618154391027, "loss": 0.0093, "step": 261300 }, { "epoch": 1.32, "learning_rate": 0.00010224861385089625, "loss": 0.0078, "step": 261310 }, { "epoch": 1.32, "learning_rate": 0.00010224104615788224, "loss": 0.0058, "step": 261320 }, { "epoch": 1.32, "learning_rate": 0.00010223347846486824, "loss": 0.0078, "step": 261330 }, { "epoch": 1.32, "learning_rate": 0.00010222591077185422, "loss": 0.007, "step": 261340 }, { "epoch": 1.32, "learning_rate": 0.00010221834307884022, "loss": 0.0082, "step": 261350 }, { "epoch": 1.32, "learning_rate": 0.00010221077538582621, "loss": 0.0074, "step": 261360 }, { "epoch": 1.32, "learning_rate": 0.00010220320769281219, "loss": 0.0105, "step": 261370 }, { "epoch": 1.32, "learning_rate": 0.00010219563999979819, "loss": 0.0078, "step": 261380 }, { "epoch": 1.32, "learning_rate": 0.00010218807230678417, "loss": 0.0058, "step": 261390 }, { "epoch": 1.32, "learning_rate": 0.00010218050461377016, "loss": 0.0082, "step": 261400 }, { "epoch": 1.32, "learning_rate": 0.00010217293692075616, "loss": 0.0111, "step": 261410 }, { "epoch": 1.32, "learning_rate": 0.00010216536922774214, "loss": 0.0074, "step": 261420 }, { "epoch": 1.32, "learning_rate": 0.00010215780153472813, "loss": 0.0102, "step": 261430 }, { "epoch": 1.32, "learning_rate": 0.00010215023384171413, "loss": 0.0093, "step": 261440 }, { "epoch": 1.32, "learning_rate": 0.00010214266614870011, "loss": 0.0101, "step": 261450 }, { "epoch": 1.32, "learning_rate": 0.0001021350984556861, "loss": 0.0093, "step": 261460 }, { "epoch": 1.32, "learning_rate": 0.00010212753076267209, "loss": 0.0077, "step": 261470 }, { "epoch": 1.32, "learning_rate": 0.00010211996306965808, "loss": 0.0071, "step": 261480 }, { "epoch": 1.32, "learning_rate": 0.00010211239537664408, "loss": 0.0101, "step": 261490 }, { "epoch": 1.32, "learning_rate": 0.00010210482768363006, "loss": 0.0124, "step": 261500 }, { "epoch": 1.32, "learning_rate": 0.00010209725999061605, "loss": 0.0068, "step": 261510 }, { "epoch": 1.32, "learning_rate": 0.00010208969229760205, "loss": 0.0075, "step": 261520 }, { "epoch": 1.32, "learning_rate": 0.00010208212460458803, "loss": 0.0102, "step": 261530 }, { "epoch": 1.32, "learning_rate": 0.00010207455691157403, "loss": 0.0073, "step": 261540 }, { "epoch": 1.32, "learning_rate": 0.00010206698921856002, "loss": 0.0083, "step": 261550 }, { "epoch": 1.32, "learning_rate": 0.000102059421525546, "loss": 0.0071, "step": 261560 }, { "epoch": 1.32, "learning_rate": 0.000102051853832532, "loss": 0.0079, "step": 261570 }, { "epoch": 1.32, "learning_rate": 0.00010204428613951798, "loss": 0.0086, "step": 261580 }, { "epoch": 1.32, "learning_rate": 0.00010203671844650397, "loss": 0.0088, "step": 261590 }, { "epoch": 1.32, "learning_rate": 0.00010202915075348997, "loss": 0.0087, "step": 261600 }, { "epoch": 1.32, "learning_rate": 0.00010202158306047595, "loss": 0.0099, "step": 261610 }, { "epoch": 1.32, "learning_rate": 0.00010201401536746194, "loss": 0.0086, "step": 261620 }, { "epoch": 1.32, "learning_rate": 0.00010200644767444794, "loss": 0.0104, "step": 261630 }, { "epoch": 1.32, "learning_rate": 0.00010199887998143392, "loss": 0.0064, "step": 261640 }, { "epoch": 1.32, "learning_rate": 0.00010199131228841992, "loss": 0.0099, "step": 261650 }, { "epoch": 1.32, "learning_rate": 0.0001019837445954059, "loss": 0.0097, "step": 261660 }, { "epoch": 1.32, "learning_rate": 0.00010197617690239189, "loss": 0.0084, "step": 261670 }, { "epoch": 1.32, "learning_rate": 0.00010196860920937789, "loss": 0.0091, "step": 261680 }, { "epoch": 1.32, "learning_rate": 0.00010196104151636387, "loss": 0.0067, "step": 261690 }, { "epoch": 1.32, "learning_rate": 0.00010195347382334986, "loss": 0.0099, "step": 261700 }, { "epoch": 1.32, "learning_rate": 0.00010194590613033586, "loss": 0.0085, "step": 261710 }, { "epoch": 1.32, "learning_rate": 0.00010193833843732184, "loss": 0.008, "step": 261720 }, { "epoch": 1.32, "learning_rate": 0.00010193077074430784, "loss": 0.0105, "step": 261730 }, { "epoch": 1.32, "learning_rate": 0.00010192320305129382, "loss": 0.0121, "step": 261740 }, { "epoch": 1.32, "learning_rate": 0.0001019156353582798, "loss": 0.0082, "step": 261750 }, { "epoch": 1.32, "learning_rate": 0.00010190806766526578, "loss": 0.0068, "step": 261760 }, { "epoch": 1.32, "learning_rate": 0.00010190049997225177, "loss": 0.0068, "step": 261770 }, { "epoch": 1.32, "learning_rate": 0.00010189293227923777, "loss": 0.0095, "step": 261780 }, { "epoch": 1.32, "learning_rate": 0.00010188536458622375, "loss": 0.0082, "step": 261790 }, { "epoch": 1.32, "learning_rate": 0.00010187779689320975, "loss": 0.008, "step": 261800 }, { "epoch": 1.32, "learning_rate": 0.00010187022920019574, "loss": 0.008, "step": 261810 }, { "epoch": 1.32, "learning_rate": 0.00010186266150718172, "loss": 0.0063, "step": 261820 }, { "epoch": 1.32, "learning_rate": 0.00010185509381416772, "loss": 0.0083, "step": 261830 }, { "epoch": 1.32, "learning_rate": 0.0001018475261211537, "loss": 0.0105, "step": 261840 }, { "epoch": 1.32, "learning_rate": 0.0001018399584281397, "loss": 0.0063, "step": 261850 }, { "epoch": 1.32, "learning_rate": 0.00010183239073512569, "loss": 0.0074, "step": 261860 }, { "epoch": 1.32, "learning_rate": 0.00010182482304211167, "loss": 0.0089, "step": 261870 }, { "epoch": 1.32, "learning_rate": 0.00010181725534909767, "loss": 0.0067, "step": 261880 }, { "epoch": 1.32, "learning_rate": 0.00010180968765608366, "loss": 0.0063, "step": 261890 }, { "epoch": 1.32, "learning_rate": 0.00010180211996306964, "loss": 0.0063, "step": 261900 }, { "epoch": 1.32, "learning_rate": 0.00010179455227005564, "loss": 0.0086, "step": 261910 }, { "epoch": 1.32, "learning_rate": 0.00010178698457704162, "loss": 0.0092, "step": 261920 }, { "epoch": 1.32, "learning_rate": 0.00010177941688402761, "loss": 0.0069, "step": 261930 }, { "epoch": 1.32, "learning_rate": 0.00010177184919101361, "loss": 0.0105, "step": 261940 }, { "epoch": 1.32, "learning_rate": 0.00010176428149799959, "loss": 0.0083, "step": 261950 }, { "epoch": 1.32, "learning_rate": 0.00010175671380498558, "loss": 0.008, "step": 261960 }, { "epoch": 1.32, "learning_rate": 0.00010174914611197158, "loss": 0.0071, "step": 261970 }, { "epoch": 1.32, "learning_rate": 0.00010174157841895756, "loss": 0.0069, "step": 261980 }, { "epoch": 1.32, "learning_rate": 0.00010173401072594356, "loss": 0.0081, "step": 261990 }, { "epoch": 1.32, "learning_rate": 0.00010172644303292955, "loss": 0.0084, "step": 262000 }, { "epoch": 1.32, "eval_cer": 0.9144411440194001, "eval_loss": 0.006132941693067551, "eval_runtime": 116.3656, "eval_samples_per_second": 17.187, "eval_steps_per_second": 4.297, "step": 262000 }, { "epoch": 1.32, "learning_rate": 0.00010171887533991553, "loss": 0.0079, "step": 262010 }, { "epoch": 1.32, "learning_rate": 0.00010171130764690153, "loss": 0.0081, "step": 262020 }, { "epoch": 1.32, "learning_rate": 0.00010170373995388751, "loss": 0.0077, "step": 262030 }, { "epoch": 1.32, "learning_rate": 0.0001016961722608735, "loss": 0.0089, "step": 262040 }, { "epoch": 1.32, "learning_rate": 0.0001016886045678595, "loss": 0.0096, "step": 262050 }, { "epoch": 1.32, "learning_rate": 0.00010168103687484548, "loss": 0.0128, "step": 262060 }, { "epoch": 1.32, "learning_rate": 0.00010167346918183148, "loss": 0.0066, "step": 262070 }, { "epoch": 1.32, "learning_rate": 0.00010166590148881747, "loss": 0.0071, "step": 262080 }, { "epoch": 1.32, "learning_rate": 0.00010165833379580345, "loss": 0.01, "step": 262090 }, { "epoch": 1.32, "learning_rate": 0.00010165076610278945, "loss": 0.0071, "step": 262100 }, { "epoch": 1.32, "learning_rate": 0.00010164319840977543, "loss": 0.0079, "step": 262110 }, { "epoch": 1.32, "learning_rate": 0.00010163563071676142, "loss": 0.0097, "step": 262120 }, { "epoch": 1.32, "learning_rate": 0.00010162806302374742, "loss": 0.01, "step": 262130 }, { "epoch": 1.32, "learning_rate": 0.0001016204953307334, "loss": 0.0076, "step": 262140 }, { "epoch": 1.32, "learning_rate": 0.0001016129276377194, "loss": 0.0073, "step": 262150 }, { "epoch": 1.32, "learning_rate": 0.00010160535994470539, "loss": 0.009, "step": 262160 }, { "epoch": 1.32, "learning_rate": 0.00010159779225169137, "loss": 0.0074, "step": 262170 }, { "epoch": 1.32, "learning_rate": 0.00010159022455867737, "loss": 0.0076, "step": 262180 }, { "epoch": 1.32, "learning_rate": 0.00010158265686566335, "loss": 0.0091, "step": 262190 }, { "epoch": 1.32, "learning_rate": 0.00010157508917264934, "loss": 0.0066, "step": 262200 }, { "epoch": 1.32, "learning_rate": 0.00010156752147963534, "loss": 0.0078, "step": 262210 }, { "epoch": 1.32, "learning_rate": 0.00010155995378662132, "loss": 0.0066, "step": 262220 }, { "epoch": 1.32, "learning_rate": 0.00010155238609360731, "loss": 0.0121, "step": 262230 }, { "epoch": 1.32, "learning_rate": 0.00010154481840059331, "loss": 0.0083, "step": 262240 }, { "epoch": 1.32, "learning_rate": 0.00010153725070757929, "loss": 0.0082, "step": 262250 }, { "epoch": 1.32, "learning_rate": 0.00010152968301456529, "loss": 0.0083, "step": 262260 }, { "epoch": 1.32, "learning_rate": 0.00010152211532155127, "loss": 0.0092, "step": 262270 }, { "epoch": 1.32, "learning_rate": 0.00010151454762853726, "loss": 0.0067, "step": 262280 }, { "epoch": 1.32, "learning_rate": 0.00010150697993552326, "loss": 0.0079, "step": 262290 }, { "epoch": 1.32, "learning_rate": 0.00010149941224250924, "loss": 0.0078, "step": 262300 }, { "epoch": 1.32, "learning_rate": 0.00010149184454949523, "loss": 0.0076, "step": 262310 }, { "epoch": 1.32, "learning_rate": 0.00010148427685648123, "loss": 0.0077, "step": 262320 }, { "epoch": 1.32, "learning_rate": 0.00010147670916346721, "loss": 0.0078, "step": 262330 }, { "epoch": 1.32, "learning_rate": 0.0001014691414704532, "loss": 0.0097, "step": 262340 }, { "epoch": 1.32, "learning_rate": 0.00010146157377743919, "loss": 0.008, "step": 262350 }, { "epoch": 1.32, "learning_rate": 0.00010145400608442518, "loss": 0.0074, "step": 262360 }, { "epoch": 1.32, "learning_rate": 0.00010144643839141118, "loss": 0.0095, "step": 262370 }, { "epoch": 1.32, "learning_rate": 0.00010143887069839714, "loss": 0.0099, "step": 262380 }, { "epoch": 1.32, "learning_rate": 0.00010143130300538314, "loss": 0.0085, "step": 262390 }, { "epoch": 1.32, "learning_rate": 0.00010142373531236912, "loss": 0.0069, "step": 262400 }, { "epoch": 1.32, "learning_rate": 0.00010141616761935512, "loss": 0.0079, "step": 262410 }, { "epoch": 1.32, "learning_rate": 0.00010140859992634111, "loss": 0.0086, "step": 262420 }, { "epoch": 1.32, "learning_rate": 0.00010140103223332709, "loss": 0.0066, "step": 262430 }, { "epoch": 1.32, "learning_rate": 0.00010139346454031309, "loss": 0.007, "step": 262440 }, { "epoch": 1.32, "learning_rate": 0.00010138589684729908, "loss": 0.0093, "step": 262450 }, { "epoch": 1.32, "learning_rate": 0.00010137832915428506, "loss": 0.0085, "step": 262460 }, { "epoch": 1.32, "learning_rate": 0.00010137076146127106, "loss": 0.0086, "step": 262470 }, { "epoch": 1.32, "learning_rate": 0.00010136319376825704, "loss": 0.0096, "step": 262480 }, { "epoch": 1.32, "learning_rate": 0.00010135562607524303, "loss": 0.0076, "step": 262490 }, { "epoch": 1.32, "learning_rate": 0.00010134805838222903, "loss": 0.0096, "step": 262500 }, { "epoch": 1.32, "learning_rate": 0.00010134049068921501, "loss": 0.0069, "step": 262510 }, { "epoch": 1.32, "learning_rate": 0.000101332922996201, "loss": 0.0089, "step": 262520 }, { "epoch": 1.32, "learning_rate": 0.000101325355303187, "loss": 0.0072, "step": 262530 }, { "epoch": 1.32, "learning_rate": 0.00010131778761017298, "loss": 0.0078, "step": 262540 }, { "epoch": 1.32, "learning_rate": 0.00010131021991715898, "loss": 0.0075, "step": 262550 }, { "epoch": 1.32, "learning_rate": 0.00010130265222414496, "loss": 0.0106, "step": 262560 }, { "epoch": 1.32, "learning_rate": 0.00010129508453113095, "loss": 0.008, "step": 262570 }, { "epoch": 1.32, "learning_rate": 0.00010128751683811695, "loss": 0.0078, "step": 262580 }, { "epoch": 1.32, "learning_rate": 0.00010127994914510293, "loss": 0.0094, "step": 262590 }, { "epoch": 1.32, "learning_rate": 0.00010127238145208893, "loss": 0.0101, "step": 262600 }, { "epoch": 1.32, "learning_rate": 0.00010126481375907492, "loss": 0.0104, "step": 262610 }, { "epoch": 1.32, "learning_rate": 0.0001012572460660609, "loss": 0.0079, "step": 262620 }, { "epoch": 1.32, "learning_rate": 0.0001012496783730469, "loss": 0.0074, "step": 262630 }, { "epoch": 1.33, "learning_rate": 0.00010124211068003288, "loss": 0.0084, "step": 262640 }, { "epoch": 1.33, "learning_rate": 0.00010123454298701887, "loss": 0.0073, "step": 262650 }, { "epoch": 1.33, "learning_rate": 0.00010122697529400487, "loss": 0.0097, "step": 262660 }, { "epoch": 1.33, "learning_rate": 0.00010121940760099085, "loss": 0.0094, "step": 262670 }, { "epoch": 1.33, "learning_rate": 0.00010121183990797684, "loss": 0.0095, "step": 262680 }, { "epoch": 1.33, "learning_rate": 0.00010120427221496284, "loss": 0.0072, "step": 262690 }, { "epoch": 1.33, "learning_rate": 0.00010119670452194882, "loss": 0.01, "step": 262700 }, { "epoch": 1.33, "learning_rate": 0.00010118913682893482, "loss": 0.0063, "step": 262710 }, { "epoch": 1.33, "learning_rate": 0.0001011815691359208, "loss": 0.0075, "step": 262720 }, { "epoch": 1.33, "learning_rate": 0.00010117400144290679, "loss": 0.007, "step": 262730 }, { "epoch": 1.33, "learning_rate": 0.00010116643374989279, "loss": 0.0105, "step": 262740 }, { "epoch": 1.33, "learning_rate": 0.00010115886605687877, "loss": 0.0103, "step": 262750 }, { "epoch": 1.33, "learning_rate": 0.00010115129836386476, "loss": 0.0081, "step": 262760 }, { "epoch": 1.33, "learning_rate": 0.00010114373067085076, "loss": 0.0076, "step": 262770 }, { "epoch": 1.33, "learning_rate": 0.00010113616297783674, "loss": 0.0075, "step": 262780 }, { "epoch": 1.33, "learning_rate": 0.00010112859528482274, "loss": 0.0089, "step": 262790 }, { "epoch": 1.33, "learning_rate": 0.00010112102759180872, "loss": 0.0095, "step": 262800 }, { "epoch": 1.33, "learning_rate": 0.00010111345989879471, "loss": 0.008, "step": 262810 }, { "epoch": 1.33, "learning_rate": 0.00010110589220578071, "loss": 0.0057, "step": 262820 }, { "epoch": 1.33, "learning_rate": 0.00010109832451276669, "loss": 0.009, "step": 262830 }, { "epoch": 1.33, "learning_rate": 0.00010109075681975268, "loss": 0.0088, "step": 262840 }, { "epoch": 1.33, "learning_rate": 0.00010108318912673868, "loss": 0.0086, "step": 262850 }, { "epoch": 1.33, "learning_rate": 0.00010107562143372466, "loss": 0.0075, "step": 262860 }, { "epoch": 1.33, "learning_rate": 0.00010106805374071065, "loss": 0.0088, "step": 262870 }, { "epoch": 1.33, "learning_rate": 0.00010106048604769664, "loss": 0.0084, "step": 262880 }, { "epoch": 1.33, "learning_rate": 0.00010105291835468263, "loss": 0.0074, "step": 262890 }, { "epoch": 1.33, "learning_rate": 0.00010104535066166863, "loss": 0.0074, "step": 262900 }, { "epoch": 1.33, "learning_rate": 0.00010103778296865461, "loss": 0.0073, "step": 262910 }, { "epoch": 1.33, "learning_rate": 0.0001010302152756406, "loss": 0.0067, "step": 262920 }, { "epoch": 1.33, "learning_rate": 0.0001010226475826266, "loss": 0.0069, "step": 262930 }, { "epoch": 1.33, "learning_rate": 0.00010101507988961258, "loss": 0.0076, "step": 262940 }, { "epoch": 1.33, "learning_rate": 0.00010100751219659857, "loss": 0.0084, "step": 262950 }, { "epoch": 1.33, "learning_rate": 0.00010099994450358456, "loss": 0.0066, "step": 262960 }, { "epoch": 1.33, "learning_rate": 0.00010099237681057055, "loss": 0.0092, "step": 262970 }, { "epoch": 1.33, "learning_rate": 0.00010098480911755655, "loss": 0.0081, "step": 262980 }, { "epoch": 1.33, "learning_rate": 0.00010097724142454253, "loss": 0.0097, "step": 262990 }, { "epoch": 1.33, "learning_rate": 0.00010096967373152852, "loss": 0.0079, "step": 263000 }, { "epoch": 1.33, "eval_cer": 0.9144459960000272, "eval_loss": 0.005995141342282295, "eval_runtime": 116.2956, "eval_samples_per_second": 17.198, "eval_steps_per_second": 4.299, "step": 263000 }, { "epoch": 1.33, "learning_rate": 0.00010096210603851449, "loss": 0.0107, "step": 263010 }, { "epoch": 1.33, "learning_rate": 0.00010095453834550048, "loss": 0.0082, "step": 263020 }, { "epoch": 1.33, "learning_rate": 0.00010094697065248648, "loss": 0.0079, "step": 263030 }, { "epoch": 1.33, "learning_rate": 0.00010093940295947246, "loss": 0.0063, "step": 263040 }, { "epoch": 1.33, "learning_rate": 0.00010093183526645846, "loss": 0.0076, "step": 263050 }, { "epoch": 1.33, "learning_rate": 0.00010092426757344445, "loss": 0.0089, "step": 263060 }, { "epoch": 1.33, "learning_rate": 0.00010091669988043043, "loss": 0.007, "step": 263070 }, { "epoch": 1.33, "learning_rate": 0.00010090913218741643, "loss": 0.0068, "step": 263080 }, { "epoch": 1.33, "learning_rate": 0.00010090156449440241, "loss": 0.0105, "step": 263090 }, { "epoch": 1.33, "learning_rate": 0.0001008939968013884, "loss": 0.0061, "step": 263100 }, { "epoch": 1.33, "learning_rate": 0.0001008864291083744, "loss": 0.0082, "step": 263110 }, { "epoch": 1.33, "learning_rate": 0.00010087886141536038, "loss": 0.0059, "step": 263120 }, { "epoch": 1.33, "learning_rate": 0.00010087129372234638, "loss": 0.0111, "step": 263130 }, { "epoch": 1.33, "learning_rate": 0.00010086372602933237, "loss": 0.008, "step": 263140 }, { "epoch": 1.33, "learning_rate": 0.00010085615833631835, "loss": 0.0089, "step": 263150 }, { "epoch": 1.33, "learning_rate": 0.00010084859064330435, "loss": 0.0064, "step": 263160 }, { "epoch": 1.33, "learning_rate": 0.00010084102295029033, "loss": 0.0078, "step": 263170 }, { "epoch": 1.33, "learning_rate": 0.00010083345525727632, "loss": 0.0066, "step": 263180 }, { "epoch": 1.33, "learning_rate": 0.00010082588756426232, "loss": 0.0072, "step": 263190 }, { "epoch": 1.33, "learning_rate": 0.0001008183198712483, "loss": 0.0086, "step": 263200 }, { "epoch": 1.33, "learning_rate": 0.0001008107521782343, "loss": 0.0093, "step": 263210 }, { "epoch": 1.33, "learning_rate": 0.00010080318448522029, "loss": 0.0078, "step": 263220 }, { "epoch": 1.33, "learning_rate": 0.00010079561679220627, "loss": 0.0067, "step": 263230 }, { "epoch": 1.33, "learning_rate": 0.00010078804909919227, "loss": 0.0096, "step": 263240 }, { "epoch": 1.33, "learning_rate": 0.00010078048140617825, "loss": 0.0106, "step": 263250 }, { "epoch": 1.33, "learning_rate": 0.00010077291371316424, "loss": 0.008, "step": 263260 }, { "epoch": 1.33, "learning_rate": 0.00010076534602015024, "loss": 0.0092, "step": 263270 }, { "epoch": 1.33, "learning_rate": 0.00010075777832713622, "loss": 0.0079, "step": 263280 }, { "epoch": 1.33, "learning_rate": 0.00010075021063412221, "loss": 0.0121, "step": 263290 }, { "epoch": 1.33, "learning_rate": 0.00010074264294110821, "loss": 0.0085, "step": 263300 }, { "epoch": 1.33, "learning_rate": 0.00010073507524809419, "loss": 0.0082, "step": 263310 }, { "epoch": 1.33, "learning_rate": 0.00010072750755508019, "loss": 0.0094, "step": 263320 }, { "epoch": 1.33, "learning_rate": 0.00010071993986206617, "loss": 0.0073, "step": 263330 }, { "epoch": 1.33, "learning_rate": 0.00010071237216905216, "loss": 0.0075, "step": 263340 }, { "epoch": 1.33, "learning_rate": 0.00010070480447603816, "loss": 0.0092, "step": 263350 }, { "epoch": 1.33, "learning_rate": 0.00010069723678302414, "loss": 0.0085, "step": 263360 }, { "epoch": 1.33, "learning_rate": 0.00010068966909001013, "loss": 0.0088, "step": 263370 }, { "epoch": 1.33, "learning_rate": 0.00010068210139699613, "loss": 0.0075, "step": 263380 }, { "epoch": 1.33, "learning_rate": 0.00010067453370398211, "loss": 0.0077, "step": 263390 }, { "epoch": 1.33, "learning_rate": 0.0001006669660109681, "loss": 0.0087, "step": 263400 }, { "epoch": 1.33, "learning_rate": 0.00010065939831795409, "loss": 0.0103, "step": 263410 }, { "epoch": 1.33, "learning_rate": 0.00010065183062494008, "loss": 0.0081, "step": 263420 }, { "epoch": 1.33, "learning_rate": 0.00010064426293192608, "loss": 0.0106, "step": 263430 }, { "epoch": 1.33, "learning_rate": 0.00010063669523891206, "loss": 0.0127, "step": 263440 }, { "epoch": 1.33, "learning_rate": 0.00010062912754589805, "loss": 0.009, "step": 263450 }, { "epoch": 1.33, "learning_rate": 0.00010062155985288405, "loss": 0.0086, "step": 263460 }, { "epoch": 1.33, "learning_rate": 0.00010061399215987003, "loss": 0.009, "step": 263470 }, { "epoch": 1.33, "learning_rate": 0.00010060642446685602, "loss": 0.0115, "step": 263480 }, { "epoch": 1.33, "learning_rate": 0.00010059885677384202, "loss": 0.0085, "step": 263490 }, { "epoch": 1.33, "learning_rate": 0.000100591289080828, "loss": 0.0074, "step": 263500 }, { "epoch": 1.33, "learning_rate": 0.000100583721387814, "loss": 0.009, "step": 263510 }, { "epoch": 1.33, "learning_rate": 0.00010057615369479998, "loss": 0.0085, "step": 263520 }, { "epoch": 1.33, "learning_rate": 0.00010056858600178597, "loss": 0.0081, "step": 263530 }, { "epoch": 1.33, "learning_rate": 0.00010056101830877197, "loss": 0.011, "step": 263540 }, { "epoch": 1.33, "learning_rate": 0.00010055345061575795, "loss": 0.0088, "step": 263550 }, { "epoch": 1.33, "learning_rate": 0.00010054588292274394, "loss": 0.0076, "step": 263560 }, { "epoch": 1.33, "learning_rate": 0.00010053831522972994, "loss": 0.0069, "step": 263570 }, { "epoch": 1.33, "learning_rate": 0.00010053074753671592, "loss": 0.009, "step": 263580 }, { "epoch": 1.33, "learning_rate": 0.00010052317984370191, "loss": 0.0082, "step": 263590 }, { "epoch": 1.33, "learning_rate": 0.0001005156121506879, "loss": 0.007, "step": 263600 }, { "epoch": 1.33, "learning_rate": 0.00010050804445767389, "loss": 0.0092, "step": 263610 }, { "epoch": 1.33, "learning_rate": 0.00010050047676465989, "loss": 0.0074, "step": 263620 }, { "epoch": 1.33, "learning_rate": 0.00010049290907164587, "loss": 0.0065, "step": 263630 }, { "epoch": 1.33, "learning_rate": 0.00010048534137863185, "loss": 0.0078, "step": 263640 }, { "epoch": 1.33, "learning_rate": 0.00010047777368561783, "loss": 0.0085, "step": 263650 }, { "epoch": 1.33, "learning_rate": 0.00010047020599260383, "loss": 0.0087, "step": 263660 }, { "epoch": 1.33, "learning_rate": 0.00010046263829958982, "loss": 0.0087, "step": 263670 }, { "epoch": 1.33, "learning_rate": 0.0001004550706065758, "loss": 0.0082, "step": 263680 }, { "epoch": 1.33, "learning_rate": 0.0001004475029135618, "loss": 0.0078, "step": 263690 }, { "epoch": 1.33, "learning_rate": 0.00010043993522054778, "loss": 0.0103, "step": 263700 }, { "epoch": 1.33, "learning_rate": 0.00010043236752753377, "loss": 0.0103, "step": 263710 }, { "epoch": 1.33, "learning_rate": 0.00010042479983451977, "loss": 0.0072, "step": 263720 }, { "epoch": 1.33, "learning_rate": 0.00010041723214150575, "loss": 0.0084, "step": 263730 }, { "epoch": 1.33, "learning_rate": 0.00010040966444849174, "loss": 0.0122, "step": 263740 }, { "epoch": 1.33, "learning_rate": 0.00010040209675547774, "loss": 0.0067, "step": 263750 }, { "epoch": 1.33, "learning_rate": 0.00010039452906246372, "loss": 0.0081, "step": 263760 }, { "epoch": 1.33, "learning_rate": 0.00010038696136944972, "loss": 0.0093, "step": 263770 }, { "epoch": 1.33, "learning_rate": 0.0001003793936764357, "loss": 0.0117, "step": 263780 }, { "epoch": 1.33, "learning_rate": 0.00010037182598342169, "loss": 0.0089, "step": 263790 }, { "epoch": 1.33, "learning_rate": 0.00010036425829040769, "loss": 0.0079, "step": 263800 }, { "epoch": 1.33, "learning_rate": 0.00010035669059739367, "loss": 0.0093, "step": 263810 }, { "epoch": 1.33, "learning_rate": 0.00010034912290437966, "loss": 0.0076, "step": 263820 }, { "epoch": 1.33, "learning_rate": 0.00010034155521136566, "loss": 0.0092, "step": 263830 }, { "epoch": 1.33, "learning_rate": 0.00010033398751835164, "loss": 0.0089, "step": 263840 }, { "epoch": 1.33, "learning_rate": 0.00010032641982533764, "loss": 0.0073, "step": 263850 }, { "epoch": 1.33, "learning_rate": 0.00010031885213232362, "loss": 0.0075, "step": 263860 }, { "epoch": 1.33, "learning_rate": 0.00010031128443930961, "loss": 0.0099, "step": 263870 }, { "epoch": 1.33, "learning_rate": 0.00010030371674629561, "loss": 0.0102, "step": 263880 }, { "epoch": 1.33, "learning_rate": 0.00010029614905328159, "loss": 0.0074, "step": 263890 }, { "epoch": 1.33, "learning_rate": 0.00010028858136026758, "loss": 0.0074, "step": 263900 }, { "epoch": 1.33, "learning_rate": 0.00010028101366725358, "loss": 0.0062, "step": 263910 }, { "epoch": 1.33, "learning_rate": 0.00010027344597423956, "loss": 0.0081, "step": 263920 }, { "epoch": 1.33, "learning_rate": 0.00010026587828122556, "loss": 0.009, "step": 263930 }, { "epoch": 1.33, "learning_rate": 0.00010025831058821155, "loss": 0.0059, "step": 263940 }, { "epoch": 1.33, "learning_rate": 0.00010025074289519753, "loss": 0.01, "step": 263950 }, { "epoch": 1.33, "learning_rate": 0.00010024317520218353, "loss": 0.0073, "step": 263960 }, { "epoch": 1.33, "learning_rate": 0.00010023560750916951, "loss": 0.0072, "step": 263970 }, { "epoch": 1.33, "learning_rate": 0.0001002280398161555, "loss": 0.0095, "step": 263980 }, { "epoch": 1.33, "learning_rate": 0.0001002204721231415, "loss": 0.0097, "step": 263990 }, { "epoch": 1.33, "learning_rate": 0.00010021290443012748, "loss": 0.0096, "step": 264000 }, { "epoch": 1.33, "eval_cer": 0.9144285288697699, "eval_loss": 0.006162929814308882, "eval_runtime": 116.2184, "eval_samples_per_second": 17.209, "eval_steps_per_second": 4.302, "step": 264000 }, { "epoch": 1.33, "learning_rate": 0.00010020533673711347, "loss": 0.0106, "step": 264010 }, { "epoch": 1.33, "learning_rate": 0.00010019776904409947, "loss": 0.0084, "step": 264020 }, { "epoch": 1.33, "learning_rate": 0.00010019020135108545, "loss": 0.0065, "step": 264030 }, { "epoch": 1.33, "learning_rate": 0.00010018263365807145, "loss": 0.0059, "step": 264040 }, { "epoch": 1.33, "learning_rate": 0.00010017506596505743, "loss": 0.0088, "step": 264050 }, { "epoch": 1.33, "learning_rate": 0.00010016749827204342, "loss": 0.0093, "step": 264060 }, { "epoch": 1.33, "learning_rate": 0.00010015993057902942, "loss": 0.0067, "step": 264070 }, { "epoch": 1.33, "learning_rate": 0.0001001523628860154, "loss": 0.0083, "step": 264080 }, { "epoch": 1.33, "learning_rate": 0.0001001447951930014, "loss": 0.0107, "step": 264090 }, { "epoch": 1.33, "learning_rate": 0.00010013722749998739, "loss": 0.0081, "step": 264100 }, { "epoch": 1.33, "learning_rate": 0.00010012965980697337, "loss": 0.0105, "step": 264110 }, { "epoch": 1.33, "learning_rate": 0.00010012209211395937, "loss": 0.0081, "step": 264120 }, { "epoch": 1.33, "learning_rate": 0.00010011452442094535, "loss": 0.0091, "step": 264130 }, { "epoch": 1.33, "learning_rate": 0.00010010695672793134, "loss": 0.0072, "step": 264140 }, { "epoch": 1.33, "learning_rate": 0.00010009938903491734, "loss": 0.0092, "step": 264150 }, { "epoch": 1.33, "learning_rate": 0.00010009182134190332, "loss": 0.0082, "step": 264160 }, { "epoch": 1.33, "learning_rate": 0.00010008425364888931, "loss": 0.0091, "step": 264170 }, { "epoch": 1.33, "learning_rate": 0.00010007668595587531, "loss": 0.0088, "step": 264180 }, { "epoch": 1.33, "learning_rate": 0.00010006911826286129, "loss": 0.0094, "step": 264190 }, { "epoch": 1.33, "learning_rate": 0.00010006155056984728, "loss": 0.0067, "step": 264200 }, { "epoch": 1.33, "learning_rate": 0.00010005398287683327, "loss": 0.0077, "step": 264210 }, { "epoch": 1.33, "learning_rate": 0.00010004641518381926, "loss": 0.0087, "step": 264220 }, { "epoch": 1.33, "learning_rate": 0.00010003884749080526, "loss": 0.009, "step": 264230 }, { "epoch": 1.33, "learning_rate": 0.00010003127979779124, "loss": 0.011, "step": 264240 }, { "epoch": 1.33, "learning_rate": 0.00010002371210477723, "loss": 0.008, "step": 264250 }, { "epoch": 1.33, "learning_rate": 0.00010001614441176323, "loss": 0.0059, "step": 264260 }, { "epoch": 1.33, "learning_rate": 0.0001000085767187492, "loss": 0.0082, "step": 264270 }, { "epoch": 1.33, "learning_rate": 0.00010000100902573519, "loss": 0.0078, "step": 264280 }, { "epoch": 1.33, "learning_rate": 9.999344133272117e-05, "loss": 0.0097, "step": 264290 }, { "epoch": 1.33, "learning_rate": 9.998587363970717e-05, "loss": 0.0074, "step": 264300 }, { "epoch": 1.33, "learning_rate": 9.997830594669315e-05, "loss": 0.0096, "step": 264310 }, { "epoch": 1.33, "learning_rate": 9.997073825367914e-05, "loss": 0.0086, "step": 264320 }, { "epoch": 1.33, "learning_rate": 9.996317056066514e-05, "loss": 0.0069, "step": 264330 }, { "epoch": 1.33, "learning_rate": 9.995560286765112e-05, "loss": 0.0069, "step": 264340 }, { "epoch": 1.33, "learning_rate": 9.994803517463711e-05, "loss": 0.0063, "step": 264350 }, { "epoch": 1.33, "learning_rate": 9.994046748162311e-05, "loss": 0.0081, "step": 264360 }, { "epoch": 1.33, "learning_rate": 9.993289978860909e-05, "loss": 0.0105, "step": 264370 }, { "epoch": 1.33, "learning_rate": 9.992533209559509e-05, "loss": 0.0073, "step": 264380 }, { "epoch": 1.33, "learning_rate": 9.991776440258108e-05, "loss": 0.0131, "step": 264390 }, { "epoch": 1.33, "learning_rate": 9.991019670956706e-05, "loss": 0.0094, "step": 264400 }, { "epoch": 1.33, "learning_rate": 9.990262901655306e-05, "loss": 0.0091, "step": 264410 }, { "epoch": 1.33, "learning_rate": 9.989506132353904e-05, "loss": 0.0088, "step": 264420 }, { "epoch": 1.33, "learning_rate": 9.988749363052503e-05, "loss": 0.0077, "step": 264430 }, { "epoch": 1.33, "learning_rate": 9.987992593751103e-05, "loss": 0.0069, "step": 264440 }, { "epoch": 1.33, "learning_rate": 9.987235824449701e-05, "loss": 0.0083, "step": 264450 }, { "epoch": 1.33, "learning_rate": 9.9864790551483e-05, "loss": 0.0086, "step": 264460 }, { "epoch": 1.33, "learning_rate": 9.9857222858469e-05, "loss": 0.008, "step": 264470 }, { "epoch": 1.33, "learning_rate": 9.984965516545498e-05, "loss": 0.0065, "step": 264480 }, { "epoch": 1.33, "learning_rate": 9.984208747244098e-05, "loss": 0.008, "step": 264490 }, { "epoch": 1.33, "learning_rate": 9.983451977942696e-05, "loss": 0.0077, "step": 264500 }, { "epoch": 1.33, "learning_rate": 9.982695208641295e-05, "loss": 0.0082, "step": 264510 }, { "epoch": 1.33, "learning_rate": 9.981938439339895e-05, "loss": 0.0118, "step": 264520 }, { "epoch": 1.33, "learning_rate": 9.981181670038493e-05, "loss": 0.0074, "step": 264530 }, { "epoch": 1.33, "learning_rate": 9.980424900737092e-05, "loss": 0.0071, "step": 264540 }, { "epoch": 1.33, "learning_rate": 9.979668131435692e-05, "loss": 0.0089, "step": 264550 }, { "epoch": 1.33, "learning_rate": 9.97891136213429e-05, "loss": 0.0074, "step": 264560 }, { "epoch": 1.33, "learning_rate": 9.97815459283289e-05, "loss": 0.0085, "step": 264570 }, { "epoch": 1.33, "learning_rate": 9.977397823531488e-05, "loss": 0.0082, "step": 264580 }, { "epoch": 1.33, "learning_rate": 9.976641054230087e-05, "loss": 0.0061, "step": 264590 }, { "epoch": 1.33, "learning_rate": 9.975884284928687e-05, "loss": 0.0083, "step": 264600 }, { "epoch": 1.33, "learning_rate": 9.975127515627285e-05, "loss": 0.0083, "step": 264610 }, { "epoch": 1.34, "learning_rate": 9.974370746325884e-05, "loss": 0.0076, "step": 264620 }, { "epoch": 1.34, "learning_rate": 9.973613977024484e-05, "loss": 0.0074, "step": 264630 }, { "epoch": 1.34, "learning_rate": 9.972857207723082e-05, "loss": 0.0087, "step": 264640 }, { "epoch": 1.34, "learning_rate": 9.972100438421682e-05, "loss": 0.0094, "step": 264650 }, { "epoch": 1.34, "learning_rate": 9.97134366912028e-05, "loss": 0.0108, "step": 264660 }, { "epoch": 1.34, "learning_rate": 9.970586899818879e-05, "loss": 0.007, "step": 264670 }, { "epoch": 1.34, "learning_rate": 9.969830130517479e-05, "loss": 0.0077, "step": 264680 }, { "epoch": 1.34, "learning_rate": 9.969073361216077e-05, "loss": 0.0071, "step": 264690 }, { "epoch": 1.34, "learning_rate": 9.968316591914676e-05, "loss": 0.0087, "step": 264700 }, { "epoch": 1.34, "learning_rate": 9.967559822613276e-05, "loss": 0.0091, "step": 264710 }, { "epoch": 1.34, "learning_rate": 9.966803053311874e-05, "loss": 0.0084, "step": 264720 }, { "epoch": 1.34, "learning_rate": 9.966046284010473e-05, "loss": 0.0077, "step": 264730 }, { "epoch": 1.34, "learning_rate": 9.965289514709072e-05, "loss": 0.0085, "step": 264740 }, { "epoch": 1.34, "learning_rate": 9.964532745407671e-05, "loss": 0.0071, "step": 264750 }, { "epoch": 1.34, "learning_rate": 9.96377597610627e-05, "loss": 0.0077, "step": 264760 }, { "epoch": 1.34, "learning_rate": 9.963019206804869e-05, "loss": 0.0073, "step": 264770 }, { "epoch": 1.34, "learning_rate": 9.962262437503468e-05, "loss": 0.0074, "step": 264780 }, { "epoch": 1.34, "learning_rate": 9.961505668202068e-05, "loss": 0.0085, "step": 264790 }, { "epoch": 1.34, "learning_rate": 9.960748898900666e-05, "loss": 0.0112, "step": 264800 }, { "epoch": 1.34, "learning_rate": 9.959992129599265e-05, "loss": 0.0086, "step": 264810 }, { "epoch": 1.34, "learning_rate": 9.959235360297864e-05, "loss": 0.007, "step": 264820 }, { "epoch": 1.34, "learning_rate": 9.958478590996463e-05, "loss": 0.0079, "step": 264830 }, { "epoch": 1.34, "learning_rate": 9.957721821695063e-05, "loss": 0.0064, "step": 264840 }, { "epoch": 1.34, "learning_rate": 9.95696505239366e-05, "loss": 0.0075, "step": 264850 }, { "epoch": 1.34, "learning_rate": 9.95620828309226e-05, "loss": 0.0078, "step": 264860 }, { "epoch": 1.34, "learning_rate": 9.95545151379086e-05, "loss": 0.0091, "step": 264870 }, { "epoch": 1.34, "learning_rate": 9.954694744489458e-05, "loss": 0.0095, "step": 264880 }, { "epoch": 1.34, "learning_rate": 9.953937975188056e-05, "loss": 0.0084, "step": 264890 }, { "epoch": 1.34, "learning_rate": 9.953181205886654e-05, "loss": 0.0089, "step": 264900 }, { "epoch": 1.34, "learning_rate": 9.952424436585254e-05, "loss": 0.0081, "step": 264910 }, { "epoch": 1.34, "learning_rate": 9.951667667283853e-05, "loss": 0.0067, "step": 264920 }, { "epoch": 1.34, "learning_rate": 9.950910897982451e-05, "loss": 0.0083, "step": 264930 }, { "epoch": 1.34, "learning_rate": 9.950154128681051e-05, "loss": 0.0112, "step": 264940 }, { "epoch": 1.34, "learning_rate": 9.949397359379649e-05, "loss": 0.0071, "step": 264950 }, { "epoch": 1.34, "learning_rate": 9.948640590078248e-05, "loss": 0.0082, "step": 264960 }, { "epoch": 1.34, "learning_rate": 9.947883820776848e-05, "loss": 0.0069, "step": 264970 }, { "epoch": 1.34, "learning_rate": 9.947127051475446e-05, "loss": 0.0074, "step": 264980 }, { "epoch": 1.34, "learning_rate": 9.946370282174046e-05, "loss": 0.0087, "step": 264990 }, { "epoch": 1.34, "learning_rate": 9.945613512872645e-05, "loss": 0.0052, "step": 265000 }, { "epoch": 1.34, "eval_cer": 0.9144372624348985, "eval_loss": 0.006056656129658222, "eval_runtime": 116.3287, "eval_samples_per_second": 17.193, "eval_steps_per_second": 4.298, "step": 265000 }, { "epoch": 1.34, "learning_rate": 9.944856743571243e-05, "loss": 0.0073, "step": 265010 }, { "epoch": 1.34, "learning_rate": 9.944099974269843e-05, "loss": 0.0094, "step": 265020 }, { "epoch": 1.34, "learning_rate": 9.943343204968441e-05, "loss": 0.0105, "step": 265030 }, { "epoch": 1.34, "learning_rate": 9.94258643566704e-05, "loss": 0.007, "step": 265040 }, { "epoch": 1.34, "learning_rate": 9.94182966636564e-05, "loss": 0.0087, "step": 265050 }, { "epoch": 1.34, "learning_rate": 9.941072897064238e-05, "loss": 0.0078, "step": 265060 }, { "epoch": 1.34, "learning_rate": 9.940316127762837e-05, "loss": 0.007, "step": 265070 }, { "epoch": 1.34, "learning_rate": 9.939559358461437e-05, "loss": 0.0071, "step": 265080 }, { "epoch": 1.34, "learning_rate": 9.938802589160035e-05, "loss": 0.0092, "step": 265090 }, { "epoch": 1.34, "learning_rate": 9.938045819858635e-05, "loss": 0.0069, "step": 265100 }, { "epoch": 1.34, "learning_rate": 9.937289050557233e-05, "loss": 0.0077, "step": 265110 }, { "epoch": 1.34, "learning_rate": 9.936532281255832e-05, "loss": 0.0051, "step": 265120 }, { "epoch": 1.34, "learning_rate": 9.935775511954432e-05, "loss": 0.0083, "step": 265130 }, { "epoch": 1.34, "learning_rate": 9.93501874265303e-05, "loss": 0.0099, "step": 265140 }, { "epoch": 1.34, "learning_rate": 9.93426197335163e-05, "loss": 0.007, "step": 265150 }, { "epoch": 1.34, "learning_rate": 9.933505204050229e-05, "loss": 0.0064, "step": 265160 }, { "epoch": 1.34, "learning_rate": 9.932748434748827e-05, "loss": 0.0075, "step": 265170 }, { "epoch": 1.34, "learning_rate": 9.931991665447427e-05, "loss": 0.0079, "step": 265180 }, { "epoch": 1.34, "learning_rate": 9.931234896146025e-05, "loss": 0.0083, "step": 265190 }, { "epoch": 1.34, "learning_rate": 9.930478126844624e-05, "loss": 0.0106, "step": 265200 }, { "epoch": 1.34, "learning_rate": 9.929721357543224e-05, "loss": 0.0072, "step": 265210 }, { "epoch": 1.34, "learning_rate": 9.928964588241822e-05, "loss": 0.0075, "step": 265220 }, { "epoch": 1.34, "learning_rate": 9.928207818940421e-05, "loss": 0.0092, "step": 265230 }, { "epoch": 1.34, "learning_rate": 9.927451049639021e-05, "loss": 0.0089, "step": 265240 }, { "epoch": 1.34, "learning_rate": 9.926694280337619e-05, "loss": 0.0072, "step": 265250 }, { "epoch": 1.34, "learning_rate": 9.925937511036218e-05, "loss": 0.0057, "step": 265260 }, { "epoch": 1.34, "learning_rate": 9.925180741734817e-05, "loss": 0.0066, "step": 265270 }, { "epoch": 1.34, "learning_rate": 9.924423972433416e-05, "loss": 0.0104, "step": 265280 }, { "epoch": 1.34, "learning_rate": 9.923667203132016e-05, "loss": 0.0071, "step": 265290 }, { "epoch": 1.34, "learning_rate": 9.922910433830614e-05, "loss": 0.0096, "step": 265300 }, { "epoch": 1.34, "learning_rate": 9.922153664529213e-05, "loss": 0.0097, "step": 265310 }, { "epoch": 1.34, "learning_rate": 9.921396895227813e-05, "loss": 0.0077, "step": 265320 }, { "epoch": 1.34, "learning_rate": 9.920640125926411e-05, "loss": 0.0084, "step": 265330 }, { "epoch": 1.34, "learning_rate": 9.91988335662501e-05, "loss": 0.0076, "step": 265340 }, { "epoch": 1.34, "learning_rate": 9.919126587323609e-05, "loss": 0.0081, "step": 265350 }, { "epoch": 1.34, "learning_rate": 9.918369818022208e-05, "loss": 0.0087, "step": 265360 }, { "epoch": 1.34, "learning_rate": 9.917613048720808e-05, "loss": 0.0095, "step": 265370 }, { "epoch": 1.34, "learning_rate": 9.916856279419406e-05, "loss": 0.007, "step": 265380 }, { "epoch": 1.34, "learning_rate": 9.916099510118005e-05, "loss": 0.0076, "step": 265390 }, { "epoch": 1.34, "learning_rate": 9.915342740816605e-05, "loss": 0.0075, "step": 265400 }, { "epoch": 1.34, "learning_rate": 9.914585971515203e-05, "loss": 0.0089, "step": 265410 }, { "epoch": 1.34, "learning_rate": 9.913829202213802e-05, "loss": 0.0094, "step": 265420 }, { "epoch": 1.34, "learning_rate": 9.913072432912402e-05, "loss": 0.0081, "step": 265430 }, { "epoch": 1.34, "learning_rate": 9.912315663611e-05, "loss": 0.0077, "step": 265440 }, { "epoch": 1.34, "learning_rate": 9.9115588943096e-05, "loss": 0.0087, "step": 265450 }, { "epoch": 1.34, "learning_rate": 9.910802125008198e-05, "loss": 0.0096, "step": 265460 }, { "epoch": 1.34, "learning_rate": 9.910045355706797e-05, "loss": 0.0096, "step": 265470 }, { "epoch": 1.34, "learning_rate": 9.909288586405397e-05, "loss": 0.0078, "step": 265480 }, { "epoch": 1.34, "learning_rate": 9.908531817103995e-05, "loss": 0.0092, "step": 265490 }, { "epoch": 1.34, "learning_rate": 9.907775047802594e-05, "loss": 0.0088, "step": 265500 }, { "epoch": 1.34, "learning_rate": 9.907018278501194e-05, "loss": 0.0063, "step": 265510 }, { "epoch": 1.34, "learning_rate": 9.90626150919979e-05, "loss": 0.0074, "step": 265520 }, { "epoch": 1.34, "learning_rate": 9.90550473989839e-05, "loss": 0.0072, "step": 265530 }, { "epoch": 1.34, "learning_rate": 9.904747970596988e-05, "loss": 0.0077, "step": 265540 }, { "epoch": 1.34, "learning_rate": 9.903991201295588e-05, "loss": 0.0075, "step": 265550 }, { "epoch": 1.34, "learning_rate": 9.903234431994186e-05, "loss": 0.0068, "step": 265560 }, { "epoch": 1.34, "learning_rate": 9.902477662692785e-05, "loss": 0.0077, "step": 265570 }, { "epoch": 1.34, "learning_rate": 9.901720893391385e-05, "loss": 0.0083, "step": 265580 }, { "epoch": 1.34, "learning_rate": 9.900964124089983e-05, "loss": 0.0065, "step": 265590 }, { "epoch": 1.34, "learning_rate": 9.900207354788582e-05, "loss": 0.0084, "step": 265600 }, { "epoch": 1.34, "learning_rate": 9.899450585487182e-05, "loss": 0.0069, "step": 265610 }, { "epoch": 1.34, "learning_rate": 9.89869381618578e-05, "loss": 0.0091, "step": 265620 }, { "epoch": 1.34, "learning_rate": 9.89793704688438e-05, "loss": 0.0109, "step": 265630 }, { "epoch": 1.34, "learning_rate": 9.897180277582978e-05, "loss": 0.007, "step": 265640 }, { "epoch": 1.34, "learning_rate": 9.896423508281577e-05, "loss": 0.0075, "step": 265650 }, { "epoch": 1.34, "learning_rate": 9.895666738980177e-05, "loss": 0.008, "step": 265660 }, { "epoch": 1.34, "learning_rate": 9.894909969678775e-05, "loss": 0.0115, "step": 265670 }, { "epoch": 1.34, "learning_rate": 9.894153200377374e-05, "loss": 0.0075, "step": 265680 }, { "epoch": 1.34, "learning_rate": 9.893396431075974e-05, "loss": 0.0077, "step": 265690 }, { "epoch": 1.34, "learning_rate": 9.892639661774572e-05, "loss": 0.0103, "step": 265700 }, { "epoch": 1.34, "learning_rate": 9.891882892473172e-05, "loss": 0.0092, "step": 265710 }, { "epoch": 1.34, "learning_rate": 9.89112612317177e-05, "loss": 0.0081, "step": 265720 }, { "epoch": 1.34, "learning_rate": 9.890369353870369e-05, "loss": 0.0108, "step": 265730 }, { "epoch": 1.34, "learning_rate": 9.889612584568969e-05, "loss": 0.0098, "step": 265740 }, { "epoch": 1.34, "learning_rate": 9.888855815267567e-05, "loss": 0.0092, "step": 265750 }, { "epoch": 1.34, "learning_rate": 9.888099045966166e-05, "loss": 0.0099, "step": 265760 }, { "epoch": 1.34, "learning_rate": 9.887342276664766e-05, "loss": 0.0094, "step": 265770 }, { "epoch": 1.34, "learning_rate": 9.886585507363364e-05, "loss": 0.0071, "step": 265780 }, { "epoch": 1.34, "learning_rate": 9.885828738061963e-05, "loss": 0.0105, "step": 265790 }, { "epoch": 1.34, "learning_rate": 9.885071968760562e-05, "loss": 0.0069, "step": 265800 }, { "epoch": 1.34, "learning_rate": 9.884315199459161e-05, "loss": 0.01, "step": 265810 }, { "epoch": 1.34, "learning_rate": 9.88355843015776e-05, "loss": 0.0071, "step": 265820 }, { "epoch": 1.34, "learning_rate": 9.882801660856359e-05, "loss": 0.0072, "step": 265830 }, { "epoch": 1.34, "learning_rate": 9.882044891554958e-05, "loss": 0.0092, "step": 265840 }, { "epoch": 1.34, "learning_rate": 9.881288122253558e-05, "loss": 0.0076, "step": 265850 }, { "epoch": 1.34, "learning_rate": 9.880531352952156e-05, "loss": 0.0083, "step": 265860 }, { "epoch": 1.34, "learning_rate": 9.879774583650755e-05, "loss": 0.0085, "step": 265870 }, { "epoch": 1.34, "learning_rate": 9.879017814349355e-05, "loss": 0.0094, "step": 265880 }, { "epoch": 1.34, "learning_rate": 9.878261045047953e-05, "loss": 0.0073, "step": 265890 }, { "epoch": 1.34, "learning_rate": 9.877504275746553e-05, "loss": 0.0069, "step": 265900 }, { "epoch": 1.34, "learning_rate": 9.876747506445151e-05, "loss": 0.0099, "step": 265910 }, { "epoch": 1.34, "learning_rate": 9.87599073714375e-05, "loss": 0.0094, "step": 265920 }, { "epoch": 1.34, "learning_rate": 9.87523396784235e-05, "loss": 0.0089, "step": 265930 }, { "epoch": 1.34, "learning_rate": 9.874477198540948e-05, "loss": 0.0088, "step": 265940 }, { "epoch": 1.34, "learning_rate": 9.873720429239547e-05, "loss": 0.0088, "step": 265950 }, { "epoch": 1.34, "learning_rate": 9.872963659938147e-05, "loss": 0.0059, "step": 265960 }, { "epoch": 1.34, "learning_rate": 9.872206890636745e-05, "loss": 0.0053, "step": 265970 }, { "epoch": 1.34, "learning_rate": 9.871450121335344e-05, "loss": 0.0104, "step": 265980 }, { "epoch": 1.34, "learning_rate": 9.870693352033943e-05, "loss": 0.0073, "step": 265990 }, { "epoch": 1.34, "learning_rate": 9.869936582732542e-05, "loss": 0.0097, "step": 266000 }, { "epoch": 1.34, "eval_cer": 0.9144401736232748, "eval_loss": 0.0059706708416342735, "eval_runtime": 116.3669, "eval_samples_per_second": 17.187, "eval_steps_per_second": 4.297, "step": 266000 }, { "epoch": 1.34, "learning_rate": 9.869179813431142e-05, "loss": 0.0073, "step": 266010 }, { "epoch": 1.34, "learning_rate": 9.86842304412974e-05, "loss": 0.0072, "step": 266020 }, { "epoch": 1.34, "learning_rate": 9.867666274828339e-05, "loss": 0.0052, "step": 266030 }, { "epoch": 1.34, "learning_rate": 9.866909505526939e-05, "loss": 0.0078, "step": 266040 }, { "epoch": 1.34, "learning_rate": 9.866152736225537e-05, "loss": 0.0076, "step": 266050 }, { "epoch": 1.34, "learning_rate": 9.865395966924136e-05, "loss": 0.0073, "step": 266060 }, { "epoch": 1.34, "learning_rate": 9.864639197622735e-05, "loss": 0.0083, "step": 266070 }, { "epoch": 1.34, "learning_rate": 9.863882428321334e-05, "loss": 0.009, "step": 266080 }, { "epoch": 1.34, "learning_rate": 9.863125659019934e-05, "loss": 0.0075, "step": 266090 }, { "epoch": 1.34, "learning_rate": 9.862368889718532e-05, "loss": 0.0103, "step": 266100 }, { "epoch": 1.34, "learning_rate": 9.861612120417131e-05, "loss": 0.0073, "step": 266110 }, { "epoch": 1.34, "learning_rate": 9.860855351115731e-05, "loss": 0.0117, "step": 266120 }, { "epoch": 1.34, "learning_rate": 9.860098581814329e-05, "loss": 0.0078, "step": 266130 }, { "epoch": 1.34, "learning_rate": 9.859341812512928e-05, "loss": 0.0095, "step": 266140 }, { "epoch": 1.34, "learning_rate": 9.858585043211525e-05, "loss": 0.009, "step": 266150 }, { "epoch": 1.34, "learning_rate": 9.857828273910125e-05, "loss": 0.0063, "step": 266160 }, { "epoch": 1.34, "learning_rate": 9.857071504608723e-05, "loss": 0.0091, "step": 266170 }, { "epoch": 1.34, "learning_rate": 9.856314735307322e-05, "loss": 0.007, "step": 266180 }, { "epoch": 1.34, "learning_rate": 9.855557966005922e-05, "loss": 0.0086, "step": 266190 }, { "epoch": 1.34, "learning_rate": 9.85480119670452e-05, "loss": 0.0069, "step": 266200 }, { "epoch": 1.34, "learning_rate": 9.85404442740312e-05, "loss": 0.0078, "step": 266210 }, { "epoch": 1.34, "learning_rate": 9.853287658101719e-05, "loss": 0.0068, "step": 266220 }, { "epoch": 1.34, "learning_rate": 9.852530888800317e-05, "loss": 0.0091, "step": 266230 }, { "epoch": 1.34, "learning_rate": 9.851774119498917e-05, "loss": 0.0066, "step": 266240 }, { "epoch": 1.34, "learning_rate": 9.851017350197515e-05, "loss": 0.0071, "step": 266250 }, { "epoch": 1.34, "learning_rate": 9.850260580896114e-05, "loss": 0.0086, "step": 266260 }, { "epoch": 1.34, "learning_rate": 9.849503811594714e-05, "loss": 0.0057, "step": 266270 }, { "epoch": 1.34, "learning_rate": 9.848747042293312e-05, "loss": 0.0054, "step": 266280 }, { "epoch": 1.34, "learning_rate": 9.847990272991911e-05, "loss": 0.0068, "step": 266290 }, { "epoch": 1.34, "learning_rate": 9.847233503690511e-05, "loss": 0.0069, "step": 266300 }, { "epoch": 1.34, "learning_rate": 9.846476734389109e-05, "loss": 0.0081, "step": 266310 }, { "epoch": 1.34, "learning_rate": 9.845719965087708e-05, "loss": 0.0083, "step": 266320 }, { "epoch": 1.34, "learning_rate": 9.844963195786308e-05, "loss": 0.0089, "step": 266330 }, { "epoch": 1.34, "learning_rate": 9.844206426484906e-05, "loss": 0.008, "step": 266340 }, { "epoch": 1.34, "learning_rate": 9.843449657183506e-05, "loss": 0.006, "step": 266350 }, { "epoch": 1.34, "learning_rate": 9.842692887882104e-05, "loss": 0.0073, "step": 266360 }, { "epoch": 1.34, "learning_rate": 9.841936118580703e-05, "loss": 0.0086, "step": 266370 }, { "epoch": 1.34, "learning_rate": 9.841179349279303e-05, "loss": 0.0073, "step": 266380 }, { "epoch": 1.34, "learning_rate": 9.840422579977901e-05, "loss": 0.0072, "step": 266390 }, { "epoch": 1.34, "learning_rate": 9.8396658106765e-05, "loss": 0.0069, "step": 266400 }, { "epoch": 1.34, "learning_rate": 9.8389090413751e-05, "loss": 0.0091, "step": 266410 }, { "epoch": 1.34, "learning_rate": 9.838152272073698e-05, "loss": 0.0104, "step": 266420 }, { "epoch": 1.34, "learning_rate": 9.837395502772298e-05, "loss": 0.0079, "step": 266430 }, { "epoch": 1.34, "learning_rate": 9.836638733470896e-05, "loss": 0.0057, "step": 266440 }, { "epoch": 1.34, "learning_rate": 9.835881964169495e-05, "loss": 0.0086, "step": 266450 }, { "epoch": 1.34, "learning_rate": 9.835125194868095e-05, "loss": 0.0064, "step": 266460 }, { "epoch": 1.34, "learning_rate": 9.834368425566693e-05, "loss": 0.0084, "step": 266470 }, { "epoch": 1.34, "learning_rate": 9.833611656265292e-05, "loss": 0.0075, "step": 266480 }, { "epoch": 1.34, "learning_rate": 9.832854886963892e-05, "loss": 0.0102, "step": 266490 }, { "epoch": 1.34, "learning_rate": 9.83209811766249e-05, "loss": 0.0078, "step": 266500 }, { "epoch": 1.34, "learning_rate": 9.83134134836109e-05, "loss": 0.0077, "step": 266510 }, { "epoch": 1.34, "learning_rate": 9.830584579059688e-05, "loss": 0.0062, "step": 266520 }, { "epoch": 1.34, "learning_rate": 9.829827809758287e-05, "loss": 0.0086, "step": 266530 }, { "epoch": 1.34, "learning_rate": 9.829071040456887e-05, "loss": 0.009, "step": 266540 }, { "epoch": 1.34, "learning_rate": 9.828314271155485e-05, "loss": 0.0093, "step": 266550 }, { "epoch": 1.34, "learning_rate": 9.827557501854084e-05, "loss": 0.0072, "step": 266560 }, { "epoch": 1.34, "learning_rate": 9.826800732552684e-05, "loss": 0.0083, "step": 266570 }, { "epoch": 1.34, "learning_rate": 9.826043963251282e-05, "loss": 0.0077, "step": 266580 }, { "epoch": 1.34, "learning_rate": 9.825287193949881e-05, "loss": 0.0084, "step": 266590 }, { "epoch": 1.35, "learning_rate": 9.82453042464848e-05, "loss": 0.0082, "step": 266600 }, { "epoch": 1.35, "learning_rate": 9.823773655347079e-05, "loss": 0.0086, "step": 266610 }, { "epoch": 1.35, "learning_rate": 9.823016886045679e-05, "loss": 0.0064, "step": 266620 }, { "epoch": 1.35, "learning_rate": 9.822260116744277e-05, "loss": 0.0083, "step": 266630 }, { "epoch": 1.35, "learning_rate": 9.821503347442876e-05, "loss": 0.0085, "step": 266640 }, { "epoch": 1.35, "learning_rate": 9.820746578141476e-05, "loss": 0.0081, "step": 266650 }, { "epoch": 1.35, "learning_rate": 9.819989808840074e-05, "loss": 0.0196, "step": 266660 }, { "epoch": 1.35, "learning_rate": 9.819233039538673e-05, "loss": 0.0096, "step": 266670 }, { "epoch": 1.35, "learning_rate": 9.818476270237271e-05, "loss": 0.007, "step": 266680 }, { "epoch": 1.35, "learning_rate": 9.817719500935871e-05, "loss": 0.0066, "step": 266690 }, { "epoch": 1.35, "learning_rate": 9.81696273163447e-05, "loss": 0.0086, "step": 266700 }, { "epoch": 1.35, "learning_rate": 9.816205962333069e-05, "loss": 0.005, "step": 266710 }, { "epoch": 1.35, "learning_rate": 9.815449193031668e-05, "loss": 0.009, "step": 266720 }, { "epoch": 1.35, "learning_rate": 9.814692423730268e-05, "loss": 0.0079, "step": 266730 }, { "epoch": 1.35, "learning_rate": 9.813935654428866e-05, "loss": 0.0074, "step": 266740 }, { "epoch": 1.35, "learning_rate": 9.813178885127465e-05, "loss": 0.0069, "step": 266750 }, { "epoch": 1.35, "learning_rate": 9.812422115826063e-05, "loss": 0.0085, "step": 266760 }, { "epoch": 1.35, "learning_rate": 9.811665346524663e-05, "loss": 0.0131, "step": 266770 }, { "epoch": 1.35, "learning_rate": 9.810908577223261e-05, "loss": 0.0096, "step": 266780 }, { "epoch": 1.35, "learning_rate": 9.810151807921859e-05, "loss": 0.0064, "step": 266790 }, { "epoch": 1.35, "learning_rate": 9.809395038620459e-05, "loss": 0.0065, "step": 266800 }, { "epoch": 1.35, "learning_rate": 9.808638269319057e-05, "loss": 0.0081, "step": 266810 }, { "epoch": 1.35, "learning_rate": 9.807881500017656e-05, "loss": 0.007, "step": 266820 }, { "epoch": 1.35, "learning_rate": 9.807124730716256e-05, "loss": 0.0081, "step": 266830 }, { "epoch": 1.35, "learning_rate": 9.806367961414854e-05, "loss": 0.0087, "step": 266840 }, { "epoch": 1.35, "learning_rate": 9.805611192113454e-05, "loss": 0.0071, "step": 266850 }, { "epoch": 1.35, "learning_rate": 9.804854422812053e-05, "loss": 0.0072, "step": 266860 }, { "epoch": 1.35, "learning_rate": 9.804097653510651e-05, "loss": 0.0063, "step": 266870 }, { "epoch": 1.35, "learning_rate": 9.80334088420925e-05, "loss": 0.0085, "step": 266880 }, { "epoch": 1.35, "learning_rate": 9.802584114907849e-05, "loss": 0.0098, "step": 266890 }, { "epoch": 1.35, "learning_rate": 9.801827345606448e-05, "loss": 0.0072, "step": 266900 }, { "epoch": 1.35, "learning_rate": 9.801070576305048e-05, "loss": 0.0077, "step": 266910 }, { "epoch": 1.35, "learning_rate": 9.800313807003646e-05, "loss": 0.0079, "step": 266920 }, { "epoch": 1.35, "learning_rate": 9.799557037702245e-05, "loss": 0.0086, "step": 266930 }, { "epoch": 1.35, "learning_rate": 9.798800268400845e-05, "loss": 0.0101, "step": 266940 }, { "epoch": 1.35, "learning_rate": 9.798043499099443e-05, "loss": 0.0088, "step": 266950 }, { "epoch": 1.35, "learning_rate": 9.797286729798043e-05, "loss": 0.0081, "step": 266960 }, { "epoch": 1.35, "learning_rate": 9.796529960496641e-05, "loss": 0.0099, "step": 266970 }, { "epoch": 1.35, "learning_rate": 9.79577319119524e-05, "loss": 0.0081, "step": 266980 }, { "epoch": 1.35, "learning_rate": 9.79501642189384e-05, "loss": 0.0088, "step": 266990 }, { "epoch": 1.35, "learning_rate": 9.794259652592438e-05, "loss": 0.0085, "step": 267000 }, { "epoch": 1.35, "eval_cer": 0.9144362920387732, "eval_loss": 0.006072907242923975, "eval_runtime": 116.2245, "eval_samples_per_second": 17.208, "eval_steps_per_second": 4.302, "step": 267000 }, { "epoch": 1.35, "learning_rate": 9.793502883291037e-05, "loss": 0.0077, "step": 267010 }, { "epoch": 1.35, "learning_rate": 9.792746113989637e-05, "loss": 0.0094, "step": 267020 }, { "epoch": 1.35, "learning_rate": 9.791989344688235e-05, "loss": 0.0094, "step": 267030 }, { "epoch": 1.35, "learning_rate": 9.791232575386835e-05, "loss": 0.0082, "step": 267040 }, { "epoch": 1.35, "learning_rate": 9.790475806085433e-05, "loss": 0.0073, "step": 267050 }, { "epoch": 1.35, "learning_rate": 9.789719036784032e-05, "loss": 0.0083, "step": 267060 }, { "epoch": 1.35, "learning_rate": 9.788962267482632e-05, "loss": 0.0071, "step": 267070 }, { "epoch": 1.35, "learning_rate": 9.78820549818123e-05, "loss": 0.0079, "step": 267080 }, { "epoch": 1.35, "learning_rate": 9.787448728879829e-05, "loss": 0.0073, "step": 267090 }, { "epoch": 1.35, "learning_rate": 9.786691959578429e-05, "loss": 0.0102, "step": 267100 }, { "epoch": 1.35, "learning_rate": 9.785935190277027e-05, "loss": 0.007, "step": 267110 }, { "epoch": 1.35, "learning_rate": 9.785178420975626e-05, "loss": 0.0063, "step": 267120 }, { "epoch": 1.35, "learning_rate": 9.784421651674225e-05, "loss": 0.0094, "step": 267130 }, { "epoch": 1.35, "learning_rate": 9.783664882372824e-05, "loss": 0.0085, "step": 267140 }, { "epoch": 1.35, "learning_rate": 9.782908113071424e-05, "loss": 0.0124, "step": 267150 }, { "epoch": 1.35, "learning_rate": 9.782151343770022e-05, "loss": 0.0082, "step": 267160 }, { "epoch": 1.35, "learning_rate": 9.781394574468621e-05, "loss": 0.0076, "step": 267170 }, { "epoch": 1.35, "learning_rate": 9.780637805167221e-05, "loss": 0.0082, "step": 267180 }, { "epoch": 1.35, "learning_rate": 9.779881035865819e-05, "loss": 0.0074, "step": 267190 }, { "epoch": 1.35, "learning_rate": 9.779124266564418e-05, "loss": 0.0057, "step": 267200 }, { "epoch": 1.35, "learning_rate": 9.778367497263017e-05, "loss": 0.0079, "step": 267210 }, { "epoch": 1.35, "learning_rate": 9.777610727961616e-05, "loss": 0.0075, "step": 267220 }, { "epoch": 1.35, "learning_rate": 9.776853958660216e-05, "loss": 0.0092, "step": 267230 }, { "epoch": 1.35, "learning_rate": 9.776097189358814e-05, "loss": 0.0084, "step": 267240 }, { "epoch": 1.35, "learning_rate": 9.775340420057413e-05, "loss": 0.008, "step": 267250 }, { "epoch": 1.35, "learning_rate": 9.774583650756013e-05, "loss": 0.0095, "step": 267260 }, { "epoch": 1.35, "learning_rate": 9.773826881454611e-05, "loss": 0.0112, "step": 267270 }, { "epoch": 1.35, "learning_rate": 9.77307011215321e-05, "loss": 0.0085, "step": 267280 }, { "epoch": 1.35, "learning_rate": 9.772313342851808e-05, "loss": 0.0072, "step": 267290 }, { "epoch": 1.35, "learning_rate": 9.771556573550408e-05, "loss": 0.0122, "step": 267300 }, { "epoch": 1.35, "learning_rate": 9.770799804249007e-05, "loss": 0.007, "step": 267310 }, { "epoch": 1.35, "learning_rate": 9.770043034947606e-05, "loss": 0.0099, "step": 267320 }, { "epoch": 1.35, "learning_rate": 9.769286265646205e-05, "loss": 0.0078, "step": 267330 }, { "epoch": 1.35, "learning_rate": 9.768529496344805e-05, "loss": 0.0059, "step": 267340 }, { "epoch": 1.35, "learning_rate": 9.767772727043403e-05, "loss": 0.0083, "step": 267350 }, { "epoch": 1.35, "learning_rate": 9.767015957742002e-05, "loss": 0.0074, "step": 267360 }, { "epoch": 1.35, "learning_rate": 9.766259188440602e-05, "loss": 0.0079, "step": 267370 }, { "epoch": 1.35, "learning_rate": 9.7655024191392e-05, "loss": 0.0111, "step": 267380 }, { "epoch": 1.35, "learning_rate": 9.7647456498378e-05, "loss": 0.0085, "step": 267390 }, { "epoch": 1.35, "learning_rate": 9.763988880536398e-05, "loss": 0.0073, "step": 267400 }, { "epoch": 1.35, "learning_rate": 9.763232111234996e-05, "loss": 0.0077, "step": 267410 }, { "epoch": 1.35, "learning_rate": 9.762475341933594e-05, "loss": 0.0072, "step": 267420 }, { "epoch": 1.35, "learning_rate": 9.761718572632193e-05, "loss": 0.0089, "step": 267430 }, { "epoch": 1.35, "learning_rate": 9.760961803330793e-05, "loss": 0.0073, "step": 267440 }, { "epoch": 1.35, "learning_rate": 9.760205034029391e-05, "loss": 0.0093, "step": 267450 }, { "epoch": 1.35, "learning_rate": 9.75944826472799e-05, "loss": 0.0102, "step": 267460 }, { "epoch": 1.35, "learning_rate": 9.75869149542659e-05, "loss": 0.0109, "step": 267470 }, { "epoch": 1.35, "learning_rate": 9.757934726125188e-05, "loss": 0.0072, "step": 267480 }, { "epoch": 1.35, "learning_rate": 9.757177956823788e-05, "loss": 0.0081, "step": 267490 }, { "epoch": 1.35, "learning_rate": 9.756421187522386e-05, "loss": 0.0072, "step": 267500 }, { "epoch": 1.35, "learning_rate": 9.755664418220985e-05, "loss": 0.0104, "step": 267510 }, { "epoch": 1.35, "learning_rate": 9.754907648919585e-05, "loss": 0.0084, "step": 267520 }, { "epoch": 1.35, "learning_rate": 9.754150879618183e-05, "loss": 0.0082, "step": 267530 }, { "epoch": 1.35, "learning_rate": 9.753394110316782e-05, "loss": 0.0063, "step": 267540 }, { "epoch": 1.35, "learning_rate": 9.752637341015382e-05, "loss": 0.0057, "step": 267550 }, { "epoch": 1.35, "learning_rate": 9.75188057171398e-05, "loss": 0.008, "step": 267560 }, { "epoch": 1.35, "learning_rate": 9.75112380241258e-05, "loss": 0.008, "step": 267570 }, { "epoch": 1.35, "learning_rate": 9.750367033111178e-05, "loss": 0.007, "step": 267580 }, { "epoch": 1.35, "learning_rate": 9.749610263809777e-05, "loss": 0.0084, "step": 267590 }, { "epoch": 1.35, "learning_rate": 9.748853494508377e-05, "loss": 0.0078, "step": 267600 }, { "epoch": 1.35, "learning_rate": 9.748096725206975e-05, "loss": 0.0078, "step": 267610 }, { "epoch": 1.35, "learning_rate": 9.747339955905574e-05, "loss": 0.0081, "step": 267620 }, { "epoch": 1.35, "learning_rate": 9.746583186604174e-05, "loss": 0.0074, "step": 267630 }, { "epoch": 1.35, "learning_rate": 9.745826417302772e-05, "loss": 0.0079, "step": 267640 }, { "epoch": 1.35, "learning_rate": 9.745069648001371e-05, "loss": 0.0091, "step": 267650 }, { "epoch": 1.35, "learning_rate": 9.74431287869997e-05, "loss": 0.0076, "step": 267660 }, { "epoch": 1.35, "learning_rate": 9.743556109398569e-05, "loss": 0.0065, "step": 267670 }, { "epoch": 1.35, "learning_rate": 9.742799340097169e-05, "loss": 0.0077, "step": 267680 }, { "epoch": 1.35, "learning_rate": 9.742042570795767e-05, "loss": 0.0087, "step": 267690 }, { "epoch": 1.35, "learning_rate": 9.741285801494366e-05, "loss": 0.0082, "step": 267700 }, { "epoch": 1.35, "learning_rate": 9.740529032192966e-05, "loss": 0.0082, "step": 267710 }, { "epoch": 1.35, "learning_rate": 9.739772262891564e-05, "loss": 0.008, "step": 267720 }, { "epoch": 1.35, "learning_rate": 9.739015493590163e-05, "loss": 0.0072, "step": 267730 }, { "epoch": 1.35, "learning_rate": 9.738258724288762e-05, "loss": 0.0094, "step": 267740 }, { "epoch": 1.35, "learning_rate": 9.737501954987361e-05, "loss": 0.0073, "step": 267750 }, { "epoch": 1.35, "learning_rate": 9.73674518568596e-05, "loss": 0.009, "step": 267760 }, { "epoch": 1.35, "learning_rate": 9.735988416384559e-05, "loss": 0.0092, "step": 267770 }, { "epoch": 1.35, "learning_rate": 9.735231647083158e-05, "loss": 0.0104, "step": 267780 }, { "epoch": 1.35, "learning_rate": 9.734474877781758e-05, "loss": 0.0093, "step": 267790 }, { "epoch": 1.35, "learning_rate": 9.733718108480356e-05, "loss": 0.0077, "step": 267800 }, { "epoch": 1.35, "learning_rate": 9.732961339178955e-05, "loss": 0.0078, "step": 267810 }, { "epoch": 1.35, "learning_rate": 9.732204569877555e-05, "loss": 0.0077, "step": 267820 }, { "epoch": 1.35, "learning_rate": 9.731447800576153e-05, "loss": 0.0108, "step": 267830 }, { "epoch": 1.35, "learning_rate": 9.730691031274752e-05, "loss": 0.0084, "step": 267840 }, { "epoch": 1.35, "learning_rate": 9.72993426197335e-05, "loss": 0.009, "step": 267850 }, { "epoch": 1.35, "learning_rate": 9.72917749267195e-05, "loss": 0.0091, "step": 267860 }, { "epoch": 1.35, "learning_rate": 9.72842072337055e-05, "loss": 0.0086, "step": 267870 }, { "epoch": 1.35, "learning_rate": 9.727663954069148e-05, "loss": 0.0076, "step": 267880 }, { "epoch": 1.35, "learning_rate": 9.726907184767747e-05, "loss": 0.0094, "step": 267890 }, { "epoch": 1.35, "learning_rate": 9.726150415466347e-05, "loss": 0.0069, "step": 267900 }, { "epoch": 1.35, "learning_rate": 9.725393646164945e-05, "loss": 0.0094, "step": 267910 }, { "epoch": 1.35, "learning_rate": 9.724636876863544e-05, "loss": 0.0084, "step": 267920 }, { "epoch": 1.35, "learning_rate": 9.723880107562143e-05, "loss": 0.0083, "step": 267930 }, { "epoch": 1.35, "learning_rate": 9.723123338260742e-05, "loss": 0.0065, "step": 267940 }, { "epoch": 1.35, "learning_rate": 9.722366568959342e-05, "loss": 0.0069, "step": 267950 }, { "epoch": 1.35, "learning_rate": 9.72160979965794e-05, "loss": 0.0082, "step": 267960 }, { "epoch": 1.35, "learning_rate": 9.720853030356539e-05, "loss": 0.0048, "step": 267970 }, { "epoch": 1.35, "learning_rate": 9.720096261055139e-05, "loss": 0.0075, "step": 267980 }, { "epoch": 1.35, "learning_rate": 9.719339491753737e-05, "loss": 0.0079, "step": 267990 }, { "epoch": 1.35, "learning_rate": 9.718582722452336e-05, "loss": 0.0097, "step": 268000 }, { "epoch": 1.35, "eval_cer": 0.9144178545123905, "eval_loss": 0.006040630396455526, "eval_runtime": 116.1695, "eval_samples_per_second": 17.216, "eval_steps_per_second": 4.304, "step": 268000 }, { "epoch": 1.35, "learning_rate": 9.717825953150934e-05, "loss": 0.0077, "step": 268010 }, { "epoch": 1.35, "learning_rate": 9.717069183849534e-05, "loss": 0.0066, "step": 268020 }, { "epoch": 1.35, "learning_rate": 9.716312414548133e-05, "loss": 0.0069, "step": 268030 }, { "epoch": 1.35, "learning_rate": 9.71555564524673e-05, "loss": 0.0067, "step": 268040 }, { "epoch": 1.35, "learning_rate": 9.71479887594533e-05, "loss": 0.009, "step": 268050 }, { "epoch": 1.35, "learning_rate": 9.714042106643928e-05, "loss": 0.0094, "step": 268060 }, { "epoch": 1.35, "learning_rate": 9.713285337342527e-05, "loss": 0.0093, "step": 268070 }, { "epoch": 1.35, "learning_rate": 9.712528568041127e-05, "loss": 0.009, "step": 268080 }, { "epoch": 1.35, "learning_rate": 9.711771798739725e-05, "loss": 0.0085, "step": 268090 }, { "epoch": 1.35, "learning_rate": 9.711015029438325e-05, "loss": 0.006, "step": 268100 }, { "epoch": 1.35, "learning_rate": 9.710258260136923e-05, "loss": 0.0086, "step": 268110 }, { "epoch": 1.35, "learning_rate": 9.709501490835522e-05, "loss": 0.0087, "step": 268120 }, { "epoch": 1.35, "learning_rate": 9.708744721534122e-05, "loss": 0.0082, "step": 268130 }, { "epoch": 1.35, "learning_rate": 9.70798795223272e-05, "loss": 0.01, "step": 268140 }, { "epoch": 1.35, "learning_rate": 9.707231182931319e-05, "loss": 0.0074, "step": 268150 }, { "epoch": 1.35, "learning_rate": 9.706474413629919e-05, "loss": 0.0075, "step": 268160 }, { "epoch": 1.35, "learning_rate": 9.705717644328517e-05, "loss": 0.0093, "step": 268170 }, { "epoch": 1.35, "learning_rate": 9.704960875027116e-05, "loss": 0.0103, "step": 268180 }, { "epoch": 1.35, "learning_rate": 9.704204105725715e-05, "loss": 0.011, "step": 268190 }, { "epoch": 1.35, "learning_rate": 9.703447336424314e-05, "loss": 0.0117, "step": 268200 }, { "epoch": 1.35, "learning_rate": 9.702690567122914e-05, "loss": 0.0072, "step": 268210 }, { "epoch": 1.35, "learning_rate": 9.701933797821512e-05, "loss": 0.0082, "step": 268220 }, { "epoch": 1.35, "learning_rate": 9.701177028520111e-05, "loss": 0.0095, "step": 268230 }, { "epoch": 1.35, "learning_rate": 9.700420259218711e-05, "loss": 0.0063, "step": 268240 }, { "epoch": 1.35, "learning_rate": 9.699663489917309e-05, "loss": 0.0084, "step": 268250 }, { "epoch": 1.35, "learning_rate": 9.698906720615908e-05, "loss": 0.0082, "step": 268260 }, { "epoch": 1.35, "learning_rate": 9.698149951314508e-05, "loss": 0.0067, "step": 268270 }, { "epoch": 1.35, "learning_rate": 9.697393182013106e-05, "loss": 0.0108, "step": 268280 }, { "epoch": 1.35, "learning_rate": 9.696636412711706e-05, "loss": 0.0059, "step": 268290 }, { "epoch": 1.35, "learning_rate": 9.695879643410304e-05, "loss": 0.0091, "step": 268300 }, { "epoch": 1.35, "learning_rate": 9.695122874108903e-05, "loss": 0.0077, "step": 268310 }, { "epoch": 1.35, "learning_rate": 9.694366104807503e-05, "loss": 0.0072, "step": 268320 }, { "epoch": 1.35, "learning_rate": 9.693609335506101e-05, "loss": 0.0088, "step": 268330 }, { "epoch": 1.35, "learning_rate": 9.6928525662047e-05, "loss": 0.0086, "step": 268340 }, { "epoch": 1.35, "learning_rate": 9.6920957969033e-05, "loss": 0.0089, "step": 268350 }, { "epoch": 1.35, "learning_rate": 9.691339027601898e-05, "loss": 0.0096, "step": 268360 }, { "epoch": 1.35, "learning_rate": 9.690582258300497e-05, "loss": 0.0066, "step": 268370 }, { "epoch": 1.35, "learning_rate": 9.689825488999096e-05, "loss": 0.0087, "step": 268380 }, { "epoch": 1.35, "learning_rate": 9.689068719697695e-05, "loss": 0.0076, "step": 268390 }, { "epoch": 1.35, "learning_rate": 9.688311950396295e-05, "loss": 0.0084, "step": 268400 }, { "epoch": 1.35, "learning_rate": 9.687555181094893e-05, "loss": 0.0072, "step": 268410 }, { "epoch": 1.35, "learning_rate": 9.686798411793492e-05, "loss": 0.0071, "step": 268420 }, { "epoch": 1.35, "learning_rate": 9.686041642492092e-05, "loss": 0.0054, "step": 268430 }, { "epoch": 1.35, "learning_rate": 9.68528487319069e-05, "loss": 0.0069, "step": 268440 }, { "epoch": 1.35, "learning_rate": 9.68452810388929e-05, "loss": 0.0066, "step": 268450 }, { "epoch": 1.35, "learning_rate": 9.683771334587888e-05, "loss": 0.0079, "step": 268460 }, { "epoch": 1.35, "learning_rate": 9.683014565286487e-05, "loss": 0.0091, "step": 268470 }, { "epoch": 1.35, "learning_rate": 9.682257795985087e-05, "loss": 0.0072, "step": 268480 }, { "epoch": 1.35, "learning_rate": 9.681501026683685e-05, "loss": 0.0107, "step": 268490 }, { "epoch": 1.35, "learning_rate": 9.680744257382284e-05, "loss": 0.0106, "step": 268500 }, { "epoch": 1.35, "learning_rate": 9.679987488080884e-05, "loss": 0.0089, "step": 268510 }, { "epoch": 1.35, "learning_rate": 9.679230718779482e-05, "loss": 0.0089, "step": 268520 }, { "epoch": 1.35, "learning_rate": 9.678473949478081e-05, "loss": 0.0067, "step": 268530 }, { "epoch": 1.35, "learning_rate": 9.67771718017668e-05, "loss": 0.0096, "step": 268540 }, { "epoch": 1.35, "learning_rate": 9.676960410875279e-05, "loss": 0.0089, "step": 268550 }, { "epoch": 1.35, "learning_rate": 9.676203641573878e-05, "loss": 0.007, "step": 268560 }, { "epoch": 1.35, "learning_rate": 9.675446872272477e-05, "loss": 0.0088, "step": 268570 }, { "epoch": 1.36, "learning_rate": 9.674690102971076e-05, "loss": 0.0074, "step": 268580 }, { "epoch": 1.36, "learning_rate": 9.673933333669676e-05, "loss": 0.0077, "step": 268590 }, { "epoch": 1.36, "learning_rate": 9.673176564368274e-05, "loss": 0.008, "step": 268600 }, { "epoch": 1.36, "learning_rate": 9.672419795066873e-05, "loss": 0.0067, "step": 268610 }, { "epoch": 1.36, "learning_rate": 9.671663025765471e-05, "loss": 0.0069, "step": 268620 }, { "epoch": 1.36, "learning_rate": 9.670906256464071e-05, "loss": 0.008, "step": 268630 }, { "epoch": 1.36, "learning_rate": 9.67014948716267e-05, "loss": 0.008, "step": 268640 }, { "epoch": 1.36, "learning_rate": 9.669392717861269e-05, "loss": 0.0084, "step": 268650 }, { "epoch": 1.36, "learning_rate": 9.668635948559867e-05, "loss": 0.0067, "step": 268660 }, { "epoch": 1.36, "learning_rate": 9.667879179258465e-05, "loss": 0.0069, "step": 268670 }, { "epoch": 1.36, "learning_rate": 9.667122409957064e-05, "loss": 0.0072, "step": 268680 }, { "epoch": 1.36, "learning_rate": 9.666365640655664e-05, "loss": 0.0089, "step": 268690 }, { "epoch": 1.36, "learning_rate": 9.665608871354262e-05, "loss": 0.0101, "step": 268700 }, { "epoch": 1.36, "learning_rate": 9.664852102052861e-05, "loss": 0.0076, "step": 268710 }, { "epoch": 1.36, "learning_rate": 9.664095332751461e-05, "loss": 0.0063, "step": 268720 }, { "epoch": 1.36, "learning_rate": 9.663338563450059e-05, "loss": 0.0059, "step": 268730 }, { "epoch": 1.36, "learning_rate": 9.662581794148659e-05, "loss": 0.0095, "step": 268740 }, { "epoch": 1.36, "learning_rate": 9.661825024847257e-05, "loss": 0.0082, "step": 268750 }, { "epoch": 1.36, "learning_rate": 9.661068255545856e-05, "loss": 0.0068, "step": 268760 }, { "epoch": 1.36, "learning_rate": 9.660311486244456e-05, "loss": 0.0121, "step": 268770 }, { "epoch": 1.36, "learning_rate": 9.659554716943054e-05, "loss": 0.0091, "step": 268780 }, { "epoch": 1.36, "learning_rate": 9.658797947641653e-05, "loss": 0.0057, "step": 268790 }, { "epoch": 1.36, "learning_rate": 9.658041178340253e-05, "loss": 0.0102, "step": 268800 }, { "epoch": 1.36, "learning_rate": 9.657284409038851e-05, "loss": 0.012, "step": 268810 }, { "epoch": 1.36, "learning_rate": 9.65652763973745e-05, "loss": 0.0092, "step": 268820 }, { "epoch": 1.36, "learning_rate": 9.655770870436049e-05, "loss": 0.0078, "step": 268830 }, { "epoch": 1.36, "learning_rate": 9.655014101134648e-05, "loss": 0.0102, "step": 268840 }, { "epoch": 1.36, "learning_rate": 9.654257331833248e-05, "loss": 0.0084, "step": 268850 }, { "epoch": 1.36, "learning_rate": 9.653500562531846e-05, "loss": 0.0069, "step": 268860 }, { "epoch": 1.36, "learning_rate": 9.652743793230445e-05, "loss": 0.0055, "step": 268870 }, { "epoch": 1.36, "learning_rate": 9.651987023929045e-05, "loss": 0.0075, "step": 268880 }, { "epoch": 1.36, "learning_rate": 9.651230254627643e-05, "loss": 0.0062, "step": 268890 }, { "epoch": 1.36, "learning_rate": 9.650473485326242e-05, "loss": 0.0084, "step": 268900 }, { "epoch": 1.36, "learning_rate": 9.64971671602484e-05, "loss": 0.0083, "step": 268910 }, { "epoch": 1.36, "learning_rate": 9.64895994672344e-05, "loss": 0.0065, "step": 268920 }, { "epoch": 1.36, "learning_rate": 9.64820317742204e-05, "loss": 0.0084, "step": 268930 }, { "epoch": 1.36, "learning_rate": 9.647446408120638e-05, "loss": 0.0078, "step": 268940 }, { "epoch": 1.36, "learning_rate": 9.646689638819237e-05, "loss": 0.0071, "step": 268950 }, { "epoch": 1.36, "learning_rate": 9.645932869517837e-05, "loss": 0.007, "step": 268960 }, { "epoch": 1.36, "learning_rate": 9.645176100216435e-05, "loss": 0.008, "step": 268970 }, { "epoch": 1.36, "learning_rate": 9.644419330915034e-05, "loss": 0.007, "step": 268980 }, { "epoch": 1.36, "learning_rate": 9.643662561613633e-05, "loss": 0.0079, "step": 268990 }, { "epoch": 1.36, "learning_rate": 9.642905792312232e-05, "loss": 0.0084, "step": 269000 }, { "epoch": 1.36, "eval_cer": 0.9144071801550111, "eval_loss": 0.006098465994000435, "eval_runtime": 116.3578, "eval_samples_per_second": 17.188, "eval_steps_per_second": 4.297, "step": 269000 }, { "epoch": 1.36, "learning_rate": 9.642149023010832e-05, "loss": 0.0086, "step": 269010 }, { "epoch": 1.36, "learning_rate": 9.64139225370943e-05, "loss": 0.0089, "step": 269020 }, { "epoch": 1.36, "learning_rate": 9.640635484408029e-05, "loss": 0.0087, "step": 269030 }, { "epoch": 1.36, "learning_rate": 9.639878715106629e-05, "loss": 0.0073, "step": 269040 }, { "epoch": 1.36, "learning_rate": 9.639121945805227e-05, "loss": 0.007, "step": 269050 }, { "epoch": 1.36, "learning_rate": 9.638365176503826e-05, "loss": 0.0061, "step": 269060 }, { "epoch": 1.36, "learning_rate": 9.637608407202424e-05, "loss": 0.0093, "step": 269070 }, { "epoch": 1.36, "learning_rate": 9.636851637901024e-05, "loss": 0.0096, "step": 269080 }, { "epoch": 1.36, "learning_rate": 9.636094868599623e-05, "loss": 0.0075, "step": 269090 }, { "epoch": 1.36, "learning_rate": 9.635338099298222e-05, "loss": 0.0059, "step": 269100 }, { "epoch": 1.36, "learning_rate": 9.634581329996821e-05, "loss": 0.0064, "step": 269110 }, { "epoch": 1.36, "learning_rate": 9.63382456069542e-05, "loss": 0.0079, "step": 269120 }, { "epoch": 1.36, "learning_rate": 9.633067791394019e-05, "loss": 0.0084, "step": 269130 }, { "epoch": 1.36, "learning_rate": 9.632311022092618e-05, "loss": 0.01, "step": 269140 }, { "epoch": 1.36, "learning_rate": 9.631554252791216e-05, "loss": 0.0084, "step": 269150 }, { "epoch": 1.36, "learning_rate": 9.630797483489816e-05, "loss": 0.0088, "step": 269160 }, { "epoch": 1.36, "learning_rate": 9.630040714188415e-05, "loss": 0.0103, "step": 269170 }, { "epoch": 1.36, "learning_rate": 9.629283944887014e-05, "loss": 0.0071, "step": 269180 }, { "epoch": 1.36, "learning_rate": 9.628527175585613e-05, "loss": 0.0075, "step": 269190 }, { "epoch": 1.36, "learning_rate": 9.627770406284213e-05, "loss": 0.01, "step": 269200 }, { "epoch": 1.36, "learning_rate": 9.627013636982811e-05, "loss": 0.0089, "step": 269210 }, { "epoch": 1.36, "learning_rate": 9.62625686768141e-05, "loss": 0.0079, "step": 269220 }, { "epoch": 1.36, "learning_rate": 9.625500098380008e-05, "loss": 0.0076, "step": 269230 }, { "epoch": 1.36, "learning_rate": 9.624743329078608e-05, "loss": 0.0089, "step": 269240 }, { "epoch": 1.36, "learning_rate": 9.623986559777207e-05, "loss": 0.0101, "step": 269250 }, { "epoch": 1.36, "learning_rate": 9.623229790475805e-05, "loss": 0.0067, "step": 269260 }, { "epoch": 1.36, "learning_rate": 9.622473021174405e-05, "loss": 0.0118, "step": 269270 }, { "epoch": 1.36, "learning_rate": 9.621716251873004e-05, "loss": 0.0084, "step": 269280 }, { "epoch": 1.36, "learning_rate": 9.620959482571601e-05, "loss": 0.0121, "step": 269290 }, { "epoch": 1.36, "learning_rate": 9.620202713270201e-05, "loss": 0.0075, "step": 269300 }, { "epoch": 1.36, "learning_rate": 9.619445943968799e-05, "loss": 0.0071, "step": 269310 }, { "epoch": 1.36, "learning_rate": 9.618689174667398e-05, "loss": 0.0084, "step": 269320 }, { "epoch": 1.36, "learning_rate": 9.617932405365998e-05, "loss": 0.0066, "step": 269330 }, { "epoch": 1.36, "learning_rate": 9.617175636064596e-05, "loss": 0.0132, "step": 269340 }, { "epoch": 1.36, "learning_rate": 9.616418866763196e-05, "loss": 0.0086, "step": 269350 }, { "epoch": 1.36, "learning_rate": 9.615662097461794e-05, "loss": 0.0085, "step": 269360 }, { "epoch": 1.36, "learning_rate": 9.614905328160393e-05, "loss": 0.0111, "step": 269370 }, { "epoch": 1.36, "learning_rate": 9.614148558858993e-05, "loss": 0.0076, "step": 269380 }, { "epoch": 1.36, "learning_rate": 9.613391789557591e-05, "loss": 0.0058, "step": 269390 }, { "epoch": 1.36, "learning_rate": 9.61263502025619e-05, "loss": 0.0119, "step": 269400 }, { "epoch": 1.36, "learning_rate": 9.61187825095479e-05, "loss": 0.008, "step": 269410 }, { "epoch": 1.36, "learning_rate": 9.611121481653388e-05, "loss": 0.0097, "step": 269420 }, { "epoch": 1.36, "learning_rate": 9.610364712351987e-05, "loss": 0.0094, "step": 269430 }, { "epoch": 1.36, "learning_rate": 9.609607943050586e-05, "loss": 0.0089, "step": 269440 }, { "epoch": 1.36, "learning_rate": 9.608851173749185e-05, "loss": 0.0077, "step": 269450 }, { "epoch": 1.36, "learning_rate": 9.608094404447785e-05, "loss": 0.0083, "step": 269460 }, { "epoch": 1.36, "learning_rate": 9.607337635146383e-05, "loss": 0.0076, "step": 269470 }, { "epoch": 1.36, "learning_rate": 9.606580865844982e-05, "loss": 0.0094, "step": 269480 }, { "epoch": 1.36, "learning_rate": 9.605824096543582e-05, "loss": 0.0062, "step": 269490 }, { "epoch": 1.36, "learning_rate": 9.60506732724218e-05, "loss": 0.0084, "step": 269500 }, { "epoch": 1.36, "learning_rate": 9.60431055794078e-05, "loss": 0.007, "step": 269510 }, { "epoch": 1.36, "learning_rate": 9.603553788639378e-05, "loss": 0.0101, "step": 269520 }, { "epoch": 1.36, "learning_rate": 9.602797019337977e-05, "loss": 0.0064, "step": 269530 }, { "epoch": 1.36, "learning_rate": 9.602040250036577e-05, "loss": 0.0061, "step": 269540 }, { "epoch": 1.36, "learning_rate": 9.601283480735175e-05, "loss": 0.0073, "step": 269550 }, { "epoch": 1.36, "learning_rate": 9.600526711433774e-05, "loss": 0.0067, "step": 269560 }, { "epoch": 1.36, "learning_rate": 9.599769942132374e-05, "loss": 0.007, "step": 269570 }, { "epoch": 1.36, "learning_rate": 9.599013172830972e-05, "loss": 0.0078, "step": 269580 }, { "epoch": 1.36, "learning_rate": 9.598256403529571e-05, "loss": 0.0085, "step": 269590 }, { "epoch": 1.36, "learning_rate": 9.59749963422817e-05, "loss": 0.0066, "step": 269600 }, { "epoch": 1.36, "learning_rate": 9.596742864926769e-05, "loss": 0.0091, "step": 269610 }, { "epoch": 1.36, "learning_rate": 9.595986095625368e-05, "loss": 0.0078, "step": 269620 }, { "epoch": 1.36, "learning_rate": 9.595229326323967e-05, "loss": 0.0072, "step": 269630 }, { "epoch": 1.36, "learning_rate": 9.594472557022566e-05, "loss": 0.0078, "step": 269640 }, { "epoch": 1.36, "learning_rate": 9.593715787721166e-05, "loss": 0.0075, "step": 269650 }, { "epoch": 1.36, "learning_rate": 9.592959018419764e-05, "loss": 0.008, "step": 269660 }, { "epoch": 1.36, "learning_rate": 9.592202249118363e-05, "loss": 0.0098, "step": 269670 }, { "epoch": 1.36, "learning_rate": 9.591445479816961e-05, "loss": 0.0063, "step": 269680 }, { "epoch": 1.36, "learning_rate": 9.590688710515561e-05, "loss": 0.0096, "step": 269690 }, { "epoch": 1.36, "learning_rate": 9.58993194121416e-05, "loss": 0.0078, "step": 269700 }, { "epoch": 1.36, "learning_rate": 9.589175171912759e-05, "loss": 0.0085, "step": 269710 }, { "epoch": 1.36, "learning_rate": 9.588418402611358e-05, "loss": 0.007, "step": 269720 }, { "epoch": 1.36, "learning_rate": 9.587661633309958e-05, "loss": 0.0074, "step": 269730 }, { "epoch": 1.36, "learning_rate": 9.586904864008556e-05, "loss": 0.0079, "step": 269740 }, { "epoch": 1.36, "learning_rate": 9.586148094707155e-05, "loss": 0.0071, "step": 269750 }, { "epoch": 1.36, "learning_rate": 9.585391325405755e-05, "loss": 0.0103, "step": 269760 }, { "epoch": 1.36, "learning_rate": 9.584634556104353e-05, "loss": 0.0076, "step": 269770 }, { "epoch": 1.36, "learning_rate": 9.583877786802952e-05, "loss": 0.0091, "step": 269780 }, { "epoch": 1.36, "learning_rate": 9.58312101750155e-05, "loss": 0.0077, "step": 269790 }, { "epoch": 1.36, "learning_rate": 9.58236424820015e-05, "loss": 0.0103, "step": 269800 }, { "epoch": 1.36, "learning_rate": 9.58160747889875e-05, "loss": 0.008, "step": 269810 }, { "epoch": 1.36, "learning_rate": 9.580850709597348e-05, "loss": 0.0086, "step": 269820 }, { "epoch": 1.36, "learning_rate": 9.580093940295947e-05, "loss": 0.0072, "step": 269830 }, { "epoch": 1.36, "learning_rate": 9.579337170994547e-05, "loss": 0.0057, "step": 269840 }, { "epoch": 1.36, "learning_rate": 9.578580401693145e-05, "loss": 0.0089, "step": 269850 }, { "epoch": 1.36, "learning_rate": 9.577823632391744e-05, "loss": 0.0089, "step": 269860 }, { "epoch": 1.36, "learning_rate": 9.577066863090342e-05, "loss": 0.0091, "step": 269870 }, { "epoch": 1.36, "learning_rate": 9.576310093788942e-05, "loss": 0.0081, "step": 269880 }, { "epoch": 1.36, "learning_rate": 9.575553324487541e-05, "loss": 0.0081, "step": 269890 }, { "epoch": 1.36, "learning_rate": 9.57479655518614e-05, "loss": 0.0074, "step": 269900 }, { "epoch": 1.36, "learning_rate": 9.574039785884739e-05, "loss": 0.0084, "step": 269910 }, { "epoch": 1.36, "learning_rate": 9.573283016583336e-05, "loss": 0.008, "step": 269920 }, { "epoch": 1.36, "learning_rate": 9.572526247281935e-05, "loss": 0.0081, "step": 269930 }, { "epoch": 1.36, "learning_rate": 9.571769477980535e-05, "loss": 0.0082, "step": 269940 }, { "epoch": 1.36, "learning_rate": 9.571012708679133e-05, "loss": 0.0071, "step": 269950 }, { "epoch": 1.36, "learning_rate": 9.570255939377733e-05, "loss": 0.0065, "step": 269960 }, { "epoch": 1.36, "learning_rate": 9.56949917007633e-05, "loss": 0.0084, "step": 269970 }, { "epoch": 1.36, "learning_rate": 9.56874240077493e-05, "loss": 0.0086, "step": 269980 }, { "epoch": 1.36, "learning_rate": 9.56798563147353e-05, "loss": 0.0087, "step": 269990 }, { "epoch": 1.36, "learning_rate": 9.567228862172128e-05, "loss": 0.0089, "step": 270000 }, { "epoch": 1.36, "eval_cer": 0.9144333808503969, "eval_loss": 0.006005189847201109, "eval_runtime": 116.1544, "eval_samples_per_second": 17.218, "eval_steps_per_second": 4.305, "step": 270000 }, { "epoch": 1.36, "learning_rate": 9.566472092870727e-05, "loss": 0.009, "step": 270010 }, { "epoch": 1.36, "learning_rate": 9.565715323569327e-05, "loss": 0.0076, "step": 270020 }, { "epoch": 1.36, "learning_rate": 9.564958554267925e-05, "loss": 0.008, "step": 270030 }, { "epoch": 1.36, "learning_rate": 9.564201784966524e-05, "loss": 0.0072, "step": 270040 }, { "epoch": 1.36, "learning_rate": 9.563445015665123e-05, "loss": 0.007, "step": 270050 }, { "epoch": 1.36, "learning_rate": 9.562688246363722e-05, "loss": 0.0064, "step": 270060 }, { "epoch": 1.36, "learning_rate": 9.561931477062322e-05, "loss": 0.0069, "step": 270070 }, { "epoch": 1.36, "learning_rate": 9.56117470776092e-05, "loss": 0.0092, "step": 270080 }, { "epoch": 1.36, "learning_rate": 9.560417938459519e-05, "loss": 0.0101, "step": 270090 }, { "epoch": 1.36, "learning_rate": 9.559661169158119e-05, "loss": 0.0097, "step": 270100 }, { "epoch": 1.36, "learning_rate": 9.558904399856717e-05, "loss": 0.0091, "step": 270110 }, { "epoch": 1.36, "learning_rate": 9.558147630555316e-05, "loss": 0.007, "step": 270120 }, { "epoch": 1.36, "learning_rate": 9.557390861253915e-05, "loss": 0.0101, "step": 270130 }, { "epoch": 1.36, "learning_rate": 9.556634091952514e-05, "loss": 0.0088, "step": 270140 }, { "epoch": 1.36, "learning_rate": 9.555877322651114e-05, "loss": 0.0064, "step": 270150 }, { "epoch": 1.36, "learning_rate": 9.555120553349712e-05, "loss": 0.0073, "step": 270160 }, { "epoch": 1.36, "learning_rate": 9.554363784048311e-05, "loss": 0.0073, "step": 270170 }, { "epoch": 1.36, "learning_rate": 9.55360701474691e-05, "loss": 0.0063, "step": 270180 }, { "epoch": 1.36, "learning_rate": 9.552850245445509e-05, "loss": 0.0069, "step": 270190 }, { "epoch": 1.36, "learning_rate": 9.552093476144108e-05, "loss": 0.0084, "step": 270200 }, { "epoch": 1.36, "learning_rate": 9.551336706842708e-05, "loss": 0.0074, "step": 270210 }, { "epoch": 1.36, "learning_rate": 9.550579937541306e-05, "loss": 0.0074, "step": 270220 }, { "epoch": 1.36, "learning_rate": 9.549823168239905e-05, "loss": 0.0057, "step": 270230 }, { "epoch": 1.36, "learning_rate": 9.549066398938504e-05, "loss": 0.0102, "step": 270240 }, { "epoch": 1.36, "learning_rate": 9.548309629637103e-05, "loss": 0.0072, "step": 270250 }, { "epoch": 1.36, "learning_rate": 9.547552860335703e-05, "loss": 0.0056, "step": 270260 }, { "epoch": 1.36, "learning_rate": 9.546796091034301e-05, "loss": 0.0065, "step": 270270 }, { "epoch": 1.36, "learning_rate": 9.5460393217329e-05, "loss": 0.0075, "step": 270280 }, { "epoch": 1.36, "learning_rate": 9.5452825524315e-05, "loss": 0.0137, "step": 270290 }, { "epoch": 1.36, "learning_rate": 9.544525783130098e-05, "loss": 0.0086, "step": 270300 }, { "epoch": 1.36, "learning_rate": 9.543769013828697e-05, "loss": 0.0099, "step": 270310 }, { "epoch": 1.36, "learning_rate": 9.543012244527296e-05, "loss": 0.0071, "step": 270320 }, { "epoch": 1.36, "learning_rate": 9.542255475225895e-05, "loss": 0.0083, "step": 270330 }, { "epoch": 1.36, "learning_rate": 9.541498705924495e-05, "loss": 0.0088, "step": 270340 }, { "epoch": 1.36, "learning_rate": 9.540741936623093e-05, "loss": 0.0081, "step": 270350 }, { "epoch": 1.36, "learning_rate": 9.539985167321692e-05, "loss": 0.0068, "step": 270360 }, { "epoch": 1.36, "learning_rate": 9.539228398020292e-05, "loss": 0.009, "step": 270370 }, { "epoch": 1.36, "learning_rate": 9.53847162871889e-05, "loss": 0.0095, "step": 270380 }, { "epoch": 1.36, "learning_rate": 9.537714859417489e-05, "loss": 0.0088, "step": 270390 }, { "epoch": 1.36, "learning_rate": 9.536958090116087e-05, "loss": 0.0054, "step": 270400 }, { "epoch": 1.36, "learning_rate": 9.536201320814687e-05, "loss": 0.0095, "step": 270410 }, { "epoch": 1.36, "learning_rate": 9.535444551513286e-05, "loss": 0.0065, "step": 270420 }, { "epoch": 1.36, "learning_rate": 9.534687782211885e-05, "loss": 0.007, "step": 270430 }, { "epoch": 1.36, "learning_rate": 9.533931012910484e-05, "loss": 0.0067, "step": 270440 }, { "epoch": 1.36, "learning_rate": 9.533174243609084e-05, "loss": 0.0108, "step": 270450 }, { "epoch": 1.36, "learning_rate": 9.532417474307682e-05, "loss": 0.0086, "step": 270460 }, { "epoch": 1.36, "learning_rate": 9.531660705006281e-05, "loss": 0.0096, "step": 270470 }, { "epoch": 1.36, "learning_rate": 9.53090393570488e-05, "loss": 0.0108, "step": 270480 }, { "epoch": 1.36, "learning_rate": 9.530147166403479e-05, "loss": 0.0072, "step": 270490 }, { "epoch": 1.36, "learning_rate": 9.529390397102078e-05, "loss": 0.0075, "step": 270500 }, { "epoch": 1.36, "learning_rate": 9.528633627800677e-05, "loss": 0.0064, "step": 270510 }, { "epoch": 1.36, "learning_rate": 9.527876858499276e-05, "loss": 0.009, "step": 270520 }, { "epoch": 1.36, "learning_rate": 9.527120089197876e-05, "loss": 0.0097, "step": 270530 }, { "epoch": 1.36, "learning_rate": 9.526363319896474e-05, "loss": 0.0086, "step": 270540 }, { "epoch": 1.36, "learning_rate": 9.525606550595072e-05, "loss": 0.0065, "step": 270550 }, { "epoch": 1.37, "learning_rate": 9.52484978129367e-05, "loss": 0.0082, "step": 270560 }, { "epoch": 1.37, "learning_rate": 9.52409301199227e-05, "loss": 0.0068, "step": 270570 }, { "epoch": 1.37, "learning_rate": 9.523336242690868e-05, "loss": 0.0097, "step": 270580 }, { "epoch": 1.37, "learning_rate": 9.522579473389467e-05, "loss": 0.0063, "step": 270590 }, { "epoch": 1.37, "learning_rate": 9.521822704088067e-05, "loss": 0.0072, "step": 270600 }, { "epoch": 1.37, "learning_rate": 9.521065934786665e-05, "loss": 0.0096, "step": 270610 }, { "epoch": 1.37, "learning_rate": 9.520309165485264e-05, "loss": 0.0068, "step": 270620 }, { "epoch": 1.37, "learning_rate": 9.519552396183864e-05, "loss": 0.0065, "step": 270630 }, { "epoch": 1.37, "learning_rate": 9.518795626882462e-05, "loss": 0.0081, "step": 270640 }, { "epoch": 1.37, "learning_rate": 9.518038857581061e-05, "loss": 0.0074, "step": 270650 }, { "epoch": 1.37, "learning_rate": 9.517282088279661e-05, "loss": 0.0066, "step": 270660 }, { "epoch": 1.37, "learning_rate": 9.516525318978259e-05, "loss": 0.0092, "step": 270670 }, { "epoch": 1.37, "learning_rate": 9.515768549676859e-05, "loss": 0.0133, "step": 270680 }, { "epoch": 1.37, "learning_rate": 9.515011780375457e-05, "loss": 0.0075, "step": 270690 }, { "epoch": 1.37, "learning_rate": 9.514255011074056e-05, "loss": 0.0079, "step": 270700 }, { "epoch": 1.37, "learning_rate": 9.513498241772656e-05, "loss": 0.0083, "step": 270710 }, { "epoch": 1.37, "learning_rate": 9.512741472471254e-05, "loss": 0.0081, "step": 270720 }, { "epoch": 1.37, "learning_rate": 9.511984703169853e-05, "loss": 0.0077, "step": 270730 }, { "epoch": 1.37, "learning_rate": 9.511227933868453e-05, "loss": 0.0062, "step": 270740 }, { "epoch": 1.37, "learning_rate": 9.510471164567051e-05, "loss": 0.0069, "step": 270750 }, { "epoch": 1.37, "learning_rate": 9.50971439526565e-05, "loss": 0.007, "step": 270760 }, { "epoch": 1.37, "learning_rate": 9.508957625964249e-05, "loss": 0.0087, "step": 270770 }, { "epoch": 1.37, "learning_rate": 9.508200856662848e-05, "loss": 0.0093, "step": 270780 }, { "epoch": 1.37, "learning_rate": 9.507444087361448e-05, "loss": 0.0117, "step": 270790 }, { "epoch": 1.37, "learning_rate": 9.506687318060046e-05, "loss": 0.0083, "step": 270800 }, { "epoch": 1.37, "learning_rate": 9.505930548758645e-05, "loss": 0.0069, "step": 270810 }, { "epoch": 1.37, "learning_rate": 9.505173779457245e-05, "loss": 0.0078, "step": 270820 }, { "epoch": 1.37, "learning_rate": 9.504417010155843e-05, "loss": 0.0079, "step": 270830 }, { "epoch": 1.37, "learning_rate": 9.503660240854442e-05, "loss": 0.0082, "step": 270840 }, { "epoch": 1.37, "learning_rate": 9.50290347155304e-05, "loss": 0.0089, "step": 270850 }, { "epoch": 1.37, "learning_rate": 9.50214670225164e-05, "loss": 0.0098, "step": 270860 }, { "epoch": 1.37, "learning_rate": 9.50138993295024e-05, "loss": 0.006, "step": 270870 }, { "epoch": 1.37, "learning_rate": 9.500633163648838e-05, "loss": 0.0139, "step": 270880 }, { "epoch": 1.37, "learning_rate": 9.499876394347437e-05, "loss": 0.0072, "step": 270890 }, { "epoch": 1.37, "learning_rate": 9.499119625046037e-05, "loss": 0.0115, "step": 270900 }, { "epoch": 1.37, "learning_rate": 9.498362855744635e-05, "loss": 0.0098, "step": 270910 }, { "epoch": 1.37, "learning_rate": 9.497606086443234e-05, "loss": 0.0091, "step": 270920 }, { "epoch": 1.37, "learning_rate": 9.496849317141832e-05, "loss": 0.0077, "step": 270930 }, { "epoch": 1.37, "learning_rate": 9.496092547840432e-05, "loss": 0.007, "step": 270940 }, { "epoch": 1.37, "learning_rate": 9.495335778539031e-05, "loss": 0.0098, "step": 270950 }, { "epoch": 1.37, "learning_rate": 9.49457900923763e-05, "loss": 0.0077, "step": 270960 }, { "epoch": 1.37, "learning_rate": 9.493822239936229e-05, "loss": 0.0075, "step": 270970 }, { "epoch": 1.37, "learning_rate": 9.493065470634829e-05, "loss": 0.0089, "step": 270980 }, { "epoch": 1.37, "learning_rate": 9.492308701333427e-05, "loss": 0.0077, "step": 270990 }, { "epoch": 1.37, "learning_rate": 9.491551932032026e-05, "loss": 0.012, "step": 271000 }, { "epoch": 1.37, "eval_cer": 0.9144411440194001, "eval_loss": 0.0061246431432664394, "eval_runtime": 116.2526, "eval_samples_per_second": 17.204, "eval_steps_per_second": 4.301, "step": 271000 }, { "epoch": 1.37, "learning_rate": 9.490795162730624e-05, "loss": 0.0075, "step": 271010 }, { "epoch": 1.37, "learning_rate": 9.490038393429224e-05, "loss": 0.0075, "step": 271020 }, { "epoch": 1.37, "learning_rate": 9.489281624127823e-05, "loss": 0.0087, "step": 271030 }, { "epoch": 1.37, "learning_rate": 9.488524854826422e-05, "loss": 0.0078, "step": 271040 }, { "epoch": 1.37, "learning_rate": 9.487768085525021e-05, "loss": 0.0111, "step": 271050 }, { "epoch": 1.37, "learning_rate": 9.48701131622362e-05, "loss": 0.008, "step": 271060 }, { "epoch": 1.37, "learning_rate": 9.486254546922219e-05, "loss": 0.0117, "step": 271070 }, { "epoch": 1.37, "learning_rate": 9.485497777620818e-05, "loss": 0.005, "step": 271080 }, { "epoch": 1.37, "learning_rate": 9.484741008319416e-05, "loss": 0.009, "step": 271090 }, { "epoch": 1.37, "learning_rate": 9.483984239018016e-05, "loss": 0.0068, "step": 271100 }, { "epoch": 1.37, "learning_rate": 9.483227469716615e-05, "loss": 0.007, "step": 271110 }, { "epoch": 1.37, "learning_rate": 9.482470700415213e-05, "loss": 0.0074, "step": 271120 }, { "epoch": 1.37, "learning_rate": 9.481713931113813e-05, "loss": 0.0065, "step": 271130 }, { "epoch": 1.37, "learning_rate": 9.480957161812412e-05, "loss": 0.0068, "step": 271140 }, { "epoch": 1.37, "learning_rate": 9.48020039251101e-05, "loss": 0.0091, "step": 271150 }, { "epoch": 1.37, "learning_rate": 9.47944362320961e-05, "loss": 0.007, "step": 271160 }, { "epoch": 1.37, "learning_rate": 9.478686853908208e-05, "loss": 0.0083, "step": 271170 }, { "epoch": 1.37, "learning_rate": 9.477930084606806e-05, "loss": 0.009, "step": 271180 }, { "epoch": 1.37, "learning_rate": 9.477173315305406e-05, "loss": 0.0062, "step": 271190 }, { "epoch": 1.37, "learning_rate": 9.476416546004004e-05, "loss": 0.0092, "step": 271200 }, { "epoch": 1.37, "learning_rate": 9.475659776702604e-05, "loss": 0.0084, "step": 271210 }, { "epoch": 1.37, "learning_rate": 9.474903007401202e-05, "loss": 0.0113, "step": 271220 }, { "epoch": 1.37, "learning_rate": 9.474146238099801e-05, "loss": 0.0079, "step": 271230 }, { "epoch": 1.37, "learning_rate": 9.473389468798401e-05, "loss": 0.0083, "step": 271240 }, { "epoch": 1.37, "learning_rate": 9.472632699496999e-05, "loss": 0.0095, "step": 271250 }, { "epoch": 1.37, "learning_rate": 9.471875930195598e-05, "loss": 0.0082, "step": 271260 }, { "epoch": 1.37, "learning_rate": 9.471119160894198e-05, "loss": 0.009, "step": 271270 }, { "epoch": 1.37, "learning_rate": 9.470362391592796e-05, "loss": 0.0114, "step": 271280 }, { "epoch": 1.37, "learning_rate": 9.469605622291395e-05, "loss": 0.0084, "step": 271290 }, { "epoch": 1.37, "learning_rate": 9.468848852989994e-05, "loss": 0.007, "step": 271300 }, { "epoch": 1.37, "learning_rate": 9.468092083688593e-05, "loss": 0.0064, "step": 271310 }, { "epoch": 1.37, "learning_rate": 9.467335314387193e-05, "loss": 0.0104, "step": 271320 }, { "epoch": 1.37, "learning_rate": 9.466578545085791e-05, "loss": 0.0073, "step": 271330 }, { "epoch": 1.37, "learning_rate": 9.46582177578439e-05, "loss": 0.0086, "step": 271340 }, { "epoch": 1.37, "learning_rate": 9.46506500648299e-05, "loss": 0.0073, "step": 271350 }, { "epoch": 1.37, "learning_rate": 9.464308237181588e-05, "loss": 0.0072, "step": 271360 }, { "epoch": 1.37, "learning_rate": 9.463551467880187e-05, "loss": 0.0088, "step": 271370 }, { "epoch": 1.37, "learning_rate": 9.462794698578786e-05, "loss": 0.0065, "step": 271380 }, { "epoch": 1.37, "learning_rate": 9.462037929277385e-05, "loss": 0.0062, "step": 271390 }, { "epoch": 1.37, "learning_rate": 9.461281159975985e-05, "loss": 0.0115, "step": 271400 }, { "epoch": 1.37, "learning_rate": 9.460524390674583e-05, "loss": 0.0074, "step": 271410 }, { "epoch": 1.37, "learning_rate": 9.459767621373182e-05, "loss": 0.0073, "step": 271420 }, { "epoch": 1.37, "learning_rate": 9.459010852071782e-05, "loss": 0.01, "step": 271430 }, { "epoch": 1.37, "learning_rate": 9.45825408277038e-05, "loss": 0.0072, "step": 271440 }, { "epoch": 1.37, "learning_rate": 9.45749731346898e-05, "loss": 0.008, "step": 271450 }, { "epoch": 1.37, "learning_rate": 9.456740544167577e-05, "loss": 0.0094, "step": 271460 }, { "epoch": 1.37, "learning_rate": 9.455983774866177e-05, "loss": 0.0077, "step": 271470 }, { "epoch": 1.37, "learning_rate": 9.455227005564776e-05, "loss": 0.0082, "step": 271480 }, { "epoch": 1.37, "learning_rate": 9.454470236263375e-05, "loss": 0.0071, "step": 271490 }, { "epoch": 1.37, "learning_rate": 9.453713466961974e-05, "loss": 0.0099, "step": 271500 }, { "epoch": 1.37, "learning_rate": 9.452956697660574e-05, "loss": 0.0083, "step": 271510 }, { "epoch": 1.37, "learning_rate": 9.452199928359172e-05, "loss": 0.0072, "step": 271520 }, { "epoch": 1.37, "learning_rate": 9.451443159057771e-05, "loss": 0.0083, "step": 271530 }, { "epoch": 1.37, "learning_rate": 9.45068638975637e-05, "loss": 0.0101, "step": 271540 }, { "epoch": 1.37, "learning_rate": 9.449929620454969e-05, "loss": 0.0081, "step": 271550 }, { "epoch": 1.37, "learning_rate": 9.449172851153568e-05, "loss": 0.007, "step": 271560 }, { "epoch": 1.37, "learning_rate": 9.448416081852167e-05, "loss": 0.0088, "step": 271570 }, { "epoch": 1.37, "learning_rate": 9.447659312550766e-05, "loss": 0.0093, "step": 271580 }, { "epoch": 1.37, "learning_rate": 9.446902543249366e-05, "loss": 0.0113, "step": 271590 }, { "epoch": 1.37, "learning_rate": 9.446145773947964e-05, "loss": 0.0093, "step": 271600 }, { "epoch": 1.37, "learning_rate": 9.445389004646563e-05, "loss": 0.0099, "step": 271610 }, { "epoch": 1.37, "learning_rate": 9.444632235345161e-05, "loss": 0.0067, "step": 271620 }, { "epoch": 1.37, "learning_rate": 9.443875466043761e-05, "loss": 0.0093, "step": 271630 }, { "epoch": 1.37, "learning_rate": 9.44311869674236e-05, "loss": 0.0079, "step": 271640 }, { "epoch": 1.37, "learning_rate": 9.442361927440958e-05, "loss": 0.0093, "step": 271650 }, { "epoch": 1.37, "learning_rate": 9.441605158139558e-05, "loss": 0.0091, "step": 271660 }, { "epoch": 1.37, "learning_rate": 9.440848388838157e-05, "loss": 0.0064, "step": 271670 }, { "epoch": 1.37, "learning_rate": 9.440091619536756e-05, "loss": 0.0096, "step": 271680 }, { "epoch": 1.37, "learning_rate": 9.439334850235355e-05, "loss": 0.0059, "step": 271690 }, { "epoch": 1.37, "learning_rate": 9.438578080933955e-05, "loss": 0.0094, "step": 271700 }, { "epoch": 1.37, "learning_rate": 9.437821311632553e-05, "loss": 0.0067, "step": 271710 }, { "epoch": 1.37, "learning_rate": 9.437064542331152e-05, "loss": 0.0079, "step": 271720 }, { "epoch": 1.37, "learning_rate": 9.43630777302975e-05, "loss": 0.0076, "step": 271730 }, { "epoch": 1.37, "learning_rate": 9.43555100372835e-05, "loss": 0.0068, "step": 271740 }, { "epoch": 1.37, "learning_rate": 9.43479423442695e-05, "loss": 0.0091, "step": 271750 }, { "epoch": 1.37, "learning_rate": 9.434037465125548e-05, "loss": 0.0053, "step": 271760 }, { "epoch": 1.37, "learning_rate": 9.433280695824147e-05, "loss": 0.0085, "step": 271770 }, { "epoch": 1.37, "learning_rate": 9.432523926522747e-05, "loss": 0.0073, "step": 271780 }, { "epoch": 1.37, "learning_rate": 9.431767157221345e-05, "loss": 0.0087, "step": 271790 }, { "epoch": 1.37, "learning_rate": 9.431010387919944e-05, "loss": 0.0074, "step": 271800 }, { "epoch": 1.37, "learning_rate": 9.430253618618541e-05, "loss": 0.0061, "step": 271810 }, { "epoch": 1.37, "learning_rate": 9.42949684931714e-05, "loss": 0.0081, "step": 271820 }, { "epoch": 1.37, "learning_rate": 9.428740080015739e-05, "loss": 0.0084, "step": 271830 }, { "epoch": 1.37, "learning_rate": 9.427983310714338e-05, "loss": 0.0134, "step": 271840 }, { "epoch": 1.37, "learning_rate": 9.427226541412938e-05, "loss": 0.0075, "step": 271850 }, { "epoch": 1.37, "learning_rate": 9.426469772111536e-05, "loss": 0.0069, "step": 271860 }, { "epoch": 1.37, "learning_rate": 9.425713002810135e-05, "loss": 0.0091, "step": 271870 }, { "epoch": 1.37, "learning_rate": 9.424956233508735e-05, "loss": 0.0076, "step": 271880 }, { "epoch": 1.37, "learning_rate": 9.424199464207333e-05, "loss": 0.009, "step": 271890 }, { "epoch": 1.37, "learning_rate": 9.423442694905932e-05, "loss": 0.0088, "step": 271900 }, { "epoch": 1.37, "learning_rate": 9.42268592560453e-05, "loss": 0.008, "step": 271910 }, { "epoch": 1.37, "learning_rate": 9.42192915630313e-05, "loss": 0.0059, "step": 271920 }, { "epoch": 1.37, "learning_rate": 9.42117238700173e-05, "loss": 0.0109, "step": 271930 }, { "epoch": 1.37, "learning_rate": 9.420415617700328e-05, "loss": 0.0077, "step": 271940 }, { "epoch": 1.37, "learning_rate": 9.419658848398927e-05, "loss": 0.0073, "step": 271950 }, { "epoch": 1.37, "learning_rate": 9.418902079097527e-05, "loss": 0.0094, "step": 271960 }, { "epoch": 1.37, "learning_rate": 9.418145309796125e-05, "loss": 0.0062, "step": 271970 }, { "epoch": 1.37, "learning_rate": 9.417388540494724e-05, "loss": 0.0092, "step": 271980 }, { "epoch": 1.37, "learning_rate": 9.416631771193322e-05, "loss": 0.0069, "step": 271990 }, { "epoch": 1.37, "learning_rate": 9.415875001891922e-05, "loss": 0.0082, "step": 272000 }, { "epoch": 1.37, "eval_cer": 0.9144265880775191, "eval_loss": 0.006095241755247116, "eval_runtime": 116.2589, "eval_samples_per_second": 17.203, "eval_steps_per_second": 4.301, "step": 272000 }, { "epoch": 1.37, "learning_rate": 9.415118232590521e-05, "loss": 0.0073, "step": 272010 }, { "epoch": 1.37, "learning_rate": 9.41436146328912e-05, "loss": 0.0076, "step": 272020 }, { "epoch": 1.37, "learning_rate": 9.413604693987719e-05, "loss": 0.0072, "step": 272030 }, { "epoch": 1.37, "learning_rate": 9.412847924686319e-05, "loss": 0.007, "step": 272040 }, { "epoch": 1.37, "learning_rate": 9.412091155384917e-05, "loss": 0.0083, "step": 272050 }, { "epoch": 1.37, "learning_rate": 9.411334386083516e-05, "loss": 0.0082, "step": 272060 }, { "epoch": 1.37, "learning_rate": 9.410577616782114e-05, "loss": 0.0097, "step": 272070 }, { "epoch": 1.37, "learning_rate": 9.409820847480714e-05, "loss": 0.0093, "step": 272080 }, { "epoch": 1.37, "learning_rate": 9.409064078179313e-05, "loss": 0.0096, "step": 272090 }, { "epoch": 1.37, "learning_rate": 9.408307308877912e-05, "loss": 0.0073, "step": 272100 }, { "epoch": 1.37, "learning_rate": 9.407550539576511e-05, "loss": 0.0092, "step": 272110 }, { "epoch": 1.37, "learning_rate": 9.40679377027511e-05, "loss": 0.0085, "step": 272120 }, { "epoch": 1.37, "learning_rate": 9.406037000973709e-05, "loss": 0.0071, "step": 272130 }, { "epoch": 1.37, "learning_rate": 9.405280231672308e-05, "loss": 0.0066, "step": 272140 }, { "epoch": 1.37, "learning_rate": 9.404523462370908e-05, "loss": 0.0074, "step": 272150 }, { "epoch": 1.37, "learning_rate": 9.403766693069506e-05, "loss": 0.0072, "step": 272160 }, { "epoch": 1.37, "learning_rate": 9.403009923768105e-05, "loss": 0.0103, "step": 272170 }, { "epoch": 1.37, "learning_rate": 9.402253154466703e-05, "loss": 0.0086, "step": 272180 }, { "epoch": 1.37, "learning_rate": 9.401496385165303e-05, "loss": 0.0081, "step": 272190 }, { "epoch": 1.37, "learning_rate": 9.400739615863902e-05, "loss": 0.0071, "step": 272200 }, { "epoch": 1.37, "learning_rate": 9.3999828465625e-05, "loss": 0.0072, "step": 272210 }, { "epoch": 1.37, "learning_rate": 9.3992260772611e-05, "loss": 0.0096, "step": 272220 }, { "epoch": 1.37, "learning_rate": 9.3984693079597e-05, "loss": 0.0064, "step": 272230 }, { "epoch": 1.37, "learning_rate": 9.397712538658298e-05, "loss": 0.009, "step": 272240 }, { "epoch": 1.37, "learning_rate": 9.396955769356897e-05, "loss": 0.0081, "step": 272250 }, { "epoch": 1.37, "learning_rate": 9.396199000055495e-05, "loss": 0.0076, "step": 272260 }, { "epoch": 1.37, "learning_rate": 9.395442230754095e-05, "loss": 0.0074, "step": 272270 }, { "epoch": 1.37, "learning_rate": 9.394685461452694e-05, "loss": 0.0106, "step": 272280 }, { "epoch": 1.37, "learning_rate": 9.393928692151293e-05, "loss": 0.0071, "step": 272290 }, { "epoch": 1.37, "learning_rate": 9.393171922849892e-05, "loss": 0.0125, "step": 272300 }, { "epoch": 1.37, "learning_rate": 9.392415153548492e-05, "loss": 0.0077, "step": 272310 }, { "epoch": 1.37, "learning_rate": 9.39165838424709e-05, "loss": 0.0095, "step": 272320 }, { "epoch": 1.37, "learning_rate": 9.390901614945689e-05, "loss": 0.0074, "step": 272330 }, { "epoch": 1.37, "learning_rate": 9.390144845644287e-05, "loss": 0.007, "step": 272340 }, { "epoch": 1.37, "learning_rate": 9.389388076342887e-05, "loss": 0.0068, "step": 272350 }, { "epoch": 1.37, "learning_rate": 9.388631307041486e-05, "loss": 0.0066, "step": 272360 }, { "epoch": 1.37, "learning_rate": 9.387874537740084e-05, "loss": 0.0082, "step": 272370 }, { "epoch": 1.37, "learning_rate": 9.387117768438684e-05, "loss": 0.0056, "step": 272380 }, { "epoch": 1.37, "learning_rate": 9.386360999137283e-05, "loss": 0.008, "step": 272390 }, { "epoch": 1.37, "learning_rate": 9.385604229835882e-05, "loss": 0.0074, "step": 272400 }, { "epoch": 1.37, "learning_rate": 9.384847460534481e-05, "loss": 0.0077, "step": 272410 }, { "epoch": 1.37, "learning_rate": 9.384090691233079e-05, "loss": 0.0081, "step": 272420 }, { "epoch": 1.37, "learning_rate": 9.383333921931679e-05, "loss": 0.0084, "step": 272430 }, { "epoch": 1.37, "learning_rate": 9.382577152630276e-05, "loss": 0.0084, "step": 272440 }, { "epoch": 1.37, "learning_rate": 9.381820383328875e-05, "loss": 0.0067, "step": 272450 }, { "epoch": 1.37, "learning_rate": 9.381063614027475e-05, "loss": 0.0077, "step": 272460 }, { "epoch": 1.37, "learning_rate": 9.380306844726073e-05, "loss": 0.0076, "step": 272470 }, { "epoch": 1.37, "learning_rate": 9.379550075424672e-05, "loss": 0.01, "step": 272480 }, { "epoch": 1.37, "learning_rate": 9.378793306123272e-05, "loss": 0.0071, "step": 272490 }, { "epoch": 1.37, "learning_rate": 9.37803653682187e-05, "loss": 0.0084, "step": 272500 }, { "epoch": 1.37, "learning_rate": 9.37727976752047e-05, "loss": 0.011, "step": 272510 }, { "epoch": 1.37, "learning_rate": 9.376522998219067e-05, "loss": 0.007, "step": 272520 }, { "epoch": 1.37, "learning_rate": 9.375766228917667e-05, "loss": 0.0083, "step": 272530 }, { "epoch": 1.37, "learning_rate": 9.375009459616266e-05, "loss": 0.0069, "step": 272540 }, { "epoch": 1.38, "learning_rate": 9.374252690314865e-05, "loss": 0.0123, "step": 272550 }, { "epoch": 1.38, "learning_rate": 9.373495921013464e-05, "loss": 0.0067, "step": 272560 }, { "epoch": 1.38, "learning_rate": 9.372739151712064e-05, "loss": 0.01, "step": 272570 }, { "epoch": 1.38, "learning_rate": 9.371982382410662e-05, "loss": 0.0076, "step": 272580 }, { "epoch": 1.38, "learning_rate": 9.371225613109261e-05, "loss": 0.0083, "step": 272590 }, { "epoch": 1.38, "learning_rate": 9.370468843807861e-05, "loss": 0.0054, "step": 272600 }, { "epoch": 1.38, "learning_rate": 9.369712074506459e-05, "loss": 0.0102, "step": 272610 }, { "epoch": 1.38, "learning_rate": 9.368955305205058e-05, "loss": 0.0083, "step": 272620 }, { "epoch": 1.38, "learning_rate": 9.368198535903657e-05, "loss": 0.0091, "step": 272630 }, { "epoch": 1.38, "learning_rate": 9.367441766602256e-05, "loss": 0.0084, "step": 272640 }, { "epoch": 1.38, "learning_rate": 9.366684997300856e-05, "loss": 0.0076, "step": 272650 }, { "epoch": 1.38, "learning_rate": 9.365928227999454e-05, "loss": 0.0069, "step": 272660 }, { "epoch": 1.38, "learning_rate": 9.365171458698053e-05, "loss": 0.0089, "step": 272670 }, { "epoch": 1.38, "learning_rate": 9.364414689396653e-05, "loss": 0.0073, "step": 272680 }, { "epoch": 1.38, "learning_rate": 9.363657920095251e-05, "loss": 0.0088, "step": 272690 }, { "epoch": 1.38, "learning_rate": 9.36290115079385e-05, "loss": 0.0068, "step": 272700 }, { "epoch": 1.38, "learning_rate": 9.362144381492449e-05, "loss": 0.0073, "step": 272710 }, { "epoch": 1.38, "learning_rate": 9.361387612191048e-05, "loss": 0.01, "step": 272720 }, { "epoch": 1.38, "learning_rate": 9.360630842889648e-05, "loss": 0.0082, "step": 272730 }, { "epoch": 1.38, "learning_rate": 9.359874073588246e-05, "loss": 0.0086, "step": 272740 }, { "epoch": 1.38, "learning_rate": 9.359117304286845e-05, "loss": 0.0065, "step": 272750 }, { "epoch": 1.38, "learning_rate": 9.358360534985445e-05, "loss": 0.0087, "step": 272760 }, { "epoch": 1.38, "learning_rate": 9.357603765684043e-05, "loss": 0.0076, "step": 272770 }, { "epoch": 1.38, "learning_rate": 9.356846996382642e-05, "loss": 0.0071, "step": 272780 }, { "epoch": 1.38, "learning_rate": 9.35609022708124e-05, "loss": 0.007, "step": 272790 }, { "epoch": 1.38, "learning_rate": 9.35533345777984e-05, "loss": 0.0075, "step": 272800 }, { "epoch": 1.38, "learning_rate": 9.35457668847844e-05, "loss": 0.0081, "step": 272810 }, { "epoch": 1.38, "learning_rate": 9.353819919177038e-05, "loss": 0.0082, "step": 272820 }, { "epoch": 1.38, "learning_rate": 9.353063149875637e-05, "loss": 0.0053, "step": 272830 }, { "epoch": 1.38, "learning_rate": 9.352306380574237e-05, "loss": 0.0099, "step": 272840 }, { "epoch": 1.38, "learning_rate": 9.351549611272835e-05, "loss": 0.0074, "step": 272850 }, { "epoch": 1.38, "learning_rate": 9.350792841971434e-05, "loss": 0.0065, "step": 272860 }, { "epoch": 1.38, "learning_rate": 9.350036072670032e-05, "loss": 0.0073, "step": 272870 }, { "epoch": 1.38, "learning_rate": 9.349279303368632e-05, "loss": 0.006, "step": 272880 }, { "epoch": 1.38, "learning_rate": 9.348522534067231e-05, "loss": 0.0061, "step": 272890 }, { "epoch": 1.38, "learning_rate": 9.34776576476583e-05, "loss": 0.0102, "step": 272900 }, { "epoch": 1.38, "learning_rate": 9.347008995464429e-05, "loss": 0.0057, "step": 272910 }, { "epoch": 1.38, "learning_rate": 9.346252226163029e-05, "loss": 0.0077, "step": 272920 }, { "epoch": 1.38, "learning_rate": 9.345495456861627e-05, "loss": 0.0068, "step": 272930 }, { "epoch": 1.38, "learning_rate": 9.344738687560226e-05, "loss": 0.007, "step": 272940 }, { "epoch": 1.38, "learning_rate": 9.343981918258824e-05, "loss": 0.0072, "step": 272950 }, { "epoch": 1.38, "learning_rate": 9.343225148957424e-05, "loss": 0.0077, "step": 272960 }, { "epoch": 1.38, "learning_rate": 9.342468379656023e-05, "loss": 0.0072, "step": 272970 }, { "epoch": 1.38, "learning_rate": 9.341711610354621e-05, "loss": 0.0084, "step": 272980 }, { "epoch": 1.38, "learning_rate": 9.340954841053221e-05, "loss": 0.0084, "step": 272990 }, { "epoch": 1.38, "learning_rate": 9.34019807175182e-05, "loss": 0.008, "step": 273000 }, { "epoch": 1.38, "eval_cer": 0.9144256176813937, "eval_loss": 0.005903230048716068, "eval_runtime": 116.3214, "eval_samples_per_second": 17.194, "eval_steps_per_second": 4.298, "step": 273000 }, { "epoch": 1.38, "learning_rate": 9.339441302450419e-05, "loss": 0.0064, "step": 273010 }, { "epoch": 1.38, "learning_rate": 9.338684533149018e-05, "loss": 0.0092, "step": 273020 }, { "epoch": 1.38, "learning_rate": 9.337927763847616e-05, "loss": 0.0106, "step": 273030 }, { "epoch": 1.38, "learning_rate": 9.337170994546216e-05, "loss": 0.0071, "step": 273040 }, { "epoch": 1.38, "learning_rate": 9.336414225244815e-05, "loss": 0.0089, "step": 273050 }, { "epoch": 1.38, "learning_rate": 9.335657455943412e-05, "loss": 0.0078, "step": 273060 }, { "epoch": 1.38, "learning_rate": 9.334900686642012e-05, "loss": 0.0094, "step": 273070 }, { "epoch": 1.38, "learning_rate": 9.33414391734061e-05, "loss": 0.0096, "step": 273080 }, { "epoch": 1.38, "learning_rate": 9.333387148039209e-05, "loss": 0.0079, "step": 273090 }, { "epoch": 1.38, "learning_rate": 9.332630378737809e-05, "loss": 0.0095, "step": 273100 }, { "epoch": 1.38, "learning_rate": 9.331873609436407e-05, "loss": 0.0078, "step": 273110 }, { "epoch": 1.38, "learning_rate": 9.331116840135006e-05, "loss": 0.0068, "step": 273120 }, { "epoch": 1.38, "learning_rate": 9.330360070833606e-05, "loss": 0.0071, "step": 273130 }, { "epoch": 1.38, "learning_rate": 9.329603301532204e-05, "loss": 0.0081, "step": 273140 }, { "epoch": 1.38, "learning_rate": 9.328846532230803e-05, "loss": 0.0064, "step": 273150 }, { "epoch": 1.38, "learning_rate": 9.328089762929402e-05, "loss": 0.009, "step": 273160 }, { "epoch": 1.38, "learning_rate": 9.327332993628001e-05, "loss": 0.009, "step": 273170 }, { "epoch": 1.38, "learning_rate": 9.3265762243266e-05, "loss": 0.0086, "step": 273180 }, { "epoch": 1.38, "learning_rate": 9.325819455025199e-05, "loss": 0.0071, "step": 273190 }, { "epoch": 1.38, "learning_rate": 9.325062685723798e-05, "loss": 0.0079, "step": 273200 }, { "epoch": 1.38, "learning_rate": 9.324305916422398e-05, "loss": 0.0075, "step": 273210 }, { "epoch": 1.38, "learning_rate": 9.323549147120996e-05, "loss": 0.0088, "step": 273220 }, { "epoch": 1.38, "learning_rate": 9.322792377819595e-05, "loss": 0.0063, "step": 273230 }, { "epoch": 1.38, "learning_rate": 9.322035608518194e-05, "loss": 0.0077, "step": 273240 }, { "epoch": 1.38, "learning_rate": 9.321278839216793e-05, "loss": 0.0092, "step": 273250 }, { "epoch": 1.38, "learning_rate": 9.320522069915393e-05, "loss": 0.0082, "step": 273260 }, { "epoch": 1.38, "learning_rate": 9.31976530061399e-05, "loss": 0.0068, "step": 273270 }, { "epoch": 1.38, "learning_rate": 9.31900853131259e-05, "loss": 0.0071, "step": 273280 }, { "epoch": 1.38, "learning_rate": 9.31825176201119e-05, "loss": 0.0058, "step": 273290 }, { "epoch": 1.38, "learning_rate": 9.317494992709788e-05, "loss": 0.0077, "step": 273300 }, { "epoch": 1.38, "learning_rate": 9.316738223408387e-05, "loss": 0.0089, "step": 273310 }, { "epoch": 1.38, "learning_rate": 9.315981454106985e-05, "loss": 0.0059, "step": 273320 }, { "epoch": 1.38, "learning_rate": 9.315224684805585e-05, "loss": 0.0069, "step": 273330 }, { "epoch": 1.38, "learning_rate": 9.314467915504184e-05, "loss": 0.0072, "step": 273340 }, { "epoch": 1.38, "learning_rate": 9.313711146202783e-05, "loss": 0.0094, "step": 273350 }, { "epoch": 1.38, "learning_rate": 9.312954376901382e-05, "loss": 0.0096, "step": 273360 }, { "epoch": 1.38, "learning_rate": 9.312197607599982e-05, "loss": 0.0047, "step": 273370 }, { "epoch": 1.38, "learning_rate": 9.31144083829858e-05, "loss": 0.0077, "step": 273380 }, { "epoch": 1.38, "learning_rate": 9.310684068997179e-05, "loss": 0.0069, "step": 273390 }, { "epoch": 1.38, "learning_rate": 9.309927299695777e-05, "loss": 0.0081, "step": 273400 }, { "epoch": 1.38, "learning_rate": 9.309170530394377e-05, "loss": 0.0089, "step": 273410 }, { "epoch": 1.38, "learning_rate": 9.308413761092976e-05, "loss": 0.007, "step": 273420 }, { "epoch": 1.38, "learning_rate": 9.307656991791575e-05, "loss": 0.0067, "step": 273430 }, { "epoch": 1.38, "learning_rate": 9.306900222490174e-05, "loss": 0.0077, "step": 273440 }, { "epoch": 1.38, "learning_rate": 9.306143453188774e-05, "loss": 0.0075, "step": 273450 }, { "epoch": 1.38, "learning_rate": 9.305386683887372e-05, "loss": 0.0076, "step": 273460 }, { "epoch": 1.38, "learning_rate": 9.304629914585971e-05, "loss": 0.0085, "step": 273470 }, { "epoch": 1.38, "learning_rate": 9.303873145284569e-05, "loss": 0.0079, "step": 273480 }, { "epoch": 1.38, "learning_rate": 9.303116375983169e-05, "loss": 0.007, "step": 273490 }, { "epoch": 1.38, "learning_rate": 9.302359606681768e-05, "loss": 0.0117, "step": 273500 }, { "epoch": 1.38, "learning_rate": 9.301602837380366e-05, "loss": 0.0087, "step": 273510 }, { "epoch": 1.38, "learning_rate": 9.300846068078966e-05, "loss": 0.0091, "step": 273520 }, { "epoch": 1.38, "learning_rate": 9.300089298777565e-05, "loss": 0.0072, "step": 273530 }, { "epoch": 1.38, "learning_rate": 9.299332529476164e-05, "loss": 0.0056, "step": 273540 }, { "epoch": 1.38, "learning_rate": 9.298575760174763e-05, "loss": 0.0063, "step": 273550 }, { "epoch": 1.38, "learning_rate": 9.297818990873361e-05, "loss": 0.0069, "step": 273560 }, { "epoch": 1.38, "learning_rate": 9.297062221571961e-05, "loss": 0.0079, "step": 273570 }, { "epoch": 1.38, "learning_rate": 9.29630545227056e-05, "loss": 0.0087, "step": 273580 }, { "epoch": 1.38, "learning_rate": 9.295548682969158e-05, "loss": 0.0075, "step": 273590 }, { "epoch": 1.38, "learning_rate": 9.294791913667758e-05, "loss": 0.0083, "step": 273600 }, { "epoch": 1.38, "learning_rate": 9.294035144366357e-05, "loss": 0.0074, "step": 273610 }, { "epoch": 1.38, "learning_rate": 9.293278375064956e-05, "loss": 0.0096, "step": 273620 }, { "epoch": 1.38, "learning_rate": 9.292521605763555e-05, "loss": 0.0082, "step": 273630 }, { "epoch": 1.38, "learning_rate": 9.291764836462155e-05, "loss": 0.0089, "step": 273640 }, { "epoch": 1.38, "learning_rate": 9.291008067160753e-05, "loss": 0.0084, "step": 273650 }, { "epoch": 1.38, "learning_rate": 9.290251297859352e-05, "loss": 0.0084, "step": 273660 }, { "epoch": 1.38, "learning_rate": 9.28949452855795e-05, "loss": 0.0074, "step": 273670 }, { "epoch": 1.38, "learning_rate": 9.28873775925655e-05, "loss": 0.0092, "step": 273680 }, { "epoch": 1.38, "learning_rate": 9.287980989955147e-05, "loss": 0.0077, "step": 273690 }, { "epoch": 1.38, "learning_rate": 9.287224220653746e-05, "loss": 0.0074, "step": 273700 }, { "epoch": 1.38, "learning_rate": 9.286467451352346e-05, "loss": 0.0059, "step": 273710 }, { "epoch": 1.38, "learning_rate": 9.285710682050944e-05, "loss": 0.0105, "step": 273720 }, { "epoch": 1.38, "learning_rate": 9.284953912749543e-05, "loss": 0.0079, "step": 273730 }, { "epoch": 1.38, "learning_rate": 9.284197143448143e-05, "loss": 0.0083, "step": 273740 }, { "epoch": 1.38, "learning_rate": 9.283440374146741e-05, "loss": 0.0091, "step": 273750 }, { "epoch": 1.38, "learning_rate": 9.28268360484534e-05, "loss": 0.0071, "step": 273760 }, { "epoch": 1.38, "learning_rate": 9.281926835543939e-05, "loss": 0.0085, "step": 273770 }, { "epoch": 1.38, "learning_rate": 9.281170066242538e-05, "loss": 0.0087, "step": 273780 }, { "epoch": 1.38, "learning_rate": 9.280413296941138e-05, "loss": 0.0084, "step": 273790 }, { "epoch": 1.38, "learning_rate": 9.279656527639736e-05, "loss": 0.0074, "step": 273800 }, { "epoch": 1.38, "learning_rate": 9.278899758338335e-05, "loss": 0.0109, "step": 273810 }, { "epoch": 1.38, "learning_rate": 9.278142989036935e-05, "loss": 0.0089, "step": 273820 }, { "epoch": 1.38, "learning_rate": 9.277386219735533e-05, "loss": 0.0079, "step": 273830 }, { "epoch": 1.38, "learning_rate": 9.276629450434132e-05, "loss": 0.0094, "step": 273840 }, { "epoch": 1.38, "learning_rate": 9.27587268113273e-05, "loss": 0.0089, "step": 273850 }, { "epoch": 1.38, "learning_rate": 9.27511591183133e-05, "loss": 0.0064, "step": 273860 }, { "epoch": 1.38, "learning_rate": 9.27435914252993e-05, "loss": 0.0079, "step": 273870 }, { "epoch": 1.38, "learning_rate": 9.273602373228528e-05, "loss": 0.0088, "step": 273880 }, { "epoch": 1.38, "learning_rate": 9.272845603927127e-05, "loss": 0.0091, "step": 273890 }, { "epoch": 1.38, "learning_rate": 9.272088834625727e-05, "loss": 0.0071, "step": 273900 }, { "epoch": 1.38, "learning_rate": 9.271332065324325e-05, "loss": 0.0075, "step": 273910 }, { "epoch": 1.38, "learning_rate": 9.270575296022924e-05, "loss": 0.006, "step": 273920 }, { "epoch": 1.38, "learning_rate": 9.269818526721522e-05, "loss": 0.007, "step": 273930 }, { "epoch": 1.38, "learning_rate": 9.269061757420122e-05, "loss": 0.0062, "step": 273940 }, { "epoch": 1.38, "learning_rate": 9.268304988118721e-05, "loss": 0.0068, "step": 273950 }, { "epoch": 1.38, "learning_rate": 9.26754821881732e-05, "loss": 0.0064, "step": 273960 }, { "epoch": 1.38, "learning_rate": 9.266791449515919e-05, "loss": 0.0055, "step": 273970 }, { "epoch": 1.38, "learning_rate": 9.266034680214519e-05, "loss": 0.0063, "step": 273980 }, { "epoch": 1.38, "learning_rate": 9.265277910913117e-05, "loss": 0.0087, "step": 273990 }, { "epoch": 1.38, "learning_rate": 9.264521141611716e-05, "loss": 0.0063, "step": 274000 }, { "epoch": 1.38, "eval_cer": 0.9144392032271493, "eval_loss": 0.005893085617572069, "eval_runtime": 116.3239, "eval_samples_per_second": 17.193, "eval_steps_per_second": 4.298, "step": 274000 }, { "epoch": 1.38, "learning_rate": 9.263764372310314e-05, "loss": 0.005, "step": 274010 }, { "epoch": 1.38, "learning_rate": 9.263007603008914e-05, "loss": 0.0073, "step": 274020 }, { "epoch": 1.38, "learning_rate": 9.262250833707513e-05, "loss": 0.0083, "step": 274030 }, { "epoch": 1.38, "learning_rate": 9.261494064406111e-05, "loss": 0.0101, "step": 274040 }, { "epoch": 1.38, "learning_rate": 9.260737295104711e-05, "loss": 0.0059, "step": 274050 }, { "epoch": 1.38, "learning_rate": 9.25998052580331e-05, "loss": 0.0083, "step": 274060 }, { "epoch": 1.38, "learning_rate": 9.259223756501909e-05, "loss": 0.0075, "step": 274070 }, { "epoch": 1.38, "learning_rate": 9.258466987200508e-05, "loss": 0.0155, "step": 274080 }, { "epoch": 1.38, "learning_rate": 9.257710217899108e-05, "loss": 0.0085, "step": 274090 }, { "epoch": 1.38, "learning_rate": 9.256953448597706e-05, "loss": 0.0081, "step": 274100 }, { "epoch": 1.38, "learning_rate": 9.256196679296305e-05, "loss": 0.0065, "step": 274110 }, { "epoch": 1.38, "learning_rate": 9.255439909994903e-05, "loss": 0.01, "step": 274120 }, { "epoch": 1.38, "learning_rate": 9.254683140693503e-05, "loss": 0.0083, "step": 274130 }, { "epoch": 1.38, "learning_rate": 9.253926371392102e-05, "loss": 0.0069, "step": 274140 }, { "epoch": 1.38, "learning_rate": 9.2531696020907e-05, "loss": 0.0068, "step": 274150 }, { "epoch": 1.38, "learning_rate": 9.2524128327893e-05, "loss": 0.007, "step": 274160 }, { "epoch": 1.38, "learning_rate": 9.2516560634879e-05, "loss": 0.0096, "step": 274170 }, { "epoch": 1.38, "learning_rate": 9.250899294186498e-05, "loss": 0.0076, "step": 274180 }, { "epoch": 1.38, "learning_rate": 9.250142524885097e-05, "loss": 0.0089, "step": 274190 }, { "epoch": 1.38, "learning_rate": 9.249385755583695e-05, "loss": 0.0082, "step": 274200 }, { "epoch": 1.38, "learning_rate": 9.248628986282295e-05, "loss": 0.0074, "step": 274210 }, { "epoch": 1.38, "learning_rate": 9.247872216980894e-05, "loss": 0.0074, "step": 274220 }, { "epoch": 1.38, "learning_rate": 9.247115447679492e-05, "loss": 0.0075, "step": 274230 }, { "epoch": 1.38, "learning_rate": 9.246358678378092e-05, "loss": 0.0085, "step": 274240 }, { "epoch": 1.38, "learning_rate": 9.245601909076691e-05, "loss": 0.0087, "step": 274250 }, { "epoch": 1.38, "learning_rate": 9.24484513977529e-05, "loss": 0.0078, "step": 274260 }, { "epoch": 1.38, "learning_rate": 9.244088370473889e-05, "loss": 0.0086, "step": 274270 }, { "epoch": 1.38, "learning_rate": 9.243331601172487e-05, "loss": 0.0117, "step": 274280 }, { "epoch": 1.38, "learning_rate": 9.242574831871087e-05, "loss": 0.0084, "step": 274290 }, { "epoch": 1.38, "learning_rate": 9.241818062569686e-05, "loss": 0.0077, "step": 274300 }, { "epoch": 1.38, "learning_rate": 9.241061293268284e-05, "loss": 0.0069, "step": 274310 }, { "epoch": 1.38, "learning_rate": 9.240304523966883e-05, "loss": 0.0099, "step": 274320 }, { "epoch": 1.38, "learning_rate": 9.239547754665481e-05, "loss": 0.0086, "step": 274330 }, { "epoch": 1.38, "learning_rate": 9.23879098536408e-05, "loss": 0.0081, "step": 274340 }, { "epoch": 1.38, "learning_rate": 9.23803421606268e-05, "loss": 0.0064, "step": 274350 }, { "epoch": 1.38, "learning_rate": 9.237277446761278e-05, "loss": 0.011, "step": 274360 }, { "epoch": 1.38, "learning_rate": 9.236520677459877e-05, "loss": 0.0071, "step": 274370 }, { "epoch": 1.38, "learning_rate": 9.235763908158475e-05, "loss": 0.0081, "step": 274380 }, { "epoch": 1.38, "learning_rate": 9.235007138857075e-05, "loss": 0.0097, "step": 274390 }, { "epoch": 1.38, "learning_rate": 9.234250369555674e-05, "loss": 0.0087, "step": 274400 }, { "epoch": 1.38, "learning_rate": 9.233493600254273e-05, "loss": 0.006, "step": 274410 }, { "epoch": 1.38, "learning_rate": 9.232736830952872e-05, "loss": 0.0097, "step": 274420 }, { "epoch": 1.38, "learning_rate": 9.231980061651472e-05, "loss": 0.0087, "step": 274430 }, { "epoch": 1.38, "learning_rate": 9.23122329235007e-05, "loss": 0.0083, "step": 274440 }, { "epoch": 1.38, "learning_rate": 9.230466523048669e-05, "loss": 0.0096, "step": 274450 }, { "epoch": 1.38, "learning_rate": 9.229709753747267e-05, "loss": 0.0078, "step": 274460 }, { "epoch": 1.38, "learning_rate": 9.228952984445867e-05, "loss": 0.0051, "step": 274470 }, { "epoch": 1.38, "learning_rate": 9.228196215144466e-05, "loss": 0.0083, "step": 274480 }, { "epoch": 1.38, "learning_rate": 9.227439445843065e-05, "loss": 0.0075, "step": 274490 }, { "epoch": 1.38, "learning_rate": 9.226682676541664e-05, "loss": 0.0085, "step": 274500 }, { "epoch": 1.38, "learning_rate": 9.225925907240264e-05, "loss": 0.0061, "step": 274510 }, { "epoch": 1.38, "learning_rate": 9.225169137938862e-05, "loss": 0.0071, "step": 274520 }, { "epoch": 1.39, "learning_rate": 9.224412368637461e-05, "loss": 0.0066, "step": 274530 }, { "epoch": 1.39, "learning_rate": 9.223655599336061e-05, "loss": 0.0066, "step": 274540 }, { "epoch": 1.39, "learning_rate": 9.222898830034659e-05, "loss": 0.0072, "step": 274550 }, { "epoch": 1.39, "learning_rate": 9.222142060733258e-05, "loss": 0.0098, "step": 274560 }, { "epoch": 1.39, "learning_rate": 9.221385291431856e-05, "loss": 0.0073, "step": 274570 }, { "epoch": 1.39, "learning_rate": 9.220628522130456e-05, "loss": 0.0073, "step": 274580 }, { "epoch": 1.39, "learning_rate": 9.219871752829055e-05, "loss": 0.0083, "step": 274590 }, { "epoch": 1.39, "learning_rate": 9.219114983527654e-05, "loss": 0.007, "step": 274600 }, { "epoch": 1.39, "learning_rate": 9.218358214226253e-05, "loss": 0.009, "step": 274610 }, { "epoch": 1.39, "learning_rate": 9.217601444924853e-05, "loss": 0.0087, "step": 274620 }, { "epoch": 1.39, "learning_rate": 9.216844675623451e-05, "loss": 0.0063, "step": 274630 }, { "epoch": 1.39, "learning_rate": 9.21608790632205e-05, "loss": 0.0066, "step": 274640 }, { "epoch": 1.39, "learning_rate": 9.215331137020648e-05, "loss": 0.0061, "step": 274650 }, { "epoch": 1.39, "learning_rate": 9.214574367719248e-05, "loss": 0.0116, "step": 274660 }, { "epoch": 1.39, "learning_rate": 9.213817598417847e-05, "loss": 0.0063, "step": 274670 }, { "epoch": 1.39, "learning_rate": 9.213060829116446e-05, "loss": 0.0069, "step": 274680 }, { "epoch": 1.39, "learning_rate": 9.212304059815045e-05, "loss": 0.0085, "step": 274690 }, { "epoch": 1.39, "learning_rate": 9.211547290513645e-05, "loss": 0.0107, "step": 274700 }, { "epoch": 1.39, "learning_rate": 9.210790521212243e-05, "loss": 0.0087, "step": 274710 }, { "epoch": 1.39, "learning_rate": 9.210033751910842e-05, "loss": 0.0091, "step": 274720 }, { "epoch": 1.39, "learning_rate": 9.20927698260944e-05, "loss": 0.007, "step": 274730 }, { "epoch": 1.39, "learning_rate": 9.20852021330804e-05, "loss": 0.0074, "step": 274740 }, { "epoch": 1.39, "learning_rate": 9.20776344400664e-05, "loss": 0.0076, "step": 274750 }, { "epoch": 1.39, "learning_rate": 9.207006674705237e-05, "loss": 0.007, "step": 274760 }, { "epoch": 1.39, "learning_rate": 9.206249905403837e-05, "loss": 0.008, "step": 274770 }, { "epoch": 1.39, "learning_rate": 9.205493136102436e-05, "loss": 0.0072, "step": 274780 }, { "epoch": 1.39, "learning_rate": 9.204736366801035e-05, "loss": 0.008, "step": 274790 }, { "epoch": 1.39, "learning_rate": 9.203979597499634e-05, "loss": 0.0075, "step": 274800 }, { "epoch": 1.39, "learning_rate": 9.203222828198232e-05, "loss": 0.0087, "step": 274810 }, { "epoch": 1.39, "learning_rate": 9.202466058896832e-05, "loss": 0.0072, "step": 274820 }, { "epoch": 1.39, "learning_rate": 9.201709289595431e-05, "loss": 0.0056, "step": 274830 }, { "epoch": 1.39, "learning_rate": 9.20095252029403e-05, "loss": 0.0086, "step": 274840 }, { "epoch": 1.39, "learning_rate": 9.200195750992629e-05, "loss": 0.0078, "step": 274850 }, { "epoch": 1.39, "learning_rate": 9.199438981691228e-05, "loss": 0.0084, "step": 274860 }, { "epoch": 1.39, "learning_rate": 9.198682212389827e-05, "loss": 0.0085, "step": 274870 }, { "epoch": 1.39, "learning_rate": 9.197925443088426e-05, "loss": 0.008, "step": 274880 }, { "epoch": 1.39, "learning_rate": 9.197168673787024e-05, "loss": 0.0087, "step": 274890 }, { "epoch": 1.39, "learning_rate": 9.196411904485624e-05, "loss": 0.0097, "step": 274900 }, { "epoch": 1.39, "learning_rate": 9.195655135184223e-05, "loss": 0.0067, "step": 274910 }, { "epoch": 1.39, "learning_rate": 9.194898365882821e-05, "loss": 0.0095, "step": 274920 }, { "epoch": 1.39, "learning_rate": 9.194141596581421e-05, "loss": 0.0104, "step": 274930 }, { "epoch": 1.39, "learning_rate": 9.19338482728002e-05, "loss": 0.006, "step": 274940 }, { "epoch": 1.39, "learning_rate": 9.192628057978617e-05, "loss": 0.0074, "step": 274950 }, { "epoch": 1.39, "learning_rate": 9.191871288677217e-05, "loss": 0.0066, "step": 274960 }, { "epoch": 1.39, "learning_rate": 9.191114519375815e-05, "loss": 0.0074, "step": 274970 }, { "epoch": 1.39, "learning_rate": 9.190357750074414e-05, "loss": 0.0072, "step": 274980 }, { "epoch": 1.39, "learning_rate": 9.189600980773014e-05, "loss": 0.0077, "step": 274990 }, { "epoch": 1.39, "learning_rate": 9.188844211471612e-05, "loss": 0.0088, "step": 275000 }, { "epoch": 1.39, "eval_cer": 0.9144459960000272, "eval_loss": 0.005970404949039221, "eval_runtime": 116.7373, "eval_samples_per_second": 17.132, "eval_steps_per_second": 4.283, "step": 275000 }, { "epoch": 1.39, "learning_rate": 9.188087442170211e-05, "loss": 0.0106, "step": 275010 }, { "epoch": 1.39, "learning_rate": 9.18733067286881e-05, "loss": 0.0089, "step": 275020 }, { "epoch": 1.39, "learning_rate": 9.186573903567409e-05, "loss": 0.0075, "step": 275030 }, { "epoch": 1.39, "learning_rate": 9.185817134266009e-05, "loss": 0.0061, "step": 275040 }, { "epoch": 1.39, "learning_rate": 9.185060364964607e-05, "loss": 0.0067, "step": 275050 }, { "epoch": 1.39, "learning_rate": 9.184303595663206e-05, "loss": 0.0075, "step": 275060 }, { "epoch": 1.39, "learning_rate": 9.183546826361806e-05, "loss": 0.0072, "step": 275070 }, { "epoch": 1.39, "learning_rate": 9.182790057060404e-05, "loss": 0.0077, "step": 275080 }, { "epoch": 1.39, "learning_rate": 9.182033287759003e-05, "loss": 0.0062, "step": 275090 }, { "epoch": 1.39, "learning_rate": 9.181276518457601e-05, "loss": 0.0077, "step": 275100 }, { "epoch": 1.39, "learning_rate": 9.180519749156201e-05, "loss": 0.0062, "step": 275110 }, { "epoch": 1.39, "learning_rate": 9.1797629798548e-05, "loss": 0.0079, "step": 275120 }, { "epoch": 1.39, "learning_rate": 9.179006210553399e-05, "loss": 0.0115, "step": 275130 }, { "epoch": 1.39, "learning_rate": 9.178249441251998e-05, "loss": 0.0108, "step": 275140 }, { "epoch": 1.39, "learning_rate": 9.177492671950598e-05, "loss": 0.0073, "step": 275150 }, { "epoch": 1.39, "learning_rate": 9.176735902649196e-05, "loss": 0.0085, "step": 275160 }, { "epoch": 1.39, "learning_rate": 9.175979133347795e-05, "loss": 0.0111, "step": 275170 }, { "epoch": 1.39, "learning_rate": 9.175222364046393e-05, "loss": 0.0105, "step": 275180 }, { "epoch": 1.39, "learning_rate": 9.174465594744993e-05, "loss": 0.0073, "step": 275190 }, { "epoch": 1.39, "learning_rate": 9.173708825443592e-05, "loss": 0.0091, "step": 275200 }, { "epoch": 1.39, "learning_rate": 9.17295205614219e-05, "loss": 0.008, "step": 275210 }, { "epoch": 1.39, "learning_rate": 9.17219528684079e-05, "loss": 0.0051, "step": 275220 }, { "epoch": 1.39, "learning_rate": 9.17143851753939e-05, "loss": 0.0074, "step": 275230 }, { "epoch": 1.39, "learning_rate": 9.170681748237988e-05, "loss": 0.007, "step": 275240 }, { "epoch": 1.39, "learning_rate": 9.169924978936587e-05, "loss": 0.0097, "step": 275250 }, { "epoch": 1.39, "learning_rate": 9.169168209635185e-05, "loss": 0.0075, "step": 275260 }, { "epoch": 1.39, "learning_rate": 9.168411440333785e-05, "loss": 0.008, "step": 275270 }, { "epoch": 1.39, "learning_rate": 9.167654671032384e-05, "loss": 0.0059, "step": 275280 }, { "epoch": 1.39, "learning_rate": 9.166897901730982e-05, "loss": 0.0047, "step": 275290 }, { "epoch": 1.39, "learning_rate": 9.166141132429582e-05, "loss": 0.0081, "step": 275300 }, { "epoch": 1.39, "learning_rate": 9.165384363128181e-05, "loss": 0.0081, "step": 275310 }, { "epoch": 1.39, "learning_rate": 9.16462759382678e-05, "loss": 0.0101, "step": 275320 }, { "epoch": 1.39, "learning_rate": 9.163870824525379e-05, "loss": 0.0071, "step": 275330 }, { "epoch": 1.39, "learning_rate": 9.163114055223977e-05, "loss": 0.0074, "step": 275340 }, { "epoch": 1.39, "learning_rate": 9.162357285922577e-05, "loss": 0.009, "step": 275350 }, { "epoch": 1.39, "learning_rate": 9.161600516621176e-05, "loss": 0.0082, "step": 275360 }, { "epoch": 1.39, "learning_rate": 9.160843747319774e-05, "loss": 0.0074, "step": 275370 }, { "epoch": 1.39, "learning_rate": 9.160086978018374e-05, "loss": 0.0071, "step": 275380 }, { "epoch": 1.39, "learning_rate": 9.159330208716973e-05, "loss": 0.0094, "step": 275390 }, { "epoch": 1.39, "learning_rate": 9.158573439415572e-05, "loss": 0.0085, "step": 275400 }, { "epoch": 1.39, "learning_rate": 9.157816670114171e-05, "loss": 0.0069, "step": 275410 }, { "epoch": 1.39, "learning_rate": 9.157059900812769e-05, "loss": 0.0078, "step": 275420 }, { "epoch": 1.39, "learning_rate": 9.156303131511369e-05, "loss": 0.0096, "step": 275430 }, { "epoch": 1.39, "learning_rate": 9.155546362209968e-05, "loss": 0.0082, "step": 275440 }, { "epoch": 1.39, "learning_rate": 9.154789592908566e-05, "loss": 0.0068, "step": 275450 }, { "epoch": 1.39, "learning_rate": 9.154032823607166e-05, "loss": 0.007, "step": 275460 }, { "epoch": 1.39, "learning_rate": 9.153276054305765e-05, "loss": 0.0097, "step": 275470 }, { "epoch": 1.39, "learning_rate": 9.152519285004363e-05, "loss": 0.0078, "step": 275480 }, { "epoch": 1.39, "learning_rate": 9.151762515702963e-05, "loss": 0.0117, "step": 275490 }, { "epoch": 1.39, "learning_rate": 9.151005746401561e-05, "loss": 0.0085, "step": 275500 }, { "epoch": 1.39, "learning_rate": 9.15024897710016e-05, "loss": 0.0064, "step": 275510 }, { "epoch": 1.39, "learning_rate": 9.14949220779876e-05, "loss": 0.009, "step": 275520 }, { "epoch": 1.39, "learning_rate": 9.148735438497358e-05, "loss": 0.0085, "step": 275530 }, { "epoch": 1.39, "learning_rate": 9.147978669195958e-05, "loss": 0.0081, "step": 275540 }, { "epoch": 1.39, "learning_rate": 9.147221899894557e-05, "loss": 0.0066, "step": 275550 }, { "epoch": 1.39, "learning_rate": 9.146465130593155e-05, "loss": 0.0073, "step": 275560 }, { "epoch": 1.39, "learning_rate": 9.145708361291755e-05, "loss": 0.0081, "step": 275570 }, { "epoch": 1.39, "learning_rate": 9.144951591990352e-05, "loss": 0.009, "step": 275580 }, { "epoch": 1.39, "learning_rate": 9.144194822688951e-05, "loss": 0.0093, "step": 275590 }, { "epoch": 1.39, "learning_rate": 9.143438053387551e-05, "loss": 0.0077, "step": 275600 }, { "epoch": 1.39, "learning_rate": 9.142681284086149e-05, "loss": 0.0091, "step": 275610 }, { "epoch": 1.39, "learning_rate": 9.141924514784748e-05, "loss": 0.0078, "step": 275620 }, { "epoch": 1.39, "learning_rate": 9.141167745483347e-05, "loss": 0.006, "step": 275630 }, { "epoch": 1.39, "learning_rate": 9.140410976181946e-05, "loss": 0.0066, "step": 275640 }, { "epoch": 1.39, "learning_rate": 9.139654206880546e-05, "loss": 0.0082, "step": 275650 }, { "epoch": 1.39, "learning_rate": 9.138897437579144e-05, "loss": 0.0071, "step": 275660 }, { "epoch": 1.39, "learning_rate": 9.138140668277743e-05, "loss": 0.0107, "step": 275670 }, { "epoch": 1.39, "learning_rate": 9.137383898976343e-05, "loss": 0.0103, "step": 275680 }, { "epoch": 1.39, "learning_rate": 9.136627129674941e-05, "loss": 0.0091, "step": 275690 }, { "epoch": 1.39, "learning_rate": 9.13587036037354e-05, "loss": 0.0083, "step": 275700 }, { "epoch": 1.39, "learning_rate": 9.135113591072138e-05, "loss": 0.0082, "step": 275710 }, { "epoch": 1.39, "learning_rate": 9.134356821770738e-05, "loss": 0.0095, "step": 275720 }, { "epoch": 1.39, "learning_rate": 9.133600052469337e-05, "loss": 0.0103, "step": 275730 }, { "epoch": 1.39, "learning_rate": 9.132843283167936e-05, "loss": 0.0112, "step": 275740 }, { "epoch": 1.39, "learning_rate": 9.132086513866535e-05, "loss": 0.0059, "step": 275750 }, { "epoch": 1.39, "learning_rate": 9.131329744565135e-05, "loss": 0.01, "step": 275760 }, { "epoch": 1.39, "learning_rate": 9.130572975263733e-05, "loss": 0.0091, "step": 275770 }, { "epoch": 1.39, "learning_rate": 9.129816205962332e-05, "loss": 0.0085, "step": 275780 }, { "epoch": 1.39, "learning_rate": 9.12905943666093e-05, "loss": 0.007, "step": 275790 }, { "epoch": 1.39, "learning_rate": 9.12830266735953e-05, "loss": 0.0058, "step": 275800 }, { "epoch": 1.39, "learning_rate": 9.12754589805813e-05, "loss": 0.0095, "step": 275810 }, { "epoch": 1.39, "learning_rate": 9.126789128756728e-05, "loss": 0.0068, "step": 275820 }, { "epoch": 1.39, "learning_rate": 9.126032359455327e-05, "loss": 0.0052, "step": 275830 }, { "epoch": 1.39, "learning_rate": 9.125275590153927e-05, "loss": 0.0089, "step": 275840 }, { "epoch": 1.39, "learning_rate": 9.124518820852525e-05, "loss": 0.007, "step": 275850 }, { "epoch": 1.39, "learning_rate": 9.123762051551124e-05, "loss": 0.0087, "step": 275860 }, { "epoch": 1.39, "learning_rate": 9.123005282249722e-05, "loss": 0.0083, "step": 275870 }, { "epoch": 1.39, "learning_rate": 9.122248512948322e-05, "loss": 0.0081, "step": 275880 }, { "epoch": 1.39, "learning_rate": 9.121491743646921e-05, "loss": 0.0067, "step": 275890 }, { "epoch": 1.39, "learning_rate": 9.12073497434552e-05, "loss": 0.0093, "step": 275900 }, { "epoch": 1.39, "learning_rate": 9.119978205044119e-05, "loss": 0.006, "step": 275910 }, { "epoch": 1.39, "learning_rate": 9.119221435742718e-05, "loss": 0.0068, "step": 275920 }, { "epoch": 1.39, "learning_rate": 9.118464666441317e-05, "loss": 0.008, "step": 275930 }, { "epoch": 1.39, "learning_rate": 9.117707897139916e-05, "loss": 0.0077, "step": 275940 }, { "epoch": 1.39, "learning_rate": 9.116951127838514e-05, "loss": 0.0091, "step": 275950 }, { "epoch": 1.39, "learning_rate": 9.116194358537114e-05, "loss": 0.0095, "step": 275960 }, { "epoch": 1.39, "learning_rate": 9.115437589235713e-05, "loss": 0.0101, "step": 275970 }, { "epoch": 1.39, "learning_rate": 9.114680819934311e-05, "loss": 0.0085, "step": 275980 }, { "epoch": 1.39, "learning_rate": 9.113924050632911e-05, "loss": 0.007, "step": 275990 }, { "epoch": 1.39, "learning_rate": 9.11316728133151e-05, "loss": 0.0081, "step": 276000 }, { "epoch": 1.39, "eval_cer": 0.9144159137201398, "eval_loss": 0.006024388130754232, "eval_runtime": 116.144, "eval_samples_per_second": 17.22, "eval_steps_per_second": 4.305, "step": 276000 }, { "epoch": 1.39, "learning_rate": 9.112410512030109e-05, "loss": 0.0067, "step": 276010 }, { "epoch": 1.39, "learning_rate": 9.111653742728708e-05, "loss": 0.008, "step": 276020 }, { "epoch": 1.39, "learning_rate": 9.110896973427308e-05, "loss": 0.0073, "step": 276030 }, { "epoch": 1.39, "learning_rate": 9.110140204125906e-05, "loss": 0.0059, "step": 276040 }, { "epoch": 1.39, "learning_rate": 9.109383434824505e-05, "loss": 0.0076, "step": 276050 }, { "epoch": 1.39, "learning_rate": 9.108626665523103e-05, "loss": 0.0077, "step": 276060 }, { "epoch": 1.39, "learning_rate": 9.107869896221703e-05, "loss": 0.0095, "step": 276070 }, { "epoch": 1.39, "learning_rate": 9.107113126920302e-05, "loss": 0.008, "step": 276080 }, { "epoch": 1.39, "learning_rate": 9.1063563576189e-05, "loss": 0.0068, "step": 276090 }, { "epoch": 1.39, "learning_rate": 9.1055995883175e-05, "loss": 0.009, "step": 276100 }, { "epoch": 1.39, "learning_rate": 9.1048428190161e-05, "loss": 0.0076, "step": 276110 }, { "epoch": 1.39, "learning_rate": 9.104086049714698e-05, "loss": 0.008, "step": 276120 }, { "epoch": 1.39, "learning_rate": 9.103329280413297e-05, "loss": 0.0088, "step": 276130 }, { "epoch": 1.39, "learning_rate": 9.102572511111895e-05, "loss": 0.0075, "step": 276140 }, { "epoch": 1.39, "learning_rate": 9.101815741810495e-05, "loss": 0.0066, "step": 276150 }, { "epoch": 1.39, "learning_rate": 9.101058972509094e-05, "loss": 0.0072, "step": 276160 }, { "epoch": 1.39, "learning_rate": 9.100302203207692e-05, "loss": 0.0086, "step": 276170 }, { "epoch": 1.39, "learning_rate": 9.099545433906292e-05, "loss": 0.0081, "step": 276180 }, { "epoch": 1.39, "learning_rate": 9.098788664604891e-05, "loss": 0.0111, "step": 276190 }, { "epoch": 1.39, "learning_rate": 9.09803189530349e-05, "loss": 0.0076, "step": 276200 }, { "epoch": 1.39, "learning_rate": 9.097275126002088e-05, "loss": 0.0082, "step": 276210 }, { "epoch": 1.39, "learning_rate": 9.096518356700686e-05, "loss": 0.0066, "step": 276220 }, { "epoch": 1.39, "learning_rate": 9.095761587399285e-05, "loss": 0.006, "step": 276230 }, { "epoch": 1.39, "learning_rate": 9.095004818097883e-05, "loss": 0.008, "step": 276240 }, { "epoch": 1.39, "learning_rate": 9.094248048796483e-05, "loss": 0.0087, "step": 276250 }, { "epoch": 1.39, "learning_rate": 9.093491279495082e-05, "loss": 0.0075, "step": 276260 }, { "epoch": 1.39, "learning_rate": 9.09273451019368e-05, "loss": 0.0082, "step": 276270 }, { "epoch": 1.39, "learning_rate": 9.09197774089228e-05, "loss": 0.008, "step": 276280 }, { "epoch": 1.39, "learning_rate": 9.09122097159088e-05, "loss": 0.0081, "step": 276290 }, { "epoch": 1.39, "learning_rate": 9.090464202289478e-05, "loss": 0.0065, "step": 276300 }, { "epoch": 1.39, "learning_rate": 9.089707432988077e-05, "loss": 0.0072, "step": 276310 }, { "epoch": 1.39, "learning_rate": 9.088950663686675e-05, "loss": 0.0103, "step": 276320 }, { "epoch": 1.39, "learning_rate": 9.088193894385275e-05, "loss": 0.0092, "step": 276330 }, { "epoch": 1.39, "learning_rate": 9.087437125083874e-05, "loss": 0.0075, "step": 276340 }, { "epoch": 1.39, "learning_rate": 9.086680355782473e-05, "loss": 0.0072, "step": 276350 }, { "epoch": 1.39, "learning_rate": 9.085923586481072e-05, "loss": 0.0077, "step": 276360 }, { "epoch": 1.39, "learning_rate": 9.085166817179672e-05, "loss": 0.0074, "step": 276370 }, { "epoch": 1.39, "learning_rate": 9.08441004787827e-05, "loss": 0.0067, "step": 276380 }, { "epoch": 1.39, "learning_rate": 9.083653278576869e-05, "loss": 0.0082, "step": 276390 }, { "epoch": 1.39, "learning_rate": 9.082896509275467e-05, "loss": 0.008, "step": 276400 }, { "epoch": 1.39, "learning_rate": 9.082139739974067e-05, "loss": 0.0094, "step": 276410 }, { "epoch": 1.39, "learning_rate": 9.081382970672666e-05, "loss": 0.0074, "step": 276420 }, { "epoch": 1.39, "learning_rate": 9.080626201371264e-05, "loss": 0.007, "step": 276430 }, { "epoch": 1.39, "learning_rate": 9.079869432069864e-05, "loss": 0.009, "step": 276440 }, { "epoch": 1.39, "learning_rate": 9.079112662768463e-05, "loss": 0.0074, "step": 276450 }, { "epoch": 1.39, "learning_rate": 9.078355893467062e-05, "loss": 0.0067, "step": 276460 }, { "epoch": 1.39, "learning_rate": 9.077599124165661e-05, "loss": 0.0085, "step": 276470 }, { "epoch": 1.39, "learning_rate": 9.07684235486426e-05, "loss": 0.0057, "step": 276480 }, { "epoch": 1.39, "learning_rate": 9.076085585562859e-05, "loss": 0.0088, "step": 276490 }, { "epoch": 1.39, "learning_rate": 9.075328816261458e-05, "loss": 0.0063, "step": 276500 }, { "epoch": 1.4, "learning_rate": 9.074572046960056e-05, "loss": 0.0112, "step": 276510 }, { "epoch": 1.4, "learning_rate": 9.073815277658656e-05, "loss": 0.0102, "step": 276520 }, { "epoch": 1.4, "learning_rate": 9.073058508357255e-05, "loss": 0.0064, "step": 276530 }, { "epoch": 1.4, "learning_rate": 9.072301739055854e-05, "loss": 0.0093, "step": 276540 }, { "epoch": 1.4, "learning_rate": 9.071544969754453e-05, "loss": 0.0077, "step": 276550 }, { "epoch": 1.4, "learning_rate": 9.070788200453053e-05, "loss": 0.0068, "step": 276560 }, { "epoch": 1.4, "learning_rate": 9.07003143115165e-05, "loss": 0.0073, "step": 276570 }, { "epoch": 1.4, "learning_rate": 9.06927466185025e-05, "loss": 0.0084, "step": 276580 }, { "epoch": 1.4, "learning_rate": 9.068517892548848e-05, "loss": 0.006, "step": 276590 }, { "epoch": 1.4, "learning_rate": 9.067761123247448e-05, "loss": 0.0082, "step": 276600 }, { "epoch": 1.4, "learning_rate": 9.067004353946047e-05, "loss": 0.0066, "step": 276610 }, { "epoch": 1.4, "learning_rate": 9.066247584644645e-05, "loss": 0.0082, "step": 276620 }, { "epoch": 1.4, "learning_rate": 9.065490815343245e-05, "loss": 0.0056, "step": 276630 }, { "epoch": 1.4, "learning_rate": 9.064734046041844e-05, "loss": 0.0073, "step": 276640 }, { "epoch": 1.4, "learning_rate": 9.063977276740443e-05, "loss": 0.0062, "step": 276650 }, { "epoch": 1.4, "learning_rate": 9.063220507439042e-05, "loss": 0.0068, "step": 276660 }, { "epoch": 1.4, "learning_rate": 9.06246373813764e-05, "loss": 0.0082, "step": 276670 }, { "epoch": 1.4, "learning_rate": 9.06170696883624e-05, "loss": 0.0087, "step": 276680 }, { "epoch": 1.4, "learning_rate": 9.060950199534839e-05, "loss": 0.0092, "step": 276690 }, { "epoch": 1.4, "learning_rate": 9.060193430233437e-05, "loss": 0.0095, "step": 276700 }, { "epoch": 1.4, "learning_rate": 9.059436660932037e-05, "loss": 0.0076, "step": 276710 }, { "epoch": 1.4, "learning_rate": 9.058679891630636e-05, "loss": 0.0083, "step": 276720 }, { "epoch": 1.4, "learning_rate": 9.057923122329235e-05, "loss": 0.0076, "step": 276730 }, { "epoch": 1.4, "learning_rate": 9.057166353027834e-05, "loss": 0.0095, "step": 276740 }, { "epoch": 1.4, "learning_rate": 9.056409583726432e-05, "loss": 0.0075, "step": 276750 }, { "epoch": 1.4, "learning_rate": 9.055652814425032e-05, "loss": 0.009, "step": 276760 }, { "epoch": 1.4, "learning_rate": 9.054896045123631e-05, "loss": 0.009, "step": 276770 }, { "epoch": 1.4, "learning_rate": 9.054139275822229e-05, "loss": 0.0081, "step": 276780 }, { "epoch": 1.4, "learning_rate": 9.053382506520829e-05, "loss": 0.0057, "step": 276790 }, { "epoch": 1.4, "learning_rate": 9.052625737219428e-05, "loss": 0.0069, "step": 276800 }, { "epoch": 1.4, "learning_rate": 9.051868967918026e-05, "loss": 0.008, "step": 276810 }, { "epoch": 1.4, "learning_rate": 9.051112198616626e-05, "loss": 0.0081, "step": 276820 }, { "epoch": 1.4, "learning_rate": 9.050355429315223e-05, "loss": 0.0084, "step": 276830 }, { "epoch": 1.4, "learning_rate": 9.049598660013822e-05, "loss": 0.0085, "step": 276840 }, { "epoch": 1.4, "learning_rate": 9.04884189071242e-05, "loss": 0.0064, "step": 276850 }, { "epoch": 1.4, "learning_rate": 9.04808512141102e-05, "loss": 0.0084, "step": 276860 }, { "epoch": 1.4, "learning_rate": 9.04732835210962e-05, "loss": 0.0075, "step": 276870 }, { "epoch": 1.4, "learning_rate": 9.046571582808218e-05, "loss": 0.0063, "step": 276880 }, { "epoch": 1.4, "learning_rate": 9.045814813506817e-05, "loss": 0.0092, "step": 276890 }, { "epoch": 1.4, "learning_rate": 9.045058044205417e-05, "loss": 0.0066, "step": 276900 }, { "epoch": 1.4, "learning_rate": 9.044301274904015e-05, "loss": 0.0101, "step": 276910 }, { "epoch": 1.4, "learning_rate": 9.043544505602614e-05, "loss": 0.0095, "step": 276920 }, { "epoch": 1.4, "learning_rate": 9.042787736301214e-05, "loss": 0.0066, "step": 276930 }, { "epoch": 1.4, "learning_rate": 9.042030966999812e-05, "loss": 0.0063, "step": 276940 }, { "epoch": 1.4, "learning_rate": 9.041274197698411e-05, "loss": 0.0063, "step": 276950 }, { "epoch": 1.4, "learning_rate": 9.04051742839701e-05, "loss": 0.0074, "step": 276960 }, { "epoch": 1.4, "learning_rate": 9.039760659095609e-05, "loss": 0.0064, "step": 276970 }, { "epoch": 1.4, "learning_rate": 9.039003889794208e-05, "loss": 0.0076, "step": 276980 }, { "epoch": 1.4, "learning_rate": 9.038247120492807e-05, "loss": 0.0109, "step": 276990 }, { "epoch": 1.4, "learning_rate": 9.037490351191406e-05, "loss": 0.008, "step": 277000 }, { "epoch": 1.4, "eval_cer": 0.9144246472852683, "eval_loss": 0.0058305272832512856, "eval_runtime": 115.9259, "eval_samples_per_second": 17.252, "eval_steps_per_second": 4.313, "step": 277000 }, { "epoch": 1.4, "learning_rate": 9.036733581890006e-05, "loss": 0.0067, "step": 277010 }, { "epoch": 1.4, "learning_rate": 9.035976812588604e-05, "loss": 0.0072, "step": 277020 }, { "epoch": 1.4, "learning_rate": 9.035220043287203e-05, "loss": 0.0073, "step": 277030 }, { "epoch": 1.4, "learning_rate": 9.034463273985801e-05, "loss": 0.0185, "step": 277040 }, { "epoch": 1.4, "learning_rate": 9.033706504684401e-05, "loss": 0.0088, "step": 277050 }, { "epoch": 1.4, "learning_rate": 9.032949735383e-05, "loss": 0.0105, "step": 277060 }, { "epoch": 1.4, "learning_rate": 9.032192966081599e-05, "loss": 0.0067, "step": 277070 }, { "epoch": 1.4, "learning_rate": 9.031436196780198e-05, "loss": 0.0099, "step": 277080 }, { "epoch": 1.4, "learning_rate": 9.030679427478798e-05, "loss": 0.0111, "step": 277090 }, { "epoch": 1.4, "learning_rate": 9.029922658177396e-05, "loss": 0.0069, "step": 277100 }, { "epoch": 1.4, "learning_rate": 9.029165888875995e-05, "loss": 0.0076, "step": 277110 }, { "epoch": 1.4, "learning_rate": 9.028409119574593e-05, "loss": 0.0072, "step": 277120 }, { "epoch": 1.4, "learning_rate": 9.027652350273193e-05, "loss": 0.0106, "step": 277130 }, { "epoch": 1.4, "learning_rate": 9.026895580971792e-05, "loss": 0.0064, "step": 277140 }, { "epoch": 1.4, "learning_rate": 9.02613881167039e-05, "loss": 0.0084, "step": 277150 }, { "epoch": 1.4, "learning_rate": 9.02538204236899e-05, "loss": 0.0092, "step": 277160 }, { "epoch": 1.4, "learning_rate": 9.02462527306759e-05, "loss": 0.0072, "step": 277170 }, { "epoch": 1.4, "learning_rate": 9.023868503766188e-05, "loss": 0.0079, "step": 277180 }, { "epoch": 1.4, "learning_rate": 9.023111734464787e-05, "loss": 0.0056, "step": 277190 }, { "epoch": 1.4, "learning_rate": 9.022354965163385e-05, "loss": 0.0073, "step": 277200 }, { "epoch": 1.4, "learning_rate": 9.021598195861985e-05, "loss": 0.0073, "step": 277210 }, { "epoch": 1.4, "learning_rate": 9.020841426560584e-05, "loss": 0.0074, "step": 277220 }, { "epoch": 1.4, "learning_rate": 9.020084657259182e-05, "loss": 0.0068, "step": 277230 }, { "epoch": 1.4, "learning_rate": 9.019327887957782e-05, "loss": 0.0076, "step": 277240 }, { "epoch": 1.4, "learning_rate": 9.018571118656381e-05, "loss": 0.0081, "step": 277250 }, { "epoch": 1.4, "learning_rate": 9.01781434935498e-05, "loss": 0.0079, "step": 277260 }, { "epoch": 1.4, "learning_rate": 9.017057580053579e-05, "loss": 0.0062, "step": 277270 }, { "epoch": 1.4, "learning_rate": 9.016300810752177e-05, "loss": 0.0101, "step": 277280 }, { "epoch": 1.4, "learning_rate": 9.015544041450777e-05, "loss": 0.0067, "step": 277290 }, { "epoch": 1.4, "learning_rate": 9.014787272149376e-05, "loss": 0.0109, "step": 277300 }, { "epoch": 1.4, "learning_rate": 9.014030502847974e-05, "loss": 0.008, "step": 277310 }, { "epoch": 1.4, "learning_rate": 9.013273733546574e-05, "loss": 0.008, "step": 277320 }, { "epoch": 1.4, "learning_rate": 9.012516964245173e-05, "loss": 0.0079, "step": 277330 }, { "epoch": 1.4, "learning_rate": 9.011760194943771e-05, "loss": 0.0073, "step": 277340 }, { "epoch": 1.4, "learning_rate": 9.011003425642371e-05, "loss": 0.0077, "step": 277350 }, { "epoch": 1.4, "learning_rate": 9.010246656340969e-05, "loss": 0.0074, "step": 277360 }, { "epoch": 1.4, "learning_rate": 9.009489887039569e-05, "loss": 0.0094, "step": 277370 }, { "epoch": 1.4, "learning_rate": 9.008733117738168e-05, "loss": 0.0087, "step": 277380 }, { "epoch": 1.4, "learning_rate": 9.007976348436766e-05, "loss": 0.0059, "step": 277390 }, { "epoch": 1.4, "learning_rate": 9.007219579135366e-05, "loss": 0.0082, "step": 277400 }, { "epoch": 1.4, "learning_rate": 9.006462809833965e-05, "loss": 0.0079, "step": 277410 }, { "epoch": 1.4, "learning_rate": 9.005706040532563e-05, "loss": 0.0069, "step": 277420 }, { "epoch": 1.4, "learning_rate": 9.004949271231163e-05, "loss": 0.0078, "step": 277430 }, { "epoch": 1.4, "learning_rate": 9.004192501929761e-05, "loss": 0.0102, "step": 277440 }, { "epoch": 1.4, "learning_rate": 9.00343573262836e-05, "loss": 0.0081, "step": 277450 }, { "epoch": 1.4, "learning_rate": 9.002678963326959e-05, "loss": 0.0075, "step": 277460 }, { "epoch": 1.4, "learning_rate": 9.001922194025557e-05, "loss": 0.0065, "step": 277470 }, { "epoch": 1.4, "learning_rate": 9.001165424724156e-05, "loss": 0.0087, "step": 277480 }, { "epoch": 1.4, "learning_rate": 9.000408655422754e-05, "loss": 0.008, "step": 277490 }, { "epoch": 1.4, "learning_rate": 8.999651886121354e-05, "loss": 0.0082, "step": 277500 }, { "epoch": 1.4, "learning_rate": 8.998895116819953e-05, "loss": 0.0089, "step": 277510 }, { "epoch": 1.4, "learning_rate": 8.998138347518552e-05, "loss": 0.0079, "step": 277520 }, { "epoch": 1.4, "learning_rate": 8.997381578217151e-05, "loss": 0.0101, "step": 277530 }, { "epoch": 1.4, "learning_rate": 8.99662480891575e-05, "loss": 0.0087, "step": 277540 }, { "epoch": 1.4, "learning_rate": 8.995868039614349e-05, "loss": 0.0067, "step": 277550 }, { "epoch": 1.4, "learning_rate": 8.995111270312948e-05, "loss": 0.009, "step": 277560 }, { "epoch": 1.4, "learning_rate": 8.994354501011546e-05, "loss": 0.0071, "step": 277570 }, { "epoch": 1.4, "learning_rate": 8.993597731710146e-05, "loss": 0.0085, "step": 277580 }, { "epoch": 1.4, "learning_rate": 8.992840962408745e-05, "loss": 0.0066, "step": 277590 }, { "epoch": 1.4, "learning_rate": 8.992084193107344e-05, "loss": 0.0073, "step": 277600 }, { "epoch": 1.4, "learning_rate": 8.991327423805943e-05, "loss": 0.0068, "step": 277610 }, { "epoch": 1.4, "learning_rate": 8.990570654504543e-05, "loss": 0.0081, "step": 277620 }, { "epoch": 1.4, "learning_rate": 8.989813885203141e-05, "loss": 0.0061, "step": 277630 }, { "epoch": 1.4, "learning_rate": 8.98905711590174e-05, "loss": 0.0068, "step": 277640 }, { "epoch": 1.4, "learning_rate": 8.988300346600338e-05, "loss": 0.0055, "step": 277650 }, { "epoch": 1.4, "learning_rate": 8.987543577298938e-05, "loss": 0.0089, "step": 277660 }, { "epoch": 1.4, "learning_rate": 8.986786807997537e-05, "loss": 0.007, "step": 277670 }, { "epoch": 1.4, "learning_rate": 8.986030038696135e-05, "loss": 0.0072, "step": 277680 }, { "epoch": 1.4, "learning_rate": 8.985273269394735e-05, "loss": 0.0063, "step": 277690 }, { "epoch": 1.4, "learning_rate": 8.984516500093334e-05, "loss": 0.0089, "step": 277700 }, { "epoch": 1.4, "learning_rate": 8.983759730791933e-05, "loss": 0.0078, "step": 277710 }, { "epoch": 1.4, "learning_rate": 8.983002961490532e-05, "loss": 0.0084, "step": 277720 }, { "epoch": 1.4, "learning_rate": 8.98224619218913e-05, "loss": 0.0073, "step": 277730 }, { "epoch": 1.4, "learning_rate": 8.98148942288773e-05, "loss": 0.0081, "step": 277740 }, { "epoch": 1.4, "learning_rate": 8.980732653586329e-05, "loss": 0.0077, "step": 277750 }, { "epoch": 1.4, "learning_rate": 8.979975884284927e-05, "loss": 0.0083, "step": 277760 }, { "epoch": 1.4, "learning_rate": 8.979219114983527e-05, "loss": 0.0084, "step": 277770 }, { "epoch": 1.4, "learning_rate": 8.978462345682126e-05, "loss": 0.0089, "step": 277780 }, { "epoch": 1.4, "learning_rate": 8.977705576380725e-05, "loss": 0.0069, "step": 277790 }, { "epoch": 1.4, "learning_rate": 8.976948807079324e-05, "loss": 0.0067, "step": 277800 }, { "epoch": 1.4, "learning_rate": 8.976192037777922e-05, "loss": 0.0079, "step": 277810 }, { "epoch": 1.4, "learning_rate": 8.975435268476522e-05, "loss": 0.0098, "step": 277820 }, { "epoch": 1.4, "learning_rate": 8.974678499175121e-05, "loss": 0.0071, "step": 277830 }, { "epoch": 1.4, "learning_rate": 8.97392172987372e-05, "loss": 0.0104, "step": 277840 }, { "epoch": 1.4, "learning_rate": 8.973164960572319e-05, "loss": 0.0064, "step": 277850 }, { "epoch": 1.4, "learning_rate": 8.972408191270918e-05, "loss": 0.007, "step": 277860 }, { "epoch": 1.4, "learning_rate": 8.971651421969516e-05, "loss": 0.0072, "step": 277870 }, { "epoch": 1.4, "learning_rate": 8.970894652668116e-05, "loss": 0.0095, "step": 277880 }, { "epoch": 1.4, "learning_rate": 8.970137883366714e-05, "loss": 0.0055, "step": 277890 }, { "epoch": 1.4, "learning_rate": 8.969381114065314e-05, "loss": 0.0072, "step": 277900 }, { "epoch": 1.4, "learning_rate": 8.968624344763913e-05, "loss": 0.007, "step": 277910 }, { "epoch": 1.4, "learning_rate": 8.967867575462511e-05, "loss": 0.0077, "step": 277920 }, { "epoch": 1.4, "learning_rate": 8.967110806161111e-05, "loss": 0.008, "step": 277930 }, { "epoch": 1.4, "learning_rate": 8.96635403685971e-05, "loss": 0.0076, "step": 277940 }, { "epoch": 1.4, "learning_rate": 8.965597267558308e-05, "loss": 0.0095, "step": 277950 }, { "epoch": 1.4, "learning_rate": 8.964840498256908e-05, "loss": 0.0068, "step": 277960 }, { "epoch": 1.4, "learning_rate": 8.964083728955507e-05, "loss": 0.007, "step": 277970 }, { "epoch": 1.4, "learning_rate": 8.963326959654106e-05, "loss": 0.0061, "step": 277980 }, { "epoch": 1.4, "learning_rate": 8.962570190352705e-05, "loss": 0.0084, "step": 277990 }, { "epoch": 1.4, "learning_rate": 8.961813421051303e-05, "loss": 0.0072, "step": 278000 }, { "epoch": 1.4, "eval_cer": 0.9144246472852683, "eval_loss": 0.0060167377814650536, "eval_runtime": 116.7043, "eval_samples_per_second": 17.137, "eval_steps_per_second": 4.284, "step": 278000 }, { "epoch": 1.4, "learning_rate": 8.961056651749903e-05, "loss": 0.0077, "step": 278010 }, { "epoch": 1.4, "learning_rate": 8.960299882448502e-05, "loss": 0.0077, "step": 278020 }, { "epoch": 1.4, "learning_rate": 8.9595431131471e-05, "loss": 0.0079, "step": 278030 }, { "epoch": 1.4, "learning_rate": 8.9587863438457e-05, "loss": 0.0053, "step": 278040 }, { "epoch": 1.4, "learning_rate": 8.9580295745443e-05, "loss": 0.0078, "step": 278050 }, { "epoch": 1.4, "learning_rate": 8.957272805242897e-05, "loss": 0.0081, "step": 278060 }, { "epoch": 1.4, "learning_rate": 8.956516035941497e-05, "loss": 0.0333, "step": 278070 }, { "epoch": 1.4, "learning_rate": 8.955759266640095e-05, "loss": 0.0085, "step": 278080 }, { "epoch": 1.4, "learning_rate": 8.955002497338693e-05, "loss": 0.0099, "step": 278090 }, { "epoch": 1.4, "learning_rate": 8.954245728037291e-05, "loss": 0.0075, "step": 278100 }, { "epoch": 1.4, "learning_rate": 8.953488958735891e-05, "loss": 0.0079, "step": 278110 }, { "epoch": 1.4, "learning_rate": 8.95273218943449e-05, "loss": 0.006, "step": 278120 }, { "epoch": 1.4, "learning_rate": 8.951975420133089e-05, "loss": 0.0086, "step": 278130 }, { "epoch": 1.4, "learning_rate": 8.951218650831688e-05, "loss": 0.0102, "step": 278140 }, { "epoch": 1.4, "learning_rate": 8.950461881530288e-05, "loss": 0.0066, "step": 278150 }, { "epoch": 1.4, "learning_rate": 8.949705112228886e-05, "loss": 0.0067, "step": 278160 }, { "epoch": 1.4, "learning_rate": 8.948948342927485e-05, "loss": 0.0073, "step": 278170 }, { "epoch": 1.4, "learning_rate": 8.948191573626083e-05, "loss": 0.0079, "step": 278180 }, { "epoch": 1.4, "learning_rate": 8.947434804324683e-05, "loss": 0.0069, "step": 278190 }, { "epoch": 1.4, "learning_rate": 8.946678035023282e-05, "loss": 0.0076, "step": 278200 }, { "epoch": 1.4, "learning_rate": 8.94592126572188e-05, "loss": 0.0058, "step": 278210 }, { "epoch": 1.4, "learning_rate": 8.94516449642048e-05, "loss": 0.0093, "step": 278220 }, { "epoch": 1.4, "learning_rate": 8.94440772711908e-05, "loss": 0.0097, "step": 278230 }, { "epoch": 1.4, "learning_rate": 8.943650957817678e-05, "loss": 0.0078, "step": 278240 }, { "epoch": 1.4, "learning_rate": 8.942894188516277e-05, "loss": 0.0091, "step": 278250 }, { "epoch": 1.4, "learning_rate": 8.942137419214875e-05, "loss": 0.009, "step": 278260 }, { "epoch": 1.4, "learning_rate": 8.941380649913475e-05, "loss": 0.0104, "step": 278270 }, { "epoch": 1.4, "learning_rate": 8.940623880612074e-05, "loss": 0.0088, "step": 278280 }, { "epoch": 1.4, "learning_rate": 8.939867111310672e-05, "loss": 0.0088, "step": 278290 }, { "epoch": 1.4, "learning_rate": 8.939110342009272e-05, "loss": 0.0064, "step": 278300 }, { "epoch": 1.4, "learning_rate": 8.938353572707871e-05, "loss": 0.0117, "step": 278310 }, { "epoch": 1.4, "learning_rate": 8.93759680340647e-05, "loss": 0.0091, "step": 278320 }, { "epoch": 1.4, "learning_rate": 8.936840034105069e-05, "loss": 0.0065, "step": 278330 }, { "epoch": 1.4, "learning_rate": 8.936083264803667e-05, "loss": 0.0086, "step": 278340 }, { "epoch": 1.4, "learning_rate": 8.935326495502267e-05, "loss": 0.01, "step": 278350 }, { "epoch": 1.4, "learning_rate": 8.934569726200866e-05, "loss": 0.0098, "step": 278360 }, { "epoch": 1.4, "learning_rate": 8.933812956899464e-05, "loss": 0.0073, "step": 278370 }, { "epoch": 1.4, "learning_rate": 8.933056187598064e-05, "loss": 0.0072, "step": 278380 }, { "epoch": 1.4, "learning_rate": 8.932299418296663e-05, "loss": 0.009, "step": 278390 }, { "epoch": 1.4, "learning_rate": 8.931542648995261e-05, "loss": 0.0078, "step": 278400 }, { "epoch": 1.4, "learning_rate": 8.930785879693861e-05, "loss": 0.0084, "step": 278410 }, { "epoch": 1.4, "learning_rate": 8.93002911039246e-05, "loss": 0.0071, "step": 278420 }, { "epoch": 1.4, "learning_rate": 8.929272341091059e-05, "loss": 0.0102, "step": 278430 }, { "epoch": 1.4, "learning_rate": 8.928515571789658e-05, "loss": 0.0086, "step": 278440 }, { "epoch": 1.4, "learning_rate": 8.927758802488256e-05, "loss": 0.0069, "step": 278450 }, { "epoch": 1.4, "learning_rate": 8.927002033186856e-05, "loss": 0.0084, "step": 278460 }, { "epoch": 1.4, "learning_rate": 8.926245263885455e-05, "loss": 0.007, "step": 278470 }, { "epoch": 1.4, "learning_rate": 8.925488494584053e-05, "loss": 0.0083, "step": 278480 }, { "epoch": 1.41, "learning_rate": 8.924731725282653e-05, "loss": 0.0057, "step": 278490 }, { "epoch": 1.41, "learning_rate": 8.923974955981252e-05, "loss": 0.0076, "step": 278500 }, { "epoch": 1.41, "learning_rate": 8.92321818667985e-05, "loss": 0.0075, "step": 278510 }, { "epoch": 1.41, "learning_rate": 8.92246141737845e-05, "loss": 0.0074, "step": 278520 }, { "epoch": 1.41, "learning_rate": 8.921704648077048e-05, "loss": 0.0076, "step": 278530 }, { "epoch": 1.41, "learning_rate": 8.920947878775648e-05, "loss": 0.0058, "step": 278540 }, { "epoch": 1.41, "learning_rate": 8.920191109474247e-05, "loss": 0.0066, "step": 278550 }, { "epoch": 1.41, "learning_rate": 8.919434340172845e-05, "loss": 0.0095, "step": 278560 }, { "epoch": 1.41, "learning_rate": 8.918677570871445e-05, "loss": 0.006, "step": 278570 }, { "epoch": 1.41, "learning_rate": 8.917920801570044e-05, "loss": 0.0083, "step": 278580 }, { "epoch": 1.41, "learning_rate": 8.917164032268643e-05, "loss": 0.0092, "step": 278590 }, { "epoch": 1.41, "learning_rate": 8.916407262967242e-05, "loss": 0.0093, "step": 278600 }, { "epoch": 1.41, "learning_rate": 8.91565049366584e-05, "loss": 0.0077, "step": 278610 }, { "epoch": 1.41, "learning_rate": 8.91489372436444e-05, "loss": 0.0076, "step": 278620 }, { "epoch": 1.41, "learning_rate": 8.914136955063039e-05, "loss": 0.0093, "step": 278630 }, { "epoch": 1.41, "learning_rate": 8.913380185761637e-05, "loss": 0.0081, "step": 278640 }, { "epoch": 1.41, "learning_rate": 8.912623416460237e-05, "loss": 0.0067, "step": 278650 }, { "epoch": 1.41, "learning_rate": 8.911866647158836e-05, "loss": 0.0076, "step": 278660 }, { "epoch": 1.41, "learning_rate": 8.911109877857434e-05, "loss": 0.0068, "step": 278670 }, { "epoch": 1.41, "learning_rate": 8.910353108556034e-05, "loss": 0.0163, "step": 278680 }, { "epoch": 1.41, "learning_rate": 8.909596339254632e-05, "loss": 0.0074, "step": 278690 }, { "epoch": 1.41, "learning_rate": 8.908839569953232e-05, "loss": 0.0058, "step": 278700 }, { "epoch": 1.41, "learning_rate": 8.908082800651831e-05, "loss": 0.0087, "step": 278710 }, { "epoch": 1.41, "learning_rate": 8.907326031350428e-05, "loss": 0.0092, "step": 278720 }, { "epoch": 1.41, "learning_rate": 8.906569262049027e-05, "loss": 0.006, "step": 278730 }, { "epoch": 1.41, "learning_rate": 8.905812492747626e-05, "loss": 0.0092, "step": 278740 }, { "epoch": 1.41, "learning_rate": 8.905055723446225e-05, "loss": 0.0081, "step": 278750 }, { "epoch": 1.41, "learning_rate": 8.904298954144825e-05, "loss": 0.0115, "step": 278760 }, { "epoch": 1.41, "learning_rate": 8.903542184843423e-05, "loss": 0.0111, "step": 278770 }, { "epoch": 1.41, "learning_rate": 8.902785415542022e-05, "loss": 0.0076, "step": 278780 }, { "epoch": 1.41, "learning_rate": 8.90202864624062e-05, "loss": 0.0093, "step": 278790 }, { "epoch": 1.41, "learning_rate": 8.90127187693922e-05, "loss": 0.0068, "step": 278800 }, { "epoch": 1.41, "learning_rate": 8.900515107637819e-05, "loss": 0.0084, "step": 278810 }, { "epoch": 1.41, "learning_rate": 8.899758338336417e-05, "loss": 0.009, "step": 278820 }, { "epoch": 1.41, "learning_rate": 8.899001569035017e-05, "loss": 0.0107, "step": 278830 }, { "epoch": 1.41, "learning_rate": 8.898244799733616e-05, "loss": 0.0064, "step": 278840 }, { "epoch": 1.41, "learning_rate": 8.897488030432215e-05, "loss": 0.0068, "step": 278850 }, { "epoch": 1.41, "learning_rate": 8.896731261130814e-05, "loss": 0.0069, "step": 278860 }, { "epoch": 1.41, "learning_rate": 8.895974491829414e-05, "loss": 0.0059, "step": 278870 }, { "epoch": 1.41, "learning_rate": 8.895217722528012e-05, "loss": 0.0076, "step": 278880 }, { "epoch": 1.41, "learning_rate": 8.894460953226611e-05, "loss": 0.0083, "step": 278890 }, { "epoch": 1.41, "learning_rate": 8.89370418392521e-05, "loss": 0.0081, "step": 278900 }, { "epoch": 1.41, "learning_rate": 8.892947414623809e-05, "loss": 0.0057, "step": 278910 }, { "epoch": 1.41, "learning_rate": 8.892190645322408e-05, "loss": 0.0089, "step": 278920 }, { "epoch": 1.41, "learning_rate": 8.891433876021007e-05, "loss": 0.0064, "step": 278930 }, { "epoch": 1.41, "learning_rate": 8.890677106719606e-05, "loss": 0.0072, "step": 278940 }, { "epoch": 1.41, "learning_rate": 8.889920337418206e-05, "loss": 0.006, "step": 278950 }, { "epoch": 1.41, "learning_rate": 8.889163568116804e-05, "loss": 0.0081, "step": 278960 }, { "epoch": 1.41, "learning_rate": 8.888406798815403e-05, "loss": 0.0066, "step": 278970 }, { "epoch": 1.41, "learning_rate": 8.887650029514001e-05, "loss": 0.0074, "step": 278980 }, { "epoch": 1.41, "learning_rate": 8.886893260212601e-05, "loss": 0.0054, "step": 278990 }, { "epoch": 1.41, "learning_rate": 8.8861364909112e-05, "loss": 0.0108, "step": 279000 }, { "epoch": 1.41, "eval_cer": 0.9144304696620207, "eval_loss": 0.005943993106484413, "eval_runtime": 116.6988, "eval_samples_per_second": 17.138, "eval_steps_per_second": 4.285, "step": 279000 }, { "epoch": 1.41, "learning_rate": 8.885379721609798e-05, "loss": 0.0093, "step": 279010 }, { "epoch": 1.41, "learning_rate": 8.884622952308398e-05, "loss": 0.0072, "step": 279020 }, { "epoch": 1.41, "learning_rate": 8.883866183006997e-05, "loss": 0.0059, "step": 279030 }, { "epoch": 1.41, "learning_rate": 8.883109413705596e-05, "loss": 0.0074, "step": 279040 }, { "epoch": 1.41, "learning_rate": 8.882352644404195e-05, "loss": 0.008, "step": 279050 }, { "epoch": 1.41, "learning_rate": 8.881595875102793e-05, "loss": 0.006, "step": 279060 }, { "epoch": 1.41, "learning_rate": 8.880839105801393e-05, "loss": 0.0079, "step": 279070 }, { "epoch": 1.41, "learning_rate": 8.880082336499992e-05, "loss": 0.0054, "step": 279080 }, { "epoch": 1.41, "learning_rate": 8.87932556719859e-05, "loss": 0.0101, "step": 279090 }, { "epoch": 1.41, "learning_rate": 8.87856879789719e-05, "loss": 0.0071, "step": 279100 }, { "epoch": 1.41, "learning_rate": 8.87781202859579e-05, "loss": 0.0065, "step": 279110 }, { "epoch": 1.41, "learning_rate": 8.877055259294388e-05, "loss": 0.0083, "step": 279120 }, { "epoch": 1.41, "learning_rate": 8.876298489992987e-05, "loss": 0.0102, "step": 279130 }, { "epoch": 1.41, "learning_rate": 8.875541720691585e-05, "loss": 0.0076, "step": 279140 }, { "epoch": 1.41, "learning_rate": 8.874784951390185e-05, "loss": 0.008, "step": 279150 }, { "epoch": 1.41, "learning_rate": 8.874028182088784e-05, "loss": 0.0103, "step": 279160 }, { "epoch": 1.41, "learning_rate": 8.873271412787382e-05, "loss": 0.0114, "step": 279170 }, { "epoch": 1.41, "learning_rate": 8.872514643485982e-05, "loss": 0.011, "step": 279180 }, { "epoch": 1.41, "learning_rate": 8.871757874184581e-05, "loss": 0.0088, "step": 279190 }, { "epoch": 1.41, "learning_rate": 8.87100110488318e-05, "loss": 0.0078, "step": 279200 }, { "epoch": 1.41, "learning_rate": 8.870244335581779e-05, "loss": 0.0108, "step": 279210 }, { "epoch": 1.41, "learning_rate": 8.869487566280377e-05, "loss": 0.01, "step": 279220 }, { "epoch": 1.41, "learning_rate": 8.868730796978977e-05, "loss": 0.0081, "step": 279230 }, { "epoch": 1.41, "learning_rate": 8.867974027677576e-05, "loss": 0.0081, "step": 279240 }, { "epoch": 1.41, "learning_rate": 8.867217258376174e-05, "loss": 0.0055, "step": 279250 }, { "epoch": 1.41, "learning_rate": 8.866460489074774e-05, "loss": 0.0071, "step": 279260 }, { "epoch": 1.41, "learning_rate": 8.865703719773373e-05, "loss": 0.0096, "step": 279270 }, { "epoch": 1.41, "learning_rate": 8.864946950471971e-05, "loss": 0.0088, "step": 279280 }, { "epoch": 1.41, "learning_rate": 8.864190181170571e-05, "loss": 0.0068, "step": 279290 }, { "epoch": 1.41, "learning_rate": 8.863433411869169e-05, "loss": 0.0068, "step": 279300 }, { "epoch": 1.41, "learning_rate": 8.862676642567769e-05, "loss": 0.0074, "step": 279310 }, { "epoch": 1.41, "learning_rate": 8.861919873266368e-05, "loss": 0.0099, "step": 279320 }, { "epoch": 1.41, "learning_rate": 8.861163103964966e-05, "loss": 0.0091, "step": 279330 }, { "epoch": 1.41, "learning_rate": 8.860406334663566e-05, "loss": 0.0082, "step": 279340 }, { "epoch": 1.41, "learning_rate": 8.859649565362162e-05, "loss": 0.0097, "step": 279350 }, { "epoch": 1.41, "learning_rate": 8.858892796060762e-05, "loss": 0.0079, "step": 279360 }, { "epoch": 1.41, "learning_rate": 8.858136026759361e-05, "loss": 0.0092, "step": 279370 }, { "epoch": 1.41, "learning_rate": 8.85737925745796e-05, "loss": 0.0101, "step": 279380 }, { "epoch": 1.41, "learning_rate": 8.856622488156559e-05, "loss": 0.0099, "step": 279390 }, { "epoch": 1.41, "learning_rate": 8.855865718855159e-05, "loss": 0.01, "step": 279400 }, { "epoch": 1.41, "learning_rate": 8.855108949553757e-05, "loss": 0.0079, "step": 279410 }, { "epoch": 1.41, "learning_rate": 8.854352180252356e-05, "loss": 0.0092, "step": 279420 }, { "epoch": 1.41, "learning_rate": 8.853595410950954e-05, "loss": 0.0098, "step": 279430 }, { "epoch": 1.41, "learning_rate": 8.852838641649554e-05, "loss": 0.0073, "step": 279440 }, { "epoch": 1.41, "learning_rate": 8.852081872348153e-05, "loss": 0.0056, "step": 279450 }, { "epoch": 1.41, "learning_rate": 8.851325103046752e-05, "loss": 0.0063, "step": 279460 }, { "epoch": 1.41, "learning_rate": 8.850568333745351e-05, "loss": 0.0073, "step": 279470 }, { "epoch": 1.41, "learning_rate": 8.84981156444395e-05, "loss": 0.0077, "step": 279480 }, { "epoch": 1.41, "learning_rate": 8.849054795142549e-05, "loss": 0.0109, "step": 279490 }, { "epoch": 1.41, "learning_rate": 8.848298025841148e-05, "loss": 0.0085, "step": 279500 }, { "epoch": 1.41, "learning_rate": 8.847541256539746e-05, "loss": 0.0091, "step": 279510 }, { "epoch": 1.41, "learning_rate": 8.846784487238346e-05, "loss": 0.0081, "step": 279520 }, { "epoch": 1.41, "learning_rate": 8.846027717936945e-05, "loss": 0.0068, "step": 279530 }, { "epoch": 1.41, "learning_rate": 8.845270948635543e-05, "loss": 0.0084, "step": 279540 }, { "epoch": 1.41, "learning_rate": 8.844514179334143e-05, "loss": 0.0085, "step": 279550 }, { "epoch": 1.41, "learning_rate": 8.843757410032742e-05, "loss": 0.0079, "step": 279560 }, { "epoch": 1.41, "learning_rate": 8.84300064073134e-05, "loss": 0.0079, "step": 279570 }, { "epoch": 1.41, "learning_rate": 8.84224387142994e-05, "loss": 0.0062, "step": 279580 }, { "epoch": 1.41, "learning_rate": 8.841487102128538e-05, "loss": 0.0073, "step": 279590 }, { "epoch": 1.41, "learning_rate": 8.840730332827138e-05, "loss": 0.006, "step": 279600 }, { "epoch": 1.41, "learning_rate": 8.839973563525737e-05, "loss": 0.0069, "step": 279610 }, { "epoch": 1.41, "learning_rate": 8.839216794224335e-05, "loss": 0.0088, "step": 279620 }, { "epoch": 1.41, "learning_rate": 8.838460024922935e-05, "loss": 0.0078, "step": 279630 }, { "epoch": 1.41, "learning_rate": 8.837703255621534e-05, "loss": 0.0078, "step": 279640 }, { "epoch": 1.41, "learning_rate": 8.836946486320133e-05, "loss": 0.0078, "step": 279650 }, { "epoch": 1.41, "learning_rate": 8.836189717018732e-05, "loss": 0.0093, "step": 279660 }, { "epoch": 1.41, "learning_rate": 8.83543294771733e-05, "loss": 0.0081, "step": 279670 }, { "epoch": 1.41, "learning_rate": 8.83467617841593e-05, "loss": 0.0066, "step": 279680 }, { "epoch": 1.41, "learning_rate": 8.833919409114529e-05, "loss": 0.0081, "step": 279690 }, { "epoch": 1.41, "learning_rate": 8.833162639813127e-05, "loss": 0.0074, "step": 279700 }, { "epoch": 1.41, "learning_rate": 8.832405870511727e-05, "loss": 0.0071, "step": 279710 }, { "epoch": 1.41, "learning_rate": 8.831649101210326e-05, "loss": 0.0065, "step": 279720 }, { "epoch": 1.41, "learning_rate": 8.830892331908924e-05, "loss": 0.0079, "step": 279730 }, { "epoch": 1.41, "learning_rate": 8.830135562607524e-05, "loss": 0.0097, "step": 279740 }, { "epoch": 1.41, "learning_rate": 8.829378793306122e-05, "loss": 0.0058, "step": 279750 }, { "epoch": 1.41, "learning_rate": 8.828622024004722e-05, "loss": 0.0074, "step": 279760 }, { "epoch": 1.41, "learning_rate": 8.827865254703321e-05, "loss": 0.0084, "step": 279770 }, { "epoch": 1.41, "learning_rate": 8.827108485401919e-05, "loss": 0.0069, "step": 279780 }, { "epoch": 1.41, "learning_rate": 8.826351716100519e-05, "loss": 0.0096, "step": 279790 }, { "epoch": 1.41, "learning_rate": 8.825594946799118e-05, "loss": 0.0073, "step": 279800 }, { "epoch": 1.41, "learning_rate": 8.824838177497716e-05, "loss": 0.007, "step": 279810 }, { "epoch": 1.41, "learning_rate": 8.824081408196316e-05, "loss": 0.0091, "step": 279820 }, { "epoch": 1.41, "learning_rate": 8.823324638894914e-05, "loss": 0.0073, "step": 279830 }, { "epoch": 1.41, "learning_rate": 8.822567869593514e-05, "loss": 0.008, "step": 279840 }, { "epoch": 1.41, "learning_rate": 8.821811100292113e-05, "loss": 0.0069, "step": 279850 }, { "epoch": 1.41, "learning_rate": 8.821054330990711e-05, "loss": 0.0103, "step": 279860 }, { "epoch": 1.41, "learning_rate": 8.820297561689311e-05, "loss": 0.0126, "step": 279870 }, { "epoch": 1.41, "learning_rate": 8.81954079238791e-05, "loss": 0.0068, "step": 279880 }, { "epoch": 1.41, "learning_rate": 8.818784023086508e-05, "loss": 0.0083, "step": 279890 }, { "epoch": 1.41, "learning_rate": 8.818027253785108e-05, "loss": 0.0071, "step": 279900 }, { "epoch": 1.41, "learning_rate": 8.817270484483707e-05, "loss": 0.0073, "step": 279910 }, { "epoch": 1.41, "learning_rate": 8.816513715182305e-05, "loss": 0.006, "step": 279920 }, { "epoch": 1.41, "learning_rate": 8.815756945880905e-05, "loss": 0.0077, "step": 279930 }, { "epoch": 1.41, "learning_rate": 8.815000176579503e-05, "loss": 0.009, "step": 279940 }, { "epoch": 1.41, "learning_rate": 8.814243407278103e-05, "loss": 0.0081, "step": 279950 }, { "epoch": 1.41, "learning_rate": 8.813486637976702e-05, "loss": 0.0089, "step": 279960 }, { "epoch": 1.41, "learning_rate": 8.8127298686753e-05, "loss": 0.0083, "step": 279970 }, { "epoch": 1.41, "learning_rate": 8.811973099373898e-05, "loss": 0.0079, "step": 279980 }, { "epoch": 1.41, "learning_rate": 8.811216330072497e-05, "loss": 0.0088, "step": 279990 }, { "epoch": 1.41, "learning_rate": 8.810459560771096e-05, "loss": 0.0067, "step": 280000 }, { "epoch": 1.41, "eval_cer": 0.914423676889143, "eval_loss": 0.005915849469602108, "eval_runtime": 116.6786, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 280000 }, { "epoch": 1.41, "learning_rate": 8.809702791469696e-05, "loss": 0.0075, "step": 280010 }, { "epoch": 1.41, "learning_rate": 8.808946022168294e-05, "loss": 0.0087, "step": 280020 }, { "epoch": 1.41, "learning_rate": 8.808189252866893e-05, "loss": 0.0069, "step": 280030 }, { "epoch": 1.41, "learning_rate": 8.807432483565491e-05, "loss": 0.0081, "step": 280040 }, { "epoch": 1.41, "learning_rate": 8.806675714264091e-05, "loss": 0.0091, "step": 280050 }, { "epoch": 1.41, "learning_rate": 8.80591894496269e-05, "loss": 0.0067, "step": 280060 }, { "epoch": 1.41, "learning_rate": 8.805162175661288e-05, "loss": 0.0065, "step": 280070 }, { "epoch": 1.41, "learning_rate": 8.804405406359888e-05, "loss": 0.0092, "step": 280080 }, { "epoch": 1.41, "learning_rate": 8.803648637058487e-05, "loss": 0.0086, "step": 280090 }, { "epoch": 1.41, "learning_rate": 8.802891867757086e-05, "loss": 0.0066, "step": 280100 }, { "epoch": 1.41, "learning_rate": 8.802135098455685e-05, "loss": 0.0096, "step": 280110 }, { "epoch": 1.41, "learning_rate": 8.801378329154283e-05, "loss": 0.0122, "step": 280120 }, { "epoch": 1.41, "learning_rate": 8.800621559852883e-05, "loss": 0.0083, "step": 280130 }, { "epoch": 1.41, "learning_rate": 8.799864790551482e-05, "loss": 0.0074, "step": 280140 }, { "epoch": 1.41, "learning_rate": 8.79910802125008e-05, "loss": 0.0068, "step": 280150 }, { "epoch": 1.41, "learning_rate": 8.79835125194868e-05, "loss": 0.0067, "step": 280160 }, { "epoch": 1.41, "learning_rate": 8.79759448264728e-05, "loss": 0.007, "step": 280170 }, { "epoch": 1.41, "learning_rate": 8.796837713345878e-05, "loss": 0.0065, "step": 280180 }, { "epoch": 1.41, "learning_rate": 8.796080944044477e-05, "loss": 0.0076, "step": 280190 }, { "epoch": 1.41, "learning_rate": 8.795324174743075e-05, "loss": 0.0083, "step": 280200 }, { "epoch": 1.41, "learning_rate": 8.794567405441675e-05, "loss": 0.0071, "step": 280210 }, { "epoch": 1.41, "learning_rate": 8.793810636140274e-05, "loss": 0.0096, "step": 280220 }, { "epoch": 1.41, "learning_rate": 8.793053866838872e-05, "loss": 0.0086, "step": 280230 }, { "epoch": 1.41, "learning_rate": 8.792297097537472e-05, "loss": 0.0073, "step": 280240 }, { "epoch": 1.41, "learning_rate": 8.791540328236071e-05, "loss": 0.0096, "step": 280250 }, { "epoch": 1.41, "learning_rate": 8.79078355893467e-05, "loss": 0.0091, "step": 280260 }, { "epoch": 1.41, "learning_rate": 8.790026789633269e-05, "loss": 0.0068, "step": 280270 }, { "epoch": 1.41, "learning_rate": 8.789270020331867e-05, "loss": 0.0076, "step": 280280 }, { "epoch": 1.41, "learning_rate": 8.788513251030467e-05, "loss": 0.0065, "step": 280290 }, { "epoch": 1.41, "learning_rate": 8.787756481729066e-05, "loss": 0.0112, "step": 280300 }, { "epoch": 1.41, "learning_rate": 8.786999712427664e-05, "loss": 0.0057, "step": 280310 }, { "epoch": 1.41, "learning_rate": 8.786242943126264e-05, "loss": 0.0099, "step": 280320 }, { "epoch": 1.41, "learning_rate": 8.785486173824863e-05, "loss": 0.0113, "step": 280330 }, { "epoch": 1.41, "learning_rate": 8.784729404523461e-05, "loss": 0.0066, "step": 280340 }, { "epoch": 1.41, "learning_rate": 8.783972635222061e-05, "loss": 0.0084, "step": 280350 }, { "epoch": 1.41, "learning_rate": 8.78321586592066e-05, "loss": 0.0072, "step": 280360 }, { "epoch": 1.41, "learning_rate": 8.782459096619259e-05, "loss": 0.0094, "step": 280370 }, { "epoch": 1.41, "learning_rate": 8.781702327317858e-05, "loss": 0.008, "step": 280380 }, { "epoch": 1.41, "learning_rate": 8.780945558016456e-05, "loss": 0.0075, "step": 280390 }, { "epoch": 1.41, "learning_rate": 8.780188788715056e-05, "loss": 0.0078, "step": 280400 }, { "epoch": 1.41, "learning_rate": 8.779432019413655e-05, "loss": 0.0072, "step": 280410 }, { "epoch": 1.41, "learning_rate": 8.778675250112253e-05, "loss": 0.0064, "step": 280420 }, { "epoch": 1.41, "learning_rate": 8.777918480810853e-05, "loss": 0.0049, "step": 280430 }, { "epoch": 1.41, "learning_rate": 8.777161711509452e-05, "loss": 0.0099, "step": 280440 }, { "epoch": 1.41, "learning_rate": 8.77640494220805e-05, "loss": 0.0074, "step": 280450 }, { "epoch": 1.41, "learning_rate": 8.77564817290665e-05, "loss": 0.0061, "step": 280460 }, { "epoch": 1.42, "learning_rate": 8.774891403605248e-05, "loss": 0.0074, "step": 280470 }, { "epoch": 1.42, "learning_rate": 8.774134634303848e-05, "loss": 0.0063, "step": 280480 }, { "epoch": 1.42, "learning_rate": 8.773377865002447e-05, "loss": 0.0077, "step": 280490 }, { "epoch": 1.42, "learning_rate": 8.772621095701045e-05, "loss": 0.0076, "step": 280500 }, { "epoch": 1.42, "learning_rate": 8.771864326399645e-05, "loss": 0.0074, "step": 280510 }, { "epoch": 1.42, "learning_rate": 8.771107557098244e-05, "loss": 0.0058, "step": 280520 }, { "epoch": 1.42, "learning_rate": 8.770350787796842e-05, "loss": 0.0072, "step": 280530 }, { "epoch": 1.42, "learning_rate": 8.769594018495442e-05, "loss": 0.0066, "step": 280540 }, { "epoch": 1.42, "learning_rate": 8.76883724919404e-05, "loss": 0.0074, "step": 280550 }, { "epoch": 1.42, "learning_rate": 8.76808047989264e-05, "loss": 0.0075, "step": 280560 }, { "epoch": 1.42, "learning_rate": 8.767323710591239e-05, "loss": 0.0091, "step": 280570 }, { "epoch": 1.42, "learning_rate": 8.766566941289837e-05, "loss": 0.006, "step": 280580 }, { "epoch": 1.42, "learning_rate": 8.765810171988437e-05, "loss": 0.0088, "step": 280590 }, { "epoch": 1.42, "learning_rate": 8.765053402687033e-05, "loss": 0.0076, "step": 280600 }, { "epoch": 1.42, "learning_rate": 8.764296633385633e-05, "loss": 0.009, "step": 280610 }, { "epoch": 1.42, "learning_rate": 8.763539864084232e-05, "loss": 0.0063, "step": 280620 }, { "epoch": 1.42, "learning_rate": 8.76278309478283e-05, "loss": 0.0081, "step": 280630 }, { "epoch": 1.42, "learning_rate": 8.76202632548143e-05, "loss": 0.0071, "step": 280640 }, { "epoch": 1.42, "learning_rate": 8.761269556180028e-05, "loss": 0.0088, "step": 280650 }, { "epoch": 1.42, "learning_rate": 8.760512786878628e-05, "loss": 0.0095, "step": 280660 }, { "epoch": 1.42, "learning_rate": 8.759756017577227e-05, "loss": 0.0079, "step": 280670 }, { "epoch": 1.42, "learning_rate": 8.758999248275825e-05, "loss": 0.0133, "step": 280680 }, { "epoch": 1.42, "learning_rate": 8.758242478974425e-05, "loss": 0.0079, "step": 280690 }, { "epoch": 1.42, "learning_rate": 8.757485709673024e-05, "loss": 0.0084, "step": 280700 }, { "epoch": 1.42, "learning_rate": 8.756728940371623e-05, "loss": 0.0092, "step": 280710 }, { "epoch": 1.42, "learning_rate": 8.755972171070222e-05, "loss": 0.0055, "step": 280720 }, { "epoch": 1.42, "learning_rate": 8.75521540176882e-05, "loss": 0.0091, "step": 280730 }, { "epoch": 1.42, "learning_rate": 8.75445863246742e-05, "loss": 0.0068, "step": 280740 }, { "epoch": 1.42, "learning_rate": 8.753701863166019e-05, "loss": 0.0069, "step": 280750 }, { "epoch": 1.42, "learning_rate": 8.752945093864617e-05, "loss": 0.0091, "step": 280760 }, { "epoch": 1.42, "learning_rate": 8.752188324563217e-05, "loss": 0.0101, "step": 280770 }, { "epoch": 1.42, "learning_rate": 8.751431555261816e-05, "loss": 0.0064, "step": 280780 }, { "epoch": 1.42, "learning_rate": 8.750674785960414e-05, "loss": 0.0068, "step": 280790 }, { "epoch": 1.42, "learning_rate": 8.749918016659014e-05, "loss": 0.0088, "step": 280800 }, { "epoch": 1.42, "learning_rate": 8.749161247357613e-05, "loss": 0.008, "step": 280810 }, { "epoch": 1.42, "learning_rate": 8.748404478056212e-05, "loss": 0.0075, "step": 280820 }, { "epoch": 1.42, "learning_rate": 8.747647708754811e-05, "loss": 0.0063, "step": 280830 }, { "epoch": 1.42, "learning_rate": 8.746890939453409e-05, "loss": 0.0058, "step": 280840 }, { "epoch": 1.42, "learning_rate": 8.746134170152009e-05, "loss": 0.0066, "step": 280850 }, { "epoch": 1.42, "learning_rate": 8.745377400850608e-05, "loss": 0.0055, "step": 280860 }, { "epoch": 1.42, "learning_rate": 8.744620631549206e-05, "loss": 0.011, "step": 280870 }, { "epoch": 1.42, "learning_rate": 8.743863862247806e-05, "loss": 0.0079, "step": 280880 }, { "epoch": 1.42, "learning_rate": 8.743107092946405e-05, "loss": 0.008, "step": 280890 }, { "epoch": 1.42, "learning_rate": 8.742350323645004e-05, "loss": 0.0079, "step": 280900 }, { "epoch": 1.42, "learning_rate": 8.741593554343603e-05, "loss": 0.006, "step": 280910 }, { "epoch": 1.42, "learning_rate": 8.740836785042201e-05, "loss": 0.0065, "step": 280920 }, { "epoch": 1.42, "learning_rate": 8.740080015740801e-05, "loss": 0.0091, "step": 280930 }, { "epoch": 1.42, "learning_rate": 8.7393232464394e-05, "loss": 0.008, "step": 280940 }, { "epoch": 1.42, "learning_rate": 8.738566477137998e-05, "loss": 0.0059, "step": 280950 }, { "epoch": 1.42, "learning_rate": 8.737809707836598e-05, "loss": 0.008, "step": 280960 }, { "epoch": 1.42, "learning_rate": 8.737052938535197e-05, "loss": 0.0063, "step": 280970 }, { "epoch": 1.42, "learning_rate": 8.736296169233795e-05, "loss": 0.0103, "step": 280980 }, { "epoch": 1.42, "learning_rate": 8.735539399932395e-05, "loss": 0.006, "step": 280990 }, { "epoch": 1.42, "learning_rate": 8.734782630630993e-05, "loss": 0.0063, "step": 281000 }, { "epoch": 1.42, "eval_cer": 0.9144333808503969, "eval_loss": 0.0056717172265052795, "eval_runtime": 115.6852, "eval_samples_per_second": 17.288, "eval_steps_per_second": 4.322, "step": 281000 }, { "epoch": 1.42, "learning_rate": 8.734025861329593e-05, "loss": 0.013, "step": 281010 }, { "epoch": 1.42, "learning_rate": 8.733269092028192e-05, "loss": 0.0076, "step": 281020 }, { "epoch": 1.42, "learning_rate": 8.73251232272679e-05, "loss": 0.0083, "step": 281030 }, { "epoch": 1.42, "learning_rate": 8.73175555342539e-05, "loss": 0.0075, "step": 281040 }, { "epoch": 1.42, "learning_rate": 8.730998784123989e-05, "loss": 0.006, "step": 281050 }, { "epoch": 1.42, "learning_rate": 8.730242014822587e-05, "loss": 0.0078, "step": 281060 }, { "epoch": 1.42, "learning_rate": 8.729485245521187e-05, "loss": 0.007, "step": 281070 }, { "epoch": 1.42, "learning_rate": 8.728728476219785e-05, "loss": 0.008, "step": 281080 }, { "epoch": 1.42, "learning_rate": 8.727971706918385e-05, "loss": 0.008, "step": 281090 }, { "epoch": 1.42, "learning_rate": 8.727214937616984e-05, "loss": 0.0062, "step": 281100 }, { "epoch": 1.42, "learning_rate": 8.726458168315582e-05, "loss": 0.0086, "step": 281110 }, { "epoch": 1.42, "learning_rate": 8.725701399014182e-05, "loss": 0.007, "step": 281120 }, { "epoch": 1.42, "learning_rate": 8.724944629712781e-05, "loss": 0.0095, "step": 281130 }, { "epoch": 1.42, "learning_rate": 8.72418786041138e-05, "loss": 0.0093, "step": 281140 }, { "epoch": 1.42, "learning_rate": 8.723431091109979e-05, "loss": 0.0066, "step": 281150 }, { "epoch": 1.42, "learning_rate": 8.722674321808577e-05, "loss": 0.0068, "step": 281160 }, { "epoch": 1.42, "learning_rate": 8.721917552507176e-05, "loss": 0.0051, "step": 281170 }, { "epoch": 1.42, "learning_rate": 8.721160783205776e-05, "loss": 0.0067, "step": 281180 }, { "epoch": 1.42, "learning_rate": 8.720404013904374e-05, "loss": 0.0088, "step": 281190 }, { "epoch": 1.42, "learning_rate": 8.719647244602974e-05, "loss": 0.0079, "step": 281200 }, { "epoch": 1.42, "learning_rate": 8.718890475301573e-05, "loss": 0.0084, "step": 281210 }, { "epoch": 1.42, "learning_rate": 8.718133706000171e-05, "loss": 0.0057, "step": 281220 }, { "epoch": 1.42, "learning_rate": 8.71737693669877e-05, "loss": 0.0094, "step": 281230 }, { "epoch": 1.42, "learning_rate": 8.716620167397368e-05, "loss": 0.0061, "step": 281240 }, { "epoch": 1.42, "learning_rate": 8.715863398095967e-05, "loss": 0.0065, "step": 281250 }, { "epoch": 1.42, "learning_rate": 8.715106628794567e-05, "loss": 0.0065, "step": 281260 }, { "epoch": 1.42, "learning_rate": 8.714349859493165e-05, "loss": 0.0082, "step": 281270 }, { "epoch": 1.42, "learning_rate": 8.713593090191764e-05, "loss": 0.0081, "step": 281280 }, { "epoch": 1.42, "learning_rate": 8.712836320890362e-05, "loss": 0.0062, "step": 281290 }, { "epoch": 1.42, "learning_rate": 8.712079551588962e-05, "loss": 0.007, "step": 281300 }, { "epoch": 1.42, "learning_rate": 8.711322782287561e-05, "loss": 0.0088, "step": 281310 }, { "epoch": 1.42, "learning_rate": 8.71056601298616e-05, "loss": 0.0084, "step": 281320 }, { "epoch": 1.42, "learning_rate": 8.709809243684759e-05, "loss": 0.0091, "step": 281330 }, { "epoch": 1.42, "learning_rate": 8.709052474383359e-05, "loss": 0.0081, "step": 281340 }, { "epoch": 1.42, "learning_rate": 8.708295705081957e-05, "loss": 0.0078, "step": 281350 }, { "epoch": 1.42, "learning_rate": 8.707538935780556e-05, "loss": 0.0079, "step": 281360 }, { "epoch": 1.42, "learning_rate": 8.706782166479154e-05, "loss": 0.0084, "step": 281370 }, { "epoch": 1.42, "learning_rate": 8.706025397177754e-05, "loss": 0.0046, "step": 281380 }, { "epoch": 1.42, "learning_rate": 8.705268627876353e-05, "loss": 0.0079, "step": 281390 }, { "epoch": 1.42, "learning_rate": 8.704511858574951e-05, "loss": 0.0096, "step": 281400 }, { "epoch": 1.42, "learning_rate": 8.703755089273551e-05, "loss": 0.0068, "step": 281410 }, { "epoch": 1.42, "learning_rate": 8.70299831997215e-05, "loss": 0.0091, "step": 281420 }, { "epoch": 1.42, "learning_rate": 8.702241550670749e-05, "loss": 0.007, "step": 281430 }, { "epoch": 1.42, "learning_rate": 8.701484781369348e-05, "loss": 0.007, "step": 281440 }, { "epoch": 1.42, "learning_rate": 8.700728012067946e-05, "loss": 0.0126, "step": 281450 }, { "epoch": 1.42, "learning_rate": 8.699971242766546e-05, "loss": 0.008, "step": 281460 }, { "epoch": 1.42, "learning_rate": 8.699214473465145e-05, "loss": 0.0085, "step": 281470 }, { "epoch": 1.42, "learning_rate": 8.698457704163743e-05, "loss": 0.0089, "step": 281480 }, { "epoch": 1.42, "learning_rate": 8.697700934862343e-05, "loss": 0.0081, "step": 281490 }, { "epoch": 1.42, "learning_rate": 8.696944165560942e-05, "loss": 0.0075, "step": 281500 }, { "epoch": 1.42, "learning_rate": 8.69618739625954e-05, "loss": 0.0077, "step": 281510 }, { "epoch": 1.42, "learning_rate": 8.69543062695814e-05, "loss": 0.0078, "step": 281520 }, { "epoch": 1.42, "learning_rate": 8.694673857656738e-05, "loss": 0.0061, "step": 281530 }, { "epoch": 1.42, "learning_rate": 8.693917088355338e-05, "loss": 0.0076, "step": 281540 }, { "epoch": 1.42, "learning_rate": 8.693160319053937e-05, "loss": 0.0069, "step": 281550 }, { "epoch": 1.42, "learning_rate": 8.692403549752535e-05, "loss": 0.0083, "step": 281560 }, { "epoch": 1.42, "learning_rate": 8.691646780451135e-05, "loss": 0.0094, "step": 281570 }, { "epoch": 1.42, "learning_rate": 8.690890011149734e-05, "loss": 0.0055, "step": 281580 }, { "epoch": 1.42, "learning_rate": 8.690133241848332e-05, "loss": 0.0089, "step": 281590 }, { "epoch": 1.42, "learning_rate": 8.689376472546932e-05, "loss": 0.0072, "step": 281600 }, { "epoch": 1.42, "learning_rate": 8.68861970324553e-05, "loss": 0.0072, "step": 281610 }, { "epoch": 1.42, "learning_rate": 8.68786293394413e-05, "loss": 0.0119, "step": 281620 }, { "epoch": 1.42, "learning_rate": 8.687106164642729e-05, "loss": 0.0078, "step": 281630 }, { "epoch": 1.42, "learning_rate": 8.686349395341327e-05, "loss": 0.0089, "step": 281640 }, { "epoch": 1.42, "learning_rate": 8.685592626039927e-05, "loss": 0.0082, "step": 281650 }, { "epoch": 1.42, "learning_rate": 8.684835856738526e-05, "loss": 0.0086, "step": 281660 }, { "epoch": 1.42, "learning_rate": 8.684079087437124e-05, "loss": 0.0081, "step": 281670 }, { "epoch": 1.42, "learning_rate": 8.683322318135724e-05, "loss": 0.0073, "step": 281680 }, { "epoch": 1.42, "learning_rate": 8.682565548834322e-05, "loss": 0.0078, "step": 281690 }, { "epoch": 1.42, "learning_rate": 8.681808779532922e-05, "loss": 0.0077, "step": 281700 }, { "epoch": 1.42, "learning_rate": 8.681052010231521e-05, "loss": 0.0157, "step": 281710 }, { "epoch": 1.42, "learning_rate": 8.680295240930119e-05, "loss": 0.0071, "step": 281720 }, { "epoch": 1.42, "learning_rate": 8.679538471628719e-05, "loss": 0.0096, "step": 281730 }, { "epoch": 1.42, "learning_rate": 8.678781702327318e-05, "loss": 0.0093, "step": 281740 }, { "epoch": 1.42, "learning_rate": 8.678024933025916e-05, "loss": 0.0089, "step": 281750 }, { "epoch": 1.42, "learning_rate": 8.677268163724516e-05, "loss": 0.006, "step": 281760 }, { "epoch": 1.42, "learning_rate": 8.676511394423114e-05, "loss": 0.008, "step": 281770 }, { "epoch": 1.42, "learning_rate": 8.675754625121713e-05, "loss": 0.007, "step": 281780 }, { "epoch": 1.42, "learning_rate": 8.674997855820313e-05, "loss": 0.0085, "step": 281790 }, { "epoch": 1.42, "learning_rate": 8.674241086518911e-05, "loss": 0.0058, "step": 281800 }, { "epoch": 1.42, "learning_rate": 8.67348431721751e-05, "loss": 0.0073, "step": 281810 }, { "epoch": 1.42, "learning_rate": 8.67272754791611e-05, "loss": 0.0072, "step": 281820 }, { "epoch": 1.42, "learning_rate": 8.671970778614708e-05, "loss": 0.0065, "step": 281830 }, { "epoch": 1.42, "learning_rate": 8.671214009313308e-05, "loss": 0.0092, "step": 281840 }, { "epoch": 1.42, "learning_rate": 8.670457240011907e-05, "loss": 0.0075, "step": 281850 }, { "epoch": 1.42, "learning_rate": 8.669700470710504e-05, "loss": 0.0083, "step": 281860 }, { "epoch": 1.42, "learning_rate": 8.668943701409104e-05, "loss": 0.0101, "step": 281870 }, { "epoch": 1.42, "learning_rate": 8.668186932107702e-05, "loss": 0.0076, "step": 281880 }, { "epoch": 1.42, "learning_rate": 8.667430162806301e-05, "loss": 0.0057, "step": 281890 }, { "epoch": 1.42, "learning_rate": 8.666673393504899e-05, "loss": 0.0069, "step": 281900 }, { "epoch": 1.42, "learning_rate": 8.665916624203499e-05, "loss": 0.0071, "step": 281910 }, { "epoch": 1.42, "learning_rate": 8.665159854902098e-05, "loss": 0.0088, "step": 281920 }, { "epoch": 1.42, "learning_rate": 8.664403085600696e-05, "loss": 0.0092, "step": 281930 }, { "epoch": 1.42, "learning_rate": 8.663646316299296e-05, "loss": 0.0067, "step": 281940 }, { "epoch": 1.42, "learning_rate": 8.662889546997895e-05, "loss": 0.0076, "step": 281950 }, { "epoch": 1.42, "learning_rate": 8.662132777696494e-05, "loss": 0.0079, "step": 281960 }, { "epoch": 1.42, "learning_rate": 8.661376008395093e-05, "loss": 0.0076, "step": 281970 }, { "epoch": 1.42, "learning_rate": 8.660619239093691e-05, "loss": 0.0057, "step": 281980 }, { "epoch": 1.42, "learning_rate": 8.659862469792291e-05, "loss": 0.0067, "step": 281990 }, { "epoch": 1.42, "learning_rate": 8.65910570049089e-05, "loss": 0.0071, "step": 282000 }, { "epoch": 1.42, "eval_cer": 0.9144411440194001, "eval_loss": 0.005825493950396776, "eval_runtime": 115.8458, "eval_samples_per_second": 17.264, "eval_steps_per_second": 4.316, "step": 282000 }, { "epoch": 1.42, "learning_rate": 8.658348931189488e-05, "loss": 0.0092, "step": 282010 }, { "epoch": 1.42, "learning_rate": 8.657592161888088e-05, "loss": 0.0068, "step": 282020 }, { "epoch": 1.42, "learning_rate": 8.656835392586687e-05, "loss": 0.0086, "step": 282030 }, { "epoch": 1.42, "learning_rate": 8.656078623285286e-05, "loss": 0.0094, "step": 282040 }, { "epoch": 1.42, "learning_rate": 8.655321853983885e-05, "loss": 0.0084, "step": 282050 }, { "epoch": 1.42, "learning_rate": 8.654565084682483e-05, "loss": 0.0071, "step": 282060 }, { "epoch": 1.42, "learning_rate": 8.653808315381083e-05, "loss": 0.008, "step": 282070 }, { "epoch": 1.42, "learning_rate": 8.653051546079682e-05, "loss": 0.0097, "step": 282080 }, { "epoch": 1.42, "learning_rate": 8.65229477677828e-05, "loss": 0.0075, "step": 282090 }, { "epoch": 1.42, "learning_rate": 8.65153800747688e-05, "loss": 0.0071, "step": 282100 }, { "epoch": 1.42, "learning_rate": 8.650781238175479e-05, "loss": 0.0071, "step": 282110 }, { "epoch": 1.42, "learning_rate": 8.650024468874077e-05, "loss": 0.0104, "step": 282120 }, { "epoch": 1.42, "learning_rate": 8.649267699572677e-05, "loss": 0.009, "step": 282130 }, { "epoch": 1.42, "learning_rate": 8.648510930271275e-05, "loss": 0.0076, "step": 282140 }, { "epoch": 1.42, "learning_rate": 8.647754160969875e-05, "loss": 0.0108, "step": 282150 }, { "epoch": 1.42, "learning_rate": 8.646997391668474e-05, "loss": 0.0059, "step": 282160 }, { "epoch": 1.42, "learning_rate": 8.646240622367072e-05, "loss": 0.0081, "step": 282170 }, { "epoch": 1.42, "learning_rate": 8.645483853065672e-05, "loss": 0.0078, "step": 282180 }, { "epoch": 1.42, "learning_rate": 8.644727083764271e-05, "loss": 0.0074, "step": 282190 }, { "epoch": 1.42, "learning_rate": 8.64397031446287e-05, "loss": 0.0103, "step": 282200 }, { "epoch": 1.42, "learning_rate": 8.643213545161469e-05, "loss": 0.0076, "step": 282210 }, { "epoch": 1.42, "learning_rate": 8.642456775860067e-05, "loss": 0.0071, "step": 282220 }, { "epoch": 1.42, "learning_rate": 8.641700006558667e-05, "loss": 0.0054, "step": 282230 }, { "epoch": 1.42, "learning_rate": 8.640943237257266e-05, "loss": 0.0093, "step": 282240 }, { "epoch": 1.42, "learning_rate": 8.640186467955864e-05, "loss": 0.0078, "step": 282250 }, { "epoch": 1.42, "learning_rate": 8.639429698654464e-05, "loss": 0.008, "step": 282260 }, { "epoch": 1.42, "learning_rate": 8.638672929353063e-05, "loss": 0.0095, "step": 282270 }, { "epoch": 1.42, "learning_rate": 8.637916160051661e-05, "loss": 0.0071, "step": 282280 }, { "epoch": 1.42, "learning_rate": 8.637159390750261e-05, "loss": 0.0089, "step": 282290 }, { "epoch": 1.42, "learning_rate": 8.63640262144886e-05, "loss": 0.0081, "step": 282300 }, { "epoch": 1.42, "learning_rate": 8.635645852147458e-05, "loss": 0.0067, "step": 282310 }, { "epoch": 1.42, "learning_rate": 8.634889082846058e-05, "loss": 0.0076, "step": 282320 }, { "epoch": 1.42, "learning_rate": 8.634132313544656e-05, "loss": 0.0069, "step": 282330 }, { "epoch": 1.42, "learning_rate": 8.633375544243256e-05, "loss": 0.0079, "step": 282340 }, { "epoch": 1.42, "learning_rate": 8.632618774941855e-05, "loss": 0.0069, "step": 282350 }, { "epoch": 1.42, "learning_rate": 8.631862005640453e-05, "loss": 0.0093, "step": 282360 }, { "epoch": 1.42, "learning_rate": 8.631105236339053e-05, "loss": 0.0074, "step": 282370 }, { "epoch": 1.42, "learning_rate": 8.630348467037652e-05, "loss": 0.0065, "step": 282380 }, { "epoch": 1.42, "learning_rate": 8.62959169773625e-05, "loss": 0.0073, "step": 282390 }, { "epoch": 1.42, "learning_rate": 8.62883492843485e-05, "loss": 0.0065, "step": 282400 }, { "epoch": 1.42, "learning_rate": 8.628078159133448e-05, "loss": 0.009, "step": 282410 }, { "epoch": 1.42, "learning_rate": 8.627321389832048e-05, "loss": 0.007, "step": 282420 }, { "epoch": 1.42, "learning_rate": 8.626564620530647e-05, "loss": 0.0077, "step": 282430 }, { "epoch": 1.42, "learning_rate": 8.625807851229245e-05, "loss": 0.0073, "step": 282440 }, { "epoch": 1.42, "learning_rate": 8.625051081927845e-05, "loss": 0.0081, "step": 282450 }, { "epoch": 1.43, "learning_rate": 8.624294312626444e-05, "loss": 0.0091, "step": 282460 }, { "epoch": 1.43, "learning_rate": 8.623537543325042e-05, "loss": 0.0093, "step": 282470 }, { "epoch": 1.43, "learning_rate": 8.622780774023642e-05, "loss": 0.0075, "step": 282480 }, { "epoch": 1.43, "learning_rate": 8.622024004722239e-05, "loss": 0.008, "step": 282490 }, { "epoch": 1.43, "learning_rate": 8.621267235420838e-05, "loss": 0.0081, "step": 282500 }, { "epoch": 1.43, "learning_rate": 8.620510466119436e-05, "loss": 0.0064, "step": 282510 }, { "epoch": 1.43, "learning_rate": 8.619753696818036e-05, "loss": 0.008, "step": 282520 }, { "epoch": 1.43, "learning_rate": 8.618996927516635e-05, "loss": 0.0079, "step": 282530 }, { "epoch": 1.43, "learning_rate": 8.618240158215233e-05, "loss": 0.0087, "step": 282540 }, { "epoch": 1.43, "learning_rate": 8.617483388913833e-05, "loss": 0.0072, "step": 282550 }, { "epoch": 1.43, "learning_rate": 8.616726619612432e-05, "loss": 0.0066, "step": 282560 }, { "epoch": 1.43, "learning_rate": 8.61596985031103e-05, "loss": 0.009, "step": 282570 }, { "epoch": 1.43, "learning_rate": 8.61521308100963e-05, "loss": 0.0083, "step": 282580 }, { "epoch": 1.43, "learning_rate": 8.614456311708228e-05, "loss": 0.0065, "step": 282590 }, { "epoch": 1.43, "learning_rate": 8.613699542406828e-05, "loss": 0.0079, "step": 282600 }, { "epoch": 1.43, "learning_rate": 8.612942773105427e-05, "loss": 0.0071, "step": 282610 }, { "epoch": 1.43, "learning_rate": 8.612186003804025e-05, "loss": 0.009, "step": 282620 }, { "epoch": 1.43, "learning_rate": 8.611429234502625e-05, "loss": 0.0072, "step": 282630 }, { "epoch": 1.43, "learning_rate": 8.610672465201224e-05, "loss": 0.008, "step": 282640 }, { "epoch": 1.43, "learning_rate": 8.609915695899822e-05, "loss": 0.0062, "step": 282650 }, { "epoch": 1.43, "learning_rate": 8.609158926598422e-05, "loss": 0.0074, "step": 282660 }, { "epoch": 1.43, "learning_rate": 8.60840215729702e-05, "loss": 0.0065, "step": 282670 }, { "epoch": 1.43, "learning_rate": 8.60764538799562e-05, "loss": 0.0081, "step": 282680 }, { "epoch": 1.43, "learning_rate": 8.606888618694219e-05, "loss": 0.0078, "step": 282690 }, { "epoch": 1.43, "learning_rate": 8.606131849392817e-05, "loss": 0.0062, "step": 282700 }, { "epoch": 1.43, "learning_rate": 8.605375080091417e-05, "loss": 0.007, "step": 282710 }, { "epoch": 1.43, "learning_rate": 8.604618310790016e-05, "loss": 0.0081, "step": 282720 }, { "epoch": 1.43, "learning_rate": 8.603861541488614e-05, "loss": 0.009, "step": 282730 }, { "epoch": 1.43, "learning_rate": 8.603104772187214e-05, "loss": 0.0065, "step": 282740 }, { "epoch": 1.43, "learning_rate": 8.602348002885813e-05, "loss": 0.007, "step": 282750 }, { "epoch": 1.43, "learning_rate": 8.601591233584412e-05, "loss": 0.0077, "step": 282760 }, { "epoch": 1.43, "learning_rate": 8.600834464283011e-05, "loss": 0.0069, "step": 282770 }, { "epoch": 1.43, "learning_rate": 8.600077694981609e-05, "loss": 0.0089, "step": 282780 }, { "epoch": 1.43, "learning_rate": 8.599320925680209e-05, "loss": 0.0071, "step": 282790 }, { "epoch": 1.43, "learning_rate": 8.598564156378808e-05, "loss": 0.007, "step": 282800 }, { "epoch": 1.43, "learning_rate": 8.597807387077406e-05, "loss": 0.0068, "step": 282810 }, { "epoch": 1.43, "learning_rate": 8.597050617776006e-05, "loss": 0.0091, "step": 282820 }, { "epoch": 1.43, "learning_rate": 8.596293848474605e-05, "loss": 0.0063, "step": 282830 }, { "epoch": 1.43, "learning_rate": 8.595537079173203e-05, "loss": 0.0078, "step": 282840 }, { "epoch": 1.43, "learning_rate": 8.594780309871803e-05, "loss": 0.0053, "step": 282850 }, { "epoch": 1.43, "learning_rate": 8.594023540570401e-05, "loss": 0.0067, "step": 282860 }, { "epoch": 1.43, "learning_rate": 8.593266771269e-05, "loss": 0.0078, "step": 282870 }, { "epoch": 1.43, "learning_rate": 8.5925100019676e-05, "loss": 0.0084, "step": 282880 }, { "epoch": 1.43, "learning_rate": 8.591753232666198e-05, "loss": 0.0067, "step": 282890 }, { "epoch": 1.43, "learning_rate": 8.590996463364798e-05, "loss": 0.0077, "step": 282900 }, { "epoch": 1.43, "learning_rate": 8.590239694063397e-05, "loss": 0.0089, "step": 282910 }, { "epoch": 1.43, "learning_rate": 8.589482924761995e-05, "loss": 0.0068, "step": 282920 }, { "epoch": 1.43, "learning_rate": 8.588726155460595e-05, "loss": 0.0072, "step": 282930 }, { "epoch": 1.43, "learning_rate": 8.587969386159193e-05, "loss": 0.0078, "step": 282940 }, { "epoch": 1.43, "learning_rate": 8.587212616857793e-05, "loss": 0.0083, "step": 282950 }, { "epoch": 1.43, "learning_rate": 8.586455847556392e-05, "loss": 0.0083, "step": 282960 }, { "epoch": 1.43, "learning_rate": 8.58569907825499e-05, "loss": 0.0081, "step": 282970 }, { "epoch": 1.43, "learning_rate": 8.58494230895359e-05, "loss": 0.0056, "step": 282980 }, { "epoch": 1.43, "learning_rate": 8.584185539652189e-05, "loss": 0.0069, "step": 282990 }, { "epoch": 1.43, "learning_rate": 8.583428770350787e-05, "loss": 0.0087, "step": 283000 }, { "epoch": 1.43, "eval_cer": 0.9144392032271493, "eval_loss": 0.005669817794114351, "eval_runtime": 115.6754, "eval_samples_per_second": 17.29, "eval_steps_per_second": 4.322, "step": 283000 }, { "epoch": 1.43, "learning_rate": 8.582672001049387e-05, "loss": 0.01, "step": 283010 }, { "epoch": 1.43, "learning_rate": 8.581915231747985e-05, "loss": 0.007, "step": 283020 }, { "epoch": 1.43, "learning_rate": 8.581158462446584e-05, "loss": 0.0089, "step": 283030 }, { "epoch": 1.43, "learning_rate": 8.580401693145184e-05, "loss": 0.007, "step": 283040 }, { "epoch": 1.43, "learning_rate": 8.579644923843782e-05, "loss": 0.0098, "step": 283050 }, { "epoch": 1.43, "learning_rate": 8.578888154542382e-05, "loss": 0.0071, "step": 283060 }, { "epoch": 1.43, "learning_rate": 8.578131385240981e-05, "loss": 0.0091, "step": 283070 }, { "epoch": 1.43, "learning_rate": 8.577374615939579e-05, "loss": 0.0081, "step": 283080 }, { "epoch": 1.43, "learning_rate": 8.576617846638179e-05, "loss": 0.008, "step": 283090 }, { "epoch": 1.43, "learning_rate": 8.575861077336777e-05, "loss": 0.0062, "step": 283100 }, { "epoch": 1.43, "learning_rate": 8.575104308035376e-05, "loss": 0.008, "step": 283110 }, { "epoch": 1.43, "learning_rate": 8.574347538733973e-05, "loss": 0.0079, "step": 283120 }, { "epoch": 1.43, "learning_rate": 8.573590769432573e-05, "loss": 0.0073, "step": 283130 }, { "epoch": 1.43, "learning_rate": 8.572834000131172e-05, "loss": 0.0102, "step": 283140 }, { "epoch": 1.43, "learning_rate": 8.57207723082977e-05, "loss": 0.0078, "step": 283150 }, { "epoch": 1.43, "learning_rate": 8.57132046152837e-05, "loss": 0.008, "step": 283160 }, { "epoch": 1.43, "learning_rate": 8.57056369222697e-05, "loss": 0.0056, "step": 283170 }, { "epoch": 1.43, "learning_rate": 8.569806922925567e-05, "loss": 0.0093, "step": 283180 }, { "epoch": 1.43, "learning_rate": 8.569050153624167e-05, "loss": 0.0057, "step": 283190 }, { "epoch": 1.43, "learning_rate": 8.568293384322766e-05, "loss": 0.0064, "step": 283200 }, { "epoch": 1.43, "learning_rate": 8.567536615021365e-05, "loss": 0.0068, "step": 283210 }, { "epoch": 1.43, "learning_rate": 8.566779845719964e-05, "loss": 0.0078, "step": 283220 }, { "epoch": 1.43, "learning_rate": 8.566023076418562e-05, "loss": 0.0071, "step": 283230 }, { "epoch": 1.43, "learning_rate": 8.565266307117162e-05, "loss": 0.0067, "step": 283240 }, { "epoch": 1.43, "learning_rate": 8.564509537815761e-05, "loss": 0.0101, "step": 283250 }, { "epoch": 1.43, "learning_rate": 8.56375276851436e-05, "loss": 0.0059, "step": 283260 }, { "epoch": 1.43, "learning_rate": 8.562995999212959e-05, "loss": 0.0079, "step": 283270 }, { "epoch": 1.43, "learning_rate": 8.562239229911558e-05, "loss": 0.0073, "step": 283280 }, { "epoch": 1.43, "learning_rate": 8.561482460610157e-05, "loss": 0.0074, "step": 283290 }, { "epoch": 1.43, "learning_rate": 8.560725691308756e-05, "loss": 0.0044, "step": 283300 }, { "epoch": 1.43, "learning_rate": 8.559968922007354e-05, "loss": 0.0089, "step": 283310 }, { "epoch": 1.43, "learning_rate": 8.559212152705954e-05, "loss": 0.0085, "step": 283320 }, { "epoch": 1.43, "learning_rate": 8.558455383404553e-05, "loss": 0.0079, "step": 283330 }, { "epoch": 1.43, "learning_rate": 8.557698614103151e-05, "loss": 0.0064, "step": 283340 }, { "epoch": 1.43, "learning_rate": 8.556941844801751e-05, "loss": 0.0078, "step": 283350 }, { "epoch": 1.43, "learning_rate": 8.55618507550035e-05, "loss": 0.0079, "step": 283360 }, { "epoch": 1.43, "learning_rate": 8.555428306198948e-05, "loss": 0.0071, "step": 283370 }, { "epoch": 1.43, "learning_rate": 8.554671536897548e-05, "loss": 0.0076, "step": 283380 }, { "epoch": 1.43, "learning_rate": 8.553914767596146e-05, "loss": 0.0082, "step": 283390 }, { "epoch": 1.43, "learning_rate": 8.553157998294746e-05, "loss": 0.0068, "step": 283400 }, { "epoch": 1.43, "learning_rate": 8.552401228993345e-05, "loss": 0.0062, "step": 283410 }, { "epoch": 1.43, "learning_rate": 8.551644459691943e-05, "loss": 0.0094, "step": 283420 }, { "epoch": 1.43, "learning_rate": 8.550887690390543e-05, "loss": 0.0075, "step": 283430 }, { "epoch": 1.43, "learning_rate": 8.550130921089142e-05, "loss": 0.0068, "step": 283440 }, { "epoch": 1.43, "learning_rate": 8.54937415178774e-05, "loss": 0.0063, "step": 283450 }, { "epoch": 1.43, "learning_rate": 8.54861738248634e-05, "loss": 0.0087, "step": 283460 }, { "epoch": 1.43, "learning_rate": 8.547860613184938e-05, "loss": 0.0081, "step": 283470 }, { "epoch": 1.43, "learning_rate": 8.547103843883538e-05, "loss": 0.0083, "step": 283480 }, { "epoch": 1.43, "learning_rate": 8.546347074582137e-05, "loss": 0.0088, "step": 283490 }, { "epoch": 1.43, "learning_rate": 8.545590305280735e-05, "loss": 0.0065, "step": 283500 }, { "epoch": 1.43, "learning_rate": 8.544833535979335e-05, "loss": 0.0096, "step": 283510 }, { "epoch": 1.43, "learning_rate": 8.544076766677934e-05, "loss": 0.0085, "step": 283520 }, { "epoch": 1.43, "learning_rate": 8.543319997376532e-05, "loss": 0.0063, "step": 283530 }, { "epoch": 1.43, "learning_rate": 8.542563228075132e-05, "loss": 0.006, "step": 283540 }, { "epoch": 1.43, "learning_rate": 8.54180645877373e-05, "loss": 0.005, "step": 283550 }, { "epoch": 1.43, "learning_rate": 8.54104968947233e-05, "loss": 0.0066, "step": 283560 }, { "epoch": 1.43, "learning_rate": 8.540292920170929e-05, "loss": 0.0073, "step": 283570 }, { "epoch": 1.43, "learning_rate": 8.539536150869527e-05, "loss": 0.0068, "step": 283580 }, { "epoch": 1.43, "learning_rate": 8.538779381568127e-05, "loss": 0.0055, "step": 283590 }, { "epoch": 1.43, "learning_rate": 8.538022612266726e-05, "loss": 0.0061, "step": 283600 }, { "epoch": 1.43, "learning_rate": 8.537265842965324e-05, "loss": 0.0077, "step": 283610 }, { "epoch": 1.43, "learning_rate": 8.536509073663924e-05, "loss": 0.0086, "step": 283620 }, { "epoch": 1.43, "learning_rate": 8.535752304362522e-05, "loss": 0.0076, "step": 283630 }, { "epoch": 1.43, "learning_rate": 8.534995535061121e-05, "loss": 0.0093, "step": 283640 }, { "epoch": 1.43, "learning_rate": 8.534238765759721e-05, "loss": 0.0096, "step": 283650 }, { "epoch": 1.43, "learning_rate": 8.533481996458319e-05, "loss": 0.0069, "step": 283660 }, { "epoch": 1.43, "learning_rate": 8.532725227156919e-05, "loss": 0.0069, "step": 283670 }, { "epoch": 1.43, "learning_rate": 8.531968457855518e-05, "loss": 0.0083, "step": 283680 }, { "epoch": 1.43, "learning_rate": 8.531211688554116e-05, "loss": 0.0062, "step": 283690 }, { "epoch": 1.43, "learning_rate": 8.530454919252716e-05, "loss": 0.0092, "step": 283700 }, { "epoch": 1.43, "learning_rate": 8.529698149951314e-05, "loss": 0.0081, "step": 283710 }, { "epoch": 1.43, "learning_rate": 8.528941380649913e-05, "loss": 0.0065, "step": 283720 }, { "epoch": 1.43, "learning_rate": 8.528184611348513e-05, "loss": 0.0071, "step": 283730 }, { "epoch": 1.43, "learning_rate": 8.527427842047111e-05, "loss": 0.0082, "step": 283740 }, { "epoch": 1.43, "learning_rate": 8.526671072745709e-05, "loss": 0.0076, "step": 283750 }, { "epoch": 1.43, "learning_rate": 8.525914303444307e-05, "loss": 0.0057, "step": 283760 }, { "epoch": 1.43, "learning_rate": 8.525157534142907e-05, "loss": 0.0081, "step": 283770 }, { "epoch": 1.43, "learning_rate": 8.524400764841506e-05, "loss": 0.0063, "step": 283780 }, { "epoch": 1.43, "learning_rate": 8.523643995540104e-05, "loss": 0.0081, "step": 283790 }, { "epoch": 1.43, "learning_rate": 8.522887226238704e-05, "loss": 0.0073, "step": 283800 }, { "epoch": 1.43, "learning_rate": 8.522130456937303e-05, "loss": 0.0091, "step": 283810 }, { "epoch": 1.43, "learning_rate": 8.521373687635902e-05, "loss": 0.0066, "step": 283820 }, { "epoch": 1.43, "learning_rate": 8.520616918334501e-05, "loss": 0.0067, "step": 283830 }, { "epoch": 1.43, "learning_rate": 8.519860149033099e-05, "loss": 0.0079, "step": 283840 }, { "epoch": 1.43, "learning_rate": 8.519103379731699e-05, "loss": 0.0055, "step": 283850 }, { "epoch": 1.43, "learning_rate": 8.518346610430298e-05, "loss": 0.0081, "step": 283860 }, { "epoch": 1.43, "learning_rate": 8.517589841128896e-05, "loss": 0.0089, "step": 283870 }, { "epoch": 1.43, "learning_rate": 8.516833071827496e-05, "loss": 0.0066, "step": 283880 }, { "epoch": 1.43, "learning_rate": 8.516076302526095e-05, "loss": 0.0077, "step": 283890 }, { "epoch": 1.43, "learning_rate": 8.515319533224693e-05, "loss": 0.0061, "step": 283900 }, { "epoch": 1.43, "learning_rate": 8.514562763923293e-05, "loss": 0.0061, "step": 283910 }, { "epoch": 1.43, "learning_rate": 8.513805994621891e-05, "loss": 0.0083, "step": 283920 }, { "epoch": 1.43, "learning_rate": 8.51304922532049e-05, "loss": 0.0089, "step": 283930 }, { "epoch": 1.43, "learning_rate": 8.51229245601909e-05, "loss": 0.0094, "step": 283940 }, { "epoch": 1.43, "learning_rate": 8.511535686717688e-05, "loss": 0.0072, "step": 283950 }, { "epoch": 1.43, "learning_rate": 8.510778917416288e-05, "loss": 0.0075, "step": 283960 }, { "epoch": 1.43, "learning_rate": 8.510022148114887e-05, "loss": 0.0089, "step": 283970 }, { "epoch": 1.43, "learning_rate": 8.509265378813485e-05, "loss": 0.0087, "step": 283980 }, { "epoch": 1.43, "learning_rate": 8.508508609512085e-05, "loss": 0.0085, "step": 283990 }, { "epoch": 1.43, "learning_rate": 8.507751840210683e-05, "loss": 0.0077, "step": 284000 }, { "epoch": 1.43, "eval_cer": 0.914452788772905, "eval_loss": 0.005701255518943071, "eval_runtime": 115.7531, "eval_samples_per_second": 17.278, "eval_steps_per_second": 4.32, "step": 284000 }, { "epoch": 1.43, "learning_rate": 8.506995070909283e-05, "loss": 0.0066, "step": 284010 }, { "epoch": 1.43, "learning_rate": 8.506238301607882e-05, "loss": 0.0096, "step": 284020 }, { "epoch": 1.43, "learning_rate": 8.50548153230648e-05, "loss": 0.0078, "step": 284030 }, { "epoch": 1.43, "learning_rate": 8.50472476300508e-05, "loss": 0.0065, "step": 284040 }, { "epoch": 1.43, "learning_rate": 8.503967993703679e-05, "loss": 0.0051, "step": 284050 }, { "epoch": 1.43, "learning_rate": 8.503211224402277e-05, "loss": 0.0086, "step": 284060 }, { "epoch": 1.43, "learning_rate": 8.502454455100877e-05, "loss": 0.0053, "step": 284070 }, { "epoch": 1.43, "learning_rate": 8.501697685799475e-05, "loss": 0.006, "step": 284080 }, { "epoch": 1.43, "learning_rate": 8.500940916498074e-05, "loss": 0.0067, "step": 284090 }, { "epoch": 1.43, "learning_rate": 8.500184147196674e-05, "loss": 0.0077, "step": 284100 }, { "epoch": 1.43, "learning_rate": 8.499427377895272e-05, "loss": 0.0056, "step": 284110 }, { "epoch": 1.43, "learning_rate": 8.498670608593872e-05, "loss": 0.0081, "step": 284120 }, { "epoch": 1.43, "learning_rate": 8.497913839292471e-05, "loss": 0.0057, "step": 284130 }, { "epoch": 1.43, "learning_rate": 8.497157069991069e-05, "loss": 0.0098, "step": 284140 }, { "epoch": 1.43, "learning_rate": 8.496400300689669e-05, "loss": 0.008, "step": 284150 }, { "epoch": 1.43, "learning_rate": 8.495643531388267e-05, "loss": 0.01, "step": 284160 }, { "epoch": 1.43, "learning_rate": 8.494886762086866e-05, "loss": 0.0076, "step": 284170 }, { "epoch": 1.43, "learning_rate": 8.494129992785466e-05, "loss": 0.01, "step": 284180 }, { "epoch": 1.43, "learning_rate": 8.493373223484064e-05, "loss": 0.0084, "step": 284190 }, { "epoch": 1.43, "learning_rate": 8.492616454182664e-05, "loss": 0.0087, "step": 284200 }, { "epoch": 1.43, "learning_rate": 8.491859684881263e-05, "loss": 0.006, "step": 284210 }, { "epoch": 1.43, "learning_rate": 8.491102915579861e-05, "loss": 0.0073, "step": 284220 }, { "epoch": 1.43, "learning_rate": 8.490346146278461e-05, "loss": 0.0068, "step": 284230 }, { "epoch": 1.43, "learning_rate": 8.48958937697706e-05, "loss": 0.0079, "step": 284240 }, { "epoch": 1.43, "learning_rate": 8.488832607675658e-05, "loss": 0.0072, "step": 284250 }, { "epoch": 1.43, "learning_rate": 8.488075838374258e-05, "loss": 0.0069, "step": 284260 }, { "epoch": 1.43, "learning_rate": 8.487319069072856e-05, "loss": 0.0062, "step": 284270 }, { "epoch": 1.43, "learning_rate": 8.486562299771456e-05, "loss": 0.0072, "step": 284280 }, { "epoch": 1.43, "learning_rate": 8.485805530470055e-05, "loss": 0.0076, "step": 284290 }, { "epoch": 1.43, "learning_rate": 8.485048761168653e-05, "loss": 0.0089, "step": 284300 }, { "epoch": 1.43, "learning_rate": 8.484291991867253e-05, "loss": 0.0068, "step": 284310 }, { "epoch": 1.43, "learning_rate": 8.483535222565852e-05, "loss": 0.0049, "step": 284320 }, { "epoch": 1.43, "learning_rate": 8.48277845326445e-05, "loss": 0.0096, "step": 284330 }, { "epoch": 1.43, "learning_rate": 8.48202168396305e-05, "loss": 0.0077, "step": 284340 }, { "epoch": 1.43, "learning_rate": 8.481264914661648e-05, "loss": 0.0072, "step": 284350 }, { "epoch": 1.43, "learning_rate": 8.480508145360247e-05, "loss": 0.0078, "step": 284360 }, { "epoch": 1.43, "learning_rate": 8.479751376058847e-05, "loss": 0.0076, "step": 284370 }, { "epoch": 1.43, "learning_rate": 8.478994606757444e-05, "loss": 0.0071, "step": 284380 }, { "epoch": 1.43, "learning_rate": 8.478237837456043e-05, "loss": 0.0093, "step": 284390 }, { "epoch": 1.43, "learning_rate": 8.477481068154641e-05, "loss": 0.0096, "step": 284400 }, { "epoch": 1.43, "learning_rate": 8.476724298853241e-05, "loss": 0.01, "step": 284410 }, { "epoch": 1.43, "learning_rate": 8.47596752955184e-05, "loss": 0.0071, "step": 284420 }, { "epoch": 1.43, "learning_rate": 8.475210760250439e-05, "loss": 0.0073, "step": 284430 }, { "epoch": 1.44, "learning_rate": 8.474453990949038e-05, "loss": 0.0099, "step": 284440 }, { "epoch": 1.44, "learning_rate": 8.473697221647636e-05, "loss": 0.0073, "step": 284450 }, { "epoch": 1.44, "learning_rate": 8.472940452346236e-05, "loss": 0.0069, "step": 284460 }, { "epoch": 1.44, "learning_rate": 8.472183683044835e-05, "loss": 0.008, "step": 284470 }, { "epoch": 1.44, "learning_rate": 8.471426913743433e-05, "loss": 0.0087, "step": 284480 }, { "epoch": 1.44, "learning_rate": 8.470670144442033e-05, "loss": 0.007, "step": 284490 }, { "epoch": 1.44, "learning_rate": 8.469913375140632e-05, "loss": 0.0105, "step": 284500 }, { "epoch": 1.44, "learning_rate": 8.46915660583923e-05, "loss": 0.0077, "step": 284510 }, { "epoch": 1.44, "learning_rate": 8.46839983653783e-05, "loss": 0.0064, "step": 284520 }, { "epoch": 1.44, "learning_rate": 8.467643067236428e-05, "loss": 0.0085, "step": 284530 }, { "epoch": 1.44, "learning_rate": 8.466886297935028e-05, "loss": 0.0079, "step": 284540 }, { "epoch": 1.44, "learning_rate": 8.466129528633627e-05, "loss": 0.0076, "step": 284550 }, { "epoch": 1.44, "learning_rate": 8.465372759332225e-05, "loss": 0.0068, "step": 284560 }, { "epoch": 1.44, "learning_rate": 8.464615990030825e-05, "loss": 0.007, "step": 284570 }, { "epoch": 1.44, "learning_rate": 8.463859220729424e-05, "loss": 0.0094, "step": 284580 }, { "epoch": 1.44, "learning_rate": 8.463102451428022e-05, "loss": 0.0068, "step": 284590 }, { "epoch": 1.44, "learning_rate": 8.462345682126622e-05, "loss": 0.0078, "step": 284600 }, { "epoch": 1.44, "learning_rate": 8.46158891282522e-05, "loss": 0.0079, "step": 284610 }, { "epoch": 1.44, "learning_rate": 8.46083214352382e-05, "loss": 0.0067, "step": 284620 }, { "epoch": 1.44, "learning_rate": 8.460075374222419e-05, "loss": 0.0085, "step": 284630 }, { "epoch": 1.44, "learning_rate": 8.459318604921017e-05, "loss": 0.0082, "step": 284640 }, { "epoch": 1.44, "learning_rate": 8.458561835619617e-05, "loss": 0.007, "step": 284650 }, { "epoch": 1.44, "learning_rate": 8.457805066318216e-05, "loss": 0.0091, "step": 284660 }, { "epoch": 1.44, "learning_rate": 8.457048297016814e-05, "loss": 0.0082, "step": 284670 }, { "epoch": 1.44, "learning_rate": 8.456291527715414e-05, "loss": 0.0076, "step": 284680 }, { "epoch": 1.44, "learning_rate": 8.455534758414013e-05, "loss": 0.0086, "step": 284690 }, { "epoch": 1.44, "learning_rate": 8.454777989112611e-05, "loss": 0.0091, "step": 284700 }, { "epoch": 1.44, "learning_rate": 8.454021219811211e-05, "loss": 0.0089, "step": 284710 }, { "epoch": 1.44, "learning_rate": 8.453264450509809e-05, "loss": 0.007, "step": 284720 }, { "epoch": 1.44, "learning_rate": 8.452507681208409e-05, "loss": 0.0068, "step": 284730 }, { "epoch": 1.44, "learning_rate": 8.451750911907008e-05, "loss": 0.0073, "step": 284740 }, { "epoch": 1.44, "learning_rate": 8.450994142605606e-05, "loss": 0.0058, "step": 284750 }, { "epoch": 1.44, "learning_rate": 8.450237373304206e-05, "loss": 0.0079, "step": 284760 }, { "epoch": 1.44, "learning_rate": 8.449480604002805e-05, "loss": 0.0071, "step": 284770 }, { "epoch": 1.44, "learning_rate": 8.448723834701403e-05, "loss": 0.0085, "step": 284780 }, { "epoch": 1.44, "learning_rate": 8.447967065400003e-05, "loss": 0.0089, "step": 284790 }, { "epoch": 1.44, "learning_rate": 8.447210296098601e-05, "loss": 0.0075, "step": 284800 }, { "epoch": 1.44, "learning_rate": 8.4464535267972e-05, "loss": 0.0082, "step": 284810 }, { "epoch": 1.44, "learning_rate": 8.4456967574958e-05, "loss": 0.0078, "step": 284820 }, { "epoch": 1.44, "learning_rate": 8.444939988194398e-05, "loss": 0.0079, "step": 284830 }, { "epoch": 1.44, "learning_rate": 8.444183218892998e-05, "loss": 0.0099, "step": 284840 }, { "epoch": 1.44, "learning_rate": 8.443426449591597e-05, "loss": 0.0078, "step": 284850 }, { "epoch": 1.44, "learning_rate": 8.442669680290195e-05, "loss": 0.0056, "step": 284860 }, { "epoch": 1.44, "learning_rate": 8.441912910988795e-05, "loss": 0.0116, "step": 284870 }, { "epoch": 1.44, "learning_rate": 8.441156141687393e-05, "loss": 0.0071, "step": 284880 }, { "epoch": 1.44, "learning_rate": 8.440399372385992e-05, "loss": 0.0066, "step": 284890 }, { "epoch": 1.44, "learning_rate": 8.439642603084592e-05, "loss": 0.0103, "step": 284900 }, { "epoch": 1.44, "learning_rate": 8.43888583378319e-05, "loss": 0.0084, "step": 284910 }, { "epoch": 1.44, "learning_rate": 8.43812906448179e-05, "loss": 0.0082, "step": 284920 }, { "epoch": 1.44, "learning_rate": 8.437372295180389e-05, "loss": 0.0093, "step": 284930 }, { "epoch": 1.44, "learning_rate": 8.436615525878987e-05, "loss": 0.0093, "step": 284940 }, { "epoch": 1.44, "learning_rate": 8.435858756577587e-05, "loss": 0.0086, "step": 284950 }, { "epoch": 1.44, "learning_rate": 8.435101987276185e-05, "loss": 0.0077, "step": 284960 }, { "epoch": 1.44, "learning_rate": 8.434345217974784e-05, "loss": 0.0071, "step": 284970 }, { "epoch": 1.44, "learning_rate": 8.433588448673384e-05, "loss": 0.0079, "step": 284980 }, { "epoch": 1.44, "learning_rate": 8.432831679371982e-05, "loss": 0.0074, "step": 284990 }, { "epoch": 1.44, "learning_rate": 8.43207491007058e-05, "loss": 0.0069, "step": 285000 }, { "epoch": 1.44, "eval_cer": 0.9144430848116509, "eval_loss": 0.00582539290189743, "eval_runtime": 115.8203, "eval_samples_per_second": 17.268, "eval_steps_per_second": 4.317, "step": 285000 }, { "epoch": 1.44, "learning_rate": 8.431318140769178e-05, "loss": 0.0072, "step": 285010 }, { "epoch": 1.44, "learning_rate": 8.430561371467778e-05, "loss": 0.0062, "step": 285020 }, { "epoch": 1.44, "learning_rate": 8.429804602166377e-05, "loss": 0.0053, "step": 285030 }, { "epoch": 1.44, "learning_rate": 8.429047832864975e-05, "loss": 0.0096, "step": 285040 }, { "epoch": 1.44, "learning_rate": 8.428291063563575e-05, "loss": 0.0096, "step": 285050 }, { "epoch": 1.44, "learning_rate": 8.427534294262173e-05, "loss": 0.0098, "step": 285060 }, { "epoch": 1.44, "learning_rate": 8.426777524960773e-05, "loss": 0.0075, "step": 285070 }, { "epoch": 1.44, "learning_rate": 8.426020755659372e-05, "loss": 0.0077, "step": 285080 }, { "epoch": 1.44, "learning_rate": 8.42526398635797e-05, "loss": 0.0084, "step": 285090 }, { "epoch": 1.44, "learning_rate": 8.42450721705657e-05, "loss": 0.0072, "step": 285100 }, { "epoch": 1.44, "learning_rate": 8.423750447755169e-05, "loss": 0.0072, "step": 285110 }, { "epoch": 1.44, "learning_rate": 8.422993678453767e-05, "loss": 0.0112, "step": 285120 }, { "epoch": 1.44, "learning_rate": 8.422236909152367e-05, "loss": 0.0082, "step": 285130 }, { "epoch": 1.44, "learning_rate": 8.421480139850966e-05, "loss": 0.0075, "step": 285140 }, { "epoch": 1.44, "learning_rate": 8.420723370549565e-05, "loss": 0.0069, "step": 285150 }, { "epoch": 1.44, "learning_rate": 8.419966601248164e-05, "loss": 0.0072, "step": 285160 }, { "epoch": 1.44, "learning_rate": 8.419209831946762e-05, "loss": 0.006, "step": 285170 }, { "epoch": 1.44, "learning_rate": 8.418453062645362e-05, "loss": 0.0121, "step": 285180 }, { "epoch": 1.44, "learning_rate": 8.417696293343961e-05, "loss": 0.0046, "step": 285190 }, { "epoch": 1.44, "learning_rate": 8.416939524042559e-05, "loss": 0.0088, "step": 285200 }, { "epoch": 1.44, "learning_rate": 8.416182754741159e-05, "loss": 0.0075, "step": 285210 }, { "epoch": 1.44, "learning_rate": 8.415425985439758e-05, "loss": 0.0096, "step": 285220 }, { "epoch": 1.44, "learning_rate": 8.414669216138356e-05, "loss": 0.0079, "step": 285230 }, { "epoch": 1.44, "learning_rate": 8.413912446836956e-05, "loss": 0.0079, "step": 285240 }, { "epoch": 1.44, "learning_rate": 8.413155677535554e-05, "loss": 0.0082, "step": 285250 }, { "epoch": 1.44, "learning_rate": 8.412398908234154e-05, "loss": 0.0096, "step": 285260 }, { "epoch": 1.44, "learning_rate": 8.411642138932753e-05, "loss": 0.0075, "step": 285270 }, { "epoch": 1.44, "learning_rate": 8.410885369631351e-05, "loss": 0.0075, "step": 285280 }, { "epoch": 1.44, "learning_rate": 8.410128600329951e-05, "loss": 0.0081, "step": 285290 }, { "epoch": 1.44, "learning_rate": 8.40937183102855e-05, "loss": 0.0085, "step": 285300 }, { "epoch": 1.44, "learning_rate": 8.408615061727148e-05, "loss": 0.0069, "step": 285310 }, { "epoch": 1.44, "learning_rate": 8.407858292425748e-05, "loss": 0.0073, "step": 285320 }, { "epoch": 1.44, "learning_rate": 8.407101523124346e-05, "loss": 0.009, "step": 285330 }, { "epoch": 1.44, "learning_rate": 8.406344753822946e-05, "loss": 0.0086, "step": 285340 }, { "epoch": 1.44, "learning_rate": 8.405587984521545e-05, "loss": 0.0069, "step": 285350 }, { "epoch": 1.44, "learning_rate": 8.404831215220143e-05, "loss": 0.0053, "step": 285360 }, { "epoch": 1.44, "learning_rate": 8.404074445918743e-05, "loss": 0.0094, "step": 285370 }, { "epoch": 1.44, "learning_rate": 8.403317676617342e-05, "loss": 0.0088, "step": 285380 }, { "epoch": 1.44, "learning_rate": 8.40256090731594e-05, "loss": 0.0063, "step": 285390 }, { "epoch": 1.44, "learning_rate": 8.40180413801454e-05, "loss": 0.008, "step": 285400 }, { "epoch": 1.44, "learning_rate": 8.401047368713138e-05, "loss": 0.0075, "step": 285410 }, { "epoch": 1.44, "learning_rate": 8.400290599411737e-05, "loss": 0.0062, "step": 285420 }, { "epoch": 1.44, "learning_rate": 8.399533830110337e-05, "loss": 0.0058, "step": 285430 }, { "epoch": 1.44, "learning_rate": 8.398777060808935e-05, "loss": 0.0072, "step": 285440 }, { "epoch": 1.44, "learning_rate": 8.398020291507535e-05, "loss": 0.0067, "step": 285450 }, { "epoch": 1.44, "learning_rate": 8.397263522206134e-05, "loss": 0.0121, "step": 285460 }, { "epoch": 1.44, "learning_rate": 8.396506752904732e-05, "loss": 0.0099, "step": 285470 }, { "epoch": 1.44, "learning_rate": 8.395749983603332e-05, "loss": 0.0088, "step": 285480 }, { "epoch": 1.44, "learning_rate": 8.39499321430193e-05, "loss": 0.005, "step": 285490 }, { "epoch": 1.44, "learning_rate": 8.39423644500053e-05, "loss": 0.0078, "step": 285500 }, { "epoch": 1.44, "learning_rate": 8.393479675699129e-05, "loss": 0.0066, "step": 285510 }, { "epoch": 1.44, "learning_rate": 8.392722906397727e-05, "loss": 0.0066, "step": 285520 }, { "epoch": 1.44, "learning_rate": 8.391966137096327e-05, "loss": 0.0087, "step": 285530 }, { "epoch": 1.44, "learning_rate": 8.391209367794926e-05, "loss": 0.0092, "step": 285540 }, { "epoch": 1.44, "learning_rate": 8.390452598493524e-05, "loss": 0.0069, "step": 285550 }, { "epoch": 1.44, "learning_rate": 8.389695829192124e-05, "loss": 0.0083, "step": 285560 }, { "epoch": 1.44, "learning_rate": 8.388939059890722e-05, "loss": 0.0083, "step": 285570 }, { "epoch": 1.44, "learning_rate": 8.388182290589321e-05, "loss": 0.0066, "step": 285580 }, { "epoch": 1.44, "learning_rate": 8.387425521287921e-05, "loss": 0.0094, "step": 285590 }, { "epoch": 1.44, "learning_rate": 8.386668751986519e-05, "loss": 0.0083, "step": 285600 }, { "epoch": 1.44, "learning_rate": 8.385911982685118e-05, "loss": 0.0064, "step": 285610 }, { "epoch": 1.44, "learning_rate": 8.385155213383718e-05, "loss": 0.0074, "step": 285620 }, { "epoch": 1.44, "learning_rate": 8.384398444082315e-05, "loss": 0.0057, "step": 285630 }, { "epoch": 1.44, "learning_rate": 8.383641674780914e-05, "loss": 0.0077, "step": 285640 }, { "epoch": 1.44, "learning_rate": 8.382884905479512e-05, "loss": 0.0083, "step": 285650 }, { "epoch": 1.44, "learning_rate": 8.382128136178112e-05, "loss": 0.0095, "step": 285660 }, { "epoch": 1.44, "learning_rate": 8.381371366876711e-05, "loss": 0.0059, "step": 285670 }, { "epoch": 1.44, "learning_rate": 8.38061459757531e-05, "loss": 0.0081, "step": 285680 }, { "epoch": 1.44, "learning_rate": 8.379857828273909e-05, "loss": 0.0065, "step": 285690 }, { "epoch": 1.44, "learning_rate": 8.379101058972507e-05, "loss": 0.0093, "step": 285700 }, { "epoch": 1.44, "learning_rate": 8.378344289671107e-05, "loss": 0.0081, "step": 285710 }, { "epoch": 1.44, "learning_rate": 8.377587520369706e-05, "loss": 0.0121, "step": 285720 }, { "epoch": 1.44, "learning_rate": 8.376830751068304e-05, "loss": 0.0085, "step": 285730 }, { "epoch": 1.44, "learning_rate": 8.376073981766904e-05, "loss": 0.0073, "step": 285740 }, { "epoch": 1.44, "learning_rate": 8.375317212465503e-05, "loss": 0.0074, "step": 285750 }, { "epoch": 1.44, "learning_rate": 8.374560443164101e-05, "loss": 0.0077, "step": 285760 }, { "epoch": 1.44, "learning_rate": 8.373803673862701e-05, "loss": 0.0059, "step": 285770 }, { "epoch": 1.44, "learning_rate": 8.373046904561299e-05, "loss": 0.0068, "step": 285780 }, { "epoch": 1.44, "learning_rate": 8.372290135259899e-05, "loss": 0.0084, "step": 285790 }, { "epoch": 1.44, "learning_rate": 8.371533365958498e-05, "loss": 0.0058, "step": 285800 }, { "epoch": 1.44, "learning_rate": 8.370776596657096e-05, "loss": 0.0072, "step": 285810 }, { "epoch": 1.44, "learning_rate": 8.370019827355696e-05, "loss": 0.0074, "step": 285820 }, { "epoch": 1.44, "learning_rate": 8.369263058054295e-05, "loss": 0.0063, "step": 285830 }, { "epoch": 1.44, "learning_rate": 8.368506288752893e-05, "loss": 0.0089, "step": 285840 }, { "epoch": 1.44, "learning_rate": 8.367749519451493e-05, "loss": 0.0083, "step": 285850 }, { "epoch": 1.44, "learning_rate": 8.366992750150091e-05, "loss": 0.0087, "step": 285860 }, { "epoch": 1.44, "learning_rate": 8.36623598084869e-05, "loss": 0.0074, "step": 285870 }, { "epoch": 1.44, "learning_rate": 8.36547921154729e-05, "loss": 0.0094, "step": 285880 }, { "epoch": 1.44, "learning_rate": 8.364722442245888e-05, "loss": 0.0077, "step": 285890 }, { "epoch": 1.44, "learning_rate": 8.363965672944488e-05, "loss": 0.007, "step": 285900 }, { "epoch": 1.44, "learning_rate": 8.363208903643087e-05, "loss": 0.0097, "step": 285910 }, { "epoch": 1.44, "learning_rate": 8.362452134341685e-05, "loss": 0.007, "step": 285920 }, { "epoch": 1.44, "learning_rate": 8.361695365040285e-05, "loss": 0.0078, "step": 285930 }, { "epoch": 1.44, "learning_rate": 8.360938595738883e-05, "loss": 0.0073, "step": 285940 }, { "epoch": 1.44, "learning_rate": 8.360181826437482e-05, "loss": 0.0112, "step": 285950 }, { "epoch": 1.44, "learning_rate": 8.359425057136082e-05, "loss": 0.0101, "step": 285960 }, { "epoch": 1.44, "learning_rate": 8.35866828783468e-05, "loss": 0.0092, "step": 285970 }, { "epoch": 1.44, "learning_rate": 8.35791151853328e-05, "loss": 0.0067, "step": 285980 }, { "epoch": 1.44, "learning_rate": 8.357154749231879e-05, "loss": 0.011, "step": 285990 }, { "epoch": 1.44, "learning_rate": 8.356397979930477e-05, "loss": 0.0077, "step": 286000 }, { "epoch": 1.44, "eval_cer": 0.914438232831024, "eval_loss": 0.005684024654328823, "eval_runtime": 115.553, "eval_samples_per_second": 17.308, "eval_steps_per_second": 4.327, "step": 286000 }, { "epoch": 1.44, "learning_rate": 8.355641210629077e-05, "loss": 0.0067, "step": 286010 }, { "epoch": 1.44, "learning_rate": 8.354884441327675e-05, "loss": 0.0081, "step": 286020 }, { "epoch": 1.44, "learning_rate": 8.354127672026274e-05, "loss": 0.0082, "step": 286030 }, { "epoch": 1.44, "learning_rate": 8.353370902724874e-05, "loss": 0.0087, "step": 286040 }, { "epoch": 1.44, "learning_rate": 8.352614133423472e-05, "loss": 0.0059, "step": 286050 }, { "epoch": 1.44, "learning_rate": 8.351857364122072e-05, "loss": 0.0076, "step": 286060 }, { "epoch": 1.44, "learning_rate": 8.351100594820671e-05, "loss": 0.0074, "step": 286070 }, { "epoch": 1.44, "learning_rate": 8.350343825519269e-05, "loss": 0.0069, "step": 286080 }, { "epoch": 1.44, "learning_rate": 8.349587056217869e-05, "loss": 0.0068, "step": 286090 }, { "epoch": 1.44, "learning_rate": 8.348830286916467e-05, "loss": 0.0076, "step": 286100 }, { "epoch": 1.44, "learning_rate": 8.348073517615066e-05, "loss": 0.0074, "step": 286110 }, { "epoch": 1.44, "learning_rate": 8.347316748313666e-05, "loss": 0.0092, "step": 286120 }, { "epoch": 1.44, "learning_rate": 8.346559979012264e-05, "loss": 0.0099, "step": 286130 }, { "epoch": 1.44, "learning_rate": 8.345803209710863e-05, "loss": 0.0066, "step": 286140 }, { "epoch": 1.44, "learning_rate": 8.345046440409463e-05, "loss": 0.0075, "step": 286150 }, { "epoch": 1.44, "learning_rate": 8.344289671108061e-05, "loss": 0.0094, "step": 286160 }, { "epoch": 1.44, "learning_rate": 8.34353290180666e-05, "loss": 0.0064, "step": 286170 }, { "epoch": 1.44, "learning_rate": 8.34277613250526e-05, "loss": 0.0122, "step": 286180 }, { "epoch": 1.44, "learning_rate": 8.342019363203858e-05, "loss": 0.0086, "step": 286190 }, { "epoch": 1.44, "learning_rate": 8.341262593902458e-05, "loss": 0.0059, "step": 286200 }, { "epoch": 1.44, "learning_rate": 8.340505824601056e-05, "loss": 0.0048, "step": 286210 }, { "epoch": 1.44, "learning_rate": 8.339749055299655e-05, "loss": 0.0088, "step": 286220 }, { "epoch": 1.44, "learning_rate": 8.338992285998255e-05, "loss": 0.0069, "step": 286230 }, { "epoch": 1.44, "learning_rate": 8.338235516696853e-05, "loss": 0.0074, "step": 286240 }, { "epoch": 1.44, "learning_rate": 8.337478747395453e-05, "loss": 0.0069, "step": 286250 }, { "epoch": 1.44, "learning_rate": 8.33672197809405e-05, "loss": 0.0075, "step": 286260 }, { "epoch": 1.44, "learning_rate": 8.335965208792649e-05, "loss": 0.007, "step": 286270 }, { "epoch": 1.44, "learning_rate": 8.335208439491248e-05, "loss": 0.0057, "step": 286280 }, { "epoch": 1.44, "learning_rate": 8.334451670189846e-05, "loss": 0.0098, "step": 286290 }, { "epoch": 1.44, "learning_rate": 8.333694900888446e-05, "loss": 0.008, "step": 286300 }, { "epoch": 1.44, "learning_rate": 8.332938131587044e-05, "loss": 0.0071, "step": 286310 }, { "epoch": 1.44, "learning_rate": 8.332181362285644e-05, "loss": 0.0106, "step": 286320 }, { "epoch": 1.44, "learning_rate": 8.331424592984243e-05, "loss": 0.0068, "step": 286330 }, { "epoch": 1.44, "learning_rate": 8.330667823682841e-05, "loss": 0.005, "step": 286340 }, { "epoch": 1.44, "learning_rate": 8.329911054381441e-05, "loss": 0.0091, "step": 286350 }, { "epoch": 1.44, "learning_rate": 8.32915428508004e-05, "loss": 0.0077, "step": 286360 }, { "epoch": 1.44, "learning_rate": 8.328397515778638e-05, "loss": 0.0069, "step": 286370 }, { "epoch": 1.44, "learning_rate": 8.327640746477238e-05, "loss": 0.0062, "step": 286380 }, { "epoch": 1.44, "learning_rate": 8.326883977175836e-05, "loss": 0.0083, "step": 286390 }, { "epoch": 1.44, "learning_rate": 8.326127207874436e-05, "loss": 0.0083, "step": 286400 }, { "epoch": 1.44, "learning_rate": 8.325370438573035e-05, "loss": 0.0081, "step": 286410 }, { "epoch": 1.45, "learning_rate": 8.324613669271633e-05, "loss": 0.0066, "step": 286420 }, { "epoch": 1.45, "learning_rate": 8.323856899970233e-05, "loss": 0.0073, "step": 286430 }, { "epoch": 1.45, "learning_rate": 8.323100130668832e-05, "loss": 0.0081, "step": 286440 }, { "epoch": 1.45, "learning_rate": 8.32234336136743e-05, "loss": 0.0085, "step": 286450 }, { "epoch": 1.45, "learning_rate": 8.32158659206603e-05, "loss": 0.0059, "step": 286460 }, { "epoch": 1.45, "learning_rate": 8.320829822764628e-05, "loss": 0.0065, "step": 286470 }, { "epoch": 1.45, "learning_rate": 8.320073053463227e-05, "loss": 0.0085, "step": 286480 }, { "epoch": 1.45, "learning_rate": 8.319316284161827e-05, "loss": 0.0083, "step": 286490 }, { "epoch": 1.45, "learning_rate": 8.318559514860425e-05, "loss": 0.0062, "step": 286500 }, { "epoch": 1.45, "learning_rate": 8.317802745559025e-05, "loss": 0.0094, "step": 286510 }, { "epoch": 1.45, "learning_rate": 8.317045976257624e-05, "loss": 0.0103, "step": 286520 }, { "epoch": 1.45, "learning_rate": 8.316289206956222e-05, "loss": 0.0066, "step": 286530 }, { "epoch": 1.45, "learning_rate": 8.315532437654822e-05, "loss": 0.0091, "step": 286540 }, { "epoch": 1.45, "learning_rate": 8.31477566835342e-05, "loss": 0.0075, "step": 286550 }, { "epoch": 1.45, "learning_rate": 8.31401889905202e-05, "loss": 0.0103, "step": 286560 }, { "epoch": 1.45, "learning_rate": 8.313262129750619e-05, "loss": 0.009, "step": 286570 }, { "epoch": 1.45, "learning_rate": 8.312505360449217e-05, "loss": 0.0069, "step": 286580 }, { "epoch": 1.45, "learning_rate": 8.311748591147817e-05, "loss": 0.0085, "step": 286590 }, { "epoch": 1.45, "learning_rate": 8.310991821846416e-05, "loss": 0.007, "step": 286600 }, { "epoch": 1.45, "learning_rate": 8.310235052545014e-05, "loss": 0.0095, "step": 286610 }, { "epoch": 1.45, "learning_rate": 8.309478283243614e-05, "loss": 0.0085, "step": 286620 }, { "epoch": 1.45, "learning_rate": 8.308721513942213e-05, "loss": 0.0069, "step": 286630 }, { "epoch": 1.45, "learning_rate": 8.307964744640811e-05, "loss": 0.0085, "step": 286640 }, { "epoch": 1.45, "learning_rate": 8.307207975339411e-05, "loss": 0.006, "step": 286650 }, { "epoch": 1.45, "learning_rate": 8.306451206038009e-05, "loss": 0.0092, "step": 286660 }, { "epoch": 1.45, "learning_rate": 8.305694436736608e-05, "loss": 0.0094, "step": 286670 }, { "epoch": 1.45, "learning_rate": 8.304937667435208e-05, "loss": 0.0084, "step": 286680 }, { "epoch": 1.45, "learning_rate": 8.304180898133806e-05, "loss": 0.0062, "step": 286690 }, { "epoch": 1.45, "learning_rate": 8.303424128832406e-05, "loss": 0.0086, "step": 286700 }, { "epoch": 1.45, "learning_rate": 8.302667359531005e-05, "loss": 0.0084, "step": 286710 }, { "epoch": 1.45, "learning_rate": 8.301910590229603e-05, "loss": 0.0065, "step": 286720 }, { "epoch": 1.45, "learning_rate": 8.301153820928203e-05, "loss": 0.0085, "step": 286730 }, { "epoch": 1.45, "learning_rate": 8.300397051626801e-05, "loss": 0.0074, "step": 286740 }, { "epoch": 1.45, "learning_rate": 8.2996402823254e-05, "loss": 0.0068, "step": 286750 }, { "epoch": 1.45, "learning_rate": 8.298883513024e-05, "loss": 0.0093, "step": 286760 }, { "epoch": 1.45, "learning_rate": 8.298126743722598e-05, "loss": 0.0072, "step": 286770 }, { "epoch": 1.45, "learning_rate": 8.297369974421198e-05, "loss": 0.0082, "step": 286780 }, { "epoch": 1.45, "learning_rate": 8.296613205119797e-05, "loss": 0.0086, "step": 286790 }, { "epoch": 1.45, "learning_rate": 8.295856435818395e-05, "loss": 0.0083, "step": 286800 }, { "epoch": 1.45, "learning_rate": 8.295099666516995e-05, "loss": 0.0081, "step": 286810 }, { "epoch": 1.45, "learning_rate": 8.294342897215593e-05, "loss": 0.0102, "step": 286820 }, { "epoch": 1.45, "learning_rate": 8.293586127914192e-05, "loss": 0.009, "step": 286830 }, { "epoch": 1.45, "learning_rate": 8.292829358612792e-05, "loss": 0.0077, "step": 286840 }, { "epoch": 1.45, "learning_rate": 8.29207258931139e-05, "loss": 0.0085, "step": 286850 }, { "epoch": 1.45, "learning_rate": 8.29131582000999e-05, "loss": 0.0074, "step": 286860 }, { "epoch": 1.45, "learning_rate": 8.290559050708589e-05, "loss": 0.008, "step": 286870 }, { "epoch": 1.45, "learning_rate": 8.289802281407187e-05, "loss": 0.0063, "step": 286880 }, { "epoch": 1.45, "learning_rate": 8.289045512105785e-05, "loss": 0.0078, "step": 286890 }, { "epoch": 1.45, "learning_rate": 8.288288742804383e-05, "loss": 0.0095, "step": 286900 }, { "epoch": 1.45, "learning_rate": 8.287531973502983e-05, "loss": 0.0081, "step": 286910 }, { "epoch": 1.45, "learning_rate": 8.286775204201581e-05, "loss": 0.0069, "step": 286920 }, { "epoch": 1.45, "learning_rate": 8.28601843490018e-05, "loss": 0.0092, "step": 286930 }, { "epoch": 1.45, "learning_rate": 8.28526166559878e-05, "loss": 0.0095, "step": 286940 }, { "epoch": 1.45, "learning_rate": 8.284504896297378e-05, "loss": 0.0075, "step": 286950 }, { "epoch": 1.45, "learning_rate": 8.283748126995978e-05, "loss": 0.0052, "step": 286960 }, { "epoch": 1.45, "learning_rate": 8.282991357694577e-05, "loss": 0.0072, "step": 286970 }, { "epoch": 1.45, "learning_rate": 8.282234588393175e-05, "loss": 0.0081, "step": 286980 }, { "epoch": 1.45, "learning_rate": 8.281477819091775e-05, "loss": 0.0067, "step": 286990 }, { "epoch": 1.45, "learning_rate": 8.280721049790373e-05, "loss": 0.0068, "step": 287000 }, { "epoch": 1.45, "eval_cer": 0.9144333808503969, "eval_loss": 0.0057329838164150715, "eval_runtime": 115.5304, "eval_samples_per_second": 17.311, "eval_steps_per_second": 4.328, "step": 287000 }, { "epoch": 1.45, "learning_rate": 8.279964280488972e-05, "loss": 0.007, "step": 287010 }, { "epoch": 1.45, "learning_rate": 8.279207511187572e-05, "loss": 0.007, "step": 287020 }, { "epoch": 1.45, "learning_rate": 8.27845074188617e-05, "loss": 0.0062, "step": 287030 }, { "epoch": 1.45, "learning_rate": 8.27769397258477e-05, "loss": 0.0058, "step": 287040 }, { "epoch": 1.45, "learning_rate": 8.276937203283369e-05, "loss": 0.0082, "step": 287050 }, { "epoch": 1.45, "learning_rate": 8.276180433981967e-05, "loss": 0.0064, "step": 287060 }, { "epoch": 1.45, "learning_rate": 8.275423664680567e-05, "loss": 0.0075, "step": 287070 }, { "epoch": 1.45, "learning_rate": 8.274666895379166e-05, "loss": 0.0094, "step": 287080 }, { "epoch": 1.45, "learning_rate": 8.273910126077764e-05, "loss": 0.0068, "step": 287090 }, { "epoch": 1.45, "learning_rate": 8.273153356776364e-05, "loss": 0.0068, "step": 287100 }, { "epoch": 1.45, "learning_rate": 8.272396587474962e-05, "loss": 0.0054, "step": 287110 }, { "epoch": 1.45, "learning_rate": 8.271639818173562e-05, "loss": 0.0068, "step": 287120 }, { "epoch": 1.45, "learning_rate": 8.270883048872161e-05, "loss": 0.0065, "step": 287130 }, { "epoch": 1.45, "learning_rate": 8.270126279570759e-05, "loss": 0.0097, "step": 287140 }, { "epoch": 1.45, "learning_rate": 8.269369510269359e-05, "loss": 0.0064, "step": 287150 }, { "epoch": 1.45, "learning_rate": 8.268612740967958e-05, "loss": 0.0076, "step": 287160 }, { "epoch": 1.45, "learning_rate": 8.267855971666556e-05, "loss": 0.009, "step": 287170 }, { "epoch": 1.45, "learning_rate": 8.267099202365156e-05, "loss": 0.0066, "step": 287180 }, { "epoch": 1.45, "learning_rate": 8.266342433063754e-05, "loss": 0.0058, "step": 287190 }, { "epoch": 1.45, "learning_rate": 8.265585663762354e-05, "loss": 0.0064, "step": 287200 }, { "epoch": 1.45, "learning_rate": 8.264828894460953e-05, "loss": 0.0075, "step": 287210 }, { "epoch": 1.45, "learning_rate": 8.264072125159551e-05, "loss": 0.0097, "step": 287220 }, { "epoch": 1.45, "learning_rate": 8.26331535585815e-05, "loss": 0.0065, "step": 287230 }, { "epoch": 1.45, "learning_rate": 8.26255858655675e-05, "loss": 0.0105, "step": 287240 }, { "epoch": 1.45, "learning_rate": 8.261801817255348e-05, "loss": 0.0059, "step": 287250 }, { "epoch": 1.45, "learning_rate": 8.261045047953948e-05, "loss": 0.0071, "step": 287260 }, { "epoch": 1.45, "learning_rate": 8.260288278652546e-05, "loss": 0.0064, "step": 287270 }, { "epoch": 1.45, "learning_rate": 8.259531509351145e-05, "loss": 0.0086, "step": 287280 }, { "epoch": 1.45, "learning_rate": 8.258774740049745e-05, "loss": 0.0094, "step": 287290 }, { "epoch": 1.45, "learning_rate": 8.258017970748343e-05, "loss": 0.0055, "step": 287300 }, { "epoch": 1.45, "learning_rate": 8.257261201446943e-05, "loss": 0.0072, "step": 287310 }, { "epoch": 1.45, "learning_rate": 8.256504432145542e-05, "loss": 0.008, "step": 287320 }, { "epoch": 1.45, "learning_rate": 8.25574766284414e-05, "loss": 0.0085, "step": 287330 }, { "epoch": 1.45, "learning_rate": 8.25499089354274e-05, "loss": 0.009, "step": 287340 }, { "epoch": 1.45, "learning_rate": 8.254234124241338e-05, "loss": 0.0091, "step": 287350 }, { "epoch": 1.45, "learning_rate": 8.253477354939937e-05, "loss": 0.0068, "step": 287360 }, { "epoch": 1.45, "learning_rate": 8.252720585638537e-05, "loss": 0.0078, "step": 287370 }, { "epoch": 1.45, "learning_rate": 8.251963816337135e-05, "loss": 0.0068, "step": 287380 }, { "epoch": 1.45, "learning_rate": 8.251207047035735e-05, "loss": 0.0066, "step": 287390 }, { "epoch": 1.45, "learning_rate": 8.250450277734334e-05, "loss": 0.0074, "step": 287400 }, { "epoch": 1.45, "learning_rate": 8.249693508432932e-05, "loss": 0.0062, "step": 287410 }, { "epoch": 1.45, "learning_rate": 8.248936739131532e-05, "loss": 0.0079, "step": 287420 }, { "epoch": 1.45, "learning_rate": 8.24817996983013e-05, "loss": 0.0056, "step": 287430 }, { "epoch": 1.45, "learning_rate": 8.247423200528729e-05, "loss": 0.0096, "step": 287440 }, { "epoch": 1.45, "learning_rate": 8.246666431227329e-05, "loss": 0.0087, "step": 287450 }, { "epoch": 1.45, "learning_rate": 8.245909661925927e-05, "loss": 0.0084, "step": 287460 }, { "epoch": 1.45, "learning_rate": 8.245152892624526e-05, "loss": 0.0082, "step": 287470 }, { "epoch": 1.45, "learning_rate": 8.244396123323126e-05, "loss": 0.0084, "step": 287480 }, { "epoch": 1.45, "learning_rate": 8.243639354021724e-05, "loss": 0.0068, "step": 287490 }, { "epoch": 1.45, "learning_rate": 8.242882584720324e-05, "loss": 0.0081, "step": 287500 }, { "epoch": 1.45, "learning_rate": 8.242125815418922e-05, "loss": 0.0074, "step": 287510 }, { "epoch": 1.45, "learning_rate": 8.24136904611752e-05, "loss": 0.0046, "step": 287520 }, { "epoch": 1.45, "learning_rate": 8.240612276816118e-05, "loss": 0.0074, "step": 287530 }, { "epoch": 1.45, "learning_rate": 8.239855507514718e-05, "loss": 0.0061, "step": 287540 }, { "epoch": 1.45, "learning_rate": 8.239098738213317e-05, "loss": 0.0058, "step": 287550 }, { "epoch": 1.45, "learning_rate": 8.238341968911915e-05, "loss": 0.0062, "step": 287560 }, { "epoch": 1.45, "learning_rate": 8.237585199610515e-05, "loss": 0.0066, "step": 287570 }, { "epoch": 1.45, "learning_rate": 8.236828430309114e-05, "loss": 0.007, "step": 287580 }, { "epoch": 1.45, "learning_rate": 8.236071661007712e-05, "loss": 0.0066, "step": 287590 }, { "epoch": 1.45, "learning_rate": 8.235314891706312e-05, "loss": 0.0054, "step": 287600 }, { "epoch": 1.45, "learning_rate": 8.234558122404911e-05, "loss": 0.0071, "step": 287610 }, { "epoch": 1.45, "learning_rate": 8.23380135310351e-05, "loss": 0.0067, "step": 287620 }, { "epoch": 1.45, "learning_rate": 8.233044583802109e-05, "loss": 0.0093, "step": 287630 }, { "epoch": 1.45, "learning_rate": 8.232287814500707e-05, "loss": 0.0099, "step": 287640 }, { "epoch": 1.45, "learning_rate": 8.231531045199307e-05, "loss": 0.0072, "step": 287650 }, { "epoch": 1.45, "learning_rate": 8.230774275897906e-05, "loss": 0.007, "step": 287660 }, { "epoch": 1.45, "learning_rate": 8.230017506596504e-05, "loss": 0.0058, "step": 287670 }, { "epoch": 1.45, "learning_rate": 8.229260737295104e-05, "loss": 0.0081, "step": 287680 }, { "epoch": 1.45, "learning_rate": 8.228503967993703e-05, "loss": 0.0074, "step": 287690 }, { "epoch": 1.45, "learning_rate": 8.227747198692301e-05, "loss": 0.0076, "step": 287700 }, { "epoch": 1.45, "learning_rate": 8.226990429390901e-05, "loss": 0.008, "step": 287710 }, { "epoch": 1.45, "learning_rate": 8.226233660089499e-05, "loss": 0.0089, "step": 287720 }, { "epoch": 1.45, "learning_rate": 8.225476890788099e-05, "loss": 0.0065, "step": 287730 }, { "epoch": 1.45, "learning_rate": 8.224720121486698e-05, "loss": 0.0086, "step": 287740 }, { "epoch": 1.45, "learning_rate": 8.223963352185296e-05, "loss": 0.0077, "step": 287750 }, { "epoch": 1.45, "learning_rate": 8.223206582883896e-05, "loss": 0.0065, "step": 287760 }, { "epoch": 1.45, "learning_rate": 8.222449813582495e-05, "loss": 0.0069, "step": 287770 }, { "epoch": 1.45, "learning_rate": 8.221693044281093e-05, "loss": 0.0077, "step": 287780 }, { "epoch": 1.45, "learning_rate": 8.220936274979693e-05, "loss": 0.0054, "step": 287790 }, { "epoch": 1.45, "learning_rate": 8.220179505678291e-05, "loss": 0.0068, "step": 287800 }, { "epoch": 1.45, "learning_rate": 8.21942273637689e-05, "loss": 0.0057, "step": 287810 }, { "epoch": 1.45, "learning_rate": 8.21866596707549e-05, "loss": 0.007, "step": 287820 }, { "epoch": 1.45, "learning_rate": 8.217909197774088e-05, "loss": 0.0058, "step": 287830 }, { "epoch": 1.45, "learning_rate": 8.217152428472688e-05, "loss": 0.0104, "step": 287840 }, { "epoch": 1.45, "learning_rate": 8.216395659171287e-05, "loss": 0.005, "step": 287850 }, { "epoch": 1.45, "learning_rate": 8.215638889869885e-05, "loss": 0.0082, "step": 287860 }, { "epoch": 1.45, "learning_rate": 8.214882120568485e-05, "loss": 0.0084, "step": 287870 }, { "epoch": 1.45, "learning_rate": 8.214125351267083e-05, "loss": 0.0087, "step": 287880 }, { "epoch": 1.45, "learning_rate": 8.213368581965682e-05, "loss": 0.0069, "step": 287890 }, { "epoch": 1.45, "learning_rate": 8.212611812664282e-05, "loss": 0.0068, "step": 287900 }, { "epoch": 1.45, "learning_rate": 8.21185504336288e-05, "loss": 0.0085, "step": 287910 }, { "epoch": 1.45, "learning_rate": 8.21109827406148e-05, "loss": 0.0092, "step": 287920 }, { "epoch": 1.45, "learning_rate": 8.210341504760079e-05, "loss": 0.0063, "step": 287930 }, { "epoch": 1.45, "learning_rate": 8.209584735458677e-05, "loss": 0.0071, "step": 287940 }, { "epoch": 1.45, "learning_rate": 8.208827966157277e-05, "loss": 0.0086, "step": 287950 }, { "epoch": 1.45, "learning_rate": 8.208071196855875e-05, "loss": 0.0058, "step": 287960 }, { "epoch": 1.45, "learning_rate": 8.207314427554474e-05, "loss": 0.0076, "step": 287970 }, { "epoch": 1.45, "learning_rate": 8.206557658253074e-05, "loss": 0.0079, "step": 287980 }, { "epoch": 1.45, "learning_rate": 8.205800888951672e-05, "loss": 0.0071, "step": 287990 }, { "epoch": 1.45, "learning_rate": 8.205044119650271e-05, "loss": 0.0098, "step": 288000 }, { "epoch": 1.45, "eval_cer": 0.9144294992658953, "eval_loss": 0.005808565299957991, "eval_runtime": 115.5954, "eval_samples_per_second": 17.302, "eval_steps_per_second": 4.325, "step": 288000 }, { "epoch": 1.45, "learning_rate": 8.204287350348871e-05, "loss": 0.0074, "step": 288010 }, { "epoch": 1.45, "learning_rate": 8.203530581047469e-05, "loss": 0.005, "step": 288020 }, { "epoch": 1.45, "learning_rate": 8.202773811746069e-05, "loss": 0.0085, "step": 288030 }, { "epoch": 1.45, "learning_rate": 8.202017042444667e-05, "loss": 0.0083, "step": 288040 }, { "epoch": 1.45, "learning_rate": 8.201260273143266e-05, "loss": 0.0062, "step": 288050 }, { "epoch": 1.45, "learning_rate": 8.200503503841866e-05, "loss": 0.0086, "step": 288060 }, { "epoch": 1.45, "learning_rate": 8.199746734540464e-05, "loss": 0.0069, "step": 288070 }, { "epoch": 1.45, "learning_rate": 8.198989965239063e-05, "loss": 0.0068, "step": 288080 }, { "epoch": 1.45, "learning_rate": 8.198233195937663e-05, "loss": 0.0066, "step": 288090 }, { "epoch": 1.45, "learning_rate": 8.197476426636261e-05, "loss": 0.0067, "step": 288100 }, { "epoch": 1.45, "learning_rate": 8.19671965733486e-05, "loss": 0.007, "step": 288110 }, { "epoch": 1.45, "learning_rate": 8.19596288803346e-05, "loss": 0.0069, "step": 288120 }, { "epoch": 1.45, "learning_rate": 8.195206118732058e-05, "loss": 0.0069, "step": 288130 }, { "epoch": 1.45, "learning_rate": 8.194449349430658e-05, "loss": 0.0068, "step": 288140 }, { "epoch": 1.45, "learning_rate": 8.193692580129254e-05, "loss": 0.0056, "step": 288150 }, { "epoch": 1.45, "learning_rate": 8.192935810827854e-05, "loss": 0.0062, "step": 288160 }, { "epoch": 1.45, "learning_rate": 8.192179041526452e-05, "loss": 0.0079, "step": 288170 }, { "epoch": 1.45, "learning_rate": 8.191422272225052e-05, "loss": 0.008, "step": 288180 }, { "epoch": 1.45, "learning_rate": 8.190665502923651e-05, "loss": 0.0058, "step": 288190 }, { "epoch": 1.45, "learning_rate": 8.189908733622249e-05, "loss": 0.0078, "step": 288200 }, { "epoch": 1.45, "learning_rate": 8.189151964320849e-05, "loss": 0.0065, "step": 288210 }, { "epoch": 1.45, "learning_rate": 8.188395195019448e-05, "loss": 0.0079, "step": 288220 }, { "epoch": 1.45, "learning_rate": 8.187638425718046e-05, "loss": 0.0089, "step": 288230 }, { "epoch": 1.45, "learning_rate": 8.186881656416646e-05, "loss": 0.0086, "step": 288240 }, { "epoch": 1.45, "learning_rate": 8.186124887115244e-05, "loss": 0.0064, "step": 288250 }, { "epoch": 1.45, "learning_rate": 8.185368117813844e-05, "loss": 0.0069, "step": 288260 }, { "epoch": 1.45, "learning_rate": 8.184611348512443e-05, "loss": 0.0079, "step": 288270 }, { "epoch": 1.45, "learning_rate": 8.183854579211041e-05, "loss": 0.0076, "step": 288280 }, { "epoch": 1.45, "learning_rate": 8.18309780990964e-05, "loss": 0.0061, "step": 288290 }, { "epoch": 1.45, "learning_rate": 8.18234104060824e-05, "loss": 0.0063, "step": 288300 }, { "epoch": 1.45, "learning_rate": 8.181584271306838e-05, "loss": 0.0061, "step": 288310 }, { "epoch": 1.45, "learning_rate": 8.180827502005438e-05, "loss": 0.0076, "step": 288320 }, { "epoch": 1.45, "learning_rate": 8.180070732704036e-05, "loss": 0.0059, "step": 288330 }, { "epoch": 1.45, "learning_rate": 8.179313963402635e-05, "loss": 0.0086, "step": 288340 }, { "epoch": 1.45, "learning_rate": 8.178557194101235e-05, "loss": 0.0069, "step": 288350 }, { "epoch": 1.45, "learning_rate": 8.177800424799833e-05, "loss": 0.0077, "step": 288360 }, { "epoch": 1.45, "learning_rate": 8.177043655498433e-05, "loss": 0.0094, "step": 288370 }, { "epoch": 1.45, "learning_rate": 8.176286886197032e-05, "loss": 0.0085, "step": 288380 }, { "epoch": 1.45, "learning_rate": 8.17553011689563e-05, "loss": 0.0101, "step": 288390 }, { "epoch": 1.46, "learning_rate": 8.17477334759423e-05, "loss": 0.0065, "step": 288400 }, { "epoch": 1.46, "learning_rate": 8.174016578292828e-05, "loss": 0.0088, "step": 288410 }, { "epoch": 1.46, "learning_rate": 8.173259808991427e-05, "loss": 0.0083, "step": 288420 }, { "epoch": 1.46, "learning_rate": 8.172503039690027e-05, "loss": 0.0097, "step": 288430 }, { "epoch": 1.46, "learning_rate": 8.171746270388625e-05, "loss": 0.0067, "step": 288440 }, { "epoch": 1.46, "learning_rate": 8.170989501087225e-05, "loss": 0.0082, "step": 288450 }, { "epoch": 1.46, "learning_rate": 8.170232731785824e-05, "loss": 0.0073, "step": 288460 }, { "epoch": 1.46, "learning_rate": 8.169475962484422e-05, "loss": 0.0065, "step": 288470 }, { "epoch": 1.46, "learning_rate": 8.168719193183022e-05, "loss": 0.0098, "step": 288480 }, { "epoch": 1.46, "learning_rate": 8.16796242388162e-05, "loss": 0.0086, "step": 288490 }, { "epoch": 1.46, "learning_rate": 8.167205654580219e-05, "loss": 0.0061, "step": 288500 }, { "epoch": 1.46, "learning_rate": 8.166448885278819e-05, "loss": 0.0107, "step": 288510 }, { "epoch": 1.46, "learning_rate": 8.165692115977417e-05, "loss": 0.0065, "step": 288520 }, { "epoch": 1.46, "learning_rate": 8.164935346676016e-05, "loss": 0.0061, "step": 288530 }, { "epoch": 1.46, "learning_rate": 8.164178577374616e-05, "loss": 0.0061, "step": 288540 }, { "epoch": 1.46, "learning_rate": 8.163421808073214e-05, "loss": 0.0062, "step": 288550 }, { "epoch": 1.46, "learning_rate": 8.162665038771814e-05, "loss": 0.0097, "step": 288560 }, { "epoch": 1.46, "learning_rate": 8.161908269470413e-05, "loss": 0.0077, "step": 288570 }, { "epoch": 1.46, "learning_rate": 8.161151500169011e-05, "loss": 0.0095, "step": 288580 }, { "epoch": 1.46, "learning_rate": 8.160394730867611e-05, "loss": 0.0089, "step": 288590 }, { "epoch": 1.46, "learning_rate": 8.159637961566209e-05, "loss": 0.0075, "step": 288600 }, { "epoch": 1.46, "learning_rate": 8.158881192264808e-05, "loss": 0.0066, "step": 288610 }, { "epoch": 1.46, "learning_rate": 8.158124422963408e-05, "loss": 0.0055, "step": 288620 }, { "epoch": 1.46, "learning_rate": 8.157367653662006e-05, "loss": 0.0078, "step": 288630 }, { "epoch": 1.46, "learning_rate": 8.156610884360606e-05, "loss": 0.0053, "step": 288640 }, { "epoch": 1.46, "learning_rate": 8.155854115059205e-05, "loss": 0.0089, "step": 288650 }, { "epoch": 1.46, "learning_rate": 8.155097345757803e-05, "loss": 0.0053, "step": 288660 }, { "epoch": 1.46, "learning_rate": 8.154340576456403e-05, "loss": 0.0068, "step": 288670 }, { "epoch": 1.46, "learning_rate": 8.153583807155001e-05, "loss": 0.0097, "step": 288680 }, { "epoch": 1.46, "learning_rate": 8.1528270378536e-05, "loss": 0.0109, "step": 288690 }, { "epoch": 1.46, "learning_rate": 8.1520702685522e-05, "loss": 0.006, "step": 288700 }, { "epoch": 1.46, "learning_rate": 8.151313499250798e-05, "loss": 0.0065, "step": 288710 }, { "epoch": 1.46, "learning_rate": 8.150556729949397e-05, "loss": 0.0056, "step": 288720 }, { "epoch": 1.46, "learning_rate": 8.149799960647997e-05, "loss": 0.0076, "step": 288730 }, { "epoch": 1.46, "learning_rate": 8.149043191346595e-05, "loss": 0.0064, "step": 288740 }, { "epoch": 1.46, "learning_rate": 8.148286422045195e-05, "loss": 0.0078, "step": 288750 }, { "epoch": 1.46, "learning_rate": 8.147529652743793e-05, "loss": 0.0084, "step": 288760 }, { "epoch": 1.46, "learning_rate": 8.146772883442391e-05, "loss": 0.0084, "step": 288770 }, { "epoch": 1.46, "learning_rate": 8.146016114140989e-05, "loss": 0.0103, "step": 288780 }, { "epoch": 1.46, "learning_rate": 8.145259344839589e-05, "loss": 0.007, "step": 288790 }, { "epoch": 1.46, "learning_rate": 8.144502575538188e-05, "loss": 0.006, "step": 288800 }, { "epoch": 1.46, "learning_rate": 8.143745806236786e-05, "loss": 0.008, "step": 288810 }, { "epoch": 1.46, "learning_rate": 8.142989036935386e-05, "loss": 0.0071, "step": 288820 }, { "epoch": 1.46, "learning_rate": 8.142232267633985e-05, "loss": 0.0088, "step": 288830 }, { "epoch": 1.46, "learning_rate": 8.141475498332583e-05, "loss": 0.0061, "step": 288840 }, { "epoch": 1.46, "learning_rate": 8.140718729031183e-05, "loss": 0.0086, "step": 288850 }, { "epoch": 1.46, "learning_rate": 8.139961959729781e-05, "loss": 0.0082, "step": 288860 }, { "epoch": 1.46, "learning_rate": 8.13920519042838e-05, "loss": 0.0092, "step": 288870 }, { "epoch": 1.46, "learning_rate": 8.13844842112698e-05, "loss": 0.0092, "step": 288880 }, { "epoch": 1.46, "learning_rate": 8.137691651825578e-05, "loss": 0.008, "step": 288890 }, { "epoch": 1.46, "learning_rate": 8.136934882524178e-05, "loss": 0.0065, "step": 288900 }, { "epoch": 1.46, "learning_rate": 8.136178113222777e-05, "loss": 0.0061, "step": 288910 }, { "epoch": 1.46, "learning_rate": 8.135421343921375e-05, "loss": 0.007, "step": 288920 }, { "epoch": 1.46, "learning_rate": 8.134664574619975e-05, "loss": 0.0085, "step": 288930 }, { "epoch": 1.46, "learning_rate": 8.133907805318573e-05, "loss": 0.0088, "step": 288940 }, { "epoch": 1.46, "learning_rate": 8.133151036017172e-05, "loss": 0.0088, "step": 288950 }, { "epoch": 1.46, "learning_rate": 8.132394266715772e-05, "loss": 0.0072, "step": 288960 }, { "epoch": 1.46, "learning_rate": 8.13163749741437e-05, "loss": 0.0075, "step": 288970 }, { "epoch": 1.46, "learning_rate": 8.13088072811297e-05, "loss": 0.0079, "step": 288980 }, { "epoch": 1.46, "learning_rate": 8.130123958811569e-05, "loss": 0.0069, "step": 288990 }, { "epoch": 1.46, "learning_rate": 8.129367189510167e-05, "loss": 0.0077, "step": 289000 }, { "epoch": 1.46, "eval_cer": 0.9144401736232748, "eval_loss": 0.005669711157679558, "eval_runtime": 115.6193, "eval_samples_per_second": 17.298, "eval_steps_per_second": 4.325, "step": 289000 }, { "epoch": 1.46, "learning_rate": 8.128610420208767e-05, "loss": 0.0083, "step": 289010 }, { "epoch": 1.46, "learning_rate": 8.127853650907366e-05, "loss": 0.0078, "step": 289020 }, { "epoch": 1.46, "learning_rate": 8.127096881605964e-05, "loss": 0.0074, "step": 289030 }, { "epoch": 1.46, "learning_rate": 8.126340112304564e-05, "loss": 0.0092, "step": 289040 }, { "epoch": 1.46, "learning_rate": 8.125583343003162e-05, "loss": 0.0096, "step": 289050 }, { "epoch": 1.46, "learning_rate": 8.124826573701761e-05, "loss": 0.0076, "step": 289060 }, { "epoch": 1.46, "learning_rate": 8.124069804400361e-05, "loss": 0.0094, "step": 289070 }, { "epoch": 1.46, "learning_rate": 8.123313035098959e-05, "loss": 0.0089, "step": 289080 }, { "epoch": 1.46, "learning_rate": 8.122556265797559e-05, "loss": 0.0081, "step": 289090 }, { "epoch": 1.46, "learning_rate": 8.121799496496158e-05, "loss": 0.0074, "step": 289100 }, { "epoch": 1.46, "learning_rate": 8.121042727194756e-05, "loss": 0.0086, "step": 289110 }, { "epoch": 1.46, "learning_rate": 8.120285957893356e-05, "loss": 0.0066, "step": 289120 }, { "epoch": 1.46, "learning_rate": 8.119529188591954e-05, "loss": 0.0077, "step": 289130 }, { "epoch": 1.46, "learning_rate": 8.118772419290553e-05, "loss": 0.0051, "step": 289140 }, { "epoch": 1.46, "learning_rate": 8.118015649989153e-05, "loss": 0.0075, "step": 289150 }, { "epoch": 1.46, "learning_rate": 8.117258880687751e-05, "loss": 0.0066, "step": 289160 }, { "epoch": 1.46, "learning_rate": 8.11650211138635e-05, "loss": 0.0078, "step": 289170 }, { "epoch": 1.46, "learning_rate": 8.11574534208495e-05, "loss": 0.0134, "step": 289180 }, { "epoch": 1.46, "learning_rate": 8.114988572783548e-05, "loss": 0.0069, "step": 289190 }, { "epoch": 1.46, "learning_rate": 8.114231803482148e-05, "loss": 0.0054, "step": 289200 }, { "epoch": 1.46, "learning_rate": 8.113475034180746e-05, "loss": 0.0081, "step": 289210 }, { "epoch": 1.46, "learning_rate": 8.112718264879345e-05, "loss": 0.0065, "step": 289220 }, { "epoch": 1.46, "learning_rate": 8.111961495577945e-05, "loss": 0.0126, "step": 289230 }, { "epoch": 1.46, "learning_rate": 8.111204726276543e-05, "loss": 0.0083, "step": 289240 }, { "epoch": 1.46, "learning_rate": 8.110447956975142e-05, "loss": 0.0057, "step": 289250 }, { "epoch": 1.46, "learning_rate": 8.109691187673742e-05, "loss": 0.0074, "step": 289260 }, { "epoch": 1.46, "learning_rate": 8.10893441837234e-05, "loss": 0.0083, "step": 289270 }, { "epoch": 1.46, "learning_rate": 8.10817764907094e-05, "loss": 0.0078, "step": 289280 }, { "epoch": 1.46, "learning_rate": 8.107420879769538e-05, "loss": 0.0091, "step": 289290 }, { "epoch": 1.46, "learning_rate": 8.106664110468137e-05, "loss": 0.0087, "step": 289300 }, { "epoch": 1.46, "learning_rate": 8.105907341166737e-05, "loss": 0.0074, "step": 289310 }, { "epoch": 1.46, "learning_rate": 8.105150571865335e-05, "loss": 0.0129, "step": 289320 }, { "epoch": 1.46, "learning_rate": 8.104393802563934e-05, "loss": 0.0071, "step": 289330 }, { "epoch": 1.46, "learning_rate": 8.103637033262534e-05, "loss": 0.0109, "step": 289340 }, { "epoch": 1.46, "learning_rate": 8.102880263961132e-05, "loss": 0.0089, "step": 289350 }, { "epoch": 1.46, "learning_rate": 8.102123494659732e-05, "loss": 0.0071, "step": 289360 }, { "epoch": 1.46, "learning_rate": 8.10136672535833e-05, "loss": 0.0074, "step": 289370 }, { "epoch": 1.46, "learning_rate": 8.100609956056929e-05, "loss": 0.0107, "step": 289380 }, { "epoch": 1.46, "learning_rate": 8.099853186755529e-05, "loss": 0.0076, "step": 289390 }, { "epoch": 1.46, "learning_rate": 8.099096417454125e-05, "loss": 0.0075, "step": 289400 }, { "epoch": 1.46, "learning_rate": 8.098339648152725e-05, "loss": 0.0066, "step": 289410 }, { "epoch": 1.46, "learning_rate": 8.097582878851323e-05, "loss": 0.0068, "step": 289420 }, { "epoch": 1.46, "learning_rate": 8.096826109549923e-05, "loss": 0.0068, "step": 289430 }, { "epoch": 1.46, "learning_rate": 8.096069340248522e-05, "loss": 0.0068, "step": 289440 }, { "epoch": 1.46, "learning_rate": 8.09531257094712e-05, "loss": 0.0061, "step": 289450 }, { "epoch": 1.46, "learning_rate": 8.09455580164572e-05, "loss": 0.0067, "step": 289460 }, { "epoch": 1.46, "learning_rate": 8.093799032344318e-05, "loss": 0.0075, "step": 289470 }, { "epoch": 1.46, "learning_rate": 8.093042263042917e-05, "loss": 0.0092, "step": 289480 }, { "epoch": 1.46, "learning_rate": 8.092285493741517e-05, "loss": 0.0063, "step": 289490 }, { "epoch": 1.46, "learning_rate": 8.091528724440115e-05, "loss": 0.0077, "step": 289500 }, { "epoch": 1.46, "learning_rate": 8.090771955138715e-05, "loss": 0.0061, "step": 289510 }, { "epoch": 1.46, "learning_rate": 8.090015185837314e-05, "loss": 0.0064, "step": 289520 }, { "epoch": 1.46, "learning_rate": 8.089258416535912e-05, "loss": 0.0069, "step": 289530 }, { "epoch": 1.46, "learning_rate": 8.088501647234512e-05, "loss": 0.0076, "step": 289540 }, { "epoch": 1.46, "learning_rate": 8.087744877933111e-05, "loss": 0.0095, "step": 289550 }, { "epoch": 1.46, "learning_rate": 8.08698810863171e-05, "loss": 0.0064, "step": 289560 }, { "epoch": 1.46, "learning_rate": 8.086231339330309e-05, "loss": 0.0063, "step": 289570 }, { "epoch": 1.46, "learning_rate": 8.085474570028907e-05, "loss": 0.0075, "step": 289580 }, { "epoch": 1.46, "learning_rate": 8.084717800727506e-05, "loss": 0.0087, "step": 289590 }, { "epoch": 1.46, "learning_rate": 8.083961031426106e-05, "loss": 0.0085, "step": 289600 }, { "epoch": 1.46, "learning_rate": 8.083204262124704e-05, "loss": 0.0058, "step": 289610 }, { "epoch": 1.46, "learning_rate": 8.082447492823304e-05, "loss": 0.0068, "step": 289620 }, { "epoch": 1.46, "learning_rate": 8.081690723521903e-05, "loss": 0.0084, "step": 289630 }, { "epoch": 1.46, "learning_rate": 8.080933954220501e-05, "loss": 0.007, "step": 289640 }, { "epoch": 1.46, "learning_rate": 8.080177184919101e-05, "loss": 0.0063, "step": 289650 }, { "epoch": 1.46, "learning_rate": 8.079420415617699e-05, "loss": 0.0074, "step": 289660 }, { "epoch": 1.46, "learning_rate": 8.078663646316298e-05, "loss": 0.0075, "step": 289670 }, { "epoch": 1.46, "learning_rate": 8.077906877014898e-05, "loss": 0.0087, "step": 289680 }, { "epoch": 1.46, "learning_rate": 8.077150107713496e-05, "loss": 0.0083, "step": 289690 }, { "epoch": 1.46, "learning_rate": 8.076393338412096e-05, "loss": 0.0081, "step": 289700 }, { "epoch": 1.46, "learning_rate": 8.075636569110695e-05, "loss": 0.0069, "step": 289710 }, { "epoch": 1.46, "learning_rate": 8.074879799809293e-05, "loss": 0.0067, "step": 289720 }, { "epoch": 1.46, "learning_rate": 8.074123030507893e-05, "loss": 0.0077, "step": 289730 }, { "epoch": 1.46, "learning_rate": 8.073366261206491e-05, "loss": 0.0057, "step": 289740 }, { "epoch": 1.46, "learning_rate": 8.07260949190509e-05, "loss": 0.0068, "step": 289750 }, { "epoch": 1.46, "learning_rate": 8.07185272260369e-05, "loss": 0.0092, "step": 289760 }, { "epoch": 1.46, "learning_rate": 8.071095953302288e-05, "loss": 0.0071, "step": 289770 }, { "epoch": 1.46, "learning_rate": 8.070339184000887e-05, "loss": 0.0061, "step": 289780 }, { "epoch": 1.46, "learning_rate": 8.069582414699487e-05, "loss": 0.0079, "step": 289790 }, { "epoch": 1.46, "learning_rate": 8.068825645398085e-05, "loss": 0.007, "step": 289800 }, { "epoch": 1.46, "learning_rate": 8.068068876096685e-05, "loss": 0.0064, "step": 289810 }, { "epoch": 1.46, "learning_rate": 8.067312106795283e-05, "loss": 0.0073, "step": 289820 }, { "epoch": 1.46, "learning_rate": 8.066555337493882e-05, "loss": 0.0079, "step": 289830 }, { "epoch": 1.46, "learning_rate": 8.065798568192482e-05, "loss": 0.007, "step": 289840 }, { "epoch": 1.46, "learning_rate": 8.06504179889108e-05, "loss": 0.0076, "step": 289850 }, { "epoch": 1.46, "learning_rate": 8.06428502958968e-05, "loss": 0.0075, "step": 289860 }, { "epoch": 1.46, "learning_rate": 8.063528260288279e-05, "loss": 0.0061, "step": 289870 }, { "epoch": 1.46, "learning_rate": 8.062771490986877e-05, "loss": 0.0087, "step": 289880 }, { "epoch": 1.46, "learning_rate": 8.062014721685477e-05, "loss": 0.0097, "step": 289890 }, { "epoch": 1.46, "learning_rate": 8.061257952384075e-05, "loss": 0.0077, "step": 289900 }, { "epoch": 1.46, "learning_rate": 8.060501183082674e-05, "loss": 0.0085, "step": 289910 }, { "epoch": 1.46, "learning_rate": 8.059744413781274e-05, "loss": 0.007, "step": 289920 }, { "epoch": 1.46, "learning_rate": 8.058987644479872e-05, "loss": 0.0067, "step": 289930 }, { "epoch": 1.46, "learning_rate": 8.058230875178471e-05, "loss": 0.0078, "step": 289940 }, { "epoch": 1.46, "learning_rate": 8.057474105877071e-05, "loss": 0.0072, "step": 289950 }, { "epoch": 1.46, "learning_rate": 8.056717336575669e-05, "loss": 0.0068, "step": 289960 }, { "epoch": 1.46, "learning_rate": 8.055960567274268e-05, "loss": 0.0086, "step": 289970 }, { "epoch": 1.46, "learning_rate": 8.055203797972867e-05, "loss": 0.0066, "step": 289980 }, { "epoch": 1.46, "learning_rate": 8.054447028671466e-05, "loss": 0.0083, "step": 289990 }, { "epoch": 1.46, "learning_rate": 8.053690259370066e-05, "loss": 0.0078, "step": 290000 }, { "epoch": 1.46, "eval_cer": 0.9144586111496574, "eval_loss": 0.005535100121051073, "eval_runtime": 115.6597, "eval_samples_per_second": 17.292, "eval_steps_per_second": 4.323, "step": 290000 }, { "epoch": 1.46, "learning_rate": 8.052933490068664e-05, "loss": 0.0064, "step": 290010 }, { "epoch": 1.46, "learning_rate": 8.052176720767263e-05, "loss": 0.0088, "step": 290020 }, { "epoch": 1.46, "learning_rate": 8.05141995146586e-05, "loss": 0.0092, "step": 290030 }, { "epoch": 1.46, "learning_rate": 8.05066318216446e-05, "loss": 0.01, "step": 290040 }, { "epoch": 1.46, "learning_rate": 8.049906412863059e-05, "loss": 0.0075, "step": 290050 }, { "epoch": 1.46, "learning_rate": 8.049149643561657e-05, "loss": 0.0086, "step": 290060 }, { "epoch": 1.46, "learning_rate": 8.048392874260257e-05, "loss": 0.0071, "step": 290070 }, { "epoch": 1.46, "learning_rate": 8.047636104958856e-05, "loss": 0.0067, "step": 290080 }, { "epoch": 1.46, "learning_rate": 8.046879335657454e-05, "loss": 0.0062, "step": 290090 }, { "epoch": 1.46, "learning_rate": 8.046122566356054e-05, "loss": 0.0078, "step": 290100 }, { "epoch": 1.46, "learning_rate": 8.045365797054652e-05, "loss": 0.0079, "step": 290110 }, { "epoch": 1.46, "learning_rate": 8.044609027753252e-05, "loss": 0.0057, "step": 290120 }, { "epoch": 1.46, "learning_rate": 8.043852258451851e-05, "loss": 0.0101, "step": 290130 }, { "epoch": 1.46, "learning_rate": 8.043095489150449e-05, "loss": 0.0063, "step": 290140 }, { "epoch": 1.46, "learning_rate": 8.042338719849049e-05, "loss": 0.0072, "step": 290150 }, { "epoch": 1.46, "learning_rate": 8.041581950547648e-05, "loss": 0.0078, "step": 290160 }, { "epoch": 1.46, "learning_rate": 8.040825181246246e-05, "loss": 0.007, "step": 290170 }, { "epoch": 1.46, "learning_rate": 8.040068411944846e-05, "loss": 0.0085, "step": 290180 }, { "epoch": 1.46, "learning_rate": 8.039311642643444e-05, "loss": 0.0089, "step": 290190 }, { "epoch": 1.46, "learning_rate": 8.038554873342043e-05, "loss": 0.0091, "step": 290200 }, { "epoch": 1.46, "learning_rate": 8.037798104040643e-05, "loss": 0.0055, "step": 290210 }, { "epoch": 1.46, "learning_rate": 8.037041334739241e-05, "loss": 0.0091, "step": 290220 }, { "epoch": 1.46, "learning_rate": 8.03628456543784e-05, "loss": 0.0073, "step": 290230 }, { "epoch": 1.46, "learning_rate": 8.03552779613644e-05, "loss": 0.0066, "step": 290240 }, { "epoch": 1.46, "learning_rate": 8.034771026835038e-05, "loss": 0.0065, "step": 290250 }, { "epoch": 1.46, "learning_rate": 8.034014257533638e-05, "loss": 0.008, "step": 290260 }, { "epoch": 1.46, "learning_rate": 8.033257488232236e-05, "loss": 0.006, "step": 290270 }, { "epoch": 1.46, "learning_rate": 8.032500718930835e-05, "loss": 0.0061, "step": 290280 }, { "epoch": 1.46, "learning_rate": 8.031743949629435e-05, "loss": 0.0073, "step": 290290 }, { "epoch": 1.46, "learning_rate": 8.030987180328033e-05, "loss": 0.0075, "step": 290300 }, { "epoch": 1.46, "learning_rate": 8.030230411026633e-05, "loss": 0.0068, "step": 290310 }, { "epoch": 1.46, "learning_rate": 8.029473641725232e-05, "loss": 0.0066, "step": 290320 }, { "epoch": 1.46, "learning_rate": 8.02871687242383e-05, "loss": 0.0066, "step": 290330 }, { "epoch": 1.46, "learning_rate": 8.02796010312243e-05, "loss": 0.0081, "step": 290340 }, { "epoch": 1.46, "learning_rate": 8.027203333821028e-05, "loss": 0.0063, "step": 290350 }, { "epoch": 1.46, "learning_rate": 8.026446564519627e-05, "loss": 0.0075, "step": 290360 }, { "epoch": 1.46, "learning_rate": 8.025689795218227e-05, "loss": 0.0081, "step": 290370 }, { "epoch": 1.46, "learning_rate": 8.024933025916825e-05, "loss": 0.0071, "step": 290380 }, { "epoch": 1.47, "learning_rate": 8.024176256615424e-05, "loss": 0.007, "step": 290390 }, { "epoch": 1.47, "learning_rate": 8.023419487314024e-05, "loss": 0.0057, "step": 290400 }, { "epoch": 1.47, "learning_rate": 8.022662718012622e-05, "loss": 0.0058, "step": 290410 }, { "epoch": 1.47, "learning_rate": 8.021905948711222e-05, "loss": 0.0077, "step": 290420 }, { "epoch": 1.47, "learning_rate": 8.02114917940982e-05, "loss": 0.0067, "step": 290430 }, { "epoch": 1.47, "learning_rate": 8.020392410108419e-05, "loss": 0.0058, "step": 290440 }, { "epoch": 1.47, "learning_rate": 8.019635640807019e-05, "loss": 0.0095, "step": 290450 }, { "epoch": 1.47, "learning_rate": 8.018878871505617e-05, "loss": 0.0098, "step": 290460 }, { "epoch": 1.47, "learning_rate": 8.018122102204216e-05, "loss": 0.0105, "step": 290470 }, { "epoch": 1.47, "learning_rate": 8.017365332902816e-05, "loss": 0.007, "step": 290480 }, { "epoch": 1.47, "learning_rate": 8.016608563601414e-05, "loss": 0.0059, "step": 290490 }, { "epoch": 1.47, "learning_rate": 8.015851794300014e-05, "loss": 0.0067, "step": 290500 }, { "epoch": 1.47, "learning_rate": 8.015095024998613e-05, "loss": 0.009, "step": 290510 }, { "epoch": 1.47, "learning_rate": 8.014338255697211e-05, "loss": 0.0062, "step": 290520 }, { "epoch": 1.47, "learning_rate": 8.01358148639581e-05, "loss": 0.0079, "step": 290530 }, { "epoch": 1.47, "learning_rate": 8.012824717094409e-05, "loss": 0.0063, "step": 290540 }, { "epoch": 1.47, "learning_rate": 8.012067947793008e-05, "loss": 0.0073, "step": 290550 }, { "epoch": 1.47, "learning_rate": 8.011311178491608e-05, "loss": 0.0069, "step": 290560 }, { "epoch": 1.47, "learning_rate": 8.010554409190206e-05, "loss": 0.0082, "step": 290570 }, { "epoch": 1.47, "learning_rate": 8.009797639888805e-05, "loss": 0.0099, "step": 290580 }, { "epoch": 1.47, "learning_rate": 8.009040870587405e-05, "loss": 0.0081, "step": 290590 }, { "epoch": 1.47, "learning_rate": 8.008284101286003e-05, "loss": 0.0058, "step": 290600 }, { "epoch": 1.47, "learning_rate": 8.007527331984603e-05, "loss": 0.0069, "step": 290610 }, { "epoch": 1.47, "learning_rate": 8.006770562683201e-05, "loss": 0.008, "step": 290620 }, { "epoch": 1.47, "learning_rate": 8.0060137933818e-05, "loss": 0.0076, "step": 290630 }, { "epoch": 1.47, "learning_rate": 8.0052570240804e-05, "loss": 0.0069, "step": 290640 }, { "epoch": 1.47, "learning_rate": 8.004500254778998e-05, "loss": 0.0066, "step": 290650 }, { "epoch": 1.47, "learning_rate": 8.003743485477596e-05, "loss": 0.0074, "step": 290660 }, { "epoch": 1.47, "learning_rate": 8.002986716176194e-05, "loss": 0.0059, "step": 290670 }, { "epoch": 1.47, "learning_rate": 8.002229946874794e-05, "loss": 0.0061, "step": 290680 }, { "epoch": 1.47, "learning_rate": 8.001473177573393e-05, "loss": 0.0069, "step": 290690 }, { "epoch": 1.47, "learning_rate": 8.000716408271991e-05, "loss": 0.0054, "step": 290700 }, { "epoch": 1.47, "learning_rate": 7.999959638970591e-05, "loss": 0.0069, "step": 290710 }, { "epoch": 1.47, "learning_rate": 7.999202869669189e-05, "loss": 0.0099, "step": 290720 }, { "epoch": 1.47, "learning_rate": 7.998446100367788e-05, "loss": 0.0087, "step": 290730 }, { "epoch": 1.47, "learning_rate": 7.997689331066388e-05, "loss": 0.008, "step": 290740 }, { "epoch": 1.47, "learning_rate": 7.996932561764986e-05, "loss": 0.0067, "step": 290750 }, { "epoch": 1.47, "learning_rate": 7.996175792463586e-05, "loss": 0.0086, "step": 290760 }, { "epoch": 1.47, "learning_rate": 7.995419023162185e-05, "loss": 0.0082, "step": 290770 }, { "epoch": 1.47, "learning_rate": 7.994662253860783e-05, "loss": 0.0076, "step": 290780 }, { "epoch": 1.47, "learning_rate": 7.993905484559383e-05, "loss": 0.0088, "step": 290790 }, { "epoch": 1.47, "learning_rate": 7.993148715257981e-05, "loss": 0.0075, "step": 290800 }, { "epoch": 1.47, "learning_rate": 7.99239194595658e-05, "loss": 0.0065, "step": 290810 }, { "epoch": 1.47, "learning_rate": 7.99163517665518e-05, "loss": 0.0085, "step": 290820 }, { "epoch": 1.47, "learning_rate": 7.990878407353778e-05, "loss": 0.0107, "step": 290830 }, { "epoch": 1.47, "learning_rate": 7.990121638052378e-05, "loss": 0.008, "step": 290840 }, { "epoch": 1.47, "learning_rate": 7.989364868750977e-05, "loss": 0.009, "step": 290850 }, { "epoch": 1.47, "learning_rate": 7.988608099449575e-05, "loss": 0.008, "step": 290860 }, { "epoch": 1.47, "learning_rate": 7.987851330148175e-05, "loss": 0.0079, "step": 290870 }, { "epoch": 1.47, "learning_rate": 7.987094560846773e-05, "loss": 0.0075, "step": 290880 }, { "epoch": 1.47, "learning_rate": 7.986337791545372e-05, "loss": 0.0104, "step": 290890 }, { "epoch": 1.47, "learning_rate": 7.985581022243972e-05, "loss": 0.0059, "step": 290900 }, { "epoch": 1.47, "learning_rate": 7.98482425294257e-05, "loss": 0.0065, "step": 290910 }, { "epoch": 1.47, "learning_rate": 7.98406748364117e-05, "loss": 0.0068, "step": 290920 }, { "epoch": 1.47, "learning_rate": 7.983310714339769e-05, "loss": 0.0076, "step": 290930 }, { "epoch": 1.47, "learning_rate": 7.982553945038367e-05, "loss": 0.0061, "step": 290940 }, { "epoch": 1.47, "learning_rate": 7.981797175736967e-05, "loss": 0.0078, "step": 290950 }, { "epoch": 1.47, "learning_rate": 7.981040406435566e-05, "loss": 0.0078, "step": 290960 }, { "epoch": 1.47, "learning_rate": 7.980283637134164e-05, "loss": 0.0056, "step": 290970 }, { "epoch": 1.47, "learning_rate": 7.979526867832764e-05, "loss": 0.0072, "step": 290980 }, { "epoch": 1.47, "learning_rate": 7.978770098531362e-05, "loss": 0.0065, "step": 290990 }, { "epoch": 1.47, "learning_rate": 7.978013329229961e-05, "loss": 0.0068, "step": 291000 }, { "epoch": 1.47, "eval_cer": 0.9144314400581461, "eval_loss": 0.00572578888386488, "eval_runtime": 115.7089, "eval_samples_per_second": 17.285, "eval_steps_per_second": 4.321, "step": 291000 }, { "epoch": 1.47, "learning_rate": 7.977256559928561e-05, "loss": 0.0074, "step": 291010 }, { "epoch": 1.47, "learning_rate": 7.976499790627159e-05, "loss": 0.0065, "step": 291020 }, { "epoch": 1.47, "learning_rate": 7.975743021325759e-05, "loss": 0.0072, "step": 291030 }, { "epoch": 1.47, "learning_rate": 7.974986252024358e-05, "loss": 0.0094, "step": 291040 }, { "epoch": 1.47, "learning_rate": 7.974229482722956e-05, "loss": 0.0063, "step": 291050 }, { "epoch": 1.47, "learning_rate": 7.973472713421556e-05, "loss": 0.0079, "step": 291060 }, { "epoch": 1.47, "learning_rate": 7.972715944120154e-05, "loss": 0.0072, "step": 291070 }, { "epoch": 1.47, "learning_rate": 7.971959174818753e-05, "loss": 0.0079, "step": 291080 }, { "epoch": 1.47, "learning_rate": 7.971202405517353e-05, "loss": 0.0082, "step": 291090 }, { "epoch": 1.47, "learning_rate": 7.970445636215951e-05, "loss": 0.0075, "step": 291100 }, { "epoch": 1.47, "learning_rate": 7.96968886691455e-05, "loss": 0.0072, "step": 291110 }, { "epoch": 1.47, "learning_rate": 7.96893209761315e-05, "loss": 0.0062, "step": 291120 }, { "epoch": 1.47, "learning_rate": 7.968175328311748e-05, "loss": 0.0069, "step": 291130 }, { "epoch": 1.47, "learning_rate": 7.967418559010348e-05, "loss": 0.0065, "step": 291140 }, { "epoch": 1.47, "learning_rate": 7.966661789708946e-05, "loss": 0.0064, "step": 291150 }, { "epoch": 1.47, "learning_rate": 7.965905020407545e-05, "loss": 0.0065, "step": 291160 }, { "epoch": 1.47, "learning_rate": 7.965148251106145e-05, "loss": 0.0084, "step": 291170 }, { "epoch": 1.47, "learning_rate": 7.964391481804743e-05, "loss": 0.0071, "step": 291180 }, { "epoch": 1.47, "learning_rate": 7.963634712503342e-05, "loss": 0.0065, "step": 291190 }, { "epoch": 1.47, "learning_rate": 7.962877943201942e-05, "loss": 0.0054, "step": 291200 }, { "epoch": 1.47, "learning_rate": 7.96212117390054e-05, "loss": 0.0094, "step": 291210 }, { "epoch": 1.47, "learning_rate": 7.96136440459914e-05, "loss": 0.0073, "step": 291220 }, { "epoch": 1.47, "learning_rate": 7.960607635297738e-05, "loss": 0.0085, "step": 291230 }, { "epoch": 1.47, "learning_rate": 7.959850865996337e-05, "loss": 0.007, "step": 291240 }, { "epoch": 1.47, "learning_rate": 7.959094096694937e-05, "loss": 0.0076, "step": 291250 }, { "epoch": 1.47, "learning_rate": 7.958337327393535e-05, "loss": 0.0101, "step": 291260 }, { "epoch": 1.47, "learning_rate": 7.957580558092134e-05, "loss": 0.0066, "step": 291270 }, { "epoch": 1.47, "learning_rate": 7.956823788790734e-05, "loss": 0.0074, "step": 291280 }, { "epoch": 1.47, "learning_rate": 7.95606701948933e-05, "loss": 0.0065, "step": 291290 }, { "epoch": 1.47, "learning_rate": 7.95531025018793e-05, "loss": 0.0066, "step": 291300 }, { "epoch": 1.47, "learning_rate": 7.954553480886528e-05, "loss": 0.0076, "step": 291310 }, { "epoch": 1.47, "learning_rate": 7.953796711585128e-05, "loss": 0.0076, "step": 291320 }, { "epoch": 1.47, "learning_rate": 7.953039942283726e-05, "loss": 0.0058, "step": 291330 }, { "epoch": 1.47, "learning_rate": 7.952283172982325e-05, "loss": 0.0048, "step": 291340 }, { "epoch": 1.47, "learning_rate": 7.951526403680925e-05, "loss": 0.0088, "step": 291350 }, { "epoch": 1.47, "learning_rate": 7.950769634379523e-05, "loss": 0.0076, "step": 291360 }, { "epoch": 1.47, "learning_rate": 7.950012865078123e-05, "loss": 0.0103, "step": 291370 }, { "epoch": 1.47, "learning_rate": 7.949256095776722e-05, "loss": 0.0063, "step": 291380 }, { "epoch": 1.47, "learning_rate": 7.94849932647532e-05, "loss": 0.0058, "step": 291390 }, { "epoch": 1.47, "learning_rate": 7.94774255717392e-05, "loss": 0.0081, "step": 291400 }, { "epoch": 1.47, "learning_rate": 7.946985787872518e-05, "loss": 0.0072, "step": 291410 }, { "epoch": 1.47, "learning_rate": 7.946229018571117e-05, "loss": 0.0056, "step": 291420 }, { "epoch": 1.47, "learning_rate": 7.945472249269717e-05, "loss": 0.0075, "step": 291430 }, { "epoch": 1.47, "learning_rate": 7.944715479968315e-05, "loss": 0.0101, "step": 291440 }, { "epoch": 1.47, "learning_rate": 7.943958710666914e-05, "loss": 0.0093, "step": 291450 }, { "epoch": 1.47, "learning_rate": 7.943201941365514e-05, "loss": 0.0067, "step": 291460 }, { "epoch": 1.47, "learning_rate": 7.942445172064112e-05, "loss": 0.006, "step": 291470 }, { "epoch": 1.47, "learning_rate": 7.941688402762712e-05, "loss": 0.0071, "step": 291480 }, { "epoch": 1.47, "learning_rate": 7.940931633461311e-05, "loss": 0.0074, "step": 291490 }, { "epoch": 1.47, "learning_rate": 7.940174864159909e-05, "loss": 0.0118, "step": 291500 }, { "epoch": 1.47, "learning_rate": 7.939418094858509e-05, "loss": 0.0119, "step": 291510 }, { "epoch": 1.47, "learning_rate": 7.938661325557107e-05, "loss": 0.0089, "step": 291520 }, { "epoch": 1.47, "learning_rate": 7.937904556255706e-05, "loss": 0.0066, "step": 291530 }, { "epoch": 1.47, "learning_rate": 7.937147786954306e-05, "loss": 0.0084, "step": 291540 }, { "epoch": 1.47, "learning_rate": 7.936391017652904e-05, "loss": 0.0069, "step": 291550 }, { "epoch": 1.47, "learning_rate": 7.935634248351504e-05, "loss": 0.0099, "step": 291560 }, { "epoch": 1.47, "learning_rate": 7.934877479050103e-05, "loss": 0.0138, "step": 291570 }, { "epoch": 1.47, "learning_rate": 7.934120709748701e-05, "loss": 0.0103, "step": 291580 }, { "epoch": 1.47, "learning_rate": 7.933363940447301e-05, "loss": 0.0076, "step": 291590 }, { "epoch": 1.47, "learning_rate": 7.932607171145899e-05, "loss": 0.0089, "step": 291600 }, { "epoch": 1.47, "learning_rate": 7.931850401844498e-05, "loss": 0.0085, "step": 291610 }, { "epoch": 1.47, "learning_rate": 7.931093632543098e-05, "loss": 0.0066, "step": 291620 }, { "epoch": 1.47, "learning_rate": 7.930336863241696e-05, "loss": 0.0063, "step": 291630 }, { "epoch": 1.47, "learning_rate": 7.929580093940295e-05, "loss": 0.0085, "step": 291640 }, { "epoch": 1.47, "learning_rate": 7.928823324638895e-05, "loss": 0.0061, "step": 291650 }, { "epoch": 1.47, "learning_rate": 7.928066555337493e-05, "loss": 0.0066, "step": 291660 }, { "epoch": 1.47, "learning_rate": 7.927309786036093e-05, "loss": 0.0082, "step": 291670 }, { "epoch": 1.47, "learning_rate": 7.926553016734691e-05, "loss": 0.0107, "step": 291680 }, { "epoch": 1.47, "learning_rate": 7.92579624743329e-05, "loss": 0.0096, "step": 291690 }, { "epoch": 1.47, "learning_rate": 7.92503947813189e-05, "loss": 0.0065, "step": 291700 }, { "epoch": 1.47, "learning_rate": 7.924282708830488e-05, "loss": 0.007, "step": 291710 }, { "epoch": 1.47, "learning_rate": 7.923525939529087e-05, "loss": 0.0076, "step": 291720 }, { "epoch": 1.47, "learning_rate": 7.922769170227687e-05, "loss": 0.0083, "step": 291730 }, { "epoch": 1.47, "learning_rate": 7.922012400926285e-05, "loss": 0.0069, "step": 291740 }, { "epoch": 1.47, "learning_rate": 7.921255631624885e-05, "loss": 0.0074, "step": 291750 }, { "epoch": 1.47, "learning_rate": 7.920498862323483e-05, "loss": 0.0069, "step": 291760 }, { "epoch": 1.47, "learning_rate": 7.919742093022082e-05, "loss": 0.0076, "step": 291770 }, { "epoch": 1.47, "learning_rate": 7.918985323720682e-05, "loss": 0.0088, "step": 291780 }, { "epoch": 1.47, "learning_rate": 7.91822855441928e-05, "loss": 0.006, "step": 291790 }, { "epoch": 1.47, "learning_rate": 7.91747178511788e-05, "loss": 0.0103, "step": 291800 }, { "epoch": 1.47, "learning_rate": 7.916715015816479e-05, "loss": 0.006, "step": 291810 }, { "epoch": 1.47, "learning_rate": 7.915958246515077e-05, "loss": 0.0069, "step": 291820 }, { "epoch": 1.47, "learning_rate": 7.915201477213676e-05, "loss": 0.0069, "step": 291830 }, { "epoch": 1.47, "learning_rate": 7.914444707912275e-05, "loss": 0.0095, "step": 291840 }, { "epoch": 1.47, "learning_rate": 7.913687938610874e-05, "loss": 0.0098, "step": 291850 }, { "epoch": 1.47, "learning_rate": 7.912931169309474e-05, "loss": 0.008, "step": 291860 }, { "epoch": 1.47, "learning_rate": 7.912174400008072e-05, "loss": 0.009, "step": 291870 }, { "epoch": 1.47, "learning_rate": 7.911417630706671e-05, "loss": 0.006, "step": 291880 }, { "epoch": 1.47, "learning_rate": 7.910660861405271e-05, "loss": 0.0084, "step": 291890 }, { "epoch": 1.47, "learning_rate": 7.909904092103869e-05, "loss": 0.0072, "step": 291900 }, { "epoch": 1.47, "learning_rate": 7.909147322802468e-05, "loss": 0.006, "step": 291910 }, { "epoch": 1.47, "learning_rate": 7.908390553501065e-05, "loss": 0.0075, "step": 291920 }, { "epoch": 1.47, "learning_rate": 7.907633784199665e-05, "loss": 0.008, "step": 291930 }, { "epoch": 1.47, "learning_rate": 7.906877014898264e-05, "loss": 0.009, "step": 291940 }, { "epoch": 1.47, "learning_rate": 7.906120245596862e-05, "loss": 0.0079, "step": 291950 }, { "epoch": 1.47, "learning_rate": 7.905363476295462e-05, "loss": 0.0068, "step": 291960 }, { "epoch": 1.47, "learning_rate": 7.90460670699406e-05, "loss": 0.0057, "step": 291970 }, { "epoch": 1.47, "learning_rate": 7.90384993769266e-05, "loss": 0.0086, "step": 291980 }, { "epoch": 1.47, "learning_rate": 7.903093168391259e-05, "loss": 0.0059, "step": 291990 }, { "epoch": 1.47, "learning_rate": 7.902336399089857e-05, "loss": 0.0061, "step": 292000 }, { "epoch": 1.47, "eval_cer": 0.9144362920387732, "eval_loss": 0.0056129819713532925, "eval_runtime": 115.8149, "eval_samples_per_second": 17.269, "eval_steps_per_second": 4.317, "step": 292000 }, { "epoch": 1.47, "learning_rate": 7.901579629788457e-05, "loss": 0.0076, "step": 292010 }, { "epoch": 1.47, "learning_rate": 7.900822860487056e-05, "loss": 0.0053, "step": 292020 }, { "epoch": 1.47, "learning_rate": 7.900066091185654e-05, "loss": 0.0056, "step": 292030 }, { "epoch": 1.47, "learning_rate": 7.899309321884254e-05, "loss": 0.008, "step": 292040 }, { "epoch": 1.47, "learning_rate": 7.898552552582852e-05, "loss": 0.0089, "step": 292050 }, { "epoch": 1.47, "learning_rate": 7.897795783281451e-05, "loss": 0.0076, "step": 292060 }, { "epoch": 1.47, "learning_rate": 7.897039013980051e-05, "loss": 0.0095, "step": 292070 }, { "epoch": 1.47, "learning_rate": 7.896282244678649e-05, "loss": 0.0099, "step": 292080 }, { "epoch": 1.47, "learning_rate": 7.895525475377249e-05, "loss": 0.0069, "step": 292090 }, { "epoch": 1.47, "learning_rate": 7.894768706075848e-05, "loss": 0.0068, "step": 292100 }, { "epoch": 1.47, "learning_rate": 7.894011936774446e-05, "loss": 0.0063, "step": 292110 }, { "epoch": 1.47, "learning_rate": 7.893255167473046e-05, "loss": 0.0073, "step": 292120 }, { "epoch": 1.47, "learning_rate": 7.892498398171644e-05, "loss": 0.0071, "step": 292130 }, { "epoch": 1.47, "learning_rate": 7.891741628870243e-05, "loss": 0.0078, "step": 292140 }, { "epoch": 1.47, "learning_rate": 7.890984859568843e-05, "loss": 0.0091, "step": 292150 }, { "epoch": 1.47, "learning_rate": 7.890228090267441e-05, "loss": 0.009, "step": 292160 }, { "epoch": 1.47, "learning_rate": 7.88947132096604e-05, "loss": 0.007, "step": 292170 }, { "epoch": 1.47, "learning_rate": 7.88871455166464e-05, "loss": 0.007, "step": 292180 }, { "epoch": 1.47, "learning_rate": 7.887957782363238e-05, "loss": 0.0096, "step": 292190 }, { "epoch": 1.47, "learning_rate": 7.887201013061838e-05, "loss": 0.0073, "step": 292200 }, { "epoch": 1.47, "learning_rate": 7.886444243760436e-05, "loss": 0.007, "step": 292210 }, { "epoch": 1.47, "learning_rate": 7.885687474459035e-05, "loss": 0.0093, "step": 292220 }, { "epoch": 1.47, "learning_rate": 7.884930705157635e-05, "loss": 0.0076, "step": 292230 }, { "epoch": 1.47, "learning_rate": 7.884173935856233e-05, "loss": 0.0087, "step": 292240 }, { "epoch": 1.47, "learning_rate": 7.883417166554832e-05, "loss": 0.0087, "step": 292250 }, { "epoch": 1.47, "learning_rate": 7.882660397253432e-05, "loss": 0.0072, "step": 292260 }, { "epoch": 1.47, "learning_rate": 7.88190362795203e-05, "loss": 0.0077, "step": 292270 }, { "epoch": 1.47, "learning_rate": 7.88114685865063e-05, "loss": 0.009, "step": 292280 }, { "epoch": 1.47, "learning_rate": 7.880390089349228e-05, "loss": 0.0054, "step": 292290 }, { "epoch": 1.47, "learning_rate": 7.879633320047827e-05, "loss": 0.0058, "step": 292300 }, { "epoch": 1.47, "learning_rate": 7.878876550746427e-05, "loss": 0.0056, "step": 292310 }, { "epoch": 1.47, "learning_rate": 7.878119781445025e-05, "loss": 0.0081, "step": 292320 }, { "epoch": 1.47, "learning_rate": 7.877363012143624e-05, "loss": 0.0059, "step": 292330 }, { "epoch": 1.47, "learning_rate": 7.876606242842224e-05, "loss": 0.0077, "step": 292340 }, { "epoch": 1.47, "learning_rate": 7.875849473540822e-05, "loss": 0.0067, "step": 292350 }, { "epoch": 1.47, "learning_rate": 7.875092704239421e-05, "loss": 0.0073, "step": 292360 }, { "epoch": 1.48, "learning_rate": 7.87433593493802e-05, "loss": 0.0094, "step": 292370 }, { "epoch": 1.48, "learning_rate": 7.873579165636619e-05, "loss": 0.0057, "step": 292380 }, { "epoch": 1.48, "learning_rate": 7.872822396335219e-05, "loss": 0.008, "step": 292390 }, { "epoch": 1.48, "learning_rate": 7.872065627033817e-05, "loss": 0.0082, "step": 292400 }, { "epoch": 1.48, "learning_rate": 7.871308857732416e-05, "loss": 0.0072, "step": 292410 }, { "epoch": 1.48, "learning_rate": 7.870552088431016e-05, "loss": 0.0052, "step": 292420 }, { "epoch": 1.48, "learning_rate": 7.869795319129614e-05, "loss": 0.0072, "step": 292430 }, { "epoch": 1.48, "learning_rate": 7.869038549828213e-05, "loss": 0.0069, "step": 292440 }, { "epoch": 1.48, "learning_rate": 7.868281780526813e-05, "loss": 0.0056, "step": 292450 }, { "epoch": 1.48, "learning_rate": 7.867525011225411e-05, "loss": 0.0094, "step": 292460 }, { "epoch": 1.48, "learning_rate": 7.86676824192401e-05, "loss": 0.0074, "step": 292470 }, { "epoch": 1.48, "learning_rate": 7.866011472622609e-05, "loss": 0.0078, "step": 292480 }, { "epoch": 1.48, "learning_rate": 7.865254703321208e-05, "loss": 0.0064, "step": 292490 }, { "epoch": 1.48, "learning_rate": 7.864497934019808e-05, "loss": 0.008, "step": 292500 }, { "epoch": 1.48, "learning_rate": 7.863741164718406e-05, "loss": 0.0072, "step": 292510 }, { "epoch": 1.48, "learning_rate": 7.862984395417005e-05, "loss": 0.0045, "step": 292520 }, { "epoch": 1.48, "learning_rate": 7.862227626115605e-05, "loss": 0.0054, "step": 292530 }, { "epoch": 1.48, "learning_rate": 7.861470856814203e-05, "loss": 0.006, "step": 292540 }, { "epoch": 1.48, "learning_rate": 7.860714087512801e-05, "loss": 0.0077, "step": 292550 }, { "epoch": 1.48, "learning_rate": 7.859957318211399e-05, "loss": 0.0068, "step": 292560 }, { "epoch": 1.48, "learning_rate": 7.859200548909999e-05, "loss": 0.0079, "step": 292570 }, { "epoch": 1.48, "learning_rate": 7.858443779608597e-05, "loss": 0.0064, "step": 292580 }, { "epoch": 1.48, "learning_rate": 7.857687010307196e-05, "loss": 0.0076, "step": 292590 }, { "epoch": 1.48, "learning_rate": 7.856930241005796e-05, "loss": 0.0085, "step": 292600 }, { "epoch": 1.48, "learning_rate": 7.856173471704394e-05, "loss": 0.0062, "step": 292610 }, { "epoch": 1.48, "learning_rate": 7.855416702402994e-05, "loss": 0.0094, "step": 292620 }, { "epoch": 1.48, "learning_rate": 7.854659933101593e-05, "loss": 0.0065, "step": 292630 }, { "epoch": 1.48, "learning_rate": 7.853903163800191e-05, "loss": 0.0078, "step": 292640 }, { "epoch": 1.48, "learning_rate": 7.853146394498791e-05, "loss": 0.0071, "step": 292650 }, { "epoch": 1.48, "learning_rate": 7.852389625197389e-05, "loss": 0.0081, "step": 292660 }, { "epoch": 1.48, "learning_rate": 7.851632855895988e-05, "loss": 0.0077, "step": 292670 }, { "epoch": 1.48, "learning_rate": 7.850876086594588e-05, "loss": 0.0068, "step": 292680 }, { "epoch": 1.48, "learning_rate": 7.850119317293186e-05, "loss": 0.0062, "step": 292690 }, { "epoch": 1.48, "learning_rate": 7.849362547991785e-05, "loss": 0.008, "step": 292700 }, { "epoch": 1.48, "learning_rate": 7.848605778690385e-05, "loss": 0.0079, "step": 292710 }, { "epoch": 1.48, "learning_rate": 7.847849009388983e-05, "loss": 0.0072, "step": 292720 }, { "epoch": 1.48, "learning_rate": 7.847092240087583e-05, "loss": 0.0071, "step": 292730 }, { "epoch": 1.48, "learning_rate": 7.846335470786181e-05, "loss": 0.0081, "step": 292740 }, { "epoch": 1.48, "learning_rate": 7.84557870148478e-05, "loss": 0.0061, "step": 292750 }, { "epoch": 1.48, "learning_rate": 7.84482193218338e-05, "loss": 0.0054, "step": 292760 }, { "epoch": 1.48, "learning_rate": 7.844065162881978e-05, "loss": 0.0076, "step": 292770 }, { "epoch": 1.48, "learning_rate": 7.843308393580577e-05, "loss": 0.0063, "step": 292780 }, { "epoch": 1.48, "learning_rate": 7.842551624279177e-05, "loss": 0.0097, "step": 292790 }, { "epoch": 1.48, "learning_rate": 7.841794854977775e-05, "loss": 0.0076, "step": 292800 }, { "epoch": 1.48, "learning_rate": 7.841038085676375e-05, "loss": 0.0086, "step": 292810 }, { "epoch": 1.48, "learning_rate": 7.840281316374973e-05, "loss": 0.006, "step": 292820 }, { "epoch": 1.48, "learning_rate": 7.839524547073572e-05, "loss": 0.0081, "step": 292830 }, { "epoch": 1.48, "learning_rate": 7.838767777772172e-05, "loss": 0.009, "step": 292840 }, { "epoch": 1.48, "learning_rate": 7.83801100847077e-05, "loss": 0.0073, "step": 292850 }, { "epoch": 1.48, "learning_rate": 7.83725423916937e-05, "loss": 0.0068, "step": 292860 }, { "epoch": 1.48, "learning_rate": 7.836497469867969e-05, "loss": 0.0097, "step": 292870 }, { "epoch": 1.48, "learning_rate": 7.835740700566567e-05, "loss": 0.0068, "step": 292880 }, { "epoch": 1.48, "learning_rate": 7.834983931265166e-05, "loss": 0.0042, "step": 292890 }, { "epoch": 1.48, "learning_rate": 7.834227161963765e-05, "loss": 0.0079, "step": 292900 }, { "epoch": 1.48, "learning_rate": 7.833470392662364e-05, "loss": 0.0097, "step": 292910 }, { "epoch": 1.48, "learning_rate": 7.832713623360964e-05, "loss": 0.0059, "step": 292920 }, { "epoch": 1.48, "learning_rate": 7.831956854059562e-05, "loss": 0.0075, "step": 292930 }, { "epoch": 1.48, "learning_rate": 7.831200084758161e-05, "loss": 0.0066, "step": 292940 }, { "epoch": 1.48, "learning_rate": 7.830443315456761e-05, "loss": 0.0074, "step": 292950 }, { "epoch": 1.48, "learning_rate": 7.829686546155359e-05, "loss": 0.008, "step": 292960 }, { "epoch": 1.48, "learning_rate": 7.828929776853958e-05, "loss": 0.0108, "step": 292970 }, { "epoch": 1.48, "learning_rate": 7.828173007552558e-05, "loss": 0.0069, "step": 292980 }, { "epoch": 1.48, "learning_rate": 7.827416238251156e-05, "loss": 0.0047, "step": 292990 }, { "epoch": 1.48, "learning_rate": 7.826659468949756e-05, "loss": 0.0053, "step": 293000 }, { "epoch": 1.48, "eval_cer": 0.9144411440194001, "eval_loss": 0.005583611316978931, "eval_runtime": 116.624, "eval_samples_per_second": 17.149, "eval_steps_per_second": 4.287, "step": 293000 }, { "epoch": 1.48, "learning_rate": 7.825902699648354e-05, "loss": 0.0054, "step": 293010 }, { "epoch": 1.48, "learning_rate": 7.825145930346953e-05, "loss": 0.0113, "step": 293020 }, { "epoch": 1.48, "learning_rate": 7.824389161045553e-05, "loss": 0.0055, "step": 293030 }, { "epoch": 1.48, "learning_rate": 7.823632391744151e-05, "loss": 0.0072, "step": 293040 }, { "epoch": 1.48, "learning_rate": 7.82287562244275e-05, "loss": 0.0078, "step": 293050 }, { "epoch": 1.48, "learning_rate": 7.82211885314135e-05, "loss": 0.0059, "step": 293060 }, { "epoch": 1.48, "learning_rate": 7.821362083839948e-05, "loss": 0.0088, "step": 293070 }, { "epoch": 1.48, "learning_rate": 7.820605314538548e-05, "loss": 0.0097, "step": 293080 }, { "epoch": 1.48, "learning_rate": 7.819848545237146e-05, "loss": 0.0066, "step": 293090 }, { "epoch": 1.48, "learning_rate": 7.819091775935745e-05, "loss": 0.0094, "step": 293100 }, { "epoch": 1.48, "learning_rate": 7.818335006634345e-05, "loss": 0.008, "step": 293110 }, { "epoch": 1.48, "learning_rate": 7.817578237332943e-05, "loss": 0.0072, "step": 293120 }, { "epoch": 1.48, "learning_rate": 7.816821468031542e-05, "loss": 0.0096, "step": 293130 }, { "epoch": 1.48, "learning_rate": 7.816064698730142e-05, "loss": 0.0061, "step": 293140 }, { "epoch": 1.48, "learning_rate": 7.81530792942874e-05, "loss": 0.0085, "step": 293150 }, { "epoch": 1.48, "learning_rate": 7.81455116012734e-05, "loss": 0.0087, "step": 293160 }, { "epoch": 1.48, "learning_rate": 7.813794390825936e-05, "loss": 0.0083, "step": 293170 }, { "epoch": 1.48, "learning_rate": 7.813037621524536e-05, "loss": 0.0067, "step": 293180 }, { "epoch": 1.48, "learning_rate": 7.812280852223134e-05, "loss": 0.0076, "step": 293190 }, { "epoch": 1.48, "learning_rate": 7.811524082921733e-05, "loss": 0.0067, "step": 293200 }, { "epoch": 1.48, "learning_rate": 7.810767313620333e-05, "loss": 0.009, "step": 293210 }, { "epoch": 1.48, "learning_rate": 7.810010544318931e-05, "loss": 0.0053, "step": 293220 }, { "epoch": 1.48, "learning_rate": 7.80925377501753e-05, "loss": 0.0089, "step": 293230 }, { "epoch": 1.48, "learning_rate": 7.80849700571613e-05, "loss": 0.0068, "step": 293240 }, { "epoch": 1.48, "learning_rate": 7.807740236414728e-05, "loss": 0.0063, "step": 293250 }, { "epoch": 1.48, "learning_rate": 7.806983467113328e-05, "loss": 0.0076, "step": 293260 }, { "epoch": 1.48, "learning_rate": 7.806226697811926e-05, "loss": 0.0059, "step": 293270 }, { "epoch": 1.48, "learning_rate": 7.805469928510525e-05, "loss": 0.0082, "step": 293280 }, { "epoch": 1.48, "learning_rate": 7.804713159209125e-05, "loss": 0.0058, "step": 293290 }, { "epoch": 1.48, "learning_rate": 7.803956389907723e-05, "loss": 0.0079, "step": 293300 }, { "epoch": 1.48, "learning_rate": 7.803199620606322e-05, "loss": 0.0087, "step": 293310 }, { "epoch": 1.48, "learning_rate": 7.802442851304922e-05, "loss": 0.0082, "step": 293320 }, { "epoch": 1.48, "learning_rate": 7.80168608200352e-05, "loss": 0.0075, "step": 293330 }, { "epoch": 1.48, "learning_rate": 7.80092931270212e-05, "loss": 0.0079, "step": 293340 }, { "epoch": 1.48, "learning_rate": 7.800172543400718e-05, "loss": 0.0084, "step": 293350 }, { "epoch": 1.48, "learning_rate": 7.799415774099317e-05, "loss": 0.0075, "step": 293360 }, { "epoch": 1.48, "learning_rate": 7.798659004797917e-05, "loss": 0.0075, "step": 293370 }, { "epoch": 1.48, "learning_rate": 7.797902235496515e-05, "loss": 0.0057, "step": 293380 }, { "epoch": 1.48, "learning_rate": 7.797145466195114e-05, "loss": 0.0112, "step": 293390 }, { "epoch": 1.48, "learning_rate": 7.796388696893714e-05, "loss": 0.0076, "step": 293400 }, { "epoch": 1.48, "learning_rate": 7.795631927592312e-05, "loss": 0.0054, "step": 293410 }, { "epoch": 1.48, "learning_rate": 7.794875158290912e-05, "loss": 0.0068, "step": 293420 }, { "epoch": 1.48, "learning_rate": 7.794118388989511e-05, "loss": 0.0087, "step": 293430 }, { "epoch": 1.48, "learning_rate": 7.793361619688109e-05, "loss": 0.0066, "step": 293440 }, { "epoch": 1.48, "learning_rate": 7.792604850386709e-05, "loss": 0.0069, "step": 293450 }, { "epoch": 1.48, "learning_rate": 7.791848081085307e-05, "loss": 0.0067, "step": 293460 }, { "epoch": 1.48, "learning_rate": 7.791091311783906e-05, "loss": 0.0058, "step": 293470 }, { "epoch": 1.48, "learning_rate": 7.790334542482506e-05, "loss": 0.0075, "step": 293480 }, { "epoch": 1.48, "learning_rate": 7.789577773181104e-05, "loss": 0.0092, "step": 293490 }, { "epoch": 1.48, "learning_rate": 7.788821003879703e-05, "loss": 0.0085, "step": 293500 }, { "epoch": 1.48, "learning_rate": 7.788064234578303e-05, "loss": 0.0095, "step": 293510 }, { "epoch": 1.48, "learning_rate": 7.787307465276901e-05, "loss": 0.0087, "step": 293520 }, { "epoch": 1.48, "learning_rate": 7.7865506959755e-05, "loss": 0.0085, "step": 293530 }, { "epoch": 1.48, "learning_rate": 7.785793926674099e-05, "loss": 0.0071, "step": 293540 }, { "epoch": 1.48, "learning_rate": 7.785037157372698e-05, "loss": 0.0111, "step": 293550 }, { "epoch": 1.48, "learning_rate": 7.784280388071298e-05, "loss": 0.0065, "step": 293560 }, { "epoch": 1.48, "learning_rate": 7.783523618769896e-05, "loss": 0.0067, "step": 293570 }, { "epoch": 1.48, "learning_rate": 7.782766849468495e-05, "loss": 0.0064, "step": 293580 }, { "epoch": 1.48, "learning_rate": 7.782010080167095e-05, "loss": 0.0071, "step": 293590 }, { "epoch": 1.48, "learning_rate": 7.781253310865693e-05, "loss": 0.0069, "step": 293600 }, { "epoch": 1.48, "learning_rate": 7.780496541564293e-05, "loss": 0.0073, "step": 293610 }, { "epoch": 1.48, "learning_rate": 7.77973977226289e-05, "loss": 0.0093, "step": 293620 }, { "epoch": 1.48, "learning_rate": 7.77898300296149e-05, "loss": 0.0089, "step": 293630 }, { "epoch": 1.48, "learning_rate": 7.77822623366009e-05, "loss": 0.0068, "step": 293640 }, { "epoch": 1.48, "learning_rate": 7.777469464358688e-05, "loss": 0.0068, "step": 293650 }, { "epoch": 1.48, "learning_rate": 7.776712695057287e-05, "loss": 0.0077, "step": 293660 }, { "epoch": 1.48, "learning_rate": 7.775955925755887e-05, "loss": 0.0062, "step": 293670 }, { "epoch": 1.48, "learning_rate": 7.775199156454485e-05, "loss": 0.007, "step": 293680 }, { "epoch": 1.48, "learning_rate": 7.774442387153084e-05, "loss": 0.0084, "step": 293690 }, { "epoch": 1.48, "learning_rate": 7.773685617851683e-05, "loss": 0.0106, "step": 293700 }, { "epoch": 1.48, "learning_rate": 7.772928848550282e-05, "loss": 0.0088, "step": 293710 }, { "epoch": 1.48, "learning_rate": 7.772172079248882e-05, "loss": 0.006, "step": 293720 }, { "epoch": 1.48, "learning_rate": 7.77141530994748e-05, "loss": 0.0064, "step": 293730 }, { "epoch": 1.48, "learning_rate": 7.770658540646079e-05, "loss": 0.0088, "step": 293740 }, { "epoch": 1.48, "learning_rate": 7.769901771344679e-05, "loss": 0.0077, "step": 293750 }, { "epoch": 1.48, "learning_rate": 7.769145002043277e-05, "loss": 0.007, "step": 293760 }, { "epoch": 1.48, "learning_rate": 7.768388232741876e-05, "loss": 0.0079, "step": 293770 }, { "epoch": 1.48, "learning_rate": 7.767631463440475e-05, "loss": 0.0062, "step": 293780 }, { "epoch": 1.48, "learning_rate": 7.766874694139074e-05, "loss": 0.0079, "step": 293790 }, { "epoch": 1.48, "learning_rate": 7.766117924837671e-05, "loss": 0.006, "step": 293800 }, { "epoch": 1.48, "learning_rate": 7.76536115553627e-05, "loss": 0.0064, "step": 293810 }, { "epoch": 1.48, "learning_rate": 7.76460438623487e-05, "loss": 0.0076, "step": 293820 }, { "epoch": 1.48, "learning_rate": 7.763847616933468e-05, "loss": 0.0067, "step": 293830 }, { "epoch": 1.48, "learning_rate": 7.763090847632067e-05, "loss": 0.0071, "step": 293840 }, { "epoch": 1.48, "learning_rate": 7.762334078330667e-05, "loss": 0.01, "step": 293850 }, { "epoch": 1.48, "learning_rate": 7.761577309029265e-05, "loss": 0.0086, "step": 293860 }, { "epoch": 1.48, "learning_rate": 7.760820539727865e-05, "loss": 0.007, "step": 293870 }, { "epoch": 1.48, "learning_rate": 7.760063770426464e-05, "loss": 0.0063, "step": 293880 }, { "epoch": 1.48, "learning_rate": 7.759307001125062e-05, "loss": 0.0053, "step": 293890 }, { "epoch": 1.48, "learning_rate": 7.758550231823662e-05, "loss": 0.0071, "step": 293900 }, { "epoch": 1.48, "learning_rate": 7.75779346252226e-05, "loss": 0.0094, "step": 293910 }, { "epoch": 1.48, "learning_rate": 7.75703669322086e-05, "loss": 0.0071, "step": 293920 }, { "epoch": 1.48, "learning_rate": 7.756279923919459e-05, "loss": 0.0054, "step": 293930 }, { "epoch": 1.48, "learning_rate": 7.755523154618057e-05, "loss": 0.0081, "step": 293940 }, { "epoch": 1.48, "learning_rate": 7.754766385316657e-05, "loss": 0.0083, "step": 293950 }, { "epoch": 1.48, "learning_rate": 7.754009616015256e-05, "loss": 0.0053, "step": 293960 }, { "epoch": 1.48, "learning_rate": 7.753252846713854e-05, "loss": 0.0091, "step": 293970 }, { "epoch": 1.48, "learning_rate": 7.752496077412454e-05, "loss": 0.0072, "step": 293980 }, { "epoch": 1.48, "learning_rate": 7.751739308111052e-05, "loss": 0.009, "step": 293990 }, { "epoch": 1.48, "learning_rate": 7.750982538809651e-05, "loss": 0.0062, "step": 294000 }, { "epoch": 1.48, "eval_cer": 0.9144294992658953, "eval_loss": 0.005396208260208368, "eval_runtime": 116.6359, "eval_samples_per_second": 17.147, "eval_steps_per_second": 4.287, "step": 294000 }, { "epoch": 1.48, "learning_rate": 7.750225769508251e-05, "loss": 0.0058, "step": 294010 }, { "epoch": 1.48, "learning_rate": 7.749469000206849e-05, "loss": 0.006, "step": 294020 }, { "epoch": 1.48, "learning_rate": 7.748712230905448e-05, "loss": 0.0066, "step": 294030 }, { "epoch": 1.48, "learning_rate": 7.747955461604048e-05, "loss": 0.0085, "step": 294040 }, { "epoch": 1.48, "learning_rate": 7.747198692302646e-05, "loss": 0.0048, "step": 294050 }, { "epoch": 1.48, "learning_rate": 7.746441923001246e-05, "loss": 0.0075, "step": 294060 }, { "epoch": 1.48, "learning_rate": 7.745685153699844e-05, "loss": 0.0087, "step": 294070 }, { "epoch": 1.48, "learning_rate": 7.744928384398443e-05, "loss": 0.0077, "step": 294080 }, { "epoch": 1.48, "learning_rate": 7.744171615097043e-05, "loss": 0.0088, "step": 294090 }, { "epoch": 1.48, "learning_rate": 7.743414845795641e-05, "loss": 0.0064, "step": 294100 }, { "epoch": 1.48, "learning_rate": 7.74265807649424e-05, "loss": 0.0068, "step": 294110 }, { "epoch": 1.48, "learning_rate": 7.74190130719284e-05, "loss": 0.0055, "step": 294120 }, { "epoch": 1.48, "learning_rate": 7.741144537891438e-05, "loss": 0.0076, "step": 294130 }, { "epoch": 1.48, "learning_rate": 7.740387768590038e-05, "loss": 0.0072, "step": 294140 }, { "epoch": 1.48, "learning_rate": 7.739630999288636e-05, "loss": 0.0065, "step": 294150 }, { "epoch": 1.48, "learning_rate": 7.738874229987235e-05, "loss": 0.0068, "step": 294160 }, { "epoch": 1.48, "learning_rate": 7.738117460685835e-05, "loss": 0.0074, "step": 294170 }, { "epoch": 1.48, "learning_rate": 7.737360691384433e-05, "loss": 0.0088, "step": 294180 }, { "epoch": 1.48, "learning_rate": 7.736603922083032e-05, "loss": 0.0063, "step": 294190 }, { "epoch": 1.48, "learning_rate": 7.735847152781632e-05, "loss": 0.0126, "step": 294200 }, { "epoch": 1.48, "learning_rate": 7.73509038348023e-05, "loss": 0.0069, "step": 294210 }, { "epoch": 1.48, "learning_rate": 7.73433361417883e-05, "loss": 0.0063, "step": 294220 }, { "epoch": 1.48, "learning_rate": 7.733576844877428e-05, "loss": 0.0076, "step": 294230 }, { "epoch": 1.48, "learning_rate": 7.732820075576027e-05, "loss": 0.0084, "step": 294240 }, { "epoch": 1.48, "learning_rate": 7.732063306274627e-05, "loss": 0.0106, "step": 294250 }, { "epoch": 1.48, "learning_rate": 7.731306536973225e-05, "loss": 0.0063, "step": 294260 }, { "epoch": 1.48, "learning_rate": 7.730549767671824e-05, "loss": 0.0064, "step": 294270 }, { "epoch": 1.48, "learning_rate": 7.729792998370424e-05, "loss": 0.0059, "step": 294280 }, { "epoch": 1.48, "learning_rate": 7.729036229069022e-05, "loss": 0.008, "step": 294290 }, { "epoch": 1.48, "learning_rate": 7.728279459767621e-05, "loss": 0.006, "step": 294300 }, { "epoch": 1.48, "learning_rate": 7.72752269046622e-05, "loss": 0.0069, "step": 294310 }, { "epoch": 1.48, "learning_rate": 7.726765921164819e-05, "loss": 0.0056, "step": 294320 }, { "epoch": 1.48, "learning_rate": 7.726009151863419e-05, "loss": 0.0085, "step": 294330 }, { "epoch": 1.48, "learning_rate": 7.725252382562017e-05, "loss": 0.006, "step": 294340 }, { "epoch": 1.49, "learning_rate": 7.724495613260616e-05, "loss": 0.0062, "step": 294350 }, { "epoch": 1.49, "learning_rate": 7.723738843959216e-05, "loss": 0.0078, "step": 294360 }, { "epoch": 1.49, "learning_rate": 7.722982074657814e-05, "loss": 0.0065, "step": 294370 }, { "epoch": 1.49, "learning_rate": 7.722225305356413e-05, "loss": 0.0072, "step": 294380 }, { "epoch": 1.49, "learning_rate": 7.721468536055013e-05, "loss": 0.0113, "step": 294390 }, { "epoch": 1.49, "learning_rate": 7.720711766753611e-05, "loss": 0.008, "step": 294400 }, { "epoch": 1.49, "learning_rate": 7.71995499745221e-05, "loss": 0.0138, "step": 294410 }, { "epoch": 1.49, "learning_rate": 7.719198228150809e-05, "loss": 0.0105, "step": 294420 }, { "epoch": 1.49, "learning_rate": 7.718441458849407e-05, "loss": 0.007, "step": 294430 }, { "epoch": 1.49, "learning_rate": 7.717684689548005e-05, "loss": 0.0082, "step": 294440 }, { "epoch": 1.49, "learning_rate": 7.716927920246604e-05, "loss": 0.0067, "step": 294450 }, { "epoch": 1.49, "learning_rate": 7.716171150945204e-05, "loss": 0.0069, "step": 294460 }, { "epoch": 1.49, "learning_rate": 7.715414381643802e-05, "loss": 0.0057, "step": 294470 }, { "epoch": 1.49, "learning_rate": 7.714657612342402e-05, "loss": 0.0078, "step": 294480 }, { "epoch": 1.49, "learning_rate": 7.713900843041001e-05, "loss": 0.0061, "step": 294490 }, { "epoch": 1.49, "learning_rate": 7.713144073739599e-05, "loss": 0.0054, "step": 294500 }, { "epoch": 1.49, "learning_rate": 7.712387304438199e-05, "loss": 0.005, "step": 294510 }, { "epoch": 1.49, "learning_rate": 7.711630535136797e-05, "loss": 0.0081, "step": 294520 }, { "epoch": 1.49, "learning_rate": 7.710873765835396e-05, "loss": 0.0065, "step": 294530 }, { "epoch": 1.49, "learning_rate": 7.710116996533996e-05, "loss": 0.0077, "step": 294540 }, { "epoch": 1.49, "learning_rate": 7.709360227232594e-05, "loss": 0.0073, "step": 294550 }, { "epoch": 1.49, "learning_rate": 7.708603457931193e-05, "loss": 0.0071, "step": 294560 }, { "epoch": 1.49, "learning_rate": 7.707846688629793e-05, "loss": 0.0075, "step": 294570 }, { "epoch": 1.49, "learning_rate": 7.707089919328391e-05, "loss": 0.0074, "step": 294580 }, { "epoch": 1.49, "learning_rate": 7.70633315002699e-05, "loss": 0.0078, "step": 294590 }, { "epoch": 1.49, "learning_rate": 7.705576380725589e-05, "loss": 0.0102, "step": 294600 }, { "epoch": 1.49, "learning_rate": 7.704819611424188e-05, "loss": 0.0057, "step": 294610 }, { "epoch": 1.49, "learning_rate": 7.704062842122788e-05, "loss": 0.007, "step": 294620 }, { "epoch": 1.49, "learning_rate": 7.703306072821386e-05, "loss": 0.0061, "step": 294630 }, { "epoch": 1.49, "learning_rate": 7.702549303519985e-05, "loss": 0.006, "step": 294640 }, { "epoch": 1.49, "learning_rate": 7.701792534218585e-05, "loss": 0.0079, "step": 294650 }, { "epoch": 1.49, "learning_rate": 7.701035764917183e-05, "loss": 0.01, "step": 294660 }, { "epoch": 1.49, "learning_rate": 7.700278995615783e-05, "loss": 0.008, "step": 294670 }, { "epoch": 1.49, "learning_rate": 7.699522226314381e-05, "loss": 0.0068, "step": 294680 }, { "epoch": 1.49, "learning_rate": 7.69876545701298e-05, "loss": 0.0083, "step": 294690 }, { "epoch": 1.49, "learning_rate": 7.69800868771158e-05, "loss": 0.007, "step": 294700 }, { "epoch": 1.49, "learning_rate": 7.697251918410178e-05, "loss": 0.0062, "step": 294710 }, { "epoch": 1.49, "learning_rate": 7.696495149108777e-05, "loss": 0.0075, "step": 294720 }, { "epoch": 1.49, "learning_rate": 7.695738379807377e-05, "loss": 0.0099, "step": 294730 }, { "epoch": 1.49, "learning_rate": 7.694981610505975e-05, "loss": 0.0068, "step": 294740 }, { "epoch": 1.49, "learning_rate": 7.694224841204574e-05, "loss": 0.0059, "step": 294750 }, { "epoch": 1.49, "learning_rate": 7.693468071903173e-05, "loss": 0.0087, "step": 294760 }, { "epoch": 1.49, "learning_rate": 7.692711302601772e-05, "loss": 0.01, "step": 294770 }, { "epoch": 1.49, "learning_rate": 7.691954533300372e-05, "loss": 0.0083, "step": 294780 }, { "epoch": 1.49, "learning_rate": 7.69119776399897e-05, "loss": 0.0075, "step": 294790 }, { "epoch": 1.49, "learning_rate": 7.690440994697569e-05, "loss": 0.0076, "step": 294800 }, { "epoch": 1.49, "learning_rate": 7.689684225396169e-05, "loss": 0.006, "step": 294810 }, { "epoch": 1.49, "learning_rate": 7.688927456094767e-05, "loss": 0.0067, "step": 294820 }, { "epoch": 1.49, "learning_rate": 7.688170686793366e-05, "loss": 0.0067, "step": 294830 }, { "epoch": 1.49, "learning_rate": 7.687413917491965e-05, "loss": 0.0082, "step": 294840 }, { "epoch": 1.49, "learning_rate": 7.686657148190564e-05, "loss": 0.0059, "step": 294850 }, { "epoch": 1.49, "learning_rate": 7.685900378889164e-05, "loss": 0.0101, "step": 294860 }, { "epoch": 1.49, "learning_rate": 7.685143609587762e-05, "loss": 0.0071, "step": 294870 }, { "epoch": 1.49, "learning_rate": 7.684386840286361e-05, "loss": 0.0056, "step": 294880 }, { "epoch": 1.49, "learning_rate": 7.683630070984961e-05, "loss": 0.0071, "step": 294890 }, { "epoch": 1.49, "learning_rate": 7.682873301683559e-05, "loss": 0.0077, "step": 294900 }, { "epoch": 1.49, "learning_rate": 7.682116532382158e-05, "loss": 0.0056, "step": 294910 }, { "epoch": 1.49, "learning_rate": 7.681359763080758e-05, "loss": 0.0062, "step": 294920 }, { "epoch": 1.49, "learning_rate": 7.680602993779356e-05, "loss": 0.0079, "step": 294930 }, { "epoch": 1.49, "learning_rate": 7.679846224477955e-05, "loss": 0.0063, "step": 294940 }, { "epoch": 1.49, "learning_rate": 7.679089455176554e-05, "loss": 0.0067, "step": 294950 }, { "epoch": 1.49, "learning_rate": 7.678332685875153e-05, "loss": 0.0073, "step": 294960 }, { "epoch": 1.49, "learning_rate": 7.677575916573753e-05, "loss": 0.007, "step": 294970 }, { "epoch": 1.49, "learning_rate": 7.676819147272351e-05, "loss": 0.0083, "step": 294980 }, { "epoch": 1.49, "learning_rate": 7.67606237797095e-05, "loss": 0.0077, "step": 294990 }, { "epoch": 1.49, "learning_rate": 7.67530560866955e-05, "loss": 0.0065, "step": 295000 }, { "epoch": 1.49, "eval_cer": 0.9144304696620207, "eval_loss": 0.005469324998557568, "eval_runtime": 116.6115, "eval_samples_per_second": 17.151, "eval_steps_per_second": 4.288, "step": 295000 }, { "epoch": 1.49, "learning_rate": 7.674548839368148e-05, "loss": 0.0067, "step": 295010 }, { "epoch": 1.49, "learning_rate": 7.673792070066747e-05, "loss": 0.0055, "step": 295020 }, { "epoch": 1.49, "learning_rate": 7.673035300765346e-05, "loss": 0.007, "step": 295030 }, { "epoch": 1.49, "learning_rate": 7.672278531463945e-05, "loss": 0.01, "step": 295040 }, { "epoch": 1.49, "learning_rate": 7.671521762162545e-05, "loss": 0.0061, "step": 295050 }, { "epoch": 1.49, "learning_rate": 7.670764992861141e-05, "loss": 0.0081, "step": 295060 }, { "epoch": 1.49, "learning_rate": 7.670008223559741e-05, "loss": 0.0063, "step": 295070 }, { "epoch": 1.49, "learning_rate": 7.669251454258339e-05, "loss": 0.007, "step": 295080 }, { "epoch": 1.49, "learning_rate": 7.668494684956938e-05, "loss": 0.0096, "step": 295090 }, { "epoch": 1.49, "learning_rate": 7.667737915655538e-05, "loss": 0.0078, "step": 295100 }, { "epoch": 1.49, "learning_rate": 7.666981146354136e-05, "loss": 0.0063, "step": 295110 }, { "epoch": 1.49, "learning_rate": 7.666224377052736e-05, "loss": 0.0061, "step": 295120 }, { "epoch": 1.49, "learning_rate": 7.665467607751334e-05, "loss": 0.0099, "step": 295130 }, { "epoch": 1.49, "learning_rate": 7.664710838449933e-05, "loss": 0.0072, "step": 295140 }, { "epoch": 1.49, "learning_rate": 7.663954069148533e-05, "loss": 0.0074, "step": 295150 }, { "epoch": 1.49, "learning_rate": 7.663197299847131e-05, "loss": 0.0067, "step": 295160 }, { "epoch": 1.49, "learning_rate": 7.66244053054573e-05, "loss": 0.0086, "step": 295170 }, { "epoch": 1.49, "learning_rate": 7.66168376124433e-05, "loss": 0.0072, "step": 295180 }, { "epoch": 1.49, "learning_rate": 7.660926991942928e-05, "loss": 0.0104, "step": 295190 }, { "epoch": 1.49, "learning_rate": 7.660170222641528e-05, "loss": 0.0069, "step": 295200 }, { "epoch": 1.49, "learning_rate": 7.659413453340126e-05, "loss": 0.0116, "step": 295210 }, { "epoch": 1.49, "learning_rate": 7.658656684038725e-05, "loss": 0.0061, "step": 295220 }, { "epoch": 1.49, "learning_rate": 7.657899914737325e-05, "loss": 0.0082, "step": 295230 }, { "epoch": 1.49, "learning_rate": 7.657143145435923e-05, "loss": 0.0071, "step": 295240 }, { "epoch": 1.49, "learning_rate": 7.656386376134522e-05, "loss": 0.0071, "step": 295250 }, { "epoch": 1.49, "learning_rate": 7.655629606833122e-05, "loss": 0.0068, "step": 295260 }, { "epoch": 1.49, "learning_rate": 7.65487283753172e-05, "loss": 0.0085, "step": 295270 }, { "epoch": 1.49, "learning_rate": 7.65411606823032e-05, "loss": 0.0096, "step": 295280 }, { "epoch": 1.49, "learning_rate": 7.653359298928918e-05, "loss": 0.0075, "step": 295290 }, { "epoch": 1.49, "learning_rate": 7.652602529627517e-05, "loss": 0.0094, "step": 295300 }, { "epoch": 1.49, "learning_rate": 7.651845760326117e-05, "loss": 0.0071, "step": 295310 }, { "epoch": 1.49, "learning_rate": 7.651088991024715e-05, "loss": 0.0076, "step": 295320 }, { "epoch": 1.49, "learning_rate": 7.650332221723314e-05, "loss": 0.0115, "step": 295330 }, { "epoch": 1.49, "learning_rate": 7.649575452421914e-05, "loss": 0.0063, "step": 295340 }, { "epoch": 1.49, "learning_rate": 7.648818683120512e-05, "loss": 0.0067, "step": 295350 }, { "epoch": 1.49, "learning_rate": 7.648061913819111e-05, "loss": 0.0072, "step": 295360 }, { "epoch": 1.49, "learning_rate": 7.647305144517711e-05, "loss": 0.0073, "step": 295370 }, { "epoch": 1.49, "learning_rate": 7.646548375216309e-05, "loss": 0.0067, "step": 295380 }, { "epoch": 1.49, "learning_rate": 7.645791605914909e-05, "loss": 0.0086, "step": 295390 }, { "epoch": 1.49, "learning_rate": 7.645034836613507e-05, "loss": 0.004, "step": 295400 }, { "epoch": 1.49, "learning_rate": 7.644278067312106e-05, "loss": 0.0078, "step": 295410 }, { "epoch": 1.49, "learning_rate": 7.643521298010706e-05, "loss": 0.0082, "step": 295420 }, { "epoch": 1.49, "learning_rate": 7.642764528709304e-05, "loss": 0.0074, "step": 295430 }, { "epoch": 1.49, "learning_rate": 7.642007759407903e-05, "loss": 0.0063, "step": 295440 }, { "epoch": 1.49, "learning_rate": 7.641250990106503e-05, "loss": 0.0112, "step": 295450 }, { "epoch": 1.49, "learning_rate": 7.640494220805101e-05, "loss": 0.0077, "step": 295460 }, { "epoch": 1.49, "learning_rate": 7.6397374515037e-05, "loss": 0.0088, "step": 295470 }, { "epoch": 1.49, "learning_rate": 7.638980682202299e-05, "loss": 0.0057, "step": 295480 }, { "epoch": 1.49, "learning_rate": 7.638223912900898e-05, "loss": 0.0069, "step": 295490 }, { "epoch": 1.49, "learning_rate": 7.637467143599498e-05, "loss": 0.0092, "step": 295500 }, { "epoch": 1.49, "learning_rate": 7.636710374298096e-05, "loss": 0.0058, "step": 295510 }, { "epoch": 1.49, "learning_rate": 7.635953604996695e-05, "loss": 0.0087, "step": 295520 }, { "epoch": 1.49, "learning_rate": 7.635196835695295e-05, "loss": 0.0067, "step": 295530 }, { "epoch": 1.49, "learning_rate": 7.634440066393893e-05, "loss": 0.0073, "step": 295540 }, { "epoch": 1.49, "learning_rate": 7.633683297092492e-05, "loss": 0.0063, "step": 295550 }, { "epoch": 1.49, "learning_rate": 7.63292652779109e-05, "loss": 0.0087, "step": 295560 }, { "epoch": 1.49, "learning_rate": 7.63216975848969e-05, "loss": 0.0076, "step": 295570 }, { "epoch": 1.49, "learning_rate": 7.63141298918829e-05, "loss": 0.007, "step": 295580 }, { "epoch": 1.49, "learning_rate": 7.630656219886888e-05, "loss": 0.0091, "step": 295590 }, { "epoch": 1.49, "learning_rate": 7.629899450585487e-05, "loss": 0.0062, "step": 295600 }, { "epoch": 1.49, "learning_rate": 7.629142681284087e-05, "loss": 0.0067, "step": 295610 }, { "epoch": 1.49, "learning_rate": 7.628385911982685e-05, "loss": 0.0065, "step": 295620 }, { "epoch": 1.49, "learning_rate": 7.627629142681284e-05, "loss": 0.007, "step": 295630 }, { "epoch": 1.49, "learning_rate": 7.626872373379882e-05, "loss": 0.0077, "step": 295640 }, { "epoch": 1.49, "learning_rate": 7.626115604078482e-05, "loss": 0.0068, "step": 295650 }, { "epoch": 1.49, "learning_rate": 7.625358834777081e-05, "loss": 0.0072, "step": 295660 }, { "epoch": 1.49, "learning_rate": 7.62460206547568e-05, "loss": 0.0048, "step": 295670 }, { "epoch": 1.49, "learning_rate": 7.623845296174279e-05, "loss": 0.0106, "step": 295680 }, { "epoch": 1.49, "learning_rate": 7.623088526872876e-05, "loss": 0.0065, "step": 295690 }, { "epoch": 1.49, "learning_rate": 7.622331757571475e-05, "loss": 0.0078, "step": 295700 }, { "epoch": 1.49, "learning_rate": 7.621574988270075e-05, "loss": 0.0067, "step": 295710 }, { "epoch": 1.49, "learning_rate": 7.620818218968673e-05, "loss": 0.007, "step": 295720 }, { "epoch": 1.49, "learning_rate": 7.620061449667273e-05, "loss": 0.0092, "step": 295730 }, { "epoch": 1.49, "learning_rate": 7.619304680365871e-05, "loss": 0.0069, "step": 295740 }, { "epoch": 1.49, "learning_rate": 7.61854791106447e-05, "loss": 0.0068, "step": 295750 }, { "epoch": 1.49, "learning_rate": 7.61779114176307e-05, "loss": 0.0075, "step": 295760 }, { "epoch": 1.49, "learning_rate": 7.617034372461668e-05, "loss": 0.0059, "step": 295770 }, { "epoch": 1.49, "learning_rate": 7.616277603160267e-05, "loss": 0.008, "step": 295780 }, { "epoch": 1.49, "learning_rate": 7.615520833858867e-05, "loss": 0.0061, "step": 295790 }, { "epoch": 1.49, "learning_rate": 7.614764064557465e-05, "loss": 0.0073, "step": 295800 }, { "epoch": 1.49, "learning_rate": 7.614007295256064e-05, "loss": 0.0059, "step": 295810 }, { "epoch": 1.49, "learning_rate": 7.613250525954664e-05, "loss": 0.0083, "step": 295820 }, { "epoch": 1.49, "learning_rate": 7.612493756653262e-05, "loss": 0.0059, "step": 295830 }, { "epoch": 1.49, "learning_rate": 7.611736987351862e-05, "loss": 0.008, "step": 295840 }, { "epoch": 1.49, "learning_rate": 7.61098021805046e-05, "loss": 0.0081, "step": 295850 }, { "epoch": 1.49, "learning_rate": 7.610223448749059e-05, "loss": 0.0067, "step": 295860 }, { "epoch": 1.49, "learning_rate": 7.609466679447659e-05, "loss": 0.0074, "step": 295870 }, { "epoch": 1.49, "learning_rate": 7.608709910146257e-05, "loss": 0.0079, "step": 295880 }, { "epoch": 1.49, "learning_rate": 7.607953140844856e-05, "loss": 0.0084, "step": 295890 }, { "epoch": 1.49, "learning_rate": 7.607196371543456e-05, "loss": 0.0095, "step": 295900 }, { "epoch": 1.49, "learning_rate": 7.606439602242054e-05, "loss": 0.0072, "step": 295910 }, { "epoch": 1.49, "learning_rate": 7.605682832940654e-05, "loss": 0.0082, "step": 295920 }, { "epoch": 1.49, "learning_rate": 7.604926063639252e-05, "loss": 0.0078, "step": 295930 }, { "epoch": 1.49, "learning_rate": 7.604169294337851e-05, "loss": 0.0071, "step": 295940 }, { "epoch": 1.49, "learning_rate": 7.603412525036451e-05, "loss": 0.0079, "step": 295950 }, { "epoch": 1.49, "learning_rate": 7.602655755735049e-05, "loss": 0.007, "step": 295960 }, { "epoch": 1.49, "learning_rate": 7.601898986433648e-05, "loss": 0.0079, "step": 295970 }, { "epoch": 1.49, "learning_rate": 7.601142217132248e-05, "loss": 0.0076, "step": 295980 }, { "epoch": 1.49, "learning_rate": 7.600385447830846e-05, "loss": 0.0069, "step": 295990 }, { "epoch": 1.49, "learning_rate": 7.599628678529446e-05, "loss": 0.0075, "step": 296000 }, { "epoch": 1.49, "eval_cer": 0.9144605519419082, "eval_loss": 0.005476477090269327, "eval_runtime": 116.6265, "eval_samples_per_second": 17.149, "eval_steps_per_second": 4.287, "step": 296000 }, { "epoch": 1.49, "learning_rate": 7.598871909228044e-05, "loss": 0.0067, "step": 296010 }, { "epoch": 1.49, "learning_rate": 7.598115139926643e-05, "loss": 0.0109, "step": 296020 }, { "epoch": 1.49, "learning_rate": 7.597358370625243e-05, "loss": 0.012, "step": 296030 }, { "epoch": 1.49, "learning_rate": 7.596601601323841e-05, "loss": 0.0069, "step": 296040 }, { "epoch": 1.49, "learning_rate": 7.59584483202244e-05, "loss": 0.0075, "step": 296050 }, { "epoch": 1.49, "learning_rate": 7.59508806272104e-05, "loss": 0.0074, "step": 296060 }, { "epoch": 1.49, "learning_rate": 7.594331293419638e-05, "loss": 0.0083, "step": 296070 }, { "epoch": 1.49, "learning_rate": 7.593574524118237e-05, "loss": 0.0084, "step": 296080 }, { "epoch": 1.49, "learning_rate": 7.592817754816836e-05, "loss": 0.0063, "step": 296090 }, { "epoch": 1.49, "learning_rate": 7.592060985515435e-05, "loss": 0.0066, "step": 296100 }, { "epoch": 1.49, "learning_rate": 7.591304216214035e-05, "loss": 0.0106, "step": 296110 }, { "epoch": 1.49, "learning_rate": 7.590547446912633e-05, "loss": 0.0067, "step": 296120 }, { "epoch": 1.49, "learning_rate": 7.589790677611232e-05, "loss": 0.0062, "step": 296130 }, { "epoch": 1.49, "learning_rate": 7.589033908309832e-05, "loss": 0.0064, "step": 296140 }, { "epoch": 1.49, "learning_rate": 7.58827713900843e-05, "loss": 0.0087, "step": 296150 }, { "epoch": 1.49, "learning_rate": 7.58752036970703e-05, "loss": 0.006, "step": 296160 }, { "epoch": 1.49, "learning_rate": 7.586763600405628e-05, "loss": 0.0072, "step": 296170 }, { "epoch": 1.49, "learning_rate": 7.586006831104227e-05, "loss": 0.0075, "step": 296180 }, { "epoch": 1.49, "learning_rate": 7.585250061802827e-05, "loss": 0.008, "step": 296190 }, { "epoch": 1.49, "learning_rate": 7.584493292501425e-05, "loss": 0.0083, "step": 296200 }, { "epoch": 1.49, "learning_rate": 7.583736523200024e-05, "loss": 0.0053, "step": 296210 }, { "epoch": 1.49, "learning_rate": 7.582979753898624e-05, "loss": 0.0075, "step": 296220 }, { "epoch": 1.49, "learning_rate": 7.582222984597222e-05, "loss": 0.0063, "step": 296230 }, { "epoch": 1.49, "learning_rate": 7.581466215295821e-05, "loss": 0.0067, "step": 296240 }, { "epoch": 1.49, "learning_rate": 7.58070944599442e-05, "loss": 0.0102, "step": 296250 }, { "epoch": 1.49, "learning_rate": 7.579952676693019e-05, "loss": 0.0076, "step": 296260 }, { "epoch": 1.49, "learning_rate": 7.579195907391618e-05, "loss": 0.0065, "step": 296270 }, { "epoch": 1.49, "learning_rate": 7.578439138090217e-05, "loss": 0.009, "step": 296280 }, { "epoch": 1.49, "learning_rate": 7.577682368788816e-05, "loss": 0.0084, "step": 296290 }, { "epoch": 1.49, "learning_rate": 7.576925599487416e-05, "loss": 0.0066, "step": 296300 }, { "epoch": 1.49, "learning_rate": 7.576168830186014e-05, "loss": 0.0067, "step": 296310 }, { "epoch": 1.49, "learning_rate": 7.575412060884612e-05, "loss": 0.0096, "step": 296320 }, { "epoch": 1.5, "learning_rate": 7.57465529158321e-05, "loss": 0.007, "step": 296330 }, { "epoch": 1.5, "learning_rate": 7.57389852228181e-05, "loss": 0.0068, "step": 296340 }, { "epoch": 1.5, "learning_rate": 7.573141752980409e-05, "loss": 0.0079, "step": 296350 }, { "epoch": 1.5, "learning_rate": 7.572384983679007e-05, "loss": 0.0074, "step": 296360 }, { "epoch": 1.5, "learning_rate": 7.571628214377607e-05, "loss": 0.0084, "step": 296370 }, { "epoch": 1.5, "learning_rate": 7.570871445076205e-05, "loss": 0.0067, "step": 296380 }, { "epoch": 1.5, "learning_rate": 7.570114675774804e-05, "loss": 0.0066, "step": 296390 }, { "epoch": 1.5, "learning_rate": 7.569357906473404e-05, "loss": 0.0061, "step": 296400 }, { "epoch": 1.5, "learning_rate": 7.568601137172002e-05, "loss": 0.0053, "step": 296410 }, { "epoch": 1.5, "learning_rate": 7.567844367870601e-05, "loss": 0.0078, "step": 296420 }, { "epoch": 1.5, "learning_rate": 7.567087598569201e-05, "loss": 0.0101, "step": 296430 }, { "epoch": 1.5, "learning_rate": 7.566330829267799e-05, "loss": 0.0074, "step": 296440 }, { "epoch": 1.5, "learning_rate": 7.565574059966399e-05, "loss": 0.0083, "step": 296450 }, { "epoch": 1.5, "learning_rate": 7.564817290664997e-05, "loss": 0.0067, "step": 296460 }, { "epoch": 1.5, "learning_rate": 7.564060521363596e-05, "loss": 0.0077, "step": 296470 }, { "epoch": 1.5, "learning_rate": 7.563303752062196e-05, "loss": 0.0074, "step": 296480 }, { "epoch": 1.5, "learning_rate": 7.562546982760794e-05, "loss": 0.0094, "step": 296490 }, { "epoch": 1.5, "learning_rate": 7.561790213459393e-05, "loss": 0.0064, "step": 296500 }, { "epoch": 1.5, "learning_rate": 7.561033444157993e-05, "loss": 0.0056, "step": 296510 }, { "epoch": 1.5, "learning_rate": 7.560276674856591e-05, "loss": 0.0052, "step": 296520 }, { "epoch": 1.5, "learning_rate": 7.55951990555519e-05, "loss": 0.008, "step": 296530 }, { "epoch": 1.5, "learning_rate": 7.558763136253789e-05, "loss": 0.0072, "step": 296540 }, { "epoch": 1.5, "learning_rate": 7.558006366952388e-05, "loss": 0.0074, "step": 296550 }, { "epoch": 1.5, "learning_rate": 7.557249597650988e-05, "loss": 0.0062, "step": 296560 }, { "epoch": 1.5, "learning_rate": 7.556492828349586e-05, "loss": 0.0085, "step": 296570 }, { "epoch": 1.5, "learning_rate": 7.555736059048185e-05, "loss": 0.0082, "step": 296580 }, { "epoch": 1.5, "learning_rate": 7.554979289746785e-05, "loss": 0.006, "step": 296590 }, { "epoch": 1.5, "learning_rate": 7.554222520445383e-05, "loss": 0.0112, "step": 296600 }, { "epoch": 1.5, "learning_rate": 7.553465751143982e-05, "loss": 0.0074, "step": 296610 }, { "epoch": 1.5, "learning_rate": 7.55270898184258e-05, "loss": 0.0069, "step": 296620 }, { "epoch": 1.5, "learning_rate": 7.55195221254118e-05, "loss": 0.0064, "step": 296630 }, { "epoch": 1.5, "learning_rate": 7.55119544323978e-05, "loss": 0.0059, "step": 296640 }, { "epoch": 1.5, "learning_rate": 7.550438673938378e-05, "loss": 0.0065, "step": 296650 }, { "epoch": 1.5, "learning_rate": 7.549681904636977e-05, "loss": 0.0082, "step": 296660 }, { "epoch": 1.5, "learning_rate": 7.548925135335577e-05, "loss": 0.0066, "step": 296670 }, { "epoch": 1.5, "learning_rate": 7.548168366034175e-05, "loss": 0.0083, "step": 296680 }, { "epoch": 1.5, "learning_rate": 7.547411596732774e-05, "loss": 0.0079, "step": 296690 }, { "epoch": 1.5, "learning_rate": 7.546654827431373e-05, "loss": 0.0067, "step": 296700 }, { "epoch": 1.5, "learning_rate": 7.545898058129972e-05, "loss": 0.0068, "step": 296710 }, { "epoch": 1.5, "learning_rate": 7.545141288828572e-05, "loss": 0.0063, "step": 296720 }, { "epoch": 1.5, "learning_rate": 7.54438451952717e-05, "loss": 0.009, "step": 296730 }, { "epoch": 1.5, "learning_rate": 7.543627750225769e-05, "loss": 0.0069, "step": 296740 }, { "epoch": 1.5, "learning_rate": 7.542870980924369e-05, "loss": 0.0089, "step": 296750 }, { "epoch": 1.5, "learning_rate": 7.542114211622967e-05, "loss": 0.0067, "step": 296760 }, { "epoch": 1.5, "learning_rate": 7.541357442321566e-05, "loss": 0.0095, "step": 296770 }, { "epoch": 1.5, "learning_rate": 7.540600673020164e-05, "loss": 0.0113, "step": 296780 }, { "epoch": 1.5, "learning_rate": 7.539843903718764e-05, "loss": 0.0072, "step": 296790 }, { "epoch": 1.5, "learning_rate": 7.539087134417363e-05, "loss": 0.008, "step": 296800 }, { "epoch": 1.5, "learning_rate": 7.538330365115962e-05, "loss": 0.0073, "step": 296810 }, { "epoch": 1.5, "learning_rate": 7.537573595814561e-05, "loss": 0.0085, "step": 296820 }, { "epoch": 1.5, "learning_rate": 7.53681682651316e-05, "loss": 0.006, "step": 296830 }, { "epoch": 1.5, "learning_rate": 7.536060057211759e-05, "loss": 0.0074, "step": 296840 }, { "epoch": 1.5, "learning_rate": 7.535303287910358e-05, "loss": 0.006, "step": 296850 }, { "epoch": 1.5, "learning_rate": 7.534546518608958e-05, "loss": 0.0063, "step": 296860 }, { "epoch": 1.5, "learning_rate": 7.533789749307556e-05, "loss": 0.0105, "step": 296870 }, { "epoch": 1.5, "learning_rate": 7.533032980006155e-05, "loss": 0.0072, "step": 296880 }, { "epoch": 1.5, "learning_rate": 7.532276210704754e-05, "loss": 0.0072, "step": 296890 }, { "epoch": 1.5, "learning_rate": 7.531519441403353e-05, "loss": 0.0061, "step": 296900 }, { "epoch": 1.5, "learning_rate": 7.530762672101953e-05, "loss": 0.0054, "step": 296910 }, { "epoch": 1.5, "learning_rate": 7.53000590280055e-05, "loss": 0.0065, "step": 296920 }, { "epoch": 1.5, "learning_rate": 7.52924913349915e-05, "loss": 0.0061, "step": 296930 }, { "epoch": 1.5, "learning_rate": 7.528492364197747e-05, "loss": 0.0098, "step": 296940 }, { "epoch": 1.5, "learning_rate": 7.527735594896346e-05, "loss": 0.0078, "step": 296950 }, { "epoch": 1.5, "learning_rate": 7.526978825594946e-05, "loss": 0.0071, "step": 296960 }, { "epoch": 1.5, "learning_rate": 7.526222056293544e-05, "loss": 0.007, "step": 296970 }, { "epoch": 1.5, "learning_rate": 7.525465286992144e-05, "loss": 0.0074, "step": 296980 }, { "epoch": 1.5, "learning_rate": 7.524708517690742e-05, "loss": 0.0057, "step": 296990 }, { "epoch": 1.5, "learning_rate": 7.523951748389341e-05, "loss": 0.0049, "step": 297000 }, { "epoch": 1.5, "eval_cer": 0.9144440552077764, "eval_loss": 0.005415515974164009, "eval_runtime": 116.5765, "eval_samples_per_second": 17.156, "eval_steps_per_second": 4.289, "step": 297000 }, { "epoch": 1.5, "learning_rate": 7.523194979087941e-05, "loss": 0.0068, "step": 297010 }, { "epoch": 1.5, "learning_rate": 7.522438209786539e-05, "loss": 0.0077, "step": 297020 }, { "epoch": 1.5, "learning_rate": 7.521681440485138e-05, "loss": 0.0068, "step": 297030 }, { "epoch": 1.5, "learning_rate": 7.520924671183738e-05, "loss": 0.0065, "step": 297040 }, { "epoch": 1.5, "learning_rate": 7.520167901882336e-05, "loss": 0.0071, "step": 297050 }, { "epoch": 1.5, "learning_rate": 7.519411132580936e-05, "loss": 0.0077, "step": 297060 }, { "epoch": 1.5, "learning_rate": 7.518654363279534e-05, "loss": 0.0067, "step": 297070 }, { "epoch": 1.5, "learning_rate": 7.517897593978133e-05, "loss": 0.0072, "step": 297080 }, { "epoch": 1.5, "learning_rate": 7.517140824676733e-05, "loss": 0.0087, "step": 297090 }, { "epoch": 1.5, "learning_rate": 7.516384055375331e-05, "loss": 0.008, "step": 297100 }, { "epoch": 1.5, "learning_rate": 7.51562728607393e-05, "loss": 0.0071, "step": 297110 }, { "epoch": 1.5, "learning_rate": 7.51487051677253e-05, "loss": 0.0082, "step": 297120 }, { "epoch": 1.5, "learning_rate": 7.514113747471128e-05, "loss": 0.0081, "step": 297130 }, { "epoch": 1.5, "learning_rate": 7.513356978169727e-05, "loss": 0.0062, "step": 297140 }, { "epoch": 1.5, "learning_rate": 7.512600208868326e-05, "loss": 0.0102, "step": 297150 }, { "epoch": 1.5, "learning_rate": 7.511843439566925e-05, "loss": 0.005, "step": 297160 }, { "epoch": 1.5, "learning_rate": 7.511086670265525e-05, "loss": 0.0073, "step": 297170 }, { "epoch": 1.5, "learning_rate": 7.510329900964123e-05, "loss": 0.0075, "step": 297180 }, { "epoch": 1.5, "learning_rate": 7.509573131662722e-05, "loss": 0.0075, "step": 297190 }, { "epoch": 1.5, "learning_rate": 7.508816362361322e-05, "loss": 0.0079, "step": 297200 }, { "epoch": 1.5, "learning_rate": 7.50805959305992e-05, "loss": 0.0083, "step": 297210 }, { "epoch": 1.5, "learning_rate": 7.50730282375852e-05, "loss": 0.0067, "step": 297220 }, { "epoch": 1.5, "learning_rate": 7.506546054457118e-05, "loss": 0.0081, "step": 297230 }, { "epoch": 1.5, "learning_rate": 7.505789285155717e-05, "loss": 0.0052, "step": 297240 }, { "epoch": 1.5, "learning_rate": 7.505032515854317e-05, "loss": 0.0071, "step": 297250 }, { "epoch": 1.5, "learning_rate": 7.504275746552915e-05, "loss": 0.0063, "step": 297260 }, { "epoch": 1.5, "learning_rate": 7.503518977251514e-05, "loss": 0.0069, "step": 297270 }, { "epoch": 1.5, "learning_rate": 7.502762207950114e-05, "loss": 0.0098, "step": 297280 }, { "epoch": 1.5, "learning_rate": 7.502005438648712e-05, "loss": 0.0068, "step": 297290 }, { "epoch": 1.5, "learning_rate": 7.501248669347311e-05, "loss": 0.008, "step": 297300 }, { "epoch": 1.5, "learning_rate": 7.500491900045911e-05, "loss": 0.0093, "step": 297310 }, { "epoch": 1.5, "learning_rate": 7.499735130744509e-05, "loss": 0.0074, "step": 297320 }, { "epoch": 1.5, "learning_rate": 7.498978361443108e-05, "loss": 0.0066, "step": 297330 }, { "epoch": 1.5, "learning_rate": 7.498221592141707e-05, "loss": 0.0072, "step": 297340 }, { "epoch": 1.5, "learning_rate": 7.497464822840306e-05, "loss": 0.0057, "step": 297350 }, { "epoch": 1.5, "learning_rate": 7.496708053538906e-05, "loss": 0.0068, "step": 297360 }, { "epoch": 1.5, "learning_rate": 7.495951284237504e-05, "loss": 0.0062, "step": 297370 }, { "epoch": 1.5, "learning_rate": 7.495194514936103e-05, "loss": 0.0081, "step": 297380 }, { "epoch": 1.5, "learning_rate": 7.494437745634703e-05, "loss": 0.0072, "step": 297390 }, { "epoch": 1.5, "learning_rate": 7.493680976333301e-05, "loss": 0.0083, "step": 297400 }, { "epoch": 1.5, "learning_rate": 7.4929242070319e-05, "loss": 0.0105, "step": 297410 }, { "epoch": 1.5, "learning_rate": 7.492167437730499e-05, "loss": 0.0089, "step": 297420 }, { "epoch": 1.5, "learning_rate": 7.491410668429097e-05, "loss": 0.0091, "step": 297430 }, { "epoch": 1.5, "learning_rate": 7.490653899127696e-05, "loss": 0.0073, "step": 297440 }, { "epoch": 1.5, "learning_rate": 7.489897129826296e-05, "loss": 0.0078, "step": 297450 }, { "epoch": 1.5, "learning_rate": 7.489140360524894e-05, "loss": 0.0072, "step": 297460 }, { "epoch": 1.5, "learning_rate": 7.488383591223493e-05, "loss": 0.012, "step": 297470 }, { "epoch": 1.5, "learning_rate": 7.487626821922093e-05, "loss": 0.0064, "step": 297480 }, { "epoch": 1.5, "learning_rate": 7.486870052620691e-05, "loss": 0.0061, "step": 297490 }, { "epoch": 1.5, "learning_rate": 7.48611328331929e-05, "loss": 0.0076, "step": 297500 }, { "epoch": 1.5, "learning_rate": 7.485356514017889e-05, "loss": 0.0074, "step": 297510 }, { "epoch": 1.5, "learning_rate": 7.484599744716488e-05, "loss": 0.0064, "step": 297520 }, { "epoch": 1.5, "learning_rate": 7.483842975415088e-05, "loss": 0.0083, "step": 297530 }, { "epoch": 1.5, "learning_rate": 7.483086206113686e-05, "loss": 0.0057, "step": 297540 }, { "epoch": 1.5, "learning_rate": 7.482329436812285e-05, "loss": 0.0084, "step": 297550 }, { "epoch": 1.5, "learning_rate": 7.481572667510885e-05, "loss": 0.0094, "step": 297560 }, { "epoch": 1.5, "learning_rate": 7.480815898209483e-05, "loss": 0.0076, "step": 297570 }, { "epoch": 1.5, "learning_rate": 7.480059128908082e-05, "loss": 0.0096, "step": 297580 }, { "epoch": 1.5, "learning_rate": 7.47930235960668e-05, "loss": 0.0073, "step": 297590 }, { "epoch": 1.5, "learning_rate": 7.47854559030528e-05, "loss": 0.0095, "step": 297600 }, { "epoch": 1.5, "learning_rate": 7.47778882100388e-05, "loss": 0.0075, "step": 297610 }, { "epoch": 1.5, "learning_rate": 7.477032051702478e-05, "loss": 0.0059, "step": 297620 }, { "epoch": 1.5, "learning_rate": 7.476275282401077e-05, "loss": 0.0076, "step": 297630 }, { "epoch": 1.5, "learning_rate": 7.475518513099677e-05, "loss": 0.006, "step": 297640 }, { "epoch": 1.5, "learning_rate": 7.474761743798275e-05, "loss": 0.0071, "step": 297650 }, { "epoch": 1.5, "learning_rate": 7.474004974496874e-05, "loss": 0.0083, "step": 297660 }, { "epoch": 1.5, "learning_rate": 7.473248205195472e-05, "loss": 0.0084, "step": 297670 }, { "epoch": 1.5, "learning_rate": 7.472491435894072e-05, "loss": 0.0069, "step": 297680 }, { "epoch": 1.5, "learning_rate": 7.471734666592671e-05, "loss": 0.0066, "step": 297690 }, { "epoch": 1.5, "learning_rate": 7.47097789729127e-05, "loss": 0.0071, "step": 297700 }, { "epoch": 1.5, "learning_rate": 7.470221127989869e-05, "loss": 0.006, "step": 297710 }, { "epoch": 1.5, "learning_rate": 7.469464358688469e-05, "loss": 0.0086, "step": 297720 }, { "epoch": 1.5, "learning_rate": 7.468707589387067e-05, "loss": 0.0093, "step": 297730 }, { "epoch": 1.5, "learning_rate": 7.467950820085665e-05, "loss": 0.0127, "step": 297740 }, { "epoch": 1.5, "learning_rate": 7.467194050784264e-05, "loss": 0.0075, "step": 297750 }, { "epoch": 1.5, "learning_rate": 7.466437281482864e-05, "loss": 0.0071, "step": 297760 }, { "epoch": 1.5, "learning_rate": 7.465680512181462e-05, "loss": 0.0071, "step": 297770 }, { "epoch": 1.5, "learning_rate": 7.464923742880062e-05, "loss": 0.0073, "step": 297780 }, { "epoch": 1.5, "learning_rate": 7.46416697357866e-05, "loss": 0.0066, "step": 297790 }, { "epoch": 1.5, "learning_rate": 7.463410204277259e-05, "loss": 0.0081, "step": 297800 }, { "epoch": 1.5, "learning_rate": 7.462653434975859e-05, "loss": 0.0099, "step": 297810 }, { "epoch": 1.5, "learning_rate": 7.461896665674457e-05, "loss": 0.008, "step": 297820 }, { "epoch": 1.5, "learning_rate": 7.461139896373056e-05, "loss": 0.0078, "step": 297830 }, { "epoch": 1.5, "learning_rate": 7.460383127071656e-05, "loss": 0.0083, "step": 297840 }, { "epoch": 1.5, "learning_rate": 7.459626357770254e-05, "loss": 0.0074, "step": 297850 }, { "epoch": 1.5, "learning_rate": 7.458869588468853e-05, "loss": 0.008, "step": 297860 }, { "epoch": 1.5, "learning_rate": 7.458112819167452e-05, "loss": 0.008, "step": 297870 }, { "epoch": 1.5, "learning_rate": 7.457356049866051e-05, "loss": 0.0074, "step": 297880 }, { "epoch": 1.5, "learning_rate": 7.45659928056465e-05, "loss": 0.0077, "step": 297890 }, { "epoch": 1.5, "learning_rate": 7.455842511263249e-05, "loss": 0.0058, "step": 297900 }, { "epoch": 1.5, "learning_rate": 7.455085741961848e-05, "loss": 0.0062, "step": 297910 }, { "epoch": 1.5, "learning_rate": 7.454328972660448e-05, "loss": 0.0077, "step": 297920 }, { "epoch": 1.5, "learning_rate": 7.453572203359046e-05, "loss": 0.007, "step": 297930 }, { "epoch": 1.5, "learning_rate": 7.452815434057645e-05, "loss": 0.0075, "step": 297940 }, { "epoch": 1.5, "learning_rate": 7.452058664756244e-05, "loss": 0.0095, "step": 297950 }, { "epoch": 1.5, "learning_rate": 7.451301895454843e-05, "loss": 0.0078, "step": 297960 }, { "epoch": 1.5, "learning_rate": 7.450545126153443e-05, "loss": 0.0082, "step": 297970 }, { "epoch": 1.5, "learning_rate": 7.449788356852041e-05, "loss": 0.0068, "step": 297980 }, { "epoch": 1.5, "learning_rate": 7.44903158755064e-05, "loss": 0.0064, "step": 297990 }, { "epoch": 1.5, "learning_rate": 7.44827481824924e-05, "loss": 0.006, "step": 298000 }, { "epoch": 1.5, "eval_cer": 0.9144489071884033, "eval_loss": 0.0054661910980939865, "eval_runtime": 116.6326, "eval_samples_per_second": 17.148, "eval_steps_per_second": 4.287, "step": 298000 }, { "epoch": 1.5, "learning_rate": 7.447518048947838e-05, "loss": 0.007, "step": 298010 }, { "epoch": 1.5, "learning_rate": 7.446761279646437e-05, "loss": 0.0068, "step": 298020 }, { "epoch": 1.5, "learning_rate": 7.446004510345035e-05, "loss": 0.0082, "step": 298030 }, { "epoch": 1.5, "learning_rate": 7.445247741043634e-05, "loss": 0.0062, "step": 298040 }, { "epoch": 1.5, "learning_rate": 7.444490971742233e-05, "loss": 0.0069, "step": 298050 }, { "epoch": 1.5, "learning_rate": 7.443734202440833e-05, "loss": 0.007, "step": 298060 }, { "epoch": 1.5, "learning_rate": 7.442977433139431e-05, "loss": 0.0066, "step": 298070 }, { "epoch": 1.5, "learning_rate": 7.44222066383803e-05, "loss": 0.0067, "step": 298080 }, { "epoch": 1.5, "learning_rate": 7.44146389453663e-05, "loss": 0.0055, "step": 298090 }, { "epoch": 1.5, "learning_rate": 7.440707125235228e-05, "loss": 0.0058, "step": 298100 }, { "epoch": 1.5, "learning_rate": 7.439950355933827e-05, "loss": 0.0085, "step": 298110 }, { "epoch": 1.5, "learning_rate": 7.439193586632426e-05, "loss": 0.0068, "step": 298120 }, { "epoch": 1.5, "learning_rate": 7.438436817331025e-05, "loss": 0.0085, "step": 298130 }, { "epoch": 1.5, "learning_rate": 7.437680048029625e-05, "loss": 0.008, "step": 298140 }, { "epoch": 1.5, "learning_rate": 7.436923278728223e-05, "loss": 0.0079, "step": 298150 }, { "epoch": 1.5, "learning_rate": 7.436166509426822e-05, "loss": 0.007, "step": 298160 }, { "epoch": 1.5, "learning_rate": 7.435409740125422e-05, "loss": 0.0096, "step": 298170 }, { "epoch": 1.5, "learning_rate": 7.43465297082402e-05, "loss": 0.006, "step": 298180 }, { "epoch": 1.5, "learning_rate": 7.43389620152262e-05, "loss": 0.0064, "step": 298190 }, { "epoch": 1.5, "learning_rate": 7.433139432221217e-05, "loss": 0.0068, "step": 298200 }, { "epoch": 1.5, "learning_rate": 7.432382662919817e-05, "loss": 0.0062, "step": 298210 }, { "epoch": 1.5, "learning_rate": 7.431625893618416e-05, "loss": 0.0065, "step": 298220 }, { "epoch": 1.5, "learning_rate": 7.430869124317015e-05, "loss": 0.0086, "step": 298230 }, { "epoch": 1.5, "learning_rate": 7.430112355015614e-05, "loss": 0.0076, "step": 298240 }, { "epoch": 1.5, "learning_rate": 7.429355585714214e-05, "loss": 0.0069, "step": 298250 }, { "epoch": 1.5, "learning_rate": 7.428598816412812e-05, "loss": 0.0074, "step": 298260 }, { "epoch": 1.5, "learning_rate": 7.427842047111411e-05, "loss": 0.0106, "step": 298270 }, { "epoch": 1.5, "learning_rate": 7.427085277810011e-05, "loss": 0.0063, "step": 298280 }, { "epoch": 1.5, "learning_rate": 7.426328508508609e-05, "loss": 0.0075, "step": 298290 }, { "epoch": 1.5, "learning_rate": 7.425571739207208e-05, "loss": 0.0089, "step": 298300 }, { "epoch": 1.51, "learning_rate": 7.424814969905807e-05, "loss": 0.0078, "step": 298310 }, { "epoch": 1.51, "learning_rate": 7.424058200604406e-05, "loss": 0.0061, "step": 298320 }, { "epoch": 1.51, "learning_rate": 7.423301431303006e-05, "loss": 0.008, "step": 298330 }, { "epoch": 1.51, "learning_rate": 7.422544662001604e-05, "loss": 0.0078, "step": 298340 }, { "epoch": 1.51, "learning_rate": 7.421787892700203e-05, "loss": 0.0063, "step": 298350 }, { "epoch": 1.51, "learning_rate": 7.421031123398801e-05, "loss": 0.0066, "step": 298360 }, { "epoch": 1.51, "learning_rate": 7.420274354097401e-05, "loss": 0.0061, "step": 298370 }, { "epoch": 1.51, "learning_rate": 7.419517584795999e-05, "loss": 0.0082, "step": 298380 }, { "epoch": 1.51, "learning_rate": 7.418760815494598e-05, "loss": 0.0134, "step": 298390 }, { "epoch": 1.51, "learning_rate": 7.418004046193197e-05, "loss": 0.0077, "step": 298400 }, { "epoch": 1.51, "learning_rate": 7.417247276891796e-05, "loss": 0.006, "step": 298410 }, { "epoch": 1.51, "learning_rate": 7.416490507590396e-05, "loss": 0.0077, "step": 298420 }, { "epoch": 1.51, "learning_rate": 7.415733738288994e-05, "loss": 0.006, "step": 298430 }, { "epoch": 1.51, "learning_rate": 7.414976968987593e-05, "loss": 0.0089, "step": 298440 }, { "epoch": 1.51, "learning_rate": 7.414220199686193e-05, "loss": 0.0081, "step": 298450 }, { "epoch": 1.51, "learning_rate": 7.413463430384791e-05, "loss": 0.0078, "step": 298460 }, { "epoch": 1.51, "learning_rate": 7.41270666108339e-05, "loss": 0.0075, "step": 298470 }, { "epoch": 1.51, "learning_rate": 7.411949891781989e-05, "loss": 0.0088, "step": 298480 }, { "epoch": 1.51, "learning_rate": 7.411193122480588e-05, "loss": 0.0061, "step": 298490 }, { "epoch": 1.51, "learning_rate": 7.410436353179188e-05, "loss": 0.0078, "step": 298500 }, { "epoch": 1.51, "learning_rate": 7.409679583877786e-05, "loss": 0.0046, "step": 298510 }, { "epoch": 1.51, "learning_rate": 7.408922814576385e-05, "loss": 0.0084, "step": 298520 }, { "epoch": 1.51, "learning_rate": 7.408166045274985e-05, "loss": 0.0057, "step": 298530 }, { "epoch": 1.51, "learning_rate": 7.407409275973583e-05, "loss": 0.0056, "step": 298540 }, { "epoch": 1.51, "learning_rate": 7.406652506672182e-05, "loss": 0.0077, "step": 298550 }, { "epoch": 1.51, "learning_rate": 7.40589573737078e-05, "loss": 0.007, "step": 298560 }, { "epoch": 1.51, "learning_rate": 7.40513896806938e-05, "loss": 0.0072, "step": 298570 }, { "epoch": 1.51, "learning_rate": 7.40438219876798e-05, "loss": 0.0076, "step": 298580 }, { "epoch": 1.51, "learning_rate": 7.403625429466578e-05, "loss": 0.0083, "step": 298590 }, { "epoch": 1.51, "learning_rate": 7.402868660165177e-05, "loss": 0.0087, "step": 298600 }, { "epoch": 1.51, "learning_rate": 7.402111890863777e-05, "loss": 0.008, "step": 298610 }, { "epoch": 1.51, "learning_rate": 7.401355121562375e-05, "loss": 0.0082, "step": 298620 }, { "epoch": 1.51, "learning_rate": 7.400598352260974e-05, "loss": 0.0056, "step": 298630 }, { "epoch": 1.51, "learning_rate": 7.399841582959572e-05, "loss": 0.0064, "step": 298640 }, { "epoch": 1.51, "learning_rate": 7.399084813658172e-05, "loss": 0.0064, "step": 298650 }, { "epoch": 1.51, "learning_rate": 7.398328044356771e-05, "loss": 0.0062, "step": 298660 }, { "epoch": 1.51, "learning_rate": 7.39757127505537e-05, "loss": 0.0065, "step": 298670 }, { "epoch": 1.51, "learning_rate": 7.396814505753968e-05, "loss": 0.0072, "step": 298680 }, { "epoch": 1.51, "learning_rate": 7.396057736452567e-05, "loss": 0.0092, "step": 298690 }, { "epoch": 1.51, "learning_rate": 7.395300967151167e-05, "loss": 0.0088, "step": 298700 }, { "epoch": 1.51, "learning_rate": 7.394544197849765e-05, "loss": 0.0065, "step": 298710 }, { "epoch": 1.51, "learning_rate": 7.393787428548364e-05, "loss": 0.0073, "step": 298720 }, { "epoch": 1.51, "learning_rate": 7.393030659246964e-05, "loss": 0.0068, "step": 298730 }, { "epoch": 1.51, "learning_rate": 7.392273889945562e-05, "loss": 0.0048, "step": 298740 }, { "epoch": 1.51, "learning_rate": 7.391517120644161e-05, "loss": 0.0064, "step": 298750 }, { "epoch": 1.51, "learning_rate": 7.39076035134276e-05, "loss": 0.0092, "step": 298760 }, { "epoch": 1.51, "learning_rate": 7.390003582041359e-05, "loss": 0.0059, "step": 298770 }, { "epoch": 1.51, "learning_rate": 7.389246812739959e-05, "loss": 0.0068, "step": 298780 }, { "epoch": 1.51, "learning_rate": 7.388490043438557e-05, "loss": 0.0073, "step": 298790 }, { "epoch": 1.51, "learning_rate": 7.387733274137156e-05, "loss": 0.0067, "step": 298800 }, { "epoch": 1.51, "learning_rate": 7.386976504835756e-05, "loss": 0.0064, "step": 298810 }, { "epoch": 1.51, "learning_rate": 7.386219735534354e-05, "loss": 0.0075, "step": 298820 }, { "epoch": 1.51, "learning_rate": 7.385462966232953e-05, "loss": 0.0071, "step": 298830 }, { "epoch": 1.51, "learning_rate": 7.384706196931552e-05, "loss": 0.0071, "step": 298840 }, { "epoch": 1.51, "learning_rate": 7.383949427630151e-05, "loss": 0.0055, "step": 298850 }, { "epoch": 1.51, "learning_rate": 7.38319265832875e-05, "loss": 0.0074, "step": 298860 }, { "epoch": 1.51, "learning_rate": 7.382435889027349e-05, "loss": 0.0062, "step": 298870 }, { "epoch": 1.51, "learning_rate": 7.381679119725948e-05, "loss": 0.0074, "step": 298880 }, { "epoch": 1.51, "learning_rate": 7.380922350424548e-05, "loss": 0.0067, "step": 298890 }, { "epoch": 1.51, "learning_rate": 7.380165581123146e-05, "loss": 0.007, "step": 298900 }, { "epoch": 1.51, "learning_rate": 7.379408811821745e-05, "loss": 0.0056, "step": 298910 }, { "epoch": 1.51, "learning_rate": 7.378652042520344e-05, "loss": 0.0082, "step": 298920 }, { "epoch": 1.51, "learning_rate": 7.377895273218943e-05, "loss": 0.0061, "step": 298930 }, { "epoch": 1.51, "learning_rate": 7.377138503917543e-05, "loss": 0.0068, "step": 298940 }, { "epoch": 1.51, "learning_rate": 7.37638173461614e-05, "loss": 0.0071, "step": 298950 }, { "epoch": 1.51, "learning_rate": 7.37562496531474e-05, "loss": 0.006, "step": 298960 }, { "epoch": 1.51, "learning_rate": 7.37486819601334e-05, "loss": 0.0085, "step": 298970 }, { "epoch": 1.51, "learning_rate": 7.374111426711938e-05, "loss": 0.0067, "step": 298980 }, { "epoch": 1.51, "learning_rate": 7.373354657410536e-05, "loss": 0.0072, "step": 298990 }, { "epoch": 1.51, "learning_rate": 7.372597888109135e-05, "loss": 0.0058, "step": 299000 }, { "epoch": 1.51, "eval_cer": 0.9144362920387732, "eval_loss": 0.005306443199515343, "eval_runtime": 116.5784, "eval_samples_per_second": 17.156, "eval_steps_per_second": 4.289, "step": 299000 }, { "epoch": 1.51, "learning_rate": 7.371841118807734e-05, "loss": 0.0063, "step": 299010 }, { "epoch": 1.51, "learning_rate": 7.371084349506333e-05, "loss": 0.0097, "step": 299020 }, { "epoch": 1.51, "learning_rate": 7.370327580204933e-05, "loss": 0.0081, "step": 299030 }, { "epoch": 1.51, "learning_rate": 7.369570810903531e-05, "loss": 0.0069, "step": 299040 }, { "epoch": 1.51, "learning_rate": 7.36881404160213e-05, "loss": 0.0084, "step": 299050 }, { "epoch": 1.51, "learning_rate": 7.36805727230073e-05, "loss": 0.0088, "step": 299060 }, { "epoch": 1.51, "learning_rate": 7.367300502999328e-05, "loss": 0.0067, "step": 299070 }, { "epoch": 1.51, "learning_rate": 7.366543733697927e-05, "loss": 0.0069, "step": 299080 }, { "epoch": 1.51, "learning_rate": 7.365786964396526e-05, "loss": 0.007, "step": 299090 }, { "epoch": 1.51, "learning_rate": 7.365030195095125e-05, "loss": 0.0075, "step": 299100 }, { "epoch": 1.51, "learning_rate": 7.364273425793725e-05, "loss": 0.0069, "step": 299110 }, { "epoch": 1.51, "learning_rate": 7.363516656492323e-05, "loss": 0.0071, "step": 299120 }, { "epoch": 1.51, "learning_rate": 7.362759887190922e-05, "loss": 0.0091, "step": 299130 }, { "epoch": 1.51, "learning_rate": 7.362003117889522e-05, "loss": 0.0067, "step": 299140 }, { "epoch": 1.51, "learning_rate": 7.36124634858812e-05, "loss": 0.0079, "step": 299150 }, { "epoch": 1.51, "learning_rate": 7.360489579286719e-05, "loss": 0.0072, "step": 299160 }, { "epoch": 1.51, "learning_rate": 7.359732809985317e-05, "loss": 0.007, "step": 299170 }, { "epoch": 1.51, "learning_rate": 7.358976040683917e-05, "loss": 0.0054, "step": 299180 }, { "epoch": 1.51, "learning_rate": 7.358219271382516e-05, "loss": 0.0063, "step": 299190 }, { "epoch": 1.51, "learning_rate": 7.357462502081115e-05, "loss": 0.006, "step": 299200 }, { "epoch": 1.51, "learning_rate": 7.356705732779714e-05, "loss": 0.0068, "step": 299210 }, { "epoch": 1.51, "learning_rate": 7.355948963478314e-05, "loss": 0.0071, "step": 299220 }, { "epoch": 1.51, "learning_rate": 7.355192194176912e-05, "loss": 0.0076, "step": 299230 }, { "epoch": 1.51, "learning_rate": 7.354435424875511e-05, "loss": 0.0075, "step": 299240 }, { "epoch": 1.51, "learning_rate": 7.353678655574111e-05, "loss": 0.0082, "step": 299250 }, { "epoch": 1.51, "learning_rate": 7.352921886272709e-05, "loss": 0.008, "step": 299260 }, { "epoch": 1.51, "learning_rate": 7.352165116971308e-05, "loss": 0.0087, "step": 299270 }, { "epoch": 1.51, "learning_rate": 7.351408347669907e-05, "loss": 0.0056, "step": 299280 }, { "epoch": 1.51, "learning_rate": 7.350651578368506e-05, "loss": 0.0062, "step": 299290 }, { "epoch": 1.51, "learning_rate": 7.349894809067104e-05, "loss": 0.0081, "step": 299300 }, { "epoch": 1.51, "learning_rate": 7.349138039765704e-05, "loss": 0.0067, "step": 299310 }, { "epoch": 1.51, "learning_rate": 7.348381270464302e-05, "loss": 0.0076, "step": 299320 }, { "epoch": 1.51, "learning_rate": 7.347624501162901e-05, "loss": 0.0065, "step": 299330 }, { "epoch": 1.51, "learning_rate": 7.346867731861501e-05, "loss": 0.0069, "step": 299340 }, { "epoch": 1.51, "learning_rate": 7.346110962560099e-05, "loss": 0.0052, "step": 299350 }, { "epoch": 1.51, "learning_rate": 7.345354193258698e-05, "loss": 0.0068, "step": 299360 }, { "epoch": 1.51, "learning_rate": 7.344597423957297e-05, "loss": 0.0075, "step": 299370 }, { "epoch": 1.51, "learning_rate": 7.343840654655896e-05, "loss": 0.0095, "step": 299380 }, { "epoch": 1.51, "learning_rate": 7.343083885354496e-05, "loss": 0.009, "step": 299390 }, { "epoch": 1.51, "learning_rate": 7.342327116053094e-05, "loss": 0.0075, "step": 299400 }, { "epoch": 1.51, "learning_rate": 7.341570346751693e-05, "loss": 0.0111, "step": 299410 }, { "epoch": 1.51, "learning_rate": 7.340813577450293e-05, "loss": 0.0064, "step": 299420 }, { "epoch": 1.51, "learning_rate": 7.340056808148891e-05, "loss": 0.0072, "step": 299430 }, { "epoch": 1.51, "learning_rate": 7.33930003884749e-05, "loss": 0.0084, "step": 299440 }, { "epoch": 1.51, "learning_rate": 7.338543269546089e-05, "loss": 0.0067, "step": 299450 }, { "epoch": 1.51, "learning_rate": 7.337786500244688e-05, "loss": 0.0071, "step": 299460 }, { "epoch": 1.51, "learning_rate": 7.337029730943288e-05, "loss": 0.0068, "step": 299470 }, { "epoch": 1.51, "learning_rate": 7.336272961641886e-05, "loss": 0.0053, "step": 299480 }, { "epoch": 1.51, "learning_rate": 7.335516192340485e-05, "loss": 0.008, "step": 299490 }, { "epoch": 1.51, "learning_rate": 7.334759423039085e-05, "loss": 0.0074, "step": 299500 }, { "epoch": 1.51, "learning_rate": 7.334002653737683e-05, "loss": 0.007, "step": 299510 }, { "epoch": 1.51, "learning_rate": 7.333245884436282e-05, "loss": 0.0062, "step": 299520 }, { "epoch": 1.51, "learning_rate": 7.33248911513488e-05, "loss": 0.0082, "step": 299530 }, { "epoch": 1.51, "learning_rate": 7.33173234583348e-05, "loss": 0.0089, "step": 299540 }, { "epoch": 1.51, "learning_rate": 7.33097557653208e-05, "loss": 0.0056, "step": 299550 }, { "epoch": 1.51, "learning_rate": 7.330218807230678e-05, "loss": 0.0068, "step": 299560 }, { "epoch": 1.51, "learning_rate": 7.329462037929277e-05, "loss": 0.0046, "step": 299570 }, { "epoch": 1.51, "learning_rate": 7.328705268627877e-05, "loss": 0.0085, "step": 299580 }, { "epoch": 1.51, "learning_rate": 7.327948499326475e-05, "loss": 0.0064, "step": 299590 }, { "epoch": 1.51, "learning_rate": 7.327191730025074e-05, "loss": 0.0059, "step": 299600 }, { "epoch": 1.51, "learning_rate": 7.326434960723672e-05, "loss": 0.0089, "step": 299610 }, { "epoch": 1.51, "learning_rate": 7.32567819142227e-05, "loss": 0.0097, "step": 299620 }, { "epoch": 1.51, "learning_rate": 7.32492142212087e-05, "loss": 0.0079, "step": 299630 }, { "epoch": 1.51, "learning_rate": 7.32416465281947e-05, "loss": 0.0056, "step": 299640 }, { "epoch": 1.51, "learning_rate": 7.323407883518068e-05, "loss": 0.006, "step": 299650 }, { "epoch": 1.51, "learning_rate": 7.322651114216667e-05, "loss": 0.0078, "step": 299660 }, { "epoch": 1.51, "learning_rate": 7.321894344915267e-05, "loss": 0.0058, "step": 299670 }, { "epoch": 1.51, "learning_rate": 7.321137575613865e-05, "loss": 0.0073, "step": 299680 }, { "epoch": 1.51, "learning_rate": 7.320380806312464e-05, "loss": 0.0075, "step": 299690 }, { "epoch": 1.51, "learning_rate": 7.319624037011064e-05, "loss": 0.008, "step": 299700 }, { "epoch": 1.51, "learning_rate": 7.318867267709662e-05, "loss": 0.0083, "step": 299710 }, { "epoch": 1.51, "learning_rate": 7.318110498408261e-05, "loss": 0.0076, "step": 299720 }, { "epoch": 1.51, "learning_rate": 7.31735372910686e-05, "loss": 0.0068, "step": 299730 }, { "epoch": 1.51, "learning_rate": 7.316596959805459e-05, "loss": 0.0071, "step": 299740 }, { "epoch": 1.51, "learning_rate": 7.315840190504059e-05, "loss": 0.0085, "step": 299750 }, { "epoch": 1.51, "learning_rate": 7.315083421202657e-05, "loss": 0.0082, "step": 299760 }, { "epoch": 1.51, "learning_rate": 7.314326651901256e-05, "loss": 0.0051, "step": 299770 }, { "epoch": 1.51, "learning_rate": 7.313569882599856e-05, "loss": 0.0086, "step": 299780 }, { "epoch": 1.51, "learning_rate": 7.312813113298454e-05, "loss": 0.0059, "step": 299790 }, { "epoch": 1.51, "learning_rate": 7.312056343997053e-05, "loss": 0.0081, "step": 299800 }, { "epoch": 1.51, "learning_rate": 7.311299574695652e-05, "loss": 0.0081, "step": 299810 }, { "epoch": 1.51, "learning_rate": 7.310542805394251e-05, "loss": 0.008, "step": 299820 }, { "epoch": 1.51, "learning_rate": 7.30978603609285e-05, "loss": 0.0073, "step": 299830 }, { "epoch": 1.51, "learning_rate": 7.309029266791449e-05, "loss": 0.0076, "step": 299840 }, { "epoch": 1.51, "learning_rate": 7.308272497490048e-05, "loss": 0.0091, "step": 299850 }, { "epoch": 1.51, "learning_rate": 7.307515728188648e-05, "loss": 0.0067, "step": 299860 }, { "epoch": 1.51, "learning_rate": 7.306758958887246e-05, "loss": 0.0073, "step": 299870 }, { "epoch": 1.51, "learning_rate": 7.306002189585845e-05, "loss": 0.0073, "step": 299880 }, { "epoch": 1.51, "learning_rate": 7.305245420284443e-05, "loss": 0.0062, "step": 299890 }, { "epoch": 1.51, "learning_rate": 7.304488650983043e-05, "loss": 0.0089, "step": 299900 }, { "epoch": 1.51, "learning_rate": 7.303731881681642e-05, "loss": 0.0049, "step": 299910 }, { "epoch": 1.51, "learning_rate": 7.30297511238024e-05, "loss": 0.0078, "step": 299920 }, { "epoch": 1.51, "learning_rate": 7.302218343078839e-05, "loss": 0.0064, "step": 299930 }, { "epoch": 1.51, "learning_rate": 7.301461573777438e-05, "loss": 0.007, "step": 299940 }, { "epoch": 1.51, "learning_rate": 7.300704804476038e-05, "loss": 0.0083, "step": 299950 }, { "epoch": 1.51, "learning_rate": 7.299948035174636e-05, "loss": 0.0068, "step": 299960 }, { "epoch": 1.51, "learning_rate": 7.299191265873235e-05, "loss": 0.0079, "step": 299970 }, { "epoch": 1.51, "learning_rate": 7.298434496571834e-05, "loss": 0.0082, "step": 299980 }, { "epoch": 1.51, "learning_rate": 7.297677727270433e-05, "loss": 0.0087, "step": 299990 }, { "epoch": 1.51, "learning_rate": 7.296920957969033e-05, "loss": 0.0079, "step": 300000 }, { "epoch": 1.51, "eval_cer": 0.9144518183767796, "eval_loss": 0.0054466393776237965, "eval_runtime": 116.3507, "eval_samples_per_second": 17.189, "eval_steps_per_second": 4.297, "step": 300000 }, { "epoch": 1.51, "learning_rate": 7.29616418866763e-05, "loss": 0.0053, "step": 300010 }, { "epoch": 1.51, "learning_rate": 7.29540741936623e-05, "loss": 0.0059, "step": 300020 }, { "epoch": 1.51, "learning_rate": 7.29465065006483e-05, "loss": 0.0092, "step": 300030 }, { "epoch": 1.51, "learning_rate": 7.293893880763428e-05, "loss": 0.014, "step": 300040 }, { "epoch": 1.51, "learning_rate": 7.293137111462027e-05, "loss": 0.0071, "step": 300050 }, { "epoch": 1.51, "learning_rate": 7.292380342160625e-05, "loss": 0.008, "step": 300060 }, { "epoch": 1.51, "learning_rate": 7.291623572859225e-05, "loss": 0.0066, "step": 300070 }, { "epoch": 1.51, "learning_rate": 7.290866803557824e-05, "loss": 0.0085, "step": 300080 }, { "epoch": 1.51, "learning_rate": 7.290110034256423e-05, "loss": 0.0073, "step": 300090 }, { "epoch": 1.51, "learning_rate": 7.289353264955022e-05, "loss": 0.0087, "step": 300100 }, { "epoch": 1.51, "learning_rate": 7.288596495653622e-05, "loss": 0.0047, "step": 300110 }, { "epoch": 1.51, "learning_rate": 7.28783972635222e-05, "loss": 0.01, "step": 300120 }, { "epoch": 1.51, "learning_rate": 7.287082957050819e-05, "loss": 0.0071, "step": 300130 }, { "epoch": 1.51, "learning_rate": 7.286326187749417e-05, "loss": 0.0078, "step": 300140 }, { "epoch": 1.51, "learning_rate": 7.285569418448017e-05, "loss": 0.0104, "step": 300150 }, { "epoch": 1.51, "learning_rate": 7.284812649146616e-05, "loss": 0.0045, "step": 300160 }, { "epoch": 1.51, "learning_rate": 7.284055879845215e-05, "loss": 0.0074, "step": 300170 }, { "epoch": 1.51, "learning_rate": 7.283299110543814e-05, "loss": 0.0069, "step": 300180 }, { "epoch": 1.51, "learning_rate": 7.282542341242414e-05, "loss": 0.0084, "step": 300190 }, { "epoch": 1.51, "learning_rate": 7.281785571941012e-05, "loss": 0.007, "step": 300200 }, { "epoch": 1.51, "learning_rate": 7.281028802639611e-05, "loss": 0.0055, "step": 300210 }, { "epoch": 1.51, "learning_rate": 7.28027203333821e-05, "loss": 0.0085, "step": 300220 }, { "epoch": 1.51, "learning_rate": 7.279515264036809e-05, "loss": 0.0071, "step": 300230 }, { "epoch": 1.51, "learning_rate": 7.278758494735407e-05, "loss": 0.0068, "step": 300240 }, { "epoch": 1.51, "learning_rate": 7.278001725434006e-05, "loss": 0.0064, "step": 300250 }, { "epoch": 1.51, "learning_rate": 7.277244956132605e-05, "loss": 0.0061, "step": 300260 }, { "epoch": 1.51, "learning_rate": 7.276488186831204e-05, "loss": 0.0082, "step": 300270 }, { "epoch": 1.51, "learning_rate": 7.275731417529804e-05, "loss": 0.0063, "step": 300280 }, { "epoch": 1.51, "learning_rate": 7.274974648228402e-05, "loss": 0.0079, "step": 300290 }, { "epoch": 1.52, "learning_rate": 7.274217878927001e-05, "loss": 0.0097, "step": 300300 }, { "epoch": 1.52, "learning_rate": 7.273461109625601e-05, "loss": 0.0074, "step": 300310 }, { "epoch": 1.52, "learning_rate": 7.272704340324199e-05, "loss": 0.005, "step": 300320 }, { "epoch": 1.52, "learning_rate": 7.271947571022798e-05, "loss": 0.0068, "step": 300330 }, { "epoch": 1.52, "learning_rate": 7.271190801721397e-05, "loss": 0.0063, "step": 300340 }, { "epoch": 1.52, "learning_rate": 7.270434032419996e-05, "loss": 0.0092, "step": 300350 }, { "epoch": 1.52, "learning_rate": 7.269677263118596e-05, "loss": 0.0089, "step": 300360 }, { "epoch": 1.52, "learning_rate": 7.268920493817194e-05, "loss": 0.0102, "step": 300370 }, { "epoch": 1.52, "learning_rate": 7.268163724515793e-05, "loss": 0.0072, "step": 300380 }, { "epoch": 1.52, "learning_rate": 7.267406955214393e-05, "loss": 0.0042, "step": 300390 }, { "epoch": 1.52, "learning_rate": 7.266650185912991e-05, "loss": 0.0073, "step": 300400 }, { "epoch": 1.52, "learning_rate": 7.26589341661159e-05, "loss": 0.0056, "step": 300410 }, { "epoch": 1.52, "learning_rate": 7.265136647310188e-05, "loss": 0.0089, "step": 300420 }, { "epoch": 1.52, "learning_rate": 7.264379878008788e-05, "loss": 0.0074, "step": 300430 }, { "epoch": 1.52, "learning_rate": 7.263623108707387e-05, "loss": 0.0068, "step": 300440 }, { "epoch": 1.52, "learning_rate": 7.262866339405986e-05, "loss": 0.0075, "step": 300450 }, { "epoch": 1.52, "learning_rate": 7.262109570104585e-05, "loss": 0.0087, "step": 300460 }, { "epoch": 1.52, "learning_rate": 7.261352800803185e-05, "loss": 0.0055, "step": 300470 }, { "epoch": 1.52, "learning_rate": 7.260596031501783e-05, "loss": 0.0056, "step": 300480 }, { "epoch": 1.52, "learning_rate": 7.259839262200382e-05, "loss": 0.0067, "step": 300490 }, { "epoch": 1.52, "learning_rate": 7.25908249289898e-05, "loss": 0.0061, "step": 300500 }, { "epoch": 1.52, "learning_rate": 7.25832572359758e-05, "loss": 0.0073, "step": 300510 }, { "epoch": 1.52, "learning_rate": 7.25756895429618e-05, "loss": 0.0067, "step": 300520 }, { "epoch": 1.52, "learning_rate": 7.256812184994778e-05, "loss": 0.0076, "step": 300530 }, { "epoch": 1.52, "learning_rate": 7.256055415693377e-05, "loss": 0.0077, "step": 300540 }, { "epoch": 1.52, "learning_rate": 7.255298646391977e-05, "loss": 0.0078, "step": 300550 }, { "epoch": 1.52, "learning_rate": 7.254541877090575e-05, "loss": 0.0076, "step": 300560 }, { "epoch": 1.52, "learning_rate": 7.253785107789173e-05, "loss": 0.0073, "step": 300570 }, { "epoch": 1.52, "learning_rate": 7.253028338487772e-05, "loss": 0.0097, "step": 300580 }, { "epoch": 1.52, "learning_rate": 7.25227156918637e-05, "loss": 0.006, "step": 300590 }, { "epoch": 1.52, "learning_rate": 7.25151479988497e-05, "loss": 0.0063, "step": 300600 }, { "epoch": 1.52, "learning_rate": 7.25075803058357e-05, "loss": 0.0071, "step": 300610 }, { "epoch": 1.52, "learning_rate": 7.250001261282168e-05, "loss": 0.0064, "step": 300620 }, { "epoch": 1.52, "learning_rate": 7.249244491980767e-05, "loss": 0.0069, "step": 300630 }, { "epoch": 1.52, "learning_rate": 7.248487722679367e-05, "loss": 0.0053, "step": 300640 }, { "epoch": 1.52, "learning_rate": 7.247730953377965e-05, "loss": 0.0067, "step": 300650 }, { "epoch": 1.52, "learning_rate": 7.246974184076564e-05, "loss": 0.0069, "step": 300660 }, { "epoch": 1.52, "learning_rate": 7.246217414775164e-05, "loss": 0.0058, "step": 300670 }, { "epoch": 1.52, "learning_rate": 7.245460645473762e-05, "loss": 0.006, "step": 300680 }, { "epoch": 1.52, "learning_rate": 7.244703876172361e-05, "loss": 0.0074, "step": 300690 }, { "epoch": 1.52, "learning_rate": 7.24394710687096e-05, "loss": 0.0079, "step": 300700 }, { "epoch": 1.52, "learning_rate": 7.243190337569559e-05, "loss": 0.0064, "step": 300710 }, { "epoch": 1.52, "learning_rate": 7.242433568268159e-05, "loss": 0.007, "step": 300720 }, { "epoch": 1.52, "learning_rate": 7.241676798966757e-05, "loss": 0.0054, "step": 300730 }, { "epoch": 1.52, "learning_rate": 7.240920029665356e-05, "loss": 0.0078, "step": 300740 }, { "epoch": 1.52, "learning_rate": 7.240163260363956e-05, "loss": 0.006, "step": 300750 }, { "epoch": 1.52, "learning_rate": 7.239406491062554e-05, "loss": 0.0061, "step": 300760 }, { "epoch": 1.52, "learning_rate": 7.238649721761153e-05, "loss": 0.0049, "step": 300770 }, { "epoch": 1.52, "learning_rate": 7.237892952459751e-05, "loss": 0.0065, "step": 300780 }, { "epoch": 1.52, "learning_rate": 7.237136183158351e-05, "loss": 0.0072, "step": 300790 }, { "epoch": 1.52, "learning_rate": 7.23637941385695e-05, "loss": 0.0074, "step": 300800 }, { "epoch": 1.52, "learning_rate": 7.235622644555549e-05, "loss": 0.0064, "step": 300810 }, { "epoch": 1.52, "learning_rate": 7.234865875254148e-05, "loss": 0.0054, "step": 300820 }, { "epoch": 1.52, "learning_rate": 7.234109105952748e-05, "loss": 0.0069, "step": 300830 }, { "epoch": 1.52, "learning_rate": 7.233352336651346e-05, "loss": 0.0058, "step": 300840 }, { "epoch": 1.52, "learning_rate": 7.232595567349945e-05, "loss": 0.0074, "step": 300850 }, { "epoch": 1.52, "learning_rate": 7.231838798048543e-05, "loss": 0.0068, "step": 300860 }, { "epoch": 1.52, "learning_rate": 7.231082028747142e-05, "loss": 0.0062, "step": 300870 }, { "epoch": 1.52, "learning_rate": 7.230325259445741e-05, "loss": 0.0078, "step": 300880 }, { "epoch": 1.52, "learning_rate": 7.22956849014434e-05, "loss": 0.0069, "step": 300890 }, { "epoch": 1.52, "learning_rate": 7.228811720842939e-05, "loss": 0.0063, "step": 300900 }, { "epoch": 1.52, "learning_rate": 7.228054951541538e-05, "loss": 0.0072, "step": 300910 }, { "epoch": 1.52, "learning_rate": 7.227298182240138e-05, "loss": 0.0077, "step": 300920 }, { "epoch": 1.52, "learning_rate": 7.226541412938736e-05, "loss": 0.007, "step": 300930 }, { "epoch": 1.52, "learning_rate": 7.225784643637335e-05, "loss": 0.0064, "step": 300940 }, { "epoch": 1.52, "learning_rate": 7.225027874335933e-05, "loss": 0.0081, "step": 300950 }, { "epoch": 1.52, "learning_rate": 7.224271105034533e-05, "loss": 0.0075, "step": 300960 }, { "epoch": 1.52, "learning_rate": 7.223514335733132e-05, "loss": 0.0079, "step": 300970 }, { "epoch": 1.52, "learning_rate": 7.22275756643173e-05, "loss": 0.006, "step": 300980 }, { "epoch": 1.52, "learning_rate": 7.22200079713033e-05, "loss": 0.0083, "step": 300990 }, { "epoch": 1.52, "learning_rate": 7.22124402782893e-05, "loss": 0.0064, "step": 301000 }, { "epoch": 1.52, "eval_cer": 0.9144430848116509, "eval_loss": 0.00536463363096118, "eval_runtime": 116.4459, "eval_samples_per_second": 17.175, "eval_steps_per_second": 4.294, "step": 301000 }, { "epoch": 1.52, "learning_rate": 7.220487258527528e-05, "loss": 0.0084, "step": 301010 }, { "epoch": 1.52, "learning_rate": 7.219730489226127e-05, "loss": 0.0061, "step": 301020 }, { "epoch": 1.52, "learning_rate": 7.218973719924725e-05, "loss": 0.0083, "step": 301030 }, { "epoch": 1.52, "learning_rate": 7.218216950623325e-05, "loss": 0.0093, "step": 301040 }, { "epoch": 1.52, "learning_rate": 7.217460181321924e-05, "loss": 0.0066, "step": 301050 }, { "epoch": 1.52, "learning_rate": 7.216703412020523e-05, "loss": 0.0059, "step": 301060 }, { "epoch": 1.52, "learning_rate": 7.215946642719122e-05, "loss": 0.0087, "step": 301070 }, { "epoch": 1.52, "learning_rate": 7.215189873417722e-05, "loss": 0.0063, "step": 301080 }, { "epoch": 1.52, "learning_rate": 7.21443310411632e-05, "loss": 0.0064, "step": 301090 }, { "epoch": 1.52, "learning_rate": 7.213676334814919e-05, "loss": 0.008, "step": 301100 }, { "epoch": 1.52, "learning_rate": 7.212919565513517e-05, "loss": 0.0081, "step": 301110 }, { "epoch": 1.52, "learning_rate": 7.212162796212117e-05, "loss": 0.006, "step": 301120 }, { "epoch": 1.52, "learning_rate": 7.211406026910716e-05, "loss": 0.0057, "step": 301130 }, { "epoch": 1.52, "learning_rate": 7.210649257609314e-05, "loss": 0.0065, "step": 301140 }, { "epoch": 1.52, "learning_rate": 7.209892488307914e-05, "loss": 0.0058, "step": 301150 }, { "epoch": 1.52, "learning_rate": 7.209135719006513e-05, "loss": 0.0071, "step": 301160 }, { "epoch": 1.52, "learning_rate": 7.208378949705112e-05, "loss": 0.0048, "step": 301170 }, { "epoch": 1.52, "learning_rate": 7.207622180403711e-05, "loss": 0.0074, "step": 301180 }, { "epoch": 1.52, "learning_rate": 7.206865411102309e-05, "loss": 0.007, "step": 301190 }, { "epoch": 1.52, "learning_rate": 7.206108641800909e-05, "loss": 0.0068, "step": 301200 }, { "epoch": 1.52, "learning_rate": 7.205351872499507e-05, "loss": 0.0054, "step": 301210 }, { "epoch": 1.52, "learning_rate": 7.204595103198106e-05, "loss": 0.0094, "step": 301220 }, { "epoch": 1.52, "learning_rate": 7.203838333896705e-05, "loss": 0.0072, "step": 301230 }, { "epoch": 1.52, "learning_rate": 7.203081564595304e-05, "loss": 0.0104, "step": 301240 }, { "epoch": 1.52, "learning_rate": 7.202324795293904e-05, "loss": 0.0098, "step": 301250 }, { "epoch": 1.52, "learning_rate": 7.201568025992502e-05, "loss": 0.0074, "step": 301260 }, { "epoch": 1.52, "learning_rate": 7.200811256691101e-05, "loss": 0.0081, "step": 301270 }, { "epoch": 1.52, "learning_rate": 7.200054487389701e-05, "loss": 0.0073, "step": 301280 }, { "epoch": 1.52, "learning_rate": 7.199297718088299e-05, "loss": 0.0073, "step": 301290 }, { "epoch": 1.52, "learning_rate": 7.198540948786898e-05, "loss": 0.0067, "step": 301300 }, { "epoch": 1.52, "learning_rate": 7.197784179485496e-05, "loss": 0.0071, "step": 301310 }, { "epoch": 1.52, "learning_rate": 7.197027410184096e-05, "loss": 0.0067, "step": 301320 }, { "epoch": 1.52, "learning_rate": 7.196270640882695e-05, "loss": 0.0071, "step": 301330 }, { "epoch": 1.52, "learning_rate": 7.195513871581294e-05, "loss": 0.0073, "step": 301340 }, { "epoch": 1.52, "learning_rate": 7.194757102279893e-05, "loss": 0.0074, "step": 301350 }, { "epoch": 1.52, "learning_rate": 7.194000332978493e-05, "loss": 0.0065, "step": 301360 }, { "epoch": 1.52, "learning_rate": 7.193243563677091e-05, "loss": 0.0068, "step": 301370 }, { "epoch": 1.52, "learning_rate": 7.19248679437569e-05, "loss": 0.0084, "step": 301380 }, { "epoch": 1.52, "learning_rate": 7.191730025074288e-05, "loss": 0.0068, "step": 301390 }, { "epoch": 1.52, "learning_rate": 7.190973255772888e-05, "loss": 0.0073, "step": 301400 }, { "epoch": 1.52, "learning_rate": 7.190216486471487e-05, "loss": 0.0097, "step": 301410 }, { "epoch": 1.52, "learning_rate": 7.189459717170086e-05, "loss": 0.0067, "step": 301420 }, { "epoch": 1.52, "learning_rate": 7.188702947868685e-05, "loss": 0.0055, "step": 301430 }, { "epoch": 1.52, "learning_rate": 7.187946178567285e-05, "loss": 0.0078, "step": 301440 }, { "epoch": 1.52, "learning_rate": 7.187189409265883e-05, "loss": 0.0055, "step": 301450 }, { "epoch": 1.52, "learning_rate": 7.186432639964482e-05, "loss": 0.0052, "step": 301460 }, { "epoch": 1.52, "learning_rate": 7.18567587066308e-05, "loss": 0.0062, "step": 301470 }, { "epoch": 1.52, "learning_rate": 7.18491910136168e-05, "loss": 0.0064, "step": 301480 }, { "epoch": 1.52, "learning_rate": 7.18416233206028e-05, "loss": 0.0075, "step": 301490 }, { "epoch": 1.52, "learning_rate": 7.183405562758877e-05, "loss": 0.0075, "step": 301500 }, { "epoch": 1.52, "learning_rate": 7.182648793457476e-05, "loss": 0.0069, "step": 301510 }, { "epoch": 1.52, "learning_rate": 7.181892024156075e-05, "loss": 0.0059, "step": 301520 }, { "epoch": 1.52, "learning_rate": 7.181135254854675e-05, "loss": 0.0064, "step": 301530 }, { "epoch": 1.52, "learning_rate": 7.180378485553273e-05, "loss": 0.0088, "step": 301540 }, { "epoch": 1.52, "learning_rate": 7.179621716251872e-05, "loss": 0.0068, "step": 301550 }, { "epoch": 1.52, "learning_rate": 7.17886494695047e-05, "loss": 0.0098, "step": 301560 }, { "epoch": 1.52, "learning_rate": 7.17810817764907e-05, "loss": 0.009, "step": 301570 }, { "epoch": 1.52, "learning_rate": 7.17735140834767e-05, "loss": 0.007, "step": 301580 }, { "epoch": 1.52, "learning_rate": 7.176594639046268e-05, "loss": 0.0057, "step": 301590 }, { "epoch": 1.52, "learning_rate": 7.175837869744867e-05, "loss": 0.0063, "step": 301600 }, { "epoch": 1.52, "learning_rate": 7.175081100443467e-05, "loss": 0.0084, "step": 301610 }, { "epoch": 1.52, "learning_rate": 7.174324331142065e-05, "loss": 0.0068, "step": 301620 }, { "epoch": 1.52, "learning_rate": 7.173567561840664e-05, "loss": 0.0066, "step": 301630 }, { "epoch": 1.52, "learning_rate": 7.172810792539264e-05, "loss": 0.0089, "step": 301640 }, { "epoch": 1.52, "learning_rate": 7.172054023237862e-05, "loss": 0.0055, "step": 301650 }, { "epoch": 1.52, "learning_rate": 7.171297253936461e-05, "loss": 0.0064, "step": 301660 }, { "epoch": 1.52, "learning_rate": 7.17054048463506e-05, "loss": 0.0062, "step": 301670 }, { "epoch": 1.52, "learning_rate": 7.169783715333659e-05, "loss": 0.006, "step": 301680 }, { "epoch": 1.52, "learning_rate": 7.169026946032258e-05, "loss": 0.0064, "step": 301690 }, { "epoch": 1.52, "learning_rate": 7.168270176730857e-05, "loss": 0.0056, "step": 301700 }, { "epoch": 1.52, "learning_rate": 7.167513407429456e-05, "loss": 0.0059, "step": 301710 }, { "epoch": 1.52, "learning_rate": 7.166756638128056e-05, "loss": 0.0081, "step": 301720 }, { "epoch": 1.52, "learning_rate": 7.165999868826654e-05, "loss": 0.0062, "step": 301730 }, { "epoch": 1.52, "learning_rate": 7.165243099525253e-05, "loss": 0.0075, "step": 301740 }, { "epoch": 1.52, "learning_rate": 7.164486330223851e-05, "loss": 0.01, "step": 301750 }, { "epoch": 1.52, "learning_rate": 7.163729560922451e-05, "loss": 0.0084, "step": 301760 }, { "epoch": 1.52, "learning_rate": 7.16297279162105e-05, "loss": 0.0058, "step": 301770 }, { "epoch": 1.52, "learning_rate": 7.162216022319649e-05, "loss": 0.0065, "step": 301780 }, { "epoch": 1.52, "learning_rate": 7.161459253018248e-05, "loss": 0.0057, "step": 301790 }, { "epoch": 1.52, "learning_rate": 7.160702483716848e-05, "loss": 0.0075, "step": 301800 }, { "epoch": 1.52, "learning_rate": 7.159945714415446e-05, "loss": 0.0072, "step": 301810 }, { "epoch": 1.52, "learning_rate": 7.159188945114044e-05, "loss": 0.0066, "step": 301820 }, { "epoch": 1.52, "learning_rate": 7.158432175812643e-05, "loss": 0.0066, "step": 301830 }, { "epoch": 1.52, "learning_rate": 7.157675406511242e-05, "loss": 0.0069, "step": 301840 }, { "epoch": 1.52, "learning_rate": 7.156918637209841e-05, "loss": 0.0069, "step": 301850 }, { "epoch": 1.52, "learning_rate": 7.15616186790844e-05, "loss": 0.0073, "step": 301860 }, { "epoch": 1.52, "learning_rate": 7.155405098607039e-05, "loss": 0.0066, "step": 301870 }, { "epoch": 1.52, "learning_rate": 7.154648329305638e-05, "loss": 0.0064, "step": 301880 }, { "epoch": 1.52, "learning_rate": 7.153891560004238e-05, "loss": 0.0075, "step": 301890 }, { "epoch": 1.52, "learning_rate": 7.153134790702836e-05, "loss": 0.0084, "step": 301900 }, { "epoch": 1.52, "learning_rate": 7.152378021401435e-05, "loss": 0.0063, "step": 301910 }, { "epoch": 1.52, "learning_rate": 7.151621252100033e-05, "loss": 0.0074, "step": 301920 }, { "epoch": 1.52, "learning_rate": 7.150864482798633e-05, "loss": 0.0056, "step": 301930 }, { "epoch": 1.52, "learning_rate": 7.150107713497232e-05, "loss": 0.0065, "step": 301940 }, { "epoch": 1.52, "learning_rate": 7.14935094419583e-05, "loss": 0.0057, "step": 301950 }, { "epoch": 1.52, "learning_rate": 7.14859417489443e-05, "loss": 0.0093, "step": 301960 }, { "epoch": 1.52, "learning_rate": 7.14783740559303e-05, "loss": 0.006, "step": 301970 }, { "epoch": 1.52, "learning_rate": 7.147080636291628e-05, "loss": 0.007, "step": 301980 }, { "epoch": 1.52, "learning_rate": 7.146323866990227e-05, "loss": 0.0069, "step": 301990 }, { "epoch": 1.52, "learning_rate": 7.145567097688825e-05, "loss": 0.008, "step": 302000 }, { "epoch": 1.52, "eval_cer": 0.9144489071884033, "eval_loss": 0.0054143439047038555, "eval_runtime": 116.5206, "eval_samples_per_second": 17.164, "eval_steps_per_second": 4.291, "step": 302000 }, { "epoch": 1.52, "learning_rate": 7.144810328387425e-05, "loss": 0.0075, "step": 302010 }, { "epoch": 1.52, "learning_rate": 7.144053559086024e-05, "loss": 0.0073, "step": 302020 }, { "epoch": 1.52, "learning_rate": 7.143296789784623e-05, "loss": 0.007, "step": 302030 }, { "epoch": 1.52, "learning_rate": 7.142540020483222e-05, "loss": 0.0069, "step": 302040 }, { "epoch": 1.52, "learning_rate": 7.141783251181822e-05, "loss": 0.0078, "step": 302050 }, { "epoch": 1.52, "learning_rate": 7.14102648188042e-05, "loss": 0.0078, "step": 302060 }, { "epoch": 1.52, "learning_rate": 7.140269712579019e-05, "loss": 0.0089, "step": 302070 }, { "epoch": 1.52, "learning_rate": 7.139512943277617e-05, "loss": 0.0071, "step": 302080 }, { "epoch": 1.52, "learning_rate": 7.138756173976217e-05, "loss": 0.0062, "step": 302090 }, { "epoch": 1.52, "learning_rate": 7.137999404674816e-05, "loss": 0.0092, "step": 302100 }, { "epoch": 1.52, "learning_rate": 7.137242635373414e-05, "loss": 0.0076, "step": 302110 }, { "epoch": 1.52, "learning_rate": 7.136485866072014e-05, "loss": 0.0074, "step": 302120 }, { "epoch": 1.52, "learning_rate": 7.135729096770612e-05, "loss": 0.0078, "step": 302130 }, { "epoch": 1.52, "learning_rate": 7.134972327469212e-05, "loss": 0.0068, "step": 302140 }, { "epoch": 1.52, "learning_rate": 7.13421555816781e-05, "loss": 0.0097, "step": 302150 }, { "epoch": 1.52, "learning_rate": 7.133458788866409e-05, "loss": 0.0065, "step": 302160 }, { "epoch": 1.52, "learning_rate": 7.132702019565009e-05, "loss": 0.0067, "step": 302170 }, { "epoch": 1.52, "learning_rate": 7.131945250263607e-05, "loss": 0.0072, "step": 302180 }, { "epoch": 1.52, "learning_rate": 7.131188480962206e-05, "loss": 0.0072, "step": 302190 }, { "epoch": 1.52, "learning_rate": 7.130431711660805e-05, "loss": 0.0072, "step": 302200 }, { "epoch": 1.52, "learning_rate": 7.129674942359404e-05, "loss": 0.006, "step": 302210 }, { "epoch": 1.52, "learning_rate": 7.128918173058004e-05, "loss": 0.0081, "step": 302220 }, { "epoch": 1.52, "learning_rate": 7.128161403756602e-05, "loss": 0.0082, "step": 302230 }, { "epoch": 1.52, "learning_rate": 7.127404634455201e-05, "loss": 0.0083, "step": 302240 }, { "epoch": 1.52, "learning_rate": 7.1266478651538e-05, "loss": 0.0059, "step": 302250 }, { "epoch": 1.52, "learning_rate": 7.125891095852399e-05, "loss": 0.009, "step": 302260 }, { "epoch": 1.52, "learning_rate": 7.125134326550998e-05, "loss": 0.0063, "step": 302270 }, { "epoch": 1.53, "learning_rate": 7.124377557249596e-05, "loss": 0.0061, "step": 302280 }, { "epoch": 1.53, "learning_rate": 7.123620787948196e-05, "loss": 0.0075, "step": 302290 }, { "epoch": 1.53, "learning_rate": 7.122864018646795e-05, "loss": 0.0074, "step": 302300 }, { "epoch": 1.53, "learning_rate": 7.122107249345394e-05, "loss": 0.0064, "step": 302310 }, { "epoch": 1.53, "learning_rate": 7.121350480043993e-05, "loss": 0.0095, "step": 302320 }, { "epoch": 1.53, "learning_rate": 7.120593710742593e-05, "loss": 0.0054, "step": 302330 }, { "epoch": 1.53, "learning_rate": 7.119836941441191e-05, "loss": 0.0072, "step": 302340 }, { "epoch": 1.53, "learning_rate": 7.11908017213979e-05, "loss": 0.0077, "step": 302350 }, { "epoch": 1.53, "learning_rate": 7.118323402838388e-05, "loss": 0.006, "step": 302360 }, { "epoch": 1.53, "learning_rate": 7.117566633536988e-05, "loss": 0.0071, "step": 302370 }, { "epoch": 1.53, "learning_rate": 7.116809864235587e-05, "loss": 0.0073, "step": 302380 }, { "epoch": 1.53, "learning_rate": 7.116053094934186e-05, "loss": 0.0079, "step": 302390 }, { "epoch": 1.53, "learning_rate": 7.115296325632785e-05, "loss": 0.008, "step": 302400 }, { "epoch": 1.53, "learning_rate": 7.114539556331385e-05, "loss": 0.0082, "step": 302410 }, { "epoch": 1.53, "learning_rate": 7.113782787029983e-05, "loss": 0.0085, "step": 302420 }, { "epoch": 1.53, "learning_rate": 7.113026017728582e-05, "loss": 0.0088, "step": 302430 }, { "epoch": 1.53, "learning_rate": 7.11226924842718e-05, "loss": 0.0096, "step": 302440 }, { "epoch": 1.53, "learning_rate": 7.111512479125778e-05, "loss": 0.0068, "step": 302450 }, { "epoch": 1.53, "learning_rate": 7.110755709824378e-05, "loss": 0.0063, "step": 302460 }, { "epoch": 1.53, "learning_rate": 7.109998940522977e-05, "loss": 0.0062, "step": 302470 }, { "epoch": 1.53, "learning_rate": 7.109242171221576e-05, "loss": 0.007, "step": 302480 }, { "epoch": 1.53, "learning_rate": 7.108485401920175e-05, "loss": 0.0101, "step": 302490 }, { "epoch": 1.53, "learning_rate": 7.107728632618775e-05, "loss": 0.0096, "step": 302500 }, { "epoch": 1.53, "learning_rate": 7.106971863317373e-05, "loss": 0.0063, "step": 302510 }, { "epoch": 1.53, "learning_rate": 7.106215094015972e-05, "loss": 0.0061, "step": 302520 }, { "epoch": 1.53, "learning_rate": 7.10545832471457e-05, "loss": 0.0089, "step": 302530 }, { "epoch": 1.53, "learning_rate": 7.10470155541317e-05, "loss": 0.0049, "step": 302540 }, { "epoch": 1.53, "learning_rate": 7.10394478611177e-05, "loss": 0.008, "step": 302550 }, { "epoch": 1.53, "learning_rate": 7.103188016810368e-05, "loss": 0.008, "step": 302560 }, { "epoch": 1.53, "learning_rate": 7.102431247508967e-05, "loss": 0.0065, "step": 302570 }, { "epoch": 1.53, "learning_rate": 7.101674478207567e-05, "loss": 0.0072, "step": 302580 }, { "epoch": 1.53, "learning_rate": 7.100917708906165e-05, "loss": 0.0067, "step": 302590 }, { "epoch": 1.53, "learning_rate": 7.100160939604764e-05, "loss": 0.0093, "step": 302600 }, { "epoch": 1.53, "learning_rate": 7.099404170303364e-05, "loss": 0.0074, "step": 302610 }, { "epoch": 1.53, "learning_rate": 7.098647401001962e-05, "loss": 0.0062, "step": 302620 }, { "epoch": 1.53, "learning_rate": 7.097890631700561e-05, "loss": 0.0067, "step": 302630 }, { "epoch": 1.53, "learning_rate": 7.09713386239916e-05, "loss": 0.0081, "step": 302640 }, { "epoch": 1.53, "learning_rate": 7.096377093097759e-05, "loss": 0.0096, "step": 302650 }, { "epoch": 1.53, "learning_rate": 7.095620323796358e-05, "loss": 0.0079, "step": 302660 }, { "epoch": 1.53, "learning_rate": 7.094863554494957e-05, "loss": 0.007, "step": 302670 }, { "epoch": 1.53, "learning_rate": 7.094106785193556e-05, "loss": 0.0068, "step": 302680 }, { "epoch": 1.53, "learning_rate": 7.093350015892156e-05, "loss": 0.006, "step": 302690 }, { "epoch": 1.53, "learning_rate": 7.092593246590754e-05, "loss": 0.0064, "step": 302700 }, { "epoch": 1.53, "learning_rate": 7.091836477289353e-05, "loss": 0.007, "step": 302710 }, { "epoch": 1.53, "learning_rate": 7.091079707987951e-05, "loss": 0.0063, "step": 302720 }, { "epoch": 1.53, "learning_rate": 7.090322938686551e-05, "loss": 0.0093, "step": 302730 }, { "epoch": 1.53, "learning_rate": 7.08956616938515e-05, "loss": 0.0096, "step": 302740 }, { "epoch": 1.53, "learning_rate": 7.088809400083749e-05, "loss": 0.0067, "step": 302750 }, { "epoch": 1.53, "learning_rate": 7.088052630782347e-05, "loss": 0.0074, "step": 302760 }, { "epoch": 1.53, "learning_rate": 7.087295861480946e-05, "loss": 0.0087, "step": 302770 }, { "epoch": 1.53, "learning_rate": 7.086539092179546e-05, "loss": 0.0074, "step": 302780 }, { "epoch": 1.53, "learning_rate": 7.085782322878144e-05, "loss": 0.0058, "step": 302790 }, { "epoch": 1.53, "learning_rate": 7.085025553576743e-05, "loss": 0.008, "step": 302800 }, { "epoch": 1.53, "learning_rate": 7.084268784275341e-05, "loss": 0.0074, "step": 302810 }, { "epoch": 1.53, "learning_rate": 7.083512014973941e-05, "loss": 0.0066, "step": 302820 }, { "epoch": 1.53, "learning_rate": 7.08275524567254e-05, "loss": 0.0078, "step": 302830 }, { "epoch": 1.53, "learning_rate": 7.081998476371139e-05, "loss": 0.007, "step": 302840 }, { "epoch": 1.53, "learning_rate": 7.081241707069738e-05, "loss": 0.0062, "step": 302850 }, { "epoch": 1.53, "learning_rate": 7.080484937768338e-05, "loss": 0.0077, "step": 302860 }, { "epoch": 1.53, "learning_rate": 7.079728168466936e-05, "loss": 0.0072, "step": 302870 }, { "epoch": 1.53, "learning_rate": 7.078971399165535e-05, "loss": 0.0065, "step": 302880 }, { "epoch": 1.53, "learning_rate": 7.078214629864133e-05, "loss": 0.0054, "step": 302890 }, { "epoch": 1.53, "learning_rate": 7.077457860562733e-05, "loss": 0.0096, "step": 302900 }, { "epoch": 1.53, "learning_rate": 7.076701091261332e-05, "loss": 0.0075, "step": 302910 }, { "epoch": 1.53, "learning_rate": 7.07594432195993e-05, "loss": 0.008, "step": 302920 }, { "epoch": 1.53, "learning_rate": 7.07518755265853e-05, "loss": 0.0098, "step": 302930 }, { "epoch": 1.53, "learning_rate": 7.07443078335713e-05, "loss": 0.0062, "step": 302940 }, { "epoch": 1.53, "learning_rate": 7.073674014055728e-05, "loss": 0.0063, "step": 302950 }, { "epoch": 1.53, "learning_rate": 7.072917244754327e-05, "loss": 0.0054, "step": 302960 }, { "epoch": 1.53, "learning_rate": 7.072160475452925e-05, "loss": 0.0065, "step": 302970 }, { "epoch": 1.53, "learning_rate": 7.071403706151525e-05, "loss": 0.0086, "step": 302980 }, { "epoch": 1.53, "learning_rate": 7.070646936850124e-05, "loss": 0.0093, "step": 302990 }, { "epoch": 1.53, "learning_rate": 7.069890167548722e-05, "loss": 0.0051, "step": 303000 }, { "epoch": 1.53, "eval_cer": 0.9144556999612812, "eval_loss": 0.00549934571608901, "eval_runtime": 116.3379, "eval_samples_per_second": 17.191, "eval_steps_per_second": 4.298, "step": 303000 }, { "epoch": 1.53, "learning_rate": 7.069133398247322e-05, "loss": 0.0096, "step": 303010 }, { "epoch": 1.53, "learning_rate": 7.068376628945921e-05, "loss": 0.0077, "step": 303020 }, { "epoch": 1.53, "learning_rate": 7.06761985964452e-05, "loss": 0.0057, "step": 303030 }, { "epoch": 1.53, "learning_rate": 7.066863090343119e-05, "loss": 0.0071, "step": 303040 }, { "epoch": 1.53, "learning_rate": 7.066106321041717e-05, "loss": 0.0069, "step": 303050 }, { "epoch": 1.53, "learning_rate": 7.065349551740317e-05, "loss": 0.0091, "step": 303060 }, { "epoch": 1.53, "learning_rate": 7.064592782438915e-05, "loss": 0.0078, "step": 303070 }, { "epoch": 1.53, "learning_rate": 7.063836013137514e-05, "loss": 0.0095, "step": 303080 }, { "epoch": 1.53, "learning_rate": 7.063079243836113e-05, "loss": 0.006, "step": 303090 }, { "epoch": 1.53, "learning_rate": 7.062322474534712e-05, "loss": 0.0077, "step": 303100 }, { "epoch": 1.53, "learning_rate": 7.061565705233312e-05, "loss": 0.0072, "step": 303110 }, { "epoch": 1.53, "learning_rate": 7.06080893593191e-05, "loss": 0.0081, "step": 303120 }, { "epoch": 1.53, "learning_rate": 7.060052166630509e-05, "loss": 0.0073, "step": 303130 }, { "epoch": 1.53, "learning_rate": 7.059295397329109e-05, "loss": 0.0089, "step": 303140 }, { "epoch": 1.53, "learning_rate": 7.058538628027707e-05, "loss": 0.0067, "step": 303150 }, { "epoch": 1.53, "learning_rate": 7.057781858726306e-05, "loss": 0.0056, "step": 303160 }, { "epoch": 1.53, "learning_rate": 7.057025089424904e-05, "loss": 0.0055, "step": 303170 }, { "epoch": 1.53, "learning_rate": 7.056268320123504e-05, "loss": 0.0075, "step": 303180 }, { "epoch": 1.53, "learning_rate": 7.055511550822103e-05, "loss": 0.0068, "step": 303190 }, { "epoch": 1.53, "learning_rate": 7.054754781520702e-05, "loss": 0.008, "step": 303200 }, { "epoch": 1.53, "learning_rate": 7.053998012219301e-05, "loss": 0.0089, "step": 303210 }, { "epoch": 1.53, "learning_rate": 7.0532412429179e-05, "loss": 0.0065, "step": 303220 }, { "epoch": 1.53, "learning_rate": 7.052484473616499e-05, "loss": 0.0073, "step": 303230 }, { "epoch": 1.53, "learning_rate": 7.051727704315098e-05, "loss": 0.0082, "step": 303240 }, { "epoch": 1.53, "learning_rate": 7.050970935013696e-05, "loss": 0.0073, "step": 303250 }, { "epoch": 1.53, "learning_rate": 7.050214165712296e-05, "loss": 0.007, "step": 303260 }, { "epoch": 1.53, "learning_rate": 7.049457396410895e-05, "loss": 0.0088, "step": 303270 }, { "epoch": 1.53, "learning_rate": 7.048700627109494e-05, "loss": 0.0083, "step": 303280 }, { "epoch": 1.53, "learning_rate": 7.047943857808093e-05, "loss": 0.006, "step": 303290 }, { "epoch": 1.53, "learning_rate": 7.047187088506693e-05, "loss": 0.0064, "step": 303300 }, { "epoch": 1.53, "learning_rate": 7.046430319205291e-05, "loss": 0.0067, "step": 303310 }, { "epoch": 1.53, "learning_rate": 7.04567354990389e-05, "loss": 0.0073, "step": 303320 }, { "epoch": 1.53, "learning_rate": 7.044916780602488e-05, "loss": 0.0047, "step": 303330 }, { "epoch": 1.53, "learning_rate": 7.044160011301088e-05, "loss": 0.0075, "step": 303340 }, { "epoch": 1.53, "learning_rate": 7.043403241999687e-05, "loss": 0.0067, "step": 303350 }, { "epoch": 1.53, "learning_rate": 7.042646472698285e-05, "loss": 0.0064, "step": 303360 }, { "epoch": 1.53, "learning_rate": 7.041889703396885e-05, "loss": 0.0077, "step": 303370 }, { "epoch": 1.53, "learning_rate": 7.041132934095484e-05, "loss": 0.009, "step": 303380 }, { "epoch": 1.53, "learning_rate": 7.040376164794083e-05, "loss": 0.0069, "step": 303390 }, { "epoch": 1.53, "learning_rate": 7.039619395492681e-05, "loss": 0.0076, "step": 303400 }, { "epoch": 1.53, "learning_rate": 7.03886262619128e-05, "loss": 0.0062, "step": 303410 }, { "epoch": 1.53, "learning_rate": 7.038105856889878e-05, "loss": 0.0063, "step": 303420 }, { "epoch": 1.53, "learning_rate": 7.037349087588478e-05, "loss": 0.0075, "step": 303430 }, { "epoch": 1.53, "learning_rate": 7.036592318287077e-05, "loss": 0.0072, "step": 303440 }, { "epoch": 1.53, "learning_rate": 7.035835548985676e-05, "loss": 0.0051, "step": 303450 }, { "epoch": 1.53, "learning_rate": 7.035078779684275e-05, "loss": 0.0079, "step": 303460 }, { "epoch": 1.53, "learning_rate": 7.034322010382875e-05, "loss": 0.006, "step": 303470 }, { "epoch": 1.53, "learning_rate": 7.033565241081473e-05, "loss": 0.0071, "step": 303480 }, { "epoch": 1.53, "learning_rate": 7.032808471780072e-05, "loss": 0.0067, "step": 303490 }, { "epoch": 1.53, "learning_rate": 7.03205170247867e-05, "loss": 0.0072, "step": 303500 }, { "epoch": 1.53, "learning_rate": 7.03129493317727e-05, "loss": 0.0088, "step": 303510 }, { "epoch": 1.53, "learning_rate": 7.03053816387587e-05, "loss": 0.0078, "step": 303520 }, { "epoch": 1.53, "learning_rate": 7.029781394574467e-05, "loss": 0.0072, "step": 303530 }, { "epoch": 1.53, "learning_rate": 7.029024625273067e-05, "loss": 0.011, "step": 303540 }, { "epoch": 1.53, "learning_rate": 7.028267855971666e-05, "loss": 0.0076, "step": 303550 }, { "epoch": 1.53, "learning_rate": 7.027511086670265e-05, "loss": 0.008, "step": 303560 }, { "epoch": 1.53, "learning_rate": 7.026754317368864e-05, "loss": 0.0067, "step": 303570 }, { "epoch": 1.53, "learning_rate": 7.025997548067464e-05, "loss": 0.0056, "step": 303580 }, { "epoch": 1.53, "learning_rate": 7.025240778766062e-05, "loss": 0.0051, "step": 303590 }, { "epoch": 1.53, "learning_rate": 7.024484009464661e-05, "loss": 0.0074, "step": 303600 }, { "epoch": 1.53, "learning_rate": 7.02372724016326e-05, "loss": 0.0107, "step": 303610 }, { "epoch": 1.53, "learning_rate": 7.022970470861859e-05, "loss": 0.0066, "step": 303620 }, { "epoch": 1.53, "learning_rate": 7.022213701560458e-05, "loss": 0.0066, "step": 303630 }, { "epoch": 1.53, "learning_rate": 7.021456932259057e-05, "loss": 0.0059, "step": 303640 }, { "epoch": 1.53, "learning_rate": 7.020700162957656e-05, "loss": 0.0058, "step": 303650 }, { "epoch": 1.53, "learning_rate": 7.019943393656256e-05, "loss": 0.0054, "step": 303660 }, { "epoch": 1.53, "learning_rate": 7.019186624354854e-05, "loss": 0.0069, "step": 303670 }, { "epoch": 1.53, "learning_rate": 7.018429855053453e-05, "loss": 0.0056, "step": 303680 }, { "epoch": 1.53, "learning_rate": 7.017673085752051e-05, "loss": 0.0067, "step": 303690 }, { "epoch": 1.53, "learning_rate": 7.01691631645065e-05, "loss": 0.0097, "step": 303700 }, { "epoch": 1.53, "learning_rate": 7.016159547149249e-05, "loss": 0.0091, "step": 303710 }, { "epoch": 1.53, "learning_rate": 7.015402777847848e-05, "loss": 0.0069, "step": 303720 }, { "epoch": 1.53, "learning_rate": 7.014646008546447e-05, "loss": 0.0083, "step": 303730 }, { "epoch": 1.53, "learning_rate": 7.013889239245046e-05, "loss": 0.0072, "step": 303740 }, { "epoch": 1.53, "learning_rate": 7.013132469943646e-05, "loss": 0.0057, "step": 303750 }, { "epoch": 1.53, "learning_rate": 7.012375700642244e-05, "loss": 0.0057, "step": 303760 }, { "epoch": 1.53, "learning_rate": 7.011618931340843e-05, "loss": 0.0078, "step": 303770 }, { "epoch": 1.53, "learning_rate": 7.010862162039441e-05, "loss": 0.0086, "step": 303780 }, { "epoch": 1.53, "learning_rate": 7.010105392738041e-05, "loss": 0.0063, "step": 303790 }, { "epoch": 1.53, "learning_rate": 7.00934862343664e-05, "loss": 0.0054, "step": 303800 }, { "epoch": 1.53, "learning_rate": 7.008591854135239e-05, "loss": 0.0068, "step": 303810 }, { "epoch": 1.53, "learning_rate": 7.007835084833838e-05, "loss": 0.0075, "step": 303820 }, { "epoch": 1.53, "learning_rate": 7.007078315532438e-05, "loss": 0.0051, "step": 303830 }, { "epoch": 1.53, "learning_rate": 7.006321546231036e-05, "loss": 0.0055, "step": 303840 }, { "epoch": 1.53, "learning_rate": 7.005564776929635e-05, "loss": 0.004, "step": 303850 }, { "epoch": 1.53, "learning_rate": 7.004808007628233e-05, "loss": 0.0081, "step": 303860 }, { "epoch": 1.53, "learning_rate": 7.004051238326833e-05, "loss": 0.0083, "step": 303870 }, { "epoch": 1.53, "learning_rate": 7.003294469025432e-05, "loss": 0.0058, "step": 303880 }, { "epoch": 1.53, "learning_rate": 7.00253769972403e-05, "loss": 0.0081, "step": 303890 }, { "epoch": 1.53, "learning_rate": 7.00178093042263e-05, "loss": 0.0089, "step": 303900 }, { "epoch": 1.53, "learning_rate": 7.00102416112123e-05, "loss": 0.0087, "step": 303910 }, { "epoch": 1.53, "learning_rate": 7.000267391819828e-05, "loss": 0.0066, "step": 303920 }, { "epoch": 1.53, "learning_rate": 6.999510622518427e-05, "loss": 0.0092, "step": 303930 }, { "epoch": 1.53, "learning_rate": 6.998753853217025e-05, "loss": 0.0053, "step": 303940 }, { "epoch": 1.53, "learning_rate": 6.997997083915625e-05, "loss": 0.0073, "step": 303950 }, { "epoch": 1.53, "learning_rate": 6.997240314614224e-05, "loss": 0.0078, "step": 303960 }, { "epoch": 1.53, "learning_rate": 6.996483545312822e-05, "loss": 0.0074, "step": 303970 }, { "epoch": 1.53, "learning_rate": 6.995726776011422e-05, "loss": 0.0089, "step": 303980 }, { "epoch": 1.53, "learning_rate": 6.994970006710021e-05, "loss": 0.01, "step": 303990 }, { "epoch": 1.53, "learning_rate": 6.99421323740862e-05, "loss": 0.0086, "step": 304000 }, { "epoch": 1.53, "eval_cer": 0.9144459960000272, "eval_loss": 0.005344762932509184, "eval_runtime": 116.3874, "eval_samples_per_second": 17.184, "eval_steps_per_second": 4.296, "step": 304000 }, { "epoch": 1.53, "learning_rate": 6.993456468107218e-05, "loss": 0.0104, "step": 304010 }, { "epoch": 1.53, "learning_rate": 6.992699698805817e-05, "loss": 0.0061, "step": 304020 }, { "epoch": 1.53, "learning_rate": 6.991942929504417e-05, "loss": 0.0075, "step": 304030 }, { "epoch": 1.53, "learning_rate": 6.991186160203015e-05, "loss": 0.0075, "step": 304040 }, { "epoch": 1.53, "learning_rate": 6.990429390901614e-05, "loss": 0.0103, "step": 304050 }, { "epoch": 1.53, "learning_rate": 6.989672621600212e-05, "loss": 0.009, "step": 304060 }, { "epoch": 1.53, "learning_rate": 6.988915852298812e-05, "loss": 0.0096, "step": 304070 }, { "epoch": 1.53, "learning_rate": 6.988159082997411e-05, "loss": 0.0083, "step": 304080 }, { "epoch": 1.53, "learning_rate": 6.98740231369601e-05, "loss": 0.0059, "step": 304090 }, { "epoch": 1.53, "learning_rate": 6.986645544394609e-05, "loss": 0.0074, "step": 304100 }, { "epoch": 1.53, "learning_rate": 6.985888775093209e-05, "loss": 0.0088, "step": 304110 }, { "epoch": 1.53, "learning_rate": 6.985132005791807e-05, "loss": 0.009, "step": 304120 }, { "epoch": 1.53, "learning_rate": 6.984375236490406e-05, "loss": 0.006, "step": 304130 }, { "epoch": 1.53, "learning_rate": 6.983618467189004e-05, "loss": 0.0071, "step": 304140 }, { "epoch": 1.53, "learning_rate": 6.982861697887604e-05, "loss": 0.0086, "step": 304150 }, { "epoch": 1.53, "learning_rate": 6.982104928586203e-05, "loss": 0.0077, "step": 304160 }, { "epoch": 1.53, "learning_rate": 6.981348159284802e-05, "loss": 0.0076, "step": 304170 }, { "epoch": 1.53, "learning_rate": 6.980591389983401e-05, "loss": 0.0059, "step": 304180 }, { "epoch": 1.53, "learning_rate": 6.979834620682e-05, "loss": 0.008, "step": 304190 }, { "epoch": 1.53, "learning_rate": 6.979077851380599e-05, "loss": 0.0072, "step": 304200 }, { "epoch": 1.53, "learning_rate": 6.978321082079198e-05, "loss": 0.0058, "step": 304210 }, { "epoch": 1.53, "learning_rate": 6.977564312777796e-05, "loss": 0.0063, "step": 304220 }, { "epoch": 1.53, "learning_rate": 6.976807543476396e-05, "loss": 0.0078, "step": 304230 }, { "epoch": 1.53, "learning_rate": 6.976050774174995e-05, "loss": 0.0091, "step": 304240 }, { "epoch": 1.53, "learning_rate": 6.975294004873593e-05, "loss": 0.0068, "step": 304250 }, { "epoch": 1.54, "learning_rate": 6.974537235572193e-05, "loss": 0.0074, "step": 304260 }, { "epoch": 1.54, "learning_rate": 6.973780466270792e-05, "loss": 0.0067, "step": 304270 }, { "epoch": 1.54, "learning_rate": 6.97302369696939e-05, "loss": 0.0097, "step": 304280 }, { "epoch": 1.54, "learning_rate": 6.97226692766799e-05, "loss": 0.0082, "step": 304290 }, { "epoch": 1.54, "learning_rate": 6.971510158366588e-05, "loss": 0.0078, "step": 304300 }, { "epoch": 1.54, "learning_rate": 6.970753389065188e-05, "loss": 0.0093, "step": 304310 }, { "epoch": 1.54, "learning_rate": 6.969996619763787e-05, "loss": 0.0068, "step": 304320 }, { "epoch": 1.54, "learning_rate": 6.969239850462385e-05, "loss": 0.0098, "step": 304330 }, { "epoch": 1.54, "learning_rate": 6.968483081160984e-05, "loss": 0.01, "step": 304340 }, { "epoch": 1.54, "learning_rate": 6.967726311859583e-05, "loss": 0.0062, "step": 304350 }, { "epoch": 1.54, "learning_rate": 6.966969542558183e-05, "loss": 0.0081, "step": 304360 }, { "epoch": 1.54, "learning_rate": 6.966212773256781e-05, "loss": 0.0085, "step": 304370 }, { "epoch": 1.54, "learning_rate": 6.96545600395538e-05, "loss": 0.0072, "step": 304380 }, { "epoch": 1.54, "learning_rate": 6.964699234653978e-05, "loss": 0.0075, "step": 304390 }, { "epoch": 1.54, "learning_rate": 6.963942465352578e-05, "loss": 0.0048, "step": 304400 }, { "epoch": 1.54, "learning_rate": 6.963185696051177e-05, "loss": 0.0064, "step": 304410 }, { "epoch": 1.54, "learning_rate": 6.962428926749775e-05, "loss": 0.0057, "step": 304420 }, { "epoch": 1.54, "learning_rate": 6.961672157448375e-05, "loss": 0.0063, "step": 304430 }, { "epoch": 1.54, "learning_rate": 6.960915388146974e-05, "loss": 0.0069, "step": 304440 }, { "epoch": 1.54, "learning_rate": 6.960158618845573e-05, "loss": 0.0072, "step": 304450 }, { "epoch": 1.54, "learning_rate": 6.959401849544172e-05, "loss": 0.0065, "step": 304460 }, { "epoch": 1.54, "learning_rate": 6.95864508024277e-05, "loss": 0.0063, "step": 304470 }, { "epoch": 1.54, "learning_rate": 6.95788831094137e-05, "loss": 0.009, "step": 304480 }, { "epoch": 1.54, "learning_rate": 6.957131541639969e-05, "loss": 0.0058, "step": 304490 }, { "epoch": 1.54, "learning_rate": 6.956374772338567e-05, "loss": 0.0067, "step": 304500 }, { "epoch": 1.54, "learning_rate": 6.955618003037167e-05, "loss": 0.0064, "step": 304510 }, { "epoch": 1.54, "learning_rate": 6.954861233735766e-05, "loss": 0.0096, "step": 304520 }, { "epoch": 1.54, "learning_rate": 6.954104464434365e-05, "loss": 0.0095, "step": 304530 }, { "epoch": 1.54, "learning_rate": 6.953347695132964e-05, "loss": 0.0055, "step": 304540 }, { "epoch": 1.54, "learning_rate": 6.952590925831564e-05, "loss": 0.0069, "step": 304550 }, { "epoch": 1.54, "learning_rate": 6.951834156530162e-05, "loss": 0.0061, "step": 304560 }, { "epoch": 1.54, "learning_rate": 6.951077387228761e-05, "loss": 0.0067, "step": 304570 }, { "epoch": 1.54, "learning_rate": 6.95032061792736e-05, "loss": 0.0065, "step": 304580 }, { "epoch": 1.54, "learning_rate": 6.949563848625959e-05, "loss": 0.0052, "step": 304590 }, { "epoch": 1.54, "learning_rate": 6.948807079324558e-05, "loss": 0.0079, "step": 304600 }, { "epoch": 1.54, "learning_rate": 6.948050310023157e-05, "loss": 0.0062, "step": 304610 }, { "epoch": 1.54, "learning_rate": 6.947293540721756e-05, "loss": 0.0096, "step": 304620 }, { "epoch": 1.54, "learning_rate": 6.946536771420355e-05, "loss": 0.0075, "step": 304630 }, { "epoch": 1.54, "learning_rate": 6.945780002118954e-05, "loss": 0.0071, "step": 304640 }, { "epoch": 1.54, "learning_rate": 6.945023232817552e-05, "loss": 0.0062, "step": 304650 }, { "epoch": 1.54, "learning_rate": 6.944266463516151e-05, "loss": 0.0061, "step": 304660 }, { "epoch": 1.54, "learning_rate": 6.94350969421475e-05, "loss": 0.0064, "step": 304670 }, { "epoch": 1.54, "learning_rate": 6.942752924913349e-05, "loss": 0.0068, "step": 304680 }, { "epoch": 1.54, "learning_rate": 6.941996155611948e-05, "loss": 0.0057, "step": 304690 }, { "epoch": 1.54, "learning_rate": 6.941239386310547e-05, "loss": 0.0057, "step": 304700 }, { "epoch": 1.54, "learning_rate": 6.940482617009146e-05, "loss": 0.0083, "step": 304710 }, { "epoch": 1.54, "learning_rate": 6.939725847707746e-05, "loss": 0.0068, "step": 304720 }, { "epoch": 1.54, "learning_rate": 6.938969078406344e-05, "loss": 0.0071, "step": 304730 }, { "epoch": 1.54, "learning_rate": 6.938212309104943e-05, "loss": 0.0071, "step": 304740 }, { "epoch": 1.54, "learning_rate": 6.937455539803541e-05, "loss": 0.0073, "step": 304750 }, { "epoch": 1.54, "learning_rate": 6.936698770502141e-05, "loss": 0.0086, "step": 304760 }, { "epoch": 1.54, "learning_rate": 6.93594200120074e-05, "loss": 0.0068, "step": 304770 }, { "epoch": 1.54, "learning_rate": 6.935185231899339e-05, "loss": 0.0077, "step": 304780 }, { "epoch": 1.54, "learning_rate": 6.934428462597938e-05, "loss": 0.0075, "step": 304790 }, { "epoch": 1.54, "learning_rate": 6.933671693296538e-05, "loss": 0.0065, "step": 304800 }, { "epoch": 1.54, "learning_rate": 6.932914923995136e-05, "loss": 0.0065, "step": 304810 }, { "epoch": 1.54, "learning_rate": 6.932158154693735e-05, "loss": 0.009, "step": 304820 }, { "epoch": 1.54, "learning_rate": 6.931401385392333e-05, "loss": 0.006, "step": 304830 }, { "epoch": 1.54, "learning_rate": 6.930644616090933e-05, "loss": 0.005, "step": 304840 }, { "epoch": 1.54, "learning_rate": 6.929887846789532e-05, "loss": 0.0064, "step": 304850 }, { "epoch": 1.54, "learning_rate": 6.92913107748813e-05, "loss": 0.0072, "step": 304860 }, { "epoch": 1.54, "learning_rate": 6.92837430818673e-05, "loss": 0.0061, "step": 304870 }, { "epoch": 1.54, "learning_rate": 6.92761753888533e-05, "loss": 0.0061, "step": 304880 }, { "epoch": 1.54, "learning_rate": 6.926860769583928e-05, "loss": 0.007, "step": 304890 }, { "epoch": 1.54, "learning_rate": 6.926104000282527e-05, "loss": 0.0063, "step": 304900 }, { "epoch": 1.54, "learning_rate": 6.925347230981125e-05, "loss": 0.0073, "step": 304910 }, { "epoch": 1.54, "learning_rate": 6.924590461679725e-05, "loss": 0.007, "step": 304920 }, { "epoch": 1.54, "learning_rate": 6.923833692378324e-05, "loss": 0.006, "step": 304930 }, { "epoch": 1.54, "learning_rate": 6.923076923076922e-05, "loss": 0.0057, "step": 304940 }, { "epoch": 1.54, "learning_rate": 6.922320153775522e-05, "loss": 0.0056, "step": 304950 }, { "epoch": 1.54, "learning_rate": 6.92156338447412e-05, "loss": 0.0055, "step": 304960 }, { "epoch": 1.54, "learning_rate": 6.92080661517272e-05, "loss": 0.0077, "step": 304970 }, { "epoch": 1.54, "learning_rate": 6.920049845871318e-05, "loss": 0.0074, "step": 304980 }, { "epoch": 1.54, "learning_rate": 6.919293076569917e-05, "loss": 0.0056, "step": 304990 }, { "epoch": 1.54, "learning_rate": 6.918536307268517e-05, "loss": 0.0072, "step": 305000 }, { "epoch": 1.54, "eval_cer": 0.9144392032271493, "eval_loss": 0.0054320478811860085, "eval_runtime": 116.39, "eval_samples_per_second": 17.184, "eval_steps_per_second": 4.296, "step": 305000 }, { "epoch": 1.54, "learning_rate": 6.917779537967115e-05, "loss": 0.0077, "step": 305010 }, { "epoch": 1.54, "learning_rate": 6.917022768665714e-05, "loss": 0.0075, "step": 305020 }, { "epoch": 1.54, "learning_rate": 6.916265999364312e-05, "loss": 0.0113, "step": 305030 }, { "epoch": 1.54, "learning_rate": 6.915509230062912e-05, "loss": 0.0112, "step": 305040 }, { "epoch": 1.54, "learning_rate": 6.914752460761511e-05, "loss": 0.0063, "step": 305050 }, { "epoch": 1.54, "learning_rate": 6.91399569146011e-05, "loss": 0.0066, "step": 305060 }, { "epoch": 1.54, "learning_rate": 6.913238922158709e-05, "loss": 0.0076, "step": 305070 }, { "epoch": 1.54, "learning_rate": 6.912482152857309e-05, "loss": 0.0063, "step": 305080 }, { "epoch": 1.54, "learning_rate": 6.911725383555907e-05, "loss": 0.0071, "step": 305090 }, { "epoch": 1.54, "learning_rate": 6.910968614254506e-05, "loss": 0.0077, "step": 305100 }, { "epoch": 1.54, "learning_rate": 6.910211844953104e-05, "loss": 0.0052, "step": 305110 }, { "epoch": 1.54, "learning_rate": 6.909455075651704e-05, "loss": 0.0065, "step": 305120 }, { "epoch": 1.54, "learning_rate": 6.908698306350303e-05, "loss": 0.0074, "step": 305130 }, { "epoch": 1.54, "learning_rate": 6.907941537048902e-05, "loss": 0.0073, "step": 305140 }, { "epoch": 1.54, "learning_rate": 6.907184767747501e-05, "loss": 0.0064, "step": 305150 }, { "epoch": 1.54, "learning_rate": 6.9064279984461e-05, "loss": 0.0052, "step": 305160 }, { "epoch": 1.54, "learning_rate": 6.905671229144699e-05, "loss": 0.0068, "step": 305170 }, { "epoch": 1.54, "learning_rate": 6.904914459843298e-05, "loss": 0.0085, "step": 305180 }, { "epoch": 1.54, "learning_rate": 6.904157690541896e-05, "loss": 0.0084, "step": 305190 }, { "epoch": 1.54, "learning_rate": 6.903400921240496e-05, "loss": 0.0076, "step": 305200 }, { "epoch": 1.54, "learning_rate": 6.902644151939095e-05, "loss": 0.0077, "step": 305210 }, { "epoch": 1.54, "learning_rate": 6.901887382637693e-05, "loss": 0.0082, "step": 305220 }, { "epoch": 1.54, "learning_rate": 6.901130613336293e-05, "loss": 0.007, "step": 305230 }, { "epoch": 1.54, "learning_rate": 6.900373844034892e-05, "loss": 0.0057, "step": 305240 }, { "epoch": 1.54, "learning_rate": 6.89961707473349e-05, "loss": 0.0061, "step": 305250 }, { "epoch": 1.54, "learning_rate": 6.89886030543209e-05, "loss": 0.0083, "step": 305260 }, { "epoch": 1.54, "learning_rate": 6.898103536130688e-05, "loss": 0.007, "step": 305270 }, { "epoch": 1.54, "learning_rate": 6.897346766829286e-05, "loss": 0.0073, "step": 305280 }, { "epoch": 1.54, "learning_rate": 6.896589997527886e-05, "loss": 0.0125, "step": 305290 }, { "epoch": 1.54, "learning_rate": 6.895833228226485e-05, "loss": 0.0074, "step": 305300 }, { "epoch": 1.54, "learning_rate": 6.895076458925084e-05, "loss": 0.0065, "step": 305310 }, { "epoch": 1.54, "learning_rate": 6.894319689623683e-05, "loss": 0.0071, "step": 305320 }, { "epoch": 1.54, "learning_rate": 6.893562920322283e-05, "loss": 0.008, "step": 305330 }, { "epoch": 1.54, "learning_rate": 6.89280615102088e-05, "loss": 0.0071, "step": 305340 }, { "epoch": 1.54, "learning_rate": 6.89204938171948e-05, "loss": 0.0078, "step": 305350 }, { "epoch": 1.54, "learning_rate": 6.891292612418078e-05, "loss": 0.0078, "step": 305360 }, { "epoch": 1.54, "learning_rate": 6.890535843116678e-05, "loss": 0.0088, "step": 305370 }, { "epoch": 1.54, "learning_rate": 6.889779073815277e-05, "loss": 0.0065, "step": 305380 }, { "epoch": 1.54, "learning_rate": 6.889022304513875e-05, "loss": 0.0063, "step": 305390 }, { "epoch": 1.54, "learning_rate": 6.888265535212475e-05, "loss": 0.0081, "step": 305400 }, { "epoch": 1.54, "learning_rate": 6.887508765911074e-05, "loss": 0.0076, "step": 305410 }, { "epoch": 1.54, "learning_rate": 6.886751996609673e-05, "loss": 0.0055, "step": 305420 }, { "epoch": 1.54, "learning_rate": 6.885995227308272e-05, "loss": 0.0075, "step": 305430 }, { "epoch": 1.54, "learning_rate": 6.88523845800687e-05, "loss": 0.0064, "step": 305440 }, { "epoch": 1.54, "learning_rate": 6.88448168870547e-05, "loss": 0.008, "step": 305450 }, { "epoch": 1.54, "learning_rate": 6.883724919404069e-05, "loss": 0.0097, "step": 305460 }, { "epoch": 1.54, "learning_rate": 6.882968150102667e-05, "loss": 0.0075, "step": 305470 }, { "epoch": 1.54, "learning_rate": 6.882211380801267e-05, "loss": 0.0073, "step": 305480 }, { "epoch": 1.54, "learning_rate": 6.881454611499866e-05, "loss": 0.0097, "step": 305490 }, { "epoch": 1.54, "learning_rate": 6.880697842198465e-05, "loss": 0.0072, "step": 305500 }, { "epoch": 1.54, "learning_rate": 6.879941072897064e-05, "loss": 0.0097, "step": 305510 }, { "epoch": 1.54, "learning_rate": 6.879184303595664e-05, "loss": 0.0062, "step": 305520 }, { "epoch": 1.54, "learning_rate": 6.878427534294262e-05, "loss": 0.0083, "step": 305530 }, { "epoch": 1.54, "learning_rate": 6.877670764992861e-05, "loss": 0.0087, "step": 305540 }, { "epoch": 1.54, "learning_rate": 6.876913995691459e-05, "loss": 0.0063, "step": 305550 }, { "epoch": 1.54, "learning_rate": 6.876157226390059e-05, "loss": 0.0082, "step": 305560 }, { "epoch": 1.54, "learning_rate": 6.875400457088658e-05, "loss": 0.0079, "step": 305570 }, { "epoch": 1.54, "learning_rate": 6.874643687787256e-05, "loss": 0.0066, "step": 305580 }, { "epoch": 1.54, "learning_rate": 6.873886918485855e-05, "loss": 0.0066, "step": 305590 }, { "epoch": 1.54, "learning_rate": 6.873130149184454e-05, "loss": 0.0063, "step": 305600 }, { "epoch": 1.54, "learning_rate": 6.872373379883054e-05, "loss": 0.0062, "step": 305610 }, { "epoch": 1.54, "learning_rate": 6.871616610581652e-05, "loss": 0.0075, "step": 305620 }, { "epoch": 1.54, "learning_rate": 6.870859841280251e-05, "loss": 0.0075, "step": 305630 }, { "epoch": 1.54, "learning_rate": 6.87010307197885e-05, "loss": 0.0067, "step": 305640 }, { "epoch": 1.54, "learning_rate": 6.869346302677449e-05, "loss": 0.0067, "step": 305650 }, { "epoch": 1.54, "learning_rate": 6.868589533376048e-05, "loss": 0.0052, "step": 305660 }, { "epoch": 1.54, "learning_rate": 6.867832764074647e-05, "loss": 0.007, "step": 305670 }, { "epoch": 1.54, "learning_rate": 6.867075994773246e-05, "loss": 0.0059, "step": 305680 }, { "epoch": 1.54, "learning_rate": 6.866319225471846e-05, "loss": 0.0081, "step": 305690 }, { "epoch": 1.54, "learning_rate": 6.865562456170444e-05, "loss": 0.0098, "step": 305700 }, { "epoch": 1.54, "learning_rate": 6.864805686869043e-05, "loss": 0.0078, "step": 305710 }, { "epoch": 1.54, "learning_rate": 6.864048917567641e-05, "loss": 0.0078, "step": 305720 }, { "epoch": 1.54, "learning_rate": 6.863292148266241e-05, "loss": 0.0102, "step": 305730 }, { "epoch": 1.54, "learning_rate": 6.86253537896484e-05, "loss": 0.0075, "step": 305740 }, { "epoch": 1.54, "learning_rate": 6.861778609663438e-05, "loss": 0.01, "step": 305750 }, { "epoch": 1.54, "learning_rate": 6.861021840362038e-05, "loss": 0.0059, "step": 305760 }, { "epoch": 1.54, "learning_rate": 6.860265071060637e-05, "loss": 0.0093, "step": 305770 }, { "epoch": 1.54, "learning_rate": 6.859508301759236e-05, "loss": 0.0073, "step": 305780 }, { "epoch": 1.54, "learning_rate": 6.858751532457835e-05, "loss": 0.0054, "step": 305790 }, { "epoch": 1.54, "learning_rate": 6.857994763156433e-05, "loss": 0.0063, "step": 305800 }, { "epoch": 1.54, "learning_rate": 6.857237993855033e-05, "loss": 0.0071, "step": 305810 }, { "epoch": 1.54, "learning_rate": 6.856481224553632e-05, "loss": 0.0067, "step": 305820 }, { "epoch": 1.54, "learning_rate": 6.85572445525223e-05, "loss": 0.0083, "step": 305830 }, { "epoch": 1.54, "learning_rate": 6.85496768595083e-05, "loss": 0.0068, "step": 305840 }, { "epoch": 1.54, "learning_rate": 6.85421091664943e-05, "loss": 0.0068, "step": 305850 }, { "epoch": 1.54, "learning_rate": 6.853454147348028e-05, "loss": 0.0065, "step": 305860 }, { "epoch": 1.54, "learning_rate": 6.852697378046627e-05, "loss": 0.0068, "step": 305870 }, { "epoch": 1.54, "learning_rate": 6.851940608745225e-05, "loss": 0.0063, "step": 305880 }, { "epoch": 1.54, "learning_rate": 6.851183839443825e-05, "loss": 0.0102, "step": 305890 }, { "epoch": 1.54, "learning_rate": 6.850427070142423e-05, "loss": 0.0069, "step": 305900 }, { "epoch": 1.54, "learning_rate": 6.849670300841022e-05, "loss": 0.0071, "step": 305910 }, { "epoch": 1.54, "learning_rate": 6.84891353153962e-05, "loss": 0.0068, "step": 305920 }, { "epoch": 1.54, "learning_rate": 6.84815676223822e-05, "loss": 0.0069, "step": 305930 }, { "epoch": 1.54, "learning_rate": 6.84739999293682e-05, "loss": 0.0066, "step": 305940 }, { "epoch": 1.54, "learning_rate": 6.846643223635418e-05, "loss": 0.0081, "step": 305950 }, { "epoch": 1.54, "learning_rate": 6.845886454334017e-05, "loss": 0.0058, "step": 305960 }, { "epoch": 1.54, "learning_rate": 6.845129685032617e-05, "loss": 0.0064, "step": 305970 }, { "epoch": 1.54, "learning_rate": 6.844372915731215e-05, "loss": 0.0072, "step": 305980 }, { "epoch": 1.54, "learning_rate": 6.843616146429814e-05, "loss": 0.0072, "step": 305990 }, { "epoch": 1.54, "learning_rate": 6.842859377128412e-05, "loss": 0.0088, "step": 306000 }, { "epoch": 1.54, "eval_cer": 0.9144450256039017, "eval_loss": 0.00540526770055294, "eval_runtime": 116.2539, "eval_samples_per_second": 17.204, "eval_steps_per_second": 4.301, "step": 306000 }, { "epoch": 1.54, "learning_rate": 6.842102607827012e-05, "loss": 0.0125, "step": 306010 }, { "epoch": 1.54, "learning_rate": 6.841345838525611e-05, "loss": 0.0056, "step": 306020 }, { "epoch": 1.54, "learning_rate": 6.84058906922421e-05, "loss": 0.0085, "step": 306030 }, { "epoch": 1.54, "learning_rate": 6.839832299922809e-05, "loss": 0.0083, "step": 306040 }, { "epoch": 1.54, "learning_rate": 6.839075530621409e-05, "loss": 0.0074, "step": 306050 }, { "epoch": 1.54, "learning_rate": 6.838318761320007e-05, "loss": 0.005, "step": 306060 }, { "epoch": 1.54, "learning_rate": 6.837561992018606e-05, "loss": 0.0062, "step": 306070 }, { "epoch": 1.54, "learning_rate": 6.836805222717204e-05, "loss": 0.0113, "step": 306080 }, { "epoch": 1.54, "learning_rate": 6.836048453415804e-05, "loss": 0.0057, "step": 306090 }, { "epoch": 1.54, "learning_rate": 6.835291684114403e-05, "loss": 0.0053, "step": 306100 }, { "epoch": 1.54, "learning_rate": 6.834534914813001e-05, "loss": 0.0088, "step": 306110 }, { "epoch": 1.54, "learning_rate": 6.833778145511601e-05, "loss": 0.0087, "step": 306120 }, { "epoch": 1.54, "learning_rate": 6.8330213762102e-05, "loss": 0.01, "step": 306130 }, { "epoch": 1.54, "learning_rate": 6.832264606908799e-05, "loss": 0.0061, "step": 306140 }, { "epoch": 1.54, "learning_rate": 6.831507837607398e-05, "loss": 0.0076, "step": 306150 }, { "epoch": 1.54, "learning_rate": 6.830751068305996e-05, "loss": 0.0066, "step": 306160 }, { "epoch": 1.54, "learning_rate": 6.829994299004596e-05, "loss": 0.0066, "step": 306170 }, { "epoch": 1.54, "learning_rate": 6.829237529703195e-05, "loss": 0.0064, "step": 306180 }, { "epoch": 1.54, "learning_rate": 6.828480760401793e-05, "loss": 0.0071, "step": 306190 }, { "epoch": 1.54, "learning_rate": 6.827723991100393e-05, "loss": 0.0068, "step": 306200 }, { "epoch": 1.54, "learning_rate": 6.826967221798991e-05, "loss": 0.0074, "step": 306210 }, { "epoch": 1.54, "learning_rate": 6.82621045249759e-05, "loss": 0.0069, "step": 306220 }, { "epoch": 1.54, "learning_rate": 6.825453683196189e-05, "loss": 0.0043, "step": 306230 }, { "epoch": 1.55, "learning_rate": 6.824696913894788e-05, "loss": 0.0071, "step": 306240 }, { "epoch": 1.55, "learning_rate": 6.823940144593386e-05, "loss": 0.0071, "step": 306250 }, { "epoch": 1.55, "learning_rate": 6.823183375291986e-05, "loss": 0.0093, "step": 306260 }, { "epoch": 1.55, "learning_rate": 6.822426605990585e-05, "loss": 0.0074, "step": 306270 }, { "epoch": 1.55, "learning_rate": 6.821669836689183e-05, "loss": 0.008, "step": 306280 }, { "epoch": 1.55, "learning_rate": 6.820913067387783e-05, "loss": 0.0068, "step": 306290 }, { "epoch": 1.55, "learning_rate": 6.820156298086382e-05, "loss": 0.0068, "step": 306300 }, { "epoch": 1.55, "learning_rate": 6.81939952878498e-05, "loss": 0.0055, "step": 306310 }, { "epoch": 1.55, "learning_rate": 6.81864275948358e-05, "loss": 0.0073, "step": 306320 }, { "epoch": 1.55, "learning_rate": 6.817885990182178e-05, "loss": 0.0097, "step": 306330 }, { "epoch": 1.55, "learning_rate": 6.817129220880778e-05, "loss": 0.007, "step": 306340 }, { "epoch": 1.55, "learning_rate": 6.816372451579377e-05, "loss": 0.0064, "step": 306350 }, { "epoch": 1.55, "learning_rate": 6.815615682277975e-05, "loss": 0.0081, "step": 306360 }, { "epoch": 1.55, "learning_rate": 6.814858912976575e-05, "loss": 0.0076, "step": 306370 }, { "epoch": 1.55, "learning_rate": 6.814102143675174e-05, "loss": 0.0065, "step": 306380 }, { "epoch": 1.55, "learning_rate": 6.813345374373773e-05, "loss": 0.0073, "step": 306390 }, { "epoch": 1.55, "learning_rate": 6.812588605072372e-05, "loss": 0.0066, "step": 306400 }, { "epoch": 1.55, "learning_rate": 6.81183183577097e-05, "loss": 0.0068, "step": 306410 }, { "epoch": 1.55, "learning_rate": 6.81107506646957e-05, "loss": 0.0067, "step": 306420 }, { "epoch": 1.55, "learning_rate": 6.810318297168169e-05, "loss": 0.0062, "step": 306430 }, { "epoch": 1.55, "learning_rate": 6.809561527866767e-05, "loss": 0.0067, "step": 306440 }, { "epoch": 1.55, "learning_rate": 6.808804758565367e-05, "loss": 0.0063, "step": 306450 }, { "epoch": 1.55, "learning_rate": 6.808047989263966e-05, "loss": 0.0082, "step": 306460 }, { "epoch": 1.55, "learning_rate": 6.807291219962564e-05, "loss": 0.0057, "step": 306470 }, { "epoch": 1.55, "learning_rate": 6.806534450661164e-05, "loss": 0.0066, "step": 306480 }, { "epoch": 1.55, "learning_rate": 6.805777681359763e-05, "loss": 0.0072, "step": 306490 }, { "epoch": 1.55, "learning_rate": 6.805020912058362e-05, "loss": 0.0057, "step": 306500 }, { "epoch": 1.55, "learning_rate": 6.804264142756961e-05, "loss": 0.0081, "step": 306510 }, { "epoch": 1.55, "learning_rate": 6.803507373455559e-05, "loss": 0.0069, "step": 306520 }, { "epoch": 1.55, "learning_rate": 6.802750604154157e-05, "loss": 0.0066, "step": 306530 }, { "epoch": 1.55, "learning_rate": 6.801993834852757e-05, "loss": 0.0049, "step": 306540 }, { "epoch": 1.55, "learning_rate": 6.801237065551356e-05, "loss": 0.0082, "step": 306550 }, { "epoch": 1.55, "learning_rate": 6.800480296249955e-05, "loss": 0.0088, "step": 306560 }, { "epoch": 1.55, "learning_rate": 6.799723526948554e-05, "loss": 0.0056, "step": 306570 }, { "epoch": 1.55, "learning_rate": 6.798966757647154e-05, "loss": 0.0099, "step": 306580 }, { "epoch": 1.55, "learning_rate": 6.798209988345752e-05, "loss": 0.0051, "step": 306590 }, { "epoch": 1.55, "learning_rate": 6.797453219044351e-05, "loss": 0.0076, "step": 306600 }, { "epoch": 1.55, "learning_rate": 6.79669644974295e-05, "loss": 0.0061, "step": 306610 }, { "epoch": 1.55, "learning_rate": 6.795939680441549e-05, "loss": 0.0079, "step": 306620 }, { "epoch": 1.55, "learning_rate": 6.795182911140148e-05, "loss": 0.006, "step": 306630 }, { "epoch": 1.55, "learning_rate": 6.794426141838746e-05, "loss": 0.013, "step": 306640 }, { "epoch": 1.55, "learning_rate": 6.793669372537346e-05, "loss": 0.0068, "step": 306650 }, { "epoch": 1.55, "learning_rate": 6.792912603235945e-05, "loss": 0.0089, "step": 306660 }, { "epoch": 1.55, "learning_rate": 6.792155833934544e-05, "loss": 0.0074, "step": 306670 }, { "epoch": 1.55, "learning_rate": 6.791399064633143e-05, "loss": 0.0064, "step": 306680 }, { "epoch": 1.55, "learning_rate": 6.790642295331741e-05, "loss": 0.0063, "step": 306690 }, { "epoch": 1.55, "learning_rate": 6.789885526030341e-05, "loss": 0.008, "step": 306700 }, { "epoch": 1.55, "learning_rate": 6.78912875672894e-05, "loss": 0.0067, "step": 306710 }, { "epoch": 1.55, "learning_rate": 6.788371987427538e-05, "loss": 0.0059, "step": 306720 }, { "epoch": 1.55, "learning_rate": 6.787615218126138e-05, "loss": 0.0082, "step": 306730 }, { "epoch": 1.55, "learning_rate": 6.786858448824737e-05, "loss": 0.0068, "step": 306740 }, { "epoch": 1.55, "learning_rate": 6.786101679523336e-05, "loss": 0.007, "step": 306750 }, { "epoch": 1.55, "learning_rate": 6.785344910221935e-05, "loss": 0.0094, "step": 306760 }, { "epoch": 1.55, "learning_rate": 6.784588140920533e-05, "loss": 0.0067, "step": 306770 }, { "epoch": 1.55, "learning_rate": 6.783831371619133e-05, "loss": 0.0062, "step": 306780 }, { "epoch": 1.55, "learning_rate": 6.783074602317732e-05, "loss": 0.0094, "step": 306790 }, { "epoch": 1.55, "learning_rate": 6.78231783301633e-05, "loss": 0.0059, "step": 306800 }, { "epoch": 1.55, "learning_rate": 6.78156106371493e-05, "loss": 0.0077, "step": 306810 }, { "epoch": 1.55, "learning_rate": 6.78080429441353e-05, "loss": 0.0076, "step": 306820 }, { "epoch": 1.55, "learning_rate": 6.780047525112127e-05, "loss": 0.0093, "step": 306830 }, { "epoch": 1.55, "learning_rate": 6.779290755810726e-05, "loss": 0.0072, "step": 306840 }, { "epoch": 1.55, "learning_rate": 6.778533986509325e-05, "loss": 0.008, "step": 306850 }, { "epoch": 1.55, "learning_rate": 6.777777217207923e-05, "loss": 0.0065, "step": 306860 }, { "epoch": 1.55, "learning_rate": 6.777020447906523e-05, "loss": 0.0074, "step": 306870 }, { "epoch": 1.55, "learning_rate": 6.776263678605122e-05, "loss": 0.0068, "step": 306880 }, { "epoch": 1.55, "learning_rate": 6.77550690930372e-05, "loss": 0.0058, "step": 306890 }, { "epoch": 1.55, "learning_rate": 6.77475014000232e-05, "loss": 0.0067, "step": 306900 }, { "epoch": 1.55, "learning_rate": 6.77399337070092e-05, "loss": 0.0065, "step": 306910 }, { "epoch": 1.55, "learning_rate": 6.773236601399518e-05, "loss": 0.0066, "step": 306920 }, { "epoch": 1.55, "learning_rate": 6.772479832098117e-05, "loss": 0.0066, "step": 306930 }, { "epoch": 1.55, "learning_rate": 6.771723062796717e-05, "loss": 0.0056, "step": 306940 }, { "epoch": 1.55, "learning_rate": 6.770966293495315e-05, "loss": 0.0055, "step": 306950 }, { "epoch": 1.55, "learning_rate": 6.770209524193914e-05, "loss": 0.0072, "step": 306960 }, { "epoch": 1.55, "learning_rate": 6.769452754892512e-05, "loss": 0.0055, "step": 306970 }, { "epoch": 1.55, "learning_rate": 6.768695985591112e-05, "loss": 0.0095, "step": 306980 }, { "epoch": 1.55, "learning_rate": 6.767939216289711e-05, "loss": 0.0047, "step": 306990 }, { "epoch": 1.55, "learning_rate": 6.76718244698831e-05, "loss": 0.0055, "step": 307000 }, { "epoch": 1.55, "eval_cer": 0.9144605519419082, "eval_loss": 0.005416039377450943, "eval_runtime": 116.4069, "eval_samples_per_second": 17.181, "eval_steps_per_second": 4.295, "step": 307000 }, { "epoch": 1.55, "learning_rate": 6.766425677686909e-05, "loss": 0.0072, "step": 307010 }, { "epoch": 1.55, "learning_rate": 6.765668908385508e-05, "loss": 0.0061, "step": 307020 }, { "epoch": 1.55, "learning_rate": 6.764912139084107e-05, "loss": 0.0074, "step": 307030 }, { "epoch": 1.55, "learning_rate": 6.764155369782706e-05, "loss": 0.0077, "step": 307040 }, { "epoch": 1.55, "learning_rate": 6.763398600481304e-05, "loss": 0.009, "step": 307050 }, { "epoch": 1.55, "learning_rate": 6.762641831179904e-05, "loss": 0.0073, "step": 307060 }, { "epoch": 1.55, "learning_rate": 6.761885061878503e-05, "loss": 0.0068, "step": 307070 }, { "epoch": 1.55, "learning_rate": 6.761128292577101e-05, "loss": 0.0065, "step": 307080 }, { "epoch": 1.55, "learning_rate": 6.760371523275701e-05, "loss": 0.0078, "step": 307090 }, { "epoch": 1.55, "learning_rate": 6.7596147539743e-05, "loss": 0.0068, "step": 307100 }, { "epoch": 1.55, "learning_rate": 6.758857984672899e-05, "loss": 0.0069, "step": 307110 }, { "epoch": 1.55, "learning_rate": 6.758101215371498e-05, "loss": 0.0059, "step": 307120 }, { "epoch": 1.55, "learning_rate": 6.757344446070096e-05, "loss": 0.0061, "step": 307130 }, { "epoch": 1.55, "learning_rate": 6.756587676768696e-05, "loss": 0.0079, "step": 307140 }, { "epoch": 1.55, "learning_rate": 6.755830907467295e-05, "loss": 0.0074, "step": 307150 }, { "epoch": 1.55, "learning_rate": 6.755074138165893e-05, "loss": 0.0074, "step": 307160 }, { "epoch": 1.55, "learning_rate": 6.754317368864491e-05, "loss": 0.0064, "step": 307170 }, { "epoch": 1.55, "learning_rate": 6.753560599563091e-05, "loss": 0.0069, "step": 307180 }, { "epoch": 1.55, "learning_rate": 6.75280383026169e-05, "loss": 0.0056, "step": 307190 }, { "epoch": 1.55, "learning_rate": 6.752047060960289e-05, "loss": 0.0062, "step": 307200 }, { "epoch": 1.55, "learning_rate": 6.751290291658888e-05, "loss": 0.0093, "step": 307210 }, { "epoch": 1.55, "learning_rate": 6.750533522357486e-05, "loss": 0.0079, "step": 307220 }, { "epoch": 1.55, "learning_rate": 6.749776753056086e-05, "loss": 0.006, "step": 307230 }, { "epoch": 1.55, "learning_rate": 6.749019983754685e-05, "loss": 0.0075, "step": 307240 }, { "epoch": 1.55, "learning_rate": 6.748263214453283e-05, "loss": 0.0054, "step": 307250 }, { "epoch": 1.55, "learning_rate": 6.747506445151883e-05, "loss": 0.0066, "step": 307260 }, { "epoch": 1.55, "learning_rate": 6.746749675850482e-05, "loss": 0.0086, "step": 307270 }, { "epoch": 1.55, "learning_rate": 6.74599290654908e-05, "loss": 0.0054, "step": 307280 }, { "epoch": 1.55, "learning_rate": 6.74523613724768e-05, "loss": 0.0071, "step": 307290 }, { "epoch": 1.55, "learning_rate": 6.744479367946278e-05, "loss": 0.007, "step": 307300 }, { "epoch": 1.55, "learning_rate": 6.743722598644878e-05, "loss": 0.0066, "step": 307310 }, { "epoch": 1.55, "learning_rate": 6.742965829343477e-05, "loss": 0.0073, "step": 307320 }, { "epoch": 1.55, "learning_rate": 6.742209060042075e-05, "loss": 0.006, "step": 307330 }, { "epoch": 1.55, "learning_rate": 6.741452290740675e-05, "loss": 0.0069, "step": 307340 }, { "epoch": 1.55, "learning_rate": 6.740695521439274e-05, "loss": 0.0068, "step": 307350 }, { "epoch": 1.55, "learning_rate": 6.739938752137872e-05, "loss": 0.0062, "step": 307360 }, { "epoch": 1.55, "learning_rate": 6.739181982836472e-05, "loss": 0.0045, "step": 307370 }, { "epoch": 1.55, "learning_rate": 6.73842521353507e-05, "loss": 0.006, "step": 307380 }, { "epoch": 1.55, "learning_rate": 6.73766844423367e-05, "loss": 0.0059, "step": 307390 }, { "epoch": 1.55, "learning_rate": 6.736911674932269e-05, "loss": 0.0059, "step": 307400 }, { "epoch": 1.55, "learning_rate": 6.736154905630867e-05, "loss": 0.0067, "step": 307410 }, { "epoch": 1.55, "learning_rate": 6.735398136329467e-05, "loss": 0.0072, "step": 307420 }, { "epoch": 1.55, "learning_rate": 6.734641367028066e-05, "loss": 0.0053, "step": 307430 }, { "epoch": 1.55, "learning_rate": 6.733884597726664e-05, "loss": 0.0061, "step": 307440 }, { "epoch": 1.55, "learning_rate": 6.733127828425264e-05, "loss": 0.0079, "step": 307450 }, { "epoch": 1.55, "learning_rate": 6.732371059123863e-05, "loss": 0.0144, "step": 307460 }, { "epoch": 1.55, "learning_rate": 6.731614289822462e-05, "loss": 0.0054, "step": 307470 }, { "epoch": 1.55, "learning_rate": 6.73085752052106e-05, "loss": 0.0063, "step": 307480 }, { "epoch": 1.55, "learning_rate": 6.730100751219659e-05, "loss": 0.0064, "step": 307490 }, { "epoch": 1.55, "learning_rate": 6.729343981918257e-05, "loss": 0.0069, "step": 307500 }, { "epoch": 1.55, "learning_rate": 6.728587212616857e-05, "loss": 0.0077, "step": 307510 }, { "epoch": 1.55, "learning_rate": 6.727830443315456e-05, "loss": 0.0096, "step": 307520 }, { "epoch": 1.55, "learning_rate": 6.727073674014055e-05, "loss": 0.0054, "step": 307530 }, { "epoch": 1.55, "learning_rate": 6.726316904712654e-05, "loss": 0.0062, "step": 307540 }, { "epoch": 1.55, "learning_rate": 6.725560135411254e-05, "loss": 0.0076, "step": 307550 }, { "epoch": 1.55, "learning_rate": 6.724803366109852e-05, "loss": 0.0062, "step": 307560 }, { "epoch": 1.55, "learning_rate": 6.724046596808451e-05, "loss": 0.0057, "step": 307570 }, { "epoch": 1.55, "learning_rate": 6.723289827507049e-05, "loss": 0.011, "step": 307580 }, { "epoch": 1.55, "learning_rate": 6.722533058205649e-05, "loss": 0.0045, "step": 307590 }, { "epoch": 1.55, "learning_rate": 6.721776288904248e-05, "loss": 0.0067, "step": 307600 }, { "epoch": 1.55, "learning_rate": 6.721019519602846e-05, "loss": 0.0079, "step": 307610 }, { "epoch": 1.55, "learning_rate": 6.720262750301446e-05, "loss": 0.0064, "step": 307620 }, { "epoch": 1.55, "learning_rate": 6.719505981000045e-05, "loss": 0.0074, "step": 307630 }, { "epoch": 1.55, "learning_rate": 6.718749211698644e-05, "loss": 0.0046, "step": 307640 }, { "epoch": 1.55, "learning_rate": 6.717992442397243e-05, "loss": 0.0071, "step": 307650 }, { "epoch": 1.55, "learning_rate": 6.717235673095841e-05, "loss": 0.0054, "step": 307660 }, { "epoch": 1.55, "learning_rate": 6.716478903794441e-05, "loss": 0.0056, "step": 307670 }, { "epoch": 1.55, "learning_rate": 6.71572213449304e-05, "loss": 0.0076, "step": 307680 }, { "epoch": 1.55, "learning_rate": 6.714965365191638e-05, "loss": 0.0085, "step": 307690 }, { "epoch": 1.55, "learning_rate": 6.714208595890238e-05, "loss": 0.007, "step": 307700 }, { "epoch": 1.55, "learning_rate": 6.713451826588837e-05, "loss": 0.0072, "step": 307710 }, { "epoch": 1.55, "learning_rate": 6.712695057287436e-05, "loss": 0.0068, "step": 307720 }, { "epoch": 1.55, "learning_rate": 6.711938287986035e-05, "loss": 0.0056, "step": 307730 }, { "epoch": 1.55, "learning_rate": 6.711181518684633e-05, "loss": 0.0065, "step": 307740 }, { "epoch": 1.55, "learning_rate": 6.710424749383233e-05, "loss": 0.0054, "step": 307750 }, { "epoch": 1.55, "learning_rate": 6.709667980081832e-05, "loss": 0.0056, "step": 307760 }, { "epoch": 1.55, "learning_rate": 6.70891121078043e-05, "loss": 0.0088, "step": 307770 }, { "epoch": 1.55, "learning_rate": 6.70815444147903e-05, "loss": 0.0073, "step": 307780 }, { "epoch": 1.55, "learning_rate": 6.707397672177628e-05, "loss": 0.008, "step": 307790 }, { "epoch": 1.55, "learning_rate": 6.706640902876227e-05, "loss": 0.0063, "step": 307800 }, { "epoch": 1.55, "learning_rate": 6.705884133574826e-05, "loss": 0.0079, "step": 307810 }, { "epoch": 1.55, "learning_rate": 6.705127364273425e-05, "loss": 0.0056, "step": 307820 }, { "epoch": 1.55, "learning_rate": 6.704370594972023e-05, "loss": 0.0079, "step": 307830 }, { "epoch": 1.55, "learning_rate": 6.703613825670623e-05, "loss": 0.007, "step": 307840 }, { "epoch": 1.55, "learning_rate": 6.702857056369222e-05, "loss": 0.0076, "step": 307850 }, { "epoch": 1.55, "learning_rate": 6.70210028706782e-05, "loss": 0.0084, "step": 307860 }, { "epoch": 1.55, "learning_rate": 6.70134351776642e-05, "loss": 0.0082, "step": 307870 }, { "epoch": 1.55, "learning_rate": 6.70058674846502e-05, "loss": 0.0076, "step": 307880 }, { "epoch": 1.55, "learning_rate": 6.699829979163618e-05, "loss": 0.0079, "step": 307890 }, { "epoch": 1.55, "learning_rate": 6.699073209862217e-05, "loss": 0.0054, "step": 307900 }, { "epoch": 1.55, "learning_rate": 6.698316440560817e-05, "loss": 0.0069, "step": 307910 }, { "epoch": 1.55, "learning_rate": 6.697559671259415e-05, "loss": 0.0058, "step": 307920 }, { "epoch": 1.55, "learning_rate": 6.696802901958014e-05, "loss": 0.0079, "step": 307930 }, { "epoch": 1.55, "learning_rate": 6.696046132656612e-05, "loss": 0.0084, "step": 307940 }, { "epoch": 1.55, "learning_rate": 6.695289363355212e-05, "loss": 0.0076, "step": 307950 }, { "epoch": 1.55, "learning_rate": 6.694532594053811e-05, "loss": 0.006, "step": 307960 }, { "epoch": 1.55, "learning_rate": 6.69377582475241e-05, "loss": 0.0067, "step": 307970 }, { "epoch": 1.55, "learning_rate": 6.693019055451009e-05, "loss": 0.0098, "step": 307980 }, { "epoch": 1.55, "learning_rate": 6.692262286149608e-05, "loss": 0.0056, "step": 307990 }, { "epoch": 1.55, "learning_rate": 6.691505516848207e-05, "loss": 0.0078, "step": 308000 }, { "epoch": 1.55, "eval_cer": 0.9144828710527925, "eval_loss": 0.005395396146923304, "eval_runtime": 116.4162, "eval_samples_per_second": 17.18, "eval_steps_per_second": 4.295, "step": 308000 }, { "epoch": 1.55, "learning_rate": 6.690748747546806e-05, "loss": 0.006, "step": 308010 }, { "epoch": 1.55, "learning_rate": 6.689991978245404e-05, "loss": 0.0053, "step": 308020 }, { "epoch": 1.55, "learning_rate": 6.689235208944004e-05, "loss": 0.0059, "step": 308030 }, { "epoch": 1.55, "learning_rate": 6.688478439642603e-05, "loss": 0.0071, "step": 308040 }, { "epoch": 1.55, "learning_rate": 6.687721670341201e-05, "loss": 0.0075, "step": 308050 }, { "epoch": 1.55, "learning_rate": 6.686964901039801e-05, "loss": 0.0048, "step": 308060 }, { "epoch": 1.55, "learning_rate": 6.6862081317384e-05, "loss": 0.0096, "step": 308070 }, { "epoch": 1.55, "learning_rate": 6.685451362436999e-05, "loss": 0.0086, "step": 308080 }, { "epoch": 1.55, "learning_rate": 6.684694593135598e-05, "loss": 0.0062, "step": 308090 }, { "epoch": 1.55, "learning_rate": 6.683937823834196e-05, "loss": 0.0048, "step": 308100 }, { "epoch": 1.55, "learning_rate": 6.683181054532794e-05, "loss": 0.0063, "step": 308110 }, { "epoch": 1.55, "learning_rate": 6.682424285231394e-05, "loss": 0.0091, "step": 308120 }, { "epoch": 1.55, "learning_rate": 6.681667515929993e-05, "loss": 0.006, "step": 308130 }, { "epoch": 1.55, "learning_rate": 6.680910746628591e-05, "loss": 0.0075, "step": 308140 }, { "epoch": 1.55, "learning_rate": 6.680153977327191e-05, "loss": 0.0061, "step": 308150 }, { "epoch": 1.55, "learning_rate": 6.67939720802579e-05, "loss": 0.0084, "step": 308160 }, { "epoch": 1.55, "learning_rate": 6.678640438724389e-05, "loss": 0.0074, "step": 308170 }, { "epoch": 1.55, "learning_rate": 6.677883669422988e-05, "loss": 0.0083, "step": 308180 }, { "epoch": 1.55, "learning_rate": 6.677126900121586e-05, "loss": 0.0069, "step": 308190 }, { "epoch": 1.55, "learning_rate": 6.676370130820186e-05, "loss": 0.0066, "step": 308200 }, { "epoch": 1.55, "learning_rate": 6.675613361518785e-05, "loss": 0.007, "step": 308210 }, { "epoch": 1.56, "learning_rate": 6.674856592217383e-05, "loss": 0.0074, "step": 308220 }, { "epoch": 1.56, "learning_rate": 6.674099822915983e-05, "loss": 0.0068, "step": 308230 }, { "epoch": 1.56, "learning_rate": 6.673343053614582e-05, "loss": 0.0075, "step": 308240 }, { "epoch": 1.56, "learning_rate": 6.67258628431318e-05, "loss": 0.0067, "step": 308250 }, { "epoch": 1.56, "learning_rate": 6.67182951501178e-05, "loss": 0.0096, "step": 308260 }, { "epoch": 1.56, "learning_rate": 6.671072745710378e-05, "loss": 0.0067, "step": 308270 }, { "epoch": 1.56, "learning_rate": 6.670315976408978e-05, "loss": 0.0069, "step": 308280 }, { "epoch": 1.56, "learning_rate": 6.669559207107577e-05, "loss": 0.0078, "step": 308290 }, { "epoch": 1.56, "learning_rate": 6.668802437806175e-05, "loss": 0.0092, "step": 308300 }, { "epoch": 1.56, "learning_rate": 6.668045668504775e-05, "loss": 0.0076, "step": 308310 }, { "epoch": 1.56, "learning_rate": 6.667288899203374e-05, "loss": 0.0076, "step": 308320 }, { "epoch": 1.56, "learning_rate": 6.666532129901972e-05, "loss": 0.0058, "step": 308330 }, { "epoch": 1.56, "learning_rate": 6.665775360600572e-05, "loss": 0.0059, "step": 308340 }, { "epoch": 1.56, "learning_rate": 6.66501859129917e-05, "loss": 0.0076, "step": 308350 }, { "epoch": 1.56, "learning_rate": 6.66426182199777e-05, "loss": 0.0062, "step": 308360 }, { "epoch": 1.56, "learning_rate": 6.663505052696369e-05, "loss": 0.0086, "step": 308370 }, { "epoch": 1.56, "learning_rate": 6.662748283394967e-05, "loss": 0.0079, "step": 308380 }, { "epoch": 1.56, "learning_rate": 6.661991514093567e-05, "loss": 0.0084, "step": 308390 }, { "epoch": 1.56, "learning_rate": 6.661234744792166e-05, "loss": 0.0066, "step": 308400 }, { "epoch": 1.56, "learning_rate": 6.660477975490764e-05, "loss": 0.0073, "step": 308410 }, { "epoch": 1.56, "learning_rate": 6.659721206189363e-05, "loss": 0.0106, "step": 308420 }, { "epoch": 1.56, "learning_rate": 6.658964436887962e-05, "loss": 0.0071, "step": 308430 }, { "epoch": 1.56, "learning_rate": 6.658207667586562e-05, "loss": 0.0098, "step": 308440 }, { "epoch": 1.56, "learning_rate": 6.65745089828516e-05, "loss": 0.0068, "step": 308450 }, { "epoch": 1.56, "learning_rate": 6.656694128983759e-05, "loss": 0.0061, "step": 308460 }, { "epoch": 1.56, "learning_rate": 6.655937359682357e-05, "loss": 0.0077, "step": 308470 }, { "epoch": 1.56, "learning_rate": 6.655180590380957e-05, "loss": 0.0062, "step": 308480 }, { "epoch": 1.56, "learning_rate": 6.654423821079556e-05, "loss": 0.0051, "step": 308490 }, { "epoch": 1.56, "learning_rate": 6.653667051778154e-05, "loss": 0.0074, "step": 308500 }, { "epoch": 1.56, "learning_rate": 6.652910282476754e-05, "loss": 0.0078, "step": 308510 }, { "epoch": 1.56, "learning_rate": 6.652153513175353e-05, "loss": 0.0066, "step": 308520 }, { "epoch": 1.56, "learning_rate": 6.651396743873952e-05, "loss": 0.0079, "step": 308530 }, { "epoch": 1.56, "learning_rate": 6.650639974572551e-05, "loss": 0.0084, "step": 308540 }, { "epoch": 1.56, "learning_rate": 6.649883205271149e-05, "loss": 0.006, "step": 308550 }, { "epoch": 1.56, "learning_rate": 6.649126435969749e-05, "loss": 0.0072, "step": 308560 }, { "epoch": 1.56, "learning_rate": 6.648369666668348e-05, "loss": 0.0064, "step": 308570 }, { "epoch": 1.56, "learning_rate": 6.647612897366946e-05, "loss": 0.008, "step": 308580 }, { "epoch": 1.56, "learning_rate": 6.646856128065546e-05, "loss": 0.0065, "step": 308590 }, { "epoch": 1.56, "learning_rate": 6.646099358764145e-05, "loss": 0.0066, "step": 308600 }, { "epoch": 1.56, "learning_rate": 6.645342589462744e-05, "loss": 0.0071, "step": 308610 }, { "epoch": 1.56, "learning_rate": 6.644585820161343e-05, "loss": 0.011, "step": 308620 }, { "epoch": 1.56, "learning_rate": 6.643829050859941e-05, "loss": 0.0062, "step": 308630 }, { "epoch": 1.56, "learning_rate": 6.64307228155854e-05, "loss": 0.0068, "step": 308640 }, { "epoch": 1.56, "learning_rate": 6.64231551225714e-05, "loss": 0.0056, "step": 308650 }, { "epoch": 1.56, "learning_rate": 6.641558742955738e-05, "loss": 0.0078, "step": 308660 }, { "epoch": 1.56, "learning_rate": 6.640801973654338e-05, "loss": 0.006, "step": 308670 }, { "epoch": 1.56, "learning_rate": 6.640045204352937e-05, "loss": 0.0074, "step": 308680 }, { "epoch": 1.56, "learning_rate": 6.639288435051535e-05, "loss": 0.0064, "step": 308690 }, { "epoch": 1.56, "learning_rate": 6.638531665750135e-05, "loss": 0.0081, "step": 308700 }, { "epoch": 1.56, "learning_rate": 6.637774896448733e-05, "loss": 0.0063, "step": 308710 }, { "epoch": 1.56, "learning_rate": 6.637018127147333e-05, "loss": 0.007, "step": 308720 }, { "epoch": 1.56, "learning_rate": 6.636261357845931e-05, "loss": 0.0086, "step": 308730 }, { "epoch": 1.56, "learning_rate": 6.63550458854453e-05, "loss": 0.008, "step": 308740 }, { "epoch": 1.56, "learning_rate": 6.634747819243128e-05, "loss": 0.0072, "step": 308750 }, { "epoch": 1.56, "learning_rate": 6.633991049941728e-05, "loss": 0.0061, "step": 308760 }, { "epoch": 1.56, "learning_rate": 6.633234280640327e-05, "loss": 0.0095, "step": 308770 }, { "epoch": 1.56, "learning_rate": 6.632477511338926e-05, "loss": 0.006, "step": 308780 }, { "epoch": 1.56, "learning_rate": 6.631720742037525e-05, "loss": 0.0078, "step": 308790 }, { "epoch": 1.56, "learning_rate": 6.630963972736123e-05, "loss": 0.0055, "step": 308800 }, { "epoch": 1.56, "learning_rate": 6.630207203434723e-05, "loss": 0.008, "step": 308810 }, { "epoch": 1.56, "learning_rate": 6.629450434133322e-05, "loss": 0.0083, "step": 308820 }, { "epoch": 1.56, "learning_rate": 6.62869366483192e-05, "loss": 0.007, "step": 308830 }, { "epoch": 1.56, "learning_rate": 6.62793689553052e-05, "loss": 0.0086, "step": 308840 }, { "epoch": 1.56, "learning_rate": 6.627180126229119e-05, "loss": 0.0069, "step": 308850 }, { "epoch": 1.56, "learning_rate": 6.626423356927717e-05, "loss": 0.0089, "step": 308860 }, { "epoch": 1.56, "learning_rate": 6.625666587626317e-05, "loss": 0.0047, "step": 308870 }, { "epoch": 1.56, "learning_rate": 6.624909818324916e-05, "loss": 0.0088, "step": 308880 }, { "epoch": 1.56, "learning_rate": 6.624153049023515e-05, "loss": 0.008, "step": 308890 }, { "epoch": 1.56, "learning_rate": 6.623396279722114e-05, "loss": 0.0058, "step": 308900 }, { "epoch": 1.56, "learning_rate": 6.622639510420712e-05, "loss": 0.0088, "step": 308910 }, { "epoch": 1.56, "learning_rate": 6.621882741119312e-05, "loss": 0.0094, "step": 308920 }, { "epoch": 1.56, "learning_rate": 6.621125971817911e-05, "loss": 0.0074, "step": 308930 }, { "epoch": 1.56, "learning_rate": 6.62036920251651e-05, "loss": 0.0065, "step": 308940 }, { "epoch": 1.56, "learning_rate": 6.619612433215109e-05, "loss": 0.0074, "step": 308950 }, { "epoch": 1.56, "learning_rate": 6.618855663913708e-05, "loss": 0.007, "step": 308960 }, { "epoch": 1.56, "learning_rate": 6.618098894612307e-05, "loss": 0.0071, "step": 308970 }, { "epoch": 1.56, "learning_rate": 6.617342125310906e-05, "loss": 0.0077, "step": 308980 }, { "epoch": 1.56, "learning_rate": 6.616585356009504e-05, "loss": 0.0065, "step": 308990 }, { "epoch": 1.56, "learning_rate": 6.615828586708104e-05, "loss": 0.0052, "step": 309000 }, { "epoch": 1.56, "eval_cer": 0.9144654039225352, "eval_loss": 0.005355709232389927, "eval_runtime": 116.4345, "eval_samples_per_second": 17.177, "eval_steps_per_second": 4.294, "step": 309000 }, { "epoch": 1.56, "learning_rate": 6.615071817406703e-05, "loss": 0.0082, "step": 309010 }, { "epoch": 1.56, "learning_rate": 6.614315048105301e-05, "loss": 0.0056, "step": 309020 }, { "epoch": 1.56, "learning_rate": 6.613558278803901e-05, "loss": 0.0066, "step": 309030 }, { "epoch": 1.56, "learning_rate": 6.612801509502499e-05, "loss": 0.0057, "step": 309040 }, { "epoch": 1.56, "learning_rate": 6.612044740201098e-05, "loss": 0.0063, "step": 309050 }, { "epoch": 1.56, "learning_rate": 6.611287970899697e-05, "loss": 0.0065, "step": 309060 }, { "epoch": 1.56, "learning_rate": 6.610531201598296e-05, "loss": 0.0085, "step": 309070 }, { "epoch": 1.56, "learning_rate": 6.609774432296894e-05, "loss": 0.0082, "step": 309080 }, { "epoch": 1.56, "learning_rate": 6.609017662995494e-05, "loss": 0.0081, "step": 309090 }, { "epoch": 1.56, "learning_rate": 6.608260893694093e-05, "loss": 0.0068, "step": 309100 }, { "epoch": 1.56, "learning_rate": 6.607504124392691e-05, "loss": 0.0075, "step": 309110 }, { "epoch": 1.56, "learning_rate": 6.606747355091291e-05, "loss": 0.006, "step": 309120 }, { "epoch": 1.56, "learning_rate": 6.60599058578989e-05, "loss": 0.0046, "step": 309130 }, { "epoch": 1.56, "learning_rate": 6.605233816488489e-05, "loss": 0.0077, "step": 309140 }, { "epoch": 1.56, "learning_rate": 6.604477047187088e-05, "loss": 0.0083, "step": 309150 }, { "epoch": 1.56, "learning_rate": 6.603720277885686e-05, "loss": 0.0071, "step": 309160 }, { "epoch": 1.56, "learning_rate": 6.602963508584286e-05, "loss": 0.0089, "step": 309170 }, { "epoch": 1.56, "learning_rate": 6.602206739282885e-05, "loss": 0.0094, "step": 309180 }, { "epoch": 1.56, "learning_rate": 6.601449969981483e-05, "loss": 0.0074, "step": 309190 }, { "epoch": 1.56, "learning_rate": 6.600693200680083e-05, "loss": 0.0073, "step": 309200 }, { "epoch": 1.56, "learning_rate": 6.599936431378682e-05, "loss": 0.0079, "step": 309210 }, { "epoch": 1.56, "learning_rate": 6.59917966207728e-05, "loss": 0.0078, "step": 309220 }, { "epoch": 1.56, "learning_rate": 6.59842289277588e-05, "loss": 0.0074, "step": 309230 }, { "epoch": 1.56, "learning_rate": 6.597666123474478e-05, "loss": 0.006, "step": 309240 }, { "epoch": 1.56, "learning_rate": 6.596909354173078e-05, "loss": 0.0065, "step": 309250 }, { "epoch": 1.56, "learning_rate": 6.596152584871677e-05, "loss": 0.0091, "step": 309260 }, { "epoch": 1.56, "learning_rate": 6.595395815570275e-05, "loss": 0.0084, "step": 309270 }, { "epoch": 1.56, "learning_rate": 6.594639046268875e-05, "loss": 0.0071, "step": 309280 }, { "epoch": 1.56, "learning_rate": 6.593882276967474e-05, "loss": 0.007, "step": 309290 }, { "epoch": 1.56, "learning_rate": 6.593125507666072e-05, "loss": 0.0074, "step": 309300 }, { "epoch": 1.56, "learning_rate": 6.592368738364672e-05, "loss": 0.0062, "step": 309310 }, { "epoch": 1.56, "learning_rate": 6.59161196906327e-05, "loss": 0.0062, "step": 309320 }, { "epoch": 1.56, "learning_rate": 6.59085519976187e-05, "loss": 0.0055, "step": 309330 }, { "epoch": 1.56, "learning_rate": 6.590098430460469e-05, "loss": 0.0056, "step": 309340 }, { "epoch": 1.56, "learning_rate": 6.589341661159067e-05, "loss": 0.0068, "step": 309350 }, { "epoch": 1.56, "learning_rate": 6.588584891857665e-05, "loss": 0.0082, "step": 309360 }, { "epoch": 1.56, "learning_rate": 6.587828122556265e-05, "loss": 0.0057, "step": 309370 }, { "epoch": 1.56, "learning_rate": 6.587071353254864e-05, "loss": 0.0072, "step": 309380 }, { "epoch": 1.56, "learning_rate": 6.586314583953462e-05, "loss": 0.0054, "step": 309390 }, { "epoch": 1.56, "learning_rate": 6.585557814652062e-05, "loss": 0.0064, "step": 309400 }, { "epoch": 1.56, "learning_rate": 6.584801045350661e-05, "loss": 0.0051, "step": 309410 }, { "epoch": 1.56, "learning_rate": 6.58404427604926e-05, "loss": 0.0063, "step": 309420 }, { "epoch": 1.56, "learning_rate": 6.583287506747859e-05, "loss": 0.0069, "step": 309430 }, { "epoch": 1.56, "learning_rate": 6.582530737446457e-05, "loss": 0.0074, "step": 309440 }, { "epoch": 1.56, "learning_rate": 6.581773968145057e-05, "loss": 0.0085, "step": 309450 }, { "epoch": 1.56, "learning_rate": 6.581017198843656e-05, "loss": 0.0067, "step": 309460 }, { "epoch": 1.56, "learning_rate": 6.580260429542254e-05, "loss": 0.0057, "step": 309470 }, { "epoch": 1.56, "learning_rate": 6.579503660240854e-05, "loss": 0.0059, "step": 309480 }, { "epoch": 1.56, "learning_rate": 6.578746890939453e-05, "loss": 0.0066, "step": 309490 }, { "epoch": 1.56, "learning_rate": 6.577990121638052e-05, "loss": 0.0068, "step": 309500 }, { "epoch": 1.56, "learning_rate": 6.577233352336651e-05, "loss": 0.0071, "step": 309510 }, { "epoch": 1.56, "learning_rate": 6.576476583035249e-05, "loss": 0.0051, "step": 309520 }, { "epoch": 1.56, "learning_rate": 6.575719813733849e-05, "loss": 0.0078, "step": 309530 }, { "epoch": 1.56, "learning_rate": 6.574963044432448e-05, "loss": 0.0099, "step": 309540 }, { "epoch": 1.56, "learning_rate": 6.574206275131046e-05, "loss": 0.0066, "step": 309550 }, { "epoch": 1.56, "learning_rate": 6.573449505829646e-05, "loss": 0.0068, "step": 309560 }, { "epoch": 1.56, "learning_rate": 6.572692736528245e-05, "loss": 0.0096, "step": 309570 }, { "epoch": 1.56, "learning_rate": 6.571935967226843e-05, "loss": 0.0057, "step": 309580 }, { "epoch": 1.56, "learning_rate": 6.571179197925443e-05, "loss": 0.0083, "step": 309590 }, { "epoch": 1.56, "learning_rate": 6.570422428624041e-05, "loss": 0.0078, "step": 309600 }, { "epoch": 1.56, "learning_rate": 6.56966565932264e-05, "loss": 0.0067, "step": 309610 }, { "epoch": 1.56, "learning_rate": 6.56890889002124e-05, "loss": 0.0077, "step": 309620 }, { "epoch": 1.56, "learning_rate": 6.568152120719838e-05, "loss": 0.0077, "step": 309630 }, { "epoch": 1.56, "learning_rate": 6.567395351418438e-05, "loss": 0.0062, "step": 309640 }, { "epoch": 1.56, "learning_rate": 6.566638582117037e-05, "loss": 0.0069, "step": 309650 }, { "epoch": 1.56, "learning_rate": 6.565881812815635e-05, "loss": 0.0068, "step": 309660 }, { "epoch": 1.56, "learning_rate": 6.565125043514234e-05, "loss": 0.0048, "step": 309670 }, { "epoch": 1.56, "learning_rate": 6.564368274212833e-05, "loss": 0.0072, "step": 309680 }, { "epoch": 1.56, "learning_rate": 6.563611504911431e-05, "loss": 0.0064, "step": 309690 }, { "epoch": 1.56, "learning_rate": 6.562854735610031e-05, "loss": 0.0038, "step": 309700 }, { "epoch": 1.56, "learning_rate": 6.56209796630863e-05, "loss": 0.0061, "step": 309710 }, { "epoch": 1.56, "learning_rate": 6.561341197007228e-05, "loss": 0.0047, "step": 309720 }, { "epoch": 1.56, "learning_rate": 6.560584427705828e-05, "loss": 0.0103, "step": 309730 }, { "epoch": 1.56, "learning_rate": 6.559827658404427e-05, "loss": 0.0058, "step": 309740 }, { "epoch": 1.56, "learning_rate": 6.559070889103025e-05, "loss": 0.0065, "step": 309750 }, { "epoch": 1.56, "learning_rate": 6.558314119801625e-05, "loss": 0.0057, "step": 309760 }, { "epoch": 1.56, "learning_rate": 6.557557350500223e-05, "loss": 0.0065, "step": 309770 }, { "epoch": 1.56, "learning_rate": 6.556800581198823e-05, "loss": 0.0057, "step": 309780 }, { "epoch": 1.56, "learning_rate": 6.556043811897422e-05, "loss": 0.0079, "step": 309790 }, { "epoch": 1.56, "learning_rate": 6.55528704259602e-05, "loss": 0.0057, "step": 309800 }, { "epoch": 1.56, "learning_rate": 6.55453027329462e-05, "loss": 0.0073, "step": 309810 }, { "epoch": 1.56, "learning_rate": 6.553773503993219e-05, "loss": 0.0065, "step": 309820 }, { "epoch": 1.56, "learning_rate": 6.553016734691817e-05, "loss": 0.0079, "step": 309830 }, { "epoch": 1.56, "learning_rate": 6.552259965390417e-05, "loss": 0.008, "step": 309840 }, { "epoch": 1.56, "learning_rate": 6.551503196089016e-05, "loss": 0.0057, "step": 309850 }, { "epoch": 1.56, "learning_rate": 6.550746426787615e-05, "loss": 0.008, "step": 309860 }, { "epoch": 1.56, "learning_rate": 6.549989657486214e-05, "loss": 0.0053, "step": 309870 }, { "epoch": 1.56, "learning_rate": 6.549232888184812e-05, "loss": 0.0069, "step": 309880 }, { "epoch": 1.56, "learning_rate": 6.548476118883412e-05, "loss": 0.0066, "step": 309890 }, { "epoch": 1.56, "learning_rate": 6.547719349582011e-05, "loss": 0.0072, "step": 309900 }, { "epoch": 1.56, "learning_rate": 6.54696258028061e-05, "loss": 0.0085, "step": 309910 }, { "epoch": 1.56, "learning_rate": 6.546205810979209e-05, "loss": 0.0072, "step": 309920 }, { "epoch": 1.56, "learning_rate": 6.545449041677808e-05, "loss": 0.0072, "step": 309930 }, { "epoch": 1.56, "learning_rate": 6.544692272376406e-05, "loss": 0.0106, "step": 309940 }, { "epoch": 1.56, "learning_rate": 6.543935503075006e-05, "loss": 0.0073, "step": 309950 }, { "epoch": 1.56, "learning_rate": 6.543178733773604e-05, "loss": 0.008, "step": 309960 }, { "epoch": 1.56, "learning_rate": 6.542421964472204e-05, "loss": 0.0071, "step": 309970 }, { "epoch": 1.56, "learning_rate": 6.541665195170802e-05, "loss": 0.0087, "step": 309980 }, { "epoch": 1.56, "learning_rate": 6.540908425869401e-05, "loss": 0.009, "step": 309990 }, { "epoch": 1.56, "learning_rate": 6.540151656568e-05, "loss": 0.0062, "step": 310000 }, { "epoch": 1.56, "eval_cer": 0.9144556999612812, "eval_loss": 0.005289402790367603, "eval_runtime": 116.4374, "eval_samples_per_second": 17.177, "eval_steps_per_second": 4.294, "step": 310000 }, { "epoch": 1.56, "learning_rate": 6.539394887266599e-05, "loss": 0.0071, "step": 310010 }, { "epoch": 1.56, "learning_rate": 6.538638117965198e-05, "loss": 0.0064, "step": 310020 }, { "epoch": 1.56, "learning_rate": 6.537881348663797e-05, "loss": 0.008, "step": 310030 }, { "epoch": 1.56, "learning_rate": 6.537124579362396e-05, "loss": 0.0061, "step": 310040 }, { "epoch": 1.56, "learning_rate": 6.536367810060994e-05, "loss": 0.0065, "step": 310050 }, { "epoch": 1.56, "learning_rate": 6.535611040759594e-05, "loss": 0.0053, "step": 310060 }, { "epoch": 1.56, "learning_rate": 6.534854271458193e-05, "loss": 0.0089, "step": 310070 }, { "epoch": 1.56, "learning_rate": 6.534097502156791e-05, "loss": 0.0059, "step": 310080 }, { "epoch": 1.56, "learning_rate": 6.533340732855391e-05, "loss": 0.008, "step": 310090 }, { "epoch": 1.56, "learning_rate": 6.53258396355399e-05, "loss": 0.0063, "step": 310100 }, { "epoch": 1.56, "learning_rate": 6.531827194252588e-05, "loss": 0.0075, "step": 310110 }, { "epoch": 1.56, "learning_rate": 6.531070424951188e-05, "loss": 0.0075, "step": 310120 }, { "epoch": 1.56, "learning_rate": 6.530313655649786e-05, "loss": 0.0068, "step": 310130 }, { "epoch": 1.56, "learning_rate": 6.529556886348386e-05, "loss": 0.0083, "step": 310140 }, { "epoch": 1.56, "learning_rate": 6.528800117046985e-05, "loss": 0.006, "step": 310150 }, { "epoch": 1.56, "learning_rate": 6.528043347745583e-05, "loss": 0.0073, "step": 310160 }, { "epoch": 1.56, "learning_rate": 6.527286578444183e-05, "loss": 0.0054, "step": 310170 }, { "epoch": 1.56, "learning_rate": 6.526529809142782e-05, "loss": 0.006, "step": 310180 }, { "epoch": 1.56, "learning_rate": 6.52577303984138e-05, "loss": 0.0056, "step": 310190 }, { "epoch": 1.56, "learning_rate": 6.52501627053998e-05, "loss": 0.0058, "step": 310200 }, { "epoch": 1.57, "learning_rate": 6.524259501238578e-05, "loss": 0.0086, "step": 310210 }, { "epoch": 1.57, "learning_rate": 6.523502731937178e-05, "loss": 0.0056, "step": 310220 }, { "epoch": 1.57, "learning_rate": 6.522745962635777e-05, "loss": 0.0059, "step": 310230 }, { "epoch": 1.57, "learning_rate": 6.521989193334375e-05, "loss": 0.0073, "step": 310240 }, { "epoch": 1.57, "learning_rate": 6.521232424032975e-05, "loss": 0.0052, "step": 310250 }, { "epoch": 1.57, "learning_rate": 6.520475654731574e-05, "loss": 0.0063, "step": 310260 }, { "epoch": 1.57, "learning_rate": 6.519718885430172e-05, "loss": 0.0072, "step": 310270 }, { "epoch": 1.57, "learning_rate": 6.518962116128772e-05, "loss": 0.0068, "step": 310280 }, { "epoch": 1.57, "learning_rate": 6.51820534682737e-05, "loss": 0.0062, "step": 310290 }, { "epoch": 1.57, "learning_rate": 6.51744857752597e-05, "loss": 0.0074, "step": 310300 }, { "epoch": 1.57, "learning_rate": 6.516691808224568e-05, "loss": 0.0062, "step": 310310 }, { "epoch": 1.57, "learning_rate": 6.515935038923167e-05, "loss": 0.0067, "step": 310320 }, { "epoch": 1.57, "learning_rate": 6.515178269621765e-05, "loss": 0.0091, "step": 310330 }, { "epoch": 1.57, "learning_rate": 6.514421500320365e-05, "loss": 0.0099, "step": 310340 }, { "epoch": 1.57, "learning_rate": 6.513664731018964e-05, "loss": 0.0092, "step": 310350 }, { "epoch": 1.57, "learning_rate": 6.512907961717562e-05, "loss": 0.0072, "step": 310360 }, { "epoch": 1.57, "learning_rate": 6.512151192416162e-05, "loss": 0.0095, "step": 310370 }, { "epoch": 1.57, "learning_rate": 6.511394423114761e-05, "loss": 0.0074, "step": 310380 }, { "epoch": 1.57, "learning_rate": 6.51063765381336e-05, "loss": 0.0071, "step": 310390 }, { "epoch": 1.57, "learning_rate": 6.509880884511959e-05, "loss": 0.0075, "step": 310400 }, { "epoch": 1.57, "learning_rate": 6.509124115210557e-05, "loss": 0.0095, "step": 310410 }, { "epoch": 1.57, "learning_rate": 6.508367345909157e-05, "loss": 0.0077, "step": 310420 }, { "epoch": 1.57, "learning_rate": 6.507610576607756e-05, "loss": 0.0069, "step": 310430 }, { "epoch": 1.57, "learning_rate": 6.506853807306354e-05, "loss": 0.0061, "step": 310440 }, { "epoch": 1.57, "learning_rate": 6.506097038004954e-05, "loss": 0.0069, "step": 310450 }, { "epoch": 1.57, "learning_rate": 6.505340268703553e-05, "loss": 0.0079, "step": 310460 }, { "epoch": 1.57, "learning_rate": 6.504583499402152e-05, "loss": 0.005, "step": 310470 }, { "epoch": 1.57, "learning_rate": 6.503826730100751e-05, "loss": 0.0068, "step": 310480 }, { "epoch": 1.57, "learning_rate": 6.503069960799349e-05, "loss": 0.0088, "step": 310490 }, { "epoch": 1.57, "learning_rate": 6.502313191497949e-05, "loss": 0.0069, "step": 310500 }, { "epoch": 1.57, "learning_rate": 6.501556422196548e-05, "loss": 0.0059, "step": 310510 }, { "epoch": 1.57, "learning_rate": 6.500799652895146e-05, "loss": 0.0073, "step": 310520 }, { "epoch": 1.57, "learning_rate": 6.500042883593746e-05, "loss": 0.0067, "step": 310530 }, { "epoch": 1.57, "learning_rate": 6.499286114292345e-05, "loss": 0.0078, "step": 310540 }, { "epoch": 1.57, "learning_rate": 6.498529344990943e-05, "loss": 0.0056, "step": 310550 }, { "epoch": 1.57, "learning_rate": 6.497772575689543e-05, "loss": 0.0057, "step": 310560 }, { "epoch": 1.57, "learning_rate": 6.497015806388141e-05, "loss": 0.0079, "step": 310570 }, { "epoch": 1.57, "learning_rate": 6.49625903708674e-05, "loss": 0.0071, "step": 310580 }, { "epoch": 1.57, "learning_rate": 6.49550226778534e-05, "loss": 0.0073, "step": 310590 }, { "epoch": 1.57, "learning_rate": 6.494745498483938e-05, "loss": 0.0084, "step": 310600 }, { "epoch": 1.57, "learning_rate": 6.493988729182536e-05, "loss": 0.006, "step": 310610 }, { "epoch": 1.57, "learning_rate": 6.493231959881136e-05, "loss": 0.0061, "step": 310620 }, { "epoch": 1.57, "learning_rate": 6.492475190579735e-05, "loss": 0.0083, "step": 310630 }, { "epoch": 1.57, "learning_rate": 6.491718421278334e-05, "loss": 0.0067, "step": 310640 }, { "epoch": 1.57, "learning_rate": 6.490961651976933e-05, "loss": 0.0049, "step": 310650 }, { "epoch": 1.57, "learning_rate": 6.490204882675531e-05, "loss": 0.0057, "step": 310660 }, { "epoch": 1.57, "learning_rate": 6.48944811337413e-05, "loss": 0.0096, "step": 310670 }, { "epoch": 1.57, "learning_rate": 6.48869134407273e-05, "loss": 0.0073, "step": 310680 }, { "epoch": 1.57, "learning_rate": 6.487934574771328e-05, "loss": 0.008, "step": 310690 }, { "epoch": 1.57, "learning_rate": 6.487177805469928e-05, "loss": 0.0058, "step": 310700 }, { "epoch": 1.57, "learning_rate": 6.486421036168527e-05, "loss": 0.0095, "step": 310710 }, { "epoch": 1.57, "learning_rate": 6.485664266867125e-05, "loss": 0.0091, "step": 310720 }, { "epoch": 1.57, "learning_rate": 6.484907497565725e-05, "loss": 0.0083, "step": 310730 }, { "epoch": 1.57, "learning_rate": 6.484150728264323e-05, "loss": 0.0067, "step": 310740 }, { "epoch": 1.57, "learning_rate": 6.483393958962923e-05, "loss": 0.0064, "step": 310750 }, { "epoch": 1.57, "learning_rate": 6.482637189661522e-05, "loss": 0.0069, "step": 310760 }, { "epoch": 1.57, "learning_rate": 6.48188042036012e-05, "loss": 0.007, "step": 310770 }, { "epoch": 1.57, "learning_rate": 6.48112365105872e-05, "loss": 0.0091, "step": 310780 }, { "epoch": 1.57, "learning_rate": 6.480366881757319e-05, "loss": 0.0056, "step": 310790 }, { "epoch": 1.57, "learning_rate": 6.479610112455917e-05, "loss": 0.0063, "step": 310800 }, { "epoch": 1.57, "learning_rate": 6.478853343154517e-05, "loss": 0.0067, "step": 310810 }, { "epoch": 1.57, "learning_rate": 6.478096573853116e-05, "loss": 0.0068, "step": 310820 }, { "epoch": 1.57, "learning_rate": 6.477339804551715e-05, "loss": 0.008, "step": 310830 }, { "epoch": 1.57, "learning_rate": 6.476583035250314e-05, "loss": 0.0079, "step": 310840 }, { "epoch": 1.57, "learning_rate": 6.475826265948912e-05, "loss": 0.0058, "step": 310850 }, { "epoch": 1.57, "learning_rate": 6.475069496647512e-05, "loss": 0.0067, "step": 310860 }, { "epoch": 1.57, "learning_rate": 6.474312727346111e-05, "loss": 0.0081, "step": 310870 }, { "epoch": 1.57, "learning_rate": 6.473555958044709e-05, "loss": 0.0055, "step": 310880 }, { "epoch": 1.57, "learning_rate": 6.472799188743309e-05, "loss": 0.0061, "step": 310890 }, { "epoch": 1.57, "learning_rate": 6.472042419441908e-05, "loss": 0.0062, "step": 310900 }, { "epoch": 1.57, "learning_rate": 6.471285650140506e-05, "loss": 0.0057, "step": 310910 }, { "epoch": 1.57, "learning_rate": 6.470528880839106e-05, "loss": 0.0058, "step": 310920 }, { "epoch": 1.57, "learning_rate": 6.469772111537704e-05, "loss": 0.007, "step": 310930 }, { "epoch": 1.57, "learning_rate": 6.469015342236302e-05, "loss": 0.0061, "step": 310940 }, { "epoch": 1.57, "learning_rate": 6.468258572934902e-05, "loss": 0.0087, "step": 310950 }, { "epoch": 1.57, "learning_rate": 6.467501803633501e-05, "loss": 0.0065, "step": 310960 }, { "epoch": 1.57, "learning_rate": 6.4667450343321e-05, "loss": 0.0058, "step": 310970 }, { "epoch": 1.57, "learning_rate": 6.465988265030699e-05, "loss": 0.0079, "step": 310980 }, { "epoch": 1.57, "learning_rate": 6.465231495729298e-05, "loss": 0.0088, "step": 310990 }, { "epoch": 1.57, "learning_rate": 6.464474726427897e-05, "loss": 0.0083, "step": 311000 }, { "epoch": 1.57, "eval_cer": 0.9144498775845288, "eval_loss": 0.005227969028055668, "eval_runtime": 116.309, "eval_samples_per_second": 17.196, "eval_steps_per_second": 4.299, "step": 311000 }, { "epoch": 1.57, "learning_rate": 6.463717957126496e-05, "loss": 0.0074, "step": 311010 }, { "epoch": 1.57, "learning_rate": 6.462961187825094e-05, "loss": 0.0069, "step": 311020 }, { "epoch": 1.57, "learning_rate": 6.462204418523694e-05, "loss": 0.0093, "step": 311030 }, { "epoch": 1.57, "learning_rate": 6.461447649222293e-05, "loss": 0.007, "step": 311040 }, { "epoch": 1.57, "learning_rate": 6.460690879920891e-05, "loss": 0.0064, "step": 311050 }, { "epoch": 1.57, "learning_rate": 6.459934110619491e-05, "loss": 0.0075, "step": 311060 }, { "epoch": 1.57, "learning_rate": 6.45917734131809e-05, "loss": 0.0049, "step": 311070 }, { "epoch": 1.57, "learning_rate": 6.458420572016688e-05, "loss": 0.0071, "step": 311080 }, { "epoch": 1.57, "learning_rate": 6.457663802715288e-05, "loss": 0.0084, "step": 311090 }, { "epoch": 1.57, "learning_rate": 6.456907033413886e-05, "loss": 0.0062, "step": 311100 }, { "epoch": 1.57, "learning_rate": 6.456150264112486e-05, "loss": 0.0065, "step": 311110 }, { "epoch": 1.57, "learning_rate": 6.455393494811085e-05, "loss": 0.0064, "step": 311120 }, { "epoch": 1.57, "learning_rate": 6.454636725509683e-05, "loss": 0.0056, "step": 311130 }, { "epoch": 1.57, "learning_rate": 6.453879956208283e-05, "loss": 0.0076, "step": 311140 }, { "epoch": 1.57, "learning_rate": 6.453123186906882e-05, "loss": 0.0056, "step": 311150 }, { "epoch": 1.57, "learning_rate": 6.45236641760548e-05, "loss": 0.0082, "step": 311160 }, { "epoch": 1.57, "learning_rate": 6.45160964830408e-05, "loss": 0.0076, "step": 311170 }, { "epoch": 1.57, "learning_rate": 6.450852879002678e-05, "loss": 0.009, "step": 311180 }, { "epoch": 1.57, "learning_rate": 6.450096109701278e-05, "loss": 0.0083, "step": 311190 }, { "epoch": 1.57, "learning_rate": 6.449339340399877e-05, "loss": 0.0094, "step": 311200 }, { "epoch": 1.57, "learning_rate": 6.448582571098475e-05, "loss": 0.0058, "step": 311210 }, { "epoch": 1.57, "learning_rate": 6.447825801797075e-05, "loss": 0.0053, "step": 311220 }, { "epoch": 1.57, "learning_rate": 6.447069032495674e-05, "loss": 0.0088, "step": 311230 }, { "epoch": 1.57, "learning_rate": 6.446312263194272e-05, "loss": 0.0074, "step": 311240 }, { "epoch": 1.57, "learning_rate": 6.44555549389287e-05, "loss": 0.0051, "step": 311250 }, { "epoch": 1.57, "learning_rate": 6.44479872459147e-05, "loss": 0.0056, "step": 311260 }, { "epoch": 1.57, "learning_rate": 6.44404195529007e-05, "loss": 0.0059, "step": 311270 }, { "epoch": 1.57, "learning_rate": 6.443285185988668e-05, "loss": 0.0093, "step": 311280 }, { "epoch": 1.57, "learning_rate": 6.442528416687267e-05, "loss": 0.0091, "step": 311290 }, { "epoch": 1.57, "learning_rate": 6.441771647385865e-05, "loss": 0.0074, "step": 311300 }, { "epoch": 1.57, "learning_rate": 6.441014878084465e-05, "loss": 0.0075, "step": 311310 }, { "epoch": 1.57, "learning_rate": 6.440258108783064e-05, "loss": 0.0086, "step": 311320 }, { "epoch": 1.57, "learning_rate": 6.439501339481662e-05, "loss": 0.0055, "step": 311330 }, { "epoch": 1.57, "learning_rate": 6.438744570180262e-05, "loss": 0.0061, "step": 311340 }, { "epoch": 1.57, "learning_rate": 6.437987800878861e-05, "loss": 0.0097, "step": 311350 }, { "epoch": 1.57, "learning_rate": 6.43723103157746e-05, "loss": 0.0076, "step": 311360 }, { "epoch": 1.57, "learning_rate": 6.436474262276059e-05, "loss": 0.0057, "step": 311370 }, { "epoch": 1.57, "learning_rate": 6.435717492974657e-05, "loss": 0.0064, "step": 311380 }, { "epoch": 1.57, "learning_rate": 6.434960723673257e-05, "loss": 0.0076, "step": 311390 }, { "epoch": 1.57, "learning_rate": 6.434203954371856e-05, "loss": 0.009, "step": 311400 }, { "epoch": 1.57, "learning_rate": 6.433447185070454e-05, "loss": 0.0062, "step": 311410 }, { "epoch": 1.57, "learning_rate": 6.432690415769054e-05, "loss": 0.0073, "step": 311420 }, { "epoch": 1.57, "learning_rate": 6.431933646467653e-05, "loss": 0.0062, "step": 311430 }, { "epoch": 1.57, "learning_rate": 6.431176877166251e-05, "loss": 0.0061, "step": 311440 }, { "epoch": 1.57, "learning_rate": 6.430420107864851e-05, "loss": 0.009, "step": 311450 }, { "epoch": 1.57, "learning_rate": 6.429663338563449e-05, "loss": 0.0048, "step": 311460 }, { "epoch": 1.57, "learning_rate": 6.428906569262049e-05, "loss": 0.006, "step": 311470 }, { "epoch": 1.57, "learning_rate": 6.428149799960648e-05, "loss": 0.0069, "step": 311480 }, { "epoch": 1.57, "learning_rate": 6.427393030659246e-05, "loss": 0.0058, "step": 311490 }, { "epoch": 1.57, "learning_rate": 6.426636261357846e-05, "loss": 0.0084, "step": 311500 }, { "epoch": 1.57, "learning_rate": 6.425879492056445e-05, "loss": 0.0074, "step": 311510 }, { "epoch": 1.57, "learning_rate": 6.425122722755043e-05, "loss": 0.0065, "step": 311520 }, { "epoch": 1.57, "learning_rate": 6.424365953453643e-05, "loss": 0.0047, "step": 311530 }, { "epoch": 1.57, "learning_rate": 6.423609184152241e-05, "loss": 0.0063, "step": 311540 }, { "epoch": 1.57, "learning_rate": 6.42285241485084e-05, "loss": 0.0058, "step": 311550 }, { "epoch": 1.57, "learning_rate": 6.422095645549439e-05, "loss": 0.0083, "step": 311560 }, { "epoch": 1.57, "learning_rate": 6.421338876248038e-05, "loss": 0.0067, "step": 311570 }, { "epoch": 1.57, "learning_rate": 6.420582106946636e-05, "loss": 0.0072, "step": 311580 }, { "epoch": 1.57, "learning_rate": 6.419825337645236e-05, "loss": 0.0071, "step": 311590 }, { "epoch": 1.57, "learning_rate": 6.419068568343835e-05, "loss": 0.0052, "step": 311600 }, { "epoch": 1.57, "learning_rate": 6.418311799042433e-05, "loss": 0.009, "step": 311610 }, { "epoch": 1.57, "learning_rate": 6.417555029741033e-05, "loss": 0.0065, "step": 311620 }, { "epoch": 1.57, "learning_rate": 6.416798260439631e-05, "loss": 0.0084, "step": 311630 }, { "epoch": 1.57, "learning_rate": 6.41604149113823e-05, "loss": 0.006, "step": 311640 }, { "epoch": 1.57, "learning_rate": 6.41528472183683e-05, "loss": 0.0054, "step": 311650 }, { "epoch": 1.57, "learning_rate": 6.414527952535428e-05, "loss": 0.0065, "step": 311660 }, { "epoch": 1.57, "learning_rate": 6.413771183234028e-05, "loss": 0.0051, "step": 311670 }, { "epoch": 1.57, "learning_rate": 6.413014413932627e-05, "loss": 0.0064, "step": 311680 }, { "epoch": 1.57, "learning_rate": 6.412257644631225e-05, "loss": 0.0071, "step": 311690 }, { "epoch": 1.57, "learning_rate": 6.411500875329825e-05, "loss": 0.0074, "step": 311700 }, { "epoch": 1.57, "learning_rate": 6.410744106028423e-05, "loss": 0.0068, "step": 311710 }, { "epoch": 1.57, "learning_rate": 6.409987336727023e-05, "loss": 0.0068, "step": 311720 }, { "epoch": 1.57, "learning_rate": 6.409230567425622e-05, "loss": 0.0096, "step": 311730 }, { "epoch": 1.57, "learning_rate": 6.40847379812422e-05, "loss": 0.0062, "step": 311740 }, { "epoch": 1.57, "learning_rate": 6.40771702882282e-05, "loss": 0.0053, "step": 311750 }, { "epoch": 1.57, "learning_rate": 6.406960259521419e-05, "loss": 0.0085, "step": 311760 }, { "epoch": 1.57, "learning_rate": 6.406203490220017e-05, "loss": 0.0086, "step": 311770 }, { "epoch": 1.57, "learning_rate": 6.405446720918617e-05, "loss": 0.0075, "step": 311780 }, { "epoch": 1.57, "learning_rate": 6.404689951617216e-05, "loss": 0.0074, "step": 311790 }, { "epoch": 1.57, "learning_rate": 6.403933182315814e-05, "loss": 0.0072, "step": 311800 }, { "epoch": 1.57, "learning_rate": 6.403176413014414e-05, "loss": 0.0057, "step": 311810 }, { "epoch": 1.57, "learning_rate": 6.402419643713012e-05, "loss": 0.0071, "step": 311820 }, { "epoch": 1.57, "learning_rate": 6.401662874411612e-05, "loss": 0.0059, "step": 311830 }, { "epoch": 1.57, "learning_rate": 6.400906105110211e-05, "loss": 0.0096, "step": 311840 }, { "epoch": 1.57, "learning_rate": 6.400149335808809e-05, "loss": 0.0076, "step": 311850 }, { "epoch": 1.57, "learning_rate": 6.399392566507409e-05, "loss": 0.0061, "step": 311860 }, { "epoch": 1.57, "learning_rate": 6.398635797206007e-05, "loss": 0.0072, "step": 311870 }, { "epoch": 1.57, "learning_rate": 6.397879027904606e-05, "loss": 0.006, "step": 311880 }, { "epoch": 1.57, "learning_rate": 6.397122258603205e-05, "loss": 0.0079, "step": 311890 }, { "epoch": 1.57, "learning_rate": 6.396365489301804e-05, "loss": 0.0074, "step": 311900 }, { "epoch": 1.57, "learning_rate": 6.395608720000402e-05, "loss": 0.0141, "step": 311910 }, { "epoch": 1.57, "learning_rate": 6.394851950699002e-05, "loss": 0.0067, "step": 311920 }, { "epoch": 1.57, "learning_rate": 6.394095181397601e-05, "loss": 0.0048, "step": 311930 }, { "epoch": 1.57, "learning_rate": 6.3933384120962e-05, "loss": 0.0065, "step": 311940 }, { "epoch": 1.57, "learning_rate": 6.392581642794799e-05, "loss": 0.0063, "step": 311950 }, { "epoch": 1.57, "learning_rate": 6.391824873493398e-05, "loss": 0.009, "step": 311960 }, { "epoch": 1.57, "learning_rate": 6.391068104191996e-05, "loss": 0.0116, "step": 311970 }, { "epoch": 1.57, "learning_rate": 6.390311334890596e-05, "loss": 0.0053, "step": 311980 }, { "epoch": 1.57, "learning_rate": 6.389554565589194e-05, "loss": 0.0093, "step": 311990 }, { "epoch": 1.57, "learning_rate": 6.388797796287794e-05, "loss": 0.0116, "step": 312000 }, { "epoch": 1.57, "eval_cer": 0.914462492734159, "eval_loss": 0.005281941965222359, "eval_runtime": 116.1751, "eval_samples_per_second": 17.215, "eval_steps_per_second": 4.304, "step": 312000 }, { "epoch": 1.57, "learning_rate": 6.388041026986393e-05, "loss": 0.0074, "step": 312010 }, { "epoch": 1.57, "learning_rate": 6.387284257684991e-05, "loss": 0.0085, "step": 312020 }, { "epoch": 1.57, "learning_rate": 6.386527488383591e-05, "loss": 0.0098, "step": 312030 }, { "epoch": 1.57, "learning_rate": 6.38577071908219e-05, "loss": 0.0057, "step": 312040 }, { "epoch": 1.57, "learning_rate": 6.385013949780788e-05, "loss": 0.0077, "step": 312050 }, { "epoch": 1.57, "learning_rate": 6.384257180479388e-05, "loss": 0.0076, "step": 312060 }, { "epoch": 1.57, "learning_rate": 6.383500411177986e-05, "loss": 0.0061, "step": 312070 }, { "epoch": 1.57, "learning_rate": 6.382743641876586e-05, "loss": 0.0083, "step": 312080 }, { "epoch": 1.57, "learning_rate": 6.381986872575185e-05, "loss": 0.0068, "step": 312090 }, { "epoch": 1.57, "learning_rate": 6.381230103273783e-05, "loss": 0.0113, "step": 312100 }, { "epoch": 1.57, "learning_rate": 6.380473333972383e-05, "loss": 0.0067, "step": 312110 }, { "epoch": 1.57, "learning_rate": 6.379716564670982e-05, "loss": 0.0053, "step": 312120 }, { "epoch": 1.57, "learning_rate": 6.37895979536958e-05, "loss": 0.0075, "step": 312130 }, { "epoch": 1.57, "learning_rate": 6.37820302606818e-05, "loss": 0.0063, "step": 312140 }, { "epoch": 1.57, "learning_rate": 6.377446256766778e-05, "loss": 0.0078, "step": 312150 }, { "epoch": 1.57, "learning_rate": 6.376689487465377e-05, "loss": 0.0063, "step": 312160 }, { "epoch": 1.57, "learning_rate": 6.375932718163977e-05, "loss": 0.0066, "step": 312170 }, { "epoch": 1.57, "learning_rate": 6.375175948862575e-05, "loss": 0.0091, "step": 312180 }, { "epoch": 1.58, "learning_rate": 6.374419179561173e-05, "loss": 0.0051, "step": 312190 }, { "epoch": 1.58, "learning_rate": 6.373662410259773e-05, "loss": 0.0053, "step": 312200 }, { "epoch": 1.58, "learning_rate": 6.372905640958372e-05, "loss": 0.0057, "step": 312210 }, { "epoch": 1.58, "learning_rate": 6.37214887165697e-05, "loss": 0.0068, "step": 312220 }, { "epoch": 1.58, "learning_rate": 6.37139210235557e-05, "loss": 0.0069, "step": 312230 }, { "epoch": 1.58, "learning_rate": 6.37063533305417e-05, "loss": 0.0058, "step": 312240 }, { "epoch": 1.58, "learning_rate": 6.369878563752768e-05, "loss": 0.0069, "step": 312250 }, { "epoch": 1.58, "learning_rate": 6.369121794451367e-05, "loss": 0.0083, "step": 312260 }, { "epoch": 1.58, "learning_rate": 6.368365025149965e-05, "loss": 0.0057, "step": 312270 }, { "epoch": 1.58, "learning_rate": 6.367608255848565e-05, "loss": 0.0076, "step": 312280 }, { "epoch": 1.58, "learning_rate": 6.366851486547164e-05, "loss": 0.0061, "step": 312290 }, { "epoch": 1.58, "learning_rate": 6.366094717245762e-05, "loss": 0.0067, "step": 312300 }, { "epoch": 1.58, "learning_rate": 6.365337947944362e-05, "loss": 0.0096, "step": 312310 }, { "epoch": 1.58, "learning_rate": 6.364581178642961e-05, "loss": 0.007, "step": 312320 }, { "epoch": 1.58, "learning_rate": 6.36382440934156e-05, "loss": 0.0074, "step": 312330 }, { "epoch": 1.58, "learning_rate": 6.363067640040159e-05, "loss": 0.0059, "step": 312340 }, { "epoch": 1.58, "learning_rate": 6.362310870738757e-05, "loss": 0.0072, "step": 312350 }, { "epoch": 1.58, "learning_rate": 6.361554101437357e-05, "loss": 0.0058, "step": 312360 }, { "epoch": 1.58, "learning_rate": 6.360797332135956e-05, "loss": 0.0071, "step": 312370 }, { "epoch": 1.58, "learning_rate": 6.360040562834554e-05, "loss": 0.0079, "step": 312380 }, { "epoch": 1.58, "learning_rate": 6.359283793533154e-05, "loss": 0.0066, "step": 312390 }, { "epoch": 1.58, "learning_rate": 6.358527024231753e-05, "loss": 0.0072, "step": 312400 }, { "epoch": 1.58, "learning_rate": 6.357770254930351e-05, "loss": 0.0055, "step": 312410 }, { "epoch": 1.58, "learning_rate": 6.357013485628951e-05, "loss": 0.0116, "step": 312420 }, { "epoch": 1.58, "learning_rate": 6.356256716327549e-05, "loss": 0.0061, "step": 312430 }, { "epoch": 1.58, "learning_rate": 6.355499947026149e-05, "loss": 0.0059, "step": 312440 }, { "epoch": 1.58, "learning_rate": 6.354743177724748e-05, "loss": 0.0065, "step": 312450 }, { "epoch": 1.58, "learning_rate": 6.353986408423346e-05, "loss": 0.0078, "step": 312460 }, { "epoch": 1.58, "learning_rate": 6.353229639121946e-05, "loss": 0.0099, "step": 312470 }, { "epoch": 1.58, "learning_rate": 6.352472869820545e-05, "loss": 0.0075, "step": 312480 }, { "epoch": 1.58, "learning_rate": 6.351716100519143e-05, "loss": 0.0071, "step": 312490 }, { "epoch": 1.58, "learning_rate": 6.350959331217741e-05, "loss": 0.0069, "step": 312500 }, { "epoch": 1.58, "learning_rate": 6.350202561916341e-05, "loss": 0.0078, "step": 312510 }, { "epoch": 1.58, "learning_rate": 6.349445792614939e-05, "loss": 0.0062, "step": 312520 }, { "epoch": 1.58, "learning_rate": 6.348689023313539e-05, "loss": 0.007, "step": 312530 }, { "epoch": 1.58, "learning_rate": 6.347932254012138e-05, "loss": 0.0062, "step": 312540 }, { "epoch": 1.58, "learning_rate": 6.347175484710736e-05, "loss": 0.0061, "step": 312550 }, { "epoch": 1.58, "learning_rate": 6.346418715409336e-05, "loss": 0.0057, "step": 312560 }, { "epoch": 1.58, "learning_rate": 6.345661946107935e-05, "loss": 0.0063, "step": 312570 }, { "epoch": 1.58, "learning_rate": 6.344905176806533e-05, "loss": 0.0075, "step": 312580 }, { "epoch": 1.58, "learning_rate": 6.344148407505133e-05, "loss": 0.0084, "step": 312590 }, { "epoch": 1.58, "learning_rate": 6.343391638203731e-05, "loss": 0.007, "step": 312600 }, { "epoch": 1.58, "learning_rate": 6.34263486890233e-05, "loss": 0.0091, "step": 312610 }, { "epoch": 1.58, "learning_rate": 6.34187809960093e-05, "loss": 0.0091, "step": 312620 }, { "epoch": 1.58, "learning_rate": 6.341121330299528e-05, "loss": 0.0078, "step": 312630 }, { "epoch": 1.58, "learning_rate": 6.340364560998128e-05, "loss": 0.0065, "step": 312640 }, { "epoch": 1.58, "learning_rate": 6.339607791696727e-05, "loss": 0.0074, "step": 312650 }, { "epoch": 1.58, "learning_rate": 6.338851022395325e-05, "loss": 0.0062, "step": 312660 }, { "epoch": 1.58, "learning_rate": 6.338094253093925e-05, "loss": 0.0091, "step": 312670 }, { "epoch": 1.58, "learning_rate": 6.337337483792523e-05, "loss": 0.0055, "step": 312680 }, { "epoch": 1.58, "learning_rate": 6.336580714491122e-05, "loss": 0.0082, "step": 312690 }, { "epoch": 1.58, "learning_rate": 6.335823945189722e-05, "loss": 0.0072, "step": 312700 }, { "epoch": 1.58, "learning_rate": 6.33506717588832e-05, "loss": 0.0069, "step": 312710 }, { "epoch": 1.58, "learning_rate": 6.33431040658692e-05, "loss": 0.0067, "step": 312720 }, { "epoch": 1.58, "learning_rate": 6.333553637285519e-05, "loss": 0.0057, "step": 312730 }, { "epoch": 1.58, "learning_rate": 6.332796867984117e-05, "loss": 0.0067, "step": 312740 }, { "epoch": 1.58, "learning_rate": 6.332040098682717e-05, "loss": 0.0058, "step": 312750 }, { "epoch": 1.58, "learning_rate": 6.331283329381316e-05, "loss": 0.0074, "step": 312760 }, { "epoch": 1.58, "learning_rate": 6.330526560079914e-05, "loss": 0.0092, "step": 312770 }, { "epoch": 1.58, "learning_rate": 6.329769790778514e-05, "loss": 0.0074, "step": 312780 }, { "epoch": 1.58, "learning_rate": 6.329013021477112e-05, "loss": 0.0072, "step": 312790 }, { "epoch": 1.58, "learning_rate": 6.328256252175712e-05, "loss": 0.0074, "step": 312800 }, { "epoch": 1.58, "learning_rate": 6.32749948287431e-05, "loss": 0.0109, "step": 312810 }, { "epoch": 1.58, "learning_rate": 6.326742713572909e-05, "loss": 0.0049, "step": 312820 }, { "epoch": 1.58, "learning_rate": 6.325985944271507e-05, "loss": 0.0059, "step": 312830 }, { "epoch": 1.58, "learning_rate": 6.325229174970107e-05, "loss": 0.0071, "step": 312840 }, { "epoch": 1.58, "learning_rate": 6.324472405668706e-05, "loss": 0.0057, "step": 312850 }, { "epoch": 1.58, "learning_rate": 6.323715636367304e-05, "loss": 0.0076, "step": 312860 }, { "epoch": 1.58, "learning_rate": 6.322958867065904e-05, "loss": 0.0063, "step": 312870 }, { "epoch": 1.58, "learning_rate": 6.322202097764502e-05, "loss": 0.0085, "step": 312880 }, { "epoch": 1.58, "learning_rate": 6.321445328463102e-05, "loss": 0.0087, "step": 312890 }, { "epoch": 1.58, "learning_rate": 6.320688559161701e-05, "loss": 0.0072, "step": 312900 }, { "epoch": 1.58, "learning_rate": 6.319931789860299e-05, "loss": 0.0064, "step": 312910 }, { "epoch": 1.58, "learning_rate": 6.319175020558899e-05, "loss": 0.007, "step": 312920 }, { "epoch": 1.58, "learning_rate": 6.318418251257498e-05, "loss": 0.0057, "step": 312930 }, { "epoch": 1.58, "learning_rate": 6.317661481956096e-05, "loss": 0.0083, "step": 312940 }, { "epoch": 1.58, "learning_rate": 6.316904712654696e-05, "loss": 0.0072, "step": 312950 }, { "epoch": 1.58, "learning_rate": 6.316147943353294e-05, "loss": 0.0083, "step": 312960 }, { "epoch": 1.58, "learning_rate": 6.315391174051894e-05, "loss": 0.0072, "step": 312970 }, { "epoch": 1.58, "learning_rate": 6.314634404750493e-05, "loss": 0.007, "step": 312980 }, { "epoch": 1.58, "learning_rate": 6.313877635449091e-05, "loss": 0.0075, "step": 312990 }, { "epoch": 1.58, "learning_rate": 6.313120866147691e-05, "loss": 0.0064, "step": 313000 }, { "epoch": 1.58, "eval_cer": 0.914438232831024, "eval_loss": 0.005189271178096533, "eval_runtime": 116.2305, "eval_samples_per_second": 17.207, "eval_steps_per_second": 4.302, "step": 313000 }, { "epoch": 1.58, "learning_rate": 6.31236409684629e-05, "loss": 0.0081, "step": 313010 }, { "epoch": 1.58, "learning_rate": 6.311607327544888e-05, "loss": 0.008, "step": 313020 }, { "epoch": 1.58, "learning_rate": 6.310850558243488e-05, "loss": 0.0079, "step": 313030 }, { "epoch": 1.58, "learning_rate": 6.310093788942086e-05, "loss": 0.0079, "step": 313040 }, { "epoch": 1.58, "learning_rate": 6.309337019640685e-05, "loss": 0.006, "step": 313050 }, { "epoch": 1.58, "learning_rate": 6.308580250339285e-05, "loss": 0.0071, "step": 313060 }, { "epoch": 1.58, "learning_rate": 6.307823481037883e-05, "loss": 0.0065, "step": 313070 }, { "epoch": 1.58, "learning_rate": 6.307066711736483e-05, "loss": 0.0082, "step": 313080 }, { "epoch": 1.58, "learning_rate": 6.306309942435082e-05, "loss": 0.0056, "step": 313090 }, { "epoch": 1.58, "learning_rate": 6.30555317313368e-05, "loss": 0.0062, "step": 313100 }, { "epoch": 1.58, "learning_rate": 6.30479640383228e-05, "loss": 0.0075, "step": 313110 }, { "epoch": 1.58, "learning_rate": 6.304039634530878e-05, "loss": 0.0068, "step": 313120 }, { "epoch": 1.58, "learning_rate": 6.303282865229476e-05, "loss": 0.0097, "step": 313130 }, { "epoch": 1.58, "learning_rate": 6.302526095928076e-05, "loss": 0.0082, "step": 313140 }, { "epoch": 1.58, "learning_rate": 6.301769326626675e-05, "loss": 0.0066, "step": 313150 }, { "epoch": 1.58, "learning_rate": 6.301012557325273e-05, "loss": 0.0063, "step": 313160 }, { "epoch": 1.58, "learning_rate": 6.300255788023873e-05, "loss": 0.0052, "step": 313170 }, { "epoch": 1.58, "learning_rate": 6.299499018722472e-05, "loss": 0.0084, "step": 313180 }, { "epoch": 1.58, "learning_rate": 6.29874224942107e-05, "loss": 0.0069, "step": 313190 }, { "epoch": 1.58, "learning_rate": 6.29798548011967e-05, "loss": 0.006, "step": 313200 }, { "epoch": 1.58, "learning_rate": 6.29722871081827e-05, "loss": 0.0059, "step": 313210 }, { "epoch": 1.58, "learning_rate": 6.296471941516867e-05, "loss": 0.0078, "step": 313220 }, { "epoch": 1.58, "learning_rate": 6.295715172215467e-05, "loss": 0.0079, "step": 313230 }, { "epoch": 1.58, "learning_rate": 6.294958402914065e-05, "loss": 0.0084, "step": 313240 }, { "epoch": 1.58, "learning_rate": 6.294201633612665e-05, "loss": 0.005, "step": 313250 }, { "epoch": 1.58, "learning_rate": 6.293444864311264e-05, "loss": 0.0064, "step": 313260 }, { "epoch": 1.58, "learning_rate": 6.292688095009862e-05, "loss": 0.0063, "step": 313270 }, { "epoch": 1.58, "learning_rate": 6.291931325708462e-05, "loss": 0.0055, "step": 313280 }, { "epoch": 1.58, "learning_rate": 6.291174556407061e-05, "loss": 0.0051, "step": 313290 }, { "epoch": 1.58, "learning_rate": 6.29041778710566e-05, "loss": 0.0096, "step": 313300 }, { "epoch": 1.58, "learning_rate": 6.289661017804259e-05, "loss": 0.0071, "step": 313310 }, { "epoch": 1.58, "learning_rate": 6.288904248502857e-05, "loss": 0.007, "step": 313320 }, { "epoch": 1.58, "learning_rate": 6.288147479201457e-05, "loss": 0.006, "step": 313330 }, { "epoch": 1.58, "learning_rate": 6.287390709900056e-05, "loss": 0.0093, "step": 313340 }, { "epoch": 1.58, "learning_rate": 6.286633940598654e-05, "loss": 0.0055, "step": 313350 }, { "epoch": 1.58, "learning_rate": 6.285877171297254e-05, "loss": 0.0064, "step": 313360 }, { "epoch": 1.58, "learning_rate": 6.285120401995853e-05, "loss": 0.0061, "step": 313370 }, { "epoch": 1.58, "learning_rate": 6.284363632694451e-05, "loss": 0.0057, "step": 313380 }, { "epoch": 1.58, "learning_rate": 6.283606863393051e-05, "loss": 0.0065, "step": 313390 }, { "epoch": 1.58, "learning_rate": 6.282850094091649e-05, "loss": 0.0065, "step": 313400 }, { "epoch": 1.58, "learning_rate": 6.282093324790249e-05, "loss": 0.006, "step": 313410 }, { "epoch": 1.58, "learning_rate": 6.281336555488848e-05, "loss": 0.0071, "step": 313420 }, { "epoch": 1.58, "learning_rate": 6.280579786187446e-05, "loss": 0.0079, "step": 313430 }, { "epoch": 1.58, "learning_rate": 6.279823016886044e-05, "loss": 0.0054, "step": 313440 }, { "epoch": 1.58, "learning_rate": 6.279066247584644e-05, "loss": 0.0086, "step": 313450 }, { "epoch": 1.58, "learning_rate": 6.278309478283243e-05, "loss": 0.0073, "step": 313460 }, { "epoch": 1.58, "learning_rate": 6.277552708981841e-05, "loss": 0.0057, "step": 313470 }, { "epoch": 1.58, "learning_rate": 6.276795939680441e-05, "loss": 0.0092, "step": 313480 }, { "epoch": 1.58, "learning_rate": 6.276039170379039e-05, "loss": 0.0064, "step": 313490 }, { "epoch": 1.58, "learning_rate": 6.275282401077639e-05, "loss": 0.0063, "step": 313500 }, { "epoch": 1.58, "learning_rate": 6.274525631776238e-05, "loss": 0.0059, "step": 313510 }, { "epoch": 1.58, "learning_rate": 6.273768862474836e-05, "loss": 0.0059, "step": 313520 }, { "epoch": 1.58, "learning_rate": 6.273012093173436e-05, "loss": 0.01, "step": 313530 }, { "epoch": 1.58, "learning_rate": 6.272255323872035e-05, "loss": 0.0077, "step": 313540 }, { "epoch": 1.58, "learning_rate": 6.271498554570633e-05, "loss": 0.0061, "step": 313550 }, { "epoch": 1.58, "learning_rate": 6.270741785269233e-05, "loss": 0.0055, "step": 313560 }, { "epoch": 1.58, "learning_rate": 6.269985015967831e-05, "loss": 0.0097, "step": 313570 }, { "epoch": 1.58, "learning_rate": 6.26922824666643e-05, "loss": 0.0067, "step": 313580 }, { "epoch": 1.58, "learning_rate": 6.26847147736503e-05, "loss": 0.0078, "step": 313590 }, { "epoch": 1.58, "learning_rate": 6.267714708063628e-05, "loss": 0.0096, "step": 313600 }, { "epoch": 1.58, "learning_rate": 6.266957938762228e-05, "loss": 0.0053, "step": 313610 }, { "epoch": 1.58, "learning_rate": 6.266201169460827e-05, "loss": 0.0077, "step": 313620 }, { "epoch": 1.58, "learning_rate": 6.265444400159425e-05, "loss": 0.0075, "step": 313630 }, { "epoch": 1.58, "learning_rate": 6.264687630858025e-05, "loss": 0.0069, "step": 313640 }, { "epoch": 1.58, "learning_rate": 6.263930861556623e-05, "loss": 0.0069, "step": 313650 }, { "epoch": 1.58, "learning_rate": 6.263174092255222e-05, "loss": 0.0054, "step": 313660 }, { "epoch": 1.58, "learning_rate": 6.262417322953822e-05, "loss": 0.0074, "step": 313670 }, { "epoch": 1.58, "learning_rate": 6.26166055365242e-05, "loss": 0.005, "step": 313680 }, { "epoch": 1.58, "learning_rate": 6.26090378435102e-05, "loss": 0.0053, "step": 313690 }, { "epoch": 1.58, "learning_rate": 6.260147015049619e-05, "loss": 0.0051, "step": 313700 }, { "epoch": 1.58, "learning_rate": 6.259390245748217e-05, "loss": 0.0068, "step": 313710 }, { "epoch": 1.58, "learning_rate": 6.258633476446817e-05, "loss": 0.0058, "step": 313720 }, { "epoch": 1.58, "learning_rate": 6.257876707145416e-05, "loss": 0.0069, "step": 313730 }, { "epoch": 1.58, "learning_rate": 6.257119937844014e-05, "loss": 0.0061, "step": 313740 }, { "epoch": 1.58, "learning_rate": 6.256363168542614e-05, "loss": 0.0087, "step": 313750 }, { "epoch": 1.58, "learning_rate": 6.255606399241212e-05, "loss": 0.0069, "step": 313760 }, { "epoch": 1.58, "learning_rate": 6.25484962993981e-05, "loss": 0.0055, "step": 313770 }, { "epoch": 1.58, "learning_rate": 6.25409286063841e-05, "loss": 0.0074, "step": 313780 }, { "epoch": 1.58, "learning_rate": 6.253336091337009e-05, "loss": 0.008, "step": 313790 }, { "epoch": 1.58, "learning_rate": 6.252579322035607e-05, "loss": 0.0065, "step": 313800 }, { "epoch": 1.58, "learning_rate": 6.251822552734207e-05, "loss": 0.0059, "step": 313810 }, { "epoch": 1.58, "learning_rate": 6.251065783432806e-05, "loss": 0.0073, "step": 313820 }, { "epoch": 1.58, "learning_rate": 6.250309014131404e-05, "loss": 0.0069, "step": 313830 }, { "epoch": 1.58, "learning_rate": 6.249552244830004e-05, "loss": 0.0077, "step": 313840 }, { "epoch": 1.58, "learning_rate": 6.248795475528602e-05, "loss": 0.0075, "step": 313850 }, { "epoch": 1.58, "learning_rate": 6.248038706227202e-05, "loss": 0.0089, "step": 313860 }, { "epoch": 1.58, "learning_rate": 6.247281936925801e-05, "loss": 0.006, "step": 313870 }, { "epoch": 1.58, "learning_rate": 6.246525167624399e-05, "loss": 0.0064, "step": 313880 }, { "epoch": 1.58, "learning_rate": 6.245768398322999e-05, "loss": 0.0064, "step": 313890 }, { "epoch": 1.58, "learning_rate": 6.245011629021598e-05, "loss": 0.0062, "step": 313900 }, { "epoch": 1.58, "learning_rate": 6.244254859720196e-05, "loss": 0.0072, "step": 313910 }, { "epoch": 1.58, "learning_rate": 6.243498090418796e-05, "loss": 0.0105, "step": 313920 }, { "epoch": 1.58, "learning_rate": 6.242741321117394e-05, "loss": 0.0067, "step": 313930 }, { "epoch": 1.58, "learning_rate": 6.241984551815994e-05, "loss": 0.007, "step": 313940 }, { "epoch": 1.58, "learning_rate": 6.241227782514593e-05, "loss": 0.0062, "step": 313950 }, { "epoch": 1.58, "learning_rate": 6.240471013213191e-05, "loss": 0.008, "step": 313960 }, { "epoch": 1.58, "learning_rate": 6.23971424391179e-05, "loss": 0.0068, "step": 313970 }, { "epoch": 1.58, "learning_rate": 6.23895747461039e-05, "loss": 0.0085, "step": 313980 }, { "epoch": 1.58, "learning_rate": 6.238200705308988e-05, "loss": 0.0067, "step": 313990 }, { "epoch": 1.58, "learning_rate": 6.237443936007588e-05, "loss": 0.0059, "step": 314000 }, { "epoch": 1.58, "eval_cer": 0.9144314400581461, "eval_loss": 0.005062195006757975, "eval_runtime": 116.4946, "eval_samples_per_second": 17.168, "eval_steps_per_second": 4.292, "step": 314000 }, { "epoch": 1.58, "learning_rate": 6.236687166706186e-05, "loss": 0.0077, "step": 314010 }, { "epoch": 1.58, "learning_rate": 6.235930397404785e-05, "loss": 0.0077, "step": 314020 }, { "epoch": 1.58, "learning_rate": 6.235173628103385e-05, "loss": 0.0076, "step": 314030 }, { "epoch": 1.58, "learning_rate": 6.234416858801983e-05, "loss": 0.009, "step": 314040 }, { "epoch": 1.58, "learning_rate": 6.233660089500583e-05, "loss": 0.0073, "step": 314050 }, { "epoch": 1.58, "learning_rate": 6.232903320199182e-05, "loss": 0.0057, "step": 314060 }, { "epoch": 1.58, "learning_rate": 6.23214655089778e-05, "loss": 0.008, "step": 314070 }, { "epoch": 1.58, "learning_rate": 6.231389781596378e-05, "loss": 0.0063, "step": 314080 }, { "epoch": 1.58, "learning_rate": 6.230633012294978e-05, "loss": 0.0072, "step": 314090 }, { "epoch": 1.58, "learning_rate": 6.229876242993576e-05, "loss": 0.0063, "step": 314100 }, { "epoch": 1.58, "learning_rate": 6.229119473692176e-05, "loss": 0.0078, "step": 314110 }, { "epoch": 1.58, "learning_rate": 6.228362704390775e-05, "loss": 0.0059, "step": 314120 }, { "epoch": 1.58, "learning_rate": 6.227605935089373e-05, "loss": 0.0054, "step": 314130 }, { "epoch": 1.58, "learning_rate": 6.226849165787973e-05, "loss": 0.0108, "step": 314140 }, { "epoch": 1.58, "learning_rate": 6.226092396486572e-05, "loss": 0.0088, "step": 314150 }, { "epoch": 1.58, "learning_rate": 6.22533562718517e-05, "loss": 0.0065, "step": 314160 }, { "epoch": 1.59, "learning_rate": 6.22457885788377e-05, "loss": 0.0061, "step": 314170 }, { "epoch": 1.59, "learning_rate": 6.223822088582369e-05, "loss": 0.0057, "step": 314180 }, { "epoch": 1.59, "learning_rate": 6.223065319280967e-05, "loss": 0.0055, "step": 314190 }, { "epoch": 1.59, "learning_rate": 6.222308549979567e-05, "loss": 0.0079, "step": 314200 }, { "epoch": 1.59, "learning_rate": 6.221551780678165e-05, "loss": 0.0067, "step": 314210 }, { "epoch": 1.59, "learning_rate": 6.220795011376765e-05, "loss": 0.0054, "step": 314220 }, { "epoch": 1.59, "learning_rate": 6.220038242075364e-05, "loss": 0.008, "step": 314230 }, { "epoch": 1.59, "learning_rate": 6.219281472773962e-05, "loss": 0.0059, "step": 314240 }, { "epoch": 1.59, "learning_rate": 6.218524703472562e-05, "loss": 0.0077, "step": 314250 }, { "epoch": 1.59, "learning_rate": 6.217767934171161e-05, "loss": 0.0044, "step": 314260 }, { "epoch": 1.59, "learning_rate": 6.21701116486976e-05, "loss": 0.006, "step": 314270 }, { "epoch": 1.59, "learning_rate": 6.216254395568359e-05, "loss": 0.0055, "step": 314280 }, { "epoch": 1.59, "learning_rate": 6.215497626266957e-05, "loss": 0.0078, "step": 314290 }, { "epoch": 1.59, "learning_rate": 6.214740856965557e-05, "loss": 0.0053, "step": 314300 }, { "epoch": 1.59, "learning_rate": 6.213984087664156e-05, "loss": 0.0059, "step": 314310 }, { "epoch": 1.59, "learning_rate": 6.213227318362754e-05, "loss": 0.0065, "step": 314320 }, { "epoch": 1.59, "learning_rate": 6.212470549061354e-05, "loss": 0.0067, "step": 314330 }, { "epoch": 1.59, "learning_rate": 6.211713779759953e-05, "loss": 0.0048, "step": 314340 }, { "epoch": 1.59, "learning_rate": 6.210957010458551e-05, "loss": 0.0059, "step": 314350 }, { "epoch": 1.59, "learning_rate": 6.210200241157151e-05, "loss": 0.0077, "step": 314360 }, { "epoch": 1.59, "learning_rate": 6.209443471855749e-05, "loss": 0.0072, "step": 314370 }, { "epoch": 1.59, "learning_rate": 6.208686702554347e-05, "loss": 0.0073, "step": 314380 }, { "epoch": 1.59, "learning_rate": 6.207929933252947e-05, "loss": 0.008, "step": 314390 }, { "epoch": 1.59, "learning_rate": 6.207173163951546e-05, "loss": 0.009, "step": 314400 }, { "epoch": 1.59, "learning_rate": 6.206416394650144e-05, "loss": 0.0056, "step": 314410 }, { "epoch": 1.59, "learning_rate": 6.205659625348744e-05, "loss": 0.0077, "step": 314420 }, { "epoch": 1.59, "learning_rate": 6.204902856047343e-05, "loss": 0.009, "step": 314430 }, { "epoch": 1.59, "learning_rate": 6.204146086745941e-05, "loss": 0.0066, "step": 314440 }, { "epoch": 1.59, "learning_rate": 6.203389317444541e-05, "loss": 0.0058, "step": 314450 }, { "epoch": 1.59, "learning_rate": 6.202632548143139e-05, "loss": 0.0071, "step": 314460 }, { "epoch": 1.59, "learning_rate": 6.201875778841739e-05, "loss": 0.0058, "step": 314470 }, { "epoch": 1.59, "learning_rate": 6.201119009540338e-05, "loss": 0.0066, "step": 314480 }, { "epoch": 1.59, "learning_rate": 6.200362240238936e-05, "loss": 0.0054, "step": 314490 }, { "epoch": 1.59, "learning_rate": 6.199605470937536e-05, "loss": 0.0047, "step": 314500 }, { "epoch": 1.59, "learning_rate": 6.198848701636135e-05, "loss": 0.0054, "step": 314510 }, { "epoch": 1.59, "learning_rate": 6.198091932334733e-05, "loss": 0.0074, "step": 314520 }, { "epoch": 1.59, "learning_rate": 6.197335163033333e-05, "loss": 0.0062, "step": 314530 }, { "epoch": 1.59, "learning_rate": 6.196578393731931e-05, "loss": 0.0069, "step": 314540 }, { "epoch": 1.59, "learning_rate": 6.19582162443053e-05, "loss": 0.0075, "step": 314550 }, { "epoch": 1.59, "learning_rate": 6.19506485512913e-05, "loss": 0.0078, "step": 314560 }, { "epoch": 1.59, "learning_rate": 6.194308085827728e-05, "loss": 0.0059, "step": 314570 }, { "epoch": 1.59, "learning_rate": 6.193551316526328e-05, "loss": 0.009, "step": 314580 }, { "epoch": 1.59, "learning_rate": 6.192794547224927e-05, "loss": 0.005, "step": 314590 }, { "epoch": 1.59, "learning_rate": 6.192037777923525e-05, "loss": 0.0057, "step": 314600 }, { "epoch": 1.59, "learning_rate": 6.191281008622125e-05, "loss": 0.0071, "step": 314610 }, { "epoch": 1.59, "learning_rate": 6.190524239320723e-05, "loss": 0.0094, "step": 314620 }, { "epoch": 1.59, "learning_rate": 6.189767470019322e-05, "loss": 0.0065, "step": 314630 }, { "epoch": 1.59, "learning_rate": 6.189010700717922e-05, "loss": 0.0076, "step": 314640 }, { "epoch": 1.59, "learning_rate": 6.18825393141652e-05, "loss": 0.0073, "step": 314650 }, { "epoch": 1.59, "learning_rate": 6.18749716211512e-05, "loss": 0.008, "step": 314660 }, { "epoch": 1.59, "learning_rate": 6.186740392813719e-05, "loss": 0.0083, "step": 314670 }, { "epoch": 1.59, "learning_rate": 6.185983623512317e-05, "loss": 0.0071, "step": 314680 }, { "epoch": 1.59, "learning_rate": 6.185226854210917e-05, "loss": 0.0076, "step": 314690 }, { "epoch": 1.59, "learning_rate": 6.184470084909515e-05, "loss": 0.0044, "step": 314700 }, { "epoch": 1.59, "learning_rate": 6.183713315608114e-05, "loss": 0.0069, "step": 314710 }, { "epoch": 1.59, "learning_rate": 6.182956546306712e-05, "loss": 0.0063, "step": 314720 }, { "epoch": 1.59, "learning_rate": 6.182199777005312e-05, "loss": 0.0069, "step": 314730 }, { "epoch": 1.59, "learning_rate": 6.18144300770391e-05, "loss": 0.0115, "step": 314740 }, { "epoch": 1.59, "learning_rate": 6.18068623840251e-05, "loss": 0.006, "step": 314750 }, { "epoch": 1.59, "learning_rate": 6.179929469101109e-05, "loss": 0.0079, "step": 314760 }, { "epoch": 1.59, "learning_rate": 6.179172699799707e-05, "loss": 0.0067, "step": 314770 }, { "epoch": 1.59, "learning_rate": 6.178415930498307e-05, "loss": 0.007, "step": 314780 }, { "epoch": 1.59, "learning_rate": 6.177659161196906e-05, "loss": 0.0061, "step": 314790 }, { "epoch": 1.59, "learning_rate": 6.176902391895504e-05, "loss": 0.0072, "step": 314800 }, { "epoch": 1.59, "learning_rate": 6.176145622594104e-05, "loss": 0.0067, "step": 314810 }, { "epoch": 1.59, "learning_rate": 6.175388853292702e-05, "loss": 0.0058, "step": 314820 }, { "epoch": 1.59, "learning_rate": 6.174632083991302e-05, "loss": 0.007, "step": 314830 }, { "epoch": 1.59, "learning_rate": 6.173875314689901e-05, "loss": 0.007, "step": 314840 }, { "epoch": 1.59, "learning_rate": 6.173118545388499e-05, "loss": 0.0058, "step": 314850 }, { "epoch": 1.59, "learning_rate": 6.172361776087099e-05, "loss": 0.0064, "step": 314860 }, { "epoch": 1.59, "learning_rate": 6.171605006785698e-05, "loss": 0.0074, "step": 314870 }, { "epoch": 1.59, "learning_rate": 6.170848237484296e-05, "loss": 0.0107, "step": 314880 }, { "epoch": 1.59, "learning_rate": 6.170091468182896e-05, "loss": 0.0055, "step": 314890 }, { "epoch": 1.59, "learning_rate": 6.169334698881494e-05, "loss": 0.0083, "step": 314900 }, { "epoch": 1.59, "learning_rate": 6.168577929580093e-05, "loss": 0.0074, "step": 314910 }, { "epoch": 1.59, "learning_rate": 6.167821160278693e-05, "loss": 0.0082, "step": 314920 }, { "epoch": 1.59, "learning_rate": 6.167064390977291e-05, "loss": 0.0071, "step": 314930 }, { "epoch": 1.59, "learning_rate": 6.16630762167589e-05, "loss": 0.0073, "step": 314940 }, { "epoch": 1.59, "learning_rate": 6.16555085237449e-05, "loss": 0.007, "step": 314950 }, { "epoch": 1.59, "learning_rate": 6.164794083073088e-05, "loss": 0.0045, "step": 314960 }, { "epoch": 1.59, "learning_rate": 6.164037313771688e-05, "loss": 0.0061, "step": 314970 }, { "epoch": 1.59, "learning_rate": 6.163280544470286e-05, "loss": 0.0056, "step": 314980 }, { "epoch": 1.59, "learning_rate": 6.162523775168885e-05, "loss": 0.0069, "step": 314990 }, { "epoch": 1.59, "learning_rate": 6.161767005867485e-05, "loss": 0.0065, "step": 315000 }, { "epoch": 1.59, "eval_cer": 0.9144207657007667, "eval_loss": 0.005126504693180323, "eval_runtime": 116.2813, "eval_samples_per_second": 17.2, "eval_steps_per_second": 4.3, "step": 315000 }, { "epoch": 1.59, "learning_rate": 6.161010236566083e-05, "loss": 0.0066, "step": 315010 }, { "epoch": 1.59, "learning_rate": 6.160253467264681e-05, "loss": 0.0056, "step": 315020 }, { "epoch": 1.59, "learning_rate": 6.159496697963281e-05, "loss": 0.005, "step": 315030 }, { "epoch": 1.59, "learning_rate": 6.15873992866188e-05, "loss": 0.0087, "step": 315040 }, { "epoch": 1.59, "learning_rate": 6.157983159360478e-05, "loss": 0.0079, "step": 315050 }, { "epoch": 1.59, "learning_rate": 6.157226390059078e-05, "loss": 0.0066, "step": 315060 }, { "epoch": 1.59, "learning_rate": 6.156469620757676e-05, "loss": 0.0067, "step": 315070 }, { "epoch": 1.59, "learning_rate": 6.155712851456275e-05, "loss": 0.0095, "step": 315080 }, { "epoch": 1.59, "learning_rate": 6.154956082154875e-05, "loss": 0.0076, "step": 315090 }, { "epoch": 1.59, "learning_rate": 6.154199312853473e-05, "loss": 0.0104, "step": 315100 }, { "epoch": 1.59, "learning_rate": 6.153442543552073e-05, "loss": 0.0092, "step": 315110 }, { "epoch": 1.59, "learning_rate": 6.152685774250672e-05, "loss": 0.0069, "step": 315120 }, { "epoch": 1.59, "learning_rate": 6.15192900494927e-05, "loss": 0.0068, "step": 315130 }, { "epoch": 1.59, "learning_rate": 6.15117223564787e-05, "loss": 0.0065, "step": 315140 }, { "epoch": 1.59, "learning_rate": 6.150415466346469e-05, "loss": 0.007, "step": 315150 }, { "epoch": 1.59, "learning_rate": 6.149658697045067e-05, "loss": 0.0081, "step": 315160 }, { "epoch": 1.59, "learning_rate": 6.148901927743667e-05, "loss": 0.0069, "step": 315170 }, { "epoch": 1.59, "learning_rate": 6.148145158442265e-05, "loss": 0.0062, "step": 315180 }, { "epoch": 1.59, "learning_rate": 6.147388389140865e-05, "loss": 0.0071, "step": 315190 }, { "epoch": 1.59, "learning_rate": 6.146631619839464e-05, "loss": 0.0067, "step": 315200 }, { "epoch": 1.59, "learning_rate": 6.145874850538062e-05, "loss": 0.0073, "step": 315210 }, { "epoch": 1.59, "learning_rate": 6.145118081236662e-05, "loss": 0.0079, "step": 315220 }, { "epoch": 1.59, "learning_rate": 6.144361311935261e-05, "loss": 0.0061, "step": 315230 }, { "epoch": 1.59, "learning_rate": 6.14360454263386e-05, "loss": 0.0062, "step": 315240 }, { "epoch": 1.59, "learning_rate": 6.142847773332459e-05, "loss": 0.0074, "step": 315250 }, { "epoch": 1.59, "learning_rate": 6.142091004031057e-05, "loss": 0.0063, "step": 315260 }, { "epoch": 1.59, "learning_rate": 6.141334234729656e-05, "loss": 0.0068, "step": 315270 }, { "epoch": 1.59, "learning_rate": 6.140577465428256e-05, "loss": 0.0056, "step": 315280 }, { "epoch": 1.59, "learning_rate": 6.139820696126854e-05, "loss": 0.006, "step": 315290 }, { "epoch": 1.59, "learning_rate": 6.139063926825454e-05, "loss": 0.0071, "step": 315300 }, { "epoch": 1.59, "learning_rate": 6.138307157524053e-05, "loss": 0.0074, "step": 315310 }, { "epoch": 1.59, "learning_rate": 6.137550388222651e-05, "loss": 0.0052, "step": 315320 }, { "epoch": 1.59, "learning_rate": 6.13679361892125e-05, "loss": 0.0058, "step": 315330 }, { "epoch": 1.59, "learning_rate": 6.136036849619849e-05, "loss": 0.0059, "step": 315340 }, { "epoch": 1.59, "learning_rate": 6.135280080318447e-05, "loss": 0.0061, "step": 315350 }, { "epoch": 1.59, "learning_rate": 6.134523311017047e-05, "loss": 0.0066, "step": 315360 }, { "epoch": 1.59, "learning_rate": 6.133766541715646e-05, "loss": 0.006, "step": 315370 }, { "epoch": 1.59, "learning_rate": 6.133009772414244e-05, "loss": 0.0069, "step": 315380 }, { "epoch": 1.59, "learning_rate": 6.132253003112844e-05, "loss": 0.0068, "step": 315390 }, { "epoch": 1.59, "learning_rate": 6.131496233811443e-05, "loss": 0.0075, "step": 315400 }, { "epoch": 1.59, "learning_rate": 6.130739464510041e-05, "loss": 0.0056, "step": 315410 }, { "epoch": 1.59, "learning_rate": 6.129982695208641e-05, "loss": 0.0073, "step": 315420 }, { "epoch": 1.59, "learning_rate": 6.129225925907239e-05, "loss": 0.0071, "step": 315430 }, { "epoch": 1.59, "learning_rate": 6.128469156605838e-05, "loss": 0.0067, "step": 315440 }, { "epoch": 1.59, "learning_rate": 6.127712387304438e-05, "loss": 0.0065, "step": 315450 }, { "epoch": 1.59, "learning_rate": 6.126955618003036e-05, "loss": 0.0083, "step": 315460 }, { "epoch": 1.59, "learning_rate": 6.126198848701636e-05, "loss": 0.0102, "step": 315470 }, { "epoch": 1.59, "learning_rate": 6.125442079400235e-05, "loss": 0.0066, "step": 315480 }, { "epoch": 1.59, "learning_rate": 6.124685310098833e-05, "loss": 0.0063, "step": 315490 }, { "epoch": 1.59, "learning_rate": 6.123928540797433e-05, "loss": 0.0067, "step": 315500 }, { "epoch": 1.59, "learning_rate": 6.123171771496031e-05, "loss": 0.0053, "step": 315510 }, { "epoch": 1.59, "learning_rate": 6.12241500219463e-05, "loss": 0.0068, "step": 315520 }, { "epoch": 1.59, "learning_rate": 6.12165823289323e-05, "loss": 0.0058, "step": 315530 }, { "epoch": 1.59, "learning_rate": 6.120901463591828e-05, "loss": 0.0059, "step": 315540 }, { "epoch": 1.59, "learning_rate": 6.120144694290428e-05, "loss": 0.0056, "step": 315550 }, { "epoch": 1.59, "learning_rate": 6.119387924989027e-05, "loss": 0.0081, "step": 315560 }, { "epoch": 1.59, "learning_rate": 6.118631155687625e-05, "loss": 0.0082, "step": 315570 }, { "epoch": 1.59, "learning_rate": 6.117874386386225e-05, "loss": 0.0081, "step": 315580 }, { "epoch": 1.59, "learning_rate": 6.117117617084823e-05, "loss": 0.0059, "step": 315590 }, { "epoch": 1.59, "learning_rate": 6.116360847783422e-05, "loss": 0.0094, "step": 315600 }, { "epoch": 1.59, "learning_rate": 6.115604078482022e-05, "loss": 0.0084, "step": 315610 }, { "epoch": 1.59, "learning_rate": 6.11484730918062e-05, "loss": 0.006, "step": 315620 }, { "epoch": 1.59, "learning_rate": 6.11409053987922e-05, "loss": 0.0066, "step": 315630 }, { "epoch": 1.59, "learning_rate": 6.113333770577818e-05, "loss": 0.0074, "step": 315640 }, { "epoch": 1.59, "learning_rate": 6.112577001276417e-05, "loss": 0.0058, "step": 315650 }, { "epoch": 1.59, "learning_rate": 6.111820231975015e-05, "loss": 0.0058, "step": 315660 }, { "epoch": 1.59, "learning_rate": 6.111063462673615e-05, "loss": 0.0076, "step": 315670 }, { "epoch": 1.59, "learning_rate": 6.110306693372214e-05, "loss": 0.0055, "step": 315680 }, { "epoch": 1.59, "learning_rate": 6.109549924070812e-05, "loss": 0.0111, "step": 315690 }, { "epoch": 1.59, "learning_rate": 6.108793154769412e-05, "loss": 0.0078, "step": 315700 }, { "epoch": 1.59, "learning_rate": 6.10803638546801e-05, "loss": 0.0075, "step": 315710 }, { "epoch": 1.59, "learning_rate": 6.10727961616661e-05, "loss": 0.0073, "step": 315720 }, { "epoch": 1.59, "learning_rate": 6.106522846865209e-05, "loss": 0.0062, "step": 315730 }, { "epoch": 1.59, "learning_rate": 6.105766077563807e-05, "loss": 0.009, "step": 315740 }, { "epoch": 1.59, "learning_rate": 6.105009308262407e-05, "loss": 0.0069, "step": 315750 }, { "epoch": 1.59, "learning_rate": 6.104252538961006e-05, "loss": 0.0073, "step": 315760 }, { "epoch": 1.59, "learning_rate": 6.1034957696596043e-05, "loss": 0.0092, "step": 315770 }, { "epoch": 1.59, "learning_rate": 6.102739000358204e-05, "loss": 0.0078, "step": 315780 }, { "epoch": 1.59, "learning_rate": 6.101982231056803e-05, "loss": 0.0065, "step": 315790 }, { "epoch": 1.59, "learning_rate": 6.1012254617554015e-05, "loss": 0.0066, "step": 315800 }, { "epoch": 1.59, "learning_rate": 6.100468692454e-05, "loss": 0.007, "step": 315810 }, { "epoch": 1.59, "learning_rate": 6.0997119231526e-05, "loss": 0.007, "step": 315820 }, { "epoch": 1.59, "learning_rate": 6.0989551538511986e-05, "loss": 0.0057, "step": 315830 }, { "epoch": 1.59, "learning_rate": 6.0981983845497975e-05, "loss": 0.0086, "step": 315840 }, { "epoch": 1.59, "learning_rate": 6.097441615248396e-05, "loss": 0.012, "step": 315850 }, { "epoch": 1.59, "learning_rate": 6.096684845946996e-05, "loss": 0.0072, "step": 315860 }, { "epoch": 1.59, "learning_rate": 6.0959280766455946e-05, "loss": 0.0114, "step": 315870 }, { "epoch": 1.59, "learning_rate": 6.0951713073441934e-05, "loss": 0.0061, "step": 315880 }, { "epoch": 1.59, "learning_rate": 6.094414538042792e-05, "loss": 0.0058, "step": 315890 }, { "epoch": 1.59, "learning_rate": 6.093657768741392e-05, "loss": 0.007, "step": 315900 }, { "epoch": 1.59, "learning_rate": 6.0929009994399906e-05, "loss": 0.005, "step": 315910 }, { "epoch": 1.59, "learning_rate": 6.0921442301385894e-05, "loss": 0.0061, "step": 315920 }, { "epoch": 1.59, "learning_rate": 6.091387460837188e-05, "loss": 0.0048, "step": 315930 }, { "epoch": 1.59, "learning_rate": 6.090630691535788e-05, "loss": 0.0077, "step": 315940 }, { "epoch": 1.59, "learning_rate": 6.089873922234386e-05, "loss": 0.0074, "step": 315950 }, { "epoch": 1.59, "learning_rate": 6.089117152932985e-05, "loss": 0.0066, "step": 315960 }, { "epoch": 1.59, "learning_rate": 6.0883603836315835e-05, "loss": 0.0072, "step": 315970 }, { "epoch": 1.59, "learning_rate": 6.087603614330182e-05, "loss": 0.0065, "step": 315980 }, { "epoch": 1.59, "learning_rate": 6.086846845028782e-05, "loss": 0.0066, "step": 315990 }, { "epoch": 1.59, "learning_rate": 6.0860900757273806e-05, "loss": 0.0074, "step": 316000 }, { "epoch": 1.59, "eval_cer": 0.9144411440194001, "eval_loss": 0.005030008032917976, "eval_runtime": 116.3264, "eval_samples_per_second": 17.193, "eval_steps_per_second": 4.298, "step": 316000 }, { "epoch": 1.59, "learning_rate": 6.0853333064259795e-05, "loss": 0.0076, "step": 316010 }, { "epoch": 1.59, "learning_rate": 6.084576537124578e-05, "loss": 0.0054, "step": 316020 }, { "epoch": 1.59, "learning_rate": 6.083819767823178e-05, "loss": 0.0062, "step": 316030 }, { "epoch": 1.59, "learning_rate": 6.0830629985217766e-05, "loss": 0.0065, "step": 316040 }, { "epoch": 1.59, "learning_rate": 6.0823062292203754e-05, "loss": 0.0074, "step": 316050 }, { "epoch": 1.59, "learning_rate": 6.081549459918974e-05, "loss": 0.0079, "step": 316060 }, { "epoch": 1.59, "learning_rate": 6.080792690617574e-05, "loss": 0.0049, "step": 316070 }, { "epoch": 1.59, "learning_rate": 6.0800359213161726e-05, "loss": 0.0077, "step": 316080 }, { "epoch": 1.59, "learning_rate": 6.0792791520147714e-05, "loss": 0.0063, "step": 316090 }, { "epoch": 1.59, "learning_rate": 6.078522382713371e-05, "loss": 0.0048, "step": 316100 }, { "epoch": 1.59, "learning_rate": 6.07776561341197e-05, "loss": 0.0065, "step": 316110 }, { "epoch": 1.59, "learning_rate": 6.0770088441105685e-05, "loss": 0.0096, "step": 316120 }, { "epoch": 1.59, "learning_rate": 6.0762520748091674e-05, "loss": 0.0071, "step": 316130 }, { "epoch": 1.59, "learning_rate": 6.075495305507767e-05, "loss": 0.0065, "step": 316140 }, { "epoch": 1.6, "learning_rate": 6.074738536206366e-05, "loss": 0.008, "step": 316150 }, { "epoch": 1.6, "learning_rate": 6.0739817669049645e-05, "loss": 0.0064, "step": 316160 }, { "epoch": 1.6, "learning_rate": 6.073224997603563e-05, "loss": 0.0063, "step": 316170 }, { "epoch": 1.6, "learning_rate": 6.072468228302163e-05, "loss": 0.0061, "step": 316180 }, { "epoch": 1.6, "learning_rate": 6.0717114590007616e-05, "loss": 0.0071, "step": 316190 }, { "epoch": 1.6, "learning_rate": 6.0709546896993605e-05, "loss": 0.0059, "step": 316200 }, { "epoch": 1.6, "learning_rate": 6.070197920397959e-05, "loss": 0.0062, "step": 316210 }, { "epoch": 1.6, "learning_rate": 6.069441151096559e-05, "loss": 0.0078, "step": 316220 }, { "epoch": 1.6, "learning_rate": 6.0686843817951576e-05, "loss": 0.0047, "step": 316230 }, { "epoch": 1.6, "learning_rate": 6.0679276124937564e-05, "loss": 0.0082, "step": 316240 }, { "epoch": 1.6, "learning_rate": 6.067170843192355e-05, "loss": 0.0061, "step": 316250 }, { "epoch": 1.6, "learning_rate": 6.066414073890955e-05, "loss": 0.007, "step": 316260 }, { "epoch": 1.6, "learning_rate": 6.065657304589553e-05, "loss": 0.0065, "step": 316270 }, { "epoch": 1.6, "learning_rate": 6.064900535288152e-05, "loss": 0.0071, "step": 316280 }, { "epoch": 1.6, "learning_rate": 6.0641437659867505e-05, "loss": 0.0086, "step": 316290 }, { "epoch": 1.6, "learning_rate": 6.0633869966853494e-05, "loss": 0.0066, "step": 316300 }, { "epoch": 1.6, "learning_rate": 6.062630227383949e-05, "loss": 0.0069, "step": 316310 }, { "epoch": 1.6, "learning_rate": 6.061873458082548e-05, "loss": 0.0085, "step": 316320 }, { "epoch": 1.6, "learning_rate": 6.0611166887811465e-05, "loss": 0.0069, "step": 316330 }, { "epoch": 1.6, "learning_rate": 6.060359919479745e-05, "loss": 0.0051, "step": 316340 }, { "epoch": 1.6, "learning_rate": 6.059603150178345e-05, "loss": 0.0067, "step": 316350 }, { "epoch": 1.6, "learning_rate": 6.0588463808769436e-05, "loss": 0.008, "step": 316360 }, { "epoch": 1.6, "learning_rate": 6.0580896115755425e-05, "loss": 0.0068, "step": 316370 }, { "epoch": 1.6, "learning_rate": 6.057332842274141e-05, "loss": 0.0075, "step": 316380 }, { "epoch": 1.6, "learning_rate": 6.056576072972741e-05, "loss": 0.0064, "step": 316390 }, { "epoch": 1.6, "learning_rate": 6.0558193036713396e-05, "loss": 0.0074, "step": 316400 }, { "epoch": 1.6, "learning_rate": 6.0550625343699384e-05, "loss": 0.0068, "step": 316410 }, { "epoch": 1.6, "learning_rate": 6.054305765068537e-05, "loss": 0.008, "step": 316420 }, { "epoch": 1.6, "learning_rate": 6.053548995767137e-05, "loss": 0.0083, "step": 316430 }, { "epoch": 1.6, "learning_rate": 6.0527922264657356e-05, "loss": 0.0059, "step": 316440 }, { "epoch": 1.6, "learning_rate": 6.0520354571643344e-05, "loss": 0.0067, "step": 316450 }, { "epoch": 1.6, "learning_rate": 6.051278687862933e-05, "loss": 0.006, "step": 316460 }, { "epoch": 1.6, "learning_rate": 6.050521918561533e-05, "loss": 0.0087, "step": 316470 }, { "epoch": 1.6, "learning_rate": 6.0497651492601315e-05, "loss": 0.0085, "step": 316480 }, { "epoch": 1.6, "learning_rate": 6.0490083799587304e-05, "loss": 0.0067, "step": 316490 }, { "epoch": 1.6, "learning_rate": 6.048251610657329e-05, "loss": 0.0072, "step": 316500 }, { "epoch": 1.6, "learning_rate": 6.047494841355929e-05, "loss": 0.0058, "step": 316510 }, { "epoch": 1.6, "learning_rate": 6.0467380720545275e-05, "loss": 0.0068, "step": 316520 }, { "epoch": 1.6, "learning_rate": 6.045981302753126e-05, "loss": 0.0078, "step": 316530 }, { "epoch": 1.6, "learning_rate": 6.045224533451725e-05, "loss": 0.0058, "step": 316540 }, { "epoch": 1.6, "learning_rate": 6.0444677641503247e-05, "loss": 0.0058, "step": 316550 }, { "epoch": 1.6, "learning_rate": 6.0437109948489235e-05, "loss": 0.0059, "step": 316560 }, { "epoch": 1.6, "learning_rate": 6.042954225547522e-05, "loss": 0.0072, "step": 316570 }, { "epoch": 1.6, "learning_rate": 6.0421974562461204e-05, "loss": 0.0066, "step": 316580 }, { "epoch": 1.6, "learning_rate": 6.04144068694472e-05, "loss": 0.0072, "step": 316590 }, { "epoch": 1.6, "learning_rate": 6.040683917643319e-05, "loss": 0.0076, "step": 316600 }, { "epoch": 1.6, "learning_rate": 6.0399271483419176e-05, "loss": 0.0056, "step": 316610 }, { "epoch": 1.6, "learning_rate": 6.0391703790405164e-05, "loss": 0.0062, "step": 316620 }, { "epoch": 1.6, "learning_rate": 6.038413609739116e-05, "loss": 0.0059, "step": 316630 }, { "epoch": 1.6, "learning_rate": 6.037656840437715e-05, "loss": 0.0069, "step": 316640 }, { "epoch": 1.6, "learning_rate": 6.0369000711363135e-05, "loss": 0.0065, "step": 316650 }, { "epoch": 1.6, "learning_rate": 6.0361433018349124e-05, "loss": 0.0063, "step": 316660 }, { "epoch": 1.6, "learning_rate": 6.035386532533512e-05, "loss": 0.0062, "step": 316670 }, { "epoch": 1.6, "learning_rate": 6.034629763232111e-05, "loss": 0.0071, "step": 316680 }, { "epoch": 1.6, "learning_rate": 6.0338729939307095e-05, "loss": 0.0061, "step": 316690 }, { "epoch": 1.6, "learning_rate": 6.033116224629308e-05, "loss": 0.0063, "step": 316700 }, { "epoch": 1.6, "learning_rate": 6.032359455327908e-05, "loss": 0.0057, "step": 316710 }, { "epoch": 1.6, "learning_rate": 6.0316026860265067e-05, "loss": 0.0077, "step": 316720 }, { "epoch": 1.6, "learning_rate": 6.0308459167251055e-05, "loss": 0.0075, "step": 316730 }, { "epoch": 1.6, "learning_rate": 6.030089147423704e-05, "loss": 0.0062, "step": 316740 }, { "epoch": 1.6, "learning_rate": 6.029332378122304e-05, "loss": 0.0076, "step": 316750 }, { "epoch": 1.6, "learning_rate": 6.0285756088209026e-05, "loss": 0.0052, "step": 316760 }, { "epoch": 1.6, "learning_rate": 6.0278188395195014e-05, "loss": 0.0074, "step": 316770 }, { "epoch": 1.6, "learning_rate": 6.0270620702181e-05, "loss": 0.0052, "step": 316780 }, { "epoch": 1.6, "learning_rate": 6.0263053009167e-05, "loss": 0.0064, "step": 316790 }, { "epoch": 1.6, "learning_rate": 6.0255485316152986e-05, "loss": 0.0097, "step": 316800 }, { "epoch": 1.6, "learning_rate": 6.0247917623138974e-05, "loss": 0.0076, "step": 316810 }, { "epoch": 1.6, "learning_rate": 6.024034993012496e-05, "loss": 0.0068, "step": 316820 }, { "epoch": 1.6, "learning_rate": 6.023278223711096e-05, "loss": 0.0074, "step": 316830 }, { "epoch": 1.6, "learning_rate": 6.0225214544096946e-05, "loss": 0.0074, "step": 316840 }, { "epoch": 1.6, "learning_rate": 6.0217646851082934e-05, "loss": 0.0053, "step": 316850 }, { "epoch": 1.6, "learning_rate": 6.021007915806892e-05, "loss": 0.0082, "step": 316860 }, { "epoch": 1.6, "learning_rate": 6.020251146505492e-05, "loss": 0.008, "step": 316870 }, { "epoch": 1.6, "learning_rate": 6.0194943772040905e-05, "loss": 0.0058, "step": 316880 }, { "epoch": 1.6, "learning_rate": 6.018737607902689e-05, "loss": 0.0061, "step": 316890 }, { "epoch": 1.6, "learning_rate": 6.0179808386012875e-05, "loss": 0.007, "step": 316900 }, { "epoch": 1.6, "learning_rate": 6.017224069299886e-05, "loss": 0.0055, "step": 316910 }, { "epoch": 1.6, "learning_rate": 6.016467299998486e-05, "loss": 0.0083, "step": 316920 }, { "epoch": 1.6, "learning_rate": 6.0157105306970846e-05, "loss": 0.0068, "step": 316930 }, { "epoch": 1.6, "learning_rate": 6.0149537613956834e-05, "loss": 0.0087, "step": 316940 }, { "epoch": 1.6, "learning_rate": 6.014196992094282e-05, "loss": 0.007, "step": 316950 }, { "epoch": 1.6, "learning_rate": 6.013440222792882e-05, "loss": 0.0087, "step": 316960 }, { "epoch": 1.6, "learning_rate": 6.0126834534914806e-05, "loss": 0.006, "step": 316970 }, { "epoch": 1.6, "learning_rate": 6.0119266841900794e-05, "loss": 0.0063, "step": 316980 }, { "epoch": 1.6, "learning_rate": 6.011169914888678e-05, "loss": 0.0073, "step": 316990 }, { "epoch": 1.6, "learning_rate": 6.010413145587278e-05, "loss": 0.0076, "step": 317000 }, { "epoch": 1.6, "eval_cer": 0.9144518183767796, "eval_loss": 0.005164159927517176, "eval_runtime": 116.3465, "eval_samples_per_second": 17.19, "eval_steps_per_second": 4.298, "step": 317000 }, { "epoch": 1.6, "learning_rate": 6.0096563762858766e-05, "loss": 0.0069, "step": 317010 }, { "epoch": 1.6, "learning_rate": 6.0088996069844754e-05, "loss": 0.0065, "step": 317020 }, { "epoch": 1.6, "learning_rate": 6.008142837683074e-05, "loss": 0.0062, "step": 317030 }, { "epoch": 1.6, "learning_rate": 6.007386068381674e-05, "loss": 0.0066, "step": 317040 }, { "epoch": 1.6, "learning_rate": 6.0066292990802725e-05, "loss": 0.0097, "step": 317050 }, { "epoch": 1.6, "learning_rate": 6.0058725297788713e-05, "loss": 0.0098, "step": 317060 }, { "epoch": 1.6, "learning_rate": 6.005115760477471e-05, "loss": 0.0077, "step": 317070 }, { "epoch": 1.6, "learning_rate": 6.00435899117607e-05, "loss": 0.0087, "step": 317080 }, { "epoch": 1.6, "learning_rate": 6.0036022218746685e-05, "loss": 0.0061, "step": 317090 }, { "epoch": 1.6, "learning_rate": 6.002845452573267e-05, "loss": 0.0078, "step": 317100 }, { "epoch": 1.6, "learning_rate": 6.002088683271867e-05, "loss": 0.0063, "step": 317110 }, { "epoch": 1.6, "learning_rate": 6.0013319139704656e-05, "loss": 0.0056, "step": 317120 }, { "epoch": 1.6, "learning_rate": 6.0005751446690645e-05, "loss": 0.0068, "step": 317130 }, { "epoch": 1.6, "learning_rate": 5.999818375367663e-05, "loss": 0.0067, "step": 317140 }, { "epoch": 1.6, "learning_rate": 5.999061606066263e-05, "loss": 0.0079, "step": 317150 }, { "epoch": 1.6, "learning_rate": 5.9983048367648616e-05, "loss": 0.0064, "step": 317160 }, { "epoch": 1.6, "learning_rate": 5.9975480674634604e-05, "loss": 0.0052, "step": 317170 }, { "epoch": 1.6, "learning_rate": 5.996791298162059e-05, "loss": 0.007, "step": 317180 }, { "epoch": 1.6, "learning_rate": 5.996034528860659e-05, "loss": 0.0075, "step": 317190 }, { "epoch": 1.6, "learning_rate": 5.9952777595592576e-05, "loss": 0.008, "step": 317200 }, { "epoch": 1.6, "learning_rate": 5.994520990257856e-05, "loss": 0.006, "step": 317210 }, { "epoch": 1.6, "learning_rate": 5.9937642209564545e-05, "loss": 0.0053, "step": 317220 }, { "epoch": 1.6, "learning_rate": 5.9930074516550533e-05, "loss": 0.0084, "step": 317230 }, { "epoch": 1.6, "learning_rate": 5.992250682353653e-05, "loss": 0.0062, "step": 317240 }, { "epoch": 1.6, "learning_rate": 5.991493913052252e-05, "loss": 0.0077, "step": 317250 }, { "epoch": 1.6, "learning_rate": 5.9907371437508505e-05, "loss": 0.005, "step": 317260 }, { "epoch": 1.6, "learning_rate": 5.989980374449449e-05, "loss": 0.0086, "step": 317270 }, { "epoch": 1.6, "learning_rate": 5.989223605148049e-05, "loss": 0.0063, "step": 317280 }, { "epoch": 1.6, "learning_rate": 5.9884668358466476e-05, "loss": 0.0075, "step": 317290 }, { "epoch": 1.6, "learning_rate": 5.9877100665452465e-05, "loss": 0.0057, "step": 317300 }, { "epoch": 1.6, "learning_rate": 5.986953297243845e-05, "loss": 0.0062, "step": 317310 }, { "epoch": 1.6, "learning_rate": 5.986196527942445e-05, "loss": 0.0073, "step": 317320 }, { "epoch": 1.6, "learning_rate": 5.9854397586410436e-05, "loss": 0.0052, "step": 317330 }, { "epoch": 1.6, "learning_rate": 5.9846829893396424e-05, "loss": 0.0067, "step": 317340 }, { "epoch": 1.6, "learning_rate": 5.983926220038241e-05, "loss": 0.0061, "step": 317350 }, { "epoch": 1.6, "learning_rate": 5.983169450736841e-05, "loss": 0.0076, "step": 317360 }, { "epoch": 1.6, "learning_rate": 5.9824126814354396e-05, "loss": 0.0066, "step": 317370 }, { "epoch": 1.6, "learning_rate": 5.9816559121340384e-05, "loss": 0.0073, "step": 317380 }, { "epoch": 1.6, "learning_rate": 5.980899142832637e-05, "loss": 0.0079, "step": 317390 }, { "epoch": 1.6, "learning_rate": 5.980142373531237e-05, "loss": 0.0068, "step": 317400 }, { "epoch": 1.6, "learning_rate": 5.9793856042298355e-05, "loss": 0.0058, "step": 317410 }, { "epoch": 1.6, "learning_rate": 5.9786288349284344e-05, "loss": 0.0076, "step": 317420 }, { "epoch": 1.6, "learning_rate": 5.977872065627033e-05, "loss": 0.0062, "step": 317430 }, { "epoch": 1.6, "learning_rate": 5.977115296325633e-05, "loss": 0.0058, "step": 317440 }, { "epoch": 1.6, "learning_rate": 5.9763585270242315e-05, "loss": 0.0078, "step": 317450 }, { "epoch": 1.6, "learning_rate": 5.97560175772283e-05, "loss": 0.0063, "step": 317460 }, { "epoch": 1.6, "learning_rate": 5.974844988421429e-05, "loss": 0.0071, "step": 317470 }, { "epoch": 1.6, "learning_rate": 5.9740882191200286e-05, "loss": 0.0093, "step": 317480 }, { "epoch": 1.6, "learning_rate": 5.9733314498186275e-05, "loss": 0.008, "step": 317490 }, { "epoch": 1.6, "learning_rate": 5.972574680517226e-05, "loss": 0.0071, "step": 317500 }, { "epoch": 1.6, "learning_rate": 5.971817911215825e-05, "loss": 0.0058, "step": 317510 }, { "epoch": 1.6, "learning_rate": 5.9710611419144246e-05, "loss": 0.0073, "step": 317520 }, { "epoch": 1.6, "learning_rate": 5.970304372613023e-05, "loss": 0.006, "step": 317530 }, { "epoch": 1.6, "learning_rate": 5.9695476033116216e-05, "loss": 0.0058, "step": 317540 }, { "epoch": 1.6, "learning_rate": 5.9687908340102204e-05, "loss": 0.0071, "step": 317550 }, { "epoch": 1.6, "learning_rate": 5.96803406470882e-05, "loss": 0.0058, "step": 317560 }, { "epoch": 1.6, "learning_rate": 5.967277295407419e-05, "loss": 0.0102, "step": 317570 }, { "epoch": 1.6, "learning_rate": 5.9665205261060175e-05, "loss": 0.0068, "step": 317580 }, { "epoch": 1.6, "learning_rate": 5.9657637568046164e-05, "loss": 0.007, "step": 317590 }, { "epoch": 1.6, "learning_rate": 5.965006987503216e-05, "loss": 0.0071, "step": 317600 }, { "epoch": 1.6, "learning_rate": 5.964250218201815e-05, "loss": 0.0059, "step": 317610 }, { "epoch": 1.6, "learning_rate": 5.9634934489004135e-05, "loss": 0.0073, "step": 317620 }, { "epoch": 1.6, "learning_rate": 5.962736679599012e-05, "loss": 0.0061, "step": 317630 }, { "epoch": 1.6, "learning_rate": 5.961979910297612e-05, "loss": 0.0059, "step": 317640 }, { "epoch": 1.6, "learning_rate": 5.9612231409962106e-05, "loss": 0.0068, "step": 317650 }, { "epoch": 1.6, "learning_rate": 5.9604663716948095e-05, "loss": 0.0069, "step": 317660 }, { "epoch": 1.6, "learning_rate": 5.959709602393408e-05, "loss": 0.0069, "step": 317670 }, { "epoch": 1.6, "learning_rate": 5.958952833092008e-05, "loss": 0.0069, "step": 317680 }, { "epoch": 1.6, "learning_rate": 5.9581960637906066e-05, "loss": 0.0072, "step": 317690 }, { "epoch": 1.6, "learning_rate": 5.9574392944892054e-05, "loss": 0.0059, "step": 317700 }, { "epoch": 1.6, "learning_rate": 5.956682525187804e-05, "loss": 0.0089, "step": 317710 }, { "epoch": 1.6, "learning_rate": 5.955925755886404e-05, "loss": 0.0069, "step": 317720 }, { "epoch": 1.6, "learning_rate": 5.9551689865850026e-05, "loss": 0.008, "step": 317730 }, { "epoch": 1.6, "learning_rate": 5.9544122172836014e-05, "loss": 0.0074, "step": 317740 }, { "epoch": 1.6, "learning_rate": 5.9536554479822e-05, "loss": 0.006, "step": 317750 }, { "epoch": 1.6, "learning_rate": 5.9528986786808e-05, "loss": 0.0089, "step": 317760 }, { "epoch": 1.6, "learning_rate": 5.9521419093793985e-05, "loss": 0.0076, "step": 317770 }, { "epoch": 1.6, "learning_rate": 5.9513851400779974e-05, "loss": 0.009, "step": 317780 }, { "epoch": 1.6, "learning_rate": 5.950628370776596e-05, "loss": 0.0052, "step": 317790 }, { "epoch": 1.6, "learning_rate": 5.949871601475196e-05, "loss": 0.0056, "step": 317800 }, { "epoch": 1.6, "learning_rate": 5.9491148321737945e-05, "loss": 0.007, "step": 317810 }, { "epoch": 1.6, "learning_rate": 5.948358062872393e-05, "loss": 0.0084, "step": 317820 }, { "epoch": 1.6, "learning_rate": 5.947601293570992e-05, "loss": 0.0083, "step": 317830 }, { "epoch": 1.6, "learning_rate": 5.94684452426959e-05, "loss": 0.0069, "step": 317840 }, { "epoch": 1.6, "learning_rate": 5.94608775496819e-05, "loss": 0.0071, "step": 317850 }, { "epoch": 1.6, "learning_rate": 5.9453309856667886e-05, "loss": 0.0088, "step": 317860 }, { "epoch": 1.6, "learning_rate": 5.9445742163653874e-05, "loss": 0.0059, "step": 317870 }, { "epoch": 1.6, "learning_rate": 5.943817447063986e-05, "loss": 0.005, "step": 317880 }, { "epoch": 1.6, "learning_rate": 5.943060677762586e-05, "loss": 0.0065, "step": 317890 }, { "epoch": 1.6, "learning_rate": 5.9423039084611846e-05, "loss": 0.0062, "step": 317900 }, { "epoch": 1.6, "learning_rate": 5.9415471391597834e-05, "loss": 0.0061, "step": 317910 }, { "epoch": 1.6, "learning_rate": 5.940790369858382e-05, "loss": 0.0065, "step": 317920 }, { "epoch": 1.6, "learning_rate": 5.940033600556982e-05, "loss": 0.0065, "step": 317930 }, { "epoch": 1.6, "learning_rate": 5.9392768312555805e-05, "loss": 0.0059, "step": 317940 }, { "epoch": 1.6, "learning_rate": 5.9385200619541794e-05, "loss": 0.0065, "step": 317950 }, { "epoch": 1.6, "learning_rate": 5.937763292652778e-05, "loss": 0.0058, "step": 317960 }, { "epoch": 1.6, "learning_rate": 5.937006523351378e-05, "loss": 0.0075, "step": 317970 }, { "epoch": 1.6, "learning_rate": 5.9362497540499765e-05, "loss": 0.0061, "step": 317980 }, { "epoch": 1.6, "learning_rate": 5.935492984748575e-05, "loss": 0.0076, "step": 317990 }, { "epoch": 1.6, "learning_rate": 5.934736215447174e-05, "loss": 0.0051, "step": 318000 }, { "epoch": 1.6, "eval_cer": 0.9144285288697699, "eval_loss": 0.005206539761275053, "eval_runtime": 116.4709, "eval_samples_per_second": 17.172, "eval_steps_per_second": 4.293, "step": 318000 }, { "epoch": 1.6, "learning_rate": 5.9339794461457737e-05, "loss": 0.0057, "step": 318010 }, { "epoch": 1.6, "learning_rate": 5.9332226768443725e-05, "loss": 0.0096, "step": 318020 }, { "epoch": 1.6, "learning_rate": 5.932465907542971e-05, "loss": 0.0058, "step": 318030 }, { "epoch": 1.6, "learning_rate": 5.931709138241571e-05, "loss": 0.0061, "step": 318040 }, { "epoch": 1.6, "learning_rate": 5.9309523689401696e-05, "loss": 0.0083, "step": 318050 }, { "epoch": 1.6, "learning_rate": 5.9301955996387684e-05, "loss": 0.006, "step": 318060 }, { "epoch": 1.6, "learning_rate": 5.929438830337367e-05, "loss": 0.0071, "step": 318070 }, { "epoch": 1.6, "learning_rate": 5.928682061035967e-05, "loss": 0.0052, "step": 318080 }, { "epoch": 1.6, "learning_rate": 5.9279252917345656e-05, "loss": 0.0086, "step": 318090 }, { "epoch": 1.6, "learning_rate": 5.9271685224331644e-05, "loss": 0.0057, "step": 318100 }, { "epoch": 1.6, "learning_rate": 5.926411753131763e-05, "loss": 0.0086, "step": 318110 }, { "epoch": 1.6, "learning_rate": 5.925654983830363e-05, "loss": 0.0067, "step": 318120 }, { "epoch": 1.6, "learning_rate": 5.9248982145289615e-05, "loss": 0.0071, "step": 318130 }, { "epoch": 1.61, "learning_rate": 5.9241414452275604e-05, "loss": 0.0093, "step": 318140 }, { "epoch": 1.61, "learning_rate": 5.9233846759261585e-05, "loss": 0.0101, "step": 318150 }, { "epoch": 1.61, "learning_rate": 5.922627906624757e-05, "loss": 0.0071, "step": 318160 }, { "epoch": 1.61, "learning_rate": 5.921871137323357e-05, "loss": 0.0059, "step": 318170 }, { "epoch": 1.61, "learning_rate": 5.9211143680219557e-05, "loss": 0.0075, "step": 318180 }, { "epoch": 1.61, "learning_rate": 5.9203575987205545e-05, "loss": 0.0091, "step": 318190 }, { "epoch": 1.61, "learning_rate": 5.919600829419153e-05, "loss": 0.0086, "step": 318200 }, { "epoch": 1.61, "learning_rate": 5.918844060117753e-05, "loss": 0.0073, "step": 318210 }, { "epoch": 1.61, "learning_rate": 5.9180872908163516e-05, "loss": 0.0065, "step": 318220 }, { "epoch": 1.61, "learning_rate": 5.9173305215149504e-05, "loss": 0.0087, "step": 318230 }, { "epoch": 1.61, "learning_rate": 5.916573752213549e-05, "loss": 0.0068, "step": 318240 }, { "epoch": 1.61, "learning_rate": 5.915816982912149e-05, "loss": 0.0059, "step": 318250 }, { "epoch": 1.61, "learning_rate": 5.9150602136107476e-05, "loss": 0.0065, "step": 318260 }, { "epoch": 1.61, "learning_rate": 5.9143034443093464e-05, "loss": 0.0059, "step": 318270 }, { "epoch": 1.61, "learning_rate": 5.913546675007945e-05, "loss": 0.005, "step": 318280 }, { "epoch": 1.61, "learning_rate": 5.912789905706545e-05, "loss": 0.0077, "step": 318290 }, { "epoch": 1.61, "learning_rate": 5.9120331364051436e-05, "loss": 0.0081, "step": 318300 }, { "epoch": 1.61, "learning_rate": 5.9112763671037424e-05, "loss": 0.0063, "step": 318310 }, { "epoch": 1.61, "learning_rate": 5.910519597802341e-05, "loss": 0.006, "step": 318320 }, { "epoch": 1.61, "learning_rate": 5.909762828500941e-05, "loss": 0.0059, "step": 318330 }, { "epoch": 1.61, "learning_rate": 5.9090060591995395e-05, "loss": 0.0064, "step": 318340 }, { "epoch": 1.61, "learning_rate": 5.908249289898138e-05, "loss": 0.0062, "step": 318350 }, { "epoch": 1.61, "learning_rate": 5.907492520596737e-05, "loss": 0.0063, "step": 318360 }, { "epoch": 1.61, "learning_rate": 5.9067357512953367e-05, "loss": 0.0069, "step": 318370 }, { "epoch": 1.61, "learning_rate": 5.9059789819939355e-05, "loss": 0.0082, "step": 318380 }, { "epoch": 1.61, "learning_rate": 5.905222212692534e-05, "loss": 0.0062, "step": 318390 }, { "epoch": 1.61, "learning_rate": 5.904465443391133e-05, "loss": 0.0085, "step": 318400 }, { "epoch": 1.61, "learning_rate": 5.9037086740897326e-05, "loss": 0.0064, "step": 318410 }, { "epoch": 1.61, "learning_rate": 5.9029519047883314e-05, "loss": 0.0086, "step": 318420 }, { "epoch": 1.61, "learning_rate": 5.90219513548693e-05, "loss": 0.0088, "step": 318430 }, { "epoch": 1.61, "learning_rate": 5.901438366185529e-05, "loss": 0.008, "step": 318440 }, { "epoch": 1.61, "learning_rate": 5.9006815968841286e-05, "loss": 0.0071, "step": 318450 }, { "epoch": 1.61, "learning_rate": 5.8999248275827274e-05, "loss": 0.0057, "step": 318460 }, { "epoch": 1.61, "learning_rate": 5.8991680582813256e-05, "loss": 0.0068, "step": 318470 }, { "epoch": 1.61, "learning_rate": 5.8984112889799244e-05, "loss": 0.0056, "step": 318480 }, { "epoch": 1.61, "learning_rate": 5.897654519678523e-05, "loss": 0.0068, "step": 318490 }, { "epoch": 1.61, "learning_rate": 5.896897750377123e-05, "loss": 0.0065, "step": 318500 }, { "epoch": 1.61, "learning_rate": 5.8961409810757215e-05, "loss": 0.0062, "step": 318510 }, { "epoch": 1.61, "learning_rate": 5.8953842117743203e-05, "loss": 0.0077, "step": 318520 }, { "epoch": 1.61, "learning_rate": 5.89462744247292e-05, "loss": 0.0063, "step": 318530 }, { "epoch": 1.61, "learning_rate": 5.893870673171519e-05, "loss": 0.006, "step": 318540 }, { "epoch": 1.61, "learning_rate": 5.8931139038701175e-05, "loss": 0.0079, "step": 318550 }, { "epoch": 1.61, "learning_rate": 5.892357134568716e-05, "loss": 0.0075, "step": 318560 }, { "epoch": 1.61, "learning_rate": 5.891600365267316e-05, "loss": 0.008, "step": 318570 }, { "epoch": 1.61, "learning_rate": 5.8908435959659146e-05, "loss": 0.0098, "step": 318580 }, { "epoch": 1.61, "learning_rate": 5.8900868266645135e-05, "loss": 0.0068, "step": 318590 }, { "epoch": 1.61, "learning_rate": 5.889330057363112e-05, "loss": 0.0039, "step": 318600 }, { "epoch": 1.61, "learning_rate": 5.888573288061712e-05, "loss": 0.0062, "step": 318610 }, { "epoch": 1.61, "learning_rate": 5.8878165187603106e-05, "loss": 0.0086, "step": 318620 }, { "epoch": 1.61, "learning_rate": 5.8870597494589094e-05, "loss": 0.0049, "step": 318630 }, { "epoch": 1.61, "learning_rate": 5.886302980157508e-05, "loss": 0.0069, "step": 318640 }, { "epoch": 1.61, "learning_rate": 5.885546210856108e-05, "loss": 0.0065, "step": 318650 }, { "epoch": 1.61, "learning_rate": 5.8847894415547066e-05, "loss": 0.0085, "step": 318660 }, { "epoch": 1.61, "learning_rate": 5.8840326722533054e-05, "loss": 0.0062, "step": 318670 }, { "epoch": 1.61, "learning_rate": 5.883275902951904e-05, "loss": 0.0072, "step": 318680 }, { "epoch": 1.61, "learning_rate": 5.882519133650504e-05, "loss": 0.0058, "step": 318690 }, { "epoch": 1.61, "learning_rate": 5.8817623643491025e-05, "loss": 0.0081, "step": 318700 }, { "epoch": 1.61, "learning_rate": 5.8810055950477013e-05, "loss": 0.0069, "step": 318710 }, { "epoch": 1.61, "learning_rate": 5.8802488257463e-05, "loss": 0.0081, "step": 318720 }, { "epoch": 1.61, "learning_rate": 5.8794920564449e-05, "loss": 0.0075, "step": 318730 }, { "epoch": 1.61, "learning_rate": 5.8787352871434985e-05, "loss": 0.0055, "step": 318740 }, { "epoch": 1.61, "learning_rate": 5.877978517842097e-05, "loss": 0.0058, "step": 318750 }, { "epoch": 1.61, "learning_rate": 5.877221748540696e-05, "loss": 0.0067, "step": 318760 }, { "epoch": 1.61, "learning_rate": 5.8764649792392956e-05, "loss": 0.0051, "step": 318770 }, { "epoch": 1.61, "learning_rate": 5.875708209937894e-05, "loss": 0.0097, "step": 318780 }, { "epoch": 1.61, "learning_rate": 5.8749514406364926e-05, "loss": 0.0085, "step": 318790 }, { "epoch": 1.61, "learning_rate": 5.8741946713350914e-05, "loss": 0.0066, "step": 318800 }, { "epoch": 1.61, "learning_rate": 5.87343790203369e-05, "loss": 0.009, "step": 318810 }, { "epoch": 1.61, "learning_rate": 5.87268113273229e-05, "loss": 0.0054, "step": 318820 }, { "epoch": 1.61, "learning_rate": 5.8719243634308886e-05, "loss": 0.009, "step": 318830 }, { "epoch": 1.61, "learning_rate": 5.8711675941294874e-05, "loss": 0.0059, "step": 318840 }, { "epoch": 1.61, "learning_rate": 5.870410824828086e-05, "loss": 0.0086, "step": 318850 }, { "epoch": 1.61, "learning_rate": 5.869654055526686e-05, "loss": 0.0051, "step": 318860 }, { "epoch": 1.61, "learning_rate": 5.8688972862252845e-05, "loss": 0.0066, "step": 318870 }, { "epoch": 1.61, "learning_rate": 5.8681405169238834e-05, "loss": 0.0086, "step": 318880 }, { "epoch": 1.61, "learning_rate": 5.867383747622482e-05, "loss": 0.0096, "step": 318890 }, { "epoch": 1.61, "learning_rate": 5.866626978321082e-05, "loss": 0.0101, "step": 318900 }, { "epoch": 1.61, "learning_rate": 5.8658702090196805e-05, "loss": 0.0054, "step": 318910 }, { "epoch": 1.61, "learning_rate": 5.865113439718279e-05, "loss": 0.004, "step": 318920 }, { "epoch": 1.61, "learning_rate": 5.864356670416878e-05, "loss": 0.0062, "step": 318930 }, { "epoch": 1.61, "learning_rate": 5.8635999011154776e-05, "loss": 0.0064, "step": 318940 }, { "epoch": 1.61, "learning_rate": 5.8628431318140765e-05, "loss": 0.0063, "step": 318950 }, { "epoch": 1.61, "learning_rate": 5.862086362512675e-05, "loss": 0.0061, "step": 318960 }, { "epoch": 1.61, "learning_rate": 5.861329593211274e-05, "loss": 0.0076, "step": 318970 }, { "epoch": 1.61, "learning_rate": 5.8605728239098736e-05, "loss": 0.0083, "step": 318980 }, { "epoch": 1.61, "learning_rate": 5.8598160546084724e-05, "loss": 0.0108, "step": 318990 }, { "epoch": 1.61, "learning_rate": 5.859059285307071e-05, "loss": 0.0057, "step": 319000 }, { "epoch": 1.61, "eval_cer": 0.9144294992658953, "eval_loss": 0.00516105629503727, "eval_runtime": 116.3084, "eval_samples_per_second": 17.196, "eval_steps_per_second": 4.299, "step": 319000 }, { "epoch": 1.61, "learning_rate": 5.858302516005671e-05, "loss": 0.0061, "step": 319010 }, { "epoch": 1.61, "learning_rate": 5.8575457467042696e-05, "loss": 0.0062, "step": 319020 }, { "epoch": 1.61, "learning_rate": 5.8567889774028684e-05, "loss": 0.0084, "step": 319030 }, { "epoch": 1.61, "learning_rate": 5.856032208101467e-05, "loss": 0.0066, "step": 319040 }, { "epoch": 1.61, "learning_rate": 5.855275438800067e-05, "loss": 0.0077, "step": 319050 }, { "epoch": 1.61, "learning_rate": 5.8545186694986655e-05, "loss": 0.0092, "step": 319060 }, { "epoch": 1.61, "learning_rate": 5.8537619001972644e-05, "loss": 0.0067, "step": 319070 }, { "epoch": 1.61, "learning_rate": 5.853005130895863e-05, "loss": 0.0057, "step": 319080 }, { "epoch": 1.61, "learning_rate": 5.852248361594463e-05, "loss": 0.0092, "step": 319090 }, { "epoch": 1.61, "learning_rate": 5.851491592293061e-05, "loss": 0.0064, "step": 319100 }, { "epoch": 1.61, "learning_rate": 5.8507348229916596e-05, "loss": 0.0076, "step": 319110 }, { "epoch": 1.61, "learning_rate": 5.8499780536902585e-05, "loss": 0.0085, "step": 319120 }, { "epoch": 1.61, "learning_rate": 5.849221284388857e-05, "loss": 0.0044, "step": 319130 }, { "epoch": 1.61, "learning_rate": 5.848464515087457e-05, "loss": 0.008, "step": 319140 }, { "epoch": 1.61, "learning_rate": 5.8477077457860556e-05, "loss": 0.0072, "step": 319150 }, { "epoch": 1.61, "learning_rate": 5.8469509764846544e-05, "loss": 0.0083, "step": 319160 }, { "epoch": 1.61, "learning_rate": 5.846194207183253e-05, "loss": 0.0095, "step": 319170 }, { "epoch": 1.61, "learning_rate": 5.845437437881853e-05, "loss": 0.0075, "step": 319180 }, { "epoch": 1.61, "learning_rate": 5.8446806685804516e-05, "loss": 0.007, "step": 319190 }, { "epoch": 1.61, "learning_rate": 5.8439238992790504e-05, "loss": 0.0062, "step": 319200 }, { "epoch": 1.61, "learning_rate": 5.843167129977649e-05, "loss": 0.0054, "step": 319210 }, { "epoch": 1.61, "learning_rate": 5.842410360676249e-05, "loss": 0.0069, "step": 319220 }, { "epoch": 1.61, "learning_rate": 5.8416535913748475e-05, "loss": 0.0071, "step": 319230 }, { "epoch": 1.61, "learning_rate": 5.8408968220734464e-05, "loss": 0.0068, "step": 319240 }, { "epoch": 1.61, "learning_rate": 5.840140052772045e-05, "loss": 0.0089, "step": 319250 }, { "epoch": 1.61, "learning_rate": 5.839383283470645e-05, "loss": 0.0065, "step": 319260 }, { "epoch": 1.61, "learning_rate": 5.8386265141692435e-05, "loss": 0.0081, "step": 319270 }, { "epoch": 1.61, "learning_rate": 5.837869744867842e-05, "loss": 0.0071, "step": 319280 }, { "epoch": 1.61, "learning_rate": 5.837112975566441e-05, "loss": 0.011, "step": 319290 }, { "epoch": 1.61, "learning_rate": 5.8363562062650406e-05, "loss": 0.0049, "step": 319300 }, { "epoch": 1.61, "learning_rate": 5.8355994369636395e-05, "loss": 0.0064, "step": 319310 }, { "epoch": 1.61, "learning_rate": 5.834842667662238e-05, "loss": 0.0052, "step": 319320 }, { "epoch": 1.61, "learning_rate": 5.834085898360837e-05, "loss": 0.0066, "step": 319330 }, { "epoch": 1.61, "learning_rate": 5.8333291290594366e-05, "loss": 0.0067, "step": 319340 }, { "epoch": 1.61, "learning_rate": 5.8325723597580354e-05, "loss": 0.009, "step": 319350 }, { "epoch": 1.61, "learning_rate": 5.831815590456634e-05, "loss": 0.0066, "step": 319360 }, { "epoch": 1.61, "learning_rate": 5.831058821155233e-05, "loss": 0.0077, "step": 319370 }, { "epoch": 1.61, "learning_rate": 5.8303020518538326e-05, "loss": 0.0061, "step": 319380 }, { "epoch": 1.61, "learning_rate": 5.8295452825524314e-05, "loss": 0.0071, "step": 319390 }, { "epoch": 1.61, "learning_rate": 5.82878851325103e-05, "loss": 0.0054, "step": 319400 }, { "epoch": 1.61, "learning_rate": 5.8280317439496284e-05, "loss": 0.0068, "step": 319410 }, { "epoch": 1.61, "learning_rate": 5.827274974648227e-05, "loss": 0.0091, "step": 319420 }, { "epoch": 1.61, "learning_rate": 5.826518205346827e-05, "loss": 0.0054, "step": 319430 }, { "epoch": 1.61, "learning_rate": 5.8257614360454255e-05, "loss": 0.0053, "step": 319440 }, { "epoch": 1.61, "learning_rate": 5.825004666744024e-05, "loss": 0.0069, "step": 319450 }, { "epoch": 1.61, "learning_rate": 5.824247897442623e-05, "loss": 0.0067, "step": 319460 }, { "epoch": 1.61, "learning_rate": 5.8234911281412227e-05, "loss": 0.0081, "step": 319470 }, { "epoch": 1.61, "learning_rate": 5.8227343588398215e-05, "loss": 0.0082, "step": 319480 }, { "epoch": 1.61, "learning_rate": 5.82197758953842e-05, "loss": 0.0065, "step": 319490 }, { "epoch": 1.61, "learning_rate": 5.82122082023702e-05, "loss": 0.0079, "step": 319500 }, { "epoch": 1.61, "learning_rate": 5.8204640509356186e-05, "loss": 0.0068, "step": 319510 }, { "epoch": 1.61, "learning_rate": 5.8197072816342174e-05, "loss": 0.0086, "step": 319520 }, { "epoch": 1.61, "learning_rate": 5.818950512332816e-05, "loss": 0.0051, "step": 319530 }, { "epoch": 1.61, "learning_rate": 5.818193743031416e-05, "loss": 0.0059, "step": 319540 }, { "epoch": 1.61, "learning_rate": 5.8174369737300146e-05, "loss": 0.0054, "step": 319550 }, { "epoch": 1.61, "learning_rate": 5.8166802044286134e-05, "loss": 0.0054, "step": 319560 }, { "epoch": 1.61, "learning_rate": 5.815923435127212e-05, "loss": 0.0069, "step": 319570 }, { "epoch": 1.61, "learning_rate": 5.815166665825812e-05, "loss": 0.0065, "step": 319580 }, { "epoch": 1.61, "learning_rate": 5.8144098965244105e-05, "loss": 0.0051, "step": 319590 }, { "epoch": 1.61, "learning_rate": 5.8136531272230094e-05, "loss": 0.0063, "step": 319600 }, { "epoch": 1.61, "learning_rate": 5.812896357921608e-05, "loss": 0.006, "step": 319610 }, { "epoch": 1.61, "learning_rate": 5.812139588620208e-05, "loss": 0.0071, "step": 319620 }, { "epoch": 1.61, "learning_rate": 5.8113828193188065e-05, "loss": 0.0074, "step": 319630 }, { "epoch": 1.61, "learning_rate": 5.810626050017405e-05, "loss": 0.006, "step": 319640 }, { "epoch": 1.61, "learning_rate": 5.809869280716004e-05, "loss": 0.0062, "step": 319650 }, { "epoch": 1.61, "learning_rate": 5.8091125114146037e-05, "loss": 0.0068, "step": 319660 }, { "epoch": 1.61, "learning_rate": 5.8083557421132025e-05, "loss": 0.0065, "step": 319670 }, { "epoch": 1.61, "learning_rate": 5.807598972811801e-05, "loss": 0.0054, "step": 319680 }, { "epoch": 1.61, "learning_rate": 5.8068422035104e-05, "loss": 0.0051, "step": 319690 }, { "epoch": 1.61, "learning_rate": 5.8060854342089996e-05, "loss": 0.0055, "step": 319700 }, { "epoch": 1.61, "learning_rate": 5.8053286649075984e-05, "loss": 0.0077, "step": 319710 }, { "epoch": 1.61, "learning_rate": 5.804571895606197e-05, "loss": 0.0066, "step": 319720 }, { "epoch": 1.61, "learning_rate": 5.8038151263047954e-05, "loss": 0.0051, "step": 319730 }, { "epoch": 1.61, "learning_rate": 5.803058357003394e-05, "loss": 0.0069, "step": 319740 }, { "epoch": 1.61, "learning_rate": 5.802301587701994e-05, "loss": 0.0064, "step": 319750 }, { "epoch": 1.61, "learning_rate": 5.8015448184005926e-05, "loss": 0.0076, "step": 319760 }, { "epoch": 1.61, "learning_rate": 5.8007880490991914e-05, "loss": 0.0087, "step": 319770 }, { "epoch": 1.61, "learning_rate": 5.80003127979779e-05, "loss": 0.0068, "step": 319780 }, { "epoch": 1.61, "learning_rate": 5.79927451049639e-05, "loss": 0.0076, "step": 319790 }, { "epoch": 1.61, "learning_rate": 5.7985177411949885e-05, "loss": 0.0065, "step": 319800 }, { "epoch": 1.61, "learning_rate": 5.7977609718935873e-05, "loss": 0.0077, "step": 319810 }, { "epoch": 1.61, "learning_rate": 5.797004202592186e-05, "loss": 0.0048, "step": 319820 }, { "epoch": 1.61, "learning_rate": 5.7962474332907857e-05, "loss": 0.0057, "step": 319830 }, { "epoch": 1.61, "learning_rate": 5.7954906639893845e-05, "loss": 0.0054, "step": 319840 }, { "epoch": 1.61, "learning_rate": 5.794733894687983e-05, "loss": 0.0062, "step": 319850 }, { "epoch": 1.61, "learning_rate": 5.793977125386582e-05, "loss": 0.0056, "step": 319860 }, { "epoch": 1.61, "learning_rate": 5.7932203560851816e-05, "loss": 0.0083, "step": 319870 }, { "epoch": 1.61, "learning_rate": 5.7924635867837804e-05, "loss": 0.0064, "step": 319880 }, { "epoch": 1.61, "learning_rate": 5.791706817482379e-05, "loss": 0.0063, "step": 319890 }, { "epoch": 1.61, "learning_rate": 5.790950048180978e-05, "loss": 0.0069, "step": 319900 }, { "epoch": 1.61, "learning_rate": 5.7901932788795776e-05, "loss": 0.008, "step": 319910 }, { "epoch": 1.61, "learning_rate": 5.7894365095781764e-05, "loss": 0.0068, "step": 319920 }, { "epoch": 1.61, "learning_rate": 5.788679740276775e-05, "loss": 0.0064, "step": 319930 }, { "epoch": 1.61, "learning_rate": 5.787922970975374e-05, "loss": 0.0066, "step": 319940 }, { "epoch": 1.61, "learning_rate": 5.7871662016739736e-05, "loss": 0.007, "step": 319950 }, { "epoch": 1.61, "learning_rate": 5.7864094323725724e-05, "loss": 0.0054, "step": 319960 }, { "epoch": 1.61, "learning_rate": 5.785652663071171e-05, "loss": 0.0068, "step": 319970 }, { "epoch": 1.61, "learning_rate": 5.784895893769771e-05, "loss": 0.0068, "step": 319980 }, { "epoch": 1.61, "learning_rate": 5.7841391244683695e-05, "loss": 0.0073, "step": 319990 }, { "epoch": 1.61, "learning_rate": 5.7833823551669683e-05, "loss": 0.0058, "step": 320000 }, { "epoch": 1.61, "eval_cer": 0.9144392032271493, "eval_loss": 0.005123169161379337, "eval_runtime": 116.2037, "eval_samples_per_second": 17.211, "eval_steps_per_second": 4.303, "step": 320000 }, { "epoch": 1.61, "learning_rate": 5.782625585865567e-05, "loss": 0.0062, "step": 320010 }, { "epoch": 1.61, "learning_rate": 5.781868816564167e-05, "loss": 0.0058, "step": 320020 }, { "epoch": 1.61, "learning_rate": 5.7811120472627655e-05, "loss": 0.0101, "step": 320030 }, { "epoch": 1.61, "learning_rate": 5.7803552779613636e-05, "loss": 0.0063, "step": 320040 }, { "epoch": 1.61, "learning_rate": 5.7795985086599625e-05, "loss": 0.007, "step": 320050 }, { "epoch": 1.61, "learning_rate": 5.778841739358561e-05, "loss": 0.0061, "step": 320060 }, { "epoch": 1.61, "learning_rate": 5.778084970057161e-05, "loss": 0.0097, "step": 320070 }, { "epoch": 1.61, "learning_rate": 5.7773282007557596e-05, "loss": 0.0067, "step": 320080 }, { "epoch": 1.61, "learning_rate": 5.7765714314543584e-05, "loss": 0.0064, "step": 320090 }, { "epoch": 1.61, "learning_rate": 5.775814662152957e-05, "loss": 0.0095, "step": 320100 }, { "epoch": 1.61, "learning_rate": 5.775057892851557e-05, "loss": 0.0074, "step": 320110 }, { "epoch": 1.62, "learning_rate": 5.7743011235501556e-05, "loss": 0.0069, "step": 320120 }, { "epoch": 1.62, "learning_rate": 5.7735443542487544e-05, "loss": 0.0064, "step": 320130 }, { "epoch": 1.62, "learning_rate": 5.772787584947353e-05, "loss": 0.0096, "step": 320140 }, { "epoch": 1.62, "learning_rate": 5.772030815645953e-05, "loss": 0.0079, "step": 320150 }, { "epoch": 1.62, "learning_rate": 5.7712740463445515e-05, "loss": 0.0063, "step": 320160 }, { "epoch": 1.62, "learning_rate": 5.7705172770431503e-05, "loss": 0.0073, "step": 320170 }, { "epoch": 1.62, "learning_rate": 5.769760507741749e-05, "loss": 0.0079, "step": 320180 }, { "epoch": 1.62, "learning_rate": 5.769003738440349e-05, "loss": 0.0073, "step": 320190 }, { "epoch": 1.62, "learning_rate": 5.7682469691389475e-05, "loss": 0.0075, "step": 320200 }, { "epoch": 1.62, "learning_rate": 5.767490199837546e-05, "loss": 0.0073, "step": 320210 }, { "epoch": 1.62, "learning_rate": 5.766733430536145e-05, "loss": 0.008, "step": 320220 }, { "epoch": 1.62, "learning_rate": 5.7659766612347446e-05, "loss": 0.0054, "step": 320230 }, { "epoch": 1.62, "learning_rate": 5.7652198919333435e-05, "loss": 0.0061, "step": 320240 }, { "epoch": 1.62, "learning_rate": 5.764463122631942e-05, "loss": 0.0054, "step": 320250 }, { "epoch": 1.62, "learning_rate": 5.763706353330541e-05, "loss": 0.0067, "step": 320260 }, { "epoch": 1.62, "learning_rate": 5.7629495840291406e-05, "loss": 0.0111, "step": 320270 }, { "epoch": 1.62, "learning_rate": 5.7621928147277394e-05, "loss": 0.0069, "step": 320280 }, { "epoch": 1.62, "learning_rate": 5.761436045426338e-05, "loss": 0.0095, "step": 320290 }, { "epoch": 1.62, "learning_rate": 5.760679276124937e-05, "loss": 0.0072, "step": 320300 }, { "epoch": 1.62, "learning_rate": 5.7599225068235366e-05, "loss": 0.0067, "step": 320310 }, { "epoch": 1.62, "learning_rate": 5.7591657375221354e-05, "loss": 0.0068, "step": 320320 }, { "epoch": 1.62, "learning_rate": 5.758408968220734e-05, "loss": 0.0074, "step": 320330 }, { "epoch": 1.62, "learning_rate": 5.757652198919333e-05, "loss": 0.0091, "step": 320340 }, { "epoch": 1.62, "learning_rate": 5.756895429617931e-05, "loss": 0.0069, "step": 320350 }, { "epoch": 1.62, "learning_rate": 5.756138660316531e-05, "loss": 0.0071, "step": 320360 }, { "epoch": 1.62, "learning_rate": 5.7553818910151295e-05, "loss": 0.0051, "step": 320370 }, { "epoch": 1.62, "learning_rate": 5.754625121713728e-05, "loss": 0.0111, "step": 320380 }, { "epoch": 1.62, "learning_rate": 5.753868352412327e-05, "loss": 0.0073, "step": 320390 }, { "epoch": 1.62, "learning_rate": 5.7531115831109266e-05, "loss": 0.0086, "step": 320400 }, { "epoch": 1.62, "learning_rate": 5.7523548138095255e-05, "loss": 0.0071, "step": 320410 }, { "epoch": 1.62, "learning_rate": 5.751598044508124e-05, "loss": 0.0068, "step": 320420 }, { "epoch": 1.62, "learning_rate": 5.750841275206723e-05, "loss": 0.0078, "step": 320430 }, { "epoch": 1.62, "learning_rate": 5.7500845059053226e-05, "loss": 0.0063, "step": 320440 }, { "epoch": 1.62, "learning_rate": 5.7493277366039214e-05, "loss": 0.0086, "step": 320450 }, { "epoch": 1.62, "learning_rate": 5.74857096730252e-05, "loss": 0.0121, "step": 320460 }, { "epoch": 1.62, "learning_rate": 5.74781419800112e-05, "loss": 0.006, "step": 320470 }, { "epoch": 1.62, "learning_rate": 5.7470574286997186e-05, "loss": 0.0058, "step": 320480 }, { "epoch": 1.62, "learning_rate": 5.7463006593983174e-05, "loss": 0.0068, "step": 320490 }, { "epoch": 1.62, "learning_rate": 5.745543890096916e-05, "loss": 0.0085, "step": 320500 }, { "epoch": 1.62, "learning_rate": 5.744787120795516e-05, "loss": 0.0091, "step": 320510 }, { "epoch": 1.62, "learning_rate": 5.7440303514941145e-05, "loss": 0.0061, "step": 320520 }, { "epoch": 1.62, "learning_rate": 5.7432735821927134e-05, "loss": 0.0053, "step": 320530 }, { "epoch": 1.62, "learning_rate": 5.742516812891312e-05, "loss": 0.0058, "step": 320540 }, { "epoch": 1.62, "learning_rate": 5.741760043589912e-05, "loss": 0.0077, "step": 320550 }, { "epoch": 1.62, "learning_rate": 5.7410032742885105e-05, "loss": 0.0059, "step": 320560 }, { "epoch": 1.62, "learning_rate": 5.740246504987109e-05, "loss": 0.0064, "step": 320570 }, { "epoch": 1.62, "learning_rate": 5.739489735685708e-05, "loss": 0.0097, "step": 320580 }, { "epoch": 1.62, "learning_rate": 5.7387329663843076e-05, "loss": 0.0064, "step": 320590 }, { "epoch": 1.62, "learning_rate": 5.7379761970829065e-05, "loss": 0.0062, "step": 320600 }, { "epoch": 1.62, "learning_rate": 5.737219427781505e-05, "loss": 0.0073, "step": 320610 }, { "epoch": 1.62, "learning_rate": 5.736462658480104e-05, "loss": 0.0063, "step": 320620 }, { "epoch": 1.62, "learning_rate": 5.7357058891787036e-05, "loss": 0.0048, "step": 320630 }, { "epoch": 1.62, "learning_rate": 5.7349491198773024e-05, "loss": 0.0083, "step": 320640 }, { "epoch": 1.62, "learning_rate": 5.734192350575901e-05, "loss": 0.0062, "step": 320650 }, { "epoch": 1.62, "learning_rate": 5.7334355812745e-05, "loss": 0.0056, "step": 320660 }, { "epoch": 1.62, "learning_rate": 5.732678811973098e-05, "loss": 0.0065, "step": 320670 }, { "epoch": 1.62, "learning_rate": 5.731922042671698e-05, "loss": 0.0081, "step": 320680 }, { "epoch": 1.62, "learning_rate": 5.7311652733702965e-05, "loss": 0.0077, "step": 320690 }, { "epoch": 1.62, "learning_rate": 5.7304085040688954e-05, "loss": 0.0084, "step": 320700 }, { "epoch": 1.62, "learning_rate": 5.729651734767494e-05, "loss": 0.0056, "step": 320710 }, { "epoch": 1.62, "learning_rate": 5.728894965466094e-05, "loss": 0.0057, "step": 320720 }, { "epoch": 1.62, "learning_rate": 5.7281381961646925e-05, "loss": 0.0055, "step": 320730 }, { "epoch": 1.62, "learning_rate": 5.727381426863291e-05, "loss": 0.0072, "step": 320740 }, { "epoch": 1.62, "learning_rate": 5.72662465756189e-05, "loss": 0.0093, "step": 320750 }, { "epoch": 1.62, "learning_rate": 5.7258678882604896e-05, "loss": 0.0072, "step": 320760 }, { "epoch": 1.62, "learning_rate": 5.7251111189590885e-05, "loss": 0.0069, "step": 320770 }, { "epoch": 1.62, "learning_rate": 5.724354349657687e-05, "loss": 0.0053, "step": 320780 }, { "epoch": 1.62, "learning_rate": 5.723597580356286e-05, "loss": 0.005, "step": 320790 }, { "epoch": 1.62, "learning_rate": 5.7228408110548856e-05, "loss": 0.0065, "step": 320800 }, { "epoch": 1.62, "learning_rate": 5.7220840417534844e-05, "loss": 0.0106, "step": 320810 }, { "epoch": 1.62, "learning_rate": 5.721327272452083e-05, "loss": 0.0052, "step": 320820 }, { "epoch": 1.62, "learning_rate": 5.720570503150682e-05, "loss": 0.0081, "step": 320830 }, { "epoch": 1.62, "learning_rate": 5.7198137338492816e-05, "loss": 0.0075, "step": 320840 }, { "epoch": 1.62, "learning_rate": 5.7190569645478804e-05, "loss": 0.0066, "step": 320850 }, { "epoch": 1.62, "learning_rate": 5.718300195246479e-05, "loss": 0.0069, "step": 320860 }, { "epoch": 1.62, "learning_rate": 5.717543425945078e-05, "loss": 0.0069, "step": 320870 }, { "epoch": 1.62, "learning_rate": 5.7167866566436775e-05, "loss": 0.0077, "step": 320880 }, { "epoch": 1.62, "learning_rate": 5.7160298873422764e-05, "loss": 0.0083, "step": 320890 }, { "epoch": 1.62, "learning_rate": 5.715273118040875e-05, "loss": 0.0066, "step": 320900 }, { "epoch": 1.62, "learning_rate": 5.714516348739474e-05, "loss": 0.0062, "step": 320910 }, { "epoch": 1.62, "learning_rate": 5.7137595794380735e-05, "loss": 0.0055, "step": 320920 }, { "epoch": 1.62, "learning_rate": 5.713002810136672e-05, "loss": 0.0054, "step": 320930 }, { "epoch": 1.62, "learning_rate": 5.712246040835271e-05, "loss": 0.0047, "step": 320940 }, { "epoch": 1.62, "learning_rate": 5.7114892715338707e-05, "loss": 0.0066, "step": 320950 }, { "epoch": 1.62, "learning_rate": 5.7107325022324695e-05, "loss": 0.0055, "step": 320960 }, { "epoch": 1.62, "learning_rate": 5.709975732931068e-05, "loss": 0.0076, "step": 320970 }, { "epoch": 1.62, "learning_rate": 5.7092189636296664e-05, "loss": 0.006, "step": 320980 }, { "epoch": 1.62, "learning_rate": 5.708462194328265e-05, "loss": 0.0064, "step": 320990 }, { "epoch": 1.62, "learning_rate": 5.707705425026865e-05, "loss": 0.0058, "step": 321000 }, { "epoch": 1.62, "eval_cer": 0.9144275584736445, "eval_loss": 0.005066942423582077, "eval_runtime": 116.3307, "eval_samples_per_second": 17.192, "eval_steps_per_second": 4.298, "step": 321000 }, { "epoch": 1.62, "learning_rate": 5.7069486557254636e-05, "loss": 0.0067, "step": 321010 }, { "epoch": 1.62, "learning_rate": 5.7061918864240624e-05, "loss": 0.0066, "step": 321020 }, { "epoch": 1.62, "learning_rate": 5.705435117122661e-05, "loss": 0.0074, "step": 321030 }, { "epoch": 1.62, "learning_rate": 5.704678347821261e-05, "loss": 0.0073, "step": 321040 }, { "epoch": 1.62, "learning_rate": 5.7039215785198595e-05, "loss": 0.006, "step": 321050 }, { "epoch": 1.62, "learning_rate": 5.7031648092184584e-05, "loss": 0.0063, "step": 321060 }, { "epoch": 1.62, "learning_rate": 5.702408039917057e-05, "loss": 0.0073, "step": 321070 }, { "epoch": 1.62, "learning_rate": 5.701651270615657e-05, "loss": 0.0084, "step": 321080 }, { "epoch": 1.62, "learning_rate": 5.7008945013142555e-05, "loss": 0.0063, "step": 321090 }, { "epoch": 1.62, "learning_rate": 5.700137732012854e-05, "loss": 0.0073, "step": 321100 }, { "epoch": 1.62, "learning_rate": 5.699380962711453e-05, "loss": 0.0075, "step": 321110 }, { "epoch": 1.62, "learning_rate": 5.6986241934100527e-05, "loss": 0.0048, "step": 321120 }, { "epoch": 1.62, "learning_rate": 5.6978674241086515e-05, "loss": 0.0081, "step": 321130 }, { "epoch": 1.62, "learning_rate": 5.69711065480725e-05, "loss": 0.0051, "step": 321140 }, { "epoch": 1.62, "learning_rate": 5.696353885505849e-05, "loss": 0.0049, "step": 321150 }, { "epoch": 1.62, "learning_rate": 5.6955971162044486e-05, "loss": 0.0075, "step": 321160 }, { "epoch": 1.62, "learning_rate": 5.6948403469030474e-05, "loss": 0.0055, "step": 321170 }, { "epoch": 1.62, "learning_rate": 5.694083577601646e-05, "loss": 0.006, "step": 321180 }, { "epoch": 1.62, "learning_rate": 5.693326808300245e-05, "loss": 0.0059, "step": 321190 }, { "epoch": 1.62, "learning_rate": 5.6925700389988446e-05, "loss": 0.0061, "step": 321200 }, { "epoch": 1.62, "learning_rate": 5.6918132696974434e-05, "loss": 0.0073, "step": 321210 }, { "epoch": 1.62, "learning_rate": 5.691056500396042e-05, "loss": 0.0091, "step": 321220 }, { "epoch": 1.62, "learning_rate": 5.690299731094641e-05, "loss": 0.0055, "step": 321230 }, { "epoch": 1.62, "learning_rate": 5.6895429617932406e-05, "loss": 0.0092, "step": 321240 }, { "epoch": 1.62, "learning_rate": 5.6887861924918394e-05, "loss": 0.0049, "step": 321250 }, { "epoch": 1.62, "learning_rate": 5.688029423190438e-05, "loss": 0.0062, "step": 321260 }, { "epoch": 1.62, "learning_rate": 5.687272653889037e-05, "loss": 0.008, "step": 321270 }, { "epoch": 1.62, "learning_rate": 5.6865158845876365e-05, "loss": 0.0071, "step": 321280 }, { "epoch": 1.62, "learning_rate": 5.685759115286235e-05, "loss": 0.0074, "step": 321290 }, { "epoch": 1.62, "learning_rate": 5.6850023459848335e-05, "loss": 0.0072, "step": 321300 }, { "epoch": 1.62, "learning_rate": 5.684245576683432e-05, "loss": 0.0055, "step": 321310 }, { "epoch": 1.62, "learning_rate": 5.683488807382031e-05, "loss": 0.0065, "step": 321320 }, { "epoch": 1.62, "learning_rate": 5.6827320380806306e-05, "loss": 0.0072, "step": 321330 }, { "epoch": 1.62, "learning_rate": 5.6819752687792294e-05, "loss": 0.0072, "step": 321340 }, { "epoch": 1.62, "learning_rate": 5.681218499477828e-05, "loss": 0.007, "step": 321350 }, { "epoch": 1.62, "learning_rate": 5.680461730176427e-05, "loss": 0.005, "step": 321360 }, { "epoch": 1.62, "learning_rate": 5.6797049608750266e-05, "loss": 0.0076, "step": 321370 }, { "epoch": 1.62, "learning_rate": 5.6789481915736254e-05, "loss": 0.0077, "step": 321380 }, { "epoch": 1.62, "learning_rate": 5.678191422272224e-05, "loss": 0.0076, "step": 321390 }, { "epoch": 1.62, "learning_rate": 5.677434652970823e-05, "loss": 0.0068, "step": 321400 }, { "epoch": 1.62, "learning_rate": 5.6766778836694226e-05, "loss": 0.0083, "step": 321410 }, { "epoch": 1.62, "learning_rate": 5.6759211143680214e-05, "loss": 0.0073, "step": 321420 }, { "epoch": 1.62, "learning_rate": 5.67516434506662e-05, "loss": 0.007, "step": 321430 }, { "epoch": 1.62, "learning_rate": 5.67440757576522e-05, "loss": 0.0064, "step": 321440 }, { "epoch": 1.62, "learning_rate": 5.6736508064638185e-05, "loss": 0.0048, "step": 321450 }, { "epoch": 1.62, "learning_rate": 5.6728940371624173e-05, "loss": 0.0069, "step": 321460 }, { "epoch": 1.62, "learning_rate": 5.672137267861016e-05, "loss": 0.0057, "step": 321470 }, { "epoch": 1.62, "learning_rate": 5.671380498559616e-05, "loss": 0.0065, "step": 321480 }, { "epoch": 1.62, "learning_rate": 5.6706237292582145e-05, "loss": 0.0063, "step": 321490 }, { "epoch": 1.62, "learning_rate": 5.669866959956813e-05, "loss": 0.007, "step": 321500 }, { "epoch": 1.62, "learning_rate": 5.669110190655412e-05, "loss": 0.0067, "step": 321510 }, { "epoch": 1.62, "learning_rate": 5.6683534213540116e-05, "loss": 0.0053, "step": 321520 }, { "epoch": 1.62, "learning_rate": 5.6675966520526105e-05, "loss": 0.0071, "step": 321530 }, { "epoch": 1.62, "learning_rate": 5.666839882751209e-05, "loss": 0.0053, "step": 321540 }, { "epoch": 1.62, "learning_rate": 5.666083113449808e-05, "loss": 0.0065, "step": 321550 }, { "epoch": 1.62, "learning_rate": 5.6653263441484076e-05, "loss": 0.0089, "step": 321560 }, { "epoch": 1.62, "learning_rate": 5.6645695748470064e-05, "loss": 0.0059, "step": 321570 }, { "epoch": 1.62, "learning_rate": 5.663812805545605e-05, "loss": 0.0062, "step": 321580 }, { "epoch": 1.62, "learning_rate": 5.663056036244204e-05, "loss": 0.008, "step": 321590 }, { "epoch": 1.62, "learning_rate": 5.6622992669428036e-05, "loss": 0.0064, "step": 321600 }, { "epoch": 1.62, "learning_rate": 5.661542497641402e-05, "loss": 0.0064, "step": 321610 }, { "epoch": 1.62, "learning_rate": 5.6607857283400005e-05, "loss": 0.0061, "step": 321620 }, { "epoch": 1.62, "learning_rate": 5.6600289590385993e-05, "loss": 0.0108, "step": 321630 }, { "epoch": 1.62, "learning_rate": 5.659272189737198e-05, "loss": 0.0069, "step": 321640 }, { "epoch": 1.62, "learning_rate": 5.658515420435798e-05, "loss": 0.0081, "step": 321650 }, { "epoch": 1.62, "learning_rate": 5.6577586511343965e-05, "loss": 0.0051, "step": 321660 }, { "epoch": 1.62, "learning_rate": 5.657001881832995e-05, "loss": 0.0055, "step": 321670 }, { "epoch": 1.62, "learning_rate": 5.656245112531594e-05, "loss": 0.0066, "step": 321680 }, { "epoch": 1.62, "learning_rate": 5.6554883432301936e-05, "loss": 0.007, "step": 321690 }, { "epoch": 1.62, "learning_rate": 5.6547315739287925e-05, "loss": 0.0076, "step": 321700 }, { "epoch": 1.62, "learning_rate": 5.653974804627391e-05, "loss": 0.0067, "step": 321710 }, { "epoch": 1.62, "learning_rate": 5.65321803532599e-05, "loss": 0.0083, "step": 321720 }, { "epoch": 1.62, "learning_rate": 5.6524612660245896e-05, "loss": 0.007, "step": 321730 }, { "epoch": 1.62, "learning_rate": 5.6517044967231884e-05, "loss": 0.0067, "step": 321740 }, { "epoch": 1.62, "learning_rate": 5.650947727421787e-05, "loss": 0.0053, "step": 321750 }, { "epoch": 1.62, "learning_rate": 5.650190958120386e-05, "loss": 0.0057, "step": 321760 }, { "epoch": 1.62, "learning_rate": 5.6494341888189856e-05, "loss": 0.0054, "step": 321770 }, { "epoch": 1.62, "learning_rate": 5.6486774195175844e-05, "loss": 0.0094, "step": 321780 }, { "epoch": 1.62, "learning_rate": 5.647920650216183e-05, "loss": 0.0074, "step": 321790 }, { "epoch": 1.62, "learning_rate": 5.647163880914782e-05, "loss": 0.0083, "step": 321800 }, { "epoch": 1.62, "learning_rate": 5.6464071116133815e-05, "loss": 0.0068, "step": 321810 }, { "epoch": 1.62, "learning_rate": 5.6456503423119804e-05, "loss": 0.0084, "step": 321820 }, { "epoch": 1.62, "learning_rate": 5.644893573010579e-05, "loss": 0.0065, "step": 321830 }, { "epoch": 1.62, "learning_rate": 5.644136803709178e-05, "loss": 0.0083, "step": 321840 }, { "epoch": 1.62, "learning_rate": 5.6433800344077775e-05, "loss": 0.0057, "step": 321850 }, { "epoch": 1.62, "learning_rate": 5.642623265106376e-05, "loss": 0.0073, "step": 321860 }, { "epoch": 1.62, "learning_rate": 5.641866495804975e-05, "loss": 0.0073, "step": 321870 }, { "epoch": 1.62, "learning_rate": 5.641109726503574e-05, "loss": 0.0058, "step": 321880 }, { "epoch": 1.62, "learning_rate": 5.6403529572021735e-05, "loss": 0.0077, "step": 321890 }, { "epoch": 1.62, "learning_rate": 5.639596187900772e-05, "loss": 0.0055, "step": 321900 }, { "epoch": 1.62, "learning_rate": 5.638839418599371e-05, "loss": 0.0082, "step": 321910 }, { "epoch": 1.62, "learning_rate": 5.6380826492979706e-05, "loss": 0.0059, "step": 321920 }, { "epoch": 1.62, "learning_rate": 5.637325879996569e-05, "loss": 0.008, "step": 321930 }, { "epoch": 1.62, "learning_rate": 5.6365691106951676e-05, "loss": 0.006, "step": 321940 }, { "epoch": 1.62, "learning_rate": 5.6358123413937664e-05, "loss": 0.006, "step": 321950 }, { "epoch": 1.62, "learning_rate": 5.635055572092365e-05, "loss": 0.0076, "step": 321960 }, { "epoch": 1.62, "learning_rate": 5.634298802790965e-05, "loss": 0.007, "step": 321970 }, { "epoch": 1.62, "learning_rate": 5.6335420334895635e-05, "loss": 0.0064, "step": 321980 }, { "epoch": 1.62, "learning_rate": 5.6327852641881624e-05, "loss": 0.0076, "step": 321990 }, { "epoch": 1.62, "learning_rate": 5.632028494886761e-05, "loss": 0.0095, "step": 322000 }, { "epoch": 1.62, "eval_cer": 0.9144197953046413, "eval_loss": 0.005024084821343422, "eval_runtime": 116.2702, "eval_samples_per_second": 17.201, "eval_steps_per_second": 4.3, "step": 322000 }, { "epoch": 1.62, "learning_rate": 5.631271725585361e-05, "loss": 0.0047, "step": 322010 }, { "epoch": 1.62, "learning_rate": 5.6305149562839595e-05, "loss": 0.0077, "step": 322020 }, { "epoch": 1.62, "learning_rate": 5.629758186982558e-05, "loss": 0.0073, "step": 322030 }, { "epoch": 1.62, "learning_rate": 5.629001417681157e-05, "loss": 0.0077, "step": 322040 }, { "epoch": 1.62, "learning_rate": 5.6282446483797566e-05, "loss": 0.0058, "step": 322050 }, { "epoch": 1.62, "learning_rate": 5.6274878790783555e-05, "loss": 0.0077, "step": 322060 }, { "epoch": 1.62, "learning_rate": 5.626731109776954e-05, "loss": 0.0051, "step": 322070 }, { "epoch": 1.62, "learning_rate": 5.625974340475553e-05, "loss": 0.007, "step": 322080 }, { "epoch": 1.62, "learning_rate": 5.6252175711741526e-05, "loss": 0.0064, "step": 322090 }, { "epoch": 1.63, "learning_rate": 5.6244608018727514e-05, "loss": 0.0057, "step": 322100 }, { "epoch": 1.63, "learning_rate": 5.62370403257135e-05, "loss": 0.0074, "step": 322110 }, { "epoch": 1.63, "learning_rate": 5.622947263269949e-05, "loss": 0.0089, "step": 322120 }, { "epoch": 1.63, "learning_rate": 5.6221904939685486e-05, "loss": 0.0082, "step": 322130 }, { "epoch": 1.63, "learning_rate": 5.6214337246671474e-05, "loss": 0.0073, "step": 322140 }, { "epoch": 1.63, "learning_rate": 5.620676955365746e-05, "loss": 0.008, "step": 322150 }, { "epoch": 1.63, "learning_rate": 5.619920186064345e-05, "loss": 0.0058, "step": 322160 }, { "epoch": 1.63, "learning_rate": 5.6191634167629445e-05, "loss": 0.0068, "step": 322170 }, { "epoch": 1.63, "learning_rate": 5.6184066474615434e-05, "loss": 0.0082, "step": 322180 }, { "epoch": 1.63, "learning_rate": 5.617649878160142e-05, "loss": 0.0055, "step": 322190 }, { "epoch": 1.63, "learning_rate": 5.616893108858741e-05, "loss": 0.0061, "step": 322200 }, { "epoch": 1.63, "learning_rate": 5.6161363395573405e-05, "loss": 0.0058, "step": 322210 }, { "epoch": 1.63, "learning_rate": 5.615379570255939e-05, "loss": 0.0062, "step": 322220 }, { "epoch": 1.63, "learning_rate": 5.614622800954538e-05, "loss": 0.0057, "step": 322230 }, { "epoch": 1.63, "learning_rate": 5.613866031653136e-05, "loss": 0.007, "step": 322240 }, { "epoch": 1.63, "learning_rate": 5.613109262351735e-05, "loss": 0.0066, "step": 322250 }, { "epoch": 1.63, "learning_rate": 5.6123524930503346e-05, "loss": 0.0056, "step": 322260 }, { "epoch": 1.63, "learning_rate": 5.6115957237489334e-05, "loss": 0.0062, "step": 322270 }, { "epoch": 1.63, "learning_rate": 5.610838954447532e-05, "loss": 0.0075, "step": 322280 }, { "epoch": 1.63, "learning_rate": 5.610082185146131e-05, "loss": 0.0052, "step": 322290 }, { "epoch": 1.63, "learning_rate": 5.6093254158447306e-05, "loss": 0.005, "step": 322300 }, { "epoch": 1.63, "learning_rate": 5.6085686465433294e-05, "loss": 0.0066, "step": 322310 }, { "epoch": 1.63, "learning_rate": 5.607811877241928e-05, "loss": 0.0055, "step": 322320 }, { "epoch": 1.63, "learning_rate": 5.607055107940527e-05, "loss": 0.0098, "step": 322330 }, { "epoch": 1.63, "learning_rate": 5.6062983386391265e-05, "loss": 0.0065, "step": 322340 }, { "epoch": 1.63, "learning_rate": 5.6055415693377254e-05, "loss": 0.006, "step": 322350 }, { "epoch": 1.63, "learning_rate": 5.604784800036324e-05, "loss": 0.0069, "step": 322360 }, { "epoch": 1.63, "learning_rate": 5.604028030734923e-05, "loss": 0.0062, "step": 322370 }, { "epoch": 1.63, "learning_rate": 5.6032712614335225e-05, "loss": 0.0052, "step": 322380 }, { "epoch": 1.63, "learning_rate": 5.602514492132121e-05, "loss": 0.0063, "step": 322390 }, { "epoch": 1.63, "learning_rate": 5.60175772283072e-05, "loss": 0.0086, "step": 322400 }, { "epoch": 1.63, "learning_rate": 5.6010009535293197e-05, "loss": 0.0087, "step": 322410 }, { "epoch": 1.63, "learning_rate": 5.6002441842279185e-05, "loss": 0.0064, "step": 322420 }, { "epoch": 1.63, "learning_rate": 5.599487414926517e-05, "loss": 0.0066, "step": 322430 }, { "epoch": 1.63, "learning_rate": 5.598730645625116e-05, "loss": 0.0081, "step": 322440 }, { "epoch": 1.63, "learning_rate": 5.5979738763237156e-05, "loss": 0.0065, "step": 322450 }, { "epoch": 1.63, "learning_rate": 5.5972171070223144e-05, "loss": 0.0062, "step": 322460 }, { "epoch": 1.63, "learning_rate": 5.596460337720913e-05, "loss": 0.0076, "step": 322470 }, { "epoch": 1.63, "learning_rate": 5.595703568419512e-05, "loss": 0.0081, "step": 322480 }, { "epoch": 1.63, "learning_rate": 5.5949467991181116e-05, "loss": 0.0089, "step": 322490 }, { "epoch": 1.63, "learning_rate": 5.5941900298167104e-05, "loss": 0.0059, "step": 322500 }, { "epoch": 1.63, "learning_rate": 5.593433260515309e-05, "loss": 0.0063, "step": 322510 }, { "epoch": 1.63, "learning_rate": 5.592676491213908e-05, "loss": 0.0063, "step": 322520 }, { "epoch": 1.63, "learning_rate": 5.5919197219125075e-05, "loss": 0.0072, "step": 322530 }, { "epoch": 1.63, "learning_rate": 5.5911629526111064e-05, "loss": 0.007, "step": 322540 }, { "epoch": 1.63, "learning_rate": 5.5904061833097045e-05, "loss": 0.0074, "step": 322550 }, { "epoch": 1.63, "learning_rate": 5.589649414008303e-05, "loss": 0.0066, "step": 322560 }, { "epoch": 1.63, "learning_rate": 5.588892644706902e-05, "loss": 0.0079, "step": 322570 }, { "epoch": 1.63, "learning_rate": 5.5881358754055017e-05, "loss": 0.0072, "step": 322580 }, { "epoch": 1.63, "learning_rate": 5.5873791061041005e-05, "loss": 0.0077, "step": 322590 }, { "epoch": 1.63, "learning_rate": 5.586622336802699e-05, "loss": 0.0061, "step": 322600 }, { "epoch": 1.63, "learning_rate": 5.585865567501298e-05, "loss": 0.0073, "step": 322610 }, { "epoch": 1.63, "learning_rate": 5.5851087981998976e-05, "loss": 0.0057, "step": 322620 }, { "epoch": 1.63, "learning_rate": 5.5843520288984964e-05, "loss": 0.0065, "step": 322630 }, { "epoch": 1.63, "learning_rate": 5.583595259597095e-05, "loss": 0.0071, "step": 322640 }, { "epoch": 1.63, "learning_rate": 5.582838490295694e-05, "loss": 0.0054, "step": 322650 }, { "epoch": 1.63, "learning_rate": 5.5820817209942936e-05, "loss": 0.0065, "step": 322660 }, { "epoch": 1.63, "learning_rate": 5.5813249516928924e-05, "loss": 0.0087, "step": 322670 }, { "epoch": 1.63, "learning_rate": 5.580568182391491e-05, "loss": 0.0058, "step": 322680 }, { "epoch": 1.63, "learning_rate": 5.57981141309009e-05, "loss": 0.0066, "step": 322690 }, { "epoch": 1.63, "learning_rate": 5.5790546437886896e-05, "loss": 0.0063, "step": 322700 }, { "epoch": 1.63, "learning_rate": 5.5782978744872884e-05, "loss": 0.0073, "step": 322710 }, { "epoch": 1.63, "learning_rate": 5.577541105185887e-05, "loss": 0.0077, "step": 322720 }, { "epoch": 1.63, "learning_rate": 5.576784335884486e-05, "loss": 0.0062, "step": 322730 }, { "epoch": 1.63, "learning_rate": 5.5760275665830855e-05, "loss": 0.006, "step": 322740 }, { "epoch": 1.63, "learning_rate": 5.5752707972816843e-05, "loss": 0.0042, "step": 322750 }, { "epoch": 1.63, "learning_rate": 5.574514027980283e-05, "loss": 0.0058, "step": 322760 }, { "epoch": 1.63, "learning_rate": 5.573757258678882e-05, "loss": 0.0053, "step": 322770 }, { "epoch": 1.63, "learning_rate": 5.5730004893774815e-05, "loss": 0.0052, "step": 322780 }, { "epoch": 1.63, "learning_rate": 5.57224372007608e-05, "loss": 0.0082, "step": 322790 }, { "epoch": 1.63, "learning_rate": 5.571486950774679e-05, "loss": 0.0067, "step": 322800 }, { "epoch": 1.63, "learning_rate": 5.570730181473278e-05, "loss": 0.0055, "step": 322810 }, { "epoch": 1.63, "learning_rate": 5.5699734121718774e-05, "loss": 0.0075, "step": 322820 }, { "epoch": 1.63, "learning_rate": 5.569216642870476e-05, "loss": 0.0058, "step": 322830 }, { "epoch": 1.63, "learning_rate": 5.568459873569075e-05, "loss": 0.006, "step": 322840 }, { "epoch": 1.63, "learning_rate": 5.567703104267674e-05, "loss": 0.0076, "step": 322850 }, { "epoch": 1.63, "learning_rate": 5.5669463349662734e-05, "loss": 0.0065, "step": 322860 }, { "epoch": 1.63, "learning_rate": 5.5661895656648716e-05, "loss": 0.0074, "step": 322870 }, { "epoch": 1.63, "learning_rate": 5.5654327963634704e-05, "loss": 0.005, "step": 322880 }, { "epoch": 1.63, "learning_rate": 5.564676027062069e-05, "loss": 0.0075, "step": 322890 }, { "epoch": 1.63, "learning_rate": 5.563919257760669e-05, "loss": 0.0076, "step": 322900 }, { "epoch": 1.63, "learning_rate": 5.5631624884592675e-05, "loss": 0.0087, "step": 322910 }, { "epoch": 1.63, "learning_rate": 5.5624057191578663e-05, "loss": 0.0095, "step": 322920 }, { "epoch": 1.63, "learning_rate": 5.561648949856465e-05, "loss": 0.0069, "step": 322930 }, { "epoch": 1.63, "learning_rate": 5.560892180555065e-05, "loss": 0.0066, "step": 322940 }, { "epoch": 1.63, "learning_rate": 5.5601354112536635e-05, "loss": 0.0063, "step": 322950 }, { "epoch": 1.63, "learning_rate": 5.559378641952262e-05, "loss": 0.0069, "step": 322960 }, { "epoch": 1.63, "learning_rate": 5.558621872650861e-05, "loss": 0.0068, "step": 322970 }, { "epoch": 1.63, "learning_rate": 5.5578651033494606e-05, "loss": 0.0054, "step": 322980 }, { "epoch": 1.63, "learning_rate": 5.5571083340480595e-05, "loss": 0.0081, "step": 322990 }, { "epoch": 1.63, "learning_rate": 5.556351564746658e-05, "loss": 0.0101, "step": 323000 }, { "epoch": 1.63, "eval_cer": 0.9144265880775191, "eval_loss": 0.004934444557875395, "eval_runtime": 116.3298, "eval_samples_per_second": 17.192, "eval_steps_per_second": 4.298, "step": 323000 }, { "epoch": 1.63, "learning_rate": 5.555594795445257e-05, "loss": 0.0076, "step": 323010 }, { "epoch": 1.63, "learning_rate": 5.5548380261438566e-05, "loss": 0.0071, "step": 323020 }, { "epoch": 1.63, "learning_rate": 5.5540812568424554e-05, "loss": 0.007, "step": 323030 }, { "epoch": 1.63, "learning_rate": 5.553324487541054e-05, "loss": 0.0069, "step": 323040 }, { "epoch": 1.63, "learning_rate": 5.552567718239653e-05, "loss": 0.0064, "step": 323050 }, { "epoch": 1.63, "learning_rate": 5.5518109489382526e-05, "loss": 0.0081, "step": 323060 }, { "epoch": 1.63, "learning_rate": 5.5510541796368514e-05, "loss": 0.0067, "step": 323070 }, { "epoch": 1.63, "learning_rate": 5.55029741033545e-05, "loss": 0.0052, "step": 323080 }, { "epoch": 1.63, "learning_rate": 5.549540641034049e-05, "loss": 0.0076, "step": 323090 }, { "epoch": 1.63, "learning_rate": 5.5487838717326485e-05, "loss": 0.0065, "step": 323100 }, { "epoch": 1.63, "learning_rate": 5.5480271024312473e-05, "loss": 0.0061, "step": 323110 }, { "epoch": 1.63, "learning_rate": 5.547270333129846e-05, "loss": 0.0058, "step": 323120 }, { "epoch": 1.63, "learning_rate": 5.546513563828445e-05, "loss": 0.0091, "step": 323130 }, { "epoch": 1.63, "learning_rate": 5.5457567945270445e-05, "loss": 0.0063, "step": 323140 }, { "epoch": 1.63, "learning_rate": 5.545000025225643e-05, "loss": 0.0047, "step": 323150 }, { "epoch": 1.63, "learning_rate": 5.544243255924242e-05, "loss": 0.0058, "step": 323160 }, { "epoch": 1.63, "learning_rate": 5.543486486622841e-05, "loss": 0.0081, "step": 323170 }, { "epoch": 1.63, "learning_rate": 5.542729717321439e-05, "loss": 0.0066, "step": 323180 }, { "epoch": 1.63, "learning_rate": 5.5419729480200386e-05, "loss": 0.0108, "step": 323190 }, { "epoch": 1.63, "learning_rate": 5.5412161787186374e-05, "loss": 0.0061, "step": 323200 }, { "epoch": 1.63, "learning_rate": 5.540459409417236e-05, "loss": 0.0065, "step": 323210 }, { "epoch": 1.63, "learning_rate": 5.539702640115835e-05, "loss": 0.0055, "step": 323220 }, { "epoch": 1.63, "learning_rate": 5.5389458708144346e-05, "loss": 0.0066, "step": 323230 }, { "epoch": 1.63, "learning_rate": 5.5381891015130334e-05, "loss": 0.0061, "step": 323240 }, { "epoch": 1.63, "learning_rate": 5.537432332211632e-05, "loss": 0.0073, "step": 323250 }, { "epoch": 1.63, "learning_rate": 5.536675562910231e-05, "loss": 0.0065, "step": 323260 }, { "epoch": 1.63, "learning_rate": 5.5359187936088305e-05, "loss": 0.0066, "step": 323270 }, { "epoch": 1.63, "learning_rate": 5.5351620243074294e-05, "loss": 0.0078, "step": 323280 }, { "epoch": 1.63, "learning_rate": 5.534405255006028e-05, "loss": 0.0071, "step": 323290 }, { "epoch": 1.63, "learning_rate": 5.533648485704627e-05, "loss": 0.0064, "step": 323300 }, { "epoch": 1.63, "learning_rate": 5.5328917164032265e-05, "loss": 0.0044, "step": 323310 }, { "epoch": 1.63, "learning_rate": 5.532134947101825e-05, "loss": 0.0085, "step": 323320 }, { "epoch": 1.63, "learning_rate": 5.531378177800424e-05, "loss": 0.0062, "step": 323330 }, { "epoch": 1.63, "learning_rate": 5.530621408499023e-05, "loss": 0.0063, "step": 323340 }, { "epoch": 1.63, "learning_rate": 5.5298646391976225e-05, "loss": 0.0052, "step": 323350 }, { "epoch": 1.63, "learning_rate": 5.529107869896221e-05, "loss": 0.0064, "step": 323360 }, { "epoch": 1.63, "learning_rate": 5.52835110059482e-05, "loss": 0.0067, "step": 323370 }, { "epoch": 1.63, "learning_rate": 5.5275943312934196e-05, "loss": 0.0062, "step": 323380 }, { "epoch": 1.63, "learning_rate": 5.5268375619920184e-05, "loss": 0.0066, "step": 323390 }, { "epoch": 1.63, "learning_rate": 5.526080792690617e-05, "loss": 0.0066, "step": 323400 }, { "epoch": 1.63, "learning_rate": 5.525324023389216e-05, "loss": 0.0072, "step": 323410 }, { "epoch": 1.63, "learning_rate": 5.5245672540878156e-05, "loss": 0.0057, "step": 323420 }, { "epoch": 1.63, "learning_rate": 5.5238104847864144e-05, "loss": 0.0056, "step": 323430 }, { "epoch": 1.63, "learning_rate": 5.523053715485013e-05, "loss": 0.0076, "step": 323440 }, { "epoch": 1.63, "learning_rate": 5.522296946183612e-05, "loss": 0.0077, "step": 323450 }, { "epoch": 1.63, "learning_rate": 5.5215401768822115e-05, "loss": 0.0054, "step": 323460 }, { "epoch": 1.63, "learning_rate": 5.5207834075808104e-05, "loss": 0.0079, "step": 323470 }, { "epoch": 1.63, "learning_rate": 5.520026638279409e-05, "loss": 0.0045, "step": 323480 }, { "epoch": 1.63, "learning_rate": 5.519269868978008e-05, "loss": 0.0053, "step": 323490 }, { "epoch": 1.63, "learning_rate": 5.518513099676606e-05, "loss": 0.0058, "step": 323500 }, { "epoch": 1.63, "learning_rate": 5.5177563303752056e-05, "loss": 0.0069, "step": 323510 }, { "epoch": 1.63, "learning_rate": 5.5169995610738045e-05, "loss": 0.0095, "step": 323520 }, { "epoch": 1.63, "learning_rate": 5.516242791772403e-05, "loss": 0.0064, "step": 323530 }, { "epoch": 1.63, "learning_rate": 5.515486022471002e-05, "loss": 0.0061, "step": 323540 }, { "epoch": 1.63, "learning_rate": 5.5147292531696016e-05, "loss": 0.0052, "step": 323550 }, { "epoch": 1.63, "learning_rate": 5.5139724838682004e-05, "loss": 0.0095, "step": 323560 }, { "epoch": 1.63, "learning_rate": 5.513215714566799e-05, "loss": 0.0071, "step": 323570 }, { "epoch": 1.63, "learning_rate": 5.512458945265398e-05, "loss": 0.0086, "step": 323580 }, { "epoch": 1.63, "learning_rate": 5.5117021759639976e-05, "loss": 0.007, "step": 323590 }, { "epoch": 1.63, "learning_rate": 5.5109454066625964e-05, "loss": 0.0049, "step": 323600 }, { "epoch": 1.63, "learning_rate": 5.510188637361195e-05, "loss": 0.0072, "step": 323610 }, { "epoch": 1.63, "learning_rate": 5.509431868059794e-05, "loss": 0.0065, "step": 323620 }, { "epoch": 1.63, "learning_rate": 5.5086750987583935e-05, "loss": 0.0077, "step": 323630 }, { "epoch": 1.63, "learning_rate": 5.5079183294569924e-05, "loss": 0.0056, "step": 323640 }, { "epoch": 1.63, "learning_rate": 5.507161560155591e-05, "loss": 0.0075, "step": 323650 }, { "epoch": 1.63, "learning_rate": 5.50640479085419e-05, "loss": 0.0072, "step": 323660 }, { "epoch": 1.63, "learning_rate": 5.5056480215527895e-05, "loss": 0.0085, "step": 323670 }, { "epoch": 1.63, "learning_rate": 5.504891252251388e-05, "loss": 0.0053, "step": 323680 }, { "epoch": 1.63, "learning_rate": 5.504134482949987e-05, "loss": 0.0074, "step": 323690 }, { "epoch": 1.63, "learning_rate": 5.503377713648586e-05, "loss": 0.0072, "step": 323700 }, { "epoch": 1.63, "learning_rate": 5.5026209443471855e-05, "loss": 0.0058, "step": 323710 }, { "epoch": 1.63, "learning_rate": 5.501864175045784e-05, "loss": 0.0072, "step": 323720 }, { "epoch": 1.63, "learning_rate": 5.501107405744383e-05, "loss": 0.0061, "step": 323730 }, { "epoch": 1.63, "learning_rate": 5.500350636442982e-05, "loss": 0.0036, "step": 323740 }, { "epoch": 1.63, "learning_rate": 5.4995938671415814e-05, "loss": 0.0065, "step": 323750 }, { "epoch": 1.63, "learning_rate": 5.49883709784018e-05, "loss": 0.0052, "step": 323760 }, { "epoch": 1.63, "learning_rate": 5.498080328538779e-05, "loss": 0.0075, "step": 323770 }, { "epoch": 1.63, "learning_rate": 5.497323559237378e-05, "loss": 0.0079, "step": 323780 }, { "epoch": 1.63, "learning_rate": 5.4965667899359774e-05, "loss": 0.0075, "step": 323790 }, { "epoch": 1.63, "learning_rate": 5.495810020634576e-05, "loss": 0.0076, "step": 323800 }, { "epoch": 1.63, "learning_rate": 5.4950532513331744e-05, "loss": 0.0067, "step": 323810 }, { "epoch": 1.63, "learning_rate": 5.494296482031773e-05, "loss": 0.0086, "step": 323820 }, { "epoch": 1.63, "learning_rate": 5.493539712730373e-05, "loss": 0.0076, "step": 323830 }, { "epoch": 1.63, "learning_rate": 5.4927829434289715e-05, "loss": 0.0071, "step": 323840 }, { "epoch": 1.63, "learning_rate": 5.49202617412757e-05, "loss": 0.0066, "step": 323850 }, { "epoch": 1.63, "learning_rate": 5.491269404826169e-05, "loss": 0.0059, "step": 323860 }, { "epoch": 1.63, "learning_rate": 5.4905126355247687e-05, "loss": 0.008, "step": 323870 }, { "epoch": 1.63, "learning_rate": 5.4897558662233675e-05, "loss": 0.0056, "step": 323880 }, { "epoch": 1.63, "learning_rate": 5.488999096921966e-05, "loss": 0.0103, "step": 323890 }, { "epoch": 1.63, "learning_rate": 5.488242327620565e-05, "loss": 0.0066, "step": 323900 }, { "epoch": 1.63, "learning_rate": 5.4874855583191646e-05, "loss": 0.0068, "step": 323910 }, { "epoch": 1.63, "learning_rate": 5.4867287890177634e-05, "loss": 0.0071, "step": 323920 }, { "epoch": 1.63, "learning_rate": 5.485972019716362e-05, "loss": 0.0086, "step": 323930 }, { "epoch": 1.63, "learning_rate": 5.485215250414961e-05, "loss": 0.0066, "step": 323940 }, { "epoch": 1.63, "learning_rate": 5.4844584811135606e-05, "loss": 0.0064, "step": 323950 }, { "epoch": 1.63, "learning_rate": 5.4837017118121594e-05, "loss": 0.0071, "step": 323960 }, { "epoch": 1.63, "learning_rate": 5.482944942510758e-05, "loss": 0.0073, "step": 323970 }, { "epoch": 1.63, "learning_rate": 5.482188173209357e-05, "loss": 0.0062, "step": 323980 }, { "epoch": 1.63, "learning_rate": 5.4814314039079565e-05, "loss": 0.0081, "step": 323990 }, { "epoch": 1.63, "learning_rate": 5.4806746346065554e-05, "loss": 0.0068, "step": 324000 }, { "epoch": 1.63, "eval_cer": 0.9144275584736445, "eval_loss": 0.0047448608092963696, "eval_runtime": 116.3969, "eval_samples_per_second": 17.183, "eval_steps_per_second": 4.296, "step": 324000 }, { "epoch": 1.63, "learning_rate": 5.479917865305154e-05, "loss": 0.0069, "step": 324010 }, { "epoch": 1.63, "learning_rate": 5.479161096003753e-05, "loss": 0.0065, "step": 324020 }, { "epoch": 1.63, "learning_rate": 5.4784043267023525e-05, "loss": 0.0084, "step": 324030 }, { "epoch": 1.63, "learning_rate": 5.477647557400951e-05, "loss": 0.0074, "step": 324040 }, { "epoch": 1.63, "learning_rate": 5.47689078809955e-05, "loss": 0.0069, "step": 324050 }, { "epoch": 1.63, "learning_rate": 5.476134018798149e-05, "loss": 0.0065, "step": 324060 }, { "epoch": 1.63, "learning_rate": 5.4753772494967485e-05, "loss": 0.007, "step": 324070 }, { "epoch": 1.64, "learning_rate": 5.474620480195347e-05, "loss": 0.0067, "step": 324080 }, { "epoch": 1.64, "learning_rate": 5.473863710893946e-05, "loss": 0.0093, "step": 324090 }, { "epoch": 1.64, "learning_rate": 5.473106941592545e-05, "loss": 0.006, "step": 324100 }, { "epoch": 1.64, "learning_rate": 5.4723501722911444e-05, "loss": 0.0075, "step": 324110 }, { "epoch": 1.64, "learning_rate": 5.4715934029897426e-05, "loss": 0.0054, "step": 324120 }, { "epoch": 1.64, "learning_rate": 5.4708366336883414e-05, "loss": 0.0069, "step": 324130 }, { "epoch": 1.64, "learning_rate": 5.47007986438694e-05, "loss": 0.0072, "step": 324140 }, { "epoch": 1.64, "learning_rate": 5.469323095085539e-05, "loss": 0.0071, "step": 324150 }, { "epoch": 1.64, "learning_rate": 5.4685663257841386e-05, "loss": 0.0072, "step": 324160 }, { "epoch": 1.64, "learning_rate": 5.4678095564827374e-05, "loss": 0.0058, "step": 324170 }, { "epoch": 1.64, "learning_rate": 5.467052787181336e-05, "loss": 0.0061, "step": 324180 }, { "epoch": 1.64, "learning_rate": 5.466296017879935e-05, "loss": 0.0073, "step": 324190 }, { "epoch": 1.64, "learning_rate": 5.4655392485785345e-05, "loss": 0.0065, "step": 324200 }, { "epoch": 1.64, "learning_rate": 5.4647824792771333e-05, "loss": 0.0056, "step": 324210 }, { "epoch": 1.64, "learning_rate": 5.464025709975732e-05, "loss": 0.0056, "step": 324220 }, { "epoch": 1.64, "learning_rate": 5.463268940674331e-05, "loss": 0.0078, "step": 324230 }, { "epoch": 1.64, "learning_rate": 5.4625121713729305e-05, "loss": 0.0054, "step": 324240 }, { "epoch": 1.64, "learning_rate": 5.461755402071529e-05, "loss": 0.0061, "step": 324250 }, { "epoch": 1.64, "learning_rate": 5.460998632770128e-05, "loss": 0.0065, "step": 324260 }, { "epoch": 1.64, "learning_rate": 5.460241863468727e-05, "loss": 0.0062, "step": 324270 }, { "epoch": 1.64, "learning_rate": 5.4594850941673264e-05, "loss": 0.0072, "step": 324280 }, { "epoch": 1.64, "learning_rate": 5.458728324865925e-05, "loss": 0.0056, "step": 324290 }, { "epoch": 1.64, "learning_rate": 5.457971555564524e-05, "loss": 0.0071, "step": 324300 }, { "epoch": 1.64, "learning_rate": 5.457214786263123e-05, "loss": 0.0067, "step": 324310 }, { "epoch": 1.64, "learning_rate": 5.4564580169617224e-05, "loss": 0.0071, "step": 324320 }, { "epoch": 1.64, "learning_rate": 5.455701247660321e-05, "loss": 0.0051, "step": 324330 }, { "epoch": 1.64, "learning_rate": 5.45494447835892e-05, "loss": 0.0076, "step": 324340 }, { "epoch": 1.64, "learning_rate": 5.4541877090575196e-05, "loss": 0.0072, "step": 324350 }, { "epoch": 1.64, "learning_rate": 5.4534309397561184e-05, "loss": 0.0065, "step": 324360 }, { "epoch": 1.64, "learning_rate": 5.452674170454717e-05, "loss": 0.0089, "step": 324370 }, { "epoch": 1.64, "learning_rate": 5.451917401153316e-05, "loss": 0.0091, "step": 324380 }, { "epoch": 1.64, "learning_rate": 5.4511606318519155e-05, "loss": 0.0074, "step": 324390 }, { "epoch": 1.64, "learning_rate": 5.4504038625505143e-05, "loss": 0.0059, "step": 324400 }, { "epoch": 1.64, "learning_rate": 5.449647093249113e-05, "loss": 0.0057, "step": 324410 }, { "epoch": 1.64, "learning_rate": 5.448890323947712e-05, "loss": 0.0063, "step": 324420 }, { "epoch": 1.64, "learning_rate": 5.4481335546463115e-05, "loss": 0.0082, "step": 324430 }, { "epoch": 1.64, "learning_rate": 5.4473767853449096e-05, "loss": 0.0085, "step": 324440 }, { "epoch": 1.64, "learning_rate": 5.4466200160435085e-05, "loss": 0.0056, "step": 324450 }, { "epoch": 1.64, "learning_rate": 5.445863246742107e-05, "loss": 0.0079, "step": 324460 }, { "epoch": 1.64, "learning_rate": 5.445106477440706e-05, "loss": 0.0075, "step": 324470 }, { "epoch": 1.64, "learning_rate": 5.4443497081393056e-05, "loss": 0.0063, "step": 324480 }, { "epoch": 1.64, "learning_rate": 5.4435929388379044e-05, "loss": 0.0066, "step": 324490 }, { "epoch": 1.64, "learning_rate": 5.442836169536503e-05, "loss": 0.0084, "step": 324500 }, { "epoch": 1.64, "learning_rate": 5.442079400235102e-05, "loss": 0.0064, "step": 324510 }, { "epoch": 1.64, "learning_rate": 5.4413226309337016e-05, "loss": 0.0057, "step": 324520 }, { "epoch": 1.64, "learning_rate": 5.4405658616323004e-05, "loss": 0.0065, "step": 324530 }, { "epoch": 1.64, "learning_rate": 5.439809092330899e-05, "loss": 0.0057, "step": 324540 }, { "epoch": 1.64, "learning_rate": 5.439052323029498e-05, "loss": 0.0064, "step": 324550 }, { "epoch": 1.64, "learning_rate": 5.4382955537280975e-05, "loss": 0.0064, "step": 324560 }, { "epoch": 1.64, "learning_rate": 5.4375387844266963e-05, "loss": 0.0058, "step": 324570 }, { "epoch": 1.64, "learning_rate": 5.436782015125295e-05, "loss": 0.0059, "step": 324580 }, { "epoch": 1.64, "learning_rate": 5.436025245823894e-05, "loss": 0.0095, "step": 324590 }, { "epoch": 1.64, "learning_rate": 5.4352684765224935e-05, "loss": 0.0076, "step": 324600 }, { "epoch": 1.64, "learning_rate": 5.434511707221092e-05, "loss": 0.0049, "step": 324610 }, { "epoch": 1.64, "learning_rate": 5.433754937919691e-05, "loss": 0.01, "step": 324620 }, { "epoch": 1.64, "learning_rate": 5.43299816861829e-05, "loss": 0.0053, "step": 324630 }, { "epoch": 1.64, "learning_rate": 5.4322413993168895e-05, "loss": 0.0069, "step": 324640 }, { "epoch": 1.64, "learning_rate": 5.431484630015488e-05, "loss": 0.0045, "step": 324650 }, { "epoch": 1.64, "learning_rate": 5.430727860714087e-05, "loss": 0.0069, "step": 324660 }, { "epoch": 1.64, "learning_rate": 5.429971091412686e-05, "loss": 0.006, "step": 324670 }, { "epoch": 1.64, "learning_rate": 5.4292143221112854e-05, "loss": 0.0091, "step": 324680 }, { "epoch": 1.64, "learning_rate": 5.428457552809884e-05, "loss": 0.0076, "step": 324690 }, { "epoch": 1.64, "learning_rate": 5.427700783508483e-05, "loss": 0.0126, "step": 324700 }, { "epoch": 1.64, "learning_rate": 5.426944014207082e-05, "loss": 0.0071, "step": 324710 }, { "epoch": 1.64, "learning_rate": 5.4261872449056814e-05, "loss": 0.0073, "step": 324720 }, { "epoch": 1.64, "learning_rate": 5.42543047560428e-05, "loss": 0.0106, "step": 324730 }, { "epoch": 1.64, "learning_rate": 5.424673706302879e-05, "loss": 0.0081, "step": 324740 }, { "epoch": 1.64, "learning_rate": 5.423916937001477e-05, "loss": 0.0068, "step": 324750 }, { "epoch": 1.64, "learning_rate": 5.423160167700076e-05, "loss": 0.0057, "step": 324760 }, { "epoch": 1.64, "learning_rate": 5.4224033983986755e-05, "loss": 0.0072, "step": 324770 }, { "epoch": 1.64, "learning_rate": 5.421646629097274e-05, "loss": 0.007, "step": 324780 }, { "epoch": 1.64, "learning_rate": 5.420889859795873e-05, "loss": 0.0055, "step": 324790 }, { "epoch": 1.64, "learning_rate": 5.4201330904944726e-05, "loss": 0.005, "step": 324800 }, { "epoch": 1.64, "learning_rate": 5.4193763211930715e-05, "loss": 0.0055, "step": 324810 }, { "epoch": 1.64, "learning_rate": 5.41861955189167e-05, "loss": 0.0084, "step": 324820 }, { "epoch": 1.64, "learning_rate": 5.417862782590269e-05, "loss": 0.0056, "step": 324830 }, { "epoch": 1.64, "learning_rate": 5.4171060132888686e-05, "loss": 0.0082, "step": 324840 }, { "epoch": 1.64, "learning_rate": 5.4163492439874674e-05, "loss": 0.0076, "step": 324850 }, { "epoch": 1.64, "learning_rate": 5.415592474686066e-05, "loss": 0.0077, "step": 324860 }, { "epoch": 1.64, "learning_rate": 5.414835705384665e-05, "loss": 0.0074, "step": 324870 }, { "epoch": 1.64, "learning_rate": 5.4140789360832646e-05, "loss": 0.0086, "step": 324880 }, { "epoch": 1.64, "learning_rate": 5.4133221667818634e-05, "loss": 0.0054, "step": 324890 }, { "epoch": 1.64, "learning_rate": 5.412565397480462e-05, "loss": 0.0055, "step": 324900 }, { "epoch": 1.64, "learning_rate": 5.411808628179061e-05, "loss": 0.0066, "step": 324910 }, { "epoch": 1.64, "learning_rate": 5.4110518588776605e-05, "loss": 0.0067, "step": 324920 }, { "epoch": 1.64, "learning_rate": 5.4102950895762594e-05, "loss": 0.0068, "step": 324930 }, { "epoch": 1.64, "learning_rate": 5.409538320274858e-05, "loss": 0.0059, "step": 324940 }, { "epoch": 1.64, "learning_rate": 5.408781550973457e-05, "loss": 0.0069, "step": 324950 }, { "epoch": 1.64, "learning_rate": 5.4080247816720565e-05, "loss": 0.0056, "step": 324960 }, { "epoch": 1.64, "learning_rate": 5.407268012370655e-05, "loss": 0.008, "step": 324970 }, { "epoch": 1.64, "learning_rate": 5.406511243069254e-05, "loss": 0.0053, "step": 324980 }, { "epoch": 1.64, "learning_rate": 5.405754473767853e-05, "loss": 0.0056, "step": 324990 }, { "epoch": 1.64, "learning_rate": 5.4049977044664525e-05, "loss": 0.0063, "step": 325000 }, { "epoch": 1.64, "eval_cer": 0.9144333808503969, "eval_loss": 0.005062679760158062, "eval_runtime": 116.3486, "eval_samples_per_second": 17.19, "eval_steps_per_second": 4.297, "step": 325000 }, { "epoch": 1.64, "learning_rate": 5.404240935165051e-05, "loss": 0.007, "step": 325010 }, { "epoch": 1.64, "learning_rate": 5.40348416586365e-05, "loss": 0.0077, "step": 325020 }, { "epoch": 1.64, "learning_rate": 5.402727396562249e-05, "loss": 0.0079, "step": 325030 }, { "epoch": 1.64, "learning_rate": 5.4019706272608484e-05, "loss": 0.0076, "step": 325040 }, { "epoch": 1.64, "learning_rate": 5.401213857959447e-05, "loss": 0.006, "step": 325050 }, { "epoch": 1.64, "learning_rate": 5.400457088658046e-05, "loss": 0.0066, "step": 325060 }, { "epoch": 1.64, "learning_rate": 5.399700319356644e-05, "loss": 0.0053, "step": 325070 }, { "epoch": 1.64, "learning_rate": 5.398943550055243e-05, "loss": 0.007, "step": 325080 }, { "epoch": 1.64, "learning_rate": 5.3981867807538425e-05, "loss": 0.0064, "step": 325090 }, { "epoch": 1.64, "learning_rate": 5.3974300114524414e-05, "loss": 0.0067, "step": 325100 }, { "epoch": 1.64, "learning_rate": 5.39667324215104e-05, "loss": 0.0075, "step": 325110 }, { "epoch": 1.64, "learning_rate": 5.395916472849639e-05, "loss": 0.0091, "step": 325120 }, { "epoch": 1.64, "learning_rate": 5.3951597035482385e-05, "loss": 0.0125, "step": 325130 }, { "epoch": 1.64, "learning_rate": 5.394402934246837e-05, "loss": 0.0075, "step": 325140 }, { "epoch": 1.64, "learning_rate": 5.393646164945436e-05, "loss": 0.006, "step": 325150 }, { "epoch": 1.64, "learning_rate": 5.392889395644035e-05, "loss": 0.0045, "step": 325160 }, { "epoch": 1.64, "learning_rate": 5.3921326263426345e-05, "loss": 0.0059, "step": 325170 }, { "epoch": 1.64, "learning_rate": 5.391375857041233e-05, "loss": 0.0058, "step": 325180 }, { "epoch": 1.64, "learning_rate": 5.390619087739832e-05, "loss": 0.0107, "step": 325190 }, { "epoch": 1.64, "learning_rate": 5.389862318438431e-05, "loss": 0.0068, "step": 325200 }, { "epoch": 1.64, "learning_rate": 5.3891055491370304e-05, "loss": 0.0062, "step": 325210 }, { "epoch": 1.64, "learning_rate": 5.388348779835629e-05, "loss": 0.0075, "step": 325220 }, { "epoch": 1.64, "learning_rate": 5.387592010534228e-05, "loss": 0.005, "step": 325230 }, { "epoch": 1.64, "learning_rate": 5.386835241232827e-05, "loss": 0.0049, "step": 325240 }, { "epoch": 1.64, "learning_rate": 5.3860784719314264e-05, "loss": 0.0078, "step": 325250 }, { "epoch": 1.64, "learning_rate": 5.385321702630025e-05, "loss": 0.0071, "step": 325260 }, { "epoch": 1.64, "learning_rate": 5.384564933328624e-05, "loss": 0.0063, "step": 325270 }, { "epoch": 1.64, "learning_rate": 5.383808164027223e-05, "loss": 0.0062, "step": 325280 }, { "epoch": 1.64, "learning_rate": 5.3830513947258224e-05, "loss": 0.0057, "step": 325290 }, { "epoch": 1.64, "learning_rate": 5.382294625424421e-05, "loss": 0.0052, "step": 325300 }, { "epoch": 1.64, "learning_rate": 5.38153785612302e-05, "loss": 0.0066, "step": 325310 }, { "epoch": 1.64, "learning_rate": 5.3807810868216195e-05, "loss": 0.0076, "step": 325320 }, { "epoch": 1.64, "learning_rate": 5.380024317520218e-05, "loss": 0.0061, "step": 325330 }, { "epoch": 1.64, "learning_rate": 5.379267548218817e-05, "loss": 0.0056, "step": 325340 }, { "epoch": 1.64, "learning_rate": 5.378510778917416e-05, "loss": 0.0062, "step": 325350 }, { "epoch": 1.64, "learning_rate": 5.3777540096160155e-05, "loss": 0.0065, "step": 325360 }, { "epoch": 1.64, "learning_rate": 5.376997240314614e-05, "loss": 0.0066, "step": 325370 }, { "epoch": 1.64, "learning_rate": 5.3762404710132124e-05, "loss": 0.0066, "step": 325380 }, { "epoch": 1.64, "learning_rate": 5.375483701711811e-05, "loss": 0.0084, "step": 325390 }, { "epoch": 1.64, "learning_rate": 5.37472693241041e-05, "loss": 0.0073, "step": 325400 }, { "epoch": 1.64, "learning_rate": 5.3739701631090096e-05, "loss": 0.0084, "step": 325410 }, { "epoch": 1.64, "learning_rate": 5.3732133938076084e-05, "loss": 0.0061, "step": 325420 }, { "epoch": 1.64, "learning_rate": 5.372456624506207e-05, "loss": 0.0078, "step": 325430 }, { "epoch": 1.64, "learning_rate": 5.371699855204806e-05, "loss": 0.0065, "step": 325440 }, { "epoch": 1.64, "learning_rate": 5.3709430859034055e-05, "loss": 0.0085, "step": 325450 }, { "epoch": 1.64, "learning_rate": 5.3701863166020044e-05, "loss": 0.0056, "step": 325460 }, { "epoch": 1.64, "learning_rate": 5.369429547300603e-05, "loss": 0.0065, "step": 325470 }, { "epoch": 1.64, "learning_rate": 5.368672777999202e-05, "loss": 0.0058, "step": 325480 }, { "epoch": 1.64, "learning_rate": 5.3679160086978015e-05, "loss": 0.0061, "step": 325490 }, { "epoch": 1.64, "learning_rate": 5.3671592393964e-05, "loss": 0.0058, "step": 325500 }, { "epoch": 1.64, "learning_rate": 5.366402470094999e-05, "loss": 0.0066, "step": 325510 }, { "epoch": 1.64, "learning_rate": 5.365645700793598e-05, "loss": 0.006, "step": 325520 }, { "epoch": 1.64, "learning_rate": 5.3648889314921975e-05, "loss": 0.0062, "step": 325530 }, { "epoch": 1.64, "learning_rate": 5.364132162190796e-05, "loss": 0.0098, "step": 325540 }, { "epoch": 1.64, "learning_rate": 5.363375392889395e-05, "loss": 0.005, "step": 325550 }, { "epoch": 1.64, "learning_rate": 5.362618623587994e-05, "loss": 0.0064, "step": 325560 }, { "epoch": 1.64, "learning_rate": 5.3618618542865934e-05, "loss": 0.0107, "step": 325570 }, { "epoch": 1.64, "learning_rate": 5.361105084985192e-05, "loss": 0.0061, "step": 325580 }, { "epoch": 1.64, "learning_rate": 5.360348315683791e-05, "loss": 0.0074, "step": 325590 }, { "epoch": 1.64, "learning_rate": 5.35959154638239e-05, "loss": 0.0061, "step": 325600 }, { "epoch": 1.64, "learning_rate": 5.3588347770809894e-05, "loss": 0.0067, "step": 325610 }, { "epoch": 1.64, "learning_rate": 5.358078007779588e-05, "loss": 0.0098, "step": 325620 }, { "epoch": 1.64, "learning_rate": 5.357321238478187e-05, "loss": 0.0064, "step": 325630 }, { "epoch": 1.64, "learning_rate": 5.356564469176786e-05, "loss": 0.0078, "step": 325640 }, { "epoch": 1.64, "learning_rate": 5.3558076998753854e-05, "loss": 0.0058, "step": 325650 }, { "epoch": 1.64, "learning_rate": 5.355050930573984e-05, "loss": 0.0048, "step": 325660 }, { "epoch": 1.64, "learning_rate": 5.354294161272583e-05, "loss": 0.0049, "step": 325670 }, { "epoch": 1.64, "learning_rate": 5.353537391971182e-05, "loss": 0.0088, "step": 325680 }, { "epoch": 1.64, "learning_rate": 5.3527806226697813e-05, "loss": 0.0072, "step": 325690 }, { "epoch": 1.64, "learning_rate": 5.3520238533683795e-05, "loss": 0.0063, "step": 325700 }, { "epoch": 1.64, "learning_rate": 5.351267084066978e-05, "loss": 0.0052, "step": 325710 }, { "epoch": 1.64, "learning_rate": 5.350510314765577e-05, "loss": 0.006, "step": 325720 }, { "epoch": 1.64, "learning_rate": 5.349753545464176e-05, "loss": 0.0066, "step": 325730 }, { "epoch": 1.64, "learning_rate": 5.3489967761627754e-05, "loss": 0.0058, "step": 325740 }, { "epoch": 1.64, "learning_rate": 5.348240006861374e-05, "loss": 0.0047, "step": 325750 }, { "epoch": 1.64, "learning_rate": 5.347483237559973e-05, "loss": 0.0066, "step": 325760 }, { "epoch": 1.64, "learning_rate": 5.3467264682585726e-05, "loss": 0.0099, "step": 325770 }, { "epoch": 1.64, "learning_rate": 5.3459696989571714e-05, "loss": 0.0074, "step": 325780 }, { "epoch": 1.64, "learning_rate": 5.34521292965577e-05, "loss": 0.0064, "step": 325790 }, { "epoch": 1.64, "learning_rate": 5.344456160354369e-05, "loss": 0.006, "step": 325800 }, { "epoch": 1.64, "learning_rate": 5.3436993910529686e-05, "loss": 0.0066, "step": 325810 }, { "epoch": 1.64, "learning_rate": 5.3429426217515674e-05, "loss": 0.0056, "step": 325820 }, { "epoch": 1.64, "learning_rate": 5.342185852450166e-05, "loss": 0.0071, "step": 325830 }, { "epoch": 1.64, "learning_rate": 5.341429083148765e-05, "loss": 0.0056, "step": 325840 }, { "epoch": 1.64, "learning_rate": 5.3406723138473645e-05, "loss": 0.0098, "step": 325850 }, { "epoch": 1.64, "learning_rate": 5.3399155445459633e-05, "loss": 0.0076, "step": 325860 }, { "epoch": 1.64, "learning_rate": 5.339158775244562e-05, "loss": 0.0083, "step": 325870 }, { "epoch": 1.64, "learning_rate": 5.338402005943161e-05, "loss": 0.0071, "step": 325880 }, { "epoch": 1.64, "learning_rate": 5.3376452366417605e-05, "loss": 0.0045, "step": 325890 }, { "epoch": 1.64, "learning_rate": 5.336888467340359e-05, "loss": 0.0074, "step": 325900 }, { "epoch": 1.64, "learning_rate": 5.336131698038958e-05, "loss": 0.0057, "step": 325910 }, { "epoch": 1.64, "learning_rate": 5.335374928737557e-05, "loss": 0.0084, "step": 325920 }, { "epoch": 1.64, "learning_rate": 5.3346181594361565e-05, "loss": 0.0069, "step": 325930 }, { "epoch": 1.64, "learning_rate": 5.333861390134755e-05, "loss": 0.0058, "step": 325940 }, { "epoch": 1.64, "learning_rate": 5.333104620833354e-05, "loss": 0.0073, "step": 325950 }, { "epoch": 1.64, "learning_rate": 5.332347851531953e-05, "loss": 0.0063, "step": 325960 }, { "epoch": 1.64, "learning_rate": 5.3315910822305524e-05, "loss": 0.0053, "step": 325970 }, { "epoch": 1.64, "learning_rate": 5.330834312929151e-05, "loss": 0.0067, "step": 325980 }, { "epoch": 1.64, "learning_rate": 5.33007754362775e-05, "loss": 0.005, "step": 325990 }, { "epoch": 1.64, "learning_rate": 5.329320774326349e-05, "loss": 0.0066, "step": 326000 }, { "epoch": 1.64, "eval_cer": 0.914412032135638, "eval_loss": 0.004975411109626293, "eval_runtime": 116.3509, "eval_samples_per_second": 17.189, "eval_steps_per_second": 4.297, "step": 326000 }, { "epoch": 1.64, "learning_rate": 5.328564005024947e-05, "loss": 0.011, "step": 326010 }, { "epoch": 1.64, "learning_rate": 5.3278072357235465e-05, "loss": 0.0051, "step": 326020 }, { "epoch": 1.64, "learning_rate": 5.3270504664221453e-05, "loss": 0.0072, "step": 326030 }, { "epoch": 1.64, "learning_rate": 5.326293697120744e-05, "loss": 0.0059, "step": 326040 }, { "epoch": 1.64, "learning_rate": 5.325536927819343e-05, "loss": 0.0075, "step": 326050 }, { "epoch": 1.65, "learning_rate": 5.3247801585179425e-05, "loss": 0.0085, "step": 326060 }, { "epoch": 1.65, "learning_rate": 5.324023389216541e-05, "loss": 0.0048, "step": 326070 }, { "epoch": 1.65, "learning_rate": 5.32326661991514e-05, "loss": 0.0082, "step": 326080 }, { "epoch": 1.65, "learning_rate": 5.322509850613739e-05, "loss": 0.0052, "step": 326090 }, { "epoch": 1.65, "learning_rate": 5.3217530813123385e-05, "loss": 0.0062, "step": 326100 }, { "epoch": 1.65, "learning_rate": 5.320996312010937e-05, "loss": 0.0062, "step": 326110 }, { "epoch": 1.65, "learning_rate": 5.320239542709536e-05, "loss": 0.0097, "step": 326120 }, { "epoch": 1.65, "learning_rate": 5.319482773408135e-05, "loss": 0.008, "step": 326130 }, { "epoch": 1.65, "learning_rate": 5.3187260041067344e-05, "loss": 0.0063, "step": 326140 }, { "epoch": 1.65, "learning_rate": 5.317969234805333e-05, "loss": 0.0053, "step": 326150 }, { "epoch": 1.65, "learning_rate": 5.317212465503932e-05, "loss": 0.0079, "step": 326160 }, { "epoch": 1.65, "learning_rate": 5.316455696202531e-05, "loss": 0.0066, "step": 326170 }, { "epoch": 1.65, "learning_rate": 5.3156989269011304e-05, "loss": 0.0106, "step": 326180 }, { "epoch": 1.65, "learning_rate": 5.314942157599729e-05, "loss": 0.0068, "step": 326190 }, { "epoch": 1.65, "learning_rate": 5.314185388298328e-05, "loss": 0.0056, "step": 326200 }, { "epoch": 1.65, "learning_rate": 5.313428618996927e-05, "loss": 0.0085, "step": 326210 }, { "epoch": 1.65, "learning_rate": 5.3126718496955264e-05, "loss": 0.0069, "step": 326220 }, { "epoch": 1.65, "learning_rate": 5.311915080394125e-05, "loss": 0.0075, "step": 326230 }, { "epoch": 1.65, "learning_rate": 5.311158311092724e-05, "loss": 0.0056, "step": 326240 }, { "epoch": 1.65, "learning_rate": 5.310401541791323e-05, "loss": 0.0067, "step": 326250 }, { "epoch": 1.65, "learning_rate": 5.309644772489922e-05, "loss": 0.0059, "step": 326260 }, { "epoch": 1.65, "learning_rate": 5.308888003188521e-05, "loss": 0.0073, "step": 326270 }, { "epoch": 1.65, "learning_rate": 5.30813123388712e-05, "loss": 0.0054, "step": 326280 }, { "epoch": 1.65, "learning_rate": 5.3073744645857195e-05, "loss": 0.0104, "step": 326290 }, { "epoch": 1.65, "learning_rate": 5.306617695284318e-05, "loss": 0.0088, "step": 326300 }, { "epoch": 1.65, "learning_rate": 5.305860925982917e-05, "loss": 0.0071, "step": 326310 }, { "epoch": 1.65, "learning_rate": 5.305104156681515e-05, "loss": 0.0067, "step": 326320 }, { "epoch": 1.65, "learning_rate": 5.304347387380114e-05, "loss": 0.0068, "step": 326330 }, { "epoch": 1.65, "learning_rate": 5.3035906180787136e-05, "loss": 0.0055, "step": 326340 }, { "epoch": 1.65, "learning_rate": 5.3028338487773124e-05, "loss": 0.0084, "step": 326350 }, { "epoch": 1.65, "learning_rate": 5.302077079475911e-05, "loss": 0.0065, "step": 326360 }, { "epoch": 1.65, "learning_rate": 5.30132031017451e-05, "loss": 0.0058, "step": 326370 }, { "epoch": 1.65, "learning_rate": 5.3005635408731095e-05, "loss": 0.0065, "step": 326380 }, { "epoch": 1.65, "learning_rate": 5.2998067715717084e-05, "loss": 0.0056, "step": 326390 }, { "epoch": 1.65, "learning_rate": 5.299050002270307e-05, "loss": 0.008, "step": 326400 }, { "epoch": 1.65, "learning_rate": 5.298293232968906e-05, "loss": 0.0062, "step": 326410 }, { "epoch": 1.65, "learning_rate": 5.2975364636675055e-05, "loss": 0.0047, "step": 326420 }, { "epoch": 1.65, "learning_rate": 5.296779694366104e-05, "loss": 0.0076, "step": 326430 }, { "epoch": 1.65, "learning_rate": 5.296022925064703e-05, "loss": 0.0056, "step": 326440 }, { "epoch": 1.65, "learning_rate": 5.295266155763302e-05, "loss": 0.0085, "step": 326450 }, { "epoch": 1.65, "learning_rate": 5.2945093864619015e-05, "loss": 0.0072, "step": 326460 }, { "epoch": 1.65, "learning_rate": 5.2937526171605e-05, "loss": 0.0063, "step": 326470 }, { "epoch": 1.65, "learning_rate": 5.292995847859099e-05, "loss": 0.0086, "step": 326480 }, { "epoch": 1.65, "learning_rate": 5.292239078557698e-05, "loss": 0.0087, "step": 326490 }, { "epoch": 1.65, "learning_rate": 5.2914823092562974e-05, "loss": 0.0062, "step": 326500 }, { "epoch": 1.65, "learning_rate": 5.290725539954896e-05, "loss": 0.0056, "step": 326510 }, { "epoch": 1.65, "learning_rate": 5.289968770653495e-05, "loss": 0.007, "step": 326520 }, { "epoch": 1.65, "learning_rate": 5.289212001352094e-05, "loss": 0.0064, "step": 326530 }, { "epoch": 1.65, "learning_rate": 5.2884552320506934e-05, "loss": 0.0077, "step": 326540 }, { "epoch": 1.65, "learning_rate": 5.287698462749292e-05, "loss": 0.0058, "step": 326550 }, { "epoch": 1.65, "learning_rate": 5.286941693447891e-05, "loss": 0.0064, "step": 326560 }, { "epoch": 1.65, "learning_rate": 5.28618492414649e-05, "loss": 0.005, "step": 326570 }, { "epoch": 1.65, "learning_rate": 5.2854281548450894e-05, "loss": 0.007, "step": 326580 }, { "epoch": 1.65, "learning_rate": 5.284671385543688e-05, "loss": 0.0078, "step": 326590 }, { "epoch": 1.65, "learning_rate": 5.283914616242287e-05, "loss": 0.0068, "step": 326600 }, { "epoch": 1.65, "learning_rate": 5.283157846940886e-05, "loss": 0.0074, "step": 326610 }, { "epoch": 1.65, "learning_rate": 5.282401077639485e-05, "loss": 0.0074, "step": 326620 }, { "epoch": 1.65, "learning_rate": 5.281644308338084e-05, "loss": 0.0056, "step": 326630 }, { "epoch": 1.65, "learning_rate": 5.280887539036682e-05, "loss": 0.0094, "step": 326640 }, { "epoch": 1.65, "learning_rate": 5.280130769735281e-05, "loss": 0.005, "step": 326650 }, { "epoch": 1.65, "learning_rate": 5.27937400043388e-05, "loss": 0.0063, "step": 326660 }, { "epoch": 1.65, "learning_rate": 5.2786172311324794e-05, "loss": 0.0066, "step": 326670 }, { "epoch": 1.65, "learning_rate": 5.277860461831078e-05, "loss": 0.006, "step": 326680 }, { "epoch": 1.65, "learning_rate": 5.277103692529677e-05, "loss": 0.0072, "step": 326690 }, { "epoch": 1.65, "learning_rate": 5.276346923228276e-05, "loss": 0.0085, "step": 326700 }, { "epoch": 1.65, "learning_rate": 5.2755901539268754e-05, "loss": 0.0073, "step": 326710 }, { "epoch": 1.65, "learning_rate": 5.274833384625474e-05, "loss": 0.0079, "step": 326720 }, { "epoch": 1.65, "learning_rate": 5.274076615324073e-05, "loss": 0.0054, "step": 326730 }, { "epoch": 1.65, "learning_rate": 5.2733198460226725e-05, "loss": 0.0058, "step": 326740 }, { "epoch": 1.65, "learning_rate": 5.2725630767212714e-05, "loss": 0.006, "step": 326750 }, { "epoch": 1.65, "learning_rate": 5.27180630741987e-05, "loss": 0.0063, "step": 326760 }, { "epoch": 1.65, "learning_rate": 5.271049538118469e-05, "loss": 0.0084, "step": 326770 }, { "epoch": 1.65, "learning_rate": 5.2702927688170685e-05, "loss": 0.0062, "step": 326780 }, { "epoch": 1.65, "learning_rate": 5.269535999515667e-05, "loss": 0.0049, "step": 326790 }, { "epoch": 1.65, "learning_rate": 5.268779230214266e-05, "loss": 0.005, "step": 326800 }, { "epoch": 1.65, "learning_rate": 5.268022460912865e-05, "loss": 0.0072, "step": 326810 }, { "epoch": 1.65, "learning_rate": 5.2672656916114645e-05, "loss": 0.0053, "step": 326820 }, { "epoch": 1.65, "learning_rate": 5.266508922310063e-05, "loss": 0.0061, "step": 326830 }, { "epoch": 1.65, "learning_rate": 5.265752153008662e-05, "loss": 0.0073, "step": 326840 }, { "epoch": 1.65, "learning_rate": 5.264995383707261e-05, "loss": 0.0075, "step": 326850 }, { "epoch": 1.65, "learning_rate": 5.2642386144058604e-05, "loss": 0.0065, "step": 326860 }, { "epoch": 1.65, "learning_rate": 5.263481845104459e-05, "loss": 0.0069, "step": 326870 }, { "epoch": 1.65, "learning_rate": 5.262725075803058e-05, "loss": 0.0062, "step": 326880 }, { "epoch": 1.65, "learning_rate": 5.261968306501657e-05, "loss": 0.0064, "step": 326890 }, { "epoch": 1.65, "learning_rate": 5.2612115372002564e-05, "loss": 0.0066, "step": 326900 }, { "epoch": 1.65, "learning_rate": 5.260454767898855e-05, "loss": 0.0084, "step": 326910 }, { "epoch": 1.65, "learning_rate": 5.259697998597454e-05, "loss": 0.0079, "step": 326920 }, { "epoch": 1.65, "learning_rate": 5.258941229296053e-05, "loss": 0.0051, "step": 326930 }, { "epoch": 1.65, "learning_rate": 5.2581844599946524e-05, "loss": 0.0061, "step": 326940 }, { "epoch": 1.65, "learning_rate": 5.2574276906932505e-05, "loss": 0.0071, "step": 326950 }, { "epoch": 1.65, "learning_rate": 5.256670921391849e-05, "loss": 0.0057, "step": 326960 }, { "epoch": 1.65, "learning_rate": 5.255914152090448e-05, "loss": 0.007, "step": 326970 }, { "epoch": 1.65, "learning_rate": 5.255157382789047e-05, "loss": 0.0067, "step": 326980 }, { "epoch": 1.65, "learning_rate": 5.2544006134876465e-05, "loss": 0.0071, "step": 326990 }, { "epoch": 1.65, "learning_rate": 5.253643844186245e-05, "loss": 0.0055, "step": 327000 }, { "epoch": 1.65, "eval_cer": 0.9144285288697699, "eval_loss": 0.004966360051184893, "eval_runtime": 116.3822, "eval_samples_per_second": 17.185, "eval_steps_per_second": 4.296, "step": 327000 }, { "epoch": 1.65, "learning_rate": 5.252887074884844e-05, "loss": 0.0079, "step": 327010 }, { "epoch": 1.65, "learning_rate": 5.252130305583443e-05, "loss": 0.0102, "step": 327020 }, { "epoch": 1.65, "learning_rate": 5.2513735362820424e-05, "loss": 0.0109, "step": 327030 }, { "epoch": 1.65, "learning_rate": 5.250616766980641e-05, "loss": 0.0065, "step": 327040 }, { "epoch": 1.65, "learning_rate": 5.24985999767924e-05, "loss": 0.0065, "step": 327050 }, { "epoch": 1.65, "learning_rate": 5.249103228377839e-05, "loss": 0.0087, "step": 327060 }, { "epoch": 1.65, "learning_rate": 5.2483464590764384e-05, "loss": 0.0074, "step": 327070 }, { "epoch": 1.65, "learning_rate": 5.247589689775037e-05, "loss": 0.0052, "step": 327080 }, { "epoch": 1.65, "learning_rate": 5.246832920473636e-05, "loss": 0.007, "step": 327090 }, { "epoch": 1.65, "learning_rate": 5.246076151172235e-05, "loss": 0.0056, "step": 327100 }, { "epoch": 1.65, "learning_rate": 5.2453193818708344e-05, "loss": 0.0069, "step": 327110 }, { "epoch": 1.65, "learning_rate": 5.244562612569433e-05, "loss": 0.0079, "step": 327120 }, { "epoch": 1.65, "learning_rate": 5.243805843268032e-05, "loss": 0.0064, "step": 327130 }, { "epoch": 1.65, "learning_rate": 5.243049073966631e-05, "loss": 0.0081, "step": 327140 }, { "epoch": 1.65, "learning_rate": 5.2422923046652303e-05, "loss": 0.007, "step": 327150 }, { "epoch": 1.65, "learning_rate": 5.241535535363829e-05, "loss": 0.0039, "step": 327160 }, { "epoch": 1.65, "learning_rate": 5.240778766062428e-05, "loss": 0.009, "step": 327170 }, { "epoch": 1.65, "learning_rate": 5.240021996761027e-05, "loss": 0.0051, "step": 327180 }, { "epoch": 1.65, "learning_rate": 5.239265227459626e-05, "loss": 0.0056, "step": 327190 }, { "epoch": 1.65, "learning_rate": 5.238508458158225e-05, "loss": 0.0177, "step": 327200 }, { "epoch": 1.65, "learning_rate": 5.237751688856824e-05, "loss": 0.0072, "step": 327210 }, { "epoch": 1.65, "learning_rate": 5.236994919555423e-05, "loss": 0.0075, "step": 327220 }, { "epoch": 1.65, "learning_rate": 5.236238150254022e-05, "loss": 0.0069, "step": 327230 }, { "epoch": 1.65, "learning_rate": 5.235481380952621e-05, "loss": 0.0094, "step": 327240 }, { "epoch": 1.65, "learning_rate": 5.23472461165122e-05, "loss": 0.007, "step": 327250 }, { "epoch": 1.65, "learning_rate": 5.2339678423498194e-05, "loss": 0.0071, "step": 327260 }, { "epoch": 1.65, "learning_rate": 5.2332110730484176e-05, "loss": 0.0079, "step": 327270 }, { "epoch": 1.65, "learning_rate": 5.2324543037470164e-05, "loss": 0.0082, "step": 327280 }, { "epoch": 1.65, "learning_rate": 5.231697534445615e-05, "loss": 0.0086, "step": 327290 }, { "epoch": 1.65, "learning_rate": 5.230940765144214e-05, "loss": 0.0068, "step": 327300 }, { "epoch": 1.65, "learning_rate": 5.2301839958428135e-05, "loss": 0.0058, "step": 327310 }, { "epoch": 1.65, "learning_rate": 5.2294272265414123e-05, "loss": 0.0074, "step": 327320 }, { "epoch": 1.65, "learning_rate": 5.228670457240011e-05, "loss": 0.006, "step": 327330 }, { "epoch": 1.65, "learning_rate": 5.22791368793861e-05, "loss": 0.0045, "step": 327340 }, { "epoch": 1.65, "learning_rate": 5.2271569186372095e-05, "loss": 0.0054, "step": 327350 }, { "epoch": 1.65, "learning_rate": 5.226400149335808e-05, "loss": 0.0073, "step": 327360 }, { "epoch": 1.65, "learning_rate": 5.225643380034407e-05, "loss": 0.007, "step": 327370 }, { "epoch": 1.65, "learning_rate": 5.224886610733006e-05, "loss": 0.0062, "step": 327380 }, { "epoch": 1.65, "learning_rate": 5.2241298414316055e-05, "loss": 0.0051, "step": 327390 }, { "epoch": 1.65, "learning_rate": 5.223373072130204e-05, "loss": 0.0068, "step": 327400 }, { "epoch": 1.65, "learning_rate": 5.222616302828803e-05, "loss": 0.0075, "step": 327410 }, { "epoch": 1.65, "learning_rate": 5.221859533527402e-05, "loss": 0.006, "step": 327420 }, { "epoch": 1.65, "learning_rate": 5.2211027642260014e-05, "loss": 0.0065, "step": 327430 }, { "epoch": 1.65, "learning_rate": 5.2203459949246e-05, "loss": 0.0067, "step": 327440 }, { "epoch": 1.65, "learning_rate": 5.219589225623199e-05, "loss": 0.0053, "step": 327450 }, { "epoch": 1.65, "learning_rate": 5.218832456321798e-05, "loss": 0.006, "step": 327460 }, { "epoch": 1.65, "learning_rate": 5.2180756870203974e-05, "loss": 0.0081, "step": 327470 }, { "epoch": 1.65, "learning_rate": 5.217318917718996e-05, "loss": 0.0066, "step": 327480 }, { "epoch": 1.65, "learning_rate": 5.216562148417595e-05, "loss": 0.0057, "step": 327490 }, { "epoch": 1.65, "learning_rate": 5.215805379116194e-05, "loss": 0.0068, "step": 327500 }, { "epoch": 1.65, "learning_rate": 5.2150486098147933e-05, "loss": 0.0053, "step": 327510 }, { "epoch": 1.65, "learning_rate": 5.214291840513392e-05, "loss": 0.0056, "step": 327520 }, { "epoch": 1.65, "learning_rate": 5.213535071211991e-05, "loss": 0.0052, "step": 327530 }, { "epoch": 1.65, "learning_rate": 5.21277830191059e-05, "loss": 0.0065, "step": 327540 }, { "epoch": 1.65, "learning_rate": 5.212021532609189e-05, "loss": 0.0069, "step": 327550 }, { "epoch": 1.65, "learning_rate": 5.211264763307788e-05, "loss": 0.0082, "step": 327560 }, { "epoch": 1.65, "learning_rate": 5.210507994006387e-05, "loss": 0.0077, "step": 327570 }, { "epoch": 1.65, "learning_rate": 5.209751224704985e-05, "loss": 0.0063, "step": 327580 }, { "epoch": 1.65, "learning_rate": 5.208994455403584e-05, "loss": 0.0051, "step": 327590 }, { "epoch": 1.65, "learning_rate": 5.2082376861021834e-05, "loss": 0.0084, "step": 327600 }, { "epoch": 1.65, "learning_rate": 5.207480916800782e-05, "loss": 0.0051, "step": 327610 }, { "epoch": 1.65, "learning_rate": 5.206724147499381e-05, "loss": 0.0061, "step": 327620 }, { "epoch": 1.65, "learning_rate": 5.20596737819798e-05, "loss": 0.0087, "step": 327630 }, { "epoch": 1.65, "learning_rate": 5.2052106088965794e-05, "loss": 0.0055, "step": 327640 }, { "epoch": 1.65, "learning_rate": 5.204453839595178e-05, "loss": 0.009, "step": 327650 }, { "epoch": 1.65, "learning_rate": 5.203697070293777e-05, "loss": 0.0076, "step": 327660 }, { "epoch": 1.65, "learning_rate": 5.202940300992376e-05, "loss": 0.0053, "step": 327670 }, { "epoch": 1.65, "learning_rate": 5.2021835316909754e-05, "loss": 0.005, "step": 327680 }, { "epoch": 1.65, "learning_rate": 5.201426762389574e-05, "loss": 0.007, "step": 327690 }, { "epoch": 1.65, "learning_rate": 5.200669993088173e-05, "loss": 0.008, "step": 327700 }, { "epoch": 1.65, "learning_rate": 5.1999132237867725e-05, "loss": 0.0068, "step": 327710 }, { "epoch": 1.65, "learning_rate": 5.199156454485371e-05, "loss": 0.0075, "step": 327720 }, { "epoch": 1.65, "learning_rate": 5.19839968518397e-05, "loss": 0.007, "step": 327730 }, { "epoch": 1.65, "learning_rate": 5.197642915882569e-05, "loss": 0.0112, "step": 327740 }, { "epoch": 1.65, "learning_rate": 5.1968861465811685e-05, "loss": 0.0058, "step": 327750 }, { "epoch": 1.65, "learning_rate": 5.196129377279767e-05, "loss": 0.0075, "step": 327760 }, { "epoch": 1.65, "learning_rate": 5.195372607978366e-05, "loss": 0.0057, "step": 327770 }, { "epoch": 1.65, "learning_rate": 5.194615838676965e-05, "loss": 0.0113, "step": 327780 }, { "epoch": 1.65, "learning_rate": 5.1938590693755644e-05, "loss": 0.0053, "step": 327790 }, { "epoch": 1.65, "learning_rate": 5.193102300074163e-05, "loss": 0.0079, "step": 327800 }, { "epoch": 1.65, "learning_rate": 5.192345530772762e-05, "loss": 0.0062, "step": 327810 }, { "epoch": 1.65, "learning_rate": 5.191588761471361e-05, "loss": 0.0065, "step": 327820 }, { "epoch": 1.65, "learning_rate": 5.1908319921699604e-05, "loss": 0.0099, "step": 327830 }, { "epoch": 1.65, "learning_rate": 5.190075222868559e-05, "loss": 0.0071, "step": 327840 }, { "epoch": 1.65, "learning_rate": 5.189318453567158e-05, "loss": 0.0053, "step": 327850 }, { "epoch": 1.65, "learning_rate": 5.188561684265757e-05, "loss": 0.0043, "step": 327860 }, { "epoch": 1.65, "learning_rate": 5.1878049149643564e-05, "loss": 0.0089, "step": 327870 }, { "epoch": 1.65, "learning_rate": 5.187048145662955e-05, "loss": 0.0082, "step": 327880 }, { "epoch": 1.65, "learning_rate": 5.186291376361554e-05, "loss": 0.0058, "step": 327890 }, { "epoch": 1.65, "learning_rate": 5.185534607060152e-05, "loss": 0.0063, "step": 327900 }, { "epoch": 1.65, "learning_rate": 5.184777837758751e-05, "loss": 0.0061, "step": 327910 }, { "epoch": 1.65, "learning_rate": 5.1840210684573505e-05, "loss": 0.007, "step": 327920 }, { "epoch": 1.65, "learning_rate": 5.183264299155949e-05, "loss": 0.0065, "step": 327930 }, { "epoch": 1.65, "learning_rate": 5.182507529854548e-05, "loss": 0.0063, "step": 327940 }, { "epoch": 1.65, "learning_rate": 5.181750760553147e-05, "loss": 0.005, "step": 327950 }, { "epoch": 1.65, "learning_rate": 5.1809939912517464e-05, "loss": 0.0075, "step": 327960 }, { "epoch": 1.65, "learning_rate": 5.180237221950345e-05, "loss": 0.0065, "step": 327970 }, { "epoch": 1.65, "learning_rate": 5.179480452648944e-05, "loss": 0.0056, "step": 327980 }, { "epoch": 1.65, "learning_rate": 5.178723683347543e-05, "loss": 0.0077, "step": 327990 }, { "epoch": 1.65, "learning_rate": 5.1779669140461424e-05, "loss": 0.0089, "step": 328000 }, { "epoch": 1.65, "eval_cer": 0.9144556999612812, "eval_loss": 0.0049345288425683975, "eval_runtime": 116.3068, "eval_samples_per_second": 17.196, "eval_steps_per_second": 4.299, "step": 328000 }, { "epoch": 1.65, "learning_rate": 5.177210144744741e-05, "loss": 0.0068, "step": 328010 }, { "epoch": 1.65, "learning_rate": 5.17645337544334e-05, "loss": 0.0093, "step": 328020 }, { "epoch": 1.65, "learning_rate": 5.175696606141939e-05, "loss": 0.0074, "step": 328030 }, { "epoch": 1.65, "learning_rate": 5.1749398368405384e-05, "loss": 0.006, "step": 328040 }, { "epoch": 1.66, "learning_rate": 5.174183067539137e-05, "loss": 0.0054, "step": 328050 }, { "epoch": 1.66, "learning_rate": 5.173426298237736e-05, "loss": 0.0055, "step": 328060 }, { "epoch": 1.66, "learning_rate": 5.172669528936335e-05, "loss": 0.0067, "step": 328070 }, { "epoch": 1.66, "learning_rate": 5.171912759634934e-05, "loss": 0.0064, "step": 328080 }, { "epoch": 1.66, "learning_rate": 5.171155990333533e-05, "loss": 0.0057, "step": 328090 }, { "epoch": 1.66, "learning_rate": 5.170399221032132e-05, "loss": 0.0059, "step": 328100 }, { "epoch": 1.66, "learning_rate": 5.169642451730731e-05, "loss": 0.0055, "step": 328110 }, { "epoch": 1.66, "learning_rate": 5.16888568242933e-05, "loss": 0.0057, "step": 328120 }, { "epoch": 1.66, "learning_rate": 5.168128913127929e-05, "loss": 0.0062, "step": 328130 }, { "epoch": 1.66, "learning_rate": 5.167372143826528e-05, "loss": 0.008, "step": 328140 }, { "epoch": 1.66, "learning_rate": 5.166615374525127e-05, "loss": 0.0073, "step": 328150 }, { "epoch": 1.66, "learning_rate": 5.165858605223726e-05, "loss": 0.005, "step": 328160 }, { "epoch": 1.66, "learning_rate": 5.165101835922325e-05, "loss": 0.0052, "step": 328170 }, { "epoch": 1.66, "learning_rate": 5.164345066620924e-05, "loss": 0.0042, "step": 328180 }, { "epoch": 1.66, "learning_rate": 5.163588297319523e-05, "loss": 0.0054, "step": 328190 }, { "epoch": 1.66, "learning_rate": 5.162831528018122e-05, "loss": 0.007, "step": 328200 }, { "epoch": 1.66, "learning_rate": 5.1620747587167204e-05, "loss": 0.0072, "step": 328210 }, { "epoch": 1.66, "learning_rate": 5.161317989415319e-05, "loss": 0.0086, "step": 328220 }, { "epoch": 1.66, "learning_rate": 5.160561220113918e-05, "loss": 0.0044, "step": 328230 }, { "epoch": 1.66, "learning_rate": 5.1598044508125175e-05, "loss": 0.0058, "step": 328240 }, { "epoch": 1.66, "learning_rate": 5.159047681511116e-05, "loss": 0.0049, "step": 328250 }, { "epoch": 1.66, "learning_rate": 5.158290912209715e-05, "loss": 0.0066, "step": 328260 }, { "epoch": 1.66, "learning_rate": 5.157534142908314e-05, "loss": 0.0059, "step": 328270 }, { "epoch": 1.66, "learning_rate": 5.1567773736069135e-05, "loss": 0.0073, "step": 328280 }, { "epoch": 1.66, "learning_rate": 5.156020604305512e-05, "loss": 0.0068, "step": 328290 }, { "epoch": 1.66, "learning_rate": 5.155263835004111e-05, "loss": 0.008, "step": 328300 }, { "epoch": 1.66, "learning_rate": 5.15450706570271e-05, "loss": 0.0054, "step": 328310 }, { "epoch": 1.66, "learning_rate": 5.1537502964013094e-05, "loss": 0.0054, "step": 328320 }, { "epoch": 1.66, "learning_rate": 5.152993527099908e-05, "loss": 0.0074, "step": 328330 }, { "epoch": 1.66, "learning_rate": 5.152236757798507e-05, "loss": 0.0094, "step": 328340 }, { "epoch": 1.66, "learning_rate": 5.151479988497106e-05, "loss": 0.0084, "step": 328350 }, { "epoch": 1.66, "learning_rate": 5.1507232191957054e-05, "loss": 0.0069, "step": 328360 }, { "epoch": 1.66, "learning_rate": 5.149966449894304e-05, "loss": 0.005, "step": 328370 }, { "epoch": 1.66, "learning_rate": 5.149209680592903e-05, "loss": 0.0066, "step": 328380 }, { "epoch": 1.66, "learning_rate": 5.148452911291502e-05, "loss": 0.0059, "step": 328390 }, { "epoch": 1.66, "learning_rate": 5.1476961419901014e-05, "loss": 0.0079, "step": 328400 }, { "epoch": 1.66, "learning_rate": 5.1469393726887e-05, "loss": 0.0079, "step": 328410 }, { "epoch": 1.66, "learning_rate": 5.146182603387299e-05, "loss": 0.0074, "step": 328420 }, { "epoch": 1.66, "learning_rate": 5.145425834085898e-05, "loss": 0.0066, "step": 328430 }, { "epoch": 1.66, "learning_rate": 5.144669064784497e-05, "loss": 0.0048, "step": 328440 }, { "epoch": 1.66, "learning_rate": 5.143912295483096e-05, "loss": 0.0058, "step": 328450 }, { "epoch": 1.66, "learning_rate": 5.143155526181695e-05, "loss": 0.0061, "step": 328460 }, { "epoch": 1.66, "learning_rate": 5.142398756880294e-05, "loss": 0.0051, "step": 328470 }, { "epoch": 1.66, "learning_rate": 5.141641987578893e-05, "loss": 0.006, "step": 328480 }, { "epoch": 1.66, "learning_rate": 5.140885218277492e-05, "loss": 0.006, "step": 328490 }, { "epoch": 1.66, "learning_rate": 5.140128448976091e-05, "loss": 0.0077, "step": 328500 }, { "epoch": 1.66, "learning_rate": 5.13937167967469e-05, "loss": 0.0054, "step": 328510 }, { "epoch": 1.66, "learning_rate": 5.138614910373288e-05, "loss": 0.0043, "step": 328520 }, { "epoch": 1.66, "learning_rate": 5.1378581410718874e-05, "loss": 0.0055, "step": 328530 }, { "epoch": 1.66, "learning_rate": 5.137101371770486e-05, "loss": 0.0091, "step": 328540 }, { "epoch": 1.66, "learning_rate": 5.136344602469085e-05, "loss": 0.0063, "step": 328550 }, { "epoch": 1.66, "learning_rate": 5.135587833167684e-05, "loss": 0.0076, "step": 328560 }, { "epoch": 1.66, "learning_rate": 5.1348310638662834e-05, "loss": 0.0081, "step": 328570 }, { "epoch": 1.66, "learning_rate": 5.134074294564882e-05, "loss": 0.0067, "step": 328580 }, { "epoch": 1.66, "learning_rate": 5.133317525263481e-05, "loss": 0.0059, "step": 328590 }, { "epoch": 1.66, "learning_rate": 5.13256075596208e-05, "loss": 0.0071, "step": 328600 }, { "epoch": 1.66, "learning_rate": 5.1318039866606793e-05, "loss": 0.007, "step": 328610 }, { "epoch": 1.66, "learning_rate": 5.131047217359278e-05, "loss": 0.0085, "step": 328620 }, { "epoch": 1.66, "learning_rate": 5.130290448057877e-05, "loss": 0.0058, "step": 328630 }, { "epoch": 1.66, "learning_rate": 5.129533678756476e-05, "loss": 0.0056, "step": 328640 }, { "epoch": 1.66, "learning_rate": 5.128776909455075e-05, "loss": 0.0051, "step": 328650 }, { "epoch": 1.66, "learning_rate": 5.128020140153674e-05, "loss": 0.005, "step": 328660 }, { "epoch": 1.66, "learning_rate": 5.127263370852273e-05, "loss": 0.0089, "step": 328670 }, { "epoch": 1.66, "learning_rate": 5.1265066015508724e-05, "loss": 0.0107, "step": 328680 }, { "epoch": 1.66, "learning_rate": 5.125749832249471e-05, "loss": 0.0069, "step": 328690 }, { "epoch": 1.66, "learning_rate": 5.12499306294807e-05, "loss": 0.0051, "step": 328700 }, { "epoch": 1.66, "learning_rate": 5.124236293646669e-05, "loss": 0.006, "step": 328710 }, { "epoch": 1.66, "learning_rate": 5.1234795243452684e-05, "loss": 0.0064, "step": 328720 }, { "epoch": 1.66, "learning_rate": 5.122722755043867e-05, "loss": 0.0046, "step": 328730 }, { "epoch": 1.66, "learning_rate": 5.121965985742466e-05, "loss": 0.0052, "step": 328740 }, { "epoch": 1.66, "learning_rate": 5.121209216441065e-05, "loss": 0.0061, "step": 328750 }, { "epoch": 1.66, "learning_rate": 5.1204524471396644e-05, "loss": 0.0053, "step": 328760 }, { "epoch": 1.66, "learning_rate": 5.119695677838263e-05, "loss": 0.0052, "step": 328770 }, { "epoch": 1.66, "learning_rate": 5.118938908536862e-05, "loss": 0.0067, "step": 328780 }, { "epoch": 1.66, "learning_rate": 5.118182139235461e-05, "loss": 0.0086, "step": 328790 }, { "epoch": 1.66, "learning_rate": 5.1174253699340603e-05, "loss": 0.0061, "step": 328800 }, { "epoch": 1.66, "learning_rate": 5.116668600632659e-05, "loss": 0.0055, "step": 328810 }, { "epoch": 1.66, "learning_rate": 5.115911831331258e-05, "loss": 0.0063, "step": 328820 }, { "epoch": 1.66, "learning_rate": 5.115155062029857e-05, "loss": 0.006, "step": 328830 }, { "epoch": 1.66, "learning_rate": 5.114398292728455e-05, "loss": 0.005, "step": 328840 }, { "epoch": 1.66, "learning_rate": 5.1136415234270545e-05, "loss": 0.0048, "step": 328850 }, { "epoch": 1.66, "learning_rate": 5.112884754125653e-05, "loss": 0.0061, "step": 328860 }, { "epoch": 1.66, "learning_rate": 5.112127984824252e-05, "loss": 0.0079, "step": 328870 }, { "epoch": 1.66, "learning_rate": 5.111371215522851e-05, "loss": 0.0086, "step": 328880 }, { "epoch": 1.66, "learning_rate": 5.1106144462214504e-05, "loss": 0.0037, "step": 328890 }, { "epoch": 1.66, "learning_rate": 5.109857676920049e-05, "loss": 0.0052, "step": 328900 }, { "epoch": 1.66, "learning_rate": 5.109100907618648e-05, "loss": 0.0073, "step": 328910 }, { "epoch": 1.66, "learning_rate": 5.108344138317247e-05, "loss": 0.0055, "step": 328920 }, { "epoch": 1.66, "learning_rate": 5.1075873690158464e-05, "loss": 0.0083, "step": 328930 }, { "epoch": 1.66, "learning_rate": 5.106830599714445e-05, "loss": 0.0063, "step": 328940 }, { "epoch": 1.66, "learning_rate": 5.106073830413044e-05, "loss": 0.0069, "step": 328950 }, { "epoch": 1.66, "learning_rate": 5.105317061111643e-05, "loss": 0.0074, "step": 328960 }, { "epoch": 1.66, "learning_rate": 5.1045602918102423e-05, "loss": 0.006, "step": 328970 }, { "epoch": 1.66, "learning_rate": 5.103803522508841e-05, "loss": 0.0075, "step": 328980 }, { "epoch": 1.66, "learning_rate": 5.10304675320744e-05, "loss": 0.0056, "step": 328990 }, { "epoch": 1.66, "learning_rate": 5.102289983906039e-05, "loss": 0.0058, "step": 329000 }, { "epoch": 1.66, "eval_cer": 0.914447936792278, "eval_loss": 0.004932132083922625, "eval_runtime": 116.3131, "eval_samples_per_second": 17.195, "eval_steps_per_second": 4.299, "step": 329000 }, { "epoch": 1.66, "learning_rate": 5.101533214604638e-05, "loss": 0.0061, "step": 329010 }, { "epoch": 1.66, "learning_rate": 5.100776445303237e-05, "loss": 0.0075, "step": 329020 }, { "epoch": 1.66, "learning_rate": 5.100019676001836e-05, "loss": 0.0103, "step": 329030 }, { "epoch": 1.66, "learning_rate": 5.099262906700435e-05, "loss": 0.0059, "step": 329040 }, { "epoch": 1.66, "learning_rate": 5.098506137399034e-05, "loss": 0.0064, "step": 329050 }, { "epoch": 1.66, "learning_rate": 5.097749368097633e-05, "loss": 0.0049, "step": 329060 }, { "epoch": 1.66, "learning_rate": 5.096992598796232e-05, "loss": 0.0054, "step": 329070 }, { "epoch": 1.66, "learning_rate": 5.096235829494831e-05, "loss": 0.007, "step": 329080 }, { "epoch": 1.66, "learning_rate": 5.09547906019343e-05, "loss": 0.0062, "step": 329090 }, { "epoch": 1.66, "learning_rate": 5.094722290892029e-05, "loss": 0.0097, "step": 329100 }, { "epoch": 1.66, "learning_rate": 5.093965521590628e-05, "loss": 0.0046, "step": 329110 }, { "epoch": 1.66, "learning_rate": 5.093208752289227e-05, "loss": 0.0081, "step": 329120 }, { "epoch": 1.66, "learning_rate": 5.092451982987826e-05, "loss": 0.0062, "step": 329130 }, { "epoch": 1.66, "learning_rate": 5.091695213686425e-05, "loss": 0.0056, "step": 329140 }, { "epoch": 1.66, "learning_rate": 5.090938444385023e-05, "loss": 0.0063, "step": 329150 }, { "epoch": 1.66, "learning_rate": 5.090181675083622e-05, "loss": 0.0051, "step": 329160 }, { "epoch": 1.66, "learning_rate": 5.0894249057822215e-05, "loss": 0.0069, "step": 329170 }, { "epoch": 1.66, "learning_rate": 5.08866813648082e-05, "loss": 0.0091, "step": 329180 }, { "epoch": 1.66, "learning_rate": 5.087911367179419e-05, "loss": 0.0064, "step": 329190 }, { "epoch": 1.66, "learning_rate": 5.087154597878018e-05, "loss": 0.0076, "step": 329200 }, { "epoch": 1.66, "learning_rate": 5.0863978285766175e-05, "loss": 0.0081, "step": 329210 }, { "epoch": 1.66, "learning_rate": 5.085641059275216e-05, "loss": 0.0079, "step": 329220 }, { "epoch": 1.66, "learning_rate": 5.084884289973815e-05, "loss": 0.0092, "step": 329230 }, { "epoch": 1.66, "learning_rate": 5.084127520672414e-05, "loss": 0.0064, "step": 329240 }, { "epoch": 1.66, "learning_rate": 5.0833707513710134e-05, "loss": 0.0042, "step": 329250 }, { "epoch": 1.66, "learning_rate": 5.082613982069612e-05, "loss": 0.0072, "step": 329260 }, { "epoch": 1.66, "learning_rate": 5.081857212768211e-05, "loss": 0.0075, "step": 329270 }, { "epoch": 1.66, "learning_rate": 5.08110044346681e-05, "loss": 0.0083, "step": 329280 }, { "epoch": 1.66, "learning_rate": 5.0803436741654094e-05, "loss": 0.0065, "step": 329290 }, { "epoch": 1.66, "learning_rate": 5.079586904864008e-05, "loss": 0.0045, "step": 329300 }, { "epoch": 1.66, "learning_rate": 5.078830135562607e-05, "loss": 0.0063, "step": 329310 }, { "epoch": 1.66, "learning_rate": 5.078073366261206e-05, "loss": 0.0064, "step": 329320 }, { "epoch": 1.66, "learning_rate": 5.0773165969598054e-05, "loss": 0.0069, "step": 329330 }, { "epoch": 1.66, "learning_rate": 5.076559827658404e-05, "loss": 0.0073, "step": 329340 }, { "epoch": 1.66, "learning_rate": 5.075803058357003e-05, "loss": 0.0062, "step": 329350 }, { "epoch": 1.66, "learning_rate": 5.075046289055602e-05, "loss": 0.0078, "step": 329360 }, { "epoch": 1.66, "learning_rate": 5.074289519754201e-05, "loss": 0.0059, "step": 329370 }, { "epoch": 1.66, "learning_rate": 5.0735327504528e-05, "loss": 0.0109, "step": 329380 }, { "epoch": 1.66, "learning_rate": 5.072775981151399e-05, "loss": 0.0044, "step": 329390 }, { "epoch": 1.66, "learning_rate": 5.072019211849998e-05, "loss": 0.0061, "step": 329400 }, { "epoch": 1.66, "learning_rate": 5.071262442548597e-05, "loss": 0.0076, "step": 329410 }, { "epoch": 1.66, "learning_rate": 5.070505673247196e-05, "loss": 0.0054, "step": 329420 }, { "epoch": 1.66, "learning_rate": 5.069748903945795e-05, "loss": 0.0061, "step": 329430 }, { "epoch": 1.66, "learning_rate": 5.068992134644394e-05, "loss": 0.0068, "step": 329440 }, { "epoch": 1.66, "learning_rate": 5.068235365342993e-05, "loss": 0.0077, "step": 329450 }, { "epoch": 1.66, "learning_rate": 5.067478596041592e-05, "loss": 0.008, "step": 329460 }, { "epoch": 1.66, "learning_rate": 5.06672182674019e-05, "loss": 0.0062, "step": 329470 }, { "epoch": 1.66, "learning_rate": 5.065965057438789e-05, "loss": 0.0064, "step": 329480 }, { "epoch": 1.66, "learning_rate": 5.065208288137388e-05, "loss": 0.0072, "step": 329490 }, { "epoch": 1.66, "learning_rate": 5.0644515188359874e-05, "loss": 0.0054, "step": 329500 }, { "epoch": 1.66, "learning_rate": 5.063694749534586e-05, "loss": 0.0047, "step": 329510 }, { "epoch": 1.66, "learning_rate": 5.062937980233185e-05, "loss": 0.0085, "step": 329520 }, { "epoch": 1.66, "learning_rate": 5.062181210931784e-05, "loss": 0.007, "step": 329530 }, { "epoch": 1.66, "learning_rate": 5.061424441630383e-05, "loss": 0.0064, "step": 329540 }, { "epoch": 1.66, "learning_rate": 5.060667672328982e-05, "loss": 0.0057, "step": 329550 }, { "epoch": 1.66, "learning_rate": 5.059910903027581e-05, "loss": 0.0054, "step": 329560 }, { "epoch": 1.66, "learning_rate": 5.05915413372618e-05, "loss": 0.0071, "step": 329570 }, { "epoch": 1.66, "learning_rate": 5.058397364424779e-05, "loss": 0.0069, "step": 329580 }, { "epoch": 1.66, "learning_rate": 5.057640595123378e-05, "loss": 0.0068, "step": 329590 }, { "epoch": 1.66, "learning_rate": 5.056883825821977e-05, "loss": 0.0047, "step": 329600 }, { "epoch": 1.66, "learning_rate": 5.056127056520576e-05, "loss": 0.006, "step": 329610 }, { "epoch": 1.66, "learning_rate": 5.055370287219175e-05, "loss": 0.0069, "step": 329620 }, { "epoch": 1.66, "learning_rate": 5.054613517917774e-05, "loss": 0.0072, "step": 329630 }, { "epoch": 1.66, "learning_rate": 5.053856748616373e-05, "loss": 0.0065, "step": 329640 }, { "epoch": 1.66, "learning_rate": 5.0530999793149724e-05, "loss": 0.0072, "step": 329650 }, { "epoch": 1.66, "learning_rate": 5.052343210013571e-05, "loss": 0.0083, "step": 329660 }, { "epoch": 1.66, "learning_rate": 5.05158644071217e-05, "loss": 0.0061, "step": 329670 }, { "epoch": 1.66, "learning_rate": 5.050829671410769e-05, "loss": 0.0061, "step": 329680 }, { "epoch": 1.66, "learning_rate": 5.0500729021093684e-05, "loss": 0.0079, "step": 329690 }, { "epoch": 1.66, "learning_rate": 5.049316132807967e-05, "loss": 0.0057, "step": 329700 }, { "epoch": 1.66, "learning_rate": 5.048559363506566e-05, "loss": 0.0061, "step": 329710 }, { "epoch": 1.66, "learning_rate": 5.047802594205165e-05, "loss": 0.0071, "step": 329720 }, { "epoch": 1.66, "learning_rate": 5.047045824903764e-05, "loss": 0.0062, "step": 329730 }, { "epoch": 1.66, "learning_rate": 5.046289055602363e-05, "loss": 0.0075, "step": 329740 }, { "epoch": 1.66, "learning_rate": 5.045532286300962e-05, "loss": 0.0062, "step": 329750 }, { "epoch": 1.66, "learning_rate": 5.044775516999561e-05, "loss": 0.0061, "step": 329760 }, { "epoch": 1.66, "learning_rate": 5.04401874769816e-05, "loss": 0.0073, "step": 329770 }, { "epoch": 1.66, "learning_rate": 5.0432619783967584e-05, "loss": 0.0082, "step": 329780 }, { "epoch": 1.66, "learning_rate": 5.042505209095357e-05, "loss": 0.0096, "step": 329790 }, { "epoch": 1.66, "learning_rate": 5.041748439793956e-05, "loss": 0.0054, "step": 329800 }, { "epoch": 1.66, "learning_rate": 5.040991670492555e-05, "loss": 0.0064, "step": 329810 }, { "epoch": 1.66, "learning_rate": 5.0402349011911544e-05, "loss": 0.0067, "step": 329820 }, { "epoch": 1.66, "learning_rate": 5.039478131889753e-05, "loss": 0.0074, "step": 329830 }, { "epoch": 1.66, "learning_rate": 5.038721362588352e-05, "loss": 0.0054, "step": 329840 }, { "epoch": 1.66, "learning_rate": 5.037964593286951e-05, "loss": 0.006, "step": 329850 }, { "epoch": 1.66, "learning_rate": 5.0372078239855504e-05, "loss": 0.0051, "step": 329860 }, { "epoch": 1.66, "learning_rate": 5.036451054684149e-05, "loss": 0.0104, "step": 329870 }, { "epoch": 1.66, "learning_rate": 5.035694285382748e-05, "loss": 0.0092, "step": 329880 }, { "epoch": 1.66, "learning_rate": 5.034937516081347e-05, "loss": 0.0056, "step": 329890 }, { "epoch": 1.66, "learning_rate": 5.034180746779946e-05, "loss": 0.0066, "step": 329900 }, { "epoch": 1.66, "learning_rate": 5.033423977478545e-05, "loss": 0.0043, "step": 329910 }, { "epoch": 1.66, "learning_rate": 5.032667208177144e-05, "loss": 0.0056, "step": 329920 }, { "epoch": 1.66, "learning_rate": 5.031910438875743e-05, "loss": 0.0056, "step": 329930 }, { "epoch": 1.66, "learning_rate": 5.031153669574342e-05, "loss": 0.0047, "step": 329940 }, { "epoch": 1.66, "learning_rate": 5.030396900272941e-05, "loss": 0.0059, "step": 329950 }, { "epoch": 1.66, "learning_rate": 5.02964013097154e-05, "loss": 0.0065, "step": 329960 }, { "epoch": 1.66, "learning_rate": 5.028883361670139e-05, "loss": 0.0067, "step": 329970 }, { "epoch": 1.66, "learning_rate": 5.028126592368738e-05, "loss": 0.0058, "step": 329980 }, { "epoch": 1.66, "learning_rate": 5.027369823067337e-05, "loss": 0.0065, "step": 329990 }, { "epoch": 1.66, "learning_rate": 5.026613053765936e-05, "loss": 0.0077, "step": 330000 }, { "epoch": 1.66, "eval_cer": 0.9144411440194001, "eval_loss": 0.0048608663491904736, "eval_runtime": 116.3415, "eval_samples_per_second": 17.191, "eval_steps_per_second": 4.298, "step": 330000 }, { "epoch": 1.66, "learning_rate": 5.025856284464535e-05, "loss": 0.0047, "step": 330010 }, { "epoch": 1.66, "learning_rate": 5.025099515163134e-05, "loss": 0.0089, "step": 330020 }, { "epoch": 1.67, "learning_rate": 5.024342745861733e-05, "loss": 0.0044, "step": 330030 }, { "epoch": 1.67, "learning_rate": 5.023585976560332e-05, "loss": 0.0054, "step": 330040 }, { "epoch": 1.67, "learning_rate": 5.022829207258931e-05, "loss": 0.0054, "step": 330050 }, { "epoch": 1.67, "learning_rate": 5.02207243795753e-05, "loss": 0.0059, "step": 330060 }, { "epoch": 1.67, "learning_rate": 5.021315668656129e-05, "loss": 0.0058, "step": 330070 }, { "epoch": 1.67, "learning_rate": 5.020558899354728e-05, "loss": 0.0048, "step": 330080 }, { "epoch": 1.67, "learning_rate": 5.019802130053326e-05, "loss": 0.0071, "step": 330090 }, { "epoch": 1.67, "learning_rate": 5.0190453607519255e-05, "loss": 0.0059, "step": 330100 }, { "epoch": 1.67, "learning_rate": 5.018288591450524e-05, "loss": 0.0076, "step": 330110 }, { "epoch": 1.67, "learning_rate": 5.017531822149123e-05, "loss": 0.0066, "step": 330120 }, { "epoch": 1.67, "learning_rate": 5.016775052847722e-05, "loss": 0.0075, "step": 330130 }, { "epoch": 1.67, "learning_rate": 5.0160182835463214e-05, "loss": 0.007, "step": 330140 }, { "epoch": 1.67, "learning_rate": 5.01526151424492e-05, "loss": 0.01, "step": 330150 }, { "epoch": 1.67, "learning_rate": 5.014504744943519e-05, "loss": 0.0053, "step": 330160 }, { "epoch": 1.67, "learning_rate": 5.013747975642118e-05, "loss": 0.0063, "step": 330170 }, { "epoch": 1.67, "learning_rate": 5.0129912063407174e-05, "loss": 0.0064, "step": 330180 }, { "epoch": 1.67, "learning_rate": 5.012234437039316e-05, "loss": 0.0063, "step": 330190 }, { "epoch": 1.67, "learning_rate": 5.011477667737915e-05, "loss": 0.0055, "step": 330200 }, { "epoch": 1.67, "learning_rate": 5.010720898436514e-05, "loss": 0.0057, "step": 330210 }, { "epoch": 1.67, "learning_rate": 5.0099641291351134e-05, "loss": 0.0065, "step": 330220 }, { "epoch": 1.67, "learning_rate": 5.009207359833712e-05, "loss": 0.0079, "step": 330230 }, { "epoch": 1.67, "learning_rate": 5.008450590532311e-05, "loss": 0.0063, "step": 330240 }, { "epoch": 1.67, "learning_rate": 5.00769382123091e-05, "loss": 0.005, "step": 330250 }, { "epoch": 1.67, "learning_rate": 5.0069370519295093e-05, "loss": 0.0066, "step": 330260 }, { "epoch": 1.67, "learning_rate": 5.006180282628108e-05, "loss": 0.0073, "step": 330270 }, { "epoch": 1.67, "learning_rate": 5.005423513326707e-05, "loss": 0.0053, "step": 330280 }, { "epoch": 1.67, "learning_rate": 5.004666744025306e-05, "loss": 0.0074, "step": 330290 }, { "epoch": 1.67, "learning_rate": 5.003909974723905e-05, "loss": 0.006, "step": 330300 }, { "epoch": 1.67, "learning_rate": 5.003153205422504e-05, "loss": 0.0068, "step": 330310 }, { "epoch": 1.67, "learning_rate": 5.002396436121103e-05, "loss": 0.006, "step": 330320 }, { "epoch": 1.67, "learning_rate": 5.001639666819702e-05, "loss": 0.0099, "step": 330330 }, { "epoch": 1.67, "learning_rate": 5.000882897518301e-05, "loss": 0.0059, "step": 330340 }, { "epoch": 1.67, "learning_rate": 5.0001261282169e-05, "loss": 0.0059, "step": 330350 }, { "epoch": 1.67, "learning_rate": 4.999369358915499e-05, "loss": 0.0065, "step": 330360 }, { "epoch": 1.67, "learning_rate": 4.998612589614098e-05, "loss": 0.0073, "step": 330370 }, { "epoch": 1.67, "learning_rate": 4.997855820312697e-05, "loss": 0.0072, "step": 330380 }, { "epoch": 1.67, "learning_rate": 4.997099051011296e-05, "loss": 0.0075, "step": 330390 }, { "epoch": 1.67, "learning_rate": 4.996342281709895e-05, "loss": 0.0042, "step": 330400 }, { "epoch": 1.67, "learning_rate": 4.995585512408493e-05, "loss": 0.0054, "step": 330410 }, { "epoch": 1.67, "learning_rate": 4.994828743107092e-05, "loss": 0.0071, "step": 330420 }, { "epoch": 1.67, "learning_rate": 4.9940719738056913e-05, "loss": 0.0069, "step": 330430 }, { "epoch": 1.67, "learning_rate": 4.99331520450429e-05, "loss": 0.0085, "step": 330440 }, { "epoch": 1.67, "learning_rate": 4.992558435202889e-05, "loss": 0.0114, "step": 330450 }, { "epoch": 1.67, "learning_rate": 4.991801665901488e-05, "loss": 0.0063, "step": 330460 }, { "epoch": 1.67, "learning_rate": 4.991044896600087e-05, "loss": 0.0049, "step": 330470 }, { "epoch": 1.67, "learning_rate": 4.990288127298686e-05, "loss": 0.0147, "step": 330480 }, { "epoch": 1.67, "learning_rate": 4.989531357997285e-05, "loss": 0.0079, "step": 330490 }, { "epoch": 1.67, "learning_rate": 4.988774588695884e-05, "loss": 0.0078, "step": 330500 }, { "epoch": 1.67, "learning_rate": 4.988017819394483e-05, "loss": 0.0068, "step": 330510 }, { "epoch": 1.67, "learning_rate": 4.987261050093082e-05, "loss": 0.0068, "step": 330520 }, { "epoch": 1.67, "learning_rate": 4.986504280791681e-05, "loss": 0.0074, "step": 330530 }, { "epoch": 1.67, "learning_rate": 4.98574751149028e-05, "loss": 0.0063, "step": 330540 }, { "epoch": 1.67, "learning_rate": 4.984990742188879e-05, "loss": 0.0065, "step": 330550 }, { "epoch": 1.67, "learning_rate": 4.984233972887478e-05, "loss": 0.0055, "step": 330560 }, { "epoch": 1.67, "learning_rate": 4.983477203586077e-05, "loss": 0.0076, "step": 330570 }, { "epoch": 1.67, "learning_rate": 4.982720434284676e-05, "loss": 0.0055, "step": 330580 }, { "epoch": 1.67, "learning_rate": 4.981963664983275e-05, "loss": 0.0046, "step": 330590 }, { "epoch": 1.67, "learning_rate": 4.981206895681874e-05, "loss": 0.0068, "step": 330600 }, { "epoch": 1.67, "learning_rate": 4.980450126380473e-05, "loss": 0.0074, "step": 330610 }, { "epoch": 1.67, "learning_rate": 4.9796933570790724e-05, "loss": 0.006, "step": 330620 }, { "epoch": 1.67, "learning_rate": 4.978936587777671e-05, "loss": 0.0085, "step": 330630 }, { "epoch": 1.67, "learning_rate": 4.97817981847627e-05, "loss": 0.0052, "step": 330640 }, { "epoch": 1.67, "learning_rate": 4.977423049174869e-05, "loss": 0.0072, "step": 330650 }, { "epoch": 1.67, "learning_rate": 4.976666279873468e-05, "loss": 0.0066, "step": 330660 }, { "epoch": 1.67, "learning_rate": 4.975909510572067e-05, "loss": 0.0069, "step": 330670 }, { "epoch": 1.67, "learning_rate": 4.975152741270666e-05, "loss": 0.0071, "step": 330680 }, { "epoch": 1.67, "learning_rate": 4.974395971969265e-05, "loss": 0.0065, "step": 330690 }, { "epoch": 1.67, "learning_rate": 4.973639202667864e-05, "loss": 0.0071, "step": 330700 }, { "epoch": 1.67, "learning_rate": 4.972882433366463e-05, "loss": 0.0089, "step": 330710 }, { "epoch": 1.67, "learning_rate": 4.972125664065061e-05, "loss": 0.0071, "step": 330720 }, { "epoch": 1.67, "learning_rate": 4.97136889476366e-05, "loss": 0.0068, "step": 330730 }, { "epoch": 1.67, "learning_rate": 4.970612125462259e-05, "loss": 0.0069, "step": 330740 }, { "epoch": 1.67, "learning_rate": 4.9698553561608584e-05, "loss": 0.0073, "step": 330750 }, { "epoch": 1.67, "learning_rate": 4.969098586859457e-05, "loss": 0.005, "step": 330760 }, { "epoch": 1.67, "learning_rate": 4.968341817558056e-05, "loss": 0.0039, "step": 330770 }, { "epoch": 1.67, "learning_rate": 4.967585048256655e-05, "loss": 0.0102, "step": 330780 }, { "epoch": 1.67, "learning_rate": 4.9668282789552544e-05, "loss": 0.0076, "step": 330790 }, { "epoch": 1.67, "learning_rate": 4.966071509653853e-05, "loss": 0.006, "step": 330800 }, { "epoch": 1.67, "learning_rate": 4.965314740352452e-05, "loss": 0.0046, "step": 330810 }, { "epoch": 1.67, "learning_rate": 4.964557971051051e-05, "loss": 0.0051, "step": 330820 }, { "epoch": 1.67, "learning_rate": 4.96380120174965e-05, "loss": 0.0071, "step": 330830 }, { "epoch": 1.67, "learning_rate": 4.963044432448249e-05, "loss": 0.0065, "step": 330840 }, { "epoch": 1.67, "learning_rate": 4.962287663146848e-05, "loss": 0.0063, "step": 330850 }, { "epoch": 1.67, "learning_rate": 4.961530893845447e-05, "loss": 0.0069, "step": 330860 }, { "epoch": 1.67, "learning_rate": 4.960774124544046e-05, "loss": 0.0075, "step": 330870 }, { "epoch": 1.67, "learning_rate": 4.960017355242645e-05, "loss": 0.0052, "step": 330880 }, { "epoch": 1.67, "learning_rate": 4.959260585941244e-05, "loss": 0.0052, "step": 330890 }, { "epoch": 1.67, "learning_rate": 4.958503816639843e-05, "loss": 0.0063, "step": 330900 }, { "epoch": 1.67, "learning_rate": 4.957747047338442e-05, "loss": 0.0069, "step": 330910 }, { "epoch": 1.67, "learning_rate": 4.956990278037041e-05, "loss": 0.007, "step": 330920 }, { "epoch": 1.67, "learning_rate": 4.95623350873564e-05, "loss": 0.0081, "step": 330930 }, { "epoch": 1.67, "learning_rate": 4.955476739434239e-05, "loss": 0.0058, "step": 330940 }, { "epoch": 1.67, "learning_rate": 4.954719970132838e-05, "loss": 0.0089, "step": 330950 }, { "epoch": 1.67, "learning_rate": 4.953963200831437e-05, "loss": 0.007, "step": 330960 }, { "epoch": 1.67, "learning_rate": 4.953206431530036e-05, "loss": 0.006, "step": 330970 }, { "epoch": 1.67, "learning_rate": 4.952449662228635e-05, "loss": 0.0066, "step": 330980 }, { "epoch": 1.67, "learning_rate": 4.951692892927234e-05, "loss": 0.0059, "step": 330990 }, { "epoch": 1.67, "learning_rate": 4.950936123625833e-05, "loss": 0.0054, "step": 331000 }, { "epoch": 1.67, "eval_cer": 0.9144440552077764, "eval_loss": 0.004910916555672884, "eval_runtime": 116.3705, "eval_samples_per_second": 17.186, "eval_steps_per_second": 4.297, "step": 331000 }, { "epoch": 1.67, "learning_rate": 4.950179354324432e-05, "loss": 0.0073, "step": 331010 }, { "epoch": 1.67, "learning_rate": 4.9494225850230306e-05, "loss": 0.0054, "step": 331020 }, { "epoch": 1.67, "learning_rate": 4.94866581572163e-05, "loss": 0.0066, "step": 331030 }, { "epoch": 1.67, "learning_rate": 4.947909046420228e-05, "loss": 0.0073, "step": 331040 }, { "epoch": 1.67, "learning_rate": 4.947152277118827e-05, "loss": 0.0093, "step": 331050 }, { "epoch": 1.67, "learning_rate": 4.946395507817426e-05, "loss": 0.0066, "step": 331060 }, { "epoch": 1.67, "learning_rate": 4.9456387385160254e-05, "loss": 0.0041, "step": 331070 }, { "epoch": 1.67, "learning_rate": 4.944881969214624e-05, "loss": 0.0065, "step": 331080 }, { "epoch": 1.67, "learning_rate": 4.944125199913223e-05, "loss": 0.005, "step": 331090 }, { "epoch": 1.67, "learning_rate": 4.943368430611822e-05, "loss": 0.0068, "step": 331100 }, { "epoch": 1.67, "learning_rate": 4.9426116613104214e-05, "loss": 0.0081, "step": 331110 }, { "epoch": 1.67, "learning_rate": 4.94185489200902e-05, "loss": 0.006, "step": 331120 }, { "epoch": 1.67, "learning_rate": 4.941098122707619e-05, "loss": 0.0072, "step": 331130 }, { "epoch": 1.67, "learning_rate": 4.940341353406218e-05, "loss": 0.0058, "step": 331140 }, { "epoch": 1.67, "learning_rate": 4.9395845841048174e-05, "loss": 0.0077, "step": 331150 }, { "epoch": 1.67, "learning_rate": 4.938827814803416e-05, "loss": 0.005, "step": 331160 }, { "epoch": 1.67, "learning_rate": 4.938071045502015e-05, "loss": 0.0091, "step": 331170 }, { "epoch": 1.67, "learning_rate": 4.937314276200614e-05, "loss": 0.006, "step": 331180 }, { "epoch": 1.67, "learning_rate": 4.936557506899213e-05, "loss": 0.0051, "step": 331190 }, { "epoch": 1.67, "learning_rate": 4.935800737597812e-05, "loss": 0.0047, "step": 331200 }, { "epoch": 1.67, "learning_rate": 4.935043968296411e-05, "loss": 0.006, "step": 331210 }, { "epoch": 1.67, "learning_rate": 4.93428719899501e-05, "loss": 0.0071, "step": 331220 }, { "epoch": 1.67, "learning_rate": 4.933530429693609e-05, "loss": 0.0066, "step": 331230 }, { "epoch": 1.67, "learning_rate": 4.932773660392208e-05, "loss": 0.0072, "step": 331240 }, { "epoch": 1.67, "learning_rate": 4.932016891090807e-05, "loss": 0.0072, "step": 331250 }, { "epoch": 1.67, "learning_rate": 4.931260121789406e-05, "loss": 0.0077, "step": 331260 }, { "epoch": 1.67, "learning_rate": 4.930503352488005e-05, "loss": 0.0057, "step": 331270 }, { "epoch": 1.67, "learning_rate": 4.929746583186604e-05, "loss": 0.0063, "step": 331280 }, { "epoch": 1.67, "learning_rate": 4.928989813885203e-05, "loss": 0.0064, "step": 331290 }, { "epoch": 1.67, "learning_rate": 4.928233044583802e-05, "loss": 0.0052, "step": 331300 }, { "epoch": 1.67, "learning_rate": 4.927476275282401e-05, "loss": 0.008, "step": 331310 }, { "epoch": 1.67, "learning_rate": 4.926719505981e-05, "loss": 0.0098, "step": 331320 }, { "epoch": 1.67, "learning_rate": 4.925962736679599e-05, "loss": 0.0051, "step": 331330 }, { "epoch": 1.67, "learning_rate": 4.925205967378198e-05, "loss": 0.0079, "step": 331340 }, { "epoch": 1.67, "learning_rate": 4.924449198076796e-05, "loss": 0.0053, "step": 331350 }, { "epoch": 1.67, "learning_rate": 4.923692428775395e-05, "loss": 0.0054, "step": 331360 }, { "epoch": 1.67, "learning_rate": 4.922935659473994e-05, "loss": 0.0062, "step": 331370 }, { "epoch": 1.67, "learning_rate": 4.922178890172593e-05, "loss": 0.0085, "step": 331380 }, { "epoch": 1.67, "learning_rate": 4.921422120871192e-05, "loss": 0.0054, "step": 331390 }, { "epoch": 1.67, "learning_rate": 4.920665351569791e-05, "loss": 0.006, "step": 331400 }, { "epoch": 1.67, "learning_rate": 4.91990858226839e-05, "loss": 0.007, "step": 331410 }, { "epoch": 1.67, "learning_rate": 4.919151812966989e-05, "loss": 0.0071, "step": 331420 }, { "epoch": 1.67, "learning_rate": 4.918395043665588e-05, "loss": 0.0067, "step": 331430 }, { "epoch": 1.67, "learning_rate": 4.917638274364187e-05, "loss": 0.0056, "step": 331440 }, { "epoch": 1.67, "learning_rate": 4.916881505062786e-05, "loss": 0.005, "step": 331450 }, { "epoch": 1.67, "learning_rate": 4.916124735761385e-05, "loss": 0.0062, "step": 331460 }, { "epoch": 1.67, "learning_rate": 4.915367966459984e-05, "loss": 0.0053, "step": 331470 }, { "epoch": 1.67, "learning_rate": 4.914611197158583e-05, "loss": 0.0065, "step": 331480 }, { "epoch": 1.67, "learning_rate": 4.913854427857182e-05, "loss": 0.0052, "step": 331490 }, { "epoch": 1.67, "learning_rate": 4.913097658555781e-05, "loss": 0.0074, "step": 331500 }, { "epoch": 1.67, "learning_rate": 4.91234088925438e-05, "loss": 0.0082, "step": 331510 }, { "epoch": 1.67, "learning_rate": 4.911584119952979e-05, "loss": 0.0073, "step": 331520 }, { "epoch": 1.67, "learning_rate": 4.910827350651578e-05, "loss": 0.0059, "step": 331530 }, { "epoch": 1.67, "learning_rate": 4.910070581350177e-05, "loss": 0.0064, "step": 331540 }, { "epoch": 1.67, "learning_rate": 4.909313812048776e-05, "loss": 0.0079, "step": 331550 }, { "epoch": 1.67, "learning_rate": 4.908557042747375e-05, "loss": 0.0069, "step": 331560 }, { "epoch": 1.67, "learning_rate": 4.907800273445974e-05, "loss": 0.0056, "step": 331570 }, { "epoch": 1.67, "learning_rate": 4.907043504144573e-05, "loss": 0.0063, "step": 331580 }, { "epoch": 1.67, "learning_rate": 4.906286734843172e-05, "loss": 0.0058, "step": 331590 }, { "epoch": 1.67, "learning_rate": 4.905529965541771e-05, "loss": 0.0055, "step": 331600 }, { "epoch": 1.67, "learning_rate": 4.90477319624037e-05, "loss": 0.0057, "step": 331610 }, { "epoch": 1.67, "learning_rate": 4.904016426938969e-05, "loss": 0.0061, "step": 331620 }, { "epoch": 1.67, "learning_rate": 4.903259657637568e-05, "loss": 0.0098, "step": 331630 }, { "epoch": 1.67, "learning_rate": 4.902502888336167e-05, "loss": 0.0059, "step": 331640 }, { "epoch": 1.67, "learning_rate": 4.901746119034766e-05, "loss": 0.0063, "step": 331650 }, { "epoch": 1.67, "learning_rate": 4.900989349733365e-05, "loss": 0.0059, "step": 331660 }, { "epoch": 1.67, "learning_rate": 4.900232580431963e-05, "loss": 0.0053, "step": 331670 }, { "epoch": 1.67, "learning_rate": 4.8994758111305624e-05, "loss": 0.0057, "step": 331680 }, { "epoch": 1.67, "learning_rate": 4.898719041829161e-05, "loss": 0.0047, "step": 331690 }, { "epoch": 1.67, "learning_rate": 4.89796227252776e-05, "loss": 0.0072, "step": 331700 }, { "epoch": 1.67, "learning_rate": 4.897205503226359e-05, "loss": 0.0072, "step": 331710 }, { "epoch": 1.67, "learning_rate": 4.8964487339249583e-05, "loss": 0.006, "step": 331720 }, { "epoch": 1.67, "learning_rate": 4.895691964623557e-05, "loss": 0.0048, "step": 331730 }, { "epoch": 1.67, "learning_rate": 4.894935195322156e-05, "loss": 0.0062, "step": 331740 }, { "epoch": 1.67, "learning_rate": 4.894178426020755e-05, "loss": 0.0061, "step": 331750 }, { "epoch": 1.67, "learning_rate": 4.893421656719354e-05, "loss": 0.006, "step": 331760 }, { "epoch": 1.67, "learning_rate": 4.892664887417953e-05, "loss": 0.0085, "step": 331770 }, { "epoch": 1.67, "learning_rate": 4.891908118116552e-05, "loss": 0.007, "step": 331780 }, { "epoch": 1.67, "learning_rate": 4.891151348815151e-05, "loss": 0.0071, "step": 331790 }, { "epoch": 1.67, "learning_rate": 4.89039457951375e-05, "loss": 0.0085, "step": 331800 }, { "epoch": 1.67, "learning_rate": 4.889637810212349e-05, "loss": 0.0073, "step": 331810 }, { "epoch": 1.67, "learning_rate": 4.888881040910948e-05, "loss": 0.0093, "step": 331820 }, { "epoch": 1.67, "learning_rate": 4.888124271609547e-05, "loss": 0.0111, "step": 331830 }, { "epoch": 1.67, "learning_rate": 4.887367502308146e-05, "loss": 0.0066, "step": 331840 }, { "epoch": 1.67, "learning_rate": 4.886610733006745e-05, "loss": 0.0075, "step": 331850 }, { "epoch": 1.67, "learning_rate": 4.885853963705344e-05, "loss": 0.0053, "step": 331860 }, { "epoch": 1.67, "learning_rate": 4.885097194403943e-05, "loss": 0.008, "step": 331870 }, { "epoch": 1.67, "learning_rate": 4.884340425102542e-05, "loss": 0.0072, "step": 331880 }, { "epoch": 1.67, "learning_rate": 4.883583655801141e-05, "loss": 0.0046, "step": 331890 }, { "epoch": 1.67, "learning_rate": 4.88282688649974e-05, "loss": 0.0066, "step": 331900 }, { "epoch": 1.67, "learning_rate": 4.882070117198339e-05, "loss": 0.0073, "step": 331910 }, { "epoch": 1.67, "learning_rate": 4.881313347896938e-05, "loss": 0.0062, "step": 331920 }, { "epoch": 1.67, "learning_rate": 4.880556578595537e-05, "loss": 0.0063, "step": 331930 }, { "epoch": 1.67, "learning_rate": 4.879799809294136e-05, "loss": 0.0088, "step": 331940 }, { "epoch": 1.67, "learning_rate": 4.8790430399927346e-05, "loss": 0.0054, "step": 331950 }, { "epoch": 1.67, "learning_rate": 4.878286270691334e-05, "loss": 0.0048, "step": 331960 }, { "epoch": 1.67, "learning_rate": 4.877529501389933e-05, "loss": 0.0063, "step": 331970 }, { "epoch": 1.67, "learning_rate": 4.876772732088531e-05, "loss": 0.0073, "step": 331980 }, { "epoch": 1.67, "learning_rate": 4.87601596278713e-05, "loss": 0.0064, "step": 331990 }, { "epoch": 1.67, "learning_rate": 4.875259193485729e-05, "loss": 0.0059, "step": 332000 }, { "epoch": 1.67, "eval_cer": 0.9144421144155256, "eval_loss": 0.004793255589902401, "eval_runtime": 116.2412, "eval_samples_per_second": 17.206, "eval_steps_per_second": 4.301, "step": 332000 }, { "epoch": 1.68, "learning_rate": 4.874502424184328e-05, "loss": 0.0078, "step": 332010 }, { "epoch": 1.68, "learning_rate": 4.873745654882927e-05, "loss": 0.0072, "step": 332020 }, { "epoch": 1.68, "learning_rate": 4.872988885581526e-05, "loss": 0.0064, "step": 332030 }, { "epoch": 1.68, "learning_rate": 4.8722321162801254e-05, "loss": 0.0058, "step": 332040 }, { "epoch": 1.68, "learning_rate": 4.871475346978724e-05, "loss": 0.0059, "step": 332050 }, { "epoch": 1.68, "learning_rate": 4.870718577677323e-05, "loss": 0.0055, "step": 332060 }, { "epoch": 1.68, "learning_rate": 4.869961808375922e-05, "loss": 0.0055, "step": 332070 }, { "epoch": 1.68, "learning_rate": 4.8692050390745214e-05, "loss": 0.0047, "step": 332080 }, { "epoch": 1.68, "learning_rate": 4.86844826977312e-05, "loss": 0.0085, "step": 332090 }, { "epoch": 1.68, "learning_rate": 4.867691500471719e-05, "loss": 0.0058, "step": 332100 }, { "epoch": 1.68, "learning_rate": 4.866934731170318e-05, "loss": 0.0076, "step": 332110 }, { "epoch": 1.68, "learning_rate": 4.866177961868917e-05, "loss": 0.0057, "step": 332120 }, { "epoch": 1.68, "learning_rate": 4.865421192567516e-05, "loss": 0.0072, "step": 332130 }, { "epoch": 1.68, "learning_rate": 4.864664423266115e-05, "loss": 0.0079, "step": 332140 }, { "epoch": 1.68, "learning_rate": 4.863907653964714e-05, "loss": 0.0051, "step": 332150 }, { "epoch": 1.68, "learning_rate": 4.863150884663313e-05, "loss": 0.0096, "step": 332160 }, { "epoch": 1.68, "learning_rate": 4.862394115361912e-05, "loss": 0.0077, "step": 332170 }, { "epoch": 1.68, "learning_rate": 4.861637346060511e-05, "loss": 0.0078, "step": 332180 }, { "epoch": 1.68, "learning_rate": 4.86088057675911e-05, "loss": 0.0073, "step": 332190 }, { "epoch": 1.68, "learning_rate": 4.860123807457709e-05, "loss": 0.006, "step": 332200 }, { "epoch": 1.68, "learning_rate": 4.859367038156308e-05, "loss": 0.007, "step": 332210 }, { "epoch": 1.68, "learning_rate": 4.858610268854907e-05, "loss": 0.006, "step": 332220 }, { "epoch": 1.68, "learning_rate": 4.857853499553506e-05, "loss": 0.0058, "step": 332230 }, { "epoch": 1.68, "learning_rate": 4.857096730252105e-05, "loss": 0.0128, "step": 332240 }, { "epoch": 1.68, "learning_rate": 4.856339960950704e-05, "loss": 0.0053, "step": 332250 }, { "epoch": 1.68, "learning_rate": 4.855583191649303e-05, "loss": 0.0079, "step": 332260 }, { "epoch": 1.68, "learning_rate": 4.854826422347902e-05, "loss": 0.0048, "step": 332270 }, { "epoch": 1.68, "learning_rate": 4.854069653046501e-05, "loss": 0.0041, "step": 332280 }, { "epoch": 1.68, "learning_rate": 4.853312883745099e-05, "loss": 0.0061, "step": 332290 }, { "epoch": 1.68, "learning_rate": 4.852556114443698e-05, "loss": 0.0059, "step": 332300 }, { "epoch": 1.68, "learning_rate": 4.851799345142297e-05, "loss": 0.0077, "step": 332310 }, { "epoch": 1.68, "learning_rate": 4.851042575840896e-05, "loss": 0.0062, "step": 332320 }, { "epoch": 1.68, "learning_rate": 4.850285806539495e-05, "loss": 0.0076, "step": 332330 }, { "epoch": 1.68, "learning_rate": 4.849529037238094e-05, "loss": 0.0054, "step": 332340 }, { "epoch": 1.68, "learning_rate": 4.848772267936693e-05, "loss": 0.0063, "step": 332350 }, { "epoch": 1.68, "learning_rate": 4.848015498635292e-05, "loss": 0.0049, "step": 332360 }, { "epoch": 1.68, "learning_rate": 4.847258729333891e-05, "loss": 0.0073, "step": 332370 }, { "epoch": 1.68, "learning_rate": 4.84650196003249e-05, "loss": 0.0047, "step": 332380 }, { "epoch": 1.68, "learning_rate": 4.845745190731089e-05, "loss": 0.0057, "step": 332390 }, { "epoch": 1.68, "learning_rate": 4.844988421429688e-05, "loss": 0.0062, "step": 332400 }, { "epoch": 1.68, "learning_rate": 4.844231652128287e-05, "loss": 0.0053, "step": 332410 }, { "epoch": 1.68, "learning_rate": 4.843474882826886e-05, "loss": 0.0067, "step": 332420 }, { "epoch": 1.68, "learning_rate": 4.842718113525485e-05, "loss": 0.0082, "step": 332430 }, { "epoch": 1.68, "learning_rate": 4.841961344224084e-05, "loss": 0.0077, "step": 332440 }, { "epoch": 1.68, "learning_rate": 4.841204574922683e-05, "loss": 0.0062, "step": 332450 }, { "epoch": 1.68, "learning_rate": 4.840447805621282e-05, "loss": 0.0062, "step": 332460 }, { "epoch": 1.68, "learning_rate": 4.839691036319881e-05, "loss": 0.0064, "step": 332470 }, { "epoch": 1.68, "learning_rate": 4.8389342670184797e-05, "loss": 0.0048, "step": 332480 }, { "epoch": 1.68, "learning_rate": 4.838177497717079e-05, "loss": 0.0069, "step": 332490 }, { "epoch": 1.68, "learning_rate": 4.837420728415678e-05, "loss": 0.0083, "step": 332500 }, { "epoch": 1.68, "learning_rate": 4.836663959114277e-05, "loss": 0.0052, "step": 332510 }, { "epoch": 1.68, "learning_rate": 4.8359071898128756e-05, "loss": 0.0063, "step": 332520 }, { "epoch": 1.68, "learning_rate": 4.835150420511475e-05, "loss": 0.0067, "step": 332530 }, { "epoch": 1.68, "learning_rate": 4.834393651210074e-05, "loss": 0.0063, "step": 332540 }, { "epoch": 1.68, "learning_rate": 4.833636881908673e-05, "loss": 0.0054, "step": 332550 }, { "epoch": 1.68, "learning_rate": 4.832880112607272e-05, "loss": 0.0073, "step": 332560 }, { "epoch": 1.68, "learning_rate": 4.832123343305871e-05, "loss": 0.0052, "step": 332570 }, { "epoch": 1.68, "learning_rate": 4.83136657400447e-05, "loss": 0.006, "step": 332580 }, { "epoch": 1.68, "learning_rate": 4.830609804703069e-05, "loss": 0.0072, "step": 332590 }, { "epoch": 1.68, "learning_rate": 4.829853035401668e-05, "loss": 0.0064, "step": 332600 }, { "epoch": 1.68, "learning_rate": 4.8290962661002664e-05, "loss": 0.0056, "step": 332610 }, { "epoch": 1.68, "learning_rate": 4.828339496798865e-05, "loss": 0.0087, "step": 332620 }, { "epoch": 1.68, "learning_rate": 4.827582727497464e-05, "loss": 0.0063, "step": 332630 }, { "epoch": 1.68, "learning_rate": 4.826825958196063e-05, "loss": 0.0065, "step": 332640 }, { "epoch": 1.68, "learning_rate": 4.826069188894662e-05, "loss": 0.0103, "step": 332650 }, { "epoch": 1.68, "learning_rate": 4.825312419593261e-05, "loss": 0.0067, "step": 332660 }, { "epoch": 1.68, "learning_rate": 4.82455565029186e-05, "loss": 0.0058, "step": 332670 }, { "epoch": 1.68, "learning_rate": 4.823798880990459e-05, "loss": 0.0103, "step": 332680 }, { "epoch": 1.68, "learning_rate": 4.823042111689058e-05, "loss": 0.0078, "step": 332690 }, { "epoch": 1.68, "learning_rate": 4.822285342387657e-05, "loss": 0.0063, "step": 332700 }, { "epoch": 1.68, "learning_rate": 4.821528573086256e-05, "loss": 0.0053, "step": 332710 }, { "epoch": 1.68, "learning_rate": 4.820771803784855e-05, "loss": 0.0062, "step": 332720 }, { "epoch": 1.68, "learning_rate": 4.820015034483454e-05, "loss": 0.006, "step": 332730 }, { "epoch": 1.68, "learning_rate": 4.819258265182053e-05, "loss": 0.0092, "step": 332740 }, { "epoch": 1.68, "learning_rate": 4.818501495880652e-05, "loss": 0.0075, "step": 332750 }, { "epoch": 1.68, "learning_rate": 4.817744726579251e-05, "loss": 0.0056, "step": 332760 }, { "epoch": 1.68, "learning_rate": 4.81698795727785e-05, "loss": 0.0045, "step": 332770 }, { "epoch": 1.68, "learning_rate": 4.816231187976449e-05, "loss": 0.0064, "step": 332780 }, { "epoch": 1.68, "learning_rate": 4.815474418675048e-05, "loss": 0.0082, "step": 332790 }, { "epoch": 1.68, "learning_rate": 4.814717649373647e-05, "loss": 0.0057, "step": 332800 }, { "epoch": 1.68, "learning_rate": 4.813960880072246e-05, "loss": 0.0071, "step": 332810 }, { "epoch": 1.68, "learning_rate": 4.813204110770845e-05, "loss": 0.0075, "step": 332820 }, { "epoch": 1.68, "learning_rate": 4.812447341469444e-05, "loss": 0.0053, "step": 332830 }, { "epoch": 1.68, "learning_rate": 4.8116905721680427e-05, "loss": 0.0061, "step": 332840 }, { "epoch": 1.68, "learning_rate": 4.810933802866642e-05, "loss": 0.0057, "step": 332850 }, { "epoch": 1.68, "learning_rate": 4.810177033565241e-05, "loss": 0.0053, "step": 332860 }, { "epoch": 1.68, "learning_rate": 4.80942026426384e-05, "loss": 0.0063, "step": 332870 }, { "epoch": 1.68, "learning_rate": 4.8086634949624386e-05, "loss": 0.0077, "step": 332880 }, { "epoch": 1.68, "learning_rate": 4.807906725661038e-05, "loss": 0.0077, "step": 332890 }, { "epoch": 1.68, "learning_rate": 4.807149956359637e-05, "loss": 0.0059, "step": 332900 }, { "epoch": 1.68, "learning_rate": 4.806393187058236e-05, "loss": 0.0076, "step": 332910 }, { "epoch": 1.68, "learning_rate": 4.805636417756834e-05, "loss": 0.0043, "step": 332920 }, { "epoch": 1.68, "learning_rate": 4.804879648455433e-05, "loss": 0.0062, "step": 332930 }, { "epoch": 1.68, "learning_rate": 4.804122879154032e-05, "loss": 0.0071, "step": 332940 }, { "epoch": 1.68, "learning_rate": 4.803366109852631e-05, "loss": 0.0102, "step": 332950 }, { "epoch": 1.68, "learning_rate": 4.80260934055123e-05, "loss": 0.0053, "step": 332960 }, { "epoch": 1.68, "learning_rate": 4.801852571249829e-05, "loss": 0.0071, "step": 332970 }, { "epoch": 1.68, "learning_rate": 4.801095801948428e-05, "loss": 0.005, "step": 332980 }, { "epoch": 1.68, "learning_rate": 4.800339032647027e-05, "loss": 0.0076, "step": 332990 }, { "epoch": 1.68, "learning_rate": 4.799582263345626e-05, "loss": 0.0072, "step": 333000 }, { "epoch": 1.68, "eval_cer": 0.9144343512465224, "eval_loss": 0.004823221359401941, "eval_runtime": 116.4518, "eval_samples_per_second": 17.174, "eval_steps_per_second": 4.294, "step": 333000 }, { "epoch": 1.68, "learning_rate": 4.7988254940442253e-05, "loss": 0.0063, "step": 333010 }, { "epoch": 1.68, "learning_rate": 4.798068724742824e-05, "loss": 0.0085, "step": 333020 }, { "epoch": 1.68, "learning_rate": 4.797311955441423e-05, "loss": 0.0098, "step": 333030 }, { "epoch": 1.68, "learning_rate": 4.796555186140022e-05, "loss": 0.0063, "step": 333040 }, { "epoch": 1.68, "learning_rate": 4.795798416838621e-05, "loss": 0.007, "step": 333050 }, { "epoch": 1.68, "learning_rate": 4.79504164753722e-05, "loss": 0.0047, "step": 333060 }, { "epoch": 1.68, "learning_rate": 4.794284878235819e-05, "loss": 0.0058, "step": 333070 }, { "epoch": 1.68, "learning_rate": 4.793528108934418e-05, "loss": 0.0054, "step": 333080 }, { "epoch": 1.68, "learning_rate": 4.792771339633017e-05, "loss": 0.005, "step": 333090 }, { "epoch": 1.68, "learning_rate": 4.792014570331616e-05, "loss": 0.0067, "step": 333100 }, { "epoch": 1.68, "learning_rate": 4.791257801030215e-05, "loss": 0.0078, "step": 333110 }, { "epoch": 1.68, "learning_rate": 4.790501031728814e-05, "loss": 0.0058, "step": 333120 }, { "epoch": 1.68, "learning_rate": 4.789744262427413e-05, "loss": 0.0052, "step": 333130 }, { "epoch": 1.68, "learning_rate": 4.788987493126012e-05, "loss": 0.0071, "step": 333140 }, { "epoch": 1.68, "learning_rate": 4.788230723824611e-05, "loss": 0.0071, "step": 333150 }, { "epoch": 1.68, "learning_rate": 4.78747395452321e-05, "loss": 0.0076, "step": 333160 }, { "epoch": 1.68, "learning_rate": 4.786717185221809e-05, "loss": 0.0059, "step": 333170 }, { "epoch": 1.68, "learning_rate": 4.785960415920408e-05, "loss": 0.0061, "step": 333180 }, { "epoch": 1.68, "learning_rate": 4.785203646619007e-05, "loss": 0.0063, "step": 333190 }, { "epoch": 1.68, "learning_rate": 4.784446877317606e-05, "loss": 0.0068, "step": 333200 }, { "epoch": 1.68, "learning_rate": 4.783690108016205e-05, "loss": 0.0064, "step": 333210 }, { "epoch": 1.68, "learning_rate": 4.782933338714804e-05, "loss": 0.0055, "step": 333220 }, { "epoch": 1.68, "learning_rate": 4.782176569413403e-05, "loss": 0.009, "step": 333230 }, { "epoch": 1.68, "learning_rate": 4.781419800112001e-05, "loss": 0.0056, "step": 333240 }, { "epoch": 1.68, "learning_rate": 4.7806630308106e-05, "loss": 0.0065, "step": 333250 }, { "epoch": 1.68, "learning_rate": 4.779906261509199e-05, "loss": 0.0059, "step": 333260 }, { "epoch": 1.68, "learning_rate": 4.779149492207798e-05, "loss": 0.0052, "step": 333270 }, { "epoch": 1.68, "learning_rate": 4.778392722906397e-05, "loss": 0.007, "step": 333280 }, { "epoch": 1.68, "learning_rate": 4.777635953604996e-05, "loss": 0.0054, "step": 333290 }, { "epoch": 1.68, "learning_rate": 4.776879184303595e-05, "loss": 0.0061, "step": 333300 }, { "epoch": 1.68, "learning_rate": 4.776122415002194e-05, "loss": 0.0083, "step": 333310 }, { "epoch": 1.68, "learning_rate": 4.775365645700793e-05, "loss": 0.0088, "step": 333320 }, { "epoch": 1.68, "learning_rate": 4.774608876399392e-05, "loss": 0.0064, "step": 333330 }, { "epoch": 1.68, "learning_rate": 4.773852107097991e-05, "loss": 0.0067, "step": 333340 }, { "epoch": 1.68, "learning_rate": 4.77309533779659e-05, "loss": 0.0057, "step": 333350 }, { "epoch": 1.68, "learning_rate": 4.772338568495189e-05, "loss": 0.0064, "step": 333360 }, { "epoch": 1.68, "learning_rate": 4.771581799193788e-05, "loss": 0.0083, "step": 333370 }, { "epoch": 1.68, "learning_rate": 4.770825029892387e-05, "loss": 0.0071, "step": 333380 }, { "epoch": 1.68, "learning_rate": 4.770068260590986e-05, "loss": 0.007, "step": 333390 }, { "epoch": 1.68, "learning_rate": 4.769311491289585e-05, "loss": 0.0073, "step": 333400 }, { "epoch": 1.68, "learning_rate": 4.7685547219881836e-05, "loss": 0.0054, "step": 333410 }, { "epoch": 1.68, "learning_rate": 4.767797952686783e-05, "loss": 0.0053, "step": 333420 }, { "epoch": 1.68, "learning_rate": 4.767041183385382e-05, "loss": 0.0076, "step": 333430 }, { "epoch": 1.68, "learning_rate": 4.766284414083981e-05, "loss": 0.0068, "step": 333440 }, { "epoch": 1.68, "learning_rate": 4.7655276447825796e-05, "loss": 0.0053, "step": 333450 }, { "epoch": 1.68, "learning_rate": 4.764770875481179e-05, "loss": 0.0062, "step": 333460 }, { "epoch": 1.68, "learning_rate": 4.764014106179778e-05, "loss": 0.0041, "step": 333470 }, { "epoch": 1.68, "learning_rate": 4.763257336878377e-05, "loss": 0.0063, "step": 333480 }, { "epoch": 1.68, "learning_rate": 4.7625005675769756e-05, "loss": 0.0047, "step": 333490 }, { "epoch": 1.68, "learning_rate": 4.761743798275575e-05, "loss": 0.0067, "step": 333500 }, { "epoch": 1.68, "learning_rate": 4.760987028974174e-05, "loss": 0.0066, "step": 333510 }, { "epoch": 1.68, "learning_rate": 4.760230259672773e-05, "loss": 0.0079, "step": 333520 }, { "epoch": 1.68, "learning_rate": 4.759473490371372e-05, "loss": 0.0053, "step": 333530 }, { "epoch": 1.68, "learning_rate": 4.758716721069971e-05, "loss": 0.0076, "step": 333540 }, { "epoch": 1.68, "learning_rate": 4.757959951768569e-05, "loss": 0.0054, "step": 333550 }, { "epoch": 1.68, "learning_rate": 4.757203182467168e-05, "loss": 0.0064, "step": 333560 }, { "epoch": 1.68, "learning_rate": 4.756446413165767e-05, "loss": 0.0072, "step": 333570 }, { "epoch": 1.68, "learning_rate": 4.755689643864366e-05, "loss": 0.0075, "step": 333580 }, { "epoch": 1.68, "learning_rate": 4.754932874562965e-05, "loss": 0.0073, "step": 333590 }, { "epoch": 1.68, "learning_rate": 4.754176105261564e-05, "loss": 0.005, "step": 333600 }, { "epoch": 1.68, "learning_rate": 4.753419335960163e-05, "loss": 0.0054, "step": 333610 }, { "epoch": 1.68, "learning_rate": 4.752662566658762e-05, "loss": 0.0049, "step": 333620 }, { "epoch": 1.68, "learning_rate": 4.751905797357361e-05, "loss": 0.0068, "step": 333630 }, { "epoch": 1.68, "learning_rate": 4.75114902805596e-05, "loss": 0.0076, "step": 333640 }, { "epoch": 1.68, "learning_rate": 4.750392258754559e-05, "loss": 0.0063, "step": 333650 }, { "epoch": 1.68, "learning_rate": 4.749635489453158e-05, "loss": 0.006, "step": 333660 }, { "epoch": 1.68, "learning_rate": 4.748878720151757e-05, "loss": 0.0072, "step": 333670 }, { "epoch": 1.68, "learning_rate": 4.748121950850356e-05, "loss": 0.0076, "step": 333680 }, { "epoch": 1.68, "learning_rate": 4.747365181548955e-05, "loss": 0.0061, "step": 333690 }, { "epoch": 1.68, "learning_rate": 4.746608412247554e-05, "loss": 0.0067, "step": 333700 }, { "epoch": 1.68, "learning_rate": 4.745851642946153e-05, "loss": 0.0062, "step": 333710 }, { "epoch": 1.68, "learning_rate": 4.745094873644752e-05, "loss": 0.0057, "step": 333720 }, { "epoch": 1.68, "learning_rate": 4.744338104343351e-05, "loss": 0.006, "step": 333730 }, { "epoch": 1.68, "learning_rate": 4.74358133504195e-05, "loss": 0.0053, "step": 333740 }, { "epoch": 1.68, "learning_rate": 4.742824565740549e-05, "loss": 0.0064, "step": 333750 }, { "epoch": 1.68, "learning_rate": 4.742067796439148e-05, "loss": 0.0058, "step": 333760 }, { "epoch": 1.68, "learning_rate": 4.7413110271377466e-05, "loss": 0.0072, "step": 333770 }, { "epoch": 1.68, "learning_rate": 4.740554257836346e-05, "loss": 0.0066, "step": 333780 }, { "epoch": 1.68, "learning_rate": 4.739797488534945e-05, "loss": 0.0058, "step": 333790 }, { "epoch": 1.68, "learning_rate": 4.739040719233544e-05, "loss": 0.0045, "step": 333800 }, { "epoch": 1.68, "learning_rate": 4.7382839499321426e-05, "loss": 0.0066, "step": 333810 }, { "epoch": 1.68, "learning_rate": 4.737527180630742e-05, "loss": 0.0061, "step": 333820 }, { "epoch": 1.68, "learning_rate": 4.736770411329341e-05, "loss": 0.0084, "step": 333830 }, { "epoch": 1.68, "learning_rate": 4.73601364202794e-05, "loss": 0.0077, "step": 333840 }, { "epoch": 1.68, "learning_rate": 4.7352568727265386e-05, "loss": 0.0063, "step": 333850 }, { "epoch": 1.68, "learning_rate": 4.734500103425138e-05, "loss": 0.0057, "step": 333860 }, { "epoch": 1.68, "learning_rate": 4.733743334123736e-05, "loss": 0.0069, "step": 333870 }, { "epoch": 1.68, "learning_rate": 4.732986564822335e-05, "loss": 0.0082, "step": 333880 }, { "epoch": 1.68, "learning_rate": 4.732229795520934e-05, "loss": 0.0067, "step": 333890 }, { "epoch": 1.68, "learning_rate": 4.731473026219533e-05, "loss": 0.0067, "step": 333900 }, { "epoch": 1.68, "learning_rate": 4.730716256918132e-05, "loss": 0.0056, "step": 333910 }, { "epoch": 1.68, "learning_rate": 4.729959487616731e-05, "loss": 0.0071, "step": 333920 }, { "epoch": 1.68, "learning_rate": 4.72920271831533e-05, "loss": 0.0055, "step": 333930 }, { "epoch": 1.68, "learning_rate": 4.7284459490139287e-05, "loss": 0.0058, "step": 333940 }, { "epoch": 1.68, "learning_rate": 4.727689179712528e-05, "loss": 0.0054, "step": 333950 }, { "epoch": 1.68, "learning_rate": 4.726932410411127e-05, "loss": 0.0055, "step": 333960 }, { "epoch": 1.68, "learning_rate": 4.726175641109726e-05, "loss": 0.0065, "step": 333970 }, { "epoch": 1.68, "learning_rate": 4.725418871808325e-05, "loss": 0.0061, "step": 333980 }, { "epoch": 1.69, "learning_rate": 4.724662102506924e-05, "loss": 0.0064, "step": 333990 }, { "epoch": 1.69, "learning_rate": 4.723905333205523e-05, "loss": 0.0081, "step": 334000 }, { "epoch": 1.69, "eval_cer": 0.9144139729278888, "eval_loss": 0.004758420865982771, "eval_runtime": 116.3871, "eval_samples_per_second": 17.184, "eval_steps_per_second": 4.296, "step": 334000 }, { "epoch": 1.69, "learning_rate": 4.723148563904122e-05, "loss": 0.0067, "step": 334010 }, { "epoch": 1.69, "learning_rate": 4.722391794602721e-05, "loss": 0.0079, "step": 334020 }, { "epoch": 1.69, "learning_rate": 4.72163502530132e-05, "loss": 0.0056, "step": 334030 }, { "epoch": 1.69, "learning_rate": 4.720878255999919e-05, "loss": 0.0057, "step": 334040 }, { "epoch": 1.69, "learning_rate": 4.720121486698518e-05, "loss": 0.0066, "step": 334050 }, { "epoch": 1.69, "learning_rate": 4.719364717397117e-05, "loss": 0.0047, "step": 334060 }, { "epoch": 1.69, "learning_rate": 4.718607948095716e-05, "loss": 0.0055, "step": 334070 }, { "epoch": 1.69, "learning_rate": 4.717851178794315e-05, "loss": 0.0054, "step": 334080 }, { "epoch": 1.69, "learning_rate": 4.717094409492914e-05, "loss": 0.0056, "step": 334090 }, { "epoch": 1.69, "learning_rate": 4.716337640191513e-05, "loss": 0.0063, "step": 334100 }, { "epoch": 1.69, "learning_rate": 4.715580870890112e-05, "loss": 0.0049, "step": 334110 }, { "epoch": 1.69, "learning_rate": 4.714824101588711e-05, "loss": 0.0084, "step": 334120 }, { "epoch": 1.69, "learning_rate": 4.7140673322873097e-05, "loss": 0.0062, "step": 334130 }, { "epoch": 1.69, "learning_rate": 4.713310562985909e-05, "loss": 0.0079, "step": 334140 }, { "epoch": 1.69, "learning_rate": 4.712553793684508e-05, "loss": 0.0068, "step": 334150 }, { "epoch": 1.69, "learning_rate": 4.711797024383107e-05, "loss": 0.005, "step": 334160 }, { "epoch": 1.69, "learning_rate": 4.7110402550817056e-05, "loss": 0.0062, "step": 334170 }, { "epoch": 1.69, "learning_rate": 4.710283485780304e-05, "loss": 0.0061, "step": 334180 }, { "epoch": 1.69, "learning_rate": 4.709526716478903e-05, "loss": 0.0077, "step": 334190 }, { "epoch": 1.69, "learning_rate": 4.708769947177502e-05, "loss": 0.0071, "step": 334200 }, { "epoch": 1.69, "learning_rate": 4.708013177876101e-05, "loss": 0.0054, "step": 334210 }, { "epoch": 1.69, "learning_rate": 4.7072564085747e-05, "loss": 0.0055, "step": 334220 }, { "epoch": 1.69, "learning_rate": 4.706499639273299e-05, "loss": 0.0054, "step": 334230 }, { "epoch": 1.69, "learning_rate": 4.705742869971898e-05, "loss": 0.0063, "step": 334240 }, { "epoch": 1.69, "learning_rate": 4.704986100670497e-05, "loss": 0.0072, "step": 334250 }, { "epoch": 1.69, "learning_rate": 4.704229331369096e-05, "loss": 0.0065, "step": 334260 }, { "epoch": 1.69, "learning_rate": 4.703472562067695e-05, "loss": 0.0057, "step": 334270 }, { "epoch": 1.69, "learning_rate": 4.702715792766294e-05, "loss": 0.007, "step": 334280 }, { "epoch": 1.69, "learning_rate": 4.701959023464893e-05, "loss": 0.0077, "step": 334290 }, { "epoch": 1.69, "learning_rate": 4.7012022541634917e-05, "loss": 0.0053, "step": 334300 }, { "epoch": 1.69, "learning_rate": 4.700445484862091e-05, "loss": 0.0077, "step": 334310 }, { "epoch": 1.69, "learning_rate": 4.69968871556069e-05, "loss": 0.006, "step": 334320 }, { "epoch": 1.69, "learning_rate": 4.698931946259289e-05, "loss": 0.0054, "step": 334330 }, { "epoch": 1.69, "learning_rate": 4.6981751769578876e-05, "loss": 0.007, "step": 334340 }, { "epoch": 1.69, "learning_rate": 4.697418407656487e-05, "loss": 0.0092, "step": 334350 }, { "epoch": 1.69, "learning_rate": 4.696661638355086e-05, "loss": 0.0062, "step": 334360 }, { "epoch": 1.69, "learning_rate": 4.695904869053685e-05, "loss": 0.0054, "step": 334370 }, { "epoch": 1.69, "learning_rate": 4.6951480997522836e-05, "loss": 0.0071, "step": 334380 }, { "epoch": 1.69, "learning_rate": 4.694391330450883e-05, "loss": 0.0065, "step": 334390 }, { "epoch": 1.69, "learning_rate": 4.693634561149482e-05, "loss": 0.0054, "step": 334400 }, { "epoch": 1.69, "learning_rate": 4.692877791848081e-05, "loss": 0.0058, "step": 334410 }, { "epoch": 1.69, "learning_rate": 4.6921210225466796e-05, "loss": 0.0064, "step": 334420 }, { "epoch": 1.69, "learning_rate": 4.691364253245279e-05, "loss": 0.0092, "step": 334430 }, { "epoch": 1.69, "learning_rate": 4.690607483943878e-05, "loss": 0.0063, "step": 334440 }, { "epoch": 1.69, "learning_rate": 4.689850714642477e-05, "loss": 0.007, "step": 334450 }, { "epoch": 1.69, "learning_rate": 4.6890939453410755e-05, "loss": 0.008, "step": 334460 }, { "epoch": 1.69, "learning_rate": 4.688337176039675e-05, "loss": 0.0057, "step": 334470 }, { "epoch": 1.69, "learning_rate": 4.687580406738274e-05, "loss": 0.0063, "step": 334480 }, { "epoch": 1.69, "learning_rate": 4.686823637436872e-05, "loss": 0.007, "step": 334490 }, { "epoch": 1.69, "learning_rate": 4.686066868135471e-05, "loss": 0.005, "step": 334500 }, { "epoch": 1.69, "learning_rate": 4.68531009883407e-05, "loss": 0.0052, "step": 334510 }, { "epoch": 1.69, "learning_rate": 4.684553329532669e-05, "loss": 0.0083, "step": 334520 }, { "epoch": 1.69, "learning_rate": 4.683796560231268e-05, "loss": 0.0053, "step": 334530 }, { "epoch": 1.69, "learning_rate": 4.683039790929867e-05, "loss": 0.0062, "step": 334540 }, { "epoch": 1.69, "learning_rate": 4.682283021628466e-05, "loss": 0.0061, "step": 334550 }, { "epoch": 1.69, "learning_rate": 4.681526252327065e-05, "loss": 0.0077, "step": 334560 }, { "epoch": 1.69, "learning_rate": 4.680769483025664e-05, "loss": 0.0069, "step": 334570 }, { "epoch": 1.69, "learning_rate": 4.680012713724263e-05, "loss": 0.0068, "step": 334580 }, { "epoch": 1.69, "learning_rate": 4.679255944422862e-05, "loss": 0.0057, "step": 334590 }, { "epoch": 1.69, "learning_rate": 4.678499175121461e-05, "loss": 0.0062, "step": 334600 }, { "epoch": 1.69, "learning_rate": 4.67774240582006e-05, "loss": 0.0063, "step": 334610 }, { "epoch": 1.69, "learning_rate": 4.676985636518659e-05, "loss": 0.0067, "step": 334620 }, { "epoch": 1.69, "learning_rate": 4.676228867217258e-05, "loss": 0.0064, "step": 334630 }, { "epoch": 1.69, "learning_rate": 4.675472097915857e-05, "loss": 0.0065, "step": 334640 }, { "epoch": 1.69, "learning_rate": 4.674715328614456e-05, "loss": 0.0052, "step": 334650 }, { "epoch": 1.69, "learning_rate": 4.673958559313055e-05, "loss": 0.0077, "step": 334660 }, { "epoch": 1.69, "learning_rate": 4.673201790011654e-05, "loss": 0.0085, "step": 334670 }, { "epoch": 1.69, "learning_rate": 4.672445020710253e-05, "loss": 0.0051, "step": 334680 }, { "epoch": 1.69, "learning_rate": 4.671688251408852e-05, "loss": 0.0065, "step": 334690 }, { "epoch": 1.69, "learning_rate": 4.6709314821074506e-05, "loss": 0.0103, "step": 334700 }, { "epoch": 1.69, "learning_rate": 4.67017471280605e-05, "loss": 0.006, "step": 334710 }, { "epoch": 1.69, "learning_rate": 4.669417943504649e-05, "loss": 0.0038, "step": 334720 }, { "epoch": 1.69, "learning_rate": 4.668661174203248e-05, "loss": 0.0072, "step": 334730 }, { "epoch": 1.69, "learning_rate": 4.6679044049018466e-05, "loss": 0.0054, "step": 334740 }, { "epoch": 1.69, "learning_rate": 4.667147635600446e-05, "loss": 0.0074, "step": 334750 }, { "epoch": 1.69, "learning_rate": 4.666390866299045e-05, "loss": 0.0067, "step": 334760 }, { "epoch": 1.69, "learning_rate": 4.665634096997644e-05, "loss": 0.006, "step": 334770 }, { "epoch": 1.69, "learning_rate": 4.6648773276962426e-05, "loss": 0.0057, "step": 334780 }, { "epoch": 1.69, "learning_rate": 4.664120558394842e-05, "loss": 0.007, "step": 334790 }, { "epoch": 1.69, "learning_rate": 4.663363789093441e-05, "loss": 0.0046, "step": 334800 }, { "epoch": 1.69, "learning_rate": 4.662607019792039e-05, "loss": 0.0064, "step": 334810 }, { "epoch": 1.69, "learning_rate": 4.661850250490638e-05, "loss": 0.0055, "step": 334820 }, { "epoch": 1.69, "learning_rate": 4.661093481189237e-05, "loss": 0.0067, "step": 334830 }, { "epoch": 1.69, "learning_rate": 4.660336711887836e-05, "loss": 0.006, "step": 334840 }, { "epoch": 1.69, "learning_rate": 4.659579942586435e-05, "loss": 0.008, "step": 334850 }, { "epoch": 1.69, "learning_rate": 4.658823173285034e-05, "loss": 0.0054, "step": 334860 }, { "epoch": 1.69, "learning_rate": 4.6580664039836326e-05, "loss": 0.0061, "step": 334870 }, { "epoch": 1.69, "learning_rate": 4.657309634682232e-05, "loss": 0.0051, "step": 334880 }, { "epoch": 1.69, "learning_rate": 4.656552865380831e-05, "loss": 0.0077, "step": 334890 }, { "epoch": 1.69, "learning_rate": 4.65579609607943e-05, "loss": 0.0082, "step": 334900 }, { "epoch": 1.69, "learning_rate": 4.6550393267780286e-05, "loss": 0.0065, "step": 334910 }, { "epoch": 1.69, "learning_rate": 4.654282557476628e-05, "loss": 0.0058, "step": 334920 }, { "epoch": 1.69, "learning_rate": 4.653525788175227e-05, "loss": 0.0081, "step": 334930 }, { "epoch": 1.69, "learning_rate": 4.652769018873826e-05, "loss": 0.0062, "step": 334940 }, { "epoch": 1.69, "learning_rate": 4.652012249572425e-05, "loss": 0.0059, "step": 334950 }, { "epoch": 1.69, "learning_rate": 4.651255480271024e-05, "loss": 0.006, "step": 334960 }, { "epoch": 1.69, "learning_rate": 4.650498710969623e-05, "loss": 0.0077, "step": 334970 }, { "epoch": 1.69, "learning_rate": 4.649741941668222e-05, "loss": 0.0078, "step": 334980 }, { "epoch": 1.69, "learning_rate": 4.648985172366821e-05, "loss": 0.0055, "step": 334990 }, { "epoch": 1.69, "learning_rate": 4.64822840306542e-05, "loss": 0.0063, "step": 335000 }, { "epoch": 1.69, "eval_cer": 0.914412032135638, "eval_loss": 0.004865641705691814, "eval_runtime": 116.3195, "eval_samples_per_second": 17.194, "eval_steps_per_second": 4.299, "step": 335000 }, { "epoch": 1.69, "learning_rate": 4.647471633764019e-05, "loss": 0.0069, "step": 335010 }, { "epoch": 1.69, "learning_rate": 4.646714864462618e-05, "loss": 0.0059, "step": 335020 }, { "epoch": 1.69, "learning_rate": 4.645958095161217e-05, "loss": 0.0082, "step": 335030 }, { "epoch": 1.69, "learning_rate": 4.645201325859816e-05, "loss": 0.0048, "step": 335040 }, { "epoch": 1.69, "learning_rate": 4.644444556558415e-05, "loss": 0.0066, "step": 335050 }, { "epoch": 1.69, "learning_rate": 4.6436877872570136e-05, "loss": 0.0062, "step": 335060 }, { "epoch": 1.69, "learning_rate": 4.642931017955613e-05, "loss": 0.0057, "step": 335070 }, { "epoch": 1.69, "learning_rate": 4.642174248654212e-05, "loss": 0.0091, "step": 335080 }, { "epoch": 1.69, "learning_rate": 4.641417479352811e-05, "loss": 0.0062, "step": 335090 }, { "epoch": 1.69, "learning_rate": 4.6406607100514096e-05, "loss": 0.0069, "step": 335100 }, { "epoch": 1.69, "learning_rate": 4.639903940750009e-05, "loss": 0.0076, "step": 335110 }, { "epoch": 1.69, "learning_rate": 4.639147171448607e-05, "loss": 0.0059, "step": 335120 }, { "epoch": 1.69, "learning_rate": 4.638390402147206e-05, "loss": 0.0074, "step": 335130 }, { "epoch": 1.69, "learning_rate": 4.637633632845805e-05, "loss": 0.0059, "step": 335140 }, { "epoch": 1.69, "learning_rate": 4.636876863544404e-05, "loss": 0.0051, "step": 335150 }, { "epoch": 1.69, "learning_rate": 4.636120094243003e-05, "loss": 0.0076, "step": 335160 }, { "epoch": 1.69, "learning_rate": 4.635363324941602e-05, "loss": 0.0045, "step": 335170 }, { "epoch": 1.69, "learning_rate": 4.634606555640201e-05, "loss": 0.0079, "step": 335180 }, { "epoch": 1.69, "learning_rate": 4.6338497863388e-05, "loss": 0.0068, "step": 335190 }, { "epoch": 1.69, "learning_rate": 4.633093017037399e-05, "loss": 0.0057, "step": 335200 }, { "epoch": 1.69, "learning_rate": 4.632336247735998e-05, "loss": 0.0059, "step": 335210 }, { "epoch": 1.69, "learning_rate": 4.631579478434597e-05, "loss": 0.0055, "step": 335220 }, { "epoch": 1.69, "learning_rate": 4.6308227091331956e-05, "loss": 0.006, "step": 335230 }, { "epoch": 1.69, "learning_rate": 4.630065939831795e-05, "loss": 0.0073, "step": 335240 }, { "epoch": 1.69, "learning_rate": 4.629309170530394e-05, "loss": 0.0068, "step": 335250 }, { "epoch": 1.69, "learning_rate": 4.628552401228993e-05, "loss": 0.0061, "step": 335260 }, { "epoch": 1.69, "learning_rate": 4.6277956319275916e-05, "loss": 0.006, "step": 335270 }, { "epoch": 1.69, "learning_rate": 4.627038862626191e-05, "loss": 0.0042, "step": 335280 }, { "epoch": 1.69, "learning_rate": 4.62628209332479e-05, "loss": 0.0061, "step": 335290 }, { "epoch": 1.69, "learning_rate": 4.625525324023389e-05, "loss": 0.0066, "step": 335300 }, { "epoch": 1.69, "learning_rate": 4.6247685547219876e-05, "loss": 0.0051, "step": 335310 }, { "epoch": 1.69, "learning_rate": 4.624011785420587e-05, "loss": 0.0057, "step": 335320 }, { "epoch": 1.69, "learning_rate": 4.623255016119186e-05, "loss": 0.0054, "step": 335330 }, { "epoch": 1.69, "learning_rate": 4.622498246817785e-05, "loss": 0.0044, "step": 335340 }, { "epoch": 1.69, "learning_rate": 4.6217414775163835e-05, "loss": 0.0059, "step": 335350 }, { "epoch": 1.69, "learning_rate": 4.620984708214983e-05, "loss": 0.0078, "step": 335360 }, { "epoch": 1.69, "learning_rate": 4.620227938913582e-05, "loss": 0.0073, "step": 335370 }, { "epoch": 1.69, "learning_rate": 4.619471169612181e-05, "loss": 0.0075, "step": 335380 }, { "epoch": 1.69, "learning_rate": 4.6187144003107795e-05, "loss": 0.0086, "step": 335390 }, { "epoch": 1.69, "learning_rate": 4.617957631009379e-05, "loss": 0.0073, "step": 335400 }, { "epoch": 1.69, "learning_rate": 4.617200861707978e-05, "loss": 0.0049, "step": 335410 }, { "epoch": 1.69, "learning_rate": 4.6164440924065767e-05, "loss": 0.0059, "step": 335420 }, { "epoch": 1.69, "learning_rate": 4.6156873231051755e-05, "loss": 0.0082, "step": 335430 }, { "epoch": 1.69, "learning_rate": 4.614930553803774e-05, "loss": 0.0066, "step": 335440 }, { "epoch": 1.69, "learning_rate": 4.614173784502373e-05, "loss": 0.0059, "step": 335450 }, { "epoch": 1.69, "learning_rate": 4.613417015200972e-05, "loss": 0.0082, "step": 335460 }, { "epoch": 1.69, "learning_rate": 4.612660245899571e-05, "loss": 0.0087, "step": 335470 }, { "epoch": 1.69, "learning_rate": 4.61190347659817e-05, "loss": 0.0059, "step": 335480 }, { "epoch": 1.69, "learning_rate": 4.611146707296769e-05, "loss": 0.0066, "step": 335490 }, { "epoch": 1.69, "learning_rate": 4.610389937995368e-05, "loss": 0.0058, "step": 335500 }, { "epoch": 1.69, "learning_rate": 4.609633168693967e-05, "loss": 0.0061, "step": 335510 }, { "epoch": 1.69, "learning_rate": 4.608876399392566e-05, "loss": 0.0069, "step": 335520 }, { "epoch": 1.69, "learning_rate": 4.608119630091165e-05, "loss": 0.0057, "step": 335530 }, { "epoch": 1.69, "learning_rate": 4.607362860789764e-05, "loss": 0.0062, "step": 335540 }, { "epoch": 1.69, "learning_rate": 4.606606091488363e-05, "loss": 0.0069, "step": 335550 }, { "epoch": 1.69, "learning_rate": 4.605849322186962e-05, "loss": 0.0059, "step": 335560 }, { "epoch": 1.69, "learning_rate": 4.605092552885561e-05, "loss": 0.0071, "step": 335570 }, { "epoch": 1.69, "learning_rate": 4.60433578358416e-05, "loss": 0.0059, "step": 335580 }, { "epoch": 1.69, "learning_rate": 4.6035790142827587e-05, "loss": 0.0078, "step": 335590 }, { "epoch": 1.69, "learning_rate": 4.602822244981358e-05, "loss": 0.007, "step": 335600 }, { "epoch": 1.69, "learning_rate": 4.602065475679957e-05, "loss": 0.0075, "step": 335610 }, { "epoch": 1.69, "learning_rate": 4.601308706378556e-05, "loss": 0.005, "step": 335620 }, { "epoch": 1.69, "learning_rate": 4.6005519370771546e-05, "loss": 0.0069, "step": 335630 }, { "epoch": 1.69, "learning_rate": 4.599795167775754e-05, "loss": 0.0056, "step": 335640 }, { "epoch": 1.69, "learning_rate": 4.599038398474353e-05, "loss": 0.0063, "step": 335650 }, { "epoch": 1.69, "learning_rate": 4.598281629172952e-05, "loss": 0.0057, "step": 335660 }, { "epoch": 1.69, "learning_rate": 4.5975248598715506e-05, "loss": 0.0081, "step": 335670 }, { "epoch": 1.69, "learning_rate": 4.59676809057015e-05, "loss": 0.0072, "step": 335680 }, { "epoch": 1.69, "learning_rate": 4.596011321268749e-05, "loss": 0.0059, "step": 335690 }, { "epoch": 1.69, "learning_rate": 4.595254551967348e-05, "loss": 0.0053, "step": 335700 }, { "epoch": 1.69, "learning_rate": 4.5944977826659466e-05, "loss": 0.0068, "step": 335710 }, { "epoch": 1.69, "learning_rate": 4.593741013364546e-05, "loss": 0.0073, "step": 335720 }, { "epoch": 1.69, "learning_rate": 4.592984244063145e-05, "loss": 0.0072, "step": 335730 }, { "epoch": 1.69, "learning_rate": 4.592227474761744e-05, "loss": 0.0061, "step": 335740 }, { "epoch": 1.69, "learning_rate": 4.591470705460342e-05, "loss": 0.0065, "step": 335750 }, { "epoch": 1.69, "learning_rate": 4.5907139361589407e-05, "loss": 0.0057, "step": 335760 }, { "epoch": 1.69, "learning_rate": 4.58995716685754e-05, "loss": 0.0083, "step": 335770 }, { "epoch": 1.69, "learning_rate": 4.589200397556139e-05, "loss": 0.0059, "step": 335780 }, { "epoch": 1.69, "learning_rate": 4.588443628254738e-05, "loss": 0.0071, "step": 335790 }, { "epoch": 1.69, "learning_rate": 4.5876868589533366e-05, "loss": 0.0055, "step": 335800 }, { "epoch": 1.69, "learning_rate": 4.586930089651936e-05, "loss": 0.0068, "step": 335810 }, { "epoch": 1.69, "learning_rate": 4.586173320350535e-05, "loss": 0.0072, "step": 335820 }, { "epoch": 1.69, "learning_rate": 4.585416551049134e-05, "loss": 0.0105, "step": 335830 }, { "epoch": 1.69, "learning_rate": 4.5846597817477326e-05, "loss": 0.0052, "step": 335840 }, { "epoch": 1.69, "learning_rate": 4.583903012446332e-05, "loss": 0.0067, "step": 335850 }, { "epoch": 1.69, "learning_rate": 4.583146243144931e-05, "loss": 0.0062, "step": 335860 }, { "epoch": 1.69, "learning_rate": 4.58238947384353e-05, "loss": 0.0067, "step": 335870 }, { "epoch": 1.69, "learning_rate": 4.5816327045421286e-05, "loss": 0.0083, "step": 335880 }, { "epoch": 1.69, "learning_rate": 4.580875935240728e-05, "loss": 0.0067, "step": 335890 }, { "epoch": 1.69, "learning_rate": 4.580119165939327e-05, "loss": 0.0049, "step": 335900 }, { "epoch": 1.69, "learning_rate": 4.579362396637926e-05, "loss": 0.0074, "step": 335910 }, { "epoch": 1.69, "learning_rate": 4.578605627336525e-05, "loss": 0.0057, "step": 335920 }, { "epoch": 1.69, "learning_rate": 4.577848858035124e-05, "loss": 0.0063, "step": 335930 }, { "epoch": 1.69, "learning_rate": 4.577092088733723e-05, "loss": 0.0054, "step": 335940 }, { "epoch": 1.69, "learning_rate": 4.576335319432322e-05, "loss": 0.0056, "step": 335950 }, { "epoch": 1.69, "learning_rate": 4.575578550130921e-05, "loss": 0.0079, "step": 335960 }, { "epoch": 1.7, "learning_rate": 4.57482178082952e-05, "loss": 0.0071, "step": 335970 }, { "epoch": 1.7, "learning_rate": 4.574065011528119e-05, "loss": 0.0078, "step": 335980 }, { "epoch": 1.7, "learning_rate": 4.5733082422267176e-05, "loss": 0.0053, "step": 335990 }, { "epoch": 1.7, "learning_rate": 4.572551472925317e-05, "loss": 0.0091, "step": 336000 }, { "epoch": 1.7, "eval_cer": 0.9144372624348985, "eval_loss": 0.004783105570822954, "eval_runtime": 116.4347, "eval_samples_per_second": 17.177, "eval_steps_per_second": 4.294, "step": 336000 }, { "epoch": 1.7, "learning_rate": 4.571794703623916e-05, "loss": 0.0069, "step": 336010 }, { "epoch": 1.7, "learning_rate": 4.571037934322515e-05, "loss": 0.0058, "step": 336020 }, { "epoch": 1.7, "learning_rate": 4.5702811650211136e-05, "loss": 0.0051, "step": 336030 }, { "epoch": 1.7, "learning_rate": 4.569524395719713e-05, "loss": 0.0056, "step": 336040 }, { "epoch": 1.7, "learning_rate": 4.568767626418312e-05, "loss": 0.0051, "step": 336050 }, { "epoch": 1.7, "learning_rate": 4.568010857116911e-05, "loss": 0.0053, "step": 336060 }, { "epoch": 1.7, "learning_rate": 4.567254087815509e-05, "loss": 0.0045, "step": 336070 }, { "epoch": 1.7, "learning_rate": 4.566497318514108e-05, "loss": 0.0095, "step": 336080 }, { "epoch": 1.7, "learning_rate": 4.565740549212707e-05, "loss": 0.0062, "step": 336090 }, { "epoch": 1.7, "learning_rate": 4.564983779911306e-05, "loss": 0.0072, "step": 336100 }, { "epoch": 1.7, "learning_rate": 4.564227010609905e-05, "loss": 0.0063, "step": 336110 }, { "epoch": 1.7, "learning_rate": 4.563470241308504e-05, "loss": 0.0064, "step": 336120 }, { "epoch": 1.7, "learning_rate": 4.562713472007103e-05, "loss": 0.0051, "step": 336130 }, { "epoch": 1.7, "learning_rate": 4.561956702705702e-05, "loss": 0.0052, "step": 336140 }, { "epoch": 1.7, "learning_rate": 4.561199933404301e-05, "loss": 0.0054, "step": 336150 }, { "epoch": 1.7, "learning_rate": 4.5604431641028996e-05, "loss": 0.0078, "step": 336160 }, { "epoch": 1.7, "learning_rate": 4.559686394801499e-05, "loss": 0.0081, "step": 336170 }, { "epoch": 1.7, "learning_rate": 4.558929625500098e-05, "loss": 0.0054, "step": 336180 }, { "epoch": 1.7, "learning_rate": 4.558172856198697e-05, "loss": 0.0065, "step": 336190 }, { "epoch": 1.7, "learning_rate": 4.5574160868972956e-05, "loss": 0.0063, "step": 336200 }, { "epoch": 1.7, "learning_rate": 4.556659317595895e-05, "loss": 0.0074, "step": 336210 }, { "epoch": 1.7, "learning_rate": 4.555902548294494e-05, "loss": 0.006, "step": 336220 }, { "epoch": 1.7, "learning_rate": 4.555145778993093e-05, "loss": 0.0054, "step": 336230 }, { "epoch": 1.7, "learning_rate": 4.5543890096916916e-05, "loss": 0.0071, "step": 336240 }, { "epoch": 1.7, "learning_rate": 4.553632240390291e-05, "loss": 0.0063, "step": 336250 }, { "epoch": 1.7, "learning_rate": 4.55287547108889e-05, "loss": 0.008, "step": 336260 }, { "epoch": 1.7, "learning_rate": 4.552118701787489e-05, "loss": 0.0064, "step": 336270 }, { "epoch": 1.7, "learning_rate": 4.5513619324860875e-05, "loss": 0.0058, "step": 336280 }, { "epoch": 1.7, "learning_rate": 4.550605163184687e-05, "loss": 0.0053, "step": 336290 }, { "epoch": 1.7, "learning_rate": 4.549848393883286e-05, "loss": 0.0078, "step": 336300 }, { "epoch": 1.7, "learning_rate": 4.549091624581885e-05, "loss": 0.0067, "step": 336310 }, { "epoch": 1.7, "learning_rate": 4.5483348552804835e-05, "loss": 0.0065, "step": 336320 }, { "epoch": 1.7, "learning_rate": 4.547578085979083e-05, "loss": 0.0051, "step": 336330 }, { "epoch": 1.7, "learning_rate": 4.546821316677682e-05, "loss": 0.0046, "step": 336340 }, { "epoch": 1.7, "learning_rate": 4.5460645473762806e-05, "loss": 0.0062, "step": 336350 }, { "epoch": 1.7, "learning_rate": 4.5453077780748795e-05, "loss": 0.0053, "step": 336360 }, { "epoch": 1.7, "learning_rate": 4.544551008773479e-05, "loss": 0.0066, "step": 336370 }, { "epoch": 1.7, "learning_rate": 4.543794239472077e-05, "loss": 0.0047, "step": 336380 }, { "epoch": 1.7, "learning_rate": 4.543037470170676e-05, "loss": 0.0074, "step": 336390 }, { "epoch": 1.7, "learning_rate": 4.542280700869275e-05, "loss": 0.006, "step": 336400 }, { "epoch": 1.7, "learning_rate": 4.541523931567874e-05, "loss": 0.0055, "step": 336410 }, { "epoch": 1.7, "learning_rate": 4.540767162266473e-05, "loss": 0.0057, "step": 336420 }, { "epoch": 1.7, "learning_rate": 4.540010392965072e-05, "loss": 0.0078, "step": 336430 }, { "epoch": 1.7, "learning_rate": 4.539253623663671e-05, "loss": 0.0083, "step": 336440 }, { "epoch": 1.7, "learning_rate": 4.53849685436227e-05, "loss": 0.0073, "step": 336450 }, { "epoch": 1.7, "learning_rate": 4.537740085060869e-05, "loss": 0.0081, "step": 336460 }, { "epoch": 1.7, "learning_rate": 4.536983315759468e-05, "loss": 0.0101, "step": 336470 }, { "epoch": 1.7, "learning_rate": 4.536226546458067e-05, "loss": 0.0045, "step": 336480 }, { "epoch": 1.7, "learning_rate": 4.535469777156666e-05, "loss": 0.0062, "step": 336490 }, { "epoch": 1.7, "learning_rate": 4.534713007855265e-05, "loss": 0.0068, "step": 336500 }, { "epoch": 1.7, "learning_rate": 4.533956238553864e-05, "loss": 0.0059, "step": 336510 }, { "epoch": 1.7, "learning_rate": 4.5331994692524626e-05, "loss": 0.0054, "step": 336520 }, { "epoch": 1.7, "learning_rate": 4.532442699951062e-05, "loss": 0.0053, "step": 336530 }, { "epoch": 1.7, "learning_rate": 4.531685930649661e-05, "loss": 0.0053, "step": 336540 }, { "epoch": 1.7, "learning_rate": 4.53092916134826e-05, "loss": 0.0074, "step": 336550 }, { "epoch": 1.7, "learning_rate": 4.5301723920468586e-05, "loss": 0.006, "step": 336560 }, { "epoch": 1.7, "learning_rate": 4.529415622745458e-05, "loss": 0.0074, "step": 336570 }, { "epoch": 1.7, "learning_rate": 4.528658853444057e-05, "loss": 0.008, "step": 336580 }, { "epoch": 1.7, "learning_rate": 4.527902084142656e-05, "loss": 0.0058, "step": 336590 }, { "epoch": 1.7, "learning_rate": 4.5271453148412546e-05, "loss": 0.0074, "step": 336600 }, { "epoch": 1.7, "learning_rate": 4.526388545539854e-05, "loss": 0.0058, "step": 336610 }, { "epoch": 1.7, "learning_rate": 4.525631776238453e-05, "loss": 0.0071, "step": 336620 }, { "epoch": 1.7, "learning_rate": 4.524875006937052e-05, "loss": 0.0054, "step": 336630 }, { "epoch": 1.7, "learning_rate": 4.5241182376356505e-05, "loss": 0.006, "step": 336640 }, { "epoch": 1.7, "learning_rate": 4.52336146833425e-05, "loss": 0.0074, "step": 336650 }, { "epoch": 1.7, "learning_rate": 4.522604699032849e-05, "loss": 0.0057, "step": 336660 }, { "epoch": 1.7, "learning_rate": 4.521847929731448e-05, "loss": 0.0073, "step": 336670 }, { "epoch": 1.7, "learning_rate": 4.5210911604300465e-05, "loss": 0.006, "step": 336680 }, { "epoch": 1.7, "learning_rate": 4.5203343911286446e-05, "loss": 0.0101, "step": 336690 }, { "epoch": 1.7, "learning_rate": 4.519577621827244e-05, "loss": 0.0062, "step": 336700 }, { "epoch": 1.7, "learning_rate": 4.518820852525843e-05, "loss": 0.0059, "step": 336710 }, { "epoch": 1.7, "learning_rate": 4.518064083224442e-05, "loss": 0.0092, "step": 336720 }, { "epoch": 1.7, "learning_rate": 4.5173073139230406e-05, "loss": 0.0065, "step": 336730 }, { "epoch": 1.7, "learning_rate": 4.51655054462164e-05, "loss": 0.0066, "step": 336740 }, { "epoch": 1.7, "learning_rate": 4.515793775320239e-05, "loss": 0.0131, "step": 336750 }, { "epoch": 1.7, "learning_rate": 4.515037006018838e-05, "loss": 0.0071, "step": 336760 }, { "epoch": 1.7, "learning_rate": 4.5142802367174366e-05, "loss": 0.0053, "step": 336770 }, { "epoch": 1.7, "learning_rate": 4.513523467416036e-05, "loss": 0.0057, "step": 336780 }, { "epoch": 1.7, "learning_rate": 4.512766698114635e-05, "loss": 0.0061, "step": 336790 }, { "epoch": 1.7, "learning_rate": 4.512009928813234e-05, "loss": 0.006, "step": 336800 }, { "epoch": 1.7, "learning_rate": 4.5112531595118325e-05, "loss": 0.0052, "step": 336810 }, { "epoch": 1.7, "learning_rate": 4.510496390210432e-05, "loss": 0.0057, "step": 336820 }, { "epoch": 1.7, "learning_rate": 4.509739620909031e-05, "loss": 0.0076, "step": 336830 }, { "epoch": 1.7, "learning_rate": 4.50898285160763e-05, "loss": 0.0068, "step": 336840 }, { "epoch": 1.7, "learning_rate": 4.5082260823062285e-05, "loss": 0.0063, "step": 336850 }, { "epoch": 1.7, "learning_rate": 4.507469313004828e-05, "loss": 0.0075, "step": 336860 }, { "epoch": 1.7, "learning_rate": 4.506712543703427e-05, "loss": 0.0063, "step": 336870 }, { "epoch": 1.7, "learning_rate": 4.5059557744020257e-05, "loss": 0.0067, "step": 336880 }, { "epoch": 1.7, "learning_rate": 4.505199005100625e-05, "loss": 0.0069, "step": 336890 }, { "epoch": 1.7, "learning_rate": 4.504442235799224e-05, "loss": 0.0053, "step": 336900 }, { "epoch": 1.7, "learning_rate": 4.503685466497823e-05, "loss": 0.0047, "step": 336910 }, { "epoch": 1.7, "learning_rate": 4.5029286971964216e-05, "loss": 0.0073, "step": 336920 }, { "epoch": 1.7, "learning_rate": 4.502171927895021e-05, "loss": 0.006, "step": 336930 }, { "epoch": 1.7, "learning_rate": 4.50141515859362e-05, "loss": 0.0068, "step": 336940 }, { "epoch": 1.7, "learning_rate": 4.500658389292219e-05, "loss": 0.006, "step": 336950 }, { "epoch": 1.7, "learning_rate": 4.4999016199908176e-05, "loss": 0.0063, "step": 336960 }, { "epoch": 1.7, "learning_rate": 4.499144850689417e-05, "loss": 0.0073, "step": 336970 }, { "epoch": 1.7, "learning_rate": 4.498388081388016e-05, "loss": 0.0079, "step": 336980 }, { "epoch": 1.7, "learning_rate": 4.497631312086615e-05, "loss": 0.0066, "step": 336990 }, { "epoch": 1.7, "learning_rate": 4.4968745427852135e-05, "loss": 0.0093, "step": 337000 }, { "epoch": 1.7, "eval_cer": 0.9144333808503969, "eval_loss": 0.004760997835546732, "eval_runtime": 116.4296, "eval_samples_per_second": 17.178, "eval_steps_per_second": 4.294, "step": 337000 }, { "epoch": 1.7, "learning_rate": 4.496117773483812e-05, "loss": 0.0047, "step": 337010 }, { "epoch": 1.7, "learning_rate": 4.495361004182411e-05, "loss": 0.0063, "step": 337020 }, { "epoch": 1.7, "learning_rate": 4.49460423488101e-05, "loss": 0.0046, "step": 337030 }, { "epoch": 1.7, "learning_rate": 4.493847465579609e-05, "loss": 0.0063, "step": 337040 }, { "epoch": 1.7, "learning_rate": 4.4930906962782077e-05, "loss": 0.0099, "step": 337050 }, { "epoch": 1.7, "learning_rate": 4.492333926976807e-05, "loss": 0.0069, "step": 337060 }, { "epoch": 1.7, "learning_rate": 4.491577157675406e-05, "loss": 0.0062, "step": 337070 }, { "epoch": 1.7, "learning_rate": 4.490820388374005e-05, "loss": 0.0075, "step": 337080 }, { "epoch": 1.7, "learning_rate": 4.4900636190726036e-05, "loss": 0.0078, "step": 337090 }, { "epoch": 1.7, "learning_rate": 4.489306849771203e-05, "loss": 0.0058, "step": 337100 }, { "epoch": 1.7, "learning_rate": 4.488550080469802e-05, "loss": 0.0065, "step": 337110 }, { "epoch": 1.7, "learning_rate": 4.487793311168401e-05, "loss": 0.0054, "step": 337120 }, { "epoch": 1.7, "learning_rate": 4.4870365418669996e-05, "loss": 0.0059, "step": 337130 }, { "epoch": 1.7, "learning_rate": 4.486279772565599e-05, "loss": 0.0052, "step": 337140 }, { "epoch": 1.7, "learning_rate": 4.485523003264198e-05, "loss": 0.007, "step": 337150 }, { "epoch": 1.7, "learning_rate": 4.484766233962797e-05, "loss": 0.0076, "step": 337160 }, { "epoch": 1.7, "learning_rate": 4.4840094646613956e-05, "loss": 0.0063, "step": 337170 }, { "epoch": 1.7, "learning_rate": 4.483252695359995e-05, "loss": 0.0064, "step": 337180 }, { "epoch": 1.7, "learning_rate": 4.482495926058594e-05, "loss": 0.0086, "step": 337190 }, { "epoch": 1.7, "learning_rate": 4.481739156757193e-05, "loss": 0.0061, "step": 337200 }, { "epoch": 1.7, "learning_rate": 4.4809823874557915e-05, "loss": 0.0081, "step": 337210 }, { "epoch": 1.7, "learning_rate": 4.480225618154391e-05, "loss": 0.0066, "step": 337220 }, { "epoch": 1.7, "learning_rate": 4.47946884885299e-05, "loss": 0.004, "step": 337230 }, { "epoch": 1.7, "learning_rate": 4.4787120795515887e-05, "loss": 0.0083, "step": 337240 }, { "epoch": 1.7, "learning_rate": 4.4779553102501875e-05, "loss": 0.0059, "step": 337250 }, { "epoch": 1.7, "learning_rate": 4.477198540948787e-05, "loss": 0.0072, "step": 337260 }, { "epoch": 1.7, "learning_rate": 4.476441771647386e-05, "loss": 0.0081, "step": 337270 }, { "epoch": 1.7, "learning_rate": 4.4756850023459846e-05, "loss": 0.0069, "step": 337280 }, { "epoch": 1.7, "learning_rate": 4.4749282330445834e-05, "loss": 0.0051, "step": 337290 }, { "epoch": 1.7, "learning_rate": 4.474171463743183e-05, "loss": 0.0052, "step": 337300 }, { "epoch": 1.7, "learning_rate": 4.473414694441782e-05, "loss": 0.0058, "step": 337310 }, { "epoch": 1.7, "learning_rate": 4.47265792514038e-05, "loss": 0.0069, "step": 337320 }, { "epoch": 1.7, "learning_rate": 4.471901155838979e-05, "loss": 0.0078, "step": 337330 }, { "epoch": 1.7, "learning_rate": 4.4711443865375776e-05, "loss": 0.0058, "step": 337340 }, { "epoch": 1.7, "learning_rate": 4.470387617236177e-05, "loss": 0.0075, "step": 337350 }, { "epoch": 1.7, "learning_rate": 4.469630847934776e-05, "loss": 0.0071, "step": 337360 }, { "epoch": 1.7, "learning_rate": 4.468874078633375e-05, "loss": 0.0091, "step": 337370 }, { "epoch": 1.7, "learning_rate": 4.468117309331974e-05, "loss": 0.0056, "step": 337380 }, { "epoch": 1.7, "learning_rate": 4.467360540030573e-05, "loss": 0.0069, "step": 337390 }, { "epoch": 1.7, "learning_rate": 4.466603770729172e-05, "loss": 0.0068, "step": 337400 }, { "epoch": 1.7, "learning_rate": 4.465847001427771e-05, "loss": 0.0066, "step": 337410 }, { "epoch": 1.7, "learning_rate": 4.46509023212637e-05, "loss": 0.0051, "step": 337420 }, { "epoch": 1.7, "learning_rate": 4.464333462824969e-05, "loss": 0.0067, "step": 337430 }, { "epoch": 1.7, "learning_rate": 4.463576693523568e-05, "loss": 0.0064, "step": 337440 }, { "epoch": 1.7, "learning_rate": 4.4628199242221666e-05, "loss": 0.0078, "step": 337450 }, { "epoch": 1.7, "learning_rate": 4.462063154920766e-05, "loss": 0.0059, "step": 337460 }, { "epoch": 1.7, "learning_rate": 4.461306385619365e-05, "loss": 0.0077, "step": 337470 }, { "epoch": 1.7, "learning_rate": 4.460549616317964e-05, "loss": 0.0059, "step": 337480 }, { "epoch": 1.7, "learning_rate": 4.4597928470165626e-05, "loss": 0.0067, "step": 337490 }, { "epoch": 1.7, "learning_rate": 4.459036077715162e-05, "loss": 0.0036, "step": 337500 }, { "epoch": 1.7, "learning_rate": 4.458279308413761e-05, "loss": 0.0088, "step": 337510 }, { "epoch": 1.7, "learning_rate": 4.45752253911236e-05, "loss": 0.0046, "step": 337520 }, { "epoch": 1.7, "learning_rate": 4.4567657698109586e-05, "loss": 0.006, "step": 337530 }, { "epoch": 1.7, "learning_rate": 4.456009000509558e-05, "loss": 0.0055, "step": 337540 }, { "epoch": 1.7, "learning_rate": 4.455252231208157e-05, "loss": 0.006, "step": 337550 }, { "epoch": 1.7, "learning_rate": 4.454495461906756e-05, "loss": 0.0061, "step": 337560 }, { "epoch": 1.7, "learning_rate": 4.4537386926053545e-05, "loss": 0.0077, "step": 337570 }, { "epoch": 1.7, "learning_rate": 4.452981923303954e-05, "loss": 0.0061, "step": 337580 }, { "epoch": 1.7, "learning_rate": 4.452225154002553e-05, "loss": 0.0047, "step": 337590 }, { "epoch": 1.7, "learning_rate": 4.451468384701152e-05, "loss": 0.0062, "step": 337600 }, { "epoch": 1.7, "learning_rate": 4.4507116153997505e-05, "loss": 0.0073, "step": 337610 }, { "epoch": 1.7, "learning_rate": 4.44995484609835e-05, "loss": 0.0052, "step": 337620 }, { "epoch": 1.7, "learning_rate": 4.449198076796949e-05, "loss": 0.0055, "step": 337630 }, { "epoch": 1.7, "learning_rate": 4.448441307495547e-05, "loss": 0.0051, "step": 337640 }, { "epoch": 1.7, "learning_rate": 4.447684538194146e-05, "loss": 0.0088, "step": 337650 }, { "epoch": 1.7, "learning_rate": 4.4469277688927446e-05, "loss": 0.0046, "step": 337660 }, { "epoch": 1.7, "learning_rate": 4.446170999591344e-05, "loss": 0.0065, "step": 337670 }, { "epoch": 1.7, "learning_rate": 4.445414230289943e-05, "loss": 0.0053, "step": 337680 }, { "epoch": 1.7, "learning_rate": 4.444657460988542e-05, "loss": 0.0069, "step": 337690 }, { "epoch": 1.7, "learning_rate": 4.4439006916871406e-05, "loss": 0.0086, "step": 337700 }, { "epoch": 1.7, "learning_rate": 4.44314392238574e-05, "loss": 0.0049, "step": 337710 }, { "epoch": 1.7, "learning_rate": 4.442387153084339e-05, "loss": 0.0051, "step": 337720 }, { "epoch": 1.7, "learning_rate": 4.441630383782938e-05, "loss": 0.0066, "step": 337730 }, { "epoch": 1.7, "learning_rate": 4.4408736144815365e-05, "loss": 0.0051, "step": 337740 }, { "epoch": 1.7, "learning_rate": 4.440116845180136e-05, "loss": 0.0081, "step": 337750 }, { "epoch": 1.7, "learning_rate": 4.439360075878735e-05, "loss": 0.0089, "step": 337760 }, { "epoch": 1.7, "learning_rate": 4.438603306577334e-05, "loss": 0.0074, "step": 337770 }, { "epoch": 1.7, "learning_rate": 4.4378465372759325e-05, "loss": 0.0059, "step": 337780 }, { "epoch": 1.7, "learning_rate": 4.437089767974532e-05, "loss": 0.0081, "step": 337790 }, { "epoch": 1.7, "learning_rate": 4.436332998673131e-05, "loss": 0.0053, "step": 337800 }, { "epoch": 1.7, "learning_rate": 4.4355762293717296e-05, "loss": 0.0054, "step": 337810 }, { "epoch": 1.7, "learning_rate": 4.4348194600703285e-05, "loss": 0.0073, "step": 337820 }, { "epoch": 1.7, "learning_rate": 4.434062690768928e-05, "loss": 0.0065, "step": 337830 }, { "epoch": 1.7, "learning_rate": 4.433305921467527e-05, "loss": 0.0059, "step": 337840 }, { "epoch": 1.7, "learning_rate": 4.4325491521661256e-05, "loss": 0.0074, "step": 337850 }, { "epoch": 1.7, "learning_rate": 4.431792382864725e-05, "loss": 0.0055, "step": 337860 }, { "epoch": 1.7, "learning_rate": 4.431035613563324e-05, "loss": 0.0066, "step": 337870 }, { "epoch": 1.7, "learning_rate": 4.430278844261923e-05, "loss": 0.0077, "step": 337880 }, { "epoch": 1.7, "learning_rate": 4.4295220749605216e-05, "loss": 0.0065, "step": 337890 }, { "epoch": 1.7, "learning_rate": 4.428765305659121e-05, "loss": 0.006, "step": 337900 }, { "epoch": 1.7, "learning_rate": 4.42800853635772e-05, "loss": 0.0057, "step": 337910 }, { "epoch": 1.7, "learning_rate": 4.427251767056319e-05, "loss": 0.0091, "step": 337920 }, { "epoch": 1.7, "learning_rate": 4.4264949977549175e-05, "loss": 0.005, "step": 337930 }, { "epoch": 1.7, "learning_rate": 4.425738228453517e-05, "loss": 0.0074, "step": 337940 }, { "epoch": 1.7, "learning_rate": 4.424981459152115e-05, "loss": 0.0055, "step": 337950 }, { "epoch": 1.71, "learning_rate": 4.424224689850714e-05, "loss": 0.0051, "step": 337960 }, { "epoch": 1.71, "learning_rate": 4.423467920549313e-05, "loss": 0.0061, "step": 337970 }, { "epoch": 1.71, "learning_rate": 4.4227111512479116e-05, "loss": 0.0051, "step": 337980 }, { "epoch": 1.71, "learning_rate": 4.421954381946511e-05, "loss": 0.0076, "step": 337990 }, { "epoch": 1.71, "learning_rate": 4.42119761264511e-05, "loss": 0.0061, "step": 338000 }, { "epoch": 1.71, "eval_cer": 0.9144197953046413, "eval_loss": 0.004835808649659157, "eval_runtime": 116.338, "eval_samples_per_second": 17.191, "eval_steps_per_second": 4.298, "step": 338000 }, { "epoch": 1.71, "learning_rate": 4.420440843343709e-05, "loss": 0.0052, "step": 338010 }, { "epoch": 1.71, "learning_rate": 4.4196840740423076e-05, "loss": 0.0073, "step": 338020 }, { "epoch": 1.71, "learning_rate": 4.418927304740907e-05, "loss": 0.0061, "step": 338030 }, { "epoch": 1.71, "learning_rate": 4.418170535439506e-05, "loss": 0.0081, "step": 338040 }, { "epoch": 1.71, "learning_rate": 4.417413766138105e-05, "loss": 0.0062, "step": 338050 }, { "epoch": 1.71, "learning_rate": 4.4166569968367036e-05, "loss": 0.0063, "step": 338060 }, { "epoch": 1.71, "learning_rate": 4.415900227535303e-05, "loss": 0.0064, "step": 338070 }, { "epoch": 1.71, "learning_rate": 4.415143458233902e-05, "loss": 0.0085, "step": 338080 }, { "epoch": 1.71, "learning_rate": 4.414386688932501e-05, "loss": 0.0073, "step": 338090 }, { "epoch": 1.71, "learning_rate": 4.4136299196310995e-05, "loss": 0.0043, "step": 338100 }, { "epoch": 1.71, "learning_rate": 4.412873150329699e-05, "loss": 0.006, "step": 338110 }, { "epoch": 1.71, "learning_rate": 4.412116381028298e-05, "loss": 0.0068, "step": 338120 }, { "epoch": 1.71, "learning_rate": 4.411359611726897e-05, "loss": 0.0068, "step": 338130 }, { "epoch": 1.71, "learning_rate": 4.4106028424254955e-05, "loss": 0.007, "step": 338140 }, { "epoch": 1.71, "learning_rate": 4.409846073124095e-05, "loss": 0.0064, "step": 338150 }, { "epoch": 1.71, "learning_rate": 4.409089303822694e-05, "loss": 0.006, "step": 338160 }, { "epoch": 1.71, "learning_rate": 4.4083325345212926e-05, "loss": 0.0074, "step": 338170 }, { "epoch": 1.71, "learning_rate": 4.4075757652198915e-05, "loss": 0.0069, "step": 338180 }, { "epoch": 1.71, "learning_rate": 4.406818995918491e-05, "loss": 0.0075, "step": 338190 }, { "epoch": 1.71, "learning_rate": 4.40606222661709e-05, "loss": 0.007, "step": 338200 }, { "epoch": 1.71, "learning_rate": 4.4053054573156886e-05, "loss": 0.0054, "step": 338210 }, { "epoch": 1.71, "learning_rate": 4.4045486880142874e-05, "loss": 0.0054, "step": 338220 }, { "epoch": 1.71, "learning_rate": 4.403791918712887e-05, "loss": 0.0064, "step": 338230 }, { "epoch": 1.71, "learning_rate": 4.403035149411486e-05, "loss": 0.0067, "step": 338240 }, { "epoch": 1.71, "learning_rate": 4.4022783801100846e-05, "loss": 0.0066, "step": 338250 }, { "epoch": 1.71, "learning_rate": 4.401521610808683e-05, "loss": 0.0067, "step": 338260 }, { "epoch": 1.71, "learning_rate": 4.4007648415072815e-05, "loss": 0.0086, "step": 338270 }, { "epoch": 1.71, "learning_rate": 4.400008072205881e-05, "loss": 0.0064, "step": 338280 }, { "epoch": 1.71, "learning_rate": 4.39925130290448e-05, "loss": 0.0062, "step": 338290 }, { "epoch": 1.71, "learning_rate": 4.398494533603079e-05, "loss": 0.0055, "step": 338300 }, { "epoch": 1.71, "learning_rate": 4.3977377643016775e-05, "loss": 0.0065, "step": 338310 }, { "epoch": 1.71, "learning_rate": 4.396980995000277e-05, "loss": 0.0056, "step": 338320 }, { "epoch": 1.71, "learning_rate": 4.396224225698876e-05, "loss": 0.0073, "step": 338330 }, { "epoch": 1.71, "learning_rate": 4.3954674563974747e-05, "loss": 0.0077, "step": 338340 }, { "epoch": 1.71, "learning_rate": 4.394710687096074e-05, "loss": 0.0057, "step": 338350 }, { "epoch": 1.71, "learning_rate": 4.393953917794673e-05, "loss": 0.0068, "step": 338360 }, { "epoch": 1.71, "learning_rate": 4.393197148493272e-05, "loss": 0.0055, "step": 338370 }, { "epoch": 1.71, "learning_rate": 4.3924403791918706e-05, "loss": 0.0074, "step": 338380 }, { "epoch": 1.71, "learning_rate": 4.39168360989047e-05, "loss": 0.0068, "step": 338390 }, { "epoch": 1.71, "learning_rate": 4.390926840589069e-05, "loss": 0.0083, "step": 338400 }, { "epoch": 1.71, "learning_rate": 4.390170071287668e-05, "loss": 0.0039, "step": 338410 }, { "epoch": 1.71, "learning_rate": 4.3894133019862666e-05, "loss": 0.0062, "step": 338420 }, { "epoch": 1.71, "learning_rate": 4.388656532684866e-05, "loss": 0.006, "step": 338430 }, { "epoch": 1.71, "learning_rate": 4.387899763383465e-05, "loss": 0.0053, "step": 338440 }, { "epoch": 1.71, "learning_rate": 4.387142994082064e-05, "loss": 0.0062, "step": 338450 }, { "epoch": 1.71, "learning_rate": 4.3863862247806625e-05, "loss": 0.0075, "step": 338460 }, { "epoch": 1.71, "learning_rate": 4.385629455479262e-05, "loss": 0.0064, "step": 338470 }, { "epoch": 1.71, "learning_rate": 4.384872686177861e-05, "loss": 0.0044, "step": 338480 }, { "epoch": 1.71, "learning_rate": 4.38411591687646e-05, "loss": 0.0056, "step": 338490 }, { "epoch": 1.71, "learning_rate": 4.3833591475750585e-05, "loss": 0.0052, "step": 338500 }, { "epoch": 1.71, "learning_rate": 4.382602378273658e-05, "loss": 0.0062, "step": 338510 }, { "epoch": 1.71, "learning_rate": 4.381845608972257e-05, "loss": 0.0057, "step": 338520 }, { "epoch": 1.71, "learning_rate": 4.3810888396708557e-05, "loss": 0.0059, "step": 338530 }, { "epoch": 1.71, "learning_rate": 4.3803320703694545e-05, "loss": 0.0097, "step": 338540 }, { "epoch": 1.71, "learning_rate": 4.379575301068054e-05, "loss": 0.0064, "step": 338550 }, { "epoch": 1.71, "learning_rate": 4.378818531766653e-05, "loss": 0.0055, "step": 338560 }, { "epoch": 1.71, "learning_rate": 4.3780617624652516e-05, "loss": 0.0067, "step": 338570 }, { "epoch": 1.71, "learning_rate": 4.37730499316385e-05, "loss": 0.0058, "step": 338580 }, { "epoch": 1.71, "learning_rate": 4.3765482238624486e-05, "loss": 0.0065, "step": 338590 }, { "epoch": 1.71, "learning_rate": 4.375791454561048e-05, "loss": 0.005, "step": 338600 }, { "epoch": 1.71, "learning_rate": 4.375034685259647e-05, "loss": 0.0068, "step": 338610 }, { "epoch": 1.71, "learning_rate": 4.374277915958246e-05, "loss": 0.0063, "step": 338620 }, { "epoch": 1.71, "learning_rate": 4.3735211466568446e-05, "loss": 0.0051, "step": 338630 }, { "epoch": 1.71, "learning_rate": 4.372764377355444e-05, "loss": 0.0058, "step": 338640 }, { "epoch": 1.71, "learning_rate": 4.372007608054043e-05, "loss": 0.0053, "step": 338650 }, { "epoch": 1.71, "learning_rate": 4.371250838752642e-05, "loss": 0.005, "step": 338660 }, { "epoch": 1.71, "learning_rate": 4.3704940694512405e-05, "loss": 0.0071, "step": 338670 }, { "epoch": 1.71, "learning_rate": 4.36973730014984e-05, "loss": 0.006, "step": 338680 }, { "epoch": 1.71, "learning_rate": 4.368980530848439e-05, "loss": 0.008, "step": 338690 }, { "epoch": 1.71, "learning_rate": 4.3682237615470377e-05, "loss": 0.0083, "step": 338700 }, { "epoch": 1.71, "learning_rate": 4.3674669922456365e-05, "loss": 0.0058, "step": 338710 }, { "epoch": 1.71, "learning_rate": 4.366710222944236e-05, "loss": 0.0097, "step": 338720 }, { "epoch": 1.71, "learning_rate": 4.365953453642835e-05, "loss": 0.0068, "step": 338730 }, { "epoch": 1.71, "learning_rate": 4.3651966843414336e-05, "loss": 0.0063, "step": 338740 }, { "epoch": 1.71, "learning_rate": 4.3644399150400324e-05, "loss": 0.0063, "step": 338750 }, { "epoch": 1.71, "learning_rate": 4.363683145738632e-05, "loss": 0.0098, "step": 338760 }, { "epoch": 1.71, "learning_rate": 4.362926376437231e-05, "loss": 0.0066, "step": 338770 }, { "epoch": 1.71, "learning_rate": 4.3621696071358296e-05, "loss": 0.0088, "step": 338780 }, { "epoch": 1.71, "learning_rate": 4.3614128378344284e-05, "loss": 0.0079, "step": 338790 }, { "epoch": 1.71, "learning_rate": 4.360656068533028e-05, "loss": 0.0072, "step": 338800 }, { "epoch": 1.71, "learning_rate": 4.359899299231627e-05, "loss": 0.0053, "step": 338810 }, { "epoch": 1.71, "learning_rate": 4.3591425299302256e-05, "loss": 0.0056, "step": 338820 }, { "epoch": 1.71, "learning_rate": 4.358385760628825e-05, "loss": 0.0082, "step": 338830 }, { "epoch": 1.71, "learning_rate": 4.357628991327424e-05, "loss": 0.0049, "step": 338840 }, { "epoch": 1.71, "learning_rate": 4.356872222026023e-05, "loss": 0.0061, "step": 338850 }, { "epoch": 1.71, "learning_rate": 4.3561154527246215e-05, "loss": 0.005, "step": 338860 }, { "epoch": 1.71, "learning_rate": 4.355358683423221e-05, "loss": 0.0063, "step": 338870 }, { "epoch": 1.71, "learning_rate": 4.35460191412182e-05, "loss": 0.0066, "step": 338880 }, { "epoch": 1.71, "learning_rate": 4.353845144820418e-05, "loss": 0.0061, "step": 338890 }, { "epoch": 1.71, "learning_rate": 4.353088375519017e-05, "loss": 0.0038, "step": 338900 }, { "epoch": 1.71, "learning_rate": 4.3523316062176156e-05, "loss": 0.006, "step": 338910 }, { "epoch": 1.71, "learning_rate": 4.351574836916215e-05, "loss": 0.0068, "step": 338920 }, { "epoch": 1.71, "learning_rate": 4.350818067614814e-05, "loss": 0.0049, "step": 338930 }, { "epoch": 1.71, "learning_rate": 4.350061298313413e-05, "loss": 0.0044, "step": 338940 }, { "epoch": 1.71, "learning_rate": 4.3493045290120116e-05, "loss": 0.0057, "step": 338950 }, { "epoch": 1.71, "learning_rate": 4.348547759710611e-05, "loss": 0.008, "step": 338960 }, { "epoch": 1.71, "learning_rate": 4.34779099040921e-05, "loss": 0.0053, "step": 338970 }, { "epoch": 1.71, "learning_rate": 4.347034221107809e-05, "loss": 0.0043, "step": 338980 }, { "epoch": 1.71, "learning_rate": 4.3462774518064076e-05, "loss": 0.0088, "step": 338990 }, { "epoch": 1.71, "learning_rate": 4.345520682505007e-05, "loss": 0.0057, "step": 339000 }, { "epoch": 1.71, "eval_cer": 0.9144285288697699, "eval_loss": 0.0047121611423790455, "eval_runtime": 116.4797, "eval_samples_per_second": 17.17, "eval_steps_per_second": 4.293, "step": 339000 }, { "epoch": 1.71, "learning_rate": 4.344763913203606e-05, "loss": 0.0056, "step": 339010 }, { "epoch": 1.71, "learning_rate": 4.344007143902205e-05, "loss": 0.0057, "step": 339020 }, { "epoch": 1.71, "learning_rate": 4.3432503746008035e-05, "loss": 0.0096, "step": 339030 }, { "epoch": 1.71, "learning_rate": 4.342493605299403e-05, "loss": 0.0079, "step": 339040 }, { "epoch": 1.71, "learning_rate": 4.341736835998002e-05, "loss": 0.0053, "step": 339050 }, { "epoch": 1.71, "learning_rate": 4.340980066696601e-05, "loss": 0.0053, "step": 339060 }, { "epoch": 1.71, "learning_rate": 4.3402232973951995e-05, "loss": 0.0061, "step": 339070 }, { "epoch": 1.71, "learning_rate": 4.339466528093799e-05, "loss": 0.0059, "step": 339080 }, { "epoch": 1.71, "learning_rate": 4.338709758792398e-05, "loss": 0.0054, "step": 339090 }, { "epoch": 1.71, "learning_rate": 4.3379529894909966e-05, "loss": 0.006, "step": 339100 }, { "epoch": 1.71, "learning_rate": 4.3371962201895955e-05, "loss": 0.006, "step": 339110 }, { "epoch": 1.71, "learning_rate": 4.336439450888195e-05, "loss": 0.0072, "step": 339120 }, { "epoch": 1.71, "learning_rate": 4.335682681586794e-05, "loss": 0.0068, "step": 339130 }, { "epoch": 1.71, "learning_rate": 4.3349259122853926e-05, "loss": 0.0074, "step": 339140 }, { "epoch": 1.71, "learning_rate": 4.3341691429839914e-05, "loss": 0.006, "step": 339150 }, { "epoch": 1.71, "learning_rate": 4.333412373682591e-05, "loss": 0.0088, "step": 339160 }, { "epoch": 1.71, "learning_rate": 4.33265560438119e-05, "loss": 0.0069, "step": 339170 }, { "epoch": 1.71, "learning_rate": 4.3318988350797886e-05, "loss": 0.0055, "step": 339180 }, { "epoch": 1.71, "learning_rate": 4.3311420657783874e-05, "loss": 0.0068, "step": 339190 }, { "epoch": 1.71, "learning_rate": 4.330385296476987e-05, "loss": 0.0065, "step": 339200 }, { "epoch": 1.71, "learning_rate": 4.329628527175585e-05, "loss": 0.0048, "step": 339210 }, { "epoch": 1.71, "learning_rate": 4.328871757874184e-05, "loss": 0.0055, "step": 339220 }, { "epoch": 1.71, "learning_rate": 4.328114988572783e-05, "loss": 0.0065, "step": 339230 }, { "epoch": 1.71, "learning_rate": 4.3273582192713815e-05, "loss": 0.0081, "step": 339240 }, { "epoch": 1.71, "learning_rate": 4.326601449969981e-05, "loss": 0.0062, "step": 339250 }, { "epoch": 1.71, "learning_rate": 4.32584468066858e-05, "loss": 0.006, "step": 339260 }, { "epoch": 1.71, "learning_rate": 4.3250879113671786e-05, "loss": 0.0072, "step": 339270 }, { "epoch": 1.71, "learning_rate": 4.3243311420657775e-05, "loss": 0.0056, "step": 339280 }, { "epoch": 1.71, "learning_rate": 4.323574372764377e-05, "loss": 0.0035, "step": 339290 }, { "epoch": 1.71, "learning_rate": 4.322817603462976e-05, "loss": 0.0066, "step": 339300 }, { "epoch": 1.71, "learning_rate": 4.3220608341615746e-05, "loss": 0.0064, "step": 339310 }, { "epoch": 1.71, "learning_rate": 4.321304064860174e-05, "loss": 0.0061, "step": 339320 }, { "epoch": 1.71, "learning_rate": 4.320547295558773e-05, "loss": 0.0085, "step": 339330 }, { "epoch": 1.71, "learning_rate": 4.319790526257372e-05, "loss": 0.0052, "step": 339340 }, { "epoch": 1.71, "learning_rate": 4.3190337569559706e-05, "loss": 0.0055, "step": 339350 }, { "epoch": 1.71, "learning_rate": 4.31827698765457e-05, "loss": 0.0058, "step": 339360 }, { "epoch": 1.71, "learning_rate": 4.317520218353169e-05, "loss": 0.008, "step": 339370 }, { "epoch": 1.71, "learning_rate": 4.316763449051768e-05, "loss": 0.0047, "step": 339380 }, { "epoch": 1.71, "learning_rate": 4.3160066797503665e-05, "loss": 0.0064, "step": 339390 }, { "epoch": 1.71, "learning_rate": 4.315249910448966e-05, "loss": 0.0051, "step": 339400 }, { "epoch": 1.71, "learning_rate": 4.314493141147565e-05, "loss": 0.0086, "step": 339410 }, { "epoch": 1.71, "learning_rate": 4.313736371846164e-05, "loss": 0.0058, "step": 339420 }, { "epoch": 1.71, "learning_rate": 4.3129796025447625e-05, "loss": 0.0042, "step": 339430 }, { "epoch": 1.71, "learning_rate": 4.312222833243362e-05, "loss": 0.0052, "step": 339440 }, { "epoch": 1.71, "learning_rate": 4.311466063941961e-05, "loss": 0.0068, "step": 339450 }, { "epoch": 1.71, "learning_rate": 4.3107092946405596e-05, "loss": 0.0057, "step": 339460 }, { "epoch": 1.71, "learning_rate": 4.3099525253391585e-05, "loss": 0.0072, "step": 339470 }, { "epoch": 1.71, "learning_rate": 4.309195756037758e-05, "loss": 0.0063, "step": 339480 }, { "epoch": 1.71, "learning_rate": 4.308438986736357e-05, "loss": 0.0076, "step": 339490 }, { "epoch": 1.71, "learning_rate": 4.3076822174349556e-05, "loss": 0.0069, "step": 339500 }, { "epoch": 1.71, "learning_rate": 4.3069254481335544e-05, "loss": 0.0092, "step": 339510 }, { "epoch": 1.71, "learning_rate": 4.3061686788321526e-05, "loss": 0.0055, "step": 339520 }, { "epoch": 1.71, "learning_rate": 4.305411909530752e-05, "loss": 0.0074, "step": 339530 }, { "epoch": 1.71, "learning_rate": 4.304655140229351e-05, "loss": 0.0057, "step": 339540 }, { "epoch": 1.71, "learning_rate": 4.30389837092795e-05, "loss": 0.0046, "step": 339550 }, { "epoch": 1.71, "learning_rate": 4.3031416016265485e-05, "loss": 0.0076, "step": 339560 }, { "epoch": 1.71, "learning_rate": 4.302384832325148e-05, "loss": 0.0076, "step": 339570 }, { "epoch": 1.71, "learning_rate": 4.301628063023747e-05, "loss": 0.0079, "step": 339580 }, { "epoch": 1.71, "learning_rate": 4.300871293722346e-05, "loss": 0.0073, "step": 339590 }, { "epoch": 1.71, "learning_rate": 4.3001145244209445e-05, "loss": 0.0071, "step": 339600 }, { "epoch": 1.71, "learning_rate": 4.299357755119544e-05, "loss": 0.0081, "step": 339610 }, { "epoch": 1.71, "learning_rate": 4.298600985818143e-05, "loss": 0.0052, "step": 339620 }, { "epoch": 1.71, "learning_rate": 4.2978442165167416e-05, "loss": 0.0045, "step": 339630 }, { "epoch": 1.71, "learning_rate": 4.2970874472153405e-05, "loss": 0.0059, "step": 339640 }, { "epoch": 1.71, "learning_rate": 4.29633067791394e-05, "loss": 0.0093, "step": 339650 }, { "epoch": 1.71, "learning_rate": 4.295573908612539e-05, "loss": 0.0054, "step": 339660 }, { "epoch": 1.71, "learning_rate": 4.2948171393111376e-05, "loss": 0.0073, "step": 339670 }, { "epoch": 1.71, "learning_rate": 4.2940603700097364e-05, "loss": 0.0057, "step": 339680 }, { "epoch": 1.71, "learning_rate": 4.293303600708336e-05, "loss": 0.0059, "step": 339690 }, { "epoch": 1.71, "learning_rate": 4.292546831406935e-05, "loss": 0.0089, "step": 339700 }, { "epoch": 1.71, "learning_rate": 4.2917900621055336e-05, "loss": 0.0073, "step": 339710 }, { "epoch": 1.71, "learning_rate": 4.2910332928041324e-05, "loss": 0.0065, "step": 339720 }, { "epoch": 1.71, "learning_rate": 4.290276523502732e-05, "loss": 0.0063, "step": 339730 }, { "epoch": 1.71, "learning_rate": 4.289519754201331e-05, "loss": 0.0082, "step": 339740 }, { "epoch": 1.71, "learning_rate": 4.2887629848999295e-05, "loss": 0.0068, "step": 339750 }, { "epoch": 1.71, "learning_rate": 4.2880062155985284e-05, "loss": 0.0062, "step": 339760 }, { "epoch": 1.71, "learning_rate": 4.287249446297128e-05, "loss": 0.006, "step": 339770 }, { "epoch": 1.71, "learning_rate": 4.286492676995727e-05, "loss": 0.0077, "step": 339780 }, { "epoch": 1.71, "learning_rate": 4.2857359076943255e-05, "loss": 0.0062, "step": 339790 }, { "epoch": 1.71, "learning_rate": 4.284979138392925e-05, "loss": 0.0059, "step": 339800 }, { "epoch": 1.71, "learning_rate": 4.284222369091524e-05, "loss": 0.0071, "step": 339810 }, { "epoch": 1.71, "learning_rate": 4.2834655997901227e-05, "loss": 0.0053, "step": 339820 }, { "epoch": 1.71, "learning_rate": 4.2827088304887215e-05, "loss": 0.0069, "step": 339830 }, { "epoch": 1.71, "learning_rate": 4.2819520611873196e-05, "loss": 0.0071, "step": 339840 }, { "epoch": 1.71, "learning_rate": 4.281195291885919e-05, "loss": 0.0059, "step": 339850 }, { "epoch": 1.71, "learning_rate": 4.280438522584518e-05, "loss": 0.0069, "step": 339860 }, { "epoch": 1.71, "learning_rate": 4.279681753283117e-05, "loss": 0.0058, "step": 339870 }, { "epoch": 1.71, "learning_rate": 4.2789249839817156e-05, "loss": 0.0058, "step": 339880 }, { "epoch": 1.71, "learning_rate": 4.278168214680315e-05, "loss": 0.0055, "step": 339890 }, { "epoch": 1.71, "learning_rate": 4.277411445378914e-05, "loss": 0.0046, "step": 339900 }, { "epoch": 1.71, "learning_rate": 4.276654676077513e-05, "loss": 0.0054, "step": 339910 }, { "epoch": 1.71, "learning_rate": 4.2758979067761115e-05, "loss": 0.006, "step": 339920 }, { "epoch": 1.71, "learning_rate": 4.275141137474711e-05, "loss": 0.0065, "step": 339930 }, { "epoch": 1.72, "learning_rate": 4.27438436817331e-05, "loss": 0.0072, "step": 339940 }, { "epoch": 1.72, "learning_rate": 4.273627598871909e-05, "loss": 0.0046, "step": 339950 }, { "epoch": 1.72, "learning_rate": 4.2728708295705075e-05, "loss": 0.0049, "step": 339960 }, { "epoch": 1.72, "learning_rate": 4.272114060269107e-05, "loss": 0.0051, "step": 339970 }, { "epoch": 1.72, "learning_rate": 4.271357290967706e-05, "loss": 0.0068, "step": 339980 }, { "epoch": 1.72, "learning_rate": 4.2706005216663047e-05, "loss": 0.0073, "step": 339990 }, { "epoch": 1.72, "learning_rate": 4.2698437523649035e-05, "loss": 0.0059, "step": 340000 }, { "epoch": 1.72, "eval_cer": 0.9144217360968921, "eval_loss": 0.004758994095027447, "eval_runtime": 116.784, "eval_samples_per_second": 17.126, "eval_steps_per_second": 4.281, "step": 340000 }, { "epoch": 1.72, "learning_rate": 4.269086983063503e-05, "loss": 0.0051, "step": 340010 }, { "epoch": 1.72, "learning_rate": 4.268330213762102e-05, "loss": 0.009, "step": 340020 }, { "epoch": 1.72, "learning_rate": 4.2675734444607006e-05, "loss": 0.0068, "step": 340030 }, { "epoch": 1.72, "learning_rate": 4.2668166751592994e-05, "loss": 0.0054, "step": 340040 }, { "epoch": 1.72, "learning_rate": 4.266059905857899e-05, "loss": 0.0063, "step": 340050 }, { "epoch": 1.72, "learning_rate": 4.265303136556498e-05, "loss": 0.0078, "step": 340060 }, { "epoch": 1.72, "learning_rate": 4.2645463672550966e-05, "loss": 0.006, "step": 340070 }, { "epoch": 1.72, "learning_rate": 4.2637895979536954e-05, "loss": 0.005, "step": 340080 }, { "epoch": 1.72, "learning_rate": 4.263032828652295e-05, "loss": 0.0083, "step": 340090 }, { "epoch": 1.72, "learning_rate": 4.262276059350894e-05, "loss": 0.005, "step": 340100 }, { "epoch": 1.72, "learning_rate": 4.2615192900494926e-05, "loss": 0.006, "step": 340110 }, { "epoch": 1.72, "learning_rate": 4.2607625207480914e-05, "loss": 0.0039, "step": 340120 }, { "epoch": 1.72, "learning_rate": 4.260005751446691e-05, "loss": 0.0057, "step": 340130 }, { "epoch": 1.72, "learning_rate": 4.25924898214529e-05, "loss": 0.0061, "step": 340140 }, { "epoch": 1.72, "learning_rate": 4.258492212843888e-05, "loss": 0.0055, "step": 340150 }, { "epoch": 1.72, "learning_rate": 4.2577354435424867e-05, "loss": 0.0045, "step": 340160 }, { "epoch": 1.72, "learning_rate": 4.2569786742410855e-05, "loss": 0.0068, "step": 340170 }, { "epoch": 1.72, "learning_rate": 4.256221904939685e-05, "loss": 0.0073, "step": 340180 }, { "epoch": 1.72, "learning_rate": 4.255465135638284e-05, "loss": 0.0052, "step": 340190 }, { "epoch": 1.72, "learning_rate": 4.2547083663368826e-05, "loss": 0.0063, "step": 340200 }, { "epoch": 1.72, "learning_rate": 4.2539515970354814e-05, "loss": 0.0065, "step": 340210 }, { "epoch": 1.72, "learning_rate": 4.253194827734081e-05, "loss": 0.0062, "step": 340220 }, { "epoch": 1.72, "learning_rate": 4.25243805843268e-05, "loss": 0.0036, "step": 340230 }, { "epoch": 1.72, "learning_rate": 4.2516812891312786e-05, "loss": 0.0061, "step": 340240 }, { "epoch": 1.72, "learning_rate": 4.2509245198298774e-05, "loss": 0.0046, "step": 340250 }, { "epoch": 1.72, "learning_rate": 4.250167750528477e-05, "loss": 0.006, "step": 340260 }, { "epoch": 1.72, "learning_rate": 4.249410981227076e-05, "loss": 0.0045, "step": 340270 }, { "epoch": 1.72, "learning_rate": 4.2486542119256746e-05, "loss": 0.008, "step": 340280 }, { "epoch": 1.72, "learning_rate": 4.247897442624274e-05, "loss": 0.0056, "step": 340290 }, { "epoch": 1.72, "learning_rate": 4.247140673322873e-05, "loss": 0.0051, "step": 340300 }, { "epoch": 1.72, "learning_rate": 4.246383904021472e-05, "loss": 0.0075, "step": 340310 }, { "epoch": 1.72, "learning_rate": 4.2456271347200705e-05, "loss": 0.009, "step": 340320 }, { "epoch": 1.72, "learning_rate": 4.24487036541867e-05, "loss": 0.0065, "step": 340330 }, { "epoch": 1.72, "learning_rate": 4.244113596117269e-05, "loss": 0.0075, "step": 340340 }, { "epoch": 1.72, "learning_rate": 4.243356826815868e-05, "loss": 0.0053, "step": 340350 }, { "epoch": 1.72, "learning_rate": 4.2426000575144665e-05, "loss": 0.006, "step": 340360 }, { "epoch": 1.72, "learning_rate": 4.241843288213066e-05, "loss": 0.0073, "step": 340370 }, { "epoch": 1.72, "learning_rate": 4.241086518911665e-05, "loss": 0.0066, "step": 340380 }, { "epoch": 1.72, "learning_rate": 4.2403297496102636e-05, "loss": 0.0062, "step": 340390 }, { "epoch": 1.72, "learning_rate": 4.2395729803088625e-05, "loss": 0.0073, "step": 340400 }, { "epoch": 1.72, "learning_rate": 4.238816211007462e-05, "loss": 0.008, "step": 340410 }, { "epoch": 1.72, "learning_rate": 4.238059441706061e-05, "loss": 0.0076, "step": 340420 }, { "epoch": 1.72, "learning_rate": 4.2373026724046596e-05, "loss": 0.007, "step": 340430 }, { "epoch": 1.72, "learning_rate": 4.2365459031032584e-05, "loss": 0.0072, "step": 340440 }, { "epoch": 1.72, "learning_rate": 4.235789133801858e-05, "loss": 0.006, "step": 340450 }, { "epoch": 1.72, "learning_rate": 4.235032364500456e-05, "loss": 0.0092, "step": 340460 }, { "epoch": 1.72, "learning_rate": 4.234275595199055e-05, "loss": 0.0055, "step": 340470 }, { "epoch": 1.72, "learning_rate": 4.233518825897654e-05, "loss": 0.0064, "step": 340480 }, { "epoch": 1.72, "learning_rate": 4.2327620565962525e-05, "loss": 0.0072, "step": 340490 }, { "epoch": 1.72, "learning_rate": 4.232005287294852e-05, "loss": 0.0061, "step": 340500 }, { "epoch": 1.72, "learning_rate": 4.231248517993451e-05, "loss": 0.0072, "step": 340510 }, { "epoch": 1.72, "learning_rate": 4.23049174869205e-05, "loss": 0.0052, "step": 340520 }, { "epoch": 1.72, "learning_rate": 4.2297349793906485e-05, "loss": 0.0049, "step": 340530 }, { "epoch": 1.72, "learning_rate": 4.228978210089248e-05, "loss": 0.0066, "step": 340540 }, { "epoch": 1.72, "learning_rate": 4.228221440787847e-05, "loss": 0.0053, "step": 340550 }, { "epoch": 1.72, "learning_rate": 4.2274646714864456e-05, "loss": 0.0096, "step": 340560 }, { "epoch": 1.72, "learning_rate": 4.2267079021850445e-05, "loss": 0.0053, "step": 340570 }, { "epoch": 1.72, "learning_rate": 4.225951132883644e-05, "loss": 0.0084, "step": 340580 }, { "epoch": 1.72, "learning_rate": 4.225194363582243e-05, "loss": 0.0061, "step": 340590 }, { "epoch": 1.72, "learning_rate": 4.2244375942808416e-05, "loss": 0.007, "step": 340600 }, { "epoch": 1.72, "learning_rate": 4.2236808249794404e-05, "loss": 0.0062, "step": 340610 }, { "epoch": 1.72, "learning_rate": 4.22292405567804e-05, "loss": 0.0078, "step": 340620 }, { "epoch": 1.72, "learning_rate": 4.222167286376639e-05, "loss": 0.0053, "step": 340630 }, { "epoch": 1.72, "learning_rate": 4.2214105170752376e-05, "loss": 0.0128, "step": 340640 }, { "epoch": 1.72, "learning_rate": 4.2206537477738364e-05, "loss": 0.005, "step": 340650 }, { "epoch": 1.72, "learning_rate": 4.219896978472436e-05, "loss": 0.0052, "step": 340660 }, { "epoch": 1.72, "learning_rate": 4.219140209171035e-05, "loss": 0.0058, "step": 340670 }, { "epoch": 1.72, "learning_rate": 4.2183834398696335e-05, "loss": 0.0069, "step": 340680 }, { "epoch": 1.72, "learning_rate": 4.2176266705682324e-05, "loss": 0.0061, "step": 340690 }, { "epoch": 1.72, "learning_rate": 4.216869901266832e-05, "loss": 0.0078, "step": 340700 }, { "epoch": 1.72, "learning_rate": 4.216113131965431e-05, "loss": 0.0069, "step": 340710 }, { "epoch": 1.72, "learning_rate": 4.2153563626640295e-05, "loss": 0.007, "step": 340720 }, { "epoch": 1.72, "learning_rate": 4.214599593362628e-05, "loss": 0.0065, "step": 340730 }, { "epoch": 1.72, "learning_rate": 4.213842824061228e-05, "loss": 0.0075, "step": 340740 }, { "epoch": 1.72, "learning_rate": 4.2130860547598266e-05, "loss": 0.0069, "step": 340750 }, { "epoch": 1.72, "learning_rate": 4.2123292854584255e-05, "loss": 0.0065, "step": 340760 }, { "epoch": 1.72, "learning_rate": 4.211572516157025e-05, "loss": 0.0065, "step": 340770 }, { "epoch": 1.72, "learning_rate": 4.210815746855623e-05, "loss": 0.0082, "step": 340780 }, { "epoch": 1.72, "learning_rate": 4.210058977554222e-05, "loss": 0.0045, "step": 340790 }, { "epoch": 1.72, "learning_rate": 4.209302208252821e-05, "loss": 0.0057, "step": 340800 }, { "epoch": 1.72, "learning_rate": 4.2085454389514196e-05, "loss": 0.0063, "step": 340810 }, { "epoch": 1.72, "learning_rate": 4.207788669650019e-05, "loss": 0.0062, "step": 340820 }, { "epoch": 1.72, "learning_rate": 4.207031900348618e-05, "loss": 0.0097, "step": 340830 }, { "epoch": 1.72, "learning_rate": 4.206275131047217e-05, "loss": 0.0082, "step": 340840 }, { "epoch": 1.72, "learning_rate": 4.2055183617458155e-05, "loss": 0.0061, "step": 340850 }, { "epoch": 1.72, "learning_rate": 4.204761592444415e-05, "loss": 0.0058, "step": 340860 }, { "epoch": 1.72, "learning_rate": 4.204004823143014e-05, "loss": 0.0086, "step": 340870 }, { "epoch": 1.72, "learning_rate": 4.203248053841613e-05, "loss": 0.0055, "step": 340880 }, { "epoch": 1.72, "learning_rate": 4.2024912845402115e-05, "loss": 0.0048, "step": 340890 }, { "epoch": 1.72, "learning_rate": 4.201734515238811e-05, "loss": 0.0063, "step": 340900 }, { "epoch": 1.72, "learning_rate": 4.20097774593741e-05, "loss": 0.0054, "step": 340910 }, { "epoch": 1.72, "learning_rate": 4.2002209766360086e-05, "loss": 0.0048, "step": 340920 }, { "epoch": 1.72, "learning_rate": 4.1994642073346075e-05, "loss": 0.0056, "step": 340930 }, { "epoch": 1.72, "learning_rate": 4.198707438033207e-05, "loss": 0.0067, "step": 340940 }, { "epoch": 1.72, "learning_rate": 4.197950668731806e-05, "loss": 0.0076, "step": 340950 }, { "epoch": 1.72, "learning_rate": 4.1971938994304046e-05, "loss": 0.0057, "step": 340960 }, { "epoch": 1.72, "learning_rate": 4.1964371301290034e-05, "loss": 0.006, "step": 340970 }, { "epoch": 1.72, "learning_rate": 4.195680360827603e-05, "loss": 0.0066, "step": 340980 }, { "epoch": 1.72, "learning_rate": 4.194923591526202e-05, "loss": 0.0058, "step": 340990 }, { "epoch": 1.72, "learning_rate": 4.1941668222248006e-05, "loss": 0.0053, "step": 341000 }, { "epoch": 1.72, "eval_cer": 0.9144285288697699, "eval_loss": 0.00470845028758049, "eval_runtime": 116.8214, "eval_samples_per_second": 17.12, "eval_steps_per_second": 4.28, "step": 341000 }, { "epoch": 1.72, "learning_rate": 4.1934100529233994e-05, "loss": 0.0051, "step": 341010 }, { "epoch": 1.72, "learning_rate": 4.192653283621999e-05, "loss": 0.0075, "step": 341020 }, { "epoch": 1.72, "learning_rate": 4.191896514320598e-05, "loss": 0.0072, "step": 341030 }, { "epoch": 1.72, "learning_rate": 4.1911397450191965e-05, "loss": 0.007, "step": 341040 }, { "epoch": 1.72, "learning_rate": 4.1903829757177954e-05, "loss": 0.0043, "step": 341050 }, { "epoch": 1.72, "learning_rate": 4.189626206416395e-05, "loss": 0.0071, "step": 341060 }, { "epoch": 1.72, "learning_rate": 4.188869437114994e-05, "loss": 0.0068, "step": 341070 }, { "epoch": 1.72, "learning_rate": 4.1881126678135925e-05, "loss": 0.0062, "step": 341080 }, { "epoch": 1.72, "learning_rate": 4.1873558985121906e-05, "loss": 0.005, "step": 341090 }, { "epoch": 1.72, "learning_rate": 4.1865991292107895e-05, "loss": 0.0064, "step": 341100 }, { "epoch": 1.72, "learning_rate": 4.185842359909389e-05, "loss": 0.0053, "step": 341110 }, { "epoch": 1.72, "learning_rate": 4.185085590607988e-05, "loss": 0.008, "step": 341120 }, { "epoch": 1.72, "learning_rate": 4.1843288213065866e-05, "loss": 0.0063, "step": 341130 }, { "epoch": 1.72, "learning_rate": 4.1835720520051854e-05, "loss": 0.0068, "step": 341140 }, { "epoch": 1.72, "learning_rate": 4.182815282703785e-05, "loss": 0.0061, "step": 341150 }, { "epoch": 1.72, "learning_rate": 4.182058513402384e-05, "loss": 0.0113, "step": 341160 }, { "epoch": 1.72, "learning_rate": 4.1813017441009826e-05, "loss": 0.0062, "step": 341170 }, { "epoch": 1.72, "learning_rate": 4.1805449747995814e-05, "loss": 0.005, "step": 341180 }, { "epoch": 1.72, "learning_rate": 4.179788205498181e-05, "loss": 0.0057, "step": 341190 }, { "epoch": 1.72, "learning_rate": 4.17903143619678e-05, "loss": 0.007, "step": 341200 }, { "epoch": 1.72, "learning_rate": 4.1782746668953785e-05, "loss": 0.0044, "step": 341210 }, { "epoch": 1.72, "learning_rate": 4.1775178975939774e-05, "loss": 0.006, "step": 341220 }, { "epoch": 1.72, "learning_rate": 4.176761128292577e-05, "loss": 0.0066, "step": 341230 }, { "epoch": 1.72, "learning_rate": 4.176004358991176e-05, "loss": 0.0058, "step": 341240 }, { "epoch": 1.72, "learning_rate": 4.1752475896897745e-05, "loss": 0.006, "step": 341250 }, { "epoch": 1.72, "learning_rate": 4.174490820388374e-05, "loss": 0.008, "step": 341260 }, { "epoch": 1.72, "learning_rate": 4.173734051086973e-05, "loss": 0.0061, "step": 341270 }, { "epoch": 1.72, "learning_rate": 4.1729772817855717e-05, "loss": 0.0052, "step": 341280 }, { "epoch": 1.72, "learning_rate": 4.1722205124841705e-05, "loss": 0.005, "step": 341290 }, { "epoch": 1.72, "learning_rate": 4.17146374318277e-05, "loss": 0.008, "step": 341300 }, { "epoch": 1.72, "learning_rate": 4.170706973881369e-05, "loss": 0.0053, "step": 341310 }, { "epoch": 1.72, "learning_rate": 4.1699502045799676e-05, "loss": 0.0055, "step": 341320 }, { "epoch": 1.72, "learning_rate": 4.1691934352785664e-05, "loss": 0.0079, "step": 341330 }, { "epoch": 1.72, "learning_rate": 4.168436665977166e-05, "loss": 0.0067, "step": 341340 }, { "epoch": 1.72, "learning_rate": 4.167679896675765e-05, "loss": 0.0054, "step": 341350 }, { "epoch": 1.72, "learning_rate": 4.1669231273743636e-05, "loss": 0.0045, "step": 341360 }, { "epoch": 1.72, "learning_rate": 4.1661663580729624e-05, "loss": 0.0064, "step": 341370 }, { "epoch": 1.72, "learning_rate": 4.165409588771562e-05, "loss": 0.0085, "step": 341380 }, { "epoch": 1.72, "learning_rate": 4.164652819470161e-05, "loss": 0.0081, "step": 341390 }, { "epoch": 1.72, "learning_rate": 4.1638960501687595e-05, "loss": 0.0069, "step": 341400 }, { "epoch": 1.72, "learning_rate": 4.163139280867358e-05, "loss": 0.0059, "step": 341410 }, { "epoch": 1.72, "learning_rate": 4.1623825115659565e-05, "loss": 0.0055, "step": 341420 }, { "epoch": 1.72, "learning_rate": 4.161625742264556e-05, "loss": 0.0084, "step": 341430 }, { "epoch": 1.72, "learning_rate": 4.160868972963155e-05, "loss": 0.0103, "step": 341440 }, { "epoch": 1.72, "learning_rate": 4.1601122036617537e-05, "loss": 0.008, "step": 341450 }, { "epoch": 1.72, "learning_rate": 4.1593554343603525e-05, "loss": 0.0066, "step": 341460 }, { "epoch": 1.72, "learning_rate": 4.158598665058952e-05, "loss": 0.0068, "step": 341470 }, { "epoch": 1.72, "learning_rate": 4.157841895757551e-05, "loss": 0.0056, "step": 341480 }, { "epoch": 1.72, "learning_rate": 4.1570851264561496e-05, "loss": 0.0064, "step": 341490 }, { "epoch": 1.72, "learning_rate": 4.1563283571547484e-05, "loss": 0.0059, "step": 341500 }, { "epoch": 1.72, "learning_rate": 4.155571587853348e-05, "loss": 0.0075, "step": 341510 }, { "epoch": 1.72, "learning_rate": 4.154814818551947e-05, "loss": 0.0071, "step": 341520 }, { "epoch": 1.72, "learning_rate": 4.1540580492505456e-05, "loss": 0.0058, "step": 341530 }, { "epoch": 1.72, "learning_rate": 4.1533012799491444e-05, "loss": 0.0074, "step": 341540 }, { "epoch": 1.72, "learning_rate": 4.152544510647744e-05, "loss": 0.0079, "step": 341550 }, { "epoch": 1.72, "learning_rate": 4.151787741346343e-05, "loss": 0.0065, "step": 341560 }, { "epoch": 1.72, "learning_rate": 4.1510309720449416e-05, "loss": 0.0062, "step": 341570 }, { "epoch": 1.72, "learning_rate": 4.1502742027435404e-05, "loss": 0.0051, "step": 341580 }, { "epoch": 1.72, "learning_rate": 4.14951743344214e-05, "loss": 0.0048, "step": 341590 }, { "epoch": 1.72, "learning_rate": 4.148760664140739e-05, "loss": 0.0072, "step": 341600 }, { "epoch": 1.72, "learning_rate": 4.1480038948393375e-05, "loss": 0.0066, "step": 341610 }, { "epoch": 1.72, "learning_rate": 4.1472471255379363e-05, "loss": 0.0046, "step": 341620 }, { "epoch": 1.72, "learning_rate": 4.146490356236536e-05, "loss": 0.0052, "step": 341630 }, { "epoch": 1.72, "learning_rate": 4.1457335869351347e-05, "loss": 0.0059, "step": 341640 }, { "epoch": 1.72, "learning_rate": 4.1449768176337335e-05, "loss": 0.0054, "step": 341650 }, { "epoch": 1.72, "learning_rate": 4.144220048332332e-05, "loss": 0.0076, "step": 341660 }, { "epoch": 1.72, "learning_rate": 4.143463279030932e-05, "loss": 0.0065, "step": 341670 }, { "epoch": 1.72, "learning_rate": 4.1427065097295306e-05, "loss": 0.0062, "step": 341680 }, { "epoch": 1.72, "learning_rate": 4.1419497404281294e-05, "loss": 0.0076, "step": 341690 }, { "epoch": 1.72, "learning_rate": 4.141192971126728e-05, "loss": 0.0071, "step": 341700 }, { "epoch": 1.72, "learning_rate": 4.140436201825328e-05, "loss": 0.0058, "step": 341710 }, { "epoch": 1.72, "learning_rate": 4.139679432523926e-05, "loss": 0.0105, "step": 341720 }, { "epoch": 1.72, "learning_rate": 4.138922663222525e-05, "loss": 0.0065, "step": 341730 }, { "epoch": 1.72, "learning_rate": 4.1381658939211236e-05, "loss": 0.0053, "step": 341740 }, { "epoch": 1.72, "learning_rate": 4.137409124619723e-05, "loss": 0.0054, "step": 341750 }, { "epoch": 1.72, "learning_rate": 4.136652355318322e-05, "loss": 0.0069, "step": 341760 }, { "epoch": 1.72, "learning_rate": 4.135895586016921e-05, "loss": 0.0062, "step": 341770 }, { "epoch": 1.72, "learning_rate": 4.1351388167155195e-05, "loss": 0.0079, "step": 341780 }, { "epoch": 1.72, "learning_rate": 4.134382047414119e-05, "loss": 0.0088, "step": 341790 }, { "epoch": 1.72, "learning_rate": 4.133625278112718e-05, "loss": 0.0043, "step": 341800 }, { "epoch": 1.72, "learning_rate": 4.132868508811317e-05, "loss": 0.0067, "step": 341810 }, { "epoch": 1.72, "learning_rate": 4.1321117395099155e-05, "loss": 0.0071, "step": 341820 }, { "epoch": 1.72, "learning_rate": 4.131354970208515e-05, "loss": 0.0077, "step": 341830 }, { "epoch": 1.72, "learning_rate": 4.130598200907114e-05, "loss": 0.0054, "step": 341840 }, { "epoch": 1.72, "learning_rate": 4.1298414316057126e-05, "loss": 0.0046, "step": 341850 }, { "epoch": 1.72, "learning_rate": 4.1290846623043115e-05, "loss": 0.006, "step": 341860 }, { "epoch": 1.72, "learning_rate": 4.128327893002911e-05, "loss": 0.006, "step": 341870 }, { "epoch": 1.72, "learning_rate": 4.12757112370151e-05, "loss": 0.0065, "step": 341880 }, { "epoch": 1.72, "learning_rate": 4.1268143544001086e-05, "loss": 0.005, "step": 341890 }, { "epoch": 1.72, "learning_rate": 4.1260575850987074e-05, "loss": 0.0054, "step": 341900 }, { "epoch": 1.72, "learning_rate": 4.125300815797307e-05, "loss": 0.0073, "step": 341910 }, { "epoch": 1.73, "learning_rate": 4.124544046495906e-05, "loss": 0.0047, "step": 341920 }, { "epoch": 1.73, "learning_rate": 4.1237872771945046e-05, "loss": 0.0055, "step": 341930 }, { "epoch": 1.73, "learning_rate": 4.1230305078931034e-05, "loss": 0.0078, "step": 341940 }, { "epoch": 1.73, "learning_rate": 4.122273738591703e-05, "loss": 0.0069, "step": 341950 }, { "epoch": 1.73, "learning_rate": 4.121516969290302e-05, "loss": 0.0068, "step": 341960 }, { "epoch": 1.73, "learning_rate": 4.1207601999889005e-05, "loss": 0.0088, "step": 341970 }, { "epoch": 1.73, "learning_rate": 4.1200034306874993e-05, "loss": 0.0068, "step": 341980 }, { "epoch": 1.73, "learning_rate": 4.119246661386099e-05, "loss": 0.0071, "step": 341990 }, { "epoch": 1.73, "learning_rate": 4.118489892084698e-05, "loss": 0.0068, "step": 342000 }, { "epoch": 1.73, "eval_cer": 0.9144217360968921, "eval_loss": 0.004726854152977467, "eval_runtime": 116.8239, "eval_samples_per_second": 17.12, "eval_steps_per_second": 4.28, "step": 342000 }, { "epoch": 1.73, "learning_rate": 4.1177331227832965e-05, "loss": 0.0063, "step": 342010 }, { "epoch": 1.73, "learning_rate": 4.116976353481895e-05, "loss": 0.0071, "step": 342020 }, { "epoch": 1.73, "learning_rate": 4.116219584180495e-05, "loss": 0.0046, "step": 342030 }, { "epoch": 1.73, "learning_rate": 4.115462814879093e-05, "loss": 0.0056, "step": 342040 }, { "epoch": 1.73, "learning_rate": 4.114706045577692e-05, "loss": 0.0053, "step": 342050 }, { "epoch": 1.73, "learning_rate": 4.1139492762762906e-05, "loss": 0.0069, "step": 342060 }, { "epoch": 1.73, "learning_rate": 4.1131925069748894e-05, "loss": 0.0048, "step": 342070 }, { "epoch": 1.73, "learning_rate": 4.112435737673489e-05, "loss": 0.0054, "step": 342080 }, { "epoch": 1.73, "learning_rate": 4.111678968372088e-05, "loss": 0.0062, "step": 342090 }, { "epoch": 1.73, "learning_rate": 4.1109221990706866e-05, "loss": 0.0048, "step": 342100 }, { "epoch": 1.73, "learning_rate": 4.1101654297692854e-05, "loss": 0.0073, "step": 342110 }, { "epoch": 1.73, "learning_rate": 4.109408660467885e-05, "loss": 0.0064, "step": 342120 }, { "epoch": 1.73, "learning_rate": 4.108651891166484e-05, "loss": 0.0045, "step": 342130 }, { "epoch": 1.73, "learning_rate": 4.1078951218650825e-05, "loss": 0.0069, "step": 342140 }, { "epoch": 1.73, "learning_rate": 4.1071383525636814e-05, "loss": 0.0068, "step": 342150 }, { "epoch": 1.73, "learning_rate": 4.106381583262281e-05, "loss": 0.0057, "step": 342160 }, { "epoch": 1.73, "learning_rate": 4.10562481396088e-05, "loss": 0.0061, "step": 342170 }, { "epoch": 1.73, "learning_rate": 4.1048680446594785e-05, "loss": 0.0061, "step": 342180 }, { "epoch": 1.73, "learning_rate": 4.104111275358077e-05, "loss": 0.0098, "step": 342190 }, { "epoch": 1.73, "learning_rate": 4.103354506056677e-05, "loss": 0.0062, "step": 342200 }, { "epoch": 1.73, "learning_rate": 4.1025977367552756e-05, "loss": 0.0056, "step": 342210 }, { "epoch": 1.73, "learning_rate": 4.1018409674538745e-05, "loss": 0.0046, "step": 342220 }, { "epoch": 1.73, "learning_rate": 4.101084198152474e-05, "loss": 0.0079, "step": 342230 }, { "epoch": 1.73, "learning_rate": 4.100327428851073e-05, "loss": 0.0059, "step": 342240 }, { "epoch": 1.73, "learning_rate": 4.0995706595496716e-05, "loss": 0.0053, "step": 342250 }, { "epoch": 1.73, "learning_rate": 4.0988138902482704e-05, "loss": 0.0065, "step": 342260 }, { "epoch": 1.73, "learning_rate": 4.09805712094687e-05, "loss": 0.0084, "step": 342270 }, { "epoch": 1.73, "learning_rate": 4.097300351645469e-05, "loss": 0.0067, "step": 342280 }, { "epoch": 1.73, "learning_rate": 4.0965435823440676e-05, "loss": 0.0063, "step": 342290 }, { "epoch": 1.73, "learning_rate": 4.0957868130426664e-05, "loss": 0.0072, "step": 342300 }, { "epoch": 1.73, "learning_rate": 4.095030043741266e-05, "loss": 0.0047, "step": 342310 }, { "epoch": 1.73, "learning_rate": 4.094273274439865e-05, "loss": 0.0089, "step": 342320 }, { "epoch": 1.73, "learning_rate": 4.0935165051384635e-05, "loss": 0.0066, "step": 342330 }, { "epoch": 1.73, "learning_rate": 4.0927597358370624e-05, "loss": 0.0065, "step": 342340 }, { "epoch": 1.73, "learning_rate": 4.0920029665356605e-05, "loss": 0.0095, "step": 342350 }, { "epoch": 1.73, "learning_rate": 4.09124619723426e-05, "loss": 0.0055, "step": 342360 }, { "epoch": 1.73, "learning_rate": 4.090489427932859e-05, "loss": 0.0069, "step": 342370 }, { "epoch": 1.73, "learning_rate": 4.0897326586314576e-05, "loss": 0.0068, "step": 342380 }, { "epoch": 1.73, "learning_rate": 4.0889758893300565e-05, "loss": 0.0051, "step": 342390 }, { "epoch": 1.73, "learning_rate": 4.088219120028656e-05, "loss": 0.0047, "step": 342400 }, { "epoch": 1.73, "learning_rate": 4.087462350727255e-05, "loss": 0.0069, "step": 342410 }, { "epoch": 1.73, "learning_rate": 4.0867055814258536e-05, "loss": 0.0069, "step": 342420 }, { "epoch": 1.73, "learning_rate": 4.0859488121244524e-05, "loss": 0.0048, "step": 342430 }, { "epoch": 1.73, "learning_rate": 4.085192042823052e-05, "loss": 0.006, "step": 342440 }, { "epoch": 1.73, "learning_rate": 4.084435273521651e-05, "loss": 0.007, "step": 342450 }, { "epoch": 1.73, "learning_rate": 4.0836785042202496e-05, "loss": 0.0052, "step": 342460 }, { "epoch": 1.73, "learning_rate": 4.0829217349188484e-05, "loss": 0.0079, "step": 342470 }, { "epoch": 1.73, "learning_rate": 4.082164965617448e-05, "loss": 0.0064, "step": 342480 }, { "epoch": 1.73, "learning_rate": 4.081408196316047e-05, "loss": 0.0064, "step": 342490 }, { "epoch": 1.73, "learning_rate": 4.0806514270146455e-05, "loss": 0.007, "step": 342500 }, { "epoch": 1.73, "learning_rate": 4.0798946577132444e-05, "loss": 0.0072, "step": 342510 }, { "epoch": 1.73, "learning_rate": 4.079137888411844e-05, "loss": 0.0057, "step": 342520 }, { "epoch": 1.73, "learning_rate": 4.078381119110443e-05, "loss": 0.007, "step": 342530 }, { "epoch": 1.73, "learning_rate": 4.0776243498090415e-05, "loss": 0.0066, "step": 342540 }, { "epoch": 1.73, "learning_rate": 4.07686758050764e-05, "loss": 0.0059, "step": 342550 }, { "epoch": 1.73, "learning_rate": 4.07611081120624e-05, "loss": 0.0103, "step": 342560 }, { "epoch": 1.73, "learning_rate": 4.0753540419048386e-05, "loss": 0.0053, "step": 342570 }, { "epoch": 1.73, "learning_rate": 4.0745972726034375e-05, "loss": 0.0115, "step": 342580 }, { "epoch": 1.73, "learning_rate": 4.073840503302036e-05, "loss": 0.0059, "step": 342590 }, { "epoch": 1.73, "learning_rate": 4.073083734000636e-05, "loss": 0.0067, "step": 342600 }, { "epoch": 1.73, "learning_rate": 4.0723269646992346e-05, "loss": 0.0077, "step": 342610 }, { "epoch": 1.73, "learning_rate": 4.0715701953978334e-05, "loss": 0.0071, "step": 342620 }, { "epoch": 1.73, "learning_rate": 4.070813426096432e-05, "loss": 0.0063, "step": 342630 }, { "epoch": 1.73, "learning_rate": 4.070056656795032e-05, "loss": 0.0078, "step": 342640 }, { "epoch": 1.73, "learning_rate": 4.0692998874936306e-05, "loss": 0.0079, "step": 342650 }, { "epoch": 1.73, "learning_rate": 4.068543118192229e-05, "loss": 0.0065, "step": 342660 }, { "epoch": 1.73, "learning_rate": 4.0677863488908275e-05, "loss": 0.0073, "step": 342670 }, { "epoch": 1.73, "learning_rate": 4.067029579589427e-05, "loss": 0.0058, "step": 342680 }, { "epoch": 1.73, "learning_rate": 4.066272810288026e-05, "loss": 0.007, "step": 342690 }, { "epoch": 1.73, "learning_rate": 4.065516040986625e-05, "loss": 0.0076, "step": 342700 }, { "epoch": 1.73, "learning_rate": 4.0647592716852235e-05, "loss": 0.0068, "step": 342710 }, { "epoch": 1.73, "learning_rate": 4.064002502383823e-05, "loss": 0.009, "step": 342720 }, { "epoch": 1.73, "learning_rate": 4.063245733082422e-05, "loss": 0.007, "step": 342730 }, { "epoch": 1.73, "learning_rate": 4.0624889637810207e-05, "loss": 0.0054, "step": 342740 }, { "epoch": 1.73, "learning_rate": 4.0617321944796195e-05, "loss": 0.0063, "step": 342750 }, { "epoch": 1.73, "learning_rate": 4.060975425178219e-05, "loss": 0.0059, "step": 342760 }, { "epoch": 1.73, "learning_rate": 4.060218655876818e-05, "loss": 0.0069, "step": 342770 }, { "epoch": 1.73, "learning_rate": 4.0594618865754166e-05, "loss": 0.0049, "step": 342780 }, { "epoch": 1.73, "learning_rate": 4.0587051172740154e-05, "loss": 0.0064, "step": 342790 }, { "epoch": 1.73, "learning_rate": 4.057948347972615e-05, "loss": 0.0067, "step": 342800 }, { "epoch": 1.73, "learning_rate": 4.057191578671214e-05, "loss": 0.0055, "step": 342810 }, { "epoch": 1.73, "learning_rate": 4.0564348093698126e-05, "loss": 0.0057, "step": 342820 }, { "epoch": 1.73, "learning_rate": 4.0556780400684114e-05, "loss": 0.0058, "step": 342830 }, { "epoch": 1.73, "learning_rate": 4.054921270767011e-05, "loss": 0.0053, "step": 342840 }, { "epoch": 1.73, "learning_rate": 4.05416450146561e-05, "loss": 0.0053, "step": 342850 }, { "epoch": 1.73, "learning_rate": 4.0534077321642085e-05, "loss": 0.0059, "step": 342860 }, { "epoch": 1.73, "learning_rate": 4.0526509628628074e-05, "loss": 0.0048, "step": 342870 }, { "epoch": 1.73, "learning_rate": 4.051894193561407e-05, "loss": 0.0057, "step": 342880 }, { "epoch": 1.73, "learning_rate": 4.051137424260006e-05, "loss": 0.0048, "step": 342890 }, { "epoch": 1.73, "learning_rate": 4.0503806549586045e-05, "loss": 0.0066, "step": 342900 }, { "epoch": 1.73, "learning_rate": 4.049623885657203e-05, "loss": 0.0056, "step": 342910 }, { "epoch": 1.73, "learning_rate": 4.048867116355803e-05, "loss": 0.0063, "step": 342920 }, { "epoch": 1.73, "learning_rate": 4.0481103470544017e-05, "loss": 0.0047, "step": 342930 }, { "epoch": 1.73, "learning_rate": 4.0473535777530005e-05, "loss": 0.0053, "step": 342940 }, { "epoch": 1.73, "learning_rate": 4.046596808451599e-05, "loss": 0.0052, "step": 342950 }, { "epoch": 1.73, "learning_rate": 4.045840039150199e-05, "loss": 0.0072, "step": 342960 }, { "epoch": 1.73, "learning_rate": 4.0450832698487976e-05, "loss": 0.0061, "step": 342970 }, { "epoch": 1.73, "learning_rate": 4.044326500547396e-05, "loss": 0.0084, "step": 342980 }, { "epoch": 1.73, "learning_rate": 4.0435697312459946e-05, "loss": 0.0058, "step": 342990 }, { "epoch": 1.73, "learning_rate": 4.0428129619445934e-05, "loss": 0.005, "step": 343000 }, { "epoch": 1.73, "eval_cer": 0.9144333808503969, "eval_loss": 0.00461353175342083, "eval_runtime": 116.7176, "eval_samples_per_second": 17.135, "eval_steps_per_second": 4.284, "step": 343000 }, { "epoch": 1.73, "learning_rate": 4.042056192643193e-05, "loss": 0.0097, "step": 343010 }, { "epoch": 1.73, "learning_rate": 4.041299423341792e-05, "loss": 0.0053, "step": 343020 }, { "epoch": 1.73, "learning_rate": 4.0405426540403906e-05, "loss": 0.0051, "step": 343030 }, { "epoch": 1.73, "learning_rate": 4.0397858847389894e-05, "loss": 0.0072, "step": 343040 }, { "epoch": 1.73, "learning_rate": 4.039029115437589e-05, "loss": 0.0068, "step": 343050 }, { "epoch": 1.73, "learning_rate": 4.038272346136188e-05, "loss": 0.0061, "step": 343060 }, { "epoch": 1.73, "learning_rate": 4.0375155768347865e-05, "loss": 0.0049, "step": 343070 }, { "epoch": 1.73, "learning_rate": 4.0367588075333853e-05, "loss": 0.0053, "step": 343080 }, { "epoch": 1.73, "learning_rate": 4.036002038231985e-05, "loss": 0.0069, "step": 343090 }, { "epoch": 1.73, "learning_rate": 4.0352452689305837e-05, "loss": 0.0059, "step": 343100 }, { "epoch": 1.73, "learning_rate": 4.0344884996291825e-05, "loss": 0.0052, "step": 343110 }, { "epoch": 1.73, "learning_rate": 4.033731730327781e-05, "loss": 0.0053, "step": 343120 }, { "epoch": 1.73, "learning_rate": 4.032974961026381e-05, "loss": 0.0062, "step": 343130 }, { "epoch": 1.73, "learning_rate": 4.0322181917249796e-05, "loss": 0.0082, "step": 343140 }, { "epoch": 1.73, "learning_rate": 4.0314614224235784e-05, "loss": 0.0063, "step": 343150 }, { "epoch": 1.73, "learning_rate": 4.030704653122177e-05, "loss": 0.0066, "step": 343160 }, { "epoch": 1.73, "learning_rate": 4.029947883820777e-05, "loss": 0.0068, "step": 343170 }, { "epoch": 1.73, "learning_rate": 4.0291911145193756e-05, "loss": 0.0046, "step": 343180 }, { "epoch": 1.73, "learning_rate": 4.0284343452179744e-05, "loss": 0.0071, "step": 343190 }, { "epoch": 1.73, "learning_rate": 4.027677575916574e-05, "loss": 0.0074, "step": 343200 }, { "epoch": 1.73, "learning_rate": 4.026920806615173e-05, "loss": 0.0063, "step": 343210 }, { "epoch": 1.73, "learning_rate": 4.0261640373137716e-05, "loss": 0.0068, "step": 343220 }, { "epoch": 1.73, "learning_rate": 4.0254072680123704e-05, "loss": 0.0082, "step": 343230 }, { "epoch": 1.73, "learning_rate": 4.02465049871097e-05, "loss": 0.0053, "step": 343240 }, { "epoch": 1.73, "learning_rate": 4.023893729409569e-05, "loss": 0.0062, "step": 343250 }, { "epoch": 1.73, "learning_rate": 4.0231369601081675e-05, "loss": 0.0057, "step": 343260 }, { "epoch": 1.73, "learning_rate": 4.0223801908067663e-05, "loss": 0.0064, "step": 343270 }, { "epoch": 1.73, "learning_rate": 4.021623421505366e-05, "loss": 0.0058, "step": 343280 }, { "epoch": 1.73, "learning_rate": 4.020866652203964e-05, "loss": 0.0077, "step": 343290 }, { "epoch": 1.73, "learning_rate": 4.020109882902563e-05, "loss": 0.0051, "step": 343300 }, { "epoch": 1.73, "learning_rate": 4.0193531136011616e-05, "loss": 0.006, "step": 343310 }, { "epoch": 1.73, "learning_rate": 4.0185963442997605e-05, "loss": 0.0057, "step": 343320 }, { "epoch": 1.73, "learning_rate": 4.01783957499836e-05, "loss": 0.0051, "step": 343330 }, { "epoch": 1.73, "learning_rate": 4.017082805696959e-05, "loss": 0.0068, "step": 343340 }, { "epoch": 1.73, "learning_rate": 4.0163260363955576e-05, "loss": 0.0071, "step": 343350 }, { "epoch": 1.73, "learning_rate": 4.0155692670941564e-05, "loss": 0.0065, "step": 343360 }, { "epoch": 1.73, "learning_rate": 4.014812497792756e-05, "loss": 0.0055, "step": 343370 }, { "epoch": 1.73, "learning_rate": 4.014055728491355e-05, "loss": 0.0046, "step": 343380 }, { "epoch": 1.73, "learning_rate": 4.0132989591899536e-05, "loss": 0.0059, "step": 343390 }, { "epoch": 1.73, "learning_rate": 4.0125421898885524e-05, "loss": 0.0051, "step": 343400 }, { "epoch": 1.73, "learning_rate": 4.011785420587152e-05, "loss": 0.0074, "step": 343410 }, { "epoch": 1.73, "learning_rate": 4.011028651285751e-05, "loss": 0.0082, "step": 343420 }, { "epoch": 1.73, "learning_rate": 4.0102718819843495e-05, "loss": 0.0094, "step": 343430 }, { "epoch": 1.73, "learning_rate": 4.0095151126829483e-05, "loss": 0.0072, "step": 343440 }, { "epoch": 1.73, "learning_rate": 4.008758343381548e-05, "loss": 0.0063, "step": 343450 }, { "epoch": 1.73, "learning_rate": 4.008001574080147e-05, "loss": 0.0069, "step": 343460 }, { "epoch": 1.73, "learning_rate": 4.0072448047787455e-05, "loss": 0.0055, "step": 343470 }, { "epoch": 1.73, "learning_rate": 4.006488035477344e-05, "loss": 0.0058, "step": 343480 }, { "epoch": 1.73, "learning_rate": 4.005731266175944e-05, "loss": 0.0049, "step": 343490 }, { "epoch": 1.73, "learning_rate": 4.0049744968745426e-05, "loss": 0.0045, "step": 343500 }, { "epoch": 1.73, "learning_rate": 4.0042177275731415e-05, "loss": 0.0066, "step": 343510 }, { "epoch": 1.73, "learning_rate": 4.00346095827174e-05, "loss": 0.0058, "step": 343520 }, { "epoch": 1.73, "learning_rate": 4.00270418897034e-05, "loss": 0.007, "step": 343530 }, { "epoch": 1.73, "learning_rate": 4.0019474196689386e-05, "loss": 0.0057, "step": 343540 }, { "epoch": 1.73, "learning_rate": 4.0011906503675374e-05, "loss": 0.0053, "step": 343550 }, { "epoch": 1.73, "learning_rate": 4.000433881066136e-05, "loss": 0.0064, "step": 343560 }, { "epoch": 1.73, "learning_rate": 3.999677111764736e-05, "loss": 0.0071, "step": 343570 }, { "epoch": 1.73, "learning_rate": 3.9989203424633346e-05, "loss": 0.0059, "step": 343580 }, { "epoch": 1.73, "learning_rate": 3.9981635731619334e-05, "loss": 0.0073, "step": 343590 }, { "epoch": 1.73, "learning_rate": 3.997406803860532e-05, "loss": 0.0049, "step": 343600 }, { "epoch": 1.73, "learning_rate": 3.9966500345591304e-05, "loss": 0.009, "step": 343610 }, { "epoch": 1.73, "learning_rate": 3.99589326525773e-05, "loss": 0.0062, "step": 343620 }, { "epoch": 1.73, "learning_rate": 3.995136495956329e-05, "loss": 0.0051, "step": 343630 }, { "epoch": 1.73, "learning_rate": 3.9943797266549275e-05, "loss": 0.0065, "step": 343640 }, { "epoch": 1.73, "learning_rate": 3.993622957353527e-05, "loss": 0.0075, "step": 343650 }, { "epoch": 1.73, "learning_rate": 3.992866188052126e-05, "loss": 0.0078, "step": 343660 }, { "epoch": 1.73, "learning_rate": 3.9921094187507246e-05, "loss": 0.0067, "step": 343670 }, { "epoch": 1.73, "learning_rate": 3.9913526494493235e-05, "loss": 0.0072, "step": 343680 }, { "epoch": 1.73, "learning_rate": 3.990595880147923e-05, "loss": 0.0067, "step": 343690 }, { "epoch": 1.73, "learning_rate": 3.989839110846522e-05, "loss": 0.0054, "step": 343700 }, { "epoch": 1.73, "learning_rate": 3.9890823415451206e-05, "loss": 0.004, "step": 343710 }, { "epoch": 1.73, "learning_rate": 3.9883255722437194e-05, "loss": 0.0059, "step": 343720 }, { "epoch": 1.73, "learning_rate": 3.987568802942319e-05, "loss": 0.0056, "step": 343730 }, { "epoch": 1.73, "learning_rate": 3.986812033640918e-05, "loss": 0.009, "step": 343740 }, { "epoch": 1.73, "learning_rate": 3.9860552643395166e-05, "loss": 0.0057, "step": 343750 }, { "epoch": 1.73, "learning_rate": 3.9852984950381154e-05, "loss": 0.0057, "step": 343760 }, { "epoch": 1.73, "learning_rate": 3.984541725736715e-05, "loss": 0.0081, "step": 343770 }, { "epoch": 1.73, "learning_rate": 3.983784956435314e-05, "loss": 0.0077, "step": 343780 }, { "epoch": 1.73, "learning_rate": 3.9830281871339125e-05, "loss": 0.0064, "step": 343790 }, { "epoch": 1.73, "learning_rate": 3.9822714178325114e-05, "loss": 0.0055, "step": 343800 }, { "epoch": 1.73, "learning_rate": 3.981514648531111e-05, "loss": 0.0061, "step": 343810 }, { "epoch": 1.73, "learning_rate": 3.98075787922971e-05, "loss": 0.0097, "step": 343820 }, { "epoch": 1.73, "learning_rate": 3.9800011099283085e-05, "loss": 0.0053, "step": 343830 }, { "epoch": 1.73, "learning_rate": 3.979244340626907e-05, "loss": 0.0065, "step": 343840 }, { "epoch": 1.73, "learning_rate": 3.978487571325507e-05, "loss": 0.0078, "step": 343850 }, { "epoch": 1.73, "learning_rate": 3.9777308020241056e-05, "loss": 0.0046, "step": 343860 }, { "epoch": 1.73, "learning_rate": 3.9769740327227045e-05, "loss": 0.0046, "step": 343870 }, { "epoch": 1.73, "learning_rate": 3.976217263421303e-05, "loss": 0.0062, "step": 343880 }, { "epoch": 1.73, "learning_rate": 3.975460494119903e-05, "loss": 0.0072, "step": 343890 }, { "epoch": 1.74, "learning_rate": 3.9747037248185016e-05, "loss": 0.0063, "step": 343900 }, { "epoch": 1.74, "learning_rate": 3.9739469555171004e-05, "loss": 0.0057, "step": 343910 }, { "epoch": 1.74, "learning_rate": 3.9731901862156986e-05, "loss": 0.0048, "step": 343920 }, { "epoch": 1.74, "learning_rate": 3.9724334169142974e-05, "loss": 0.0049, "step": 343930 }, { "epoch": 1.74, "learning_rate": 3.971676647612897e-05, "loss": 0.0052, "step": 343940 }, { "epoch": 1.74, "learning_rate": 3.970919878311496e-05, "loss": 0.006, "step": 343950 }, { "epoch": 1.74, "learning_rate": 3.9701631090100945e-05, "loss": 0.0057, "step": 343960 }, { "epoch": 1.74, "learning_rate": 3.9694063397086934e-05, "loss": 0.0078, "step": 343970 }, { "epoch": 1.74, "learning_rate": 3.968649570407293e-05, "loss": 0.0077, "step": 343980 }, { "epoch": 1.74, "learning_rate": 3.967892801105892e-05, "loss": 0.0074, "step": 343990 }, { "epoch": 1.74, "learning_rate": 3.9671360318044905e-05, "loss": 0.004, "step": 344000 }, { "epoch": 1.74, "eval_cer": 0.9144217360968921, "eval_loss": 0.004634759854525328, "eval_runtime": 116.8176, "eval_samples_per_second": 17.121, "eval_steps_per_second": 4.28, "step": 344000 }, { "epoch": 1.74, "learning_rate": 3.966379262503089e-05, "loss": 0.0071, "step": 344010 }, { "epoch": 1.74, "learning_rate": 3.965622493201689e-05, "loss": 0.0069, "step": 344020 }, { "epoch": 1.74, "learning_rate": 3.9648657239002876e-05, "loss": 0.0049, "step": 344030 }, { "epoch": 1.74, "learning_rate": 3.9641089545988865e-05, "loss": 0.0071, "step": 344040 }, { "epoch": 1.74, "learning_rate": 3.963352185297485e-05, "loss": 0.0043, "step": 344050 }, { "epoch": 1.74, "learning_rate": 3.962595415996085e-05, "loss": 0.0085, "step": 344060 }, { "epoch": 1.74, "learning_rate": 3.9618386466946836e-05, "loss": 0.0061, "step": 344070 }, { "epoch": 1.74, "learning_rate": 3.9610818773932824e-05, "loss": 0.0047, "step": 344080 }, { "epoch": 1.74, "learning_rate": 3.960325108091881e-05, "loss": 0.0069, "step": 344090 }, { "epoch": 1.74, "learning_rate": 3.959568338790481e-05, "loss": 0.006, "step": 344100 }, { "epoch": 1.74, "learning_rate": 3.9588115694890796e-05, "loss": 0.008, "step": 344110 }, { "epoch": 1.74, "learning_rate": 3.9580548001876784e-05, "loss": 0.0061, "step": 344120 }, { "epoch": 1.74, "learning_rate": 3.957298030886277e-05, "loss": 0.0058, "step": 344130 }, { "epoch": 1.74, "learning_rate": 3.956541261584877e-05, "loss": 0.0058, "step": 344140 }, { "epoch": 1.74, "learning_rate": 3.9557844922834755e-05, "loss": 0.0065, "step": 344150 }, { "epoch": 1.74, "learning_rate": 3.9550277229820744e-05, "loss": 0.0053, "step": 344160 }, { "epoch": 1.74, "learning_rate": 3.954270953680674e-05, "loss": 0.005, "step": 344170 }, { "epoch": 1.74, "learning_rate": 3.953514184379273e-05, "loss": 0.0058, "step": 344180 }, { "epoch": 1.74, "learning_rate": 3.9527574150778715e-05, "loss": 0.0086, "step": 344190 }, { "epoch": 1.74, "learning_rate": 3.95200064577647e-05, "loss": 0.0051, "step": 344200 }, { "epoch": 1.74, "learning_rate": 3.95124387647507e-05, "loss": 0.0068, "step": 344210 }, { "epoch": 1.74, "learning_rate": 3.9504871071736687e-05, "loss": 0.008, "step": 344220 }, { "epoch": 1.74, "learning_rate": 3.949730337872267e-05, "loss": 0.0076, "step": 344230 }, { "epoch": 1.74, "learning_rate": 3.9489735685708656e-05, "loss": 0.0068, "step": 344240 }, { "epoch": 1.74, "learning_rate": 3.9482167992694644e-05, "loss": 0.0052, "step": 344250 }, { "epoch": 1.74, "learning_rate": 3.947460029968064e-05, "loss": 0.0058, "step": 344260 }, { "epoch": 1.74, "learning_rate": 3.946703260666663e-05, "loss": 0.0042, "step": 344270 }, { "epoch": 1.74, "learning_rate": 3.9459464913652616e-05, "loss": 0.0044, "step": 344280 }, { "epoch": 1.74, "learning_rate": 3.9451897220638604e-05, "loss": 0.0074, "step": 344290 }, { "epoch": 1.74, "learning_rate": 3.94443295276246e-05, "loss": 0.0056, "step": 344300 }, { "epoch": 1.74, "learning_rate": 3.943676183461059e-05, "loss": 0.0066, "step": 344310 }, { "epoch": 1.74, "learning_rate": 3.9429194141596575e-05, "loss": 0.0057, "step": 344320 }, { "epoch": 1.74, "learning_rate": 3.9421626448582564e-05, "loss": 0.0079, "step": 344330 }, { "epoch": 1.74, "learning_rate": 3.941405875556856e-05, "loss": 0.0056, "step": 344340 }, { "epoch": 1.74, "learning_rate": 3.940649106255455e-05, "loss": 0.0071, "step": 344350 }, { "epoch": 1.74, "learning_rate": 3.9398923369540535e-05, "loss": 0.0073, "step": 344360 }, { "epoch": 1.74, "learning_rate": 3.939135567652652e-05, "loss": 0.0046, "step": 344370 }, { "epoch": 1.74, "learning_rate": 3.938378798351252e-05, "loss": 0.0057, "step": 344380 }, { "epoch": 1.74, "learning_rate": 3.9376220290498507e-05, "loss": 0.0047, "step": 344390 }, { "epoch": 1.74, "learning_rate": 3.9368652597484495e-05, "loss": 0.0077, "step": 344400 }, { "epoch": 1.74, "learning_rate": 3.936108490447048e-05, "loss": 0.0065, "step": 344410 }, { "epoch": 1.74, "learning_rate": 3.935351721145648e-05, "loss": 0.0087, "step": 344420 }, { "epoch": 1.74, "learning_rate": 3.9345949518442466e-05, "loss": 0.0074, "step": 344430 }, { "epoch": 1.74, "learning_rate": 3.9338381825428454e-05, "loss": 0.0076, "step": 344440 }, { "epoch": 1.74, "learning_rate": 3.933081413241444e-05, "loss": 0.004, "step": 344450 }, { "epoch": 1.74, "learning_rate": 3.932324643940044e-05, "loss": 0.007, "step": 344460 }, { "epoch": 1.74, "learning_rate": 3.9315678746386426e-05, "loss": 0.0054, "step": 344470 }, { "epoch": 1.74, "learning_rate": 3.9308111053372414e-05, "loss": 0.0067, "step": 344480 }, { "epoch": 1.74, "learning_rate": 3.93005433603584e-05, "loss": 0.0064, "step": 344490 }, { "epoch": 1.74, "learning_rate": 3.92929756673444e-05, "loss": 0.0089, "step": 344500 }, { "epoch": 1.74, "learning_rate": 3.9285407974330386e-05, "loss": 0.0056, "step": 344510 }, { "epoch": 1.74, "learning_rate": 3.9277840281316374e-05, "loss": 0.0054, "step": 344520 }, { "epoch": 1.74, "learning_rate": 3.927027258830236e-05, "loss": 0.0081, "step": 344530 }, { "epoch": 1.74, "learning_rate": 3.926270489528836e-05, "loss": 0.0077, "step": 344540 }, { "epoch": 1.74, "learning_rate": 3.925513720227434e-05, "loss": 0.0066, "step": 344550 }, { "epoch": 1.74, "learning_rate": 3.924756950926033e-05, "loss": 0.0067, "step": 344560 }, { "epoch": 1.74, "learning_rate": 3.9240001816246315e-05, "loss": 0.0054, "step": 344570 }, { "epoch": 1.74, "learning_rate": 3.92324341232323e-05, "loss": 0.0057, "step": 344580 }, { "epoch": 1.74, "learning_rate": 3.92248664302183e-05, "loss": 0.0048, "step": 344590 }, { "epoch": 1.74, "learning_rate": 3.9217298737204286e-05, "loss": 0.0055, "step": 344600 }, { "epoch": 1.74, "learning_rate": 3.9209731044190274e-05, "loss": 0.0067, "step": 344610 }, { "epoch": 1.74, "learning_rate": 3.920216335117627e-05, "loss": 0.0039, "step": 344620 }, { "epoch": 1.74, "learning_rate": 3.919459565816226e-05, "loss": 0.0081, "step": 344630 }, { "epoch": 1.74, "learning_rate": 3.9187027965148246e-05, "loss": 0.0068, "step": 344640 }, { "epoch": 1.74, "learning_rate": 3.9179460272134234e-05, "loss": 0.0084, "step": 344650 }, { "epoch": 1.74, "learning_rate": 3.917189257912023e-05, "loss": 0.0059, "step": 344660 }, { "epoch": 1.74, "learning_rate": 3.916432488610622e-05, "loss": 0.0053, "step": 344670 }, { "epoch": 1.74, "learning_rate": 3.9156757193092206e-05, "loss": 0.0054, "step": 344680 }, { "epoch": 1.74, "learning_rate": 3.9149189500078194e-05, "loss": 0.0067, "step": 344690 }, { "epoch": 1.74, "learning_rate": 3.914162180706419e-05, "loss": 0.0059, "step": 344700 }, { "epoch": 1.74, "learning_rate": 3.913405411405018e-05, "loss": 0.0134, "step": 344710 }, { "epoch": 1.74, "learning_rate": 3.9126486421036165e-05, "loss": 0.0066, "step": 344720 }, { "epoch": 1.74, "learning_rate": 3.9118918728022153e-05, "loss": 0.0062, "step": 344730 }, { "epoch": 1.74, "learning_rate": 3.911135103500815e-05, "loss": 0.0071, "step": 344740 }, { "epoch": 1.74, "learning_rate": 3.910378334199414e-05, "loss": 0.006, "step": 344750 }, { "epoch": 1.74, "learning_rate": 3.9096215648980125e-05, "loss": 0.0063, "step": 344760 }, { "epoch": 1.74, "learning_rate": 3.908864795596611e-05, "loss": 0.0044, "step": 344770 }, { "epoch": 1.74, "learning_rate": 3.908108026295211e-05, "loss": 0.0082, "step": 344780 }, { "epoch": 1.74, "learning_rate": 3.9073512569938096e-05, "loss": 0.0064, "step": 344790 }, { "epoch": 1.74, "learning_rate": 3.9065944876924085e-05, "loss": 0.0052, "step": 344800 }, { "epoch": 1.74, "learning_rate": 3.905837718391007e-05, "loss": 0.0063, "step": 344810 }, { "epoch": 1.74, "learning_rate": 3.905080949089607e-05, "loss": 0.007, "step": 344820 }, { "epoch": 1.74, "learning_rate": 3.9043241797882056e-05, "loss": 0.0061, "step": 344830 }, { "epoch": 1.74, "learning_rate": 3.9035674104868044e-05, "loss": 0.0064, "step": 344840 }, { "epoch": 1.74, "learning_rate": 3.902810641185403e-05, "loss": 0.0058, "step": 344850 }, { "epoch": 1.74, "learning_rate": 3.9020538718840014e-05, "loss": 0.0058, "step": 344860 }, { "epoch": 1.74, "learning_rate": 3.901297102582601e-05, "loss": 0.0072, "step": 344870 }, { "epoch": 1.74, "learning_rate": 3.9005403332812e-05, "loss": 0.0099, "step": 344880 }, { "epoch": 1.74, "learning_rate": 3.8997835639797985e-05, "loss": 0.0063, "step": 344890 }, { "epoch": 1.74, "learning_rate": 3.8990267946783973e-05, "loss": 0.0065, "step": 344900 }, { "epoch": 1.74, "learning_rate": 3.898270025376997e-05, "loss": 0.0067, "step": 344910 }, { "epoch": 1.74, "learning_rate": 3.897513256075596e-05, "loss": 0.0049, "step": 344920 }, { "epoch": 1.74, "learning_rate": 3.8967564867741945e-05, "loss": 0.0058, "step": 344930 }, { "epoch": 1.74, "learning_rate": 3.895999717472793e-05, "loss": 0.0062, "step": 344940 }, { "epoch": 1.74, "learning_rate": 3.895242948171393e-05, "loss": 0.0068, "step": 344950 }, { "epoch": 1.74, "learning_rate": 3.8944861788699916e-05, "loss": 0.0059, "step": 344960 }, { "epoch": 1.74, "learning_rate": 3.8937294095685905e-05, "loss": 0.0075, "step": 344970 }, { "epoch": 1.74, "learning_rate": 3.892972640267189e-05, "loss": 0.0096, "step": 344980 }, { "epoch": 1.74, "learning_rate": 3.892215870965789e-05, "loss": 0.0054, "step": 344990 }, { "epoch": 1.74, "learning_rate": 3.8914591016643876e-05, "loss": 0.0079, "step": 345000 }, { "epoch": 1.74, "eval_cer": 0.9144159137201398, "eval_loss": 0.004668357782065868, "eval_runtime": 116.7577, "eval_samples_per_second": 17.129, "eval_steps_per_second": 4.282, "step": 345000 }, { "epoch": 1.74, "learning_rate": 3.8907023323629864e-05, "loss": 0.0054, "step": 345010 }, { "epoch": 1.74, "learning_rate": 3.889945563061585e-05, "loss": 0.0093, "step": 345020 }, { "epoch": 1.74, "learning_rate": 3.889188793760185e-05, "loss": 0.0057, "step": 345030 }, { "epoch": 1.74, "learning_rate": 3.8884320244587836e-05, "loss": 0.0052, "step": 345040 }, { "epoch": 1.74, "learning_rate": 3.8876752551573824e-05, "loss": 0.0057, "step": 345050 }, { "epoch": 1.74, "learning_rate": 3.886918485855981e-05, "loss": 0.0091, "step": 345060 }, { "epoch": 1.74, "learning_rate": 3.886161716554581e-05, "loss": 0.0057, "step": 345070 }, { "epoch": 1.74, "learning_rate": 3.8854049472531795e-05, "loss": 0.0076, "step": 345080 }, { "epoch": 1.74, "learning_rate": 3.8846481779517784e-05, "loss": 0.0075, "step": 345090 }, { "epoch": 1.74, "learning_rate": 3.883891408650377e-05, "loss": 0.005, "step": 345100 }, { "epoch": 1.74, "learning_rate": 3.883134639348977e-05, "loss": 0.0061, "step": 345110 }, { "epoch": 1.74, "learning_rate": 3.8823778700475755e-05, "loss": 0.0042, "step": 345120 }, { "epoch": 1.74, "learning_rate": 3.881621100746174e-05, "loss": 0.0061, "step": 345130 }, { "epoch": 1.74, "learning_rate": 3.880864331444774e-05, "loss": 0.0062, "step": 345140 }, { "epoch": 1.74, "learning_rate": 3.8801075621433726e-05, "loss": 0.0064, "step": 345150 }, { "epoch": 1.74, "learning_rate": 3.8793507928419715e-05, "loss": 0.0068, "step": 345160 }, { "epoch": 1.74, "learning_rate": 3.87859402354057e-05, "loss": 0.0053, "step": 345170 }, { "epoch": 1.74, "learning_rate": 3.8778372542391684e-05, "loss": 0.0078, "step": 345180 }, { "epoch": 1.74, "learning_rate": 3.877080484937768e-05, "loss": 0.0056, "step": 345190 }, { "epoch": 1.74, "learning_rate": 3.876323715636367e-05, "loss": 0.0088, "step": 345200 }, { "epoch": 1.74, "learning_rate": 3.8755669463349656e-05, "loss": 0.0048, "step": 345210 }, { "epoch": 1.74, "learning_rate": 3.8748101770335644e-05, "loss": 0.0066, "step": 345220 }, { "epoch": 1.74, "learning_rate": 3.874053407732164e-05, "loss": 0.0075, "step": 345230 }, { "epoch": 1.74, "learning_rate": 3.873296638430763e-05, "loss": 0.0082, "step": 345240 }, { "epoch": 1.74, "learning_rate": 3.8725398691293615e-05, "loss": 0.0077, "step": 345250 }, { "epoch": 1.74, "learning_rate": 3.8717830998279604e-05, "loss": 0.0069, "step": 345260 }, { "epoch": 1.74, "learning_rate": 3.87102633052656e-05, "loss": 0.0043, "step": 345270 }, { "epoch": 1.74, "learning_rate": 3.870269561225159e-05, "loss": 0.0068, "step": 345280 }, { "epoch": 1.74, "learning_rate": 3.8695127919237575e-05, "loss": 0.0066, "step": 345290 }, { "epoch": 1.74, "learning_rate": 3.868756022622356e-05, "loss": 0.0074, "step": 345300 }, { "epoch": 1.74, "learning_rate": 3.867999253320956e-05, "loss": 0.0054, "step": 345310 }, { "epoch": 1.74, "learning_rate": 3.8672424840195546e-05, "loss": 0.0057, "step": 345320 }, { "epoch": 1.74, "learning_rate": 3.8664857147181535e-05, "loss": 0.005, "step": 345330 }, { "epoch": 1.74, "learning_rate": 3.865728945416752e-05, "loss": 0.006, "step": 345340 }, { "epoch": 1.74, "learning_rate": 3.864972176115352e-05, "loss": 0.0061, "step": 345350 }, { "epoch": 1.74, "learning_rate": 3.8642154068139506e-05, "loss": 0.0063, "step": 345360 }, { "epoch": 1.74, "learning_rate": 3.8634586375125494e-05, "loss": 0.0065, "step": 345370 }, { "epoch": 1.74, "learning_rate": 3.862701868211148e-05, "loss": 0.0054, "step": 345380 }, { "epoch": 1.74, "learning_rate": 3.861945098909748e-05, "loss": 0.0048, "step": 345390 }, { "epoch": 1.74, "learning_rate": 3.8611883296083466e-05, "loss": 0.0046, "step": 345400 }, { "epoch": 1.74, "learning_rate": 3.8604315603069454e-05, "loss": 0.0056, "step": 345410 }, { "epoch": 1.74, "learning_rate": 3.859674791005544e-05, "loss": 0.0069, "step": 345420 }, { "epoch": 1.74, "learning_rate": 3.858918021704144e-05, "loss": 0.0073, "step": 345430 }, { "epoch": 1.74, "learning_rate": 3.8581612524027425e-05, "loss": 0.0071, "step": 345440 }, { "epoch": 1.74, "learning_rate": 3.8574044831013414e-05, "loss": 0.005, "step": 345450 }, { "epoch": 1.74, "learning_rate": 3.85664771379994e-05, "loss": 0.0052, "step": 345460 }, { "epoch": 1.74, "learning_rate": 3.85589094449854e-05, "loss": 0.0077, "step": 345470 }, { "epoch": 1.74, "learning_rate": 3.8551341751971385e-05, "loss": 0.0066, "step": 345480 }, { "epoch": 1.74, "learning_rate": 3.8543774058957366e-05, "loss": 0.0061, "step": 345490 }, { "epoch": 1.74, "learning_rate": 3.8536206365943355e-05, "loss": 0.0095, "step": 345500 }, { "epoch": 1.74, "learning_rate": 3.852863867292934e-05, "loss": 0.0059, "step": 345510 }, { "epoch": 1.74, "learning_rate": 3.852107097991534e-05, "loss": 0.007, "step": 345520 }, { "epoch": 1.74, "learning_rate": 3.8513503286901326e-05, "loss": 0.0054, "step": 345530 }, { "epoch": 1.74, "learning_rate": 3.8505935593887314e-05, "loss": 0.0059, "step": 345540 }, { "epoch": 1.74, "learning_rate": 3.84983679008733e-05, "loss": 0.006, "step": 345550 }, { "epoch": 1.74, "learning_rate": 3.84908002078593e-05, "loss": 0.0055, "step": 345560 }, { "epoch": 1.74, "learning_rate": 3.8483232514845286e-05, "loss": 0.0058, "step": 345570 }, { "epoch": 1.74, "learning_rate": 3.8475664821831274e-05, "loss": 0.006, "step": 345580 }, { "epoch": 1.74, "learning_rate": 3.846809712881727e-05, "loss": 0.0055, "step": 345590 }, { "epoch": 1.74, "learning_rate": 3.846052943580326e-05, "loss": 0.006, "step": 345600 }, { "epoch": 1.74, "learning_rate": 3.8452961742789245e-05, "loss": 0.0085, "step": 345610 }, { "epoch": 1.74, "learning_rate": 3.8445394049775234e-05, "loss": 0.007, "step": 345620 }, { "epoch": 1.74, "learning_rate": 3.843782635676123e-05, "loss": 0.0061, "step": 345630 }, { "epoch": 1.74, "learning_rate": 3.843025866374722e-05, "loss": 0.0053, "step": 345640 }, { "epoch": 1.74, "learning_rate": 3.8422690970733205e-05, "loss": 0.0087, "step": 345650 }, { "epoch": 1.74, "learning_rate": 3.841512327771919e-05, "loss": 0.0074, "step": 345660 }, { "epoch": 1.74, "learning_rate": 3.840755558470519e-05, "loss": 0.007, "step": 345670 }, { "epoch": 1.74, "learning_rate": 3.8399987891691177e-05, "loss": 0.0061, "step": 345680 }, { "epoch": 1.74, "learning_rate": 3.8392420198677165e-05, "loss": 0.0064, "step": 345690 }, { "epoch": 1.74, "learning_rate": 3.838485250566315e-05, "loss": 0.0063, "step": 345700 }, { "epoch": 1.74, "learning_rate": 3.837728481264915e-05, "loss": 0.0058, "step": 345710 }, { "epoch": 1.74, "learning_rate": 3.8369717119635136e-05, "loss": 0.0058, "step": 345720 }, { "epoch": 1.74, "learning_rate": 3.8362149426621124e-05, "loss": 0.0081, "step": 345730 }, { "epoch": 1.74, "learning_rate": 3.835458173360711e-05, "loss": 0.006, "step": 345740 }, { "epoch": 1.74, "learning_rate": 3.834701404059311e-05, "loss": 0.0068, "step": 345750 }, { "epoch": 1.74, "learning_rate": 3.8339446347579096e-05, "loss": 0.0095, "step": 345760 }, { "epoch": 1.74, "learning_rate": 3.8331878654565084e-05, "loss": 0.0067, "step": 345770 }, { "epoch": 1.74, "learning_rate": 3.832431096155107e-05, "loss": 0.0074, "step": 345780 }, { "epoch": 1.74, "learning_rate": 3.831674326853707e-05, "loss": 0.0081, "step": 345790 }, { "epoch": 1.74, "learning_rate": 3.8309175575523055e-05, "loss": 0.0062, "step": 345800 }, { "epoch": 1.74, "learning_rate": 3.830160788250904e-05, "loss": 0.0085, "step": 345810 }, { "epoch": 1.74, "learning_rate": 3.8294040189495025e-05, "loss": 0.008, "step": 345820 }, { "epoch": 1.74, "learning_rate": 3.828647249648101e-05, "loss": 0.0078, "step": 345830 }, { "epoch": 1.74, "learning_rate": 3.827890480346701e-05, "loss": 0.0052, "step": 345840 }, { "epoch": 1.74, "learning_rate": 3.8271337110452997e-05, "loss": 0.0059, "step": 345850 }, { "epoch": 1.74, "learning_rate": 3.8263769417438985e-05, "loss": 0.0075, "step": 345860 }, { "epoch": 1.74, "learning_rate": 3.825620172442497e-05, "loss": 0.0065, "step": 345870 }, { "epoch": 1.75, "learning_rate": 3.824863403141097e-05, "loss": 0.006, "step": 345880 }, { "epoch": 1.75, "learning_rate": 3.8241066338396956e-05, "loss": 0.0058, "step": 345890 }, { "epoch": 1.75, "learning_rate": 3.8233498645382944e-05, "loss": 0.0072, "step": 345900 }, { "epoch": 1.75, "learning_rate": 3.822593095236893e-05, "loss": 0.0054, "step": 345910 }, { "epoch": 1.75, "learning_rate": 3.821836325935493e-05, "loss": 0.0044, "step": 345920 }, { "epoch": 1.75, "learning_rate": 3.8210795566340916e-05, "loss": 0.0052, "step": 345930 }, { "epoch": 1.75, "learning_rate": 3.8203227873326904e-05, "loss": 0.0063, "step": 345940 }, { "epoch": 1.75, "learning_rate": 3.819566018031289e-05, "loss": 0.0081, "step": 345950 }, { "epoch": 1.75, "learning_rate": 3.818809248729889e-05, "loss": 0.0048, "step": 345960 }, { "epoch": 1.75, "learning_rate": 3.8180524794284876e-05, "loss": 0.0071, "step": 345970 }, { "epoch": 1.75, "learning_rate": 3.8172957101270864e-05, "loss": 0.0067, "step": 345980 }, { "epoch": 1.75, "learning_rate": 3.816538940825685e-05, "loss": 0.0069, "step": 345990 }, { "epoch": 1.75, "learning_rate": 3.815782171524285e-05, "loss": 0.0062, "step": 346000 }, { "epoch": 1.75, "eval_cer": 0.9144227064930175, "eval_loss": 0.004535060841590166, "eval_runtime": 116.7184, "eval_samples_per_second": 17.135, "eval_steps_per_second": 4.284, "step": 346000 }, { "epoch": 1.75, "learning_rate": 3.8150254022228835e-05, "loss": 0.0045, "step": 346010 }, { "epoch": 1.75, "learning_rate": 3.8142686329214823e-05, "loss": 0.0068, "step": 346020 }, { "epoch": 1.75, "learning_rate": 3.813511863620081e-05, "loss": 0.0056, "step": 346030 }, { "epoch": 1.75, "learning_rate": 3.812755094318681e-05, "loss": 0.0063, "step": 346040 }, { "epoch": 1.75, "learning_rate": 3.8119983250172795e-05, "loss": 0.0082, "step": 346050 }, { "epoch": 1.75, "learning_rate": 3.811241555715878e-05, "loss": 0.0056, "step": 346060 }, { "epoch": 1.75, "learning_rate": 3.810484786414477e-05, "loss": 0.006, "step": 346070 }, { "epoch": 1.75, "learning_rate": 3.8097280171130766e-05, "loss": 0.0068, "step": 346080 }, { "epoch": 1.75, "learning_rate": 3.8089712478116754e-05, "loss": 0.0063, "step": 346090 }, { "epoch": 1.75, "learning_rate": 3.808214478510274e-05, "loss": 0.0052, "step": 346100 }, { "epoch": 1.75, "learning_rate": 3.807457709208874e-05, "loss": 0.0067, "step": 346110 }, { "epoch": 1.75, "learning_rate": 3.806700939907472e-05, "loss": 0.0057, "step": 346120 }, { "epoch": 1.75, "learning_rate": 3.805944170606071e-05, "loss": 0.006, "step": 346130 }, { "epoch": 1.75, "learning_rate": 3.8051874013046696e-05, "loss": 0.0069, "step": 346140 }, { "epoch": 1.75, "learning_rate": 3.8044306320032684e-05, "loss": 0.0065, "step": 346150 }, { "epoch": 1.75, "learning_rate": 3.803673862701868e-05, "loss": 0.0046, "step": 346160 }, { "epoch": 1.75, "learning_rate": 3.802917093400467e-05, "loss": 0.0074, "step": 346170 }, { "epoch": 1.75, "learning_rate": 3.8021603240990655e-05, "loss": 0.0064, "step": 346180 }, { "epoch": 1.75, "learning_rate": 3.8014035547976643e-05, "loss": 0.0057, "step": 346190 }, { "epoch": 1.75, "learning_rate": 3.800646785496264e-05, "loss": 0.0058, "step": 346200 }, { "epoch": 1.75, "learning_rate": 3.799890016194863e-05, "loss": 0.0045, "step": 346210 }, { "epoch": 1.75, "learning_rate": 3.7991332468934615e-05, "loss": 0.0068, "step": 346220 }, { "epoch": 1.75, "learning_rate": 3.79837647759206e-05, "loss": 0.0056, "step": 346230 }, { "epoch": 1.75, "learning_rate": 3.79761970829066e-05, "loss": 0.0063, "step": 346240 }, { "epoch": 1.75, "learning_rate": 3.7968629389892586e-05, "loss": 0.006, "step": 346250 }, { "epoch": 1.75, "learning_rate": 3.7961061696878575e-05, "loss": 0.0075, "step": 346260 }, { "epoch": 1.75, "learning_rate": 3.795349400386456e-05, "loss": 0.006, "step": 346270 }, { "epoch": 1.75, "learning_rate": 3.794592631085056e-05, "loss": 0.0064, "step": 346280 }, { "epoch": 1.75, "learning_rate": 3.7938358617836546e-05, "loss": 0.0062, "step": 346290 }, { "epoch": 1.75, "learning_rate": 3.7930790924822534e-05, "loss": 0.0079, "step": 346300 }, { "epoch": 1.75, "learning_rate": 3.792322323180852e-05, "loss": 0.0078, "step": 346310 }, { "epoch": 1.75, "learning_rate": 3.791565553879452e-05, "loss": 0.0055, "step": 346320 }, { "epoch": 1.75, "learning_rate": 3.7908087845780506e-05, "loss": 0.0073, "step": 346330 }, { "epoch": 1.75, "learning_rate": 3.7900520152766494e-05, "loss": 0.0086, "step": 346340 }, { "epoch": 1.75, "learning_rate": 3.789295245975248e-05, "loss": 0.005, "step": 346350 }, { "epoch": 1.75, "learning_rate": 3.788538476673848e-05, "loss": 0.0055, "step": 346360 }, { "epoch": 1.75, "learning_rate": 3.7877817073724465e-05, "loss": 0.0074, "step": 346370 }, { "epoch": 1.75, "learning_rate": 3.7870249380710453e-05, "loss": 0.005, "step": 346380 }, { "epoch": 1.75, "learning_rate": 3.786268168769644e-05, "loss": 0.0048, "step": 346390 }, { "epoch": 1.75, "learning_rate": 3.785511399468244e-05, "loss": 0.0066, "step": 346400 }, { "epoch": 1.75, "learning_rate": 3.7847546301668425e-05, "loss": 0.0066, "step": 346410 }, { "epoch": 1.75, "learning_rate": 3.783997860865441e-05, "loss": 0.0054, "step": 346420 }, { "epoch": 1.75, "learning_rate": 3.7832410915640395e-05, "loss": 0.0075, "step": 346430 }, { "epoch": 1.75, "learning_rate": 3.782484322262638e-05, "loss": 0.0052, "step": 346440 }, { "epoch": 1.75, "learning_rate": 3.781727552961238e-05, "loss": 0.0071, "step": 346450 }, { "epoch": 1.75, "learning_rate": 3.7809707836598366e-05, "loss": 0.0061, "step": 346460 }, { "epoch": 1.75, "learning_rate": 3.7802140143584354e-05, "loss": 0.0063, "step": 346470 }, { "epoch": 1.75, "learning_rate": 3.779457245057034e-05, "loss": 0.0049, "step": 346480 }, { "epoch": 1.75, "learning_rate": 3.778700475755634e-05, "loss": 0.0053, "step": 346490 }, { "epoch": 1.75, "learning_rate": 3.7779437064542326e-05, "loss": 0.0065, "step": 346500 }, { "epoch": 1.75, "learning_rate": 3.7771869371528314e-05, "loss": 0.006, "step": 346510 }, { "epoch": 1.75, "learning_rate": 3.77643016785143e-05, "loss": 0.0049, "step": 346520 }, { "epoch": 1.75, "learning_rate": 3.77567339855003e-05, "loss": 0.0072, "step": 346530 }, { "epoch": 1.75, "learning_rate": 3.7749166292486285e-05, "loss": 0.0076, "step": 346540 }, { "epoch": 1.75, "learning_rate": 3.7741598599472274e-05, "loss": 0.0044, "step": 346550 }, { "epoch": 1.75, "learning_rate": 3.773403090645827e-05, "loss": 0.0061, "step": 346560 }, { "epoch": 1.75, "learning_rate": 3.772646321344426e-05, "loss": 0.0045, "step": 346570 }, { "epoch": 1.75, "learning_rate": 3.7718895520430245e-05, "loss": 0.0057, "step": 346580 }, { "epoch": 1.75, "learning_rate": 3.771132782741623e-05, "loss": 0.0055, "step": 346590 }, { "epoch": 1.75, "learning_rate": 3.770376013440223e-05, "loss": 0.0078, "step": 346600 }, { "epoch": 1.75, "learning_rate": 3.7696192441388216e-05, "loss": 0.0065, "step": 346610 }, { "epoch": 1.75, "learning_rate": 3.7688624748374205e-05, "loss": 0.0057, "step": 346620 }, { "epoch": 1.75, "learning_rate": 3.768105705536019e-05, "loss": 0.0061, "step": 346630 }, { "epoch": 1.75, "learning_rate": 3.767348936234619e-05, "loss": 0.0075, "step": 346640 }, { "epoch": 1.75, "learning_rate": 3.7665921669332176e-05, "loss": 0.0052, "step": 346650 }, { "epoch": 1.75, "learning_rate": 3.7658353976318164e-05, "loss": 0.006, "step": 346660 }, { "epoch": 1.75, "learning_rate": 3.765078628330415e-05, "loss": 0.0056, "step": 346670 }, { "epoch": 1.75, "learning_rate": 3.764321859029015e-05, "loss": 0.007, "step": 346680 }, { "epoch": 1.75, "learning_rate": 3.7635650897276136e-05, "loss": 0.0046, "step": 346690 }, { "epoch": 1.75, "learning_rate": 3.7628083204262124e-05, "loss": 0.0056, "step": 346700 }, { "epoch": 1.75, "learning_rate": 3.762051551124811e-05, "loss": 0.0077, "step": 346710 }, { "epoch": 1.75, "learning_rate": 3.761294781823411e-05, "loss": 0.0058, "step": 346720 }, { "epoch": 1.75, "learning_rate": 3.7605380125220095e-05, "loss": 0.0078, "step": 346730 }, { "epoch": 1.75, "learning_rate": 3.7597812432206084e-05, "loss": 0.009, "step": 346740 }, { "epoch": 1.75, "learning_rate": 3.7590244739192065e-05, "loss": 0.009, "step": 346750 }, { "epoch": 1.75, "learning_rate": 3.758267704617805e-05, "loss": 0.0087, "step": 346760 }, { "epoch": 1.75, "learning_rate": 3.757510935316405e-05, "loss": 0.0054, "step": 346770 }, { "epoch": 1.75, "learning_rate": 3.7567541660150036e-05, "loss": 0.0058, "step": 346780 }, { "epoch": 1.75, "learning_rate": 3.7559973967136025e-05, "loss": 0.0065, "step": 346790 }, { "epoch": 1.75, "learning_rate": 3.755240627412201e-05, "loss": 0.007, "step": 346800 }, { "epoch": 1.75, "learning_rate": 3.754483858110801e-05, "loss": 0.0063, "step": 346810 }, { "epoch": 1.75, "learning_rate": 3.7537270888093996e-05, "loss": 0.0052, "step": 346820 }, { "epoch": 1.75, "learning_rate": 3.7529703195079984e-05, "loss": 0.0088, "step": 346830 }, { "epoch": 1.75, "learning_rate": 3.752213550206597e-05, "loss": 0.0053, "step": 346840 }, { "epoch": 1.75, "learning_rate": 3.751456780905197e-05, "loss": 0.0047, "step": 346850 }, { "epoch": 1.75, "learning_rate": 3.7507000116037956e-05, "loss": 0.0074, "step": 346860 }, { "epoch": 1.75, "learning_rate": 3.7499432423023944e-05, "loss": 0.0058, "step": 346870 }, { "epoch": 1.75, "learning_rate": 3.749186473000993e-05, "loss": 0.0057, "step": 346880 }, { "epoch": 1.75, "learning_rate": 3.748429703699593e-05, "loss": 0.0068, "step": 346890 }, { "epoch": 1.75, "learning_rate": 3.7476729343981915e-05, "loss": 0.0081, "step": 346900 }, { "epoch": 1.75, "learning_rate": 3.7469161650967904e-05, "loss": 0.006, "step": 346910 }, { "epoch": 1.75, "learning_rate": 3.746159395795389e-05, "loss": 0.0073, "step": 346920 }, { "epoch": 1.75, "learning_rate": 3.745402626493989e-05, "loss": 0.0053, "step": 346930 }, { "epoch": 1.75, "learning_rate": 3.7446458571925875e-05, "loss": 0.0062, "step": 346940 }, { "epoch": 1.75, "learning_rate": 3.743889087891186e-05, "loss": 0.0063, "step": 346950 }, { "epoch": 1.75, "learning_rate": 3.743132318589785e-05, "loss": 0.0113, "step": 346960 }, { "epoch": 1.75, "learning_rate": 3.7423755492883846e-05, "loss": 0.0055, "step": 346970 }, { "epoch": 1.75, "learning_rate": 3.741618779986983e-05, "loss": 0.0074, "step": 346980 }, { "epoch": 1.75, "learning_rate": 3.740862010685582e-05, "loss": 0.0075, "step": 346990 }, { "epoch": 1.75, "learning_rate": 3.740105241384181e-05, "loss": 0.0079, "step": 347000 }, { "epoch": 1.75, "eval_cer": 0.9144304696620207, "eval_loss": 0.004600143525749445, "eval_runtime": 116.8017, "eval_samples_per_second": 17.123, "eval_steps_per_second": 4.281, "step": 347000 }, { "epoch": 1.75, "learning_rate": 3.73934847208278e-05, "loss": 0.0062, "step": 347010 }, { "epoch": 1.75, "learning_rate": 3.738591702781379e-05, "loss": 0.0065, "step": 347020 }, { "epoch": 1.75, "learning_rate": 3.737834933479978e-05, "loss": 0.0069, "step": 347030 }, { "epoch": 1.75, "learning_rate": 3.737078164178577e-05, "loss": 0.0059, "step": 347040 }, { "epoch": 1.75, "learning_rate": 3.736321394877176e-05, "loss": 0.0075, "step": 347050 }, { "epoch": 1.75, "learning_rate": 3.735564625575775e-05, "loss": 0.0058, "step": 347060 }, { "epoch": 1.75, "learning_rate": 3.734807856274374e-05, "loss": 0.005, "step": 347070 }, { "epoch": 1.75, "learning_rate": 3.734051086972973e-05, "loss": 0.0054, "step": 347080 }, { "epoch": 1.75, "learning_rate": 3.733294317671572e-05, "loss": 0.0065, "step": 347090 }, { "epoch": 1.75, "learning_rate": 3.732537548370171e-05, "loss": 0.006, "step": 347100 }, { "epoch": 1.75, "learning_rate": 3.73178077906877e-05, "loss": 0.0053, "step": 347110 }, { "epoch": 1.75, "learning_rate": 3.731024009767369e-05, "loss": 0.0061, "step": 347120 }, { "epoch": 1.75, "learning_rate": 3.730267240465968e-05, "loss": 0.0052, "step": 347130 }, { "epoch": 1.75, "learning_rate": 3.7295104711645667e-05, "loss": 0.0065, "step": 347140 }, { "epoch": 1.75, "learning_rate": 3.7287537018631655e-05, "loss": 0.0074, "step": 347150 }, { "epoch": 1.75, "learning_rate": 3.727996932561764e-05, "loss": 0.0094, "step": 347160 }, { "epoch": 1.75, "learning_rate": 3.727240163260364e-05, "loss": 0.0055, "step": 347170 }, { "epoch": 1.75, "learning_rate": 3.7264833939589626e-05, "loss": 0.0071, "step": 347180 }, { "epoch": 1.75, "learning_rate": 3.7257266246575614e-05, "loss": 0.0047, "step": 347190 }, { "epoch": 1.75, "learning_rate": 3.72496985535616e-05, "loss": 0.0053, "step": 347200 }, { "epoch": 1.75, "learning_rate": 3.72421308605476e-05, "loss": 0.0105, "step": 347210 }, { "epoch": 1.75, "learning_rate": 3.7234563167533586e-05, "loss": 0.0057, "step": 347220 }, { "epoch": 1.75, "learning_rate": 3.7226995474519574e-05, "loss": 0.0101, "step": 347230 }, { "epoch": 1.75, "learning_rate": 3.721942778150556e-05, "loss": 0.0075, "step": 347240 }, { "epoch": 1.75, "learning_rate": 3.721186008849156e-05, "loss": 0.0086, "step": 347250 }, { "epoch": 1.75, "learning_rate": 3.7204292395477545e-05, "loss": 0.0041, "step": 347260 }, { "epoch": 1.75, "learning_rate": 3.7196724702463534e-05, "loss": 0.0052, "step": 347270 }, { "epoch": 1.75, "learning_rate": 3.718915700944952e-05, "loss": 0.0081, "step": 347280 }, { "epoch": 1.75, "learning_rate": 3.718158931643552e-05, "loss": 0.0068, "step": 347290 }, { "epoch": 1.75, "learning_rate": 3.71740216234215e-05, "loss": 0.0076, "step": 347300 }, { "epoch": 1.75, "learning_rate": 3.716645393040749e-05, "loss": 0.007, "step": 347310 }, { "epoch": 1.75, "learning_rate": 3.715888623739348e-05, "loss": 0.0053, "step": 347320 }, { "epoch": 1.75, "learning_rate": 3.715131854437947e-05, "loss": 0.0055, "step": 347330 }, { "epoch": 1.75, "learning_rate": 3.714375085136546e-05, "loss": 0.0054, "step": 347340 }, { "epoch": 1.75, "learning_rate": 3.713618315835145e-05, "loss": 0.0044, "step": 347350 }, { "epoch": 1.75, "learning_rate": 3.712861546533744e-05, "loss": 0.0051, "step": 347360 }, { "epoch": 1.75, "learning_rate": 3.712104777232343e-05, "loss": 0.0054, "step": 347370 }, { "epoch": 1.75, "learning_rate": 3.711348007930942e-05, "loss": 0.012, "step": 347380 }, { "epoch": 1.75, "learning_rate": 3.710591238629541e-05, "loss": 0.0051, "step": 347390 }, { "epoch": 1.75, "learning_rate": 3.70983446932814e-05, "loss": 0.0054, "step": 347400 }, { "epoch": 1.75, "learning_rate": 3.709077700026739e-05, "loss": 0.005, "step": 347410 }, { "epoch": 1.75, "learning_rate": 3.708320930725338e-05, "loss": 0.0052, "step": 347420 }, { "epoch": 1.75, "learning_rate": 3.707564161423937e-05, "loss": 0.0039, "step": 347430 }, { "epoch": 1.75, "learning_rate": 3.706807392122536e-05, "loss": 0.0063, "step": 347440 }, { "epoch": 1.75, "learning_rate": 3.706050622821135e-05, "loss": 0.0048, "step": 347450 }, { "epoch": 1.75, "learning_rate": 3.705293853519734e-05, "loss": 0.0059, "step": 347460 }, { "epoch": 1.75, "learning_rate": 3.7045370842183325e-05, "loss": 0.0068, "step": 347470 }, { "epoch": 1.75, "learning_rate": 3.7037803149169313e-05, "loss": 0.0062, "step": 347480 }, { "epoch": 1.75, "learning_rate": 3.70302354561553e-05, "loss": 0.0056, "step": 347490 }, { "epoch": 1.75, "learning_rate": 3.70226677631413e-05, "loss": 0.0055, "step": 347500 }, { "epoch": 1.75, "learning_rate": 3.7015100070127285e-05, "loss": 0.0087, "step": 347510 }, { "epoch": 1.75, "learning_rate": 3.700753237711327e-05, "loss": 0.0067, "step": 347520 }, { "epoch": 1.75, "learning_rate": 3.699996468409927e-05, "loss": 0.0058, "step": 347530 }, { "epoch": 1.75, "learning_rate": 3.6992396991085256e-05, "loss": 0.0068, "step": 347540 }, { "epoch": 1.75, "learning_rate": 3.6984829298071244e-05, "loss": 0.0073, "step": 347550 }, { "epoch": 1.75, "learning_rate": 3.697726160505723e-05, "loss": 0.0046, "step": 347560 }, { "epoch": 1.75, "learning_rate": 3.696969391204323e-05, "loss": 0.0054, "step": 347570 }, { "epoch": 1.75, "learning_rate": 3.6962126219029216e-05, "loss": 0.0063, "step": 347580 }, { "epoch": 1.75, "learning_rate": 3.6954558526015204e-05, "loss": 0.0057, "step": 347590 }, { "epoch": 1.75, "learning_rate": 3.694699083300119e-05, "loss": 0.0049, "step": 347600 }, { "epoch": 1.75, "learning_rate": 3.693942313998718e-05, "loss": 0.0051, "step": 347610 }, { "epoch": 1.75, "learning_rate": 3.693185544697317e-05, "loss": 0.0057, "step": 347620 }, { "epoch": 1.75, "learning_rate": 3.692428775395916e-05, "loss": 0.0054, "step": 347630 }, { "epoch": 1.75, "learning_rate": 3.691672006094515e-05, "loss": 0.0059, "step": 347640 }, { "epoch": 1.75, "learning_rate": 3.690915236793114e-05, "loss": 0.0066, "step": 347650 }, { "epoch": 1.75, "learning_rate": 3.690158467491713e-05, "loss": 0.0049, "step": 347660 }, { "epoch": 1.75, "learning_rate": 3.689401698190312e-05, "loss": 0.0087, "step": 347670 }, { "epoch": 1.75, "learning_rate": 3.688644928888911e-05, "loss": 0.0101, "step": 347680 }, { "epoch": 1.75, "learning_rate": 3.68788815958751e-05, "loss": 0.0065, "step": 347690 }, { "epoch": 1.75, "learning_rate": 3.687131390286109e-05, "loss": 0.0083, "step": 347700 }, { "epoch": 1.75, "learning_rate": 3.6863746209847076e-05, "loss": 0.0049, "step": 347710 }, { "epoch": 1.75, "learning_rate": 3.685617851683307e-05, "loss": 0.0056, "step": 347720 }, { "epoch": 1.75, "learning_rate": 3.684861082381906e-05, "loss": 0.0087, "step": 347730 }, { "epoch": 1.75, "learning_rate": 3.684104313080505e-05, "loss": 0.0044, "step": 347740 }, { "epoch": 1.75, "learning_rate": 3.6833475437791036e-05, "loss": 0.006, "step": 347750 }, { "epoch": 1.75, "learning_rate": 3.682590774477703e-05, "loss": 0.0091, "step": 347760 }, { "epoch": 1.75, "learning_rate": 3.681834005176301e-05, "loss": 0.0048, "step": 347770 }, { "epoch": 1.75, "learning_rate": 3.681077235874901e-05, "loss": 0.0067, "step": 347780 }, { "epoch": 1.75, "learning_rate": 3.6803204665734996e-05, "loss": 0.0066, "step": 347790 }, { "epoch": 1.75, "learning_rate": 3.6795636972720984e-05, "loss": 0.0047, "step": 347800 }, { "epoch": 1.75, "learning_rate": 3.678806927970697e-05, "loss": 0.0043, "step": 347810 }, { "epoch": 1.75, "learning_rate": 3.678050158669297e-05, "loss": 0.006, "step": 347820 }, { "epoch": 1.75, "learning_rate": 3.6772933893678955e-05, "loss": 0.0074, "step": 347830 }, { "epoch": 1.75, "learning_rate": 3.6765366200664943e-05, "loss": 0.0063, "step": 347840 }, { "epoch": 1.75, "learning_rate": 3.675779850765093e-05, "loss": 0.0069, "step": 347850 }, { "epoch": 1.75, "learning_rate": 3.675023081463693e-05, "loss": 0.0062, "step": 347860 }, { "epoch": 1.76, "learning_rate": 3.6742663121622915e-05, "loss": 0.0044, "step": 347870 }, { "epoch": 1.76, "learning_rate": 3.67350954286089e-05, "loss": 0.0063, "step": 347880 }, { "epoch": 1.76, "learning_rate": 3.672752773559489e-05, "loss": 0.0053, "step": 347890 }, { "epoch": 1.76, "learning_rate": 3.6719960042580886e-05, "loss": 0.0053, "step": 347900 }, { "epoch": 1.76, "learning_rate": 3.6712392349566875e-05, "loss": 0.007, "step": 347910 }, { "epoch": 1.76, "learning_rate": 3.670482465655286e-05, "loss": 0.0066, "step": 347920 }, { "epoch": 1.76, "learning_rate": 3.669725696353885e-05, "loss": 0.0059, "step": 347930 }, { "epoch": 1.76, "learning_rate": 3.668968927052484e-05, "loss": 0.0073, "step": 347940 }, { "epoch": 1.76, "learning_rate": 3.668212157751083e-05, "loss": 0.0048, "step": 347950 }, { "epoch": 1.76, "learning_rate": 3.667455388449682e-05, "loss": 0.0055, "step": 347960 }, { "epoch": 1.76, "learning_rate": 3.666698619148281e-05, "loss": 0.0062, "step": 347970 }, { "epoch": 1.76, "learning_rate": 3.66594184984688e-05, "loss": 0.0037, "step": 347980 }, { "epoch": 1.76, "learning_rate": 3.665185080545479e-05, "loss": 0.0064, "step": 347990 }, { "epoch": 1.76, "learning_rate": 3.664428311244078e-05, "loss": 0.0056, "step": 348000 }, { "epoch": 1.76, "eval_cer": 0.9144324104542716, "eval_loss": 0.004651382099837065, "eval_runtime": 116.6456, "eval_samples_per_second": 17.146, "eval_steps_per_second": 4.286, "step": 348000 }, { "epoch": 1.76, "learning_rate": 3.663671541942677e-05, "loss": 0.0051, "step": 348010 }, { "epoch": 1.76, "learning_rate": 3.662914772641276e-05, "loss": 0.0062, "step": 348020 }, { "epoch": 1.76, "learning_rate": 3.662158003339875e-05, "loss": 0.0045, "step": 348030 }, { "epoch": 1.76, "learning_rate": 3.661401234038474e-05, "loss": 0.0053, "step": 348040 }, { "epoch": 1.76, "learning_rate": 3.660644464737073e-05, "loss": 0.0071, "step": 348050 }, { "epoch": 1.76, "learning_rate": 3.659887695435672e-05, "loss": 0.0084, "step": 348060 }, { "epoch": 1.76, "learning_rate": 3.6591309261342706e-05, "loss": 0.0073, "step": 348070 }, { "epoch": 1.76, "learning_rate": 3.6583741568328695e-05, "loss": 0.0064, "step": 348080 }, { "epoch": 1.76, "learning_rate": 3.657617387531468e-05, "loss": 0.0076, "step": 348090 }, { "epoch": 1.76, "learning_rate": 3.656860618230068e-05, "loss": 0.006, "step": 348100 }, { "epoch": 1.76, "learning_rate": 3.6561038489286666e-05, "loss": 0.0061, "step": 348110 }, { "epoch": 1.76, "learning_rate": 3.6553470796272654e-05, "loss": 0.0059, "step": 348120 }, { "epoch": 1.76, "learning_rate": 3.654590310325864e-05, "loss": 0.0067, "step": 348130 }, { "epoch": 1.76, "learning_rate": 3.653833541024464e-05, "loss": 0.0065, "step": 348140 }, { "epoch": 1.76, "learning_rate": 3.6530767717230626e-05, "loss": 0.0071, "step": 348150 }, { "epoch": 1.76, "learning_rate": 3.6523200024216614e-05, "loss": 0.0065, "step": 348160 }, { "epoch": 1.76, "learning_rate": 3.65156323312026e-05, "loss": 0.0049, "step": 348170 }, { "epoch": 1.76, "learning_rate": 3.65080646381886e-05, "loss": 0.0052, "step": 348180 }, { "epoch": 1.76, "learning_rate": 3.6500496945174585e-05, "loss": 0.005, "step": 348190 }, { "epoch": 1.76, "learning_rate": 3.6492929252160574e-05, "loss": 0.0067, "step": 348200 }, { "epoch": 1.76, "learning_rate": 3.648536155914656e-05, "loss": 0.0047, "step": 348210 }, { "epoch": 1.76, "learning_rate": 3.647779386613256e-05, "loss": 0.0057, "step": 348220 }, { "epoch": 1.76, "learning_rate": 3.6470226173118545e-05, "loss": 0.0072, "step": 348230 }, { "epoch": 1.76, "learning_rate": 3.646265848010453e-05, "loss": 0.0074, "step": 348240 }, { "epoch": 1.76, "learning_rate": 3.645509078709052e-05, "loss": 0.0062, "step": 348250 }, { "epoch": 1.76, "learning_rate": 3.644752309407651e-05, "loss": 0.0088, "step": 348260 }, { "epoch": 1.76, "learning_rate": 3.64399554010625e-05, "loss": 0.005, "step": 348270 }, { "epoch": 1.76, "learning_rate": 3.643238770804849e-05, "loss": 0.0068, "step": 348280 }, { "epoch": 1.76, "learning_rate": 3.642482001503448e-05, "loss": 0.008, "step": 348290 }, { "epoch": 1.76, "learning_rate": 3.641725232202047e-05, "loss": 0.0054, "step": 348300 }, { "epoch": 1.76, "learning_rate": 3.640968462900646e-05, "loss": 0.0052, "step": 348310 }, { "epoch": 1.76, "learning_rate": 3.640211693599245e-05, "loss": 0.0045, "step": 348320 }, { "epoch": 1.76, "learning_rate": 3.639454924297844e-05, "loss": 0.0062, "step": 348330 }, { "epoch": 1.76, "learning_rate": 3.638698154996443e-05, "loss": 0.0066, "step": 348340 }, { "epoch": 1.76, "learning_rate": 3.637941385695042e-05, "loss": 0.0072, "step": 348350 }, { "epoch": 1.76, "learning_rate": 3.637184616393641e-05, "loss": 0.0066, "step": 348360 }, { "epoch": 1.76, "learning_rate": 3.63642784709224e-05, "loss": 0.0064, "step": 348370 }, { "epoch": 1.76, "learning_rate": 3.635671077790839e-05, "loss": 0.0044, "step": 348380 }, { "epoch": 1.76, "learning_rate": 3.634914308489438e-05, "loss": 0.0041, "step": 348390 }, { "epoch": 1.76, "learning_rate": 3.6341575391880365e-05, "loss": 0.0069, "step": 348400 }, { "epoch": 1.76, "learning_rate": 3.633400769886635e-05, "loss": 0.0063, "step": 348410 }, { "epoch": 1.76, "learning_rate": 3.632644000585234e-05, "loss": 0.0091, "step": 348420 }, { "epoch": 1.76, "learning_rate": 3.6318872312838336e-05, "loss": 0.0045, "step": 348430 }, { "epoch": 1.76, "learning_rate": 3.6311304619824325e-05, "loss": 0.0057, "step": 348440 }, { "epoch": 1.76, "learning_rate": 3.630373692681031e-05, "loss": 0.0059, "step": 348450 }, { "epoch": 1.76, "learning_rate": 3.62961692337963e-05, "loss": 0.0113, "step": 348460 }, { "epoch": 1.76, "learning_rate": 3.6288601540782296e-05, "loss": 0.008, "step": 348470 }, { "epoch": 1.76, "learning_rate": 3.6281033847768284e-05, "loss": 0.0051, "step": 348480 }, { "epoch": 1.76, "learning_rate": 3.627346615475427e-05, "loss": 0.0062, "step": 348490 }, { "epoch": 1.76, "learning_rate": 3.626589846174027e-05, "loss": 0.0041, "step": 348500 }, { "epoch": 1.76, "learning_rate": 3.6258330768726256e-05, "loss": 0.0054, "step": 348510 }, { "epoch": 1.76, "learning_rate": 3.6250763075712244e-05, "loss": 0.0074, "step": 348520 }, { "epoch": 1.76, "learning_rate": 3.624319538269823e-05, "loss": 0.0054, "step": 348530 }, { "epoch": 1.76, "learning_rate": 3.623562768968423e-05, "loss": 0.0067, "step": 348540 }, { "epoch": 1.76, "learning_rate": 3.6228059996670215e-05, "loss": 0.0054, "step": 348550 }, { "epoch": 1.76, "learning_rate": 3.62204923036562e-05, "loss": 0.006, "step": 348560 }, { "epoch": 1.76, "learning_rate": 3.621292461064219e-05, "loss": 0.0057, "step": 348570 }, { "epoch": 1.76, "learning_rate": 3.620535691762818e-05, "loss": 0.0062, "step": 348580 }, { "epoch": 1.76, "learning_rate": 3.619778922461417e-05, "loss": 0.0042, "step": 348590 }, { "epoch": 1.76, "learning_rate": 3.6190221531600157e-05, "loss": 0.0101, "step": 348600 }, { "epoch": 1.76, "learning_rate": 3.618265383858615e-05, "loss": 0.0049, "step": 348610 }, { "epoch": 1.76, "learning_rate": 3.617508614557214e-05, "loss": 0.0036, "step": 348620 }, { "epoch": 1.76, "learning_rate": 3.616751845255813e-05, "loss": 0.0084, "step": 348630 }, { "epoch": 1.76, "learning_rate": 3.6159950759544116e-05, "loss": 0.0058, "step": 348640 }, { "epoch": 1.76, "learning_rate": 3.615238306653011e-05, "loss": 0.0055, "step": 348650 }, { "epoch": 1.76, "learning_rate": 3.61448153735161e-05, "loss": 0.0067, "step": 348660 }, { "epoch": 1.76, "learning_rate": 3.613724768050209e-05, "loss": 0.0059, "step": 348670 }, { "epoch": 1.76, "learning_rate": 3.6129679987488076e-05, "loss": 0.0082, "step": 348680 }, { "epoch": 1.76, "learning_rate": 3.612211229447407e-05, "loss": 0.0046, "step": 348690 }, { "epoch": 1.76, "learning_rate": 3.611454460146006e-05, "loss": 0.0054, "step": 348700 }, { "epoch": 1.76, "learning_rate": 3.610697690844605e-05, "loss": 0.0062, "step": 348710 }, { "epoch": 1.76, "learning_rate": 3.6099409215432035e-05, "loss": 0.0056, "step": 348720 }, { "epoch": 1.76, "learning_rate": 3.6091841522418024e-05, "loss": 0.0083, "step": 348730 }, { "epoch": 1.76, "learning_rate": 3.608427382940401e-05, "loss": 0.0051, "step": 348740 }, { "epoch": 1.76, "learning_rate": 3.607670613639001e-05, "loss": 0.0064, "step": 348750 }, { "epoch": 1.76, "learning_rate": 3.6069138443375995e-05, "loss": 0.0074, "step": 348760 }, { "epoch": 1.76, "learning_rate": 3.606157075036198e-05, "loss": 0.0064, "step": 348770 }, { "epoch": 1.76, "learning_rate": 3.605400305734797e-05, "loss": 0.0091, "step": 348780 }, { "epoch": 1.76, "learning_rate": 3.6046435364333967e-05, "loss": 0.0059, "step": 348790 }, { "epoch": 1.76, "learning_rate": 3.6038867671319955e-05, "loss": 0.0053, "step": 348800 }, { "epoch": 1.76, "learning_rate": 3.603129997830594e-05, "loss": 0.0054, "step": 348810 }, { "epoch": 1.76, "learning_rate": 3.602373228529193e-05, "loss": 0.005, "step": 348820 }, { "epoch": 1.76, "learning_rate": 3.6016164592277926e-05, "loss": 0.0072, "step": 348830 }, { "epoch": 1.76, "learning_rate": 3.6008596899263914e-05, "loss": 0.005, "step": 348840 }, { "epoch": 1.76, "learning_rate": 3.60010292062499e-05, "loss": 0.0062, "step": 348850 }, { "epoch": 1.76, "learning_rate": 3.599346151323589e-05, "loss": 0.0082, "step": 348860 }, { "epoch": 1.76, "learning_rate": 3.598589382022188e-05, "loss": 0.0085, "step": 348870 }, { "epoch": 1.76, "learning_rate": 3.597832612720787e-05, "loss": 0.0054, "step": 348880 }, { "epoch": 1.76, "learning_rate": 3.597075843419386e-05, "loss": 0.0048, "step": 348890 }, { "epoch": 1.76, "learning_rate": 3.596319074117985e-05, "loss": 0.0046, "step": 348900 }, { "epoch": 1.76, "learning_rate": 3.595562304816584e-05, "loss": 0.0062, "step": 348910 }, { "epoch": 1.76, "learning_rate": 3.594805535515183e-05, "loss": 0.0054, "step": 348920 }, { "epoch": 1.76, "learning_rate": 3.594048766213782e-05, "loss": 0.0078, "step": 348930 }, { "epoch": 1.76, "learning_rate": 3.593291996912381e-05, "loss": 0.0057, "step": 348940 }, { "epoch": 1.76, "learning_rate": 3.59253522761098e-05, "loss": 0.0057, "step": 348950 }, { "epoch": 1.76, "learning_rate": 3.591778458309579e-05, "loss": 0.0079, "step": 348960 }, { "epoch": 1.76, "learning_rate": 3.591021689008178e-05, "loss": 0.0054, "step": 348970 }, { "epoch": 1.76, "learning_rate": 3.590264919706777e-05, "loss": 0.0056, "step": 348980 }, { "epoch": 1.76, "learning_rate": 3.589508150405376e-05, "loss": 0.0069, "step": 348990 }, { "epoch": 1.76, "learning_rate": 3.5887513811039746e-05, "loss": 0.0054, "step": 349000 }, { "epoch": 1.76, "eval_cer": 0.9144188249085159, "eval_loss": 0.004665224812924862, "eval_runtime": 116.662, "eval_samples_per_second": 17.144, "eval_steps_per_second": 4.286, "step": 349000 }, { "epoch": 1.76, "learning_rate": 3.587994611802574e-05, "loss": 0.0094, "step": 349010 }, { "epoch": 1.76, "learning_rate": 3.587237842501173e-05, "loss": 0.0063, "step": 349020 }, { "epoch": 1.76, "learning_rate": 3.586481073199772e-05, "loss": 0.006, "step": 349030 }, { "epoch": 1.76, "learning_rate": 3.5857243038983706e-05, "loss": 0.0056, "step": 349040 }, { "epoch": 1.76, "learning_rate": 3.5849675345969694e-05, "loss": 0.0042, "step": 349050 }, { "epoch": 1.76, "learning_rate": 3.584210765295568e-05, "loss": 0.0072, "step": 349060 }, { "epoch": 1.76, "learning_rate": 3.583453995994168e-05, "loss": 0.0063, "step": 349070 }, { "epoch": 1.76, "learning_rate": 3.5826972266927666e-05, "loss": 0.0065, "step": 349080 }, { "epoch": 1.76, "learning_rate": 3.5819404573913654e-05, "loss": 0.0065, "step": 349090 }, { "epoch": 1.76, "learning_rate": 3.581183688089964e-05, "loss": 0.0072, "step": 349100 }, { "epoch": 1.76, "learning_rate": 3.580426918788564e-05, "loss": 0.0069, "step": 349110 }, { "epoch": 1.76, "learning_rate": 3.5796701494871625e-05, "loss": 0.0074, "step": 349120 }, { "epoch": 1.76, "learning_rate": 3.5789133801857613e-05, "loss": 0.011, "step": 349130 }, { "epoch": 1.76, "learning_rate": 3.57815661088436e-05, "loss": 0.0094, "step": 349140 }, { "epoch": 1.76, "learning_rate": 3.57739984158296e-05, "loss": 0.0077, "step": 349150 }, { "epoch": 1.76, "learning_rate": 3.5766430722815585e-05, "loss": 0.0053, "step": 349160 }, { "epoch": 1.76, "learning_rate": 3.575886302980157e-05, "loss": 0.0089, "step": 349170 }, { "epoch": 1.76, "learning_rate": 3.575129533678756e-05, "loss": 0.005, "step": 349180 }, { "epoch": 1.76, "learning_rate": 3.574372764377355e-05, "loss": 0.0079, "step": 349190 }, { "epoch": 1.76, "learning_rate": 3.573615995075954e-05, "loss": 0.0064, "step": 349200 }, { "epoch": 1.76, "learning_rate": 3.572859225774553e-05, "loss": 0.0062, "step": 349210 }, { "epoch": 1.76, "learning_rate": 3.572102456473152e-05, "loss": 0.0062, "step": 349220 }, { "epoch": 1.76, "learning_rate": 3.571345687171751e-05, "loss": 0.0078, "step": 349230 }, { "epoch": 1.76, "learning_rate": 3.57058891787035e-05, "loss": 0.006, "step": 349240 }, { "epoch": 1.76, "learning_rate": 3.569832148568949e-05, "loss": 0.0065, "step": 349250 }, { "epoch": 1.76, "learning_rate": 3.569075379267548e-05, "loss": 0.006, "step": 349260 }, { "epoch": 1.76, "learning_rate": 3.568318609966147e-05, "loss": 0.0066, "step": 349270 }, { "epoch": 1.76, "learning_rate": 3.567561840664746e-05, "loss": 0.0059, "step": 349280 }, { "epoch": 1.76, "learning_rate": 3.566805071363345e-05, "loss": 0.0164, "step": 349290 }, { "epoch": 1.76, "learning_rate": 3.566048302061944e-05, "loss": 0.0047, "step": 349300 }, { "epoch": 1.76, "learning_rate": 3.565291532760543e-05, "loss": 0.0071, "step": 349310 }, { "epoch": 1.76, "learning_rate": 3.564534763459142e-05, "loss": 0.0049, "step": 349320 }, { "epoch": 1.76, "learning_rate": 3.563777994157741e-05, "loss": 0.0056, "step": 349330 }, { "epoch": 1.76, "learning_rate": 3.563021224856339e-05, "loss": 0.0062, "step": 349340 }, { "epoch": 1.76, "learning_rate": 3.562264455554938e-05, "loss": 0.0037, "step": 349350 }, { "epoch": 1.76, "learning_rate": 3.5615076862535376e-05, "loss": 0.0049, "step": 349360 }, { "epoch": 1.76, "learning_rate": 3.5607509169521365e-05, "loss": 0.0062, "step": 349370 }, { "epoch": 1.76, "learning_rate": 3.559994147650735e-05, "loss": 0.0054, "step": 349380 }, { "epoch": 1.76, "learning_rate": 3.559237378349334e-05, "loss": 0.0051, "step": 349390 }, { "epoch": 1.76, "learning_rate": 3.5584806090479336e-05, "loss": 0.0072, "step": 349400 }, { "epoch": 1.76, "learning_rate": 3.5577238397465324e-05, "loss": 0.0067, "step": 349410 }, { "epoch": 1.76, "learning_rate": 3.556967070445131e-05, "loss": 0.0044, "step": 349420 }, { "epoch": 1.76, "learning_rate": 3.55621030114373e-05, "loss": 0.0078, "step": 349430 }, { "epoch": 1.76, "learning_rate": 3.5554535318423296e-05, "loss": 0.0062, "step": 349440 }, { "epoch": 1.76, "learning_rate": 3.5546967625409284e-05, "loss": 0.0049, "step": 349450 }, { "epoch": 1.76, "learning_rate": 3.553939993239527e-05, "loss": 0.0062, "step": 349460 }, { "epoch": 1.76, "learning_rate": 3.553183223938127e-05, "loss": 0.0075, "step": 349470 }, { "epoch": 1.76, "learning_rate": 3.5524264546367255e-05, "loss": 0.0068, "step": 349480 }, { "epoch": 1.76, "learning_rate": 3.5516696853353244e-05, "loss": 0.0057, "step": 349490 }, { "epoch": 1.76, "learning_rate": 3.550912916033923e-05, "loss": 0.0046, "step": 349500 }, { "epoch": 1.76, "learning_rate": 3.550156146732522e-05, "loss": 0.0088, "step": 349510 }, { "epoch": 1.76, "learning_rate": 3.549399377431121e-05, "loss": 0.0046, "step": 349520 }, { "epoch": 1.76, "learning_rate": 3.5486426081297196e-05, "loss": 0.006, "step": 349530 }, { "epoch": 1.76, "learning_rate": 3.547885838828319e-05, "loss": 0.0052, "step": 349540 }, { "epoch": 1.76, "learning_rate": 3.547129069526918e-05, "loss": 0.0061, "step": 349550 }, { "epoch": 1.76, "learning_rate": 3.546372300225517e-05, "loss": 0.0055, "step": 349560 }, { "epoch": 1.76, "learning_rate": 3.5456155309241156e-05, "loss": 0.0058, "step": 349570 }, { "epoch": 1.76, "learning_rate": 3.544858761622715e-05, "loss": 0.0061, "step": 349580 }, { "epoch": 1.76, "learning_rate": 3.544101992321314e-05, "loss": 0.0054, "step": 349590 }, { "epoch": 1.76, "learning_rate": 3.543345223019913e-05, "loss": 0.0048, "step": 349600 }, { "epoch": 1.76, "learning_rate": 3.5425884537185116e-05, "loss": 0.0068, "step": 349610 }, { "epoch": 1.76, "learning_rate": 3.541831684417111e-05, "loss": 0.0054, "step": 349620 }, { "epoch": 1.76, "learning_rate": 3.54107491511571e-05, "loss": 0.0058, "step": 349630 }, { "epoch": 1.76, "learning_rate": 3.540318145814309e-05, "loss": 0.0053, "step": 349640 }, { "epoch": 1.76, "learning_rate": 3.5395613765129075e-05, "loss": 0.0084, "step": 349650 }, { "epoch": 1.76, "learning_rate": 3.5388046072115064e-05, "loss": 0.0062, "step": 349660 }, { "epoch": 1.76, "learning_rate": 3.538047837910105e-05, "loss": 0.0054, "step": 349670 }, { "epoch": 1.76, "learning_rate": 3.537291068608705e-05, "loss": 0.0074, "step": 349680 }, { "epoch": 1.76, "learning_rate": 3.5365342993073035e-05, "loss": 0.0071, "step": 349690 }, { "epoch": 1.76, "learning_rate": 3.535777530005902e-05, "loss": 0.0049, "step": 349700 }, { "epoch": 1.76, "learning_rate": 3.535020760704501e-05, "loss": 0.0072, "step": 349710 }, { "epoch": 1.76, "learning_rate": 3.5342639914031006e-05, "loss": 0.0076, "step": 349720 }, { "epoch": 1.76, "learning_rate": 3.5335072221016995e-05, "loss": 0.0053, "step": 349730 }, { "epoch": 1.76, "learning_rate": 3.532750452800298e-05, "loss": 0.0065, "step": 349740 }, { "epoch": 1.76, "learning_rate": 3.531993683498897e-05, "loss": 0.006, "step": 349750 }, { "epoch": 1.76, "learning_rate": 3.5312369141974966e-05, "loss": 0.0056, "step": 349760 }, { "epoch": 1.76, "learning_rate": 3.5304801448960954e-05, "loss": 0.0109, "step": 349770 }, { "epoch": 1.76, "learning_rate": 3.529723375594694e-05, "loss": 0.0068, "step": 349780 }, { "epoch": 1.76, "learning_rate": 3.528966606293293e-05, "loss": 0.0063, "step": 349790 }, { "epoch": 1.76, "learning_rate": 3.5282098369918926e-05, "loss": 0.0061, "step": 349800 }, { "epoch": 1.76, "learning_rate": 3.527453067690491e-05, "loss": 0.0064, "step": 349810 }, { "epoch": 1.76, "learning_rate": 3.52669629838909e-05, "loss": 0.0091, "step": 349820 }, { "epoch": 1.76, "learning_rate": 3.525939529087689e-05, "loss": 0.0051, "step": 349830 }, { "epoch": 1.76, "learning_rate": 3.525182759786288e-05, "loss": 0.0073, "step": 349840 }, { "epoch": 1.77, "learning_rate": 3.524425990484887e-05, "loss": 0.0059, "step": 349850 }, { "epoch": 1.77, "learning_rate": 3.523669221183486e-05, "loss": 0.0061, "step": 349860 }, { "epoch": 1.77, "learning_rate": 3.522912451882085e-05, "loss": 0.0062, "step": 349870 }, { "epoch": 1.77, "learning_rate": 3.522155682580684e-05, "loss": 0.0074, "step": 349880 }, { "epoch": 1.77, "learning_rate": 3.5213989132792826e-05, "loss": 0.0059, "step": 349890 }, { "epoch": 1.77, "learning_rate": 3.520642143977882e-05, "loss": 0.0059, "step": 349900 }, { "epoch": 1.77, "learning_rate": 3.519885374676481e-05, "loss": 0.0063, "step": 349910 }, { "epoch": 1.77, "learning_rate": 3.51912860537508e-05, "loss": 0.0047, "step": 349920 }, { "epoch": 1.77, "learning_rate": 3.5183718360736786e-05, "loss": 0.0072, "step": 349930 }, { "epoch": 1.77, "learning_rate": 3.517615066772278e-05, "loss": 0.0068, "step": 349940 }, { "epoch": 1.77, "learning_rate": 3.516858297470877e-05, "loss": 0.0076, "step": 349950 }, { "epoch": 1.77, "learning_rate": 3.516101528169476e-05, "loss": 0.0082, "step": 349960 }, { "epoch": 1.77, "learning_rate": 3.5153447588680746e-05, "loss": 0.0096, "step": 349970 }, { "epoch": 1.77, "learning_rate": 3.5145879895666734e-05, "loss": 0.0061, "step": 349980 }, { "epoch": 1.77, "learning_rate": 3.513831220265272e-05, "loss": 0.0044, "step": 349990 }, { "epoch": 1.77, "learning_rate": 3.513074450963872e-05, "loss": 0.0051, "step": 350000 }, { "epoch": 1.77, "eval_cer": 0.9144498775845288, "eval_loss": 0.004672383423894644, "eval_runtime": 116.7279, "eval_samples_per_second": 17.134, "eval_steps_per_second": 4.283, "step": 350000 }, { "epoch": 1.77, "learning_rate": 3.5123176816624705e-05, "loss": 0.0076, "step": 350010 }, { "epoch": 1.77, "learning_rate": 3.5115609123610694e-05, "loss": 0.0069, "step": 350020 }, { "epoch": 1.77, "learning_rate": 3.510804143059668e-05, "loss": 0.0082, "step": 350030 }, { "epoch": 1.77, "learning_rate": 3.510047373758268e-05, "loss": 0.0051, "step": 350040 }, { "epoch": 1.77, "learning_rate": 3.5092906044568665e-05, "loss": 0.0067, "step": 350050 }, { "epoch": 1.77, "learning_rate": 3.508533835155465e-05, "loss": 0.0053, "step": 350060 }, { "epoch": 1.77, "learning_rate": 3.507777065854064e-05, "loss": 0.0052, "step": 350070 }, { "epoch": 1.77, "learning_rate": 3.5070202965526637e-05, "loss": 0.0058, "step": 350080 }, { "epoch": 1.77, "learning_rate": 3.5062635272512625e-05, "loss": 0.0075, "step": 350090 }, { "epoch": 1.77, "learning_rate": 3.505506757949861e-05, "loss": 0.0058, "step": 350100 }, { "epoch": 1.77, "learning_rate": 3.50474998864846e-05, "loss": 0.0072, "step": 350110 }, { "epoch": 1.77, "learning_rate": 3.5039932193470596e-05, "loss": 0.0071, "step": 350120 }, { "epoch": 1.77, "learning_rate": 3.503236450045658e-05, "loss": 0.0058, "step": 350130 }, { "epoch": 1.77, "learning_rate": 3.5024796807442566e-05, "loss": 0.0053, "step": 350140 }, { "epoch": 1.77, "learning_rate": 3.501722911442856e-05, "loss": 0.0057, "step": 350150 }, { "epoch": 1.77, "learning_rate": 3.500966142141455e-05, "loss": 0.006, "step": 350160 }, { "epoch": 1.77, "learning_rate": 3.500209372840054e-05, "loss": 0.005, "step": 350170 }, { "epoch": 1.77, "learning_rate": 3.499452603538653e-05, "loss": 0.0094, "step": 350180 }, { "epoch": 1.77, "learning_rate": 3.498695834237252e-05, "loss": 0.0097, "step": 350190 }, { "epoch": 1.77, "learning_rate": 3.497939064935851e-05, "loss": 0.0058, "step": 350200 }, { "epoch": 1.77, "learning_rate": 3.49718229563445e-05, "loss": 0.0055, "step": 350210 }, { "epoch": 1.77, "learning_rate": 3.496425526333049e-05, "loss": 0.0064, "step": 350220 }, { "epoch": 1.77, "learning_rate": 3.495668757031648e-05, "loss": 0.0089, "step": 350230 }, { "epoch": 1.77, "learning_rate": 3.494911987730247e-05, "loss": 0.0043, "step": 350240 }, { "epoch": 1.77, "learning_rate": 3.4941552184288457e-05, "loss": 0.0054, "step": 350250 }, { "epoch": 1.77, "learning_rate": 3.493398449127445e-05, "loss": 0.0076, "step": 350260 }, { "epoch": 1.77, "learning_rate": 3.492641679826044e-05, "loss": 0.0048, "step": 350270 }, { "epoch": 1.77, "learning_rate": 3.491884910524642e-05, "loss": 0.007, "step": 350280 }, { "epoch": 1.77, "learning_rate": 3.4911281412232416e-05, "loss": 0.0082, "step": 350290 }, { "epoch": 1.77, "learning_rate": 3.4903713719218404e-05, "loss": 0.0069, "step": 350300 }, { "epoch": 1.77, "learning_rate": 3.489614602620439e-05, "loss": 0.0076, "step": 350310 }, { "epoch": 1.77, "learning_rate": 3.488857833319038e-05, "loss": 0.0048, "step": 350320 }, { "epoch": 1.77, "learning_rate": 3.4881010640176376e-05, "loss": 0.0054, "step": 350330 }, { "epoch": 1.77, "learning_rate": 3.4873442947162364e-05, "loss": 0.0047, "step": 350340 }, { "epoch": 1.77, "learning_rate": 3.486587525414835e-05, "loss": 0.0046, "step": 350350 }, { "epoch": 1.77, "learning_rate": 3.485830756113434e-05, "loss": 0.0062, "step": 350360 }, { "epoch": 1.77, "learning_rate": 3.4850739868120336e-05, "loss": 0.0062, "step": 350370 }, { "epoch": 1.77, "learning_rate": 3.4843172175106324e-05, "loss": 0.0056, "step": 350380 }, { "epoch": 1.77, "learning_rate": 3.483560448209231e-05, "loss": 0.0066, "step": 350390 }, { "epoch": 1.77, "learning_rate": 3.48280367890783e-05, "loss": 0.0049, "step": 350400 }, { "epoch": 1.77, "learning_rate": 3.4820469096064295e-05, "loss": 0.0058, "step": 350410 }, { "epoch": 1.77, "learning_rate": 3.4812901403050283e-05, "loss": 0.0108, "step": 350420 }, { "epoch": 1.77, "learning_rate": 3.480533371003627e-05, "loss": 0.0065, "step": 350430 }, { "epoch": 1.77, "learning_rate": 3.479776601702226e-05, "loss": 0.0055, "step": 350440 }, { "epoch": 1.77, "learning_rate": 3.479019832400825e-05, "loss": 0.0056, "step": 350450 }, { "epoch": 1.77, "learning_rate": 3.4782630630994236e-05, "loss": 0.0059, "step": 350460 }, { "epoch": 1.77, "learning_rate": 3.477506293798023e-05, "loss": 0.008, "step": 350470 }, { "epoch": 1.77, "learning_rate": 3.476749524496622e-05, "loss": 0.0048, "step": 350480 }, { "epoch": 1.77, "learning_rate": 3.475992755195221e-05, "loss": 0.0091, "step": 350490 }, { "epoch": 1.77, "learning_rate": 3.4752359858938196e-05, "loss": 0.0069, "step": 350500 }, { "epoch": 1.77, "learning_rate": 3.474479216592419e-05, "loss": 0.006, "step": 350510 }, { "epoch": 1.77, "learning_rate": 3.473722447291018e-05, "loss": 0.0078, "step": 350520 }, { "epoch": 1.77, "learning_rate": 3.472965677989617e-05, "loss": 0.0053, "step": 350530 }, { "epoch": 1.77, "learning_rate": 3.4722089086882156e-05, "loss": 0.0045, "step": 350540 }, { "epoch": 1.77, "learning_rate": 3.471452139386815e-05, "loss": 0.0074, "step": 350550 }, { "epoch": 1.77, "learning_rate": 3.470695370085414e-05, "loss": 0.0072, "step": 350560 }, { "epoch": 1.77, "learning_rate": 3.469938600784013e-05, "loss": 0.0062, "step": 350570 }, { "epoch": 1.77, "learning_rate": 3.4691818314826115e-05, "loss": 0.0072, "step": 350580 }, { "epoch": 1.77, "learning_rate": 3.468425062181211e-05, "loss": 0.0048, "step": 350590 }, { "epoch": 1.77, "learning_rate": 3.467668292879809e-05, "loss": 0.0071, "step": 350600 }, { "epoch": 1.77, "learning_rate": 3.466911523578409e-05, "loss": 0.0056, "step": 350610 }, { "epoch": 1.77, "learning_rate": 3.4661547542770075e-05, "loss": 0.0064, "step": 350620 }, { "epoch": 1.77, "learning_rate": 3.465397984975606e-05, "loss": 0.0064, "step": 350630 }, { "epoch": 1.77, "learning_rate": 3.464641215674205e-05, "loss": 0.007, "step": 350640 }, { "epoch": 1.77, "learning_rate": 3.4638844463728046e-05, "loss": 0.0062, "step": 350650 }, { "epoch": 1.77, "learning_rate": 3.4631276770714035e-05, "loss": 0.0057, "step": 350660 }, { "epoch": 1.77, "learning_rate": 3.462370907770002e-05, "loss": 0.0068, "step": 350670 }, { "epoch": 1.77, "learning_rate": 3.461614138468601e-05, "loss": 0.0061, "step": 350680 }, { "epoch": 1.77, "learning_rate": 3.4608573691672006e-05, "loss": 0.005, "step": 350690 }, { "epoch": 1.77, "learning_rate": 3.4601005998657994e-05, "loss": 0.0064, "step": 350700 }, { "epoch": 1.77, "learning_rate": 3.459343830564398e-05, "loss": 0.0048, "step": 350710 }, { "epoch": 1.77, "learning_rate": 3.458587061262997e-05, "loss": 0.0088, "step": 350720 }, { "epoch": 1.77, "learning_rate": 3.4578302919615966e-05, "loss": 0.0046, "step": 350730 }, { "epoch": 1.77, "learning_rate": 3.4570735226601954e-05, "loss": 0.0058, "step": 350740 }, { "epoch": 1.77, "learning_rate": 3.456316753358794e-05, "loss": 0.0047, "step": 350750 }, { "epoch": 1.77, "learning_rate": 3.455559984057393e-05, "loss": 0.0071, "step": 350760 }, { "epoch": 1.77, "learning_rate": 3.454803214755992e-05, "loss": 0.0062, "step": 350770 }, { "epoch": 1.77, "learning_rate": 3.454046445454591e-05, "loss": 0.0065, "step": 350780 }, { "epoch": 1.77, "learning_rate": 3.45328967615319e-05, "loss": 0.0097, "step": 350790 }, { "epoch": 1.77, "learning_rate": 3.452532906851789e-05, "loss": 0.0058, "step": 350800 }, { "epoch": 1.77, "learning_rate": 3.451776137550388e-05, "loss": 0.0065, "step": 350810 }, { "epoch": 1.77, "learning_rate": 3.4510193682489866e-05, "loss": 0.0065, "step": 350820 }, { "epoch": 1.77, "learning_rate": 3.450262598947586e-05, "loss": 0.0097, "step": 350830 }, { "epoch": 1.77, "learning_rate": 3.449505829646185e-05, "loss": 0.0063, "step": 350840 }, { "epoch": 1.77, "learning_rate": 3.448749060344784e-05, "loss": 0.0077, "step": 350850 }, { "epoch": 1.77, "learning_rate": 3.4479922910433826e-05, "loss": 0.0066, "step": 350860 }, { "epoch": 1.77, "learning_rate": 3.447235521741982e-05, "loss": 0.0061, "step": 350870 }, { "epoch": 1.77, "learning_rate": 3.446478752440581e-05, "loss": 0.006, "step": 350880 }, { "epoch": 1.77, "learning_rate": 3.44572198313918e-05, "loss": 0.0057, "step": 350890 }, { "epoch": 1.77, "learning_rate": 3.4449652138377786e-05, "loss": 0.0061, "step": 350900 }, { "epoch": 1.77, "learning_rate": 3.4442084445363774e-05, "loss": 0.0068, "step": 350910 }, { "epoch": 1.77, "learning_rate": 3.443451675234976e-05, "loss": 0.0059, "step": 350920 }, { "epoch": 1.77, "learning_rate": 3.442694905933576e-05, "loss": 0.0079, "step": 350930 }, { "epoch": 1.77, "learning_rate": 3.4419381366321745e-05, "loss": 0.0072, "step": 350940 }, { "epoch": 1.77, "learning_rate": 3.4411813673307734e-05, "loss": 0.0075, "step": 350950 }, { "epoch": 1.77, "learning_rate": 3.440424598029372e-05, "loss": 0.0074, "step": 350960 }, { "epoch": 1.77, "learning_rate": 3.439667828727972e-05, "loss": 0.0089, "step": 350970 }, { "epoch": 1.77, "learning_rate": 3.4389110594265705e-05, "loss": 0.006, "step": 350980 }, { "epoch": 1.77, "learning_rate": 3.438154290125169e-05, "loss": 0.0046, "step": 350990 }, { "epoch": 1.77, "learning_rate": 3.437397520823768e-05, "loss": 0.0077, "step": 351000 }, { "epoch": 1.77, "eval_cer": 0.9144362920387732, "eval_loss": 0.004640540108084679, "eval_runtime": 116.6521, "eval_samples_per_second": 17.145, "eval_steps_per_second": 4.286, "step": 351000 }, { "epoch": 1.77, "learning_rate": 3.4366407515223676e-05, "loss": 0.0048, "step": 351010 }, { "epoch": 1.77, "learning_rate": 3.4358839822209665e-05, "loss": 0.0067, "step": 351020 }, { "epoch": 1.77, "learning_rate": 3.435127212919565e-05, "loss": 0.0061, "step": 351030 }, { "epoch": 1.77, "learning_rate": 3.434370443618164e-05, "loss": 0.0076, "step": 351040 }, { "epoch": 1.77, "learning_rate": 3.4336136743167636e-05, "loss": 0.0064, "step": 351050 }, { "epoch": 1.77, "learning_rate": 3.4328569050153624e-05, "loss": 0.0058, "step": 351060 }, { "epoch": 1.77, "learning_rate": 3.4321001357139606e-05, "loss": 0.0062, "step": 351070 }, { "epoch": 1.77, "learning_rate": 3.43134336641256e-05, "loss": 0.005, "step": 351080 }, { "epoch": 1.77, "learning_rate": 3.430586597111159e-05, "loss": 0.006, "step": 351090 }, { "epoch": 1.77, "learning_rate": 3.429829827809758e-05, "loss": 0.0062, "step": 351100 }, { "epoch": 1.77, "learning_rate": 3.4290730585083565e-05, "loss": 0.0078, "step": 351110 }, { "epoch": 1.77, "learning_rate": 3.428316289206956e-05, "loss": 0.0064, "step": 351120 }, { "epoch": 1.77, "learning_rate": 3.427559519905555e-05, "loss": 0.0045, "step": 351130 }, { "epoch": 1.77, "learning_rate": 3.426802750604154e-05, "loss": 0.0068, "step": 351140 }, { "epoch": 1.77, "learning_rate": 3.426045981302753e-05, "loss": 0.0054, "step": 351150 }, { "epoch": 1.77, "learning_rate": 3.425289212001352e-05, "loss": 0.006, "step": 351160 }, { "epoch": 1.77, "learning_rate": 3.424532442699951e-05, "loss": 0.0046, "step": 351170 }, { "epoch": 1.77, "learning_rate": 3.4237756733985496e-05, "loss": 0.0049, "step": 351180 }, { "epoch": 1.77, "learning_rate": 3.423018904097149e-05, "loss": 0.006, "step": 351190 }, { "epoch": 1.77, "learning_rate": 3.422262134795748e-05, "loss": 0.0057, "step": 351200 }, { "epoch": 1.77, "learning_rate": 3.421505365494347e-05, "loss": 0.0058, "step": 351210 }, { "epoch": 1.77, "learning_rate": 3.4207485961929456e-05, "loss": 0.0075, "step": 351220 }, { "epoch": 1.77, "learning_rate": 3.4199918268915444e-05, "loss": 0.0091, "step": 351230 }, { "epoch": 1.77, "learning_rate": 3.419235057590143e-05, "loss": 0.0062, "step": 351240 }, { "epoch": 1.77, "learning_rate": 3.418478288288742e-05, "loss": 0.0051, "step": 351250 }, { "epoch": 1.77, "learning_rate": 3.4177215189873416e-05, "loss": 0.0049, "step": 351260 }, { "epoch": 1.77, "learning_rate": 3.4169647496859404e-05, "loss": 0.0065, "step": 351270 }, { "epoch": 1.77, "learning_rate": 3.416207980384539e-05, "loss": 0.006, "step": 351280 }, { "epoch": 1.77, "learning_rate": 3.415451211083138e-05, "loss": 0.0072, "step": 351290 }, { "epoch": 1.77, "learning_rate": 3.4146944417817375e-05, "loss": 0.0039, "step": 351300 }, { "epoch": 1.77, "learning_rate": 3.4139376724803364e-05, "loss": 0.0055, "step": 351310 }, { "epoch": 1.77, "learning_rate": 3.413180903178935e-05, "loss": 0.0059, "step": 351320 }, { "epoch": 1.77, "learning_rate": 3.412424133877534e-05, "loss": 0.006, "step": 351330 }, { "epoch": 1.77, "learning_rate": 3.4116673645761335e-05, "loss": 0.0073, "step": 351340 }, { "epoch": 1.77, "learning_rate": 3.410910595274732e-05, "loss": 0.0059, "step": 351350 }, { "epoch": 1.77, "learning_rate": 3.410153825973331e-05, "loss": 0.0052, "step": 351360 }, { "epoch": 1.77, "learning_rate": 3.40939705667193e-05, "loss": 0.0047, "step": 351370 }, { "epoch": 1.77, "learning_rate": 3.408640287370529e-05, "loss": 0.0061, "step": 351380 }, { "epoch": 1.77, "learning_rate": 3.4078835180691276e-05, "loss": 0.0064, "step": 351390 }, { "epoch": 1.77, "learning_rate": 3.407126748767727e-05, "loss": 0.0049, "step": 351400 }, { "epoch": 1.77, "learning_rate": 3.406369979466326e-05, "loss": 0.0059, "step": 351410 }, { "epoch": 1.77, "learning_rate": 3.405613210164925e-05, "loss": 0.0064, "step": 351420 }, { "epoch": 1.77, "learning_rate": 3.4048564408635236e-05, "loss": 0.0067, "step": 351430 }, { "epoch": 1.77, "learning_rate": 3.404099671562123e-05, "loss": 0.0066, "step": 351440 }, { "epoch": 1.77, "learning_rate": 3.403342902260722e-05, "loss": 0.0073, "step": 351450 }, { "epoch": 1.77, "learning_rate": 3.402586132959321e-05, "loss": 0.006, "step": 351460 }, { "epoch": 1.77, "learning_rate": 3.4018293636579195e-05, "loss": 0.0056, "step": 351470 }, { "epoch": 1.77, "learning_rate": 3.401072594356519e-05, "loss": 0.0053, "step": 351480 }, { "epoch": 1.77, "learning_rate": 3.400315825055118e-05, "loss": 0.0055, "step": 351490 }, { "epoch": 1.77, "learning_rate": 3.399559055753717e-05, "loss": 0.0057, "step": 351500 }, { "epoch": 1.77, "learning_rate": 3.3988022864523155e-05, "loss": 0.0054, "step": 351510 }, { "epoch": 1.77, "learning_rate": 3.398045517150915e-05, "loss": 0.0051, "step": 351520 }, { "epoch": 1.77, "learning_rate": 3.397288747849514e-05, "loss": 0.0158, "step": 351530 }, { "epoch": 1.77, "learning_rate": 3.3965319785481127e-05, "loss": 0.0091, "step": 351540 }, { "epoch": 1.77, "learning_rate": 3.3957752092467115e-05, "loss": 0.0065, "step": 351550 }, { "epoch": 1.77, "learning_rate": 3.39501843994531e-05, "loss": 0.0068, "step": 351560 }, { "epoch": 1.77, "learning_rate": 3.394261670643909e-05, "loss": 0.0058, "step": 351570 }, { "epoch": 1.77, "learning_rate": 3.3935049013425086e-05, "loss": 0.0058, "step": 351580 }, { "epoch": 1.77, "learning_rate": 3.3927481320411074e-05, "loss": 0.0045, "step": 351590 }, { "epoch": 1.77, "learning_rate": 3.391991362739706e-05, "loss": 0.0081, "step": 351600 }, { "epoch": 1.77, "learning_rate": 3.391234593438305e-05, "loss": 0.0047, "step": 351610 }, { "epoch": 1.77, "learning_rate": 3.3904778241369046e-05, "loss": 0.0045, "step": 351620 }, { "epoch": 1.77, "learning_rate": 3.3897210548355034e-05, "loss": 0.005, "step": 351630 }, { "epoch": 1.77, "learning_rate": 3.388964285534102e-05, "loss": 0.0061, "step": 351640 }, { "epoch": 1.77, "learning_rate": 3.388207516232701e-05, "loss": 0.0047, "step": 351650 }, { "epoch": 1.77, "learning_rate": 3.3874507469313005e-05, "loss": 0.0056, "step": 351660 }, { "epoch": 1.77, "learning_rate": 3.3866939776298994e-05, "loss": 0.0053, "step": 351670 }, { "epoch": 1.77, "learning_rate": 3.385937208328498e-05, "loss": 0.0084, "step": 351680 }, { "epoch": 1.77, "learning_rate": 3.385180439027097e-05, "loss": 0.0062, "step": 351690 }, { "epoch": 1.77, "learning_rate": 3.384423669725696e-05, "loss": 0.0038, "step": 351700 }, { "epoch": 1.77, "learning_rate": 3.3836669004242947e-05, "loss": 0.0053, "step": 351710 }, { "epoch": 1.77, "learning_rate": 3.382910131122894e-05, "loss": 0.0067, "step": 351720 }, { "epoch": 1.77, "learning_rate": 3.382153361821493e-05, "loss": 0.0062, "step": 351730 }, { "epoch": 1.77, "learning_rate": 3.381396592520092e-05, "loss": 0.0066, "step": 351740 }, { "epoch": 1.77, "learning_rate": 3.3806398232186906e-05, "loss": 0.0072, "step": 351750 }, { "epoch": 1.77, "learning_rate": 3.37988305391729e-05, "loss": 0.0048, "step": 351760 }, { "epoch": 1.77, "learning_rate": 3.379126284615889e-05, "loss": 0.0057, "step": 351770 }, { "epoch": 1.77, "learning_rate": 3.378369515314488e-05, "loss": 0.0052, "step": 351780 }, { "epoch": 1.77, "learning_rate": 3.3776127460130866e-05, "loss": 0.0088, "step": 351790 }, { "epoch": 1.77, "learning_rate": 3.376855976711686e-05, "loss": 0.0054, "step": 351800 }, { "epoch": 1.77, "learning_rate": 3.376099207410285e-05, "loss": 0.0057, "step": 351810 }, { "epoch": 1.77, "learning_rate": 3.375342438108884e-05, "loss": 0.0049, "step": 351820 }, { "epoch": 1.78, "learning_rate": 3.3745856688074826e-05, "loss": 0.0052, "step": 351830 }, { "epoch": 1.78, "learning_rate": 3.373828899506082e-05, "loss": 0.004, "step": 351840 }, { "epoch": 1.78, "learning_rate": 3.37307213020468e-05, "loss": 0.0054, "step": 351850 }, { "epoch": 1.78, "learning_rate": 3.37231536090328e-05, "loss": 0.0081, "step": 351860 }, { "epoch": 1.78, "learning_rate": 3.3715585916018785e-05, "loss": 0.0075, "step": 351870 }, { "epoch": 1.78, "learning_rate": 3.3708018223004773e-05, "loss": 0.0047, "step": 351880 }, { "epoch": 1.78, "learning_rate": 3.370045052999076e-05, "loss": 0.0107, "step": 351890 }, { "epoch": 1.78, "learning_rate": 3.369288283697676e-05, "loss": 0.0055, "step": 351900 }, { "epoch": 1.78, "learning_rate": 3.3685315143962745e-05, "loss": 0.0044, "step": 351910 }, { "epoch": 1.78, "learning_rate": 3.367774745094873e-05, "loss": 0.0042, "step": 351920 }, { "epoch": 1.78, "learning_rate": 3.367017975793472e-05, "loss": 0.0069, "step": 351930 }, { "epoch": 1.78, "learning_rate": 3.3662612064920716e-05, "loss": 0.0058, "step": 351940 }, { "epoch": 1.78, "learning_rate": 3.3655044371906704e-05, "loss": 0.007, "step": 351950 }, { "epoch": 1.78, "learning_rate": 3.364747667889269e-05, "loss": 0.0055, "step": 351960 }, { "epoch": 1.78, "learning_rate": 3.363990898587868e-05, "loss": 0.0078, "step": 351970 }, { "epoch": 1.78, "learning_rate": 3.3632341292864676e-05, "loss": 0.0082, "step": 351980 }, { "epoch": 1.78, "learning_rate": 3.3624773599850664e-05, "loss": 0.0066, "step": 351990 }, { "epoch": 1.78, "learning_rate": 3.361720590683665e-05, "loss": 0.0054, "step": 352000 }, { "epoch": 1.78, "eval_cer": 0.9144343512465224, "eval_loss": 0.0045296261087059975, "eval_runtime": 116.5512, "eval_samples_per_second": 17.16, "eval_steps_per_second": 4.29, "step": 352000 }, { "epoch": 1.78, "learning_rate": 3.360963821382264e-05, "loss": 0.005, "step": 352010 }, { "epoch": 1.78, "learning_rate": 3.360207052080863e-05, "loss": 0.0078, "step": 352020 }, { "epoch": 1.78, "learning_rate": 3.359450282779462e-05, "loss": 0.0063, "step": 352030 }, { "epoch": 1.78, "learning_rate": 3.3586935134780605e-05, "loss": 0.0055, "step": 352040 }, { "epoch": 1.78, "learning_rate": 3.35793674417666e-05, "loss": 0.0039, "step": 352050 }, { "epoch": 1.78, "learning_rate": 3.357179974875259e-05, "loss": 0.0047, "step": 352060 }, { "epoch": 1.78, "learning_rate": 3.356423205573858e-05, "loss": 0.0048, "step": 352070 }, { "epoch": 1.78, "learning_rate": 3.3556664362724565e-05, "loss": 0.0067, "step": 352080 }, { "epoch": 1.78, "learning_rate": 3.354909666971056e-05, "loss": 0.0095, "step": 352090 }, { "epoch": 1.78, "learning_rate": 3.354152897669655e-05, "loss": 0.005, "step": 352100 }, { "epoch": 1.78, "learning_rate": 3.3533961283682536e-05, "loss": 0.0059, "step": 352110 }, { "epoch": 1.78, "learning_rate": 3.352639359066853e-05, "loss": 0.0076, "step": 352120 }, { "epoch": 1.78, "learning_rate": 3.351882589765452e-05, "loss": 0.0042, "step": 352130 }, { "epoch": 1.78, "learning_rate": 3.351125820464051e-05, "loss": 0.0074, "step": 352140 }, { "epoch": 1.78, "learning_rate": 3.3503690511626496e-05, "loss": 0.0046, "step": 352150 }, { "epoch": 1.78, "learning_rate": 3.349612281861249e-05, "loss": 0.0053, "step": 352160 }, { "epoch": 1.78, "learning_rate": 3.348855512559847e-05, "loss": 0.0071, "step": 352170 }, { "epoch": 1.78, "learning_rate": 3.348098743258446e-05, "loss": 0.0051, "step": 352180 }, { "epoch": 1.78, "learning_rate": 3.3473419739570456e-05, "loss": 0.0065, "step": 352190 }, { "epoch": 1.78, "learning_rate": 3.3465852046556444e-05, "loss": 0.0063, "step": 352200 }, { "epoch": 1.78, "learning_rate": 3.345828435354243e-05, "loss": 0.0072, "step": 352210 }, { "epoch": 1.78, "learning_rate": 3.345071666052842e-05, "loss": 0.0077, "step": 352220 }, { "epoch": 1.78, "learning_rate": 3.3443148967514415e-05, "loss": 0.0075, "step": 352230 }, { "epoch": 1.78, "learning_rate": 3.3435581274500403e-05, "loss": 0.0054, "step": 352240 }, { "epoch": 1.78, "learning_rate": 3.342801358148639e-05, "loss": 0.0065, "step": 352250 }, { "epoch": 1.78, "learning_rate": 3.342044588847238e-05, "loss": 0.0053, "step": 352260 }, { "epoch": 1.78, "learning_rate": 3.3412878195458375e-05, "loss": 0.007, "step": 352270 }, { "epoch": 1.78, "learning_rate": 3.340531050244436e-05, "loss": 0.0059, "step": 352280 }, { "epoch": 1.78, "learning_rate": 3.339774280943035e-05, "loss": 0.0067, "step": 352290 }, { "epoch": 1.78, "learning_rate": 3.339017511641634e-05, "loss": 0.0048, "step": 352300 }, { "epoch": 1.78, "learning_rate": 3.3382607423402335e-05, "loss": 0.0072, "step": 352310 }, { "epoch": 1.78, "learning_rate": 3.337503973038832e-05, "loss": 0.007, "step": 352320 }, { "epoch": 1.78, "learning_rate": 3.336747203737431e-05, "loss": 0.0072, "step": 352330 }, { "epoch": 1.78, "learning_rate": 3.33599043443603e-05, "loss": 0.0063, "step": 352340 }, { "epoch": 1.78, "learning_rate": 3.335233665134629e-05, "loss": 0.0044, "step": 352350 }, { "epoch": 1.78, "learning_rate": 3.3344768958332276e-05, "loss": 0.0051, "step": 352360 }, { "epoch": 1.78, "learning_rate": 3.333720126531827e-05, "loss": 0.0069, "step": 352370 }, { "epoch": 1.78, "learning_rate": 3.332963357230426e-05, "loss": 0.0052, "step": 352380 }, { "epoch": 1.78, "learning_rate": 3.332206587929025e-05, "loss": 0.0093, "step": 352390 }, { "epoch": 1.78, "learning_rate": 3.3314498186276235e-05, "loss": 0.0068, "step": 352400 }, { "epoch": 1.78, "learning_rate": 3.330693049326223e-05, "loss": 0.0053, "step": 352410 }, { "epoch": 1.78, "learning_rate": 3.329936280024822e-05, "loss": 0.0084, "step": 352420 }, { "epoch": 1.78, "learning_rate": 3.329179510723421e-05, "loss": 0.0045, "step": 352430 }, { "epoch": 1.78, "learning_rate": 3.3284227414220195e-05, "loss": 0.006, "step": 352440 }, { "epoch": 1.78, "learning_rate": 3.327665972120619e-05, "loss": 0.0049, "step": 352450 }, { "epoch": 1.78, "learning_rate": 3.326909202819218e-05, "loss": 0.0075, "step": 352460 }, { "epoch": 1.78, "learning_rate": 3.3261524335178166e-05, "loss": 0.0065, "step": 352470 }, { "epoch": 1.78, "learning_rate": 3.3253956642164155e-05, "loss": 0.0058, "step": 352480 }, { "epoch": 1.78, "learning_rate": 3.324638894915014e-05, "loss": 0.0062, "step": 352490 }, { "epoch": 1.78, "learning_rate": 3.323882125613613e-05, "loss": 0.0051, "step": 352500 }, { "epoch": 1.78, "learning_rate": 3.3231253563122126e-05, "loss": 0.0049, "step": 352510 }, { "epoch": 1.78, "learning_rate": 3.3223685870108114e-05, "loss": 0.006, "step": 352520 }, { "epoch": 1.78, "learning_rate": 3.32161181770941e-05, "loss": 0.0061, "step": 352530 }, { "epoch": 1.78, "learning_rate": 3.320855048408009e-05, "loss": 0.0051, "step": 352540 }, { "epoch": 1.78, "learning_rate": 3.3200982791066086e-05, "loss": 0.0095, "step": 352550 }, { "epoch": 1.78, "learning_rate": 3.3193415098052074e-05, "loss": 0.0056, "step": 352560 }, { "epoch": 1.78, "learning_rate": 3.318584740503806e-05, "loss": 0.0069, "step": 352570 }, { "epoch": 1.78, "learning_rate": 3.317827971202405e-05, "loss": 0.0063, "step": 352580 }, { "epoch": 1.78, "learning_rate": 3.3170712019010045e-05, "loss": 0.0052, "step": 352590 }, { "epoch": 1.78, "learning_rate": 3.3163144325996034e-05, "loss": 0.008, "step": 352600 }, { "epoch": 1.78, "learning_rate": 3.315557663298202e-05, "loss": 0.0064, "step": 352610 }, { "epoch": 1.78, "learning_rate": 3.314800893996801e-05, "loss": 0.0057, "step": 352620 }, { "epoch": 1.78, "learning_rate": 3.3140441246954005e-05, "loss": 0.0068, "step": 352630 }, { "epoch": 1.78, "learning_rate": 3.3132873553939986e-05, "loss": 0.007, "step": 352640 }, { "epoch": 1.78, "learning_rate": 3.312530586092598e-05, "loss": 0.0043, "step": 352650 }, { "epoch": 1.78, "learning_rate": 3.311773816791197e-05, "loss": 0.0061, "step": 352660 }, { "epoch": 1.78, "learning_rate": 3.311017047489796e-05, "loss": 0.0048, "step": 352670 }, { "epoch": 1.78, "learning_rate": 3.3102602781883946e-05, "loss": 0.0068, "step": 352680 }, { "epoch": 1.78, "learning_rate": 3.309503508886994e-05, "loss": 0.0057, "step": 352690 }, { "epoch": 1.78, "learning_rate": 3.308746739585593e-05, "loss": 0.0065, "step": 352700 }, { "epoch": 1.78, "learning_rate": 3.307989970284192e-05, "loss": 0.0067, "step": 352710 }, { "epoch": 1.78, "learning_rate": 3.3072332009827906e-05, "loss": 0.0057, "step": 352720 }, { "epoch": 1.78, "learning_rate": 3.30647643168139e-05, "loss": 0.005, "step": 352730 }, { "epoch": 1.78, "learning_rate": 3.305719662379989e-05, "loss": 0.0053, "step": 352740 }, { "epoch": 1.78, "learning_rate": 3.304962893078588e-05, "loss": 0.0055, "step": 352750 }, { "epoch": 1.78, "learning_rate": 3.3042061237771865e-05, "loss": 0.0074, "step": 352760 }, { "epoch": 1.78, "learning_rate": 3.303449354475786e-05, "loss": 0.0051, "step": 352770 }, { "epoch": 1.78, "learning_rate": 3.302692585174385e-05, "loss": 0.0059, "step": 352780 }, { "epoch": 1.78, "learning_rate": 3.301935815872984e-05, "loss": 0.0053, "step": 352790 }, { "epoch": 1.78, "learning_rate": 3.3011790465715825e-05, "loss": 0.0064, "step": 352800 }, { "epoch": 1.78, "learning_rate": 3.300422277270181e-05, "loss": 0.0094, "step": 352810 }, { "epoch": 1.78, "learning_rate": 3.29966550796878e-05, "loss": 0.0074, "step": 352820 }, { "epoch": 1.78, "learning_rate": 3.2989087386673796e-05, "loss": 0.0062, "step": 352830 }, { "epoch": 1.78, "learning_rate": 3.2981519693659785e-05, "loss": 0.0058, "step": 352840 }, { "epoch": 1.78, "learning_rate": 3.297395200064577e-05, "loss": 0.0072, "step": 352850 }, { "epoch": 1.78, "learning_rate": 3.296638430763176e-05, "loss": 0.0064, "step": 352860 }, { "epoch": 1.78, "learning_rate": 3.2958816614617756e-05, "loss": 0.0061, "step": 352870 }, { "epoch": 1.78, "learning_rate": 3.2951248921603744e-05, "loss": 0.0046, "step": 352880 }, { "epoch": 1.78, "learning_rate": 3.294368122858973e-05, "loss": 0.0049, "step": 352890 }, { "epoch": 1.78, "learning_rate": 3.293611353557572e-05, "loss": 0.0062, "step": 352900 }, { "epoch": 1.78, "learning_rate": 3.2928545842561716e-05, "loss": 0.0092, "step": 352910 }, { "epoch": 1.78, "learning_rate": 3.2920978149547704e-05, "loss": 0.0059, "step": 352920 }, { "epoch": 1.78, "learning_rate": 3.291341045653369e-05, "loss": 0.0047, "step": 352930 }, { "epoch": 1.78, "learning_rate": 3.290584276351968e-05, "loss": 0.0057, "step": 352940 }, { "epoch": 1.78, "learning_rate": 3.289827507050567e-05, "loss": 0.006, "step": 352950 }, { "epoch": 1.78, "learning_rate": 3.289070737749166e-05, "loss": 0.0046, "step": 352960 }, { "epoch": 1.78, "learning_rate": 3.2883139684477645e-05, "loss": 0.0061, "step": 352970 }, { "epoch": 1.78, "learning_rate": 3.287557199146364e-05, "loss": 0.0057, "step": 352980 }, { "epoch": 1.78, "learning_rate": 3.286800429844963e-05, "loss": 0.0086, "step": 352990 }, { "epoch": 1.78, "learning_rate": 3.2860436605435617e-05, "loss": 0.0081, "step": 353000 }, { "epoch": 1.78, "eval_cer": 0.9144139729278888, "eval_loss": 0.0045607974752783775, "eval_runtime": 116.7751, "eval_samples_per_second": 17.127, "eval_steps_per_second": 4.282, "step": 353000 }, { "epoch": 1.78, "learning_rate": 3.2852868912421605e-05, "loss": 0.0066, "step": 353010 }, { "epoch": 1.78, "learning_rate": 3.28453012194076e-05, "loss": 0.0069, "step": 353020 }, { "epoch": 1.78, "learning_rate": 3.283773352639359e-05, "loss": 0.0071, "step": 353030 }, { "epoch": 1.78, "learning_rate": 3.2830165833379576e-05, "loss": 0.009, "step": 353040 }, { "epoch": 1.78, "learning_rate": 3.2822598140365564e-05, "loss": 0.0079, "step": 353050 }, { "epoch": 1.78, "learning_rate": 3.281503044735156e-05, "loss": 0.0056, "step": 353060 }, { "epoch": 1.78, "learning_rate": 3.280746275433755e-05, "loss": 0.0065, "step": 353070 }, { "epoch": 1.78, "learning_rate": 3.2799895061323536e-05, "loss": 0.0054, "step": 353080 }, { "epoch": 1.78, "learning_rate": 3.279232736830953e-05, "loss": 0.0054, "step": 353090 }, { "epoch": 1.78, "learning_rate": 3.278475967529552e-05, "loss": 0.0043, "step": 353100 }, { "epoch": 1.78, "learning_rate": 3.27771919822815e-05, "loss": 0.0075, "step": 353110 }, { "epoch": 1.78, "learning_rate": 3.2769624289267496e-05, "loss": 0.0059, "step": 353120 }, { "epoch": 1.78, "learning_rate": 3.2762056596253484e-05, "loss": 0.006, "step": 353130 }, { "epoch": 1.78, "learning_rate": 3.275448890323947e-05, "loss": 0.0052, "step": 353140 }, { "epoch": 1.78, "learning_rate": 3.274692121022546e-05, "loss": 0.0079, "step": 353150 }, { "epoch": 1.78, "learning_rate": 3.2739353517211455e-05, "loss": 0.0156, "step": 353160 }, { "epoch": 1.78, "learning_rate": 3.273178582419744e-05, "loss": 0.0114, "step": 353170 }, { "epoch": 1.78, "learning_rate": 3.272421813118343e-05, "loss": 0.0084, "step": 353180 }, { "epoch": 1.78, "learning_rate": 3.271665043816942e-05, "loss": 0.0069, "step": 353190 }, { "epoch": 1.78, "learning_rate": 3.2709082745155415e-05, "loss": 0.0052, "step": 353200 }, { "epoch": 1.78, "learning_rate": 3.27015150521414e-05, "loss": 0.0043, "step": 353210 }, { "epoch": 1.78, "learning_rate": 3.269394735912739e-05, "loss": 0.0046, "step": 353220 }, { "epoch": 1.78, "learning_rate": 3.268637966611338e-05, "loss": 0.0058, "step": 353230 }, { "epoch": 1.78, "learning_rate": 3.2678811973099374e-05, "loss": 0.0052, "step": 353240 }, { "epoch": 1.78, "learning_rate": 3.267124428008536e-05, "loss": 0.0074, "step": 353250 }, { "epoch": 1.78, "learning_rate": 3.266367658707135e-05, "loss": 0.0065, "step": 353260 }, { "epoch": 1.78, "learning_rate": 3.265610889405734e-05, "loss": 0.0044, "step": 353270 }, { "epoch": 1.78, "learning_rate": 3.264854120104333e-05, "loss": 0.0045, "step": 353280 }, { "epoch": 1.78, "learning_rate": 3.2640973508029316e-05, "loss": 0.0074, "step": 353290 }, { "epoch": 1.78, "learning_rate": 3.263340581501531e-05, "loss": 0.0061, "step": 353300 }, { "epoch": 1.78, "learning_rate": 3.26258381220013e-05, "loss": 0.007, "step": 353310 }, { "epoch": 1.78, "learning_rate": 3.261827042898729e-05, "loss": 0.007, "step": 353320 }, { "epoch": 1.78, "learning_rate": 3.2610702735973275e-05, "loss": 0.0055, "step": 353330 }, { "epoch": 1.78, "learning_rate": 3.260313504295927e-05, "loss": 0.0072, "step": 353340 }, { "epoch": 1.78, "learning_rate": 3.259556734994526e-05, "loss": 0.006, "step": 353350 }, { "epoch": 1.78, "learning_rate": 3.258799965693125e-05, "loss": 0.0064, "step": 353360 }, { "epoch": 1.78, "learning_rate": 3.2580431963917235e-05, "loss": 0.0087, "step": 353370 }, { "epoch": 1.78, "learning_rate": 3.257286427090323e-05, "loss": 0.0064, "step": 353380 }, { "epoch": 1.78, "learning_rate": 3.256529657788922e-05, "loss": 0.0054, "step": 353390 }, { "epoch": 1.78, "learning_rate": 3.2557728884875206e-05, "loss": 0.0041, "step": 353400 }, { "epoch": 1.78, "learning_rate": 3.2550161191861195e-05, "loss": 0.0052, "step": 353410 }, { "epoch": 1.78, "learning_rate": 3.254259349884719e-05, "loss": 0.0048, "step": 353420 }, { "epoch": 1.78, "learning_rate": 3.253502580583317e-05, "loss": 0.0059, "step": 353430 }, { "epoch": 1.78, "learning_rate": 3.2527458112819166e-05, "loss": 0.0035, "step": 353440 }, { "epoch": 1.78, "learning_rate": 3.2519890419805154e-05, "loss": 0.0087, "step": 353450 }, { "epoch": 1.78, "learning_rate": 3.251232272679114e-05, "loss": 0.0055, "step": 353460 }, { "epoch": 1.78, "learning_rate": 3.250475503377713e-05, "loss": 0.0065, "step": 353470 }, { "epoch": 1.78, "learning_rate": 3.2497187340763126e-05, "loss": 0.0058, "step": 353480 }, { "epoch": 1.78, "learning_rate": 3.2489619647749114e-05, "loss": 0.0078, "step": 353490 }, { "epoch": 1.78, "learning_rate": 3.24820519547351e-05, "loss": 0.005, "step": 353500 }, { "epoch": 1.78, "learning_rate": 3.247448426172109e-05, "loss": 0.0069, "step": 353510 }, { "epoch": 1.78, "learning_rate": 3.2466916568707085e-05, "loss": 0.0073, "step": 353520 }, { "epoch": 1.78, "learning_rate": 3.2459348875693073e-05, "loss": 0.0044, "step": 353530 }, { "epoch": 1.78, "learning_rate": 3.245178118267906e-05, "loss": 0.005, "step": 353540 }, { "epoch": 1.78, "learning_rate": 3.244421348966505e-05, "loss": 0.0048, "step": 353550 }, { "epoch": 1.78, "learning_rate": 3.2436645796651045e-05, "loss": 0.0063, "step": 353560 }, { "epoch": 1.78, "learning_rate": 3.242907810363703e-05, "loss": 0.0058, "step": 353570 }, { "epoch": 1.78, "learning_rate": 3.242151041062302e-05, "loss": 0.0054, "step": 353580 }, { "epoch": 1.78, "learning_rate": 3.241394271760901e-05, "loss": 0.0058, "step": 353590 }, { "epoch": 1.78, "learning_rate": 3.2406375024595e-05, "loss": 0.0062, "step": 353600 }, { "epoch": 1.78, "learning_rate": 3.2398807331580986e-05, "loss": 0.0054, "step": 353610 }, { "epoch": 1.78, "learning_rate": 3.239123963856698e-05, "loss": 0.0071, "step": 353620 }, { "epoch": 1.78, "learning_rate": 3.238367194555297e-05, "loss": 0.0046, "step": 353630 }, { "epoch": 1.78, "learning_rate": 3.237610425253896e-05, "loss": 0.0053, "step": 353640 }, { "epoch": 1.78, "learning_rate": 3.2368536559524946e-05, "loss": 0.0085, "step": 353650 }, { "epoch": 1.78, "learning_rate": 3.236096886651094e-05, "loss": 0.0094, "step": 353660 }, { "epoch": 1.78, "learning_rate": 3.235340117349693e-05, "loss": 0.0066, "step": 353670 }, { "epoch": 1.78, "learning_rate": 3.234583348048292e-05, "loss": 0.0042, "step": 353680 }, { "epoch": 1.78, "learning_rate": 3.2338265787468905e-05, "loss": 0.0064, "step": 353690 }, { "epoch": 1.78, "learning_rate": 3.23306980944549e-05, "loss": 0.0064, "step": 353700 }, { "epoch": 1.78, "learning_rate": 3.232313040144089e-05, "loss": 0.0065, "step": 353710 }, { "epoch": 1.78, "learning_rate": 3.231556270842688e-05, "loss": 0.0071, "step": 353720 }, { "epoch": 1.78, "learning_rate": 3.2307995015412865e-05, "loss": 0.005, "step": 353730 }, { "epoch": 1.78, "learning_rate": 3.230042732239885e-05, "loss": 0.0076, "step": 353740 }, { "epoch": 1.78, "learning_rate": 3.229285962938484e-05, "loss": 0.0079, "step": 353750 }, { "epoch": 1.78, "learning_rate": 3.228529193637083e-05, "loss": 0.0043, "step": 353760 }, { "epoch": 1.78, "learning_rate": 3.2277724243356825e-05, "loss": 0.0055, "step": 353770 }, { "epoch": 1.78, "learning_rate": 3.227015655034281e-05, "loss": 0.0067, "step": 353780 }, { "epoch": 1.78, "learning_rate": 3.22625888573288e-05, "loss": 0.0056, "step": 353790 }, { "epoch": 1.78, "learning_rate": 3.2255021164314796e-05, "loss": 0.0065, "step": 353800 }, { "epoch": 1.79, "learning_rate": 3.2247453471300784e-05, "loss": 0.0066, "step": 353810 }, { "epoch": 1.79, "learning_rate": 3.223988577828677e-05, "loss": 0.0061, "step": 353820 }, { "epoch": 1.79, "learning_rate": 3.223231808527276e-05, "loss": 0.0085, "step": 353830 }, { "epoch": 1.79, "learning_rate": 3.2224750392258756e-05, "loss": 0.0033, "step": 353840 }, { "epoch": 1.79, "learning_rate": 3.2217182699244744e-05, "loss": 0.0059, "step": 353850 }, { "epoch": 1.79, "learning_rate": 3.220961500623073e-05, "loss": 0.0062, "step": 353860 }, { "epoch": 1.79, "learning_rate": 3.220204731321672e-05, "loss": 0.0058, "step": 353870 }, { "epoch": 1.79, "learning_rate": 3.2194479620202715e-05, "loss": 0.0045, "step": 353880 }, { "epoch": 1.79, "learning_rate": 3.2186911927188704e-05, "loss": 0.0052, "step": 353890 }, { "epoch": 1.79, "learning_rate": 3.2179344234174685e-05, "loss": 0.0056, "step": 353900 }, { "epoch": 1.79, "learning_rate": 3.217177654116068e-05, "loss": 0.0062, "step": 353910 }, { "epoch": 1.79, "learning_rate": 3.216420884814667e-05, "loss": 0.0062, "step": 353920 }, { "epoch": 1.79, "learning_rate": 3.2156641155132656e-05, "loss": 0.0081, "step": 353930 }, { "epoch": 1.79, "learning_rate": 3.2149073462118645e-05, "loss": 0.0058, "step": 353940 }, { "epoch": 1.79, "learning_rate": 3.214150576910464e-05, "loss": 0.0044, "step": 353950 }, { "epoch": 1.79, "learning_rate": 3.213393807609063e-05, "loss": 0.0054, "step": 353960 }, { "epoch": 1.79, "learning_rate": 3.2126370383076616e-05, "loss": 0.0076, "step": 353970 }, { "epoch": 1.79, "learning_rate": 3.2118802690062604e-05, "loss": 0.0058, "step": 353980 }, { "epoch": 1.79, "learning_rate": 3.21112349970486e-05, "loss": 0.0069, "step": 353990 }, { "epoch": 1.79, "learning_rate": 3.210366730403459e-05, "loss": 0.0051, "step": 354000 }, { "epoch": 1.79, "eval_cer": 0.9144197953046413, "eval_loss": 0.004529756028205156, "eval_runtime": 116.782, "eval_samples_per_second": 17.126, "eval_steps_per_second": 4.281, "step": 354000 }, { "epoch": 1.79, "learning_rate": 3.2096099611020576e-05, "loss": 0.0069, "step": 354010 }, { "epoch": 1.79, "learning_rate": 3.2088531918006564e-05, "loss": 0.0073, "step": 354020 }, { "epoch": 1.79, "learning_rate": 3.208096422499256e-05, "loss": 0.0055, "step": 354030 }, { "epoch": 1.79, "learning_rate": 3.207339653197855e-05, "loss": 0.0066, "step": 354040 }, { "epoch": 1.79, "learning_rate": 3.2065828838964535e-05, "loss": 0.0061, "step": 354050 }, { "epoch": 1.79, "learning_rate": 3.2058261145950524e-05, "loss": 0.0063, "step": 354060 }, { "epoch": 1.79, "learning_rate": 3.205069345293651e-05, "loss": 0.0078, "step": 354070 }, { "epoch": 1.79, "learning_rate": 3.20431257599225e-05, "loss": 0.0059, "step": 354080 }, { "epoch": 1.79, "learning_rate": 3.2035558066908495e-05, "loss": 0.0059, "step": 354090 }, { "epoch": 1.79, "learning_rate": 3.202799037389448e-05, "loss": 0.0063, "step": 354100 }, { "epoch": 1.79, "learning_rate": 3.202042268088047e-05, "loss": 0.0072, "step": 354110 }, { "epoch": 1.79, "learning_rate": 3.201285498786646e-05, "loss": 0.0064, "step": 354120 }, { "epoch": 1.79, "learning_rate": 3.2005287294852455e-05, "loss": 0.0045, "step": 354130 }, { "epoch": 1.79, "learning_rate": 3.199771960183844e-05, "loss": 0.0072, "step": 354140 }, { "epoch": 1.79, "learning_rate": 3.199015190882443e-05, "loss": 0.0056, "step": 354150 }, { "epoch": 1.79, "learning_rate": 3.198258421581042e-05, "loss": 0.0113, "step": 354160 }, { "epoch": 1.79, "learning_rate": 3.1975016522796414e-05, "loss": 0.0064, "step": 354170 }, { "epoch": 1.79, "learning_rate": 3.19674488297824e-05, "loss": 0.0082, "step": 354180 }, { "epoch": 1.79, "learning_rate": 3.195988113676839e-05, "loss": 0.0063, "step": 354190 }, { "epoch": 1.79, "learning_rate": 3.195231344375438e-05, "loss": 0.0056, "step": 354200 }, { "epoch": 1.79, "learning_rate": 3.194474575074037e-05, "loss": 0.0058, "step": 354210 }, { "epoch": 1.79, "learning_rate": 3.1937178057726355e-05, "loss": 0.0054, "step": 354220 }, { "epoch": 1.79, "learning_rate": 3.192961036471235e-05, "loss": 0.0048, "step": 354230 }, { "epoch": 1.79, "learning_rate": 3.192204267169834e-05, "loss": 0.0055, "step": 354240 }, { "epoch": 1.79, "learning_rate": 3.191447497868433e-05, "loss": 0.0057, "step": 354250 }, { "epoch": 1.79, "learning_rate": 3.1906907285670315e-05, "loss": 0.0071, "step": 354260 }, { "epoch": 1.79, "learning_rate": 3.189933959265631e-05, "loss": 0.0059, "step": 354270 }, { "epoch": 1.79, "learning_rate": 3.18917718996423e-05, "loss": 0.0064, "step": 354280 }, { "epoch": 1.79, "learning_rate": 3.1884204206628287e-05, "loss": 0.0066, "step": 354290 }, { "epoch": 1.79, "learning_rate": 3.1876636513614275e-05, "loss": 0.0067, "step": 354300 }, { "epoch": 1.79, "learning_rate": 3.186906882060027e-05, "loss": 0.0059, "step": 354310 }, { "epoch": 1.79, "learning_rate": 3.186150112758626e-05, "loss": 0.007, "step": 354320 }, { "epoch": 1.79, "learning_rate": 3.1853933434572246e-05, "loss": 0.0065, "step": 354330 }, { "epoch": 1.79, "learning_rate": 3.1846365741558234e-05, "loss": 0.0062, "step": 354340 }, { "epoch": 1.79, "learning_rate": 3.183879804854423e-05, "loss": 0.0077, "step": 354350 }, { "epoch": 1.79, "learning_rate": 3.183123035553022e-05, "loss": 0.0062, "step": 354360 }, { "epoch": 1.79, "learning_rate": 3.1823662662516206e-05, "loss": 0.0074, "step": 354370 }, { "epoch": 1.79, "learning_rate": 3.1816094969502194e-05, "loss": 0.0086, "step": 354380 }, { "epoch": 1.79, "learning_rate": 3.180852727648818e-05, "loss": 0.0063, "step": 354390 }, { "epoch": 1.79, "learning_rate": 3.180095958347417e-05, "loss": 0.0074, "step": 354400 }, { "epoch": 1.79, "learning_rate": 3.1793391890460165e-05, "loss": 0.0051, "step": 354410 }, { "epoch": 1.79, "learning_rate": 3.1785824197446154e-05, "loss": 0.0077, "step": 354420 }, { "epoch": 1.79, "learning_rate": 3.177825650443214e-05, "loss": 0.0073, "step": 354430 }, { "epoch": 1.79, "learning_rate": 3.177068881141813e-05, "loss": 0.0068, "step": 354440 }, { "epoch": 1.79, "learning_rate": 3.1763121118404125e-05, "loss": 0.0048, "step": 354450 }, { "epoch": 1.79, "learning_rate": 3.175555342539011e-05, "loss": 0.0071, "step": 354460 }, { "epoch": 1.79, "learning_rate": 3.17479857323761e-05, "loss": 0.0048, "step": 354470 }, { "epoch": 1.79, "learning_rate": 3.174041803936209e-05, "loss": 0.0056, "step": 354480 }, { "epoch": 1.79, "learning_rate": 3.1732850346348085e-05, "loss": 0.0059, "step": 354490 }, { "epoch": 1.79, "learning_rate": 3.172528265333407e-05, "loss": 0.0053, "step": 354500 }, { "epoch": 1.79, "learning_rate": 3.171771496032006e-05, "loss": 0.005, "step": 354510 }, { "epoch": 1.79, "learning_rate": 3.171014726730605e-05, "loss": 0.007, "step": 354520 }, { "epoch": 1.79, "learning_rate": 3.170257957429204e-05, "loss": 0.0067, "step": 354530 }, { "epoch": 1.79, "learning_rate": 3.1695011881278026e-05, "loss": 0.005, "step": 354540 }, { "epoch": 1.79, "learning_rate": 3.168744418826402e-05, "loss": 0.0076, "step": 354550 }, { "epoch": 1.79, "learning_rate": 3.167987649525001e-05, "loss": 0.0054, "step": 354560 }, { "epoch": 1.79, "learning_rate": 3.1672308802236e-05, "loss": 0.004, "step": 354570 }, { "epoch": 1.79, "learning_rate": 3.1664741109221986e-05, "loss": 0.0068, "step": 354580 }, { "epoch": 1.79, "learning_rate": 3.165717341620798e-05, "loss": 0.0065, "step": 354590 }, { "epoch": 1.79, "learning_rate": 3.164960572319397e-05, "loss": 0.0076, "step": 354600 }, { "epoch": 1.79, "learning_rate": 3.164203803017996e-05, "loss": 0.0072, "step": 354610 }, { "epoch": 1.79, "learning_rate": 3.1634470337165945e-05, "loss": 0.0065, "step": 354620 }, { "epoch": 1.79, "learning_rate": 3.162690264415194e-05, "loss": 0.0055, "step": 354630 }, { "epoch": 1.79, "learning_rate": 3.161933495113793e-05, "loss": 0.0057, "step": 354640 }, { "epoch": 1.79, "learning_rate": 3.1611767258123917e-05, "loss": 0.0048, "step": 354650 }, { "epoch": 1.79, "learning_rate": 3.1604199565109905e-05, "loss": 0.0067, "step": 354660 }, { "epoch": 1.79, "learning_rate": 3.15966318720959e-05, "loss": 0.0064, "step": 354670 }, { "epoch": 1.79, "learning_rate": 3.158906417908188e-05, "loss": 0.0059, "step": 354680 }, { "epoch": 1.79, "learning_rate": 3.158149648606787e-05, "loss": 0.0044, "step": 354690 }, { "epoch": 1.79, "learning_rate": 3.1573928793053864e-05, "loss": 0.0069, "step": 354700 }, { "epoch": 1.79, "learning_rate": 3.156636110003985e-05, "loss": 0.0073, "step": 354710 }, { "epoch": 1.79, "learning_rate": 3.155879340702584e-05, "loss": 0.0057, "step": 354720 }, { "epoch": 1.79, "learning_rate": 3.155122571401183e-05, "loss": 0.0064, "step": 354730 }, { "epoch": 1.79, "learning_rate": 3.1543658020997824e-05, "loss": 0.0053, "step": 354740 }, { "epoch": 1.79, "learning_rate": 3.153609032798381e-05, "loss": 0.0062, "step": 354750 }, { "epoch": 1.79, "learning_rate": 3.15285226349698e-05, "loss": 0.0087, "step": 354760 }, { "epoch": 1.79, "learning_rate": 3.1520954941955796e-05, "loss": 0.0073, "step": 354770 }, { "epoch": 1.79, "learning_rate": 3.1513387248941784e-05, "loss": 0.0048, "step": 354780 }, { "epoch": 1.79, "learning_rate": 3.150581955592777e-05, "loss": 0.0047, "step": 354790 }, { "epoch": 1.79, "learning_rate": 3.149825186291376e-05, "loss": 0.0066, "step": 354800 }, { "epoch": 1.79, "learning_rate": 3.1490684169899755e-05, "loss": 0.0053, "step": 354810 }, { "epoch": 1.79, "learning_rate": 3.1483116476885743e-05, "loss": 0.0066, "step": 354820 }, { "epoch": 1.79, "learning_rate": 3.147554878387173e-05, "loss": 0.0065, "step": 354830 }, { "epoch": 1.79, "learning_rate": 3.146798109085772e-05, "loss": 0.006, "step": 354840 }, { "epoch": 1.79, "learning_rate": 3.146041339784371e-05, "loss": 0.0055, "step": 354850 }, { "epoch": 1.79, "learning_rate": 3.1452845704829696e-05, "loss": 0.0048, "step": 354860 }, { "epoch": 1.79, "learning_rate": 3.1445278011815685e-05, "loss": 0.0065, "step": 354870 }, { "epoch": 1.79, "learning_rate": 3.143771031880168e-05, "loss": 0.0061, "step": 354880 }, { "epoch": 1.79, "learning_rate": 3.143014262578767e-05, "loss": 0.0064, "step": 354890 }, { "epoch": 1.79, "learning_rate": 3.1422574932773656e-05, "loss": 0.008, "step": 354900 }, { "epoch": 1.79, "learning_rate": 3.1415007239759644e-05, "loss": 0.0046, "step": 354910 }, { "epoch": 1.79, "learning_rate": 3.140743954674564e-05, "loss": 0.0072, "step": 354920 }, { "epoch": 1.79, "learning_rate": 3.139987185373163e-05, "loss": 0.0054, "step": 354930 }, { "epoch": 1.79, "learning_rate": 3.1392304160717616e-05, "loss": 0.0056, "step": 354940 }, { "epoch": 1.79, "learning_rate": 3.1384736467703604e-05, "loss": 0.0065, "step": 354950 }, { "epoch": 1.79, "learning_rate": 3.13771687746896e-05, "loss": 0.0073, "step": 354960 }, { "epoch": 1.79, "learning_rate": 3.136960108167559e-05, "loss": 0.0052, "step": 354970 }, { "epoch": 1.79, "learning_rate": 3.1362033388661575e-05, "loss": 0.0064, "step": 354980 }, { "epoch": 1.79, "learning_rate": 3.1354465695647563e-05, "loss": 0.0048, "step": 354990 }, { "epoch": 1.79, "learning_rate": 3.134689800263355e-05, "loss": 0.006, "step": 355000 }, { "epoch": 1.79, "eval_cer": 0.9144265880775191, "eval_loss": 0.004483331926167011, "eval_runtime": 116.7694, "eval_samples_per_second": 17.128, "eval_steps_per_second": 4.282, "step": 355000 }, { "epoch": 1.79, "learning_rate": 3.133933030961954e-05, "loss": 0.0064, "step": 355010 }, { "epoch": 1.79, "learning_rate": 3.1331762616605535e-05, "loss": 0.0053, "step": 355020 }, { "epoch": 1.79, "learning_rate": 3.132419492359152e-05, "loss": 0.0061, "step": 355030 }, { "epoch": 1.79, "learning_rate": 3.131662723057751e-05, "loss": 0.0045, "step": 355040 }, { "epoch": 1.79, "learning_rate": 3.13090595375635e-05, "loss": 0.0057, "step": 355050 }, { "epoch": 1.79, "learning_rate": 3.1301491844549495e-05, "loss": 0.0053, "step": 355060 }, { "epoch": 1.79, "learning_rate": 3.129392415153548e-05, "loss": 0.0064, "step": 355070 }, { "epoch": 1.79, "learning_rate": 3.128635645852147e-05, "loss": 0.0051, "step": 355080 }, { "epoch": 1.79, "learning_rate": 3.127878876550746e-05, "loss": 0.0088, "step": 355090 }, { "epoch": 1.79, "learning_rate": 3.1271221072493454e-05, "loss": 0.0071, "step": 355100 }, { "epoch": 1.79, "learning_rate": 3.126365337947944e-05, "loss": 0.0065, "step": 355110 }, { "epoch": 1.79, "learning_rate": 3.125608568646543e-05, "loss": 0.0063, "step": 355120 }, { "epoch": 1.79, "learning_rate": 3.124851799345142e-05, "loss": 0.0055, "step": 355130 }, { "epoch": 1.79, "learning_rate": 3.1240950300437414e-05, "loss": 0.0042, "step": 355140 }, { "epoch": 1.79, "learning_rate": 3.1233382607423395e-05, "loss": 0.0053, "step": 355150 }, { "epoch": 1.79, "learning_rate": 3.122581491440939e-05, "loss": 0.0043, "step": 355160 }, { "epoch": 1.79, "learning_rate": 3.121824722139538e-05, "loss": 0.0063, "step": 355170 }, { "epoch": 1.79, "learning_rate": 3.121067952838137e-05, "loss": 0.007, "step": 355180 }, { "epoch": 1.79, "learning_rate": 3.1203111835367355e-05, "loss": 0.0072, "step": 355190 }, { "epoch": 1.79, "learning_rate": 3.119554414235335e-05, "loss": 0.0075, "step": 355200 }, { "epoch": 1.79, "learning_rate": 3.118797644933934e-05, "loss": 0.006, "step": 355210 }, { "epoch": 1.79, "learning_rate": 3.1180408756325326e-05, "loss": 0.0059, "step": 355220 }, { "epoch": 1.79, "learning_rate": 3.1172841063311315e-05, "loss": 0.0076, "step": 355230 }, { "epoch": 1.79, "learning_rate": 3.116527337029731e-05, "loss": 0.0064, "step": 355240 }, { "epoch": 1.79, "learning_rate": 3.11577056772833e-05, "loss": 0.0044, "step": 355250 }, { "epoch": 1.79, "learning_rate": 3.1150137984269286e-05, "loss": 0.0054, "step": 355260 }, { "epoch": 1.79, "learning_rate": 3.1142570291255274e-05, "loss": 0.0054, "step": 355270 }, { "epoch": 1.79, "learning_rate": 3.113500259824127e-05, "loss": 0.0055, "step": 355280 }, { "epoch": 1.79, "learning_rate": 3.112743490522726e-05, "loss": 0.0071, "step": 355290 }, { "epoch": 1.79, "learning_rate": 3.1119867212213246e-05, "loss": 0.0045, "step": 355300 }, { "epoch": 1.79, "learning_rate": 3.1112299519199234e-05, "loss": 0.0075, "step": 355310 }, { "epoch": 1.79, "learning_rate": 3.110473182618522e-05, "loss": 0.0058, "step": 355320 }, { "epoch": 1.79, "learning_rate": 3.109716413317121e-05, "loss": 0.0053, "step": 355330 }, { "epoch": 1.79, "learning_rate": 3.1089596440157205e-05, "loss": 0.0053, "step": 355340 }, { "epoch": 1.79, "learning_rate": 3.1082028747143194e-05, "loss": 0.0032, "step": 355350 }, { "epoch": 1.79, "learning_rate": 3.107446105412918e-05, "loss": 0.0064, "step": 355360 }, { "epoch": 1.79, "learning_rate": 3.106689336111517e-05, "loss": 0.0048, "step": 355370 }, { "epoch": 1.79, "learning_rate": 3.1059325668101165e-05, "loss": 0.0061, "step": 355380 }, { "epoch": 1.79, "learning_rate": 3.105175797508715e-05, "loss": 0.0046, "step": 355390 }, { "epoch": 1.79, "learning_rate": 3.104419028207314e-05, "loss": 0.0058, "step": 355400 }, { "epoch": 1.79, "learning_rate": 3.103662258905913e-05, "loss": 0.009, "step": 355410 }, { "epoch": 1.79, "learning_rate": 3.1029054896045125e-05, "loss": 0.0056, "step": 355420 }, { "epoch": 1.79, "learning_rate": 3.102148720303111e-05, "loss": 0.0058, "step": 355430 }, { "epoch": 1.79, "learning_rate": 3.10139195100171e-05, "loss": 0.0049, "step": 355440 }, { "epoch": 1.79, "learning_rate": 3.100635181700309e-05, "loss": 0.0083, "step": 355450 }, { "epoch": 1.79, "learning_rate": 3.0998784123989084e-05, "loss": 0.0058, "step": 355460 }, { "epoch": 1.79, "learning_rate": 3.0991216430975066e-05, "loss": 0.0056, "step": 355470 }, { "epoch": 1.79, "learning_rate": 3.098364873796106e-05, "loss": 0.0054, "step": 355480 }, { "epoch": 1.79, "learning_rate": 3.097608104494705e-05, "loss": 0.0093, "step": 355490 }, { "epoch": 1.79, "learning_rate": 3.096851335193304e-05, "loss": 0.0048, "step": 355500 }, { "epoch": 1.79, "learning_rate": 3.0960945658919025e-05, "loss": 0.0056, "step": 355510 }, { "epoch": 1.79, "learning_rate": 3.095337796590502e-05, "loss": 0.0061, "step": 355520 }, { "epoch": 1.79, "learning_rate": 3.094581027289101e-05, "loss": 0.0058, "step": 355530 }, { "epoch": 1.79, "learning_rate": 3.0938242579877e-05, "loss": 0.0074, "step": 355540 }, { "epoch": 1.79, "learning_rate": 3.0930674886862985e-05, "loss": 0.006, "step": 355550 }, { "epoch": 1.79, "learning_rate": 3.092310719384898e-05, "loss": 0.0052, "step": 355560 }, { "epoch": 1.79, "learning_rate": 3.091553950083497e-05, "loss": 0.0059, "step": 355570 }, { "epoch": 1.79, "learning_rate": 3.0907971807820956e-05, "loss": 0.0047, "step": 355580 }, { "epoch": 1.79, "learning_rate": 3.0900404114806945e-05, "loss": 0.0061, "step": 355590 }, { "epoch": 1.79, "learning_rate": 3.089283642179294e-05, "loss": 0.0061, "step": 355600 }, { "epoch": 1.79, "learning_rate": 3.088526872877893e-05, "loss": 0.009, "step": 355610 }, { "epoch": 1.79, "learning_rate": 3.0877701035764916e-05, "loss": 0.0062, "step": 355620 }, { "epoch": 1.79, "learning_rate": 3.0870133342750904e-05, "loss": 0.0045, "step": 355630 }, { "epoch": 1.79, "learning_rate": 3.086256564973689e-05, "loss": 0.0058, "step": 355640 }, { "epoch": 1.79, "learning_rate": 3.085499795672288e-05, "loss": 0.0058, "step": 355650 }, { "epoch": 1.79, "learning_rate": 3.084743026370887e-05, "loss": 0.006, "step": 355660 }, { "epoch": 1.79, "learning_rate": 3.0839862570694864e-05, "loss": 0.0056, "step": 355670 }, { "epoch": 1.79, "learning_rate": 3.083229487768085e-05, "loss": 0.0071, "step": 355680 }, { "epoch": 1.79, "learning_rate": 3.082472718466684e-05, "loss": 0.006, "step": 355690 }, { "epoch": 1.79, "learning_rate": 3.081715949165283e-05, "loss": 0.0052, "step": 355700 }, { "epoch": 1.79, "learning_rate": 3.0809591798638824e-05, "loss": 0.0056, "step": 355710 }, { "epoch": 1.79, "learning_rate": 3.080202410562481e-05, "loss": 0.0051, "step": 355720 }, { "epoch": 1.79, "learning_rate": 3.07944564126108e-05, "loss": 0.007, "step": 355730 }, { "epoch": 1.79, "learning_rate": 3.0786888719596795e-05, "loss": 0.0045, "step": 355740 }, { "epoch": 1.79, "learning_rate": 3.077932102658278e-05, "loss": 0.0052, "step": 355750 }, { "epoch": 1.79, "learning_rate": 3.077175333356877e-05, "loss": 0.007, "step": 355760 }, { "epoch": 1.79, "learning_rate": 3.076418564055476e-05, "loss": 0.0086, "step": 355770 }, { "epoch": 1.79, "learning_rate": 3.075661794754075e-05, "loss": 0.0046, "step": 355780 }, { "epoch": 1.79, "learning_rate": 3.0749050254526736e-05, "loss": 0.0052, "step": 355790 }, { "epoch": 1.8, "learning_rate": 3.0741482561512724e-05, "loss": 0.0052, "step": 355800 }, { "epoch": 1.8, "learning_rate": 3.073391486849872e-05, "loss": 0.0052, "step": 355810 }, { "epoch": 1.8, "learning_rate": 3.072634717548471e-05, "loss": 0.0061, "step": 355820 }, { "epoch": 1.8, "learning_rate": 3.0718779482470696e-05, "loss": 0.0046, "step": 355830 }, { "epoch": 1.8, "learning_rate": 3.0711211789456684e-05, "loss": 0.0049, "step": 355840 }, { "epoch": 1.8, "learning_rate": 3.070364409644268e-05, "loss": 0.0061, "step": 355850 }, { "epoch": 1.8, "learning_rate": 3.069607640342867e-05, "loss": 0.0077, "step": 355860 }, { "epoch": 1.8, "learning_rate": 3.0688508710414655e-05, "loss": 0.0044, "step": 355870 }, { "epoch": 1.8, "learning_rate": 3.0680941017400644e-05, "loss": 0.0064, "step": 355880 }, { "epoch": 1.8, "learning_rate": 3.067337332438664e-05, "loss": 0.0053, "step": 355890 }, { "epoch": 1.8, "learning_rate": 3.066580563137263e-05, "loss": 0.0044, "step": 355900 }, { "epoch": 1.8, "learning_rate": 3.0658237938358615e-05, "loss": 0.0062, "step": 355910 }, { "epoch": 1.8, "learning_rate": 3.06506702453446e-05, "loss": 0.0064, "step": 355920 }, { "epoch": 1.8, "learning_rate": 3.06431025523306e-05, "loss": 0.0071, "step": 355930 }, { "epoch": 1.8, "learning_rate": 3.063553485931658e-05, "loss": 0.0051, "step": 355940 }, { "epoch": 1.8, "learning_rate": 3.0627967166302575e-05, "loss": 0.0045, "step": 355950 }, { "epoch": 1.8, "learning_rate": 3.062039947328856e-05, "loss": 0.0048, "step": 355960 }, { "epoch": 1.8, "learning_rate": 3.061283178027455e-05, "loss": 0.0049, "step": 355970 }, { "epoch": 1.8, "learning_rate": 3.060526408726054e-05, "loss": 0.0086, "step": 355980 }, { "epoch": 1.8, "learning_rate": 3.0597696394246534e-05, "loss": 0.0049, "step": 355990 }, { "epoch": 1.8, "learning_rate": 3.059012870123252e-05, "loss": 0.005, "step": 356000 }, { "epoch": 1.8, "eval_cer": 0.9144130025317635, "eval_loss": 0.0044956691563129425, "eval_runtime": 116.7755, "eval_samples_per_second": 17.127, "eval_steps_per_second": 4.282, "step": 356000 }, { "epoch": 1.8, "learning_rate": 3.058256100821851e-05, "loss": 0.0047, "step": 356010 }, { "epoch": 1.8, "learning_rate": 3.05749933152045e-05, "loss": 0.0055, "step": 356020 }, { "epoch": 1.8, "learning_rate": 3.0567425622190494e-05, "loss": 0.0052, "step": 356030 }, { "epoch": 1.8, "learning_rate": 3.055985792917648e-05, "loss": 0.006, "step": 356040 }, { "epoch": 1.8, "learning_rate": 3.055229023616247e-05, "loss": 0.0087, "step": 356050 }, { "epoch": 1.8, "learning_rate": 3.054472254314846e-05, "loss": 0.0071, "step": 356060 }, { "epoch": 1.8, "learning_rate": 3.0537154850134454e-05, "loss": 0.0055, "step": 356070 }, { "epoch": 1.8, "learning_rate": 3.052958715712044e-05, "loss": 0.0057, "step": 356080 }, { "epoch": 1.8, "learning_rate": 3.052201946410643e-05, "loss": 0.0051, "step": 356090 }, { "epoch": 1.8, "learning_rate": 3.051445177109242e-05, "loss": 0.0056, "step": 356100 }, { "epoch": 1.8, "learning_rate": 3.0506884078078407e-05, "loss": 0.0062, "step": 356110 }, { "epoch": 1.8, "learning_rate": 3.0499316385064398e-05, "loss": 0.0046, "step": 356120 }, { "epoch": 1.8, "learning_rate": 3.0491748692050386e-05, "loss": 0.0079, "step": 356130 }, { "epoch": 1.8, "learning_rate": 3.0484180999036378e-05, "loss": 0.0063, "step": 356140 }, { "epoch": 1.8, "learning_rate": 3.0476613306022366e-05, "loss": 0.0073, "step": 356150 }, { "epoch": 1.8, "learning_rate": 3.0469045613008358e-05, "loss": 0.0049, "step": 356160 }, { "epoch": 1.8, "learning_rate": 3.0461477919994346e-05, "loss": 0.0083, "step": 356170 }, { "epoch": 1.8, "learning_rate": 3.0453910226980338e-05, "loss": 0.0052, "step": 356180 }, { "epoch": 1.8, "learning_rate": 3.0446342533966326e-05, "loss": 0.004, "step": 356190 }, { "epoch": 1.8, "learning_rate": 3.0438774840952318e-05, "loss": 0.0066, "step": 356200 }, { "epoch": 1.8, "learning_rate": 3.0431207147938306e-05, "loss": 0.0066, "step": 356210 }, { "epoch": 1.8, "learning_rate": 3.0423639454924297e-05, "loss": 0.0064, "step": 356220 }, { "epoch": 1.8, "learning_rate": 3.0416071761910286e-05, "loss": 0.0062, "step": 356230 }, { "epoch": 1.8, "learning_rate": 3.0408504068896277e-05, "loss": 0.0067, "step": 356240 }, { "epoch": 1.8, "learning_rate": 3.0400936375882262e-05, "loss": 0.0047, "step": 356250 }, { "epoch": 1.8, "learning_rate": 3.0393368682868254e-05, "loss": 0.0056, "step": 356260 }, { "epoch": 1.8, "learning_rate": 3.0385800989854242e-05, "loss": 0.0048, "step": 356270 }, { "epoch": 1.8, "learning_rate": 3.0378233296840233e-05, "loss": 0.0092, "step": 356280 }, { "epoch": 1.8, "learning_rate": 3.037066560382622e-05, "loss": 0.0062, "step": 356290 }, { "epoch": 1.8, "learning_rate": 3.0363097910812213e-05, "loss": 0.0042, "step": 356300 }, { "epoch": 1.8, "learning_rate": 3.03555302177982e-05, "loss": 0.0073, "step": 356310 }, { "epoch": 1.8, "learning_rate": 3.0347962524784193e-05, "loss": 0.0077, "step": 356320 }, { "epoch": 1.8, "learning_rate": 3.034039483177018e-05, "loss": 0.0072, "step": 356330 }, { "epoch": 1.8, "learning_rate": 3.0332827138756173e-05, "loss": 0.006, "step": 356340 }, { "epoch": 1.8, "learning_rate": 3.032525944574216e-05, "loss": 0.0058, "step": 356350 }, { "epoch": 1.8, "learning_rate": 3.0317691752728153e-05, "loss": 0.0056, "step": 356360 }, { "epoch": 1.8, "learning_rate": 3.031012405971414e-05, "loss": 0.0055, "step": 356370 }, { "epoch": 1.8, "learning_rate": 3.0302556366700133e-05, "loss": 0.0091, "step": 356380 }, { "epoch": 1.8, "learning_rate": 3.029498867368612e-05, "loss": 0.0079, "step": 356390 }, { "epoch": 1.8, "learning_rate": 3.0287420980672112e-05, "loss": 0.0073, "step": 356400 }, { "epoch": 1.8, "learning_rate": 3.0279853287658097e-05, "loss": 0.005, "step": 356410 }, { "epoch": 1.8, "learning_rate": 3.0272285594644085e-05, "loss": 0.0058, "step": 356420 }, { "epoch": 1.8, "learning_rate": 3.0264717901630077e-05, "loss": 0.0065, "step": 356430 }, { "epoch": 1.8, "learning_rate": 3.0257150208616065e-05, "loss": 0.0065, "step": 356440 }, { "epoch": 1.8, "learning_rate": 3.0249582515602057e-05, "loss": 0.0057, "step": 356450 }, { "epoch": 1.8, "learning_rate": 3.024201482258805e-05, "loss": 0.0058, "step": 356460 }, { "epoch": 1.8, "learning_rate": 3.0234447129574037e-05, "loss": 0.0057, "step": 356470 }, { "epoch": 1.8, "learning_rate": 3.0226879436560028e-05, "loss": 0.0058, "step": 356480 }, { "epoch": 1.8, "learning_rate": 3.0219311743546017e-05, "loss": 0.0075, "step": 356490 }, { "epoch": 1.8, "learning_rate": 3.0211744050532008e-05, "loss": 0.004, "step": 356500 }, { "epoch": 1.8, "learning_rate": 3.0204176357517996e-05, "loss": 0.0067, "step": 356510 }, { "epoch": 1.8, "learning_rate": 3.0196608664503988e-05, "loss": 0.0055, "step": 356520 }, { "epoch": 1.8, "learning_rate": 3.0189040971489976e-05, "loss": 0.0104, "step": 356530 }, { "epoch": 1.8, "learning_rate": 3.0181473278475968e-05, "loss": 0.0058, "step": 356540 }, { "epoch": 1.8, "learning_rate": 3.0173905585461956e-05, "loss": 0.0038, "step": 356550 }, { "epoch": 1.8, "learning_rate": 3.0166337892447948e-05, "loss": 0.0057, "step": 356560 }, { "epoch": 1.8, "learning_rate": 3.0158770199433932e-05, "loss": 0.0031, "step": 356570 }, { "epoch": 1.8, "learning_rate": 3.015120250641992e-05, "loss": 0.0049, "step": 356580 }, { "epoch": 1.8, "learning_rate": 3.0143634813405912e-05, "loss": 0.0059, "step": 356590 }, { "epoch": 1.8, "learning_rate": 3.01360671203919e-05, "loss": 0.0049, "step": 356600 }, { "epoch": 1.8, "learning_rate": 3.0128499427377892e-05, "loss": 0.0063, "step": 356610 }, { "epoch": 1.8, "learning_rate": 3.012093173436388e-05, "loss": 0.0051, "step": 356620 }, { "epoch": 1.8, "learning_rate": 3.0113364041349872e-05, "loss": 0.006, "step": 356630 }, { "epoch": 1.8, "learning_rate": 3.010579634833586e-05, "loss": 0.0051, "step": 356640 }, { "epoch": 1.8, "learning_rate": 3.0098228655321852e-05, "loss": 0.0052, "step": 356650 }, { "epoch": 1.8, "learning_rate": 3.009066096230784e-05, "loss": 0.0044, "step": 356660 }, { "epoch": 1.8, "learning_rate": 3.008309326929383e-05, "loss": 0.0072, "step": 356670 }, { "epoch": 1.8, "learning_rate": 3.007552557627982e-05, "loss": 0.0056, "step": 356680 }, { "epoch": 1.8, "learning_rate": 3.006795788326581e-05, "loss": 0.0071, "step": 356690 }, { "epoch": 1.8, "learning_rate": 3.00603901902518e-05, "loss": 0.0054, "step": 356700 }, { "epoch": 1.8, "learning_rate": 3.005282249723779e-05, "loss": 0.0047, "step": 356710 }, { "epoch": 1.8, "learning_rate": 3.0045254804223783e-05, "loss": 0.0075, "step": 356720 }, { "epoch": 1.8, "learning_rate": 3.0037687111209768e-05, "loss": 0.0047, "step": 356730 }, { "epoch": 1.8, "learning_rate": 3.0030119418195756e-05, "loss": 0.0061, "step": 356740 }, { "epoch": 1.8, "learning_rate": 3.0022551725181747e-05, "loss": 0.0066, "step": 356750 }, { "epoch": 1.8, "learning_rate": 3.0014984032167736e-05, "loss": 0.0065, "step": 356760 }, { "epoch": 1.8, "learning_rate": 3.0007416339153727e-05, "loss": 0.0051, "step": 356770 }, { "epoch": 1.8, "learning_rate": 2.9999848646139716e-05, "loss": 0.0065, "step": 356780 }, { "epoch": 1.8, "learning_rate": 2.9992280953125707e-05, "loss": 0.0065, "step": 356790 }, { "epoch": 1.8, "learning_rate": 2.9984713260111695e-05, "loss": 0.005, "step": 356800 }, { "epoch": 1.8, "learning_rate": 2.9977145567097687e-05, "loss": 0.0071, "step": 356810 }, { "epoch": 1.8, "learning_rate": 2.9969577874083675e-05, "loss": 0.0053, "step": 356820 }, { "epoch": 1.8, "learning_rate": 2.9962010181069667e-05, "loss": 0.0059, "step": 356830 }, { "epoch": 1.8, "learning_rate": 2.9954442488055655e-05, "loss": 0.0051, "step": 356840 }, { "epoch": 1.8, "learning_rate": 2.9946874795041647e-05, "loss": 0.0067, "step": 356850 }, { "epoch": 1.8, "learning_rate": 2.9939307102027635e-05, "loss": 0.0061, "step": 356860 }, { "epoch": 1.8, "learning_rate": 2.9931739409013626e-05, "loss": 0.0066, "step": 356870 }, { "epoch": 1.8, "learning_rate": 2.992417171599961e-05, "loss": 0.0053, "step": 356880 }, { "epoch": 1.8, "learning_rate": 2.9916604022985603e-05, "loss": 0.0063, "step": 356890 }, { "epoch": 1.8, "learning_rate": 2.990903632997159e-05, "loss": 0.0073, "step": 356900 }, { "epoch": 1.8, "learning_rate": 2.9901468636957583e-05, "loss": 0.008, "step": 356910 }, { "epoch": 1.8, "learning_rate": 2.989390094394357e-05, "loss": 0.0055, "step": 356920 }, { "epoch": 1.8, "learning_rate": 2.9886333250929563e-05, "loss": 0.0048, "step": 356930 }, { "epoch": 1.8, "learning_rate": 2.987876555791555e-05, "loss": 0.0065, "step": 356940 }, { "epoch": 1.8, "learning_rate": 2.9871197864901542e-05, "loss": 0.0063, "step": 356950 }, { "epoch": 1.8, "learning_rate": 2.986363017188753e-05, "loss": 0.0072, "step": 356960 }, { "epoch": 1.8, "learning_rate": 2.9856062478873522e-05, "loss": 0.0048, "step": 356970 }, { "epoch": 1.8, "learning_rate": 2.984849478585951e-05, "loss": 0.0053, "step": 356980 }, { "epoch": 1.8, "learning_rate": 2.9840927092845502e-05, "loss": 0.0047, "step": 356990 }, { "epoch": 1.8, "learning_rate": 2.983335939983149e-05, "loss": 0.0061, "step": 357000 }, { "epoch": 1.8, "eval_cer": 0.9144139729278888, "eval_loss": 0.004504029173403978, "eval_runtime": 116.8007, "eval_samples_per_second": 17.123, "eval_steps_per_second": 4.281, "step": 357000 }, { "epoch": 1.8, "learning_rate": 2.9825791706817482e-05, "loss": 0.0057, "step": 357010 }, { "epoch": 1.8, "learning_rate": 2.981822401380347e-05, "loss": 0.0074, "step": 357020 }, { "epoch": 1.8, "learning_rate": 2.981065632078946e-05, "loss": 0.0063, "step": 357030 }, { "epoch": 1.8, "learning_rate": 2.9803088627775446e-05, "loss": 0.0048, "step": 357040 }, { "epoch": 1.8, "learning_rate": 2.9795520934761438e-05, "loss": 0.0068, "step": 357050 }, { "epoch": 1.8, "learning_rate": 2.9787953241747426e-05, "loss": 0.0072, "step": 357060 }, { "epoch": 1.8, "learning_rate": 2.9780385548733418e-05, "loss": 0.006, "step": 357070 }, { "epoch": 1.8, "learning_rate": 2.9772817855719406e-05, "loss": 0.0052, "step": 357080 }, { "epoch": 1.8, "learning_rate": 2.9765250162705398e-05, "loss": 0.0061, "step": 357090 }, { "epoch": 1.8, "learning_rate": 2.9757682469691386e-05, "loss": 0.0069, "step": 357100 }, { "epoch": 1.8, "learning_rate": 2.9750114776677378e-05, "loss": 0.0077, "step": 357110 }, { "epoch": 1.8, "learning_rate": 2.9742547083663366e-05, "loss": 0.0031, "step": 357120 }, { "epoch": 1.8, "learning_rate": 2.9734979390649357e-05, "loss": 0.0046, "step": 357130 }, { "epoch": 1.8, "learning_rate": 2.9727411697635346e-05, "loss": 0.0067, "step": 357140 }, { "epoch": 1.8, "learning_rate": 2.9719844004621337e-05, "loss": 0.0053, "step": 357150 }, { "epoch": 1.8, "learning_rate": 2.9712276311607325e-05, "loss": 0.0041, "step": 357160 }, { "epoch": 1.8, "learning_rate": 2.9704708618593317e-05, "loss": 0.0084, "step": 357170 }, { "epoch": 1.8, "learning_rate": 2.9697140925579305e-05, "loss": 0.005, "step": 357180 }, { "epoch": 1.8, "learning_rate": 2.9689573232565297e-05, "loss": 0.0074, "step": 357190 }, { "epoch": 1.8, "learning_rate": 2.968200553955128e-05, "loss": 0.011, "step": 357200 }, { "epoch": 1.8, "learning_rate": 2.9674437846537273e-05, "loss": 0.0068, "step": 357210 }, { "epoch": 1.8, "learning_rate": 2.966687015352326e-05, "loss": 0.0044, "step": 357220 }, { "epoch": 1.8, "learning_rate": 2.9659302460509253e-05, "loss": 0.0077, "step": 357230 }, { "epoch": 1.8, "learning_rate": 2.965173476749524e-05, "loss": 0.0072, "step": 357240 }, { "epoch": 1.8, "learning_rate": 2.9644167074481233e-05, "loss": 0.0061, "step": 357250 }, { "epoch": 1.8, "learning_rate": 2.963659938146722e-05, "loss": 0.0044, "step": 357260 }, { "epoch": 1.8, "learning_rate": 2.9629031688453213e-05, "loss": 0.0044, "step": 357270 }, { "epoch": 1.8, "learning_rate": 2.96214639954392e-05, "loss": 0.008, "step": 357280 }, { "epoch": 1.8, "learning_rate": 2.9613896302425193e-05, "loss": 0.0048, "step": 357290 }, { "epoch": 1.8, "learning_rate": 2.960632860941118e-05, "loss": 0.0053, "step": 357300 }, { "epoch": 1.8, "learning_rate": 2.9598760916397172e-05, "loss": 0.0058, "step": 357310 }, { "epoch": 1.8, "learning_rate": 2.959119322338316e-05, "loss": 0.0065, "step": 357320 }, { "epoch": 1.8, "learning_rate": 2.9583625530369152e-05, "loss": 0.0045, "step": 357330 }, { "epoch": 1.8, "learning_rate": 2.957605783735514e-05, "loss": 0.0059, "step": 357340 }, { "epoch": 1.8, "learning_rate": 2.9568490144341125e-05, "loss": 0.0061, "step": 357350 }, { "epoch": 1.8, "learning_rate": 2.9560922451327117e-05, "loss": 0.0051, "step": 357360 }, { "epoch": 1.8, "learning_rate": 2.9553354758313105e-05, "loss": 0.0058, "step": 357370 }, { "epoch": 1.8, "learning_rate": 2.9545787065299097e-05, "loss": 0.0067, "step": 357380 }, { "epoch": 1.8, "learning_rate": 2.9538219372285085e-05, "loss": 0.0051, "step": 357390 }, { "epoch": 1.8, "learning_rate": 2.9530651679271077e-05, "loss": 0.0057, "step": 357400 }, { "epoch": 1.8, "learning_rate": 2.9523083986257065e-05, "loss": 0.0065, "step": 357410 }, { "epoch": 1.8, "learning_rate": 2.9515516293243056e-05, "loss": 0.0054, "step": 357420 }, { "epoch": 1.8, "learning_rate": 2.9507948600229048e-05, "loss": 0.0049, "step": 357430 }, { "epoch": 1.8, "learning_rate": 2.9500380907215036e-05, "loss": 0.0047, "step": 357440 }, { "epoch": 1.8, "learning_rate": 2.9492813214201028e-05, "loss": 0.0056, "step": 357450 }, { "epoch": 1.8, "learning_rate": 2.9485245521187016e-05, "loss": 0.0084, "step": 357460 }, { "epoch": 1.8, "learning_rate": 2.9477677828173008e-05, "loss": 0.0066, "step": 357470 }, { "epoch": 1.8, "learning_rate": 2.9470110135158996e-05, "loss": 0.007, "step": 357480 }, { "epoch": 1.8, "learning_rate": 2.9462542442144987e-05, "loss": 0.0054, "step": 357490 }, { "epoch": 1.8, "learning_rate": 2.9454974749130976e-05, "loss": 0.0049, "step": 357500 }, { "epoch": 1.8, "learning_rate": 2.944740705611696e-05, "loss": 0.0056, "step": 357510 }, { "epoch": 1.8, "learning_rate": 2.9439839363102952e-05, "loss": 0.006, "step": 357520 }, { "epoch": 1.8, "learning_rate": 2.943227167008894e-05, "loss": 0.0063, "step": 357530 }, { "epoch": 1.8, "learning_rate": 2.9424703977074932e-05, "loss": 0.0048, "step": 357540 }, { "epoch": 1.8, "learning_rate": 2.941713628406092e-05, "loss": 0.0061, "step": 357550 }, { "epoch": 1.8, "learning_rate": 2.9409568591046912e-05, "loss": 0.006, "step": 357560 }, { "epoch": 1.8, "learning_rate": 2.94020008980329e-05, "loss": 0.0059, "step": 357570 }, { "epoch": 1.8, "learning_rate": 2.939443320501889e-05, "loss": 0.0077, "step": 357580 }, { "epoch": 1.8, "learning_rate": 2.938686551200488e-05, "loss": 0.0057, "step": 357590 }, { "epoch": 1.8, "learning_rate": 2.937929781899087e-05, "loss": 0.0061, "step": 357600 }, { "epoch": 1.8, "learning_rate": 2.937173012597686e-05, "loss": 0.0055, "step": 357610 }, { "epoch": 1.8, "learning_rate": 2.936416243296285e-05, "loss": 0.0061, "step": 357620 }, { "epoch": 1.8, "learning_rate": 2.935659473994884e-05, "loss": 0.0054, "step": 357630 }, { "epoch": 1.8, "learning_rate": 2.934902704693483e-05, "loss": 0.0048, "step": 357640 }, { "epoch": 1.8, "learning_rate": 2.934145935392082e-05, "loss": 0.0059, "step": 357650 }, { "epoch": 1.8, "learning_rate": 2.933389166090681e-05, "loss": 0.0051, "step": 357660 }, { "epoch": 1.8, "learning_rate": 2.9326323967892796e-05, "loss": 0.0069, "step": 357670 }, { "epoch": 1.8, "learning_rate": 2.9318756274878787e-05, "loss": 0.0069, "step": 357680 }, { "epoch": 1.8, "learning_rate": 2.9311188581864776e-05, "loss": 0.0061, "step": 357690 }, { "epoch": 1.8, "learning_rate": 2.9303620888850767e-05, "loss": 0.0049, "step": 357700 }, { "epoch": 1.8, "learning_rate": 2.9296053195836755e-05, "loss": 0.007, "step": 357710 }, { "epoch": 1.8, "learning_rate": 2.9288485502822747e-05, "loss": 0.0053, "step": 357720 }, { "epoch": 1.8, "learning_rate": 2.9280917809808735e-05, "loss": 0.0079, "step": 357730 }, { "epoch": 1.8, "learning_rate": 2.9273350116794727e-05, "loss": 0.0074, "step": 357740 }, { "epoch": 1.8, "learning_rate": 2.9265782423780715e-05, "loss": 0.0097, "step": 357750 }, { "epoch": 1.8, "learning_rate": 2.9258214730766707e-05, "loss": 0.0051, "step": 357760 }, { "epoch": 1.8, "learning_rate": 2.9250647037752695e-05, "loss": 0.0054, "step": 357770 }, { "epoch": 1.81, "learning_rate": 2.9243079344738686e-05, "loss": 0.0065, "step": 357780 }, { "epoch": 1.81, "learning_rate": 2.9235511651724675e-05, "loss": 0.0065, "step": 357790 }, { "epoch": 1.81, "learning_rate": 2.9227943958710666e-05, "loss": 0.0074, "step": 357800 }, { "epoch": 1.81, "learning_rate": 2.9220376265696655e-05, "loss": 0.0054, "step": 357810 }, { "epoch": 1.81, "learning_rate": 2.9212808572682643e-05, "loss": 0.0062, "step": 357820 }, { "epoch": 1.81, "learning_rate": 2.920524087966863e-05, "loss": 0.0064, "step": 357830 }, { "epoch": 1.81, "learning_rate": 2.9197673186654623e-05, "loss": 0.0068, "step": 357840 }, { "epoch": 1.81, "learning_rate": 2.919010549364061e-05, "loss": 0.0054, "step": 357850 }, { "epoch": 1.81, "learning_rate": 2.9182537800626602e-05, "loss": 0.0061, "step": 357860 }, { "epoch": 1.81, "learning_rate": 2.917497010761259e-05, "loss": 0.0075, "step": 357870 }, { "epoch": 1.81, "learning_rate": 2.9167402414598582e-05, "loss": 0.0053, "step": 357880 }, { "epoch": 1.81, "learning_rate": 2.915983472158457e-05, "loss": 0.0065, "step": 357890 }, { "epoch": 1.81, "learning_rate": 2.9152267028570562e-05, "loss": 0.0058, "step": 357900 }, { "epoch": 1.81, "learning_rate": 2.914469933555655e-05, "loss": 0.0052, "step": 357910 }, { "epoch": 1.81, "learning_rate": 2.9137131642542542e-05, "loss": 0.0056, "step": 357920 }, { "epoch": 1.81, "learning_rate": 2.912956394952853e-05, "loss": 0.0074, "step": 357930 }, { "epoch": 1.81, "learning_rate": 2.912199625651452e-05, "loss": 0.0075, "step": 357940 }, { "epoch": 1.81, "learning_rate": 2.911442856350051e-05, "loss": 0.0053, "step": 357950 }, { "epoch": 1.81, "learning_rate": 2.91068608704865e-05, "loss": 0.0077, "step": 357960 }, { "epoch": 1.81, "learning_rate": 2.909929317747249e-05, "loss": 0.0072, "step": 357970 }, { "epoch": 1.81, "learning_rate": 2.9091725484458478e-05, "loss": 0.0036, "step": 357980 }, { "epoch": 1.81, "learning_rate": 2.9084157791444466e-05, "loss": 0.0061, "step": 357990 }, { "epoch": 1.81, "learning_rate": 2.9076590098430458e-05, "loss": 0.0079, "step": 358000 }, { "epoch": 1.81, "eval_cer": 0.9144353216426477, "eval_loss": 0.004471032880246639, "eval_runtime": 116.5217, "eval_samples_per_second": 17.164, "eval_steps_per_second": 4.291, "step": 358000 }, { "epoch": 1.81, "learning_rate": 2.9069022405416446e-05, "loss": 0.0062, "step": 358010 }, { "epoch": 1.81, "learning_rate": 2.9061454712402438e-05, "loss": 0.007, "step": 358020 }, { "epoch": 1.81, "learning_rate": 2.9053887019388426e-05, "loss": 0.0066, "step": 358030 }, { "epoch": 1.81, "learning_rate": 2.9046319326374417e-05, "loss": 0.0092, "step": 358040 }, { "epoch": 1.81, "learning_rate": 2.9038751633360406e-05, "loss": 0.0076, "step": 358050 }, { "epoch": 1.81, "learning_rate": 2.9031183940346397e-05, "loss": 0.0057, "step": 358060 }, { "epoch": 1.81, "learning_rate": 2.9023616247332385e-05, "loss": 0.0057, "step": 358070 }, { "epoch": 1.81, "learning_rate": 2.9016048554318377e-05, "loss": 0.005, "step": 358080 }, { "epoch": 1.81, "learning_rate": 2.9008480861304365e-05, "loss": 0.0064, "step": 358090 }, { "epoch": 1.81, "learning_rate": 2.9000913168290357e-05, "loss": 0.0067, "step": 358100 }, { "epoch": 1.81, "learning_rate": 2.8993345475276345e-05, "loss": 0.0092, "step": 358110 }, { "epoch": 1.81, "learning_rate": 2.8985777782262337e-05, "loss": 0.006, "step": 358120 }, { "epoch": 1.81, "learning_rate": 2.8978210089248325e-05, "loss": 0.0065, "step": 358130 }, { "epoch": 1.81, "learning_rate": 2.8970642396234313e-05, "loss": 0.0053, "step": 358140 }, { "epoch": 1.81, "learning_rate": 2.89630747032203e-05, "loss": 0.0052, "step": 358150 }, { "epoch": 1.81, "learning_rate": 2.8955507010206293e-05, "loss": 0.0041, "step": 358160 }, { "epoch": 1.81, "learning_rate": 2.894793931719228e-05, "loss": 0.005, "step": 358170 }, { "epoch": 1.81, "learning_rate": 2.8940371624178273e-05, "loss": 0.0078, "step": 358180 }, { "epoch": 1.81, "learning_rate": 2.893280393116426e-05, "loss": 0.0055, "step": 358190 }, { "epoch": 1.81, "learning_rate": 2.8925236238150253e-05, "loss": 0.0056, "step": 358200 }, { "epoch": 1.81, "learning_rate": 2.891766854513624e-05, "loss": 0.0062, "step": 358210 }, { "epoch": 1.81, "learning_rate": 2.8910100852122232e-05, "loss": 0.0051, "step": 358220 }, { "epoch": 1.81, "learning_rate": 2.890253315910822e-05, "loss": 0.0067, "step": 358230 }, { "epoch": 1.81, "learning_rate": 2.8894965466094212e-05, "loss": 0.0067, "step": 358240 }, { "epoch": 1.81, "learning_rate": 2.88873977730802e-05, "loss": 0.0075, "step": 358250 }, { "epoch": 1.81, "learning_rate": 2.8879830080066192e-05, "loss": 0.0066, "step": 358260 }, { "epoch": 1.81, "learning_rate": 2.887226238705218e-05, "loss": 0.0061, "step": 358270 }, { "epoch": 1.81, "learning_rate": 2.8864694694038172e-05, "loss": 0.0055, "step": 358280 }, { "epoch": 1.81, "learning_rate": 2.885712700102416e-05, "loss": 0.0077, "step": 358290 }, { "epoch": 1.81, "learning_rate": 2.8849559308010145e-05, "loss": 0.0058, "step": 358300 }, { "epoch": 1.81, "learning_rate": 2.8841991614996137e-05, "loss": 0.0062, "step": 358310 }, { "epoch": 1.81, "learning_rate": 2.8834423921982125e-05, "loss": 0.0038, "step": 358320 }, { "epoch": 1.81, "learning_rate": 2.8826856228968116e-05, "loss": 0.0077, "step": 358330 }, { "epoch": 1.81, "learning_rate": 2.8819288535954105e-05, "loss": 0.0065, "step": 358340 }, { "epoch": 1.81, "learning_rate": 2.8811720842940096e-05, "loss": 0.0053, "step": 358350 }, { "epoch": 1.81, "learning_rate": 2.8804153149926084e-05, "loss": 0.0059, "step": 358360 }, { "epoch": 1.81, "learning_rate": 2.8796585456912076e-05, "loss": 0.0056, "step": 358370 }, { "epoch": 1.81, "learning_rate": 2.8789017763898064e-05, "loss": 0.0081, "step": 358380 }, { "epoch": 1.81, "learning_rate": 2.8781450070884056e-05, "loss": 0.0075, "step": 358390 }, { "epoch": 1.81, "learning_rate": 2.8773882377870048e-05, "loss": 0.0079, "step": 358400 }, { "epoch": 1.81, "learning_rate": 2.8766314684856036e-05, "loss": 0.0058, "step": 358410 }, { "epoch": 1.81, "learning_rate": 2.8758746991842027e-05, "loss": 0.0059, "step": 358420 }, { "epoch": 1.81, "learning_rate": 2.8751179298828016e-05, "loss": 0.0052, "step": 358430 }, { "epoch": 1.81, "learning_rate": 2.8743611605814007e-05, "loss": 0.0047, "step": 358440 }, { "epoch": 1.81, "learning_rate": 2.8736043912799992e-05, "loss": 0.0057, "step": 358450 }, { "epoch": 1.81, "learning_rate": 2.872847621978598e-05, "loss": 0.0066, "step": 358460 }, { "epoch": 1.81, "learning_rate": 2.8720908526771972e-05, "loss": 0.0065, "step": 358470 }, { "epoch": 1.81, "learning_rate": 2.871334083375796e-05, "loss": 0.0056, "step": 358480 }, { "epoch": 1.81, "learning_rate": 2.870577314074395e-05, "loss": 0.0066, "step": 358490 }, { "epoch": 1.81, "learning_rate": 2.869820544772994e-05, "loss": 0.0057, "step": 358500 }, { "epoch": 1.81, "learning_rate": 2.869063775471593e-05, "loss": 0.006, "step": 358510 }, { "epoch": 1.81, "learning_rate": 2.868307006170192e-05, "loss": 0.0064, "step": 358520 }, { "epoch": 1.81, "learning_rate": 2.867550236868791e-05, "loss": 0.0069, "step": 358530 }, { "epoch": 1.81, "learning_rate": 2.86679346756739e-05, "loss": 0.0065, "step": 358540 }, { "epoch": 1.81, "learning_rate": 2.866036698265989e-05, "loss": 0.0046, "step": 358550 }, { "epoch": 1.81, "learning_rate": 2.865279928964588e-05, "loss": 0.0058, "step": 358560 }, { "epoch": 1.81, "learning_rate": 2.864523159663187e-05, "loss": 0.0069, "step": 358570 }, { "epoch": 1.81, "learning_rate": 2.863766390361786e-05, "loss": 0.0066, "step": 358580 }, { "epoch": 1.81, "learning_rate": 2.863009621060385e-05, "loss": 0.0065, "step": 358590 }, { "epoch": 1.81, "learning_rate": 2.862252851758984e-05, "loss": 0.0074, "step": 358600 }, { "epoch": 1.81, "learning_rate": 2.8614960824575827e-05, "loss": 0.0041, "step": 358610 }, { "epoch": 1.81, "learning_rate": 2.8607393131561815e-05, "loss": 0.0051, "step": 358620 }, { "epoch": 1.81, "learning_rate": 2.8599825438547807e-05, "loss": 0.0069, "step": 358630 }, { "epoch": 1.81, "learning_rate": 2.8592257745533795e-05, "loss": 0.0049, "step": 358640 }, { "epoch": 1.81, "learning_rate": 2.8584690052519787e-05, "loss": 0.0074, "step": 358650 }, { "epoch": 1.81, "learning_rate": 2.8577122359505775e-05, "loss": 0.0068, "step": 358660 }, { "epoch": 1.81, "learning_rate": 2.8569554666491767e-05, "loss": 0.0071, "step": 358670 }, { "epoch": 1.81, "learning_rate": 2.8561986973477755e-05, "loss": 0.0072, "step": 358680 }, { "epoch": 1.81, "learning_rate": 2.8554419280463747e-05, "loss": 0.0061, "step": 358690 }, { "epoch": 1.81, "learning_rate": 2.8546851587449735e-05, "loss": 0.006, "step": 358700 }, { "epoch": 1.81, "learning_rate": 2.8539283894435726e-05, "loss": 0.0052, "step": 358710 }, { "epoch": 1.81, "learning_rate": 2.8531716201421715e-05, "loss": 0.0063, "step": 358720 }, { "epoch": 1.81, "learning_rate": 2.8524148508407706e-05, "loss": 0.0047, "step": 358730 }, { "epoch": 1.81, "learning_rate": 2.8516580815393694e-05, "loss": 0.0073, "step": 358740 }, { "epoch": 1.81, "learning_rate": 2.8509013122379686e-05, "loss": 0.0047, "step": 358750 }, { "epoch": 1.81, "learning_rate": 2.8501445429365674e-05, "loss": 0.0063, "step": 358760 }, { "epoch": 1.81, "learning_rate": 2.8493877736351662e-05, "loss": 0.0066, "step": 358770 }, { "epoch": 1.81, "learning_rate": 2.848631004333765e-05, "loss": 0.0092, "step": 358780 }, { "epoch": 1.81, "learning_rate": 2.8478742350323642e-05, "loss": 0.0044, "step": 358790 }, { "epoch": 1.81, "learning_rate": 2.847117465730963e-05, "loss": 0.0055, "step": 358800 }, { "epoch": 1.81, "learning_rate": 2.8463606964295622e-05, "loss": 0.0067, "step": 358810 }, { "epoch": 1.81, "learning_rate": 2.845603927128161e-05, "loss": 0.0046, "step": 358820 }, { "epoch": 1.81, "learning_rate": 2.8448471578267602e-05, "loss": 0.0059, "step": 358830 }, { "epoch": 1.81, "learning_rate": 2.844090388525359e-05, "loss": 0.0054, "step": 358840 }, { "epoch": 1.81, "learning_rate": 2.8433336192239582e-05, "loss": 0.0067, "step": 358850 }, { "epoch": 1.81, "learning_rate": 2.842576849922557e-05, "loss": 0.0062, "step": 358860 }, { "epoch": 1.81, "learning_rate": 2.841820080621156e-05, "loss": 0.008, "step": 358870 }, { "epoch": 1.81, "learning_rate": 2.841063311319755e-05, "loss": 0.0059, "step": 358880 }, { "epoch": 1.81, "learning_rate": 2.840306542018354e-05, "loss": 0.0058, "step": 358890 }, { "epoch": 1.81, "learning_rate": 2.839549772716953e-05, "loss": 0.0058, "step": 358900 }, { "epoch": 1.81, "learning_rate": 2.838793003415552e-05, "loss": 0.0068, "step": 358910 }, { "epoch": 1.81, "learning_rate": 2.8380362341141506e-05, "loss": 0.0058, "step": 358920 }, { "epoch": 1.81, "learning_rate": 2.8372794648127498e-05, "loss": 0.0049, "step": 358930 }, { "epoch": 1.81, "learning_rate": 2.8365226955113486e-05, "loss": 0.0073, "step": 358940 }, { "epoch": 1.81, "learning_rate": 2.8357659262099477e-05, "loss": 0.0047, "step": 358950 }, { "epoch": 1.81, "learning_rate": 2.8350091569085466e-05, "loss": 0.0046, "step": 358960 }, { "epoch": 1.81, "learning_rate": 2.8342523876071457e-05, "loss": 0.004, "step": 358970 }, { "epoch": 1.81, "learning_rate": 2.8334956183057446e-05, "loss": 0.0052, "step": 358980 }, { "epoch": 1.81, "learning_rate": 2.8327388490043437e-05, "loss": 0.0059, "step": 358990 }, { "epoch": 1.81, "learning_rate": 2.8319820797029425e-05, "loss": 0.0065, "step": 359000 }, { "epoch": 1.81, "eval_cer": 0.9144217360968921, "eval_loss": 0.004385951440781355, "eval_runtime": 116.7254, "eval_samples_per_second": 17.134, "eval_steps_per_second": 4.284, "step": 359000 }, { "epoch": 1.81, "learning_rate": 2.8312253104015417e-05, "loss": 0.0066, "step": 359010 }, { "epoch": 1.81, "learning_rate": 2.8304685411001405e-05, "loss": 0.0076, "step": 359020 }, { "epoch": 1.81, "learning_rate": 2.8297117717987397e-05, "loss": 0.0056, "step": 359030 }, { "epoch": 1.81, "learning_rate": 2.8289550024973385e-05, "loss": 0.0047, "step": 359040 }, { "epoch": 1.81, "learning_rate": 2.8281982331959377e-05, "loss": 0.0052, "step": 359050 }, { "epoch": 1.81, "learning_rate": 2.8274414638945365e-05, "loss": 0.0079, "step": 359060 }, { "epoch": 1.81, "learning_rate": 2.8266846945931356e-05, "loss": 0.0053, "step": 359070 }, { "epoch": 1.81, "learning_rate": 2.825927925291734e-05, "loss": 0.0071, "step": 359080 }, { "epoch": 1.81, "learning_rate": 2.825171155990333e-05, "loss": 0.0071, "step": 359090 }, { "epoch": 1.81, "learning_rate": 2.824414386688932e-05, "loss": 0.0053, "step": 359100 }, { "epoch": 1.81, "learning_rate": 2.8236576173875313e-05, "loss": 0.0052, "step": 359110 }, { "epoch": 1.81, "learning_rate": 2.82290084808613e-05, "loss": 0.0076, "step": 359120 }, { "epoch": 1.81, "learning_rate": 2.8221440787847293e-05, "loss": 0.0054, "step": 359130 }, { "epoch": 1.81, "learning_rate": 2.821387309483328e-05, "loss": 0.0067, "step": 359140 }, { "epoch": 1.81, "learning_rate": 2.8206305401819272e-05, "loss": 0.0045, "step": 359150 }, { "epoch": 1.81, "learning_rate": 2.819873770880526e-05, "loss": 0.0044, "step": 359160 }, { "epoch": 1.81, "learning_rate": 2.8191170015791252e-05, "loss": 0.004, "step": 359170 }, { "epoch": 1.81, "learning_rate": 2.818360232277724e-05, "loss": 0.0063, "step": 359180 }, { "epoch": 1.81, "learning_rate": 2.8176034629763232e-05, "loss": 0.0052, "step": 359190 }, { "epoch": 1.81, "learning_rate": 2.816846693674922e-05, "loss": 0.005, "step": 359200 }, { "epoch": 1.81, "learning_rate": 2.8160899243735212e-05, "loss": 0.007, "step": 359210 }, { "epoch": 1.81, "learning_rate": 2.81533315507212e-05, "loss": 0.0076, "step": 359220 }, { "epoch": 1.81, "learning_rate": 2.814576385770719e-05, "loss": 0.0062, "step": 359230 }, { "epoch": 1.81, "learning_rate": 2.8138196164693176e-05, "loss": 0.0054, "step": 359240 }, { "epoch": 1.81, "learning_rate": 2.8130628471679165e-05, "loss": 0.0068, "step": 359250 }, { "epoch": 1.81, "learning_rate": 2.8123060778665156e-05, "loss": 0.0081, "step": 359260 }, { "epoch": 1.81, "learning_rate": 2.8115493085651145e-05, "loss": 0.0052, "step": 359270 }, { "epoch": 1.81, "learning_rate": 2.8107925392637136e-05, "loss": 0.0054, "step": 359280 }, { "epoch": 1.81, "learning_rate": 2.8100357699623124e-05, "loss": 0.0065, "step": 359290 }, { "epoch": 1.81, "learning_rate": 2.8092790006609116e-05, "loss": 0.0041, "step": 359300 }, { "epoch": 1.81, "learning_rate": 2.8085222313595104e-05, "loss": 0.0068, "step": 359310 }, { "epoch": 1.81, "learning_rate": 2.8077654620581096e-05, "loss": 0.0066, "step": 359320 }, { "epoch": 1.81, "learning_rate": 2.8070086927567084e-05, "loss": 0.0066, "step": 359330 }, { "epoch": 1.81, "learning_rate": 2.8062519234553076e-05, "loss": 0.0041, "step": 359340 }, { "epoch": 1.81, "learning_rate": 2.8054951541539064e-05, "loss": 0.006, "step": 359350 }, { "epoch": 1.81, "learning_rate": 2.8047383848525055e-05, "loss": 0.0081, "step": 359360 }, { "epoch": 1.81, "learning_rate": 2.8039816155511047e-05, "loss": 0.0053, "step": 359370 }, { "epoch": 1.81, "learning_rate": 2.8032248462497035e-05, "loss": 0.0066, "step": 359380 }, { "epoch": 1.81, "learning_rate": 2.8024680769483027e-05, "loss": 0.0047, "step": 359390 }, { "epoch": 1.81, "learning_rate": 2.801711307646901e-05, "loss": 0.0052, "step": 359400 }, { "epoch": 1.81, "learning_rate": 2.8009545383455e-05, "loss": 0.0101, "step": 359410 }, { "epoch": 1.81, "learning_rate": 2.800197769044099e-05, "loss": 0.0105, "step": 359420 }, { "epoch": 1.81, "learning_rate": 2.799440999742698e-05, "loss": 0.0047, "step": 359430 }, { "epoch": 1.81, "learning_rate": 2.798684230441297e-05, "loss": 0.0063, "step": 359440 }, { "epoch": 1.81, "learning_rate": 2.797927461139896e-05, "loss": 0.0055, "step": 359450 }, { "epoch": 1.81, "learning_rate": 2.797170691838495e-05, "loss": 0.0061, "step": 359460 }, { "epoch": 1.81, "learning_rate": 2.796413922537094e-05, "loss": 0.0055, "step": 359470 }, { "epoch": 1.81, "learning_rate": 2.795657153235693e-05, "loss": 0.0067, "step": 359480 }, { "epoch": 1.81, "learning_rate": 2.794900383934292e-05, "loss": 0.0061, "step": 359490 }, { "epoch": 1.81, "learning_rate": 2.794143614632891e-05, "loss": 0.0044, "step": 359500 }, { "epoch": 1.81, "learning_rate": 2.79338684533149e-05, "loss": 0.0049, "step": 359510 }, { "epoch": 1.81, "learning_rate": 2.792630076030089e-05, "loss": 0.0061, "step": 359520 }, { "epoch": 1.81, "learning_rate": 2.791873306728688e-05, "loss": 0.0046, "step": 359530 }, { "epoch": 1.81, "learning_rate": 2.791116537427287e-05, "loss": 0.0055, "step": 359540 }, { "epoch": 1.81, "learning_rate": 2.7903597681258855e-05, "loss": 0.0067, "step": 359550 }, { "epoch": 1.81, "learning_rate": 2.7896029988244847e-05, "loss": 0.0064, "step": 359560 }, { "epoch": 1.81, "learning_rate": 2.7888462295230835e-05, "loss": 0.0055, "step": 359570 }, { "epoch": 1.81, "learning_rate": 2.7880894602216827e-05, "loss": 0.0054, "step": 359580 }, { "epoch": 1.81, "learning_rate": 2.7873326909202815e-05, "loss": 0.0102, "step": 359590 }, { "epoch": 1.81, "learning_rate": 2.7865759216188807e-05, "loss": 0.0068, "step": 359600 }, { "epoch": 1.81, "learning_rate": 2.7858191523174795e-05, "loss": 0.0067, "step": 359610 }, { "epoch": 1.81, "learning_rate": 2.7850623830160786e-05, "loss": 0.0047, "step": 359620 }, { "epoch": 1.81, "learning_rate": 2.7843056137146775e-05, "loss": 0.0068, "step": 359630 }, { "epoch": 1.81, "learning_rate": 2.7835488444132766e-05, "loss": 0.0063, "step": 359640 }, { "epoch": 1.81, "learning_rate": 2.7827920751118754e-05, "loss": 0.008, "step": 359650 }, { "epoch": 1.81, "learning_rate": 2.7820353058104746e-05, "loss": 0.0058, "step": 359660 }, { "epoch": 1.81, "learning_rate": 2.7812785365090734e-05, "loss": 0.0055, "step": 359670 }, { "epoch": 1.81, "learning_rate": 2.7805217672076726e-05, "loss": 0.0066, "step": 359680 }, { "epoch": 1.81, "learning_rate": 2.7797649979062714e-05, "loss": 0.0077, "step": 359690 }, { "epoch": 1.81, "learning_rate": 2.7790082286048706e-05, "loss": 0.0082, "step": 359700 }, { "epoch": 1.81, "learning_rate": 2.778251459303469e-05, "loss": 0.0055, "step": 359710 }, { "epoch": 1.81, "learning_rate": 2.7774946900020682e-05, "loss": 0.0069, "step": 359720 }, { "epoch": 1.81, "learning_rate": 2.776737920700667e-05, "loss": 0.0083, "step": 359730 }, { "epoch": 1.81, "learning_rate": 2.7759811513992662e-05, "loss": 0.0053, "step": 359740 }, { "epoch": 1.81, "learning_rate": 2.775224382097865e-05, "loss": 0.0048, "step": 359750 }, { "epoch": 1.82, "learning_rate": 2.7744676127964642e-05, "loss": 0.0055, "step": 359760 }, { "epoch": 1.82, "learning_rate": 2.773710843495063e-05, "loss": 0.006, "step": 359770 }, { "epoch": 1.82, "learning_rate": 2.772954074193662e-05, "loss": 0.0056, "step": 359780 }, { "epoch": 1.82, "learning_rate": 2.772197304892261e-05, "loss": 0.0043, "step": 359790 }, { "epoch": 1.82, "learning_rate": 2.77144053559086e-05, "loss": 0.0061, "step": 359800 }, { "epoch": 1.82, "learning_rate": 2.770683766289459e-05, "loss": 0.0079, "step": 359810 }, { "epoch": 1.82, "learning_rate": 2.769926996988058e-05, "loss": 0.0067, "step": 359820 }, { "epoch": 1.82, "learning_rate": 2.769170227686657e-05, "loss": 0.0063, "step": 359830 }, { "epoch": 1.82, "learning_rate": 2.768413458385256e-05, "loss": 0.0048, "step": 359840 }, { "epoch": 1.82, "learning_rate": 2.767656689083855e-05, "loss": 0.0062, "step": 359850 }, { "epoch": 1.82, "learning_rate": 2.766899919782454e-05, "loss": 0.0091, "step": 359860 }, { "epoch": 1.82, "learning_rate": 2.7661431504810526e-05, "loss": 0.0055, "step": 359870 }, { "epoch": 1.82, "learning_rate": 2.7653863811796517e-05, "loss": 0.0074, "step": 359880 }, { "epoch": 1.82, "learning_rate": 2.7646296118782506e-05, "loss": 0.0074, "step": 359890 }, { "epoch": 1.82, "learning_rate": 2.7638728425768497e-05, "loss": 0.006, "step": 359900 }, { "epoch": 1.82, "learning_rate": 2.7631160732754485e-05, "loss": 0.005, "step": 359910 }, { "epoch": 1.82, "learning_rate": 2.7623593039740477e-05, "loss": 0.0066, "step": 359920 }, { "epoch": 1.82, "learning_rate": 2.7616025346726465e-05, "loss": 0.0063, "step": 359930 }, { "epoch": 1.82, "learning_rate": 2.7608457653712457e-05, "loss": 0.0047, "step": 359940 }, { "epoch": 1.82, "learning_rate": 2.7600889960698445e-05, "loss": 0.0057, "step": 359950 }, { "epoch": 1.82, "learning_rate": 2.7593322267684437e-05, "loss": 0.0074, "step": 359960 }, { "epoch": 1.82, "learning_rate": 2.7585754574670425e-05, "loss": 0.007, "step": 359970 }, { "epoch": 1.82, "learning_rate": 2.7578186881656416e-05, "loss": 0.0047, "step": 359980 }, { "epoch": 1.82, "learning_rate": 2.7570619188642405e-05, "loss": 0.0048, "step": 359990 }, { "epoch": 1.82, "learning_rate": 2.7563051495628396e-05, "loss": 0.0062, "step": 360000 }, { "epoch": 1.82, "eval_cer": 0.9144062097588856, "eval_loss": 0.0043929265812039375, "eval_runtime": 116.599, "eval_samples_per_second": 17.153, "eval_steps_per_second": 4.288, "step": 360000 }, { "epoch": 1.82, "learning_rate": 2.7555483802614385e-05, "loss": 0.0062, "step": 360010 }, { "epoch": 1.82, "learning_rate": 2.754791610960037e-05, "loss": 0.0045, "step": 360020 }, { "epoch": 1.82, "learning_rate": 2.754034841658636e-05, "loss": 0.0056, "step": 360030 }, { "epoch": 1.82, "learning_rate": 2.753278072357235e-05, "loss": 0.0054, "step": 360040 }, { "epoch": 1.82, "learning_rate": 2.752521303055834e-05, "loss": 0.0068, "step": 360050 }, { "epoch": 1.82, "learning_rate": 2.751764533754433e-05, "loss": 0.0068, "step": 360060 }, { "epoch": 1.82, "learning_rate": 2.751007764453032e-05, "loss": 0.0061, "step": 360070 }, { "epoch": 1.82, "learning_rate": 2.7502509951516312e-05, "loss": 0.0055, "step": 360080 }, { "epoch": 1.82, "learning_rate": 2.74949422585023e-05, "loss": 0.0047, "step": 360090 }, { "epoch": 1.82, "learning_rate": 2.7487374565488292e-05, "loss": 0.0057, "step": 360100 }, { "epoch": 1.82, "learning_rate": 2.747980687247428e-05, "loss": 0.0058, "step": 360110 }, { "epoch": 1.82, "learning_rate": 2.7472239179460272e-05, "loss": 0.0076, "step": 360120 }, { "epoch": 1.82, "learning_rate": 2.746467148644626e-05, "loss": 0.0048, "step": 360130 }, { "epoch": 1.82, "learning_rate": 2.745710379343225e-05, "loss": 0.0059, "step": 360140 }, { "epoch": 1.82, "learning_rate": 2.744953610041824e-05, "loss": 0.0064, "step": 360150 }, { "epoch": 1.82, "learning_rate": 2.744196840740423e-05, "loss": 0.0056, "step": 360160 }, { "epoch": 1.82, "learning_rate": 2.743440071439022e-05, "loss": 0.0048, "step": 360170 }, { "epoch": 1.82, "learning_rate": 2.7426833021376205e-05, "loss": 0.0056, "step": 360180 }, { "epoch": 1.82, "learning_rate": 2.7419265328362196e-05, "loss": 0.0053, "step": 360190 }, { "epoch": 1.82, "learning_rate": 2.7411697635348184e-05, "loss": 0.0065, "step": 360200 }, { "epoch": 1.82, "learning_rate": 2.7404129942334176e-05, "loss": 0.0051, "step": 360210 }, { "epoch": 1.82, "learning_rate": 2.7396562249320164e-05, "loss": 0.0063, "step": 360220 }, { "epoch": 1.82, "learning_rate": 2.7388994556306156e-05, "loss": 0.0052, "step": 360230 }, { "epoch": 1.82, "learning_rate": 2.7381426863292144e-05, "loss": 0.0051, "step": 360240 }, { "epoch": 1.82, "learning_rate": 2.7373859170278136e-05, "loss": 0.0059, "step": 360250 }, { "epoch": 1.82, "learning_rate": 2.7366291477264124e-05, "loss": 0.0054, "step": 360260 }, { "epoch": 1.82, "learning_rate": 2.7358723784250115e-05, "loss": 0.0048, "step": 360270 }, { "epoch": 1.82, "learning_rate": 2.7351156091236104e-05, "loss": 0.0048, "step": 360280 }, { "epoch": 1.82, "learning_rate": 2.7343588398222095e-05, "loss": 0.0056, "step": 360290 }, { "epoch": 1.82, "learning_rate": 2.7336020705208084e-05, "loss": 0.0051, "step": 360300 }, { "epoch": 1.82, "learning_rate": 2.7328453012194075e-05, "loss": 0.0045, "step": 360310 }, { "epoch": 1.82, "learning_rate": 2.7320885319180063e-05, "loss": 0.0113, "step": 360320 }, { "epoch": 1.82, "learning_rate": 2.7313317626166055e-05, "loss": 0.0082, "step": 360330 }, { "epoch": 1.82, "learning_rate": 2.730574993315204e-05, "loss": 0.0063, "step": 360340 }, { "epoch": 1.82, "learning_rate": 2.729818224013803e-05, "loss": 0.006, "step": 360350 }, { "epoch": 1.82, "learning_rate": 2.729061454712402e-05, "loss": 0.0074, "step": 360360 }, { "epoch": 1.82, "learning_rate": 2.728304685411001e-05, "loss": 0.0053, "step": 360370 }, { "epoch": 1.82, "learning_rate": 2.7275479161096e-05, "loss": 0.0054, "step": 360380 }, { "epoch": 1.82, "learning_rate": 2.726791146808199e-05, "loss": 0.0063, "step": 360390 }, { "epoch": 1.82, "learning_rate": 2.726034377506798e-05, "loss": 0.0048, "step": 360400 }, { "epoch": 1.82, "learning_rate": 2.725277608205397e-05, "loss": 0.0064, "step": 360410 }, { "epoch": 1.82, "learning_rate": 2.724520838903996e-05, "loss": 0.0049, "step": 360420 }, { "epoch": 1.82, "learning_rate": 2.723764069602595e-05, "loss": 0.0059, "step": 360430 }, { "epoch": 1.82, "learning_rate": 2.723007300301194e-05, "loss": 0.0106, "step": 360440 }, { "epoch": 1.82, "learning_rate": 2.722250530999793e-05, "loss": 0.0067, "step": 360450 }, { "epoch": 1.82, "learning_rate": 2.721493761698392e-05, "loss": 0.0059, "step": 360460 }, { "epoch": 1.82, "learning_rate": 2.720736992396991e-05, "loss": 0.008, "step": 360470 }, { "epoch": 1.82, "learning_rate": 2.71998022309559e-05, "loss": 0.0051, "step": 360480 }, { "epoch": 1.82, "learning_rate": 2.719223453794189e-05, "loss": 0.0041, "step": 360490 }, { "epoch": 1.82, "learning_rate": 2.7184666844927875e-05, "loss": 0.0056, "step": 360500 }, { "epoch": 1.82, "learning_rate": 2.7177099151913867e-05, "loss": 0.0052, "step": 360510 }, { "epoch": 1.82, "learning_rate": 2.7169531458899855e-05, "loss": 0.0053, "step": 360520 }, { "epoch": 1.82, "learning_rate": 2.7161963765885846e-05, "loss": 0.0062, "step": 360530 }, { "epoch": 1.82, "learning_rate": 2.7154396072871835e-05, "loss": 0.0051, "step": 360540 }, { "epoch": 1.82, "learning_rate": 2.7146828379857826e-05, "loss": 0.0052, "step": 360550 }, { "epoch": 1.82, "learning_rate": 2.7139260686843814e-05, "loss": 0.0064, "step": 360560 }, { "epoch": 1.82, "learning_rate": 2.7131692993829806e-05, "loss": 0.0047, "step": 360570 }, { "epoch": 1.82, "learning_rate": 2.7124125300815794e-05, "loss": 0.0066, "step": 360580 }, { "epoch": 1.82, "learning_rate": 2.7116557607801786e-05, "loss": 0.0045, "step": 360590 }, { "epoch": 1.82, "learning_rate": 2.7108989914787774e-05, "loss": 0.0078, "step": 360600 }, { "epoch": 1.82, "learning_rate": 2.7101422221773766e-05, "loss": 0.0072, "step": 360610 }, { "epoch": 1.82, "learning_rate": 2.7093854528759754e-05, "loss": 0.0058, "step": 360620 }, { "epoch": 1.82, "learning_rate": 2.7086286835745746e-05, "loss": 0.0043, "step": 360630 }, { "epoch": 1.82, "learning_rate": 2.7078719142731734e-05, "loss": 0.0078, "step": 360640 }, { "epoch": 1.82, "learning_rate": 2.7071151449717722e-05, "loss": 0.0047, "step": 360650 }, { "epoch": 1.82, "learning_rate": 2.706358375670371e-05, "loss": 0.0066, "step": 360660 }, { "epoch": 1.82, "learning_rate": 2.7056016063689702e-05, "loss": 0.0058, "step": 360670 }, { "epoch": 1.82, "learning_rate": 2.704844837067569e-05, "loss": 0.005, "step": 360680 }, { "epoch": 1.82, "learning_rate": 2.704088067766168e-05, "loss": 0.0067, "step": 360690 }, { "epoch": 1.82, "learning_rate": 2.703331298464767e-05, "loss": 0.0082, "step": 360700 }, { "epoch": 1.82, "learning_rate": 2.702574529163366e-05, "loss": 0.0062, "step": 360710 }, { "epoch": 1.82, "learning_rate": 2.701817759861965e-05, "loss": 0.013, "step": 360720 }, { "epoch": 1.82, "learning_rate": 2.701060990560564e-05, "loss": 0.0068, "step": 360730 }, { "epoch": 1.82, "learning_rate": 2.700304221259163e-05, "loss": 0.0064, "step": 360740 }, { "epoch": 1.82, "learning_rate": 2.699547451957762e-05, "loss": 0.0074, "step": 360750 }, { "epoch": 1.82, "learning_rate": 2.698790682656361e-05, "loss": 0.0058, "step": 360760 }, { "epoch": 1.82, "learning_rate": 2.69803391335496e-05, "loss": 0.0029, "step": 360770 }, { "epoch": 1.82, "learning_rate": 2.697277144053559e-05, "loss": 0.0085, "step": 360780 }, { "epoch": 1.82, "learning_rate": 2.696520374752158e-05, "loss": 0.0093, "step": 360790 }, { "epoch": 1.82, "learning_rate": 2.695763605450757e-05, "loss": 0.0061, "step": 360800 }, { "epoch": 1.82, "learning_rate": 2.6950068361493557e-05, "loss": 0.0061, "step": 360810 }, { "epoch": 1.82, "learning_rate": 2.6942500668479545e-05, "loss": 0.0066, "step": 360820 }, { "epoch": 1.82, "learning_rate": 2.6934932975465537e-05, "loss": 0.0062, "step": 360830 }, { "epoch": 1.82, "learning_rate": 2.6927365282451525e-05, "loss": 0.0064, "step": 360840 }, { "epoch": 1.82, "learning_rate": 2.6919797589437517e-05, "loss": 0.005, "step": 360850 }, { "epoch": 1.82, "learning_rate": 2.6912229896423505e-05, "loss": 0.0067, "step": 360860 }, { "epoch": 1.82, "learning_rate": 2.6904662203409497e-05, "loss": 0.005, "step": 360870 }, { "epoch": 1.82, "learning_rate": 2.6897094510395485e-05, "loss": 0.0059, "step": 360880 }, { "epoch": 1.82, "learning_rate": 2.6889526817381477e-05, "loss": 0.005, "step": 360890 }, { "epoch": 1.82, "learning_rate": 2.6881959124367465e-05, "loss": 0.0093, "step": 360900 }, { "epoch": 1.82, "learning_rate": 2.6874391431353456e-05, "loss": 0.0057, "step": 360910 }, { "epoch": 1.82, "learning_rate": 2.6866823738339445e-05, "loss": 0.0088, "step": 360920 }, { "epoch": 1.82, "learning_rate": 2.6859256045325436e-05, "loss": 0.0055, "step": 360930 }, { "epoch": 1.82, "learning_rate": 2.6851688352311424e-05, "loss": 0.0049, "step": 360940 }, { "epoch": 1.82, "learning_rate": 2.6844120659297416e-05, "loss": 0.0049, "step": 360950 }, { "epoch": 1.82, "learning_rate": 2.6836552966283404e-05, "loss": 0.0059, "step": 360960 }, { "epoch": 1.82, "learning_rate": 2.682898527326939e-05, "loss": 0.0042, "step": 360970 }, { "epoch": 1.82, "learning_rate": 2.682141758025538e-05, "loss": 0.0071, "step": 360980 }, { "epoch": 1.82, "learning_rate": 2.681384988724137e-05, "loss": 0.0062, "step": 360990 }, { "epoch": 1.82, "learning_rate": 2.680628219422736e-05, "loss": 0.0057, "step": 361000 }, { "epoch": 1.82, "eval_cer": 0.9144256176813937, "eval_loss": 0.004407630767673254, "eval_runtime": 116.7425, "eval_samples_per_second": 17.132, "eval_steps_per_second": 4.283, "step": 361000 }, { "epoch": 1.82, "learning_rate": 2.679871450121335e-05, "loss": 0.0085, "step": 361010 }, { "epoch": 1.82, "learning_rate": 2.679114680819934e-05, "loss": 0.0054, "step": 361020 }, { "epoch": 1.82, "learning_rate": 2.678357911518533e-05, "loss": 0.0053, "step": 361030 }, { "epoch": 1.82, "learning_rate": 2.677601142217132e-05, "loss": 0.0045, "step": 361040 }, { "epoch": 1.82, "learning_rate": 2.6768443729157312e-05, "loss": 0.0075, "step": 361050 }, { "epoch": 1.82, "learning_rate": 2.67608760361433e-05, "loss": 0.0074, "step": 361060 }, { "epoch": 1.82, "learning_rate": 2.675330834312929e-05, "loss": 0.0052, "step": 361070 }, { "epoch": 1.82, "learning_rate": 2.674574065011528e-05, "loss": 0.0078, "step": 361080 }, { "epoch": 1.82, "learning_rate": 2.673817295710127e-05, "loss": 0.0057, "step": 361090 }, { "epoch": 1.82, "learning_rate": 2.673060526408726e-05, "loss": 0.0061, "step": 361100 }, { "epoch": 1.82, "learning_rate": 2.672303757107325e-05, "loss": 0.0063, "step": 361110 }, { "epoch": 1.82, "learning_rate": 2.6715469878059236e-05, "loss": 0.0055, "step": 361120 }, { "epoch": 1.82, "learning_rate": 2.6707902185045224e-05, "loss": 0.0046, "step": 361130 }, { "epoch": 1.82, "learning_rate": 2.6700334492031216e-05, "loss": 0.005, "step": 361140 }, { "epoch": 1.82, "learning_rate": 2.6692766799017204e-05, "loss": 0.0045, "step": 361150 }, { "epoch": 1.82, "learning_rate": 2.6685199106003196e-05, "loss": 0.0059, "step": 361160 }, { "epoch": 1.82, "learning_rate": 2.6677631412989184e-05, "loss": 0.006, "step": 361170 }, { "epoch": 1.82, "learning_rate": 2.6670063719975176e-05, "loss": 0.0058, "step": 361180 }, { "epoch": 1.82, "learning_rate": 2.6662496026961164e-05, "loss": 0.0045, "step": 361190 }, { "epoch": 1.82, "learning_rate": 2.6654928333947155e-05, "loss": 0.0069, "step": 361200 }, { "epoch": 1.82, "learning_rate": 2.6647360640933144e-05, "loss": 0.0047, "step": 361210 }, { "epoch": 1.82, "learning_rate": 2.6639792947919135e-05, "loss": 0.0058, "step": 361220 }, { "epoch": 1.82, "learning_rate": 2.6632225254905123e-05, "loss": 0.0072, "step": 361230 }, { "epoch": 1.82, "learning_rate": 2.6624657561891115e-05, "loss": 0.0057, "step": 361240 }, { "epoch": 1.82, "learning_rate": 2.6617089868877103e-05, "loss": 0.006, "step": 361250 }, { "epoch": 1.82, "learning_rate": 2.6609522175863095e-05, "loss": 0.0061, "step": 361260 }, { "epoch": 1.82, "learning_rate": 2.6601954482849083e-05, "loss": 0.0065, "step": 361270 }, { "epoch": 1.82, "learning_rate": 2.659438678983507e-05, "loss": 0.0081, "step": 361280 }, { "epoch": 1.82, "learning_rate": 2.658681909682106e-05, "loss": 0.0053, "step": 361290 }, { "epoch": 1.82, "learning_rate": 2.657925140380705e-05, "loss": 0.0057, "step": 361300 }, { "epoch": 1.82, "learning_rate": 2.657168371079304e-05, "loss": 0.0062, "step": 361310 }, { "epoch": 1.82, "learning_rate": 2.656411601777903e-05, "loss": 0.0067, "step": 361320 }, { "epoch": 1.82, "learning_rate": 2.655654832476502e-05, "loss": 0.0064, "step": 361330 }, { "epoch": 1.82, "learning_rate": 2.654898063175101e-05, "loss": 0.0043, "step": 361340 }, { "epoch": 1.82, "learning_rate": 2.6541412938737e-05, "loss": 0.0062, "step": 361350 }, { "epoch": 1.82, "learning_rate": 2.653384524572299e-05, "loss": 0.0061, "step": 361360 }, { "epoch": 1.82, "learning_rate": 2.652627755270898e-05, "loss": 0.0054, "step": 361370 }, { "epoch": 1.82, "learning_rate": 2.651870985969497e-05, "loss": 0.0057, "step": 361380 }, { "epoch": 1.82, "learning_rate": 2.651114216668096e-05, "loss": 0.0048, "step": 361390 }, { "epoch": 1.82, "learning_rate": 2.650357447366695e-05, "loss": 0.0049, "step": 361400 }, { "epoch": 1.82, "learning_rate": 2.649600678065294e-05, "loss": 0.0063, "step": 361410 }, { "epoch": 1.82, "learning_rate": 2.648843908763893e-05, "loss": 0.0069, "step": 361420 }, { "epoch": 1.82, "learning_rate": 2.6480871394624918e-05, "loss": 0.0058, "step": 361430 }, { "epoch": 1.82, "learning_rate": 2.6473303701610906e-05, "loss": 0.0084, "step": 361440 }, { "epoch": 1.82, "learning_rate": 2.6465736008596895e-05, "loss": 0.0063, "step": 361450 }, { "epoch": 1.82, "learning_rate": 2.6458168315582886e-05, "loss": 0.0062, "step": 361460 }, { "epoch": 1.82, "learning_rate": 2.6450600622568875e-05, "loss": 0.0063, "step": 361470 }, { "epoch": 1.82, "learning_rate": 2.6443032929554866e-05, "loss": 0.0049, "step": 361480 }, { "epoch": 1.82, "learning_rate": 2.6435465236540854e-05, "loss": 0.0056, "step": 361490 }, { "epoch": 1.82, "learning_rate": 2.6427897543526846e-05, "loss": 0.0072, "step": 361500 }, { "epoch": 1.82, "learning_rate": 2.6420329850512834e-05, "loss": 0.0067, "step": 361510 }, { "epoch": 1.82, "learning_rate": 2.6412762157498826e-05, "loss": 0.0039, "step": 361520 }, { "epoch": 1.82, "learning_rate": 2.6405194464484814e-05, "loss": 0.005, "step": 361530 }, { "epoch": 1.82, "learning_rate": 2.6397626771470806e-05, "loss": 0.006, "step": 361540 }, { "epoch": 1.82, "learning_rate": 2.6390059078456794e-05, "loss": 0.005, "step": 361550 }, { "epoch": 1.82, "learning_rate": 2.6382491385442785e-05, "loss": 0.0061, "step": 361560 }, { "epoch": 1.82, "learning_rate": 2.6374923692428774e-05, "loss": 0.006, "step": 361570 }, { "epoch": 1.82, "learning_rate": 2.6367355999414765e-05, "loss": 0.0053, "step": 361580 }, { "epoch": 1.82, "learning_rate": 2.6359788306400753e-05, "loss": 0.0038, "step": 361590 }, { "epoch": 1.82, "learning_rate": 2.635222061338674e-05, "loss": 0.0052, "step": 361600 }, { "epoch": 1.82, "learning_rate": 2.634465292037273e-05, "loss": 0.008, "step": 361610 }, { "epoch": 1.82, "learning_rate": 2.633708522735872e-05, "loss": 0.0053, "step": 361620 }, { "epoch": 1.82, "learning_rate": 2.632951753434471e-05, "loss": 0.0062, "step": 361630 }, { "epoch": 1.82, "learning_rate": 2.63219498413307e-05, "loss": 0.0051, "step": 361640 }, { "epoch": 1.82, "learning_rate": 2.631438214831669e-05, "loss": 0.0066, "step": 361650 }, { "epoch": 1.82, "learning_rate": 2.630681445530268e-05, "loss": 0.0042, "step": 361660 }, { "epoch": 1.82, "learning_rate": 2.629924676228867e-05, "loss": 0.007, "step": 361670 }, { "epoch": 1.82, "learning_rate": 2.629167906927466e-05, "loss": 0.0068, "step": 361680 }, { "epoch": 1.82, "learning_rate": 2.628411137626065e-05, "loss": 0.0044, "step": 361690 }, { "epoch": 1.82, "learning_rate": 2.627654368324664e-05, "loss": 0.0062, "step": 361700 }, { "epoch": 1.82, "learning_rate": 2.626897599023263e-05, "loss": 0.0061, "step": 361710 }, { "epoch": 1.82, "learning_rate": 2.626140829721862e-05, "loss": 0.0074, "step": 361720 }, { "epoch": 1.82, "learning_rate": 2.625384060420461e-05, "loss": 0.0062, "step": 361730 }, { "epoch": 1.83, "learning_rate": 2.62462729111906e-05, "loss": 0.0066, "step": 361740 }, { "epoch": 1.83, "learning_rate": 2.6238705218176585e-05, "loss": 0.0052, "step": 361750 }, { "epoch": 1.83, "learning_rate": 2.6231137525162577e-05, "loss": 0.0045, "step": 361760 }, { "epoch": 1.83, "learning_rate": 2.6223569832148565e-05, "loss": 0.0039, "step": 361770 }, { "epoch": 1.83, "learning_rate": 2.6216002139134557e-05, "loss": 0.0052, "step": 361780 }, { "epoch": 1.83, "learning_rate": 2.6208434446120545e-05, "loss": 0.0055, "step": 361790 }, { "epoch": 1.83, "learning_rate": 2.6200866753106537e-05, "loss": 0.0067, "step": 361800 }, { "epoch": 1.83, "learning_rate": 2.6193299060092525e-05, "loss": 0.0066, "step": 361810 }, { "epoch": 1.83, "learning_rate": 2.6185731367078516e-05, "loss": 0.0093, "step": 361820 }, { "epoch": 1.83, "learning_rate": 2.6178163674064505e-05, "loss": 0.0068, "step": 361830 }, { "epoch": 1.83, "learning_rate": 2.6170595981050496e-05, "loss": 0.0061, "step": 361840 }, { "epoch": 1.83, "learning_rate": 2.6163028288036484e-05, "loss": 0.0065, "step": 361850 }, { "epoch": 1.83, "learning_rate": 2.6155460595022476e-05, "loss": 0.0058, "step": 361860 }, { "epoch": 1.83, "learning_rate": 2.6147892902008464e-05, "loss": 0.0058, "step": 361870 }, { "epoch": 1.83, "learning_rate": 2.6140325208994456e-05, "loss": 0.0068, "step": 361880 }, { "epoch": 1.83, "learning_rate": 2.6132757515980444e-05, "loss": 0.0055, "step": 361890 }, { "epoch": 1.83, "learning_rate": 2.6125189822966436e-05, "loss": 0.0049, "step": 361900 }, { "epoch": 1.83, "learning_rate": 2.611762212995242e-05, "loss": 0.0048, "step": 361910 }, { "epoch": 1.83, "learning_rate": 2.611005443693841e-05, "loss": 0.0061, "step": 361920 }, { "epoch": 1.83, "learning_rate": 2.61024867439244e-05, "loss": 0.0044, "step": 361930 }, { "epoch": 1.83, "learning_rate": 2.609491905091039e-05, "loss": 0.006, "step": 361940 }, { "epoch": 1.83, "learning_rate": 2.608735135789638e-05, "loss": 0.0066, "step": 361950 }, { "epoch": 1.83, "learning_rate": 2.607978366488237e-05, "loss": 0.0086, "step": 361960 }, { "epoch": 1.83, "learning_rate": 2.607221597186836e-05, "loss": 0.0061, "step": 361970 }, { "epoch": 1.83, "learning_rate": 2.6064648278854348e-05, "loss": 0.0078, "step": 361980 }, { "epoch": 1.83, "learning_rate": 2.605708058584034e-05, "loss": 0.0048, "step": 361990 }, { "epoch": 1.83, "learning_rate": 2.6049512892826328e-05, "loss": 0.0065, "step": 362000 }, { "epoch": 1.83, "eval_cer": 0.9144314400581461, "eval_loss": 0.004417457617819309, "eval_runtime": 116.6172, "eval_samples_per_second": 17.15, "eval_steps_per_second": 4.288, "step": 362000 }, { "epoch": 1.83, "learning_rate": 2.604194519981232e-05, "loss": 0.0051, "step": 362010 }, { "epoch": 1.83, "learning_rate": 2.603437750679831e-05, "loss": 0.0065, "step": 362020 }, { "epoch": 1.83, "learning_rate": 2.60268098137843e-05, "loss": 0.0086, "step": 362030 }, { "epoch": 1.83, "learning_rate": 2.601924212077029e-05, "loss": 0.0066, "step": 362040 }, { "epoch": 1.83, "learning_rate": 2.601167442775628e-05, "loss": 0.0053, "step": 362050 }, { "epoch": 1.83, "learning_rate": 2.600410673474227e-05, "loss": 0.0049, "step": 362060 }, { "epoch": 1.83, "learning_rate": 2.5996539041728256e-05, "loss": 0.005, "step": 362070 }, { "epoch": 1.83, "learning_rate": 2.5988971348714244e-05, "loss": 0.0059, "step": 362080 }, { "epoch": 1.83, "learning_rate": 2.5981403655700236e-05, "loss": 0.0065, "step": 362090 }, { "epoch": 1.83, "learning_rate": 2.5973835962686224e-05, "loss": 0.0058, "step": 362100 }, { "epoch": 1.83, "learning_rate": 2.5966268269672215e-05, "loss": 0.0067, "step": 362110 }, { "epoch": 1.83, "learning_rate": 2.5958700576658204e-05, "loss": 0.0067, "step": 362120 }, { "epoch": 1.83, "learning_rate": 2.5951132883644195e-05, "loss": 0.0054, "step": 362130 }, { "epoch": 1.83, "learning_rate": 2.5943565190630183e-05, "loss": 0.0043, "step": 362140 }, { "epoch": 1.83, "learning_rate": 2.5935997497616175e-05, "loss": 0.0057, "step": 362150 }, { "epoch": 1.83, "learning_rate": 2.5928429804602163e-05, "loss": 0.0045, "step": 362160 }, { "epoch": 1.83, "learning_rate": 2.5920862111588155e-05, "loss": 0.006, "step": 362170 }, { "epoch": 1.83, "learning_rate": 2.5913294418574143e-05, "loss": 0.0074, "step": 362180 }, { "epoch": 1.83, "learning_rate": 2.5905726725560135e-05, "loss": 0.0053, "step": 362190 }, { "epoch": 1.83, "learning_rate": 2.5898159032546123e-05, "loss": 0.0063, "step": 362200 }, { "epoch": 1.83, "learning_rate": 2.5890591339532115e-05, "loss": 0.0046, "step": 362210 }, { "epoch": 1.83, "learning_rate": 2.58830236465181e-05, "loss": 0.0072, "step": 362220 }, { "epoch": 1.83, "learning_rate": 2.587545595350409e-05, "loss": 0.0055, "step": 362230 }, { "epoch": 1.83, "learning_rate": 2.586788826049008e-05, "loss": 0.0078, "step": 362240 }, { "epoch": 1.83, "learning_rate": 2.586032056747607e-05, "loss": 0.0065, "step": 362250 }, { "epoch": 1.83, "learning_rate": 2.585275287446206e-05, "loss": 0.0075, "step": 362260 }, { "epoch": 1.83, "learning_rate": 2.584518518144805e-05, "loss": 0.0065, "step": 362270 }, { "epoch": 1.83, "learning_rate": 2.583761748843404e-05, "loss": 0.0063, "step": 362280 }, { "epoch": 1.83, "learning_rate": 2.583004979542003e-05, "loss": 0.0042, "step": 362290 }, { "epoch": 1.83, "learning_rate": 2.582248210240602e-05, "loss": 0.0082, "step": 362300 }, { "epoch": 1.83, "learning_rate": 2.581491440939201e-05, "loss": 0.0085, "step": 362310 }, { "epoch": 1.83, "learning_rate": 2.5807346716378e-05, "loss": 0.0074, "step": 362320 }, { "epoch": 1.83, "learning_rate": 2.579977902336399e-05, "loss": 0.0051, "step": 362330 }, { "epoch": 1.83, "learning_rate": 2.5792211330349978e-05, "loss": 0.0059, "step": 362340 }, { "epoch": 1.83, "learning_rate": 2.578464363733597e-05, "loss": 0.0074, "step": 362350 }, { "epoch": 1.83, "learning_rate": 2.5777075944321958e-05, "loss": 0.0079, "step": 362360 }, { "epoch": 1.83, "learning_rate": 2.576950825130795e-05, "loss": 0.0064, "step": 362370 }, { "epoch": 1.83, "learning_rate": 2.5761940558293935e-05, "loss": 0.0068, "step": 362380 }, { "epoch": 1.83, "learning_rate": 2.5754372865279926e-05, "loss": 0.005, "step": 362390 }, { "epoch": 1.83, "learning_rate": 2.5746805172265914e-05, "loss": 0.0056, "step": 362400 }, { "epoch": 1.83, "learning_rate": 2.5739237479251906e-05, "loss": 0.006, "step": 362410 }, { "epoch": 1.83, "learning_rate": 2.5731669786237894e-05, "loss": 0.0094, "step": 362420 }, { "epoch": 1.83, "learning_rate": 2.5724102093223886e-05, "loss": 0.0069, "step": 362430 }, { "epoch": 1.83, "learning_rate": 2.5716534400209874e-05, "loss": 0.0073, "step": 362440 }, { "epoch": 1.83, "learning_rate": 2.5708966707195866e-05, "loss": 0.0065, "step": 362450 }, { "epoch": 1.83, "learning_rate": 2.5701399014181854e-05, "loss": 0.0045, "step": 362460 }, { "epoch": 1.83, "learning_rate": 2.5693831321167845e-05, "loss": 0.0073, "step": 362470 }, { "epoch": 1.83, "learning_rate": 2.5686263628153834e-05, "loss": 0.0069, "step": 362480 }, { "epoch": 1.83, "learning_rate": 2.5678695935139825e-05, "loss": 0.0059, "step": 362490 }, { "epoch": 1.83, "learning_rate": 2.5671128242125814e-05, "loss": 0.0088, "step": 362500 }, { "epoch": 1.83, "learning_rate": 2.5663560549111805e-05, "loss": 0.0039, "step": 362510 }, { "epoch": 1.83, "learning_rate": 2.5655992856097793e-05, "loss": 0.0061, "step": 362520 }, { "epoch": 1.83, "learning_rate": 2.5648425163083785e-05, "loss": 0.006, "step": 362530 }, { "epoch": 1.83, "learning_rate": 2.564085747006977e-05, "loss": 0.0065, "step": 362540 }, { "epoch": 1.83, "learning_rate": 2.563328977705576e-05, "loss": 0.0036, "step": 362550 }, { "epoch": 1.83, "learning_rate": 2.562572208404175e-05, "loss": 0.0071, "step": 362560 }, { "epoch": 1.83, "learning_rate": 2.561815439102774e-05, "loss": 0.0054, "step": 362570 }, { "epoch": 1.83, "learning_rate": 2.561058669801373e-05, "loss": 0.004, "step": 362580 }, { "epoch": 1.83, "learning_rate": 2.560301900499972e-05, "loss": 0.0061, "step": 362590 }, { "epoch": 1.83, "learning_rate": 2.559545131198571e-05, "loss": 0.0055, "step": 362600 }, { "epoch": 1.83, "learning_rate": 2.55878836189717e-05, "loss": 0.0066, "step": 362610 }, { "epoch": 1.83, "learning_rate": 2.558031592595769e-05, "loss": 0.0054, "step": 362620 }, { "epoch": 1.83, "learning_rate": 2.557274823294368e-05, "loss": 0.0054, "step": 362630 }, { "epoch": 1.83, "learning_rate": 2.556518053992967e-05, "loss": 0.0076, "step": 362640 }, { "epoch": 1.83, "learning_rate": 2.555761284691566e-05, "loss": 0.0058, "step": 362650 }, { "epoch": 1.83, "learning_rate": 2.555004515390165e-05, "loss": 0.0034, "step": 362660 }, { "epoch": 1.83, "learning_rate": 2.554247746088764e-05, "loss": 0.0066, "step": 362670 }, { "epoch": 1.83, "learning_rate": 2.553490976787363e-05, "loss": 0.0059, "step": 362680 }, { "epoch": 1.83, "learning_rate": 2.552734207485962e-05, "loss": 0.0046, "step": 362690 }, { "epoch": 1.83, "learning_rate": 2.5519774381845605e-05, "loss": 0.0078, "step": 362700 }, { "epoch": 1.83, "learning_rate": 2.5512206688831593e-05, "loss": 0.006, "step": 362710 }, { "epoch": 1.83, "learning_rate": 2.5504638995817585e-05, "loss": 0.0065, "step": 362720 }, { "epoch": 1.83, "learning_rate": 2.5497071302803576e-05, "loss": 0.0041, "step": 362730 }, { "epoch": 1.83, "learning_rate": 2.5489503609789565e-05, "loss": 0.0069, "step": 362740 }, { "epoch": 1.83, "learning_rate": 2.5481935916775556e-05, "loss": 0.0054, "step": 362750 }, { "epoch": 1.83, "learning_rate": 2.5474368223761544e-05, "loss": 0.0077, "step": 362760 }, { "epoch": 1.83, "learning_rate": 2.5466800530747536e-05, "loss": 0.0075, "step": 362770 }, { "epoch": 1.83, "learning_rate": 2.5459232837733524e-05, "loss": 0.0047, "step": 362780 }, { "epoch": 1.83, "learning_rate": 2.5451665144719516e-05, "loss": 0.0051, "step": 362790 }, { "epoch": 1.83, "learning_rate": 2.5444097451705504e-05, "loss": 0.0067, "step": 362800 }, { "epoch": 1.83, "learning_rate": 2.5436529758691496e-05, "loss": 0.0065, "step": 362810 }, { "epoch": 1.83, "learning_rate": 2.5428962065677484e-05, "loss": 0.0066, "step": 362820 }, { "epoch": 1.83, "learning_rate": 2.5421394372663476e-05, "loss": 0.0057, "step": 362830 }, { "epoch": 1.83, "learning_rate": 2.5413826679649464e-05, "loss": 0.0092, "step": 362840 }, { "epoch": 1.83, "learning_rate": 2.540625898663545e-05, "loss": 0.0068, "step": 362850 }, { "epoch": 1.83, "learning_rate": 2.539869129362144e-05, "loss": 0.0053, "step": 362860 }, { "epoch": 1.83, "learning_rate": 2.539112360060743e-05, "loss": 0.0053, "step": 362870 }, { "epoch": 1.83, "learning_rate": 2.538355590759342e-05, "loss": 0.0061, "step": 362880 }, { "epoch": 1.83, "learning_rate": 2.5375988214579408e-05, "loss": 0.0059, "step": 362890 }, { "epoch": 1.83, "learning_rate": 2.53684205215654e-05, "loss": 0.0055, "step": 362900 }, { "epoch": 1.83, "learning_rate": 2.5360852828551388e-05, "loss": 0.0081, "step": 362910 }, { "epoch": 1.83, "learning_rate": 2.535328513553738e-05, "loss": 0.0071, "step": 362920 }, { "epoch": 1.83, "learning_rate": 2.5345717442523368e-05, "loss": 0.0067, "step": 362930 }, { "epoch": 1.83, "learning_rate": 2.533814974950936e-05, "loss": 0.0065, "step": 362940 }, { "epoch": 1.83, "learning_rate": 2.5330582056495348e-05, "loss": 0.0061, "step": 362950 }, { "epoch": 1.83, "learning_rate": 2.532301436348134e-05, "loss": 0.004, "step": 362960 }, { "epoch": 1.83, "learning_rate": 2.5315446670467328e-05, "loss": 0.0056, "step": 362970 }, { "epoch": 1.83, "learning_rate": 2.530787897745332e-05, "loss": 0.0048, "step": 362980 }, { "epoch": 1.83, "learning_rate": 2.530031128443931e-05, "loss": 0.0088, "step": 362990 }, { "epoch": 1.83, "learning_rate": 2.52927435914253e-05, "loss": 0.0045, "step": 363000 }, { "epoch": 1.83, "eval_cer": 0.9144324104542716, "eval_loss": 0.004368518013507128, "eval_runtime": 116.7968, "eval_samples_per_second": 17.124, "eval_steps_per_second": 4.281, "step": 363000 }, { "epoch": 1.83, "learning_rate": 2.5285175898411284e-05, "loss": 0.0062, "step": 363010 }, { "epoch": 1.83, "learning_rate": 2.5277608205397275e-05, "loss": 0.0062, "step": 363020 }, { "epoch": 1.83, "learning_rate": 2.5270040512383264e-05, "loss": 0.0061, "step": 363030 }, { "epoch": 1.83, "learning_rate": 2.5262472819369255e-05, "loss": 0.0047, "step": 363040 }, { "epoch": 1.83, "learning_rate": 2.5254905126355243e-05, "loss": 0.0046, "step": 363050 }, { "epoch": 1.83, "learning_rate": 2.5247337433341235e-05, "loss": 0.0072, "step": 363060 }, { "epoch": 1.83, "learning_rate": 2.5239769740327223e-05, "loss": 0.0071, "step": 363070 }, { "epoch": 1.83, "learning_rate": 2.5232202047313215e-05, "loss": 0.0081, "step": 363080 }, { "epoch": 1.83, "learning_rate": 2.5224634354299203e-05, "loss": 0.0079, "step": 363090 }, { "epoch": 1.83, "learning_rate": 2.5217066661285195e-05, "loss": 0.0046, "step": 363100 }, { "epoch": 1.83, "learning_rate": 2.5209498968271183e-05, "loss": 0.0065, "step": 363110 }, { "epoch": 1.83, "learning_rate": 2.5201931275257175e-05, "loss": 0.0054, "step": 363120 }, { "epoch": 1.83, "learning_rate": 2.5194363582243163e-05, "loss": 0.005, "step": 363130 }, { "epoch": 1.83, "learning_rate": 2.5186795889229154e-05, "loss": 0.0062, "step": 363140 }, { "epoch": 1.83, "learning_rate": 2.5179228196215143e-05, "loss": 0.006, "step": 363150 }, { "epoch": 1.83, "learning_rate": 2.5171660503201134e-05, "loss": 0.0087, "step": 363160 }, { "epoch": 1.83, "learning_rate": 2.516409281018712e-05, "loss": 0.0048, "step": 363170 }, { "epoch": 1.83, "learning_rate": 2.515652511717311e-05, "loss": 0.0053, "step": 363180 }, { "epoch": 1.83, "learning_rate": 2.51489574241591e-05, "loss": 0.006, "step": 363190 }, { "epoch": 1.83, "learning_rate": 2.514138973114509e-05, "loss": 0.0057, "step": 363200 }, { "epoch": 1.83, "learning_rate": 2.513382203813108e-05, "loss": 0.0076, "step": 363210 }, { "epoch": 1.83, "learning_rate": 2.512625434511707e-05, "loss": 0.005, "step": 363220 }, { "epoch": 1.83, "learning_rate": 2.511868665210306e-05, "loss": 0.006, "step": 363230 }, { "epoch": 1.83, "learning_rate": 2.511111895908905e-05, "loss": 0.0041, "step": 363240 }, { "epoch": 1.83, "learning_rate": 2.510355126607504e-05, "loss": 0.0079, "step": 363250 }, { "epoch": 1.83, "learning_rate": 2.509598357306103e-05, "loss": 0.0062, "step": 363260 }, { "epoch": 1.83, "learning_rate": 2.5088415880047018e-05, "loss": 0.0057, "step": 363270 }, { "epoch": 1.83, "learning_rate": 2.508084818703301e-05, "loss": 0.0059, "step": 363280 }, { "epoch": 1.83, "learning_rate": 2.5073280494018998e-05, "loss": 0.0076, "step": 363290 }, { "epoch": 1.83, "learning_rate": 2.506571280100499e-05, "loss": 0.0045, "step": 363300 }, { "epoch": 1.83, "learning_rate": 2.5058145107990978e-05, "loss": 0.0058, "step": 363310 }, { "epoch": 1.83, "learning_rate": 2.5050577414976966e-05, "loss": 0.0056, "step": 363320 }, { "epoch": 1.83, "learning_rate": 2.5043009721962954e-05, "loss": 0.0055, "step": 363330 }, { "epoch": 1.83, "learning_rate": 2.5035442028948946e-05, "loss": 0.0068, "step": 363340 }, { "epoch": 1.83, "learning_rate": 2.5027874335934934e-05, "loss": 0.007, "step": 363350 }, { "epoch": 1.83, "learning_rate": 2.5020306642920926e-05, "loss": 0.0048, "step": 363360 }, { "epoch": 1.83, "learning_rate": 2.5012738949906914e-05, "loss": 0.0047, "step": 363370 }, { "epoch": 1.83, "learning_rate": 2.5005171256892906e-05, "loss": 0.0059, "step": 363380 }, { "epoch": 1.83, "learning_rate": 2.4997603563878894e-05, "loss": 0.0045, "step": 363390 }, { "epoch": 1.83, "learning_rate": 2.4990035870864885e-05, "loss": 0.0066, "step": 363400 }, { "epoch": 1.83, "learning_rate": 2.4982468177850874e-05, "loss": 0.0053, "step": 363410 }, { "epoch": 1.83, "learning_rate": 2.4974900484836865e-05, "loss": 0.0041, "step": 363420 }, { "epoch": 1.83, "learning_rate": 2.4967332791822853e-05, "loss": 0.0074, "step": 363430 }, { "epoch": 1.83, "learning_rate": 2.4959765098808845e-05, "loss": 0.0078, "step": 363440 }, { "epoch": 1.83, "learning_rate": 2.4952197405794833e-05, "loss": 0.008, "step": 363450 }, { "epoch": 1.83, "learning_rate": 2.4944629712780825e-05, "loss": 0.0049, "step": 363460 }, { "epoch": 1.83, "learning_rate": 2.4937062019766813e-05, "loss": 0.0061, "step": 363470 }, { "epoch": 1.83, "learning_rate": 2.49294943267528e-05, "loss": 0.0058, "step": 363480 }, { "epoch": 1.83, "learning_rate": 2.492192663373879e-05, "loss": 0.0044, "step": 363490 }, { "epoch": 1.83, "learning_rate": 2.491435894072478e-05, "loss": 0.0055, "step": 363500 }, { "epoch": 1.83, "learning_rate": 2.490679124771077e-05, "loss": 0.0052, "step": 363510 }, { "epoch": 1.83, "learning_rate": 2.489922355469676e-05, "loss": 0.0052, "step": 363520 }, { "epoch": 1.83, "learning_rate": 2.489165586168275e-05, "loss": 0.0049, "step": 363530 }, { "epoch": 1.83, "learning_rate": 2.488408816866874e-05, "loss": 0.0056, "step": 363540 }, { "epoch": 1.83, "learning_rate": 2.487652047565473e-05, "loss": 0.0059, "step": 363550 }, { "epoch": 1.83, "learning_rate": 2.486895278264072e-05, "loss": 0.0062, "step": 363560 }, { "epoch": 1.83, "learning_rate": 2.486138508962671e-05, "loss": 0.0074, "step": 363570 }, { "epoch": 1.83, "learning_rate": 2.48538173966127e-05, "loss": 0.005, "step": 363580 }, { "epoch": 1.83, "learning_rate": 2.484624970359869e-05, "loss": 0.0047, "step": 363590 }, { "epoch": 1.83, "learning_rate": 2.483868201058468e-05, "loss": 0.0092, "step": 363600 }, { "epoch": 1.83, "learning_rate": 2.483111431757067e-05, "loss": 0.0067, "step": 363610 }, { "epoch": 1.83, "learning_rate": 2.482354662455666e-05, "loss": 0.0083, "step": 363620 }, { "epoch": 1.83, "learning_rate": 2.4815978931542648e-05, "loss": 0.006, "step": 363630 }, { "epoch": 1.83, "learning_rate": 2.4808411238528633e-05, "loss": 0.0065, "step": 363640 }, { "epoch": 1.83, "learning_rate": 2.4800843545514625e-05, "loss": 0.0067, "step": 363650 }, { "epoch": 1.83, "learning_rate": 2.4793275852500613e-05, "loss": 0.0042, "step": 363660 }, { "epoch": 1.83, "learning_rate": 2.4785708159486605e-05, "loss": 0.0044, "step": 363670 }, { "epoch": 1.83, "learning_rate": 2.4778140466472593e-05, "loss": 0.0048, "step": 363680 }, { "epoch": 1.83, "learning_rate": 2.4770572773458584e-05, "loss": 0.0057, "step": 363690 }, { "epoch": 1.83, "learning_rate": 2.4763005080444576e-05, "loss": 0.0062, "step": 363700 }, { "epoch": 1.83, "learning_rate": 2.4755437387430564e-05, "loss": 0.0062, "step": 363710 }, { "epoch": 1.84, "learning_rate": 2.4747869694416556e-05, "loss": 0.0048, "step": 363720 }, { "epoch": 1.84, "learning_rate": 2.4740302001402544e-05, "loss": 0.0061, "step": 363730 }, { "epoch": 1.84, "learning_rate": 2.4732734308388536e-05, "loss": 0.0067, "step": 363740 }, { "epoch": 1.84, "learning_rate": 2.4725166615374524e-05, "loss": 0.0059, "step": 363750 }, { "epoch": 1.84, "learning_rate": 2.4717598922360515e-05, "loss": 0.0052, "step": 363760 }, { "epoch": 1.84, "learning_rate": 2.4710031229346504e-05, "loss": 0.0037, "step": 363770 }, { "epoch": 1.84, "learning_rate": 2.4702463536332495e-05, "loss": 0.0053, "step": 363780 }, { "epoch": 1.84, "learning_rate": 2.4694895843318483e-05, "loss": 0.007, "step": 363790 }, { "epoch": 1.84, "learning_rate": 2.468732815030447e-05, "loss": 0.0055, "step": 363800 }, { "epoch": 1.84, "learning_rate": 2.467976045729046e-05, "loss": 0.0065, "step": 363810 }, { "epoch": 1.84, "learning_rate": 2.4672192764276448e-05, "loss": 0.004, "step": 363820 }, { "epoch": 1.84, "learning_rate": 2.466462507126244e-05, "loss": 0.0065, "step": 363830 }, { "epoch": 1.84, "learning_rate": 2.4657057378248428e-05, "loss": 0.007, "step": 363840 }, { "epoch": 1.84, "learning_rate": 2.464948968523442e-05, "loss": 0.0065, "step": 363850 }, { "epoch": 1.84, "learning_rate": 2.4641921992220408e-05, "loss": 0.0046, "step": 363860 }, { "epoch": 1.84, "learning_rate": 2.46343542992064e-05, "loss": 0.0065, "step": 363870 }, { "epoch": 1.84, "learning_rate": 2.4626786606192388e-05, "loss": 0.0052, "step": 363880 }, { "epoch": 1.84, "learning_rate": 2.461921891317838e-05, "loss": 0.0069, "step": 363890 }, { "epoch": 1.84, "learning_rate": 2.4611651220164367e-05, "loss": 0.0072, "step": 363900 }, { "epoch": 1.84, "learning_rate": 2.460408352715036e-05, "loss": 0.0074, "step": 363910 }, { "epoch": 1.84, "learning_rate": 2.4596515834136347e-05, "loss": 0.0058, "step": 363920 }, { "epoch": 1.84, "learning_rate": 2.458894814112234e-05, "loss": 0.0069, "step": 363930 }, { "epoch": 1.84, "learning_rate": 2.4581380448108327e-05, "loss": 0.0073, "step": 363940 }, { "epoch": 1.84, "learning_rate": 2.4573812755094315e-05, "loss": 0.0068, "step": 363950 }, { "epoch": 1.84, "learning_rate": 2.4566245062080304e-05, "loss": 0.0043, "step": 363960 }, { "epoch": 1.84, "learning_rate": 2.4558677369066295e-05, "loss": 0.004, "step": 363970 }, { "epoch": 1.84, "learning_rate": 2.4551109676052283e-05, "loss": 0.0039, "step": 363980 }, { "epoch": 1.84, "learning_rate": 2.4543541983038275e-05, "loss": 0.0056, "step": 363990 }, { "epoch": 1.84, "learning_rate": 2.4535974290024263e-05, "loss": 0.0058, "step": 364000 }, { "epoch": 1.84, "eval_cer": 0.9144071801550111, "eval_loss": 0.004426935221999884, "eval_runtime": 116.6371, "eval_samples_per_second": 17.147, "eval_steps_per_second": 4.287, "step": 364000 }, { "epoch": 1.84, "learning_rate": 2.4528406597010255e-05, "loss": 0.0055, "step": 364010 }, { "epoch": 1.84, "learning_rate": 2.4520838903996243e-05, "loss": 0.006, "step": 364020 }, { "epoch": 1.84, "learning_rate": 2.4513271210982235e-05, "loss": 0.0074, "step": 364030 }, { "epoch": 1.84, "learning_rate": 2.4505703517968223e-05, "loss": 0.0064, "step": 364040 }, { "epoch": 1.84, "learning_rate": 2.4498135824954214e-05, "loss": 0.0067, "step": 364050 }, { "epoch": 1.84, "learning_rate": 2.4490568131940203e-05, "loss": 0.0051, "step": 364060 }, { "epoch": 1.84, "learning_rate": 2.4483000438926194e-05, "loss": 0.0048, "step": 364070 }, { "epoch": 1.84, "learning_rate": 2.4475432745912182e-05, "loss": 0.007, "step": 364080 }, { "epoch": 1.84, "learning_rate": 2.4467865052898174e-05, "loss": 0.0066, "step": 364090 }, { "epoch": 1.84, "learning_rate": 2.4460297359884162e-05, "loss": 0.0058, "step": 364100 }, { "epoch": 1.84, "learning_rate": 2.445272966687015e-05, "loss": 0.0048, "step": 364110 }, { "epoch": 1.84, "learning_rate": 2.444516197385614e-05, "loss": 0.0044, "step": 364120 }, { "epoch": 1.84, "learning_rate": 2.443759428084213e-05, "loss": 0.0064, "step": 364130 }, { "epoch": 1.84, "learning_rate": 2.443002658782812e-05, "loss": 0.0062, "step": 364140 }, { "epoch": 1.84, "learning_rate": 2.442245889481411e-05, "loss": 0.0054, "step": 364150 }, { "epoch": 1.84, "learning_rate": 2.44148912018001e-05, "loss": 0.0049, "step": 364160 }, { "epoch": 1.84, "learning_rate": 2.440732350878609e-05, "loss": 0.0049, "step": 364170 }, { "epoch": 1.84, "learning_rate": 2.4399755815772078e-05, "loss": 0.0063, "step": 364180 }, { "epoch": 1.84, "learning_rate": 2.439218812275807e-05, "loss": 0.0054, "step": 364190 }, { "epoch": 1.84, "learning_rate": 2.4384620429744058e-05, "loss": 0.005, "step": 364200 }, { "epoch": 1.84, "learning_rate": 2.437705273673005e-05, "loss": 0.0052, "step": 364210 }, { "epoch": 1.84, "learning_rate": 2.4369485043716038e-05, "loss": 0.0083, "step": 364220 }, { "epoch": 1.84, "learning_rate": 2.436191735070203e-05, "loss": 0.0056, "step": 364230 }, { "epoch": 1.84, "learning_rate": 2.4354349657688018e-05, "loss": 0.0063, "step": 364240 }, { "epoch": 1.84, "learning_rate": 2.434678196467401e-05, "loss": 0.0061, "step": 364250 }, { "epoch": 1.84, "learning_rate": 2.4339214271659998e-05, "loss": 0.006, "step": 364260 }, { "epoch": 1.84, "learning_rate": 2.4331646578645986e-05, "loss": 0.0062, "step": 364270 }, { "epoch": 1.84, "learning_rate": 2.4324078885631974e-05, "loss": 0.0061, "step": 364280 }, { "epoch": 1.84, "learning_rate": 2.4316511192617966e-05, "loss": 0.005, "step": 364290 }, { "epoch": 1.84, "learning_rate": 2.4308943499603954e-05, "loss": 0.005, "step": 364300 }, { "epoch": 1.84, "learning_rate": 2.4301375806589945e-05, "loss": 0.0085, "step": 364310 }, { "epoch": 1.84, "learning_rate": 2.4293808113575934e-05, "loss": 0.0096, "step": 364320 }, { "epoch": 1.84, "learning_rate": 2.4286240420561925e-05, "loss": 0.0056, "step": 364330 }, { "epoch": 1.84, "learning_rate": 2.4278672727547913e-05, "loss": 0.0081, "step": 364340 }, { "epoch": 1.84, "learning_rate": 2.4271105034533905e-05, "loss": 0.0048, "step": 364350 }, { "epoch": 1.84, "learning_rate": 2.4263537341519893e-05, "loss": 0.0052, "step": 364360 }, { "epoch": 1.84, "learning_rate": 2.4255969648505885e-05, "loss": 0.0048, "step": 364370 }, { "epoch": 1.84, "learning_rate": 2.4248401955491873e-05, "loss": 0.0046, "step": 364380 }, { "epoch": 1.84, "learning_rate": 2.4240834262477865e-05, "loss": 0.0079, "step": 364390 }, { "epoch": 1.84, "learning_rate": 2.4233266569463853e-05, "loss": 0.0051, "step": 364400 }, { "epoch": 1.84, "learning_rate": 2.4225698876449845e-05, "loss": 0.0056, "step": 364410 }, { "epoch": 1.84, "learning_rate": 2.421813118343583e-05, "loss": 0.0053, "step": 364420 }, { "epoch": 1.84, "learning_rate": 2.421056349042182e-05, "loss": 0.0048, "step": 364430 }, { "epoch": 1.84, "learning_rate": 2.420299579740781e-05, "loss": 0.0057, "step": 364440 }, { "epoch": 1.84, "learning_rate": 2.41954281043938e-05, "loss": 0.0048, "step": 364450 }, { "epoch": 1.84, "learning_rate": 2.418786041137979e-05, "loss": 0.0048, "step": 364460 }, { "epoch": 1.84, "learning_rate": 2.418029271836578e-05, "loss": 0.0061, "step": 364470 }, { "epoch": 1.84, "learning_rate": 2.417272502535177e-05, "loss": 0.0056, "step": 364480 }, { "epoch": 1.84, "learning_rate": 2.416515733233776e-05, "loss": 0.0045, "step": 364490 }, { "epoch": 1.84, "learning_rate": 2.415758963932375e-05, "loss": 0.005, "step": 364500 }, { "epoch": 1.84, "learning_rate": 2.415002194630974e-05, "loss": 0.0048, "step": 364510 }, { "epoch": 1.84, "learning_rate": 2.414245425329573e-05, "loss": 0.0047, "step": 364520 }, { "epoch": 1.84, "learning_rate": 2.413488656028172e-05, "loss": 0.0063, "step": 364530 }, { "epoch": 1.84, "learning_rate": 2.412731886726771e-05, "loss": 0.0065, "step": 364540 }, { "epoch": 1.84, "learning_rate": 2.41197511742537e-05, "loss": 0.0071, "step": 364550 }, { "epoch": 1.84, "learning_rate": 2.4112183481239688e-05, "loss": 0.0055, "step": 364560 }, { "epoch": 1.84, "learning_rate": 2.410461578822568e-05, "loss": 0.0047, "step": 364570 }, { "epoch": 1.84, "learning_rate": 2.4097048095211665e-05, "loss": 0.0059, "step": 364580 }, { "epoch": 1.84, "learning_rate": 2.4089480402197653e-05, "loss": 0.0064, "step": 364590 }, { "epoch": 1.84, "learning_rate": 2.4081912709183644e-05, "loss": 0.0052, "step": 364600 }, { "epoch": 1.84, "learning_rate": 2.4074345016169633e-05, "loss": 0.0067, "step": 364610 }, { "epoch": 1.84, "learning_rate": 2.4066777323155624e-05, "loss": 0.0045, "step": 364620 }, { "epoch": 1.84, "learning_rate": 2.4059209630141612e-05, "loss": 0.0077, "step": 364630 }, { "epoch": 1.84, "learning_rate": 2.4051641937127604e-05, "loss": 0.0061, "step": 364640 }, { "epoch": 1.84, "learning_rate": 2.4044074244113592e-05, "loss": 0.0049, "step": 364650 }, { "epoch": 1.84, "learning_rate": 2.4036506551099584e-05, "loss": 0.0055, "step": 364660 }, { "epoch": 1.84, "learning_rate": 2.4028938858085575e-05, "loss": 0.0048, "step": 364670 }, { "epoch": 1.84, "learning_rate": 2.4021371165071564e-05, "loss": 0.0047, "step": 364680 }, { "epoch": 1.84, "learning_rate": 2.4013803472057555e-05, "loss": 0.0062, "step": 364690 }, { "epoch": 1.84, "learning_rate": 2.4006235779043544e-05, "loss": 0.0066, "step": 364700 }, { "epoch": 1.84, "learning_rate": 2.3998668086029535e-05, "loss": 0.0053, "step": 364710 }, { "epoch": 1.84, "learning_rate": 2.3991100393015523e-05, "loss": 0.0043, "step": 364720 }, { "epoch": 1.84, "learning_rate": 2.3983532700001515e-05, "loss": 0.0054, "step": 364730 }, { "epoch": 1.84, "learning_rate": 2.39759650069875e-05, "loss": 0.0055, "step": 364740 }, { "epoch": 1.84, "learning_rate": 2.3968397313973488e-05, "loss": 0.0058, "step": 364750 }, { "epoch": 1.84, "learning_rate": 2.396082962095948e-05, "loss": 0.0056, "step": 364760 }, { "epoch": 1.84, "learning_rate": 2.3953261927945468e-05, "loss": 0.0051, "step": 364770 }, { "epoch": 1.84, "learning_rate": 2.394569423493146e-05, "loss": 0.0061, "step": 364780 }, { "epoch": 1.84, "learning_rate": 2.3938126541917448e-05, "loss": 0.0068, "step": 364790 }, { "epoch": 1.84, "learning_rate": 2.393055884890344e-05, "loss": 0.0056, "step": 364800 }, { "epoch": 1.84, "learning_rate": 2.3922991155889427e-05, "loss": 0.0046, "step": 364810 }, { "epoch": 1.84, "learning_rate": 2.391542346287542e-05, "loss": 0.0066, "step": 364820 }, { "epoch": 1.84, "learning_rate": 2.3907855769861407e-05, "loss": 0.0063, "step": 364830 }, { "epoch": 1.84, "learning_rate": 2.39002880768474e-05, "loss": 0.0067, "step": 364840 }, { "epoch": 1.84, "learning_rate": 2.3892720383833387e-05, "loss": 0.0056, "step": 364850 }, { "epoch": 1.84, "learning_rate": 2.388515269081938e-05, "loss": 0.0039, "step": 364860 }, { "epoch": 1.84, "learning_rate": 2.3877584997805367e-05, "loss": 0.0083, "step": 364870 }, { "epoch": 1.84, "learning_rate": 2.387001730479136e-05, "loss": 0.0064, "step": 364880 }, { "epoch": 1.84, "learning_rate": 2.3862449611777343e-05, "loss": 0.0097, "step": 364890 }, { "epoch": 1.84, "learning_rate": 2.3854881918763335e-05, "loss": 0.0063, "step": 364900 }, { "epoch": 1.84, "learning_rate": 2.3847314225749323e-05, "loss": 0.0059, "step": 364910 }, { "epoch": 1.84, "learning_rate": 2.3839746532735315e-05, "loss": 0.0048, "step": 364920 }, { "epoch": 1.84, "learning_rate": 2.3832178839721303e-05, "loss": 0.0045, "step": 364930 }, { "epoch": 1.84, "learning_rate": 2.3824611146707295e-05, "loss": 0.0064, "step": 364940 }, { "epoch": 1.84, "learning_rate": 2.3817043453693283e-05, "loss": 0.0047, "step": 364950 }, { "epoch": 1.84, "learning_rate": 2.3809475760679274e-05, "loss": 0.0058, "step": 364960 }, { "epoch": 1.84, "learning_rate": 2.3801908067665263e-05, "loss": 0.0059, "step": 364970 }, { "epoch": 1.84, "learning_rate": 2.3794340374651254e-05, "loss": 0.004, "step": 364980 }, { "epoch": 1.84, "learning_rate": 2.3786772681637243e-05, "loss": 0.0045, "step": 364990 }, { "epoch": 1.84, "learning_rate": 2.3779204988623234e-05, "loss": 0.0054, "step": 365000 }, { "epoch": 1.84, "eval_cer": 0.9144207657007667, "eval_loss": 0.0044406414963305, "eval_runtime": 116.6279, "eval_samples_per_second": 17.149, "eval_steps_per_second": 4.287, "step": 365000 }, { "epoch": 1.84, "learning_rate": 2.3771637295609222e-05, "loss": 0.004, "step": 365010 }, { "epoch": 1.84, "learning_rate": 2.3764069602595214e-05, "loss": 0.0067, "step": 365020 }, { "epoch": 1.84, "learning_rate": 2.3756501909581202e-05, "loss": 0.0058, "step": 365030 }, { "epoch": 1.84, "learning_rate": 2.3748934216567194e-05, "loss": 0.0055, "step": 365040 }, { "epoch": 1.84, "learning_rate": 2.374136652355318e-05, "loss": 0.0063, "step": 365050 }, { "epoch": 1.84, "learning_rate": 2.373379883053917e-05, "loss": 0.0056, "step": 365060 }, { "epoch": 1.84, "learning_rate": 2.372623113752516e-05, "loss": 0.007, "step": 365070 }, { "epoch": 1.84, "learning_rate": 2.371866344451115e-05, "loss": 0.0063, "step": 365080 }, { "epoch": 1.84, "learning_rate": 2.3711095751497138e-05, "loss": 0.0058, "step": 365090 }, { "epoch": 1.84, "learning_rate": 2.370352805848313e-05, "loss": 0.0053, "step": 365100 }, { "epoch": 1.84, "learning_rate": 2.3695960365469118e-05, "loss": 0.0065, "step": 365110 }, { "epoch": 1.84, "learning_rate": 2.368839267245511e-05, "loss": 0.0032, "step": 365120 }, { "epoch": 1.84, "learning_rate": 2.3680824979441098e-05, "loss": 0.0056, "step": 365130 }, { "epoch": 1.84, "learning_rate": 2.367325728642709e-05, "loss": 0.0047, "step": 365140 }, { "epoch": 1.84, "learning_rate": 2.3665689593413078e-05, "loss": 0.0051, "step": 365150 }, { "epoch": 1.84, "learning_rate": 2.365812190039907e-05, "loss": 0.0054, "step": 365160 }, { "epoch": 1.84, "learning_rate": 2.3650554207385058e-05, "loss": 0.0056, "step": 365170 }, { "epoch": 1.84, "learning_rate": 2.364298651437105e-05, "loss": 0.0054, "step": 365180 }, { "epoch": 1.84, "learning_rate": 2.3635418821357037e-05, "loss": 0.005, "step": 365190 }, { "epoch": 1.84, "learning_rate": 2.362785112834303e-05, "loss": 0.0056, "step": 365200 }, { "epoch": 1.84, "learning_rate": 2.3620283435329014e-05, "loss": 0.0072, "step": 365210 }, { "epoch": 1.84, "learning_rate": 2.3612715742315005e-05, "loss": 0.0042, "step": 365220 }, { "epoch": 1.84, "learning_rate": 2.3605148049300994e-05, "loss": 0.0073, "step": 365230 }, { "epoch": 1.84, "learning_rate": 2.3597580356286985e-05, "loss": 0.0079, "step": 365240 }, { "epoch": 1.84, "learning_rate": 2.3590012663272973e-05, "loss": 0.0054, "step": 365250 }, { "epoch": 1.84, "learning_rate": 2.3582444970258965e-05, "loss": 0.0055, "step": 365260 }, { "epoch": 1.84, "learning_rate": 2.3574877277244953e-05, "loss": 0.0067, "step": 365270 }, { "epoch": 1.84, "learning_rate": 2.3567309584230945e-05, "loss": 0.0083, "step": 365280 }, { "epoch": 1.84, "learning_rate": 2.3559741891216933e-05, "loss": 0.0051, "step": 365290 }, { "epoch": 1.84, "learning_rate": 2.3552174198202925e-05, "loss": 0.0046, "step": 365300 }, { "epoch": 1.84, "learning_rate": 2.3544606505188913e-05, "loss": 0.0056, "step": 365310 }, { "epoch": 1.84, "learning_rate": 2.3537038812174905e-05, "loss": 0.0059, "step": 365320 }, { "epoch": 1.84, "learning_rate": 2.3529471119160893e-05, "loss": 0.0046, "step": 365330 }, { "epoch": 1.84, "learning_rate": 2.3521903426146884e-05, "loss": 0.0064, "step": 365340 }, { "epoch": 1.84, "learning_rate": 2.3514335733132873e-05, "loss": 0.0057, "step": 365350 }, { "epoch": 1.84, "learning_rate": 2.3506768040118864e-05, "loss": 0.0059, "step": 365360 }, { "epoch": 1.84, "learning_rate": 2.349920034710485e-05, "loss": 0.0049, "step": 365370 }, { "epoch": 1.84, "learning_rate": 2.3491632654090837e-05, "loss": 0.0061, "step": 365380 }, { "epoch": 1.84, "learning_rate": 2.348406496107683e-05, "loss": 0.0052, "step": 365390 }, { "epoch": 1.84, "learning_rate": 2.347649726806282e-05, "loss": 0.0071, "step": 365400 }, { "epoch": 1.84, "learning_rate": 2.346892957504881e-05, "loss": 0.0056, "step": 365410 }, { "epoch": 1.84, "learning_rate": 2.34613618820348e-05, "loss": 0.006, "step": 365420 }, { "epoch": 1.84, "learning_rate": 2.345379418902079e-05, "loss": 0.0054, "step": 365430 }, { "epoch": 1.84, "learning_rate": 2.344622649600678e-05, "loss": 0.0058, "step": 365440 }, { "epoch": 1.84, "learning_rate": 2.343865880299277e-05, "loss": 0.0073, "step": 365450 }, { "epoch": 1.84, "learning_rate": 2.343109110997876e-05, "loss": 0.0074, "step": 365460 }, { "epoch": 1.84, "learning_rate": 2.3423523416964748e-05, "loss": 0.0055, "step": 365470 }, { "epoch": 1.84, "learning_rate": 2.341595572395074e-05, "loss": 0.0062, "step": 365480 }, { "epoch": 1.84, "learning_rate": 2.3408388030936728e-05, "loss": 0.0054, "step": 365490 }, { "epoch": 1.84, "learning_rate": 2.340082033792272e-05, "loss": 0.0058, "step": 365500 }, { "epoch": 1.84, "learning_rate": 2.3393252644908708e-05, "loss": 0.0069, "step": 365510 }, { "epoch": 1.84, "learning_rate": 2.3385684951894693e-05, "loss": 0.0055, "step": 365520 }, { "epoch": 1.84, "learning_rate": 2.3378117258880684e-05, "loss": 0.0055, "step": 365530 }, { "epoch": 1.84, "learning_rate": 2.3370549565866672e-05, "loss": 0.0039, "step": 365540 }, { "epoch": 1.84, "learning_rate": 2.3362981872852664e-05, "loss": 0.0066, "step": 365550 }, { "epoch": 1.84, "learning_rate": 2.3355414179838652e-05, "loss": 0.0055, "step": 365560 }, { "epoch": 1.84, "learning_rate": 2.3347846486824644e-05, "loss": 0.0081, "step": 365570 }, { "epoch": 1.84, "learning_rate": 2.3340278793810632e-05, "loss": 0.0068, "step": 365580 }, { "epoch": 1.84, "learning_rate": 2.3332711100796624e-05, "loss": 0.0064, "step": 365590 }, { "epoch": 1.84, "learning_rate": 2.3325143407782612e-05, "loss": 0.0052, "step": 365600 }, { "epoch": 1.84, "learning_rate": 2.3317575714768604e-05, "loss": 0.0057, "step": 365610 }, { "epoch": 1.84, "learning_rate": 2.3310008021754592e-05, "loss": 0.0037, "step": 365620 }, { "epoch": 1.84, "learning_rate": 2.3302440328740583e-05, "loss": 0.0042, "step": 365630 }, { "epoch": 1.84, "learning_rate": 2.3294872635726575e-05, "loss": 0.0054, "step": 365640 }, { "epoch": 1.84, "learning_rate": 2.3287304942712563e-05, "loss": 0.0048, "step": 365650 }, { "epoch": 1.84, "learning_rate": 2.3279737249698555e-05, "loss": 0.0053, "step": 365660 }, { "epoch": 1.84, "learning_rate": 2.3272169556684543e-05, "loss": 0.0039, "step": 365670 }, { "epoch": 1.84, "learning_rate": 2.3264601863670528e-05, "loss": 0.005, "step": 365680 }, { "epoch": 1.84, "learning_rate": 2.325703417065652e-05, "loss": 0.0067, "step": 365690 }, { "epoch": 1.84, "learning_rate": 2.3249466477642508e-05, "loss": 0.0058, "step": 365700 }, { "epoch": 1.85, "learning_rate": 2.32418987846285e-05, "loss": 0.0065, "step": 365710 }, { "epoch": 1.85, "learning_rate": 2.3234331091614488e-05, "loss": 0.0055, "step": 365720 }, { "epoch": 1.85, "learning_rate": 2.322676339860048e-05, "loss": 0.0078, "step": 365730 }, { "epoch": 1.85, "learning_rate": 2.3219195705586467e-05, "loss": 0.0055, "step": 365740 }, { "epoch": 1.85, "learning_rate": 2.321162801257246e-05, "loss": 0.0074, "step": 365750 }, { "epoch": 1.85, "learning_rate": 2.3204060319558447e-05, "loss": 0.0057, "step": 365760 }, { "epoch": 1.85, "learning_rate": 2.319649262654444e-05, "loss": 0.006, "step": 365770 }, { "epoch": 1.85, "learning_rate": 2.3188924933530427e-05, "loss": 0.0105, "step": 365780 }, { "epoch": 1.85, "learning_rate": 2.318135724051642e-05, "loss": 0.0054, "step": 365790 }, { "epoch": 1.85, "learning_rate": 2.3173789547502407e-05, "loss": 0.0059, "step": 365800 }, { "epoch": 1.85, "learning_rate": 2.31662218544884e-05, "loss": 0.0075, "step": 365810 }, { "epoch": 1.85, "learning_rate": 2.3158654161474387e-05, "loss": 0.0051, "step": 365820 }, { "epoch": 1.85, "learning_rate": 2.3151086468460378e-05, "loss": 0.0066, "step": 365830 }, { "epoch": 1.85, "learning_rate": 2.3143518775446363e-05, "loss": 0.0042, "step": 365840 }, { "epoch": 1.85, "learning_rate": 2.3135951082432355e-05, "loss": 0.0051, "step": 365850 }, { "epoch": 1.85, "learning_rate": 2.3128383389418343e-05, "loss": 0.0064, "step": 365860 }, { "epoch": 1.85, "learning_rate": 2.3120815696404335e-05, "loss": 0.0054, "step": 365870 }, { "epoch": 1.85, "learning_rate": 2.3113248003390323e-05, "loss": 0.0041, "step": 365880 }, { "epoch": 1.85, "learning_rate": 2.3105680310376314e-05, "loss": 0.0057, "step": 365890 }, { "epoch": 1.85, "learning_rate": 2.3098112617362303e-05, "loss": 0.0057, "step": 365900 }, { "epoch": 1.85, "learning_rate": 2.3090544924348294e-05, "loss": 0.0064, "step": 365910 }, { "epoch": 1.85, "learning_rate": 2.3082977231334282e-05, "loss": 0.0051, "step": 365920 }, { "epoch": 1.85, "learning_rate": 2.3075409538320274e-05, "loss": 0.0053, "step": 365930 }, { "epoch": 1.85, "learning_rate": 2.3067841845306262e-05, "loss": 0.0063, "step": 365940 }, { "epoch": 1.85, "learning_rate": 2.3060274152292254e-05, "loss": 0.0064, "step": 365950 }, { "epoch": 1.85, "learning_rate": 2.3052706459278242e-05, "loss": 0.0065, "step": 365960 }, { "epoch": 1.85, "learning_rate": 2.3045138766264234e-05, "loss": 0.0063, "step": 365970 }, { "epoch": 1.85, "learning_rate": 2.3037571073250222e-05, "loss": 0.0052, "step": 365980 }, { "epoch": 1.85, "learning_rate": 2.303000338023621e-05, "loss": 0.0091, "step": 365990 }, { "epoch": 1.85, "learning_rate": 2.30224356872222e-05, "loss": 0.0038, "step": 366000 }, { "epoch": 1.85, "eval_cer": 0.914423676889143, "eval_loss": 0.004396693781018257, "eval_runtime": 116.8468, "eval_samples_per_second": 17.116, "eval_steps_per_second": 4.279, "step": 366000 }, { "epoch": 1.85, "learning_rate": 2.301486799420819e-05, "loss": 0.0056, "step": 366010 }, { "epoch": 1.85, "learning_rate": 2.3007300301194178e-05, "loss": 0.005, "step": 366020 }, { "epoch": 1.85, "learning_rate": 2.299973260818017e-05, "loss": 0.0065, "step": 366030 }, { "epoch": 1.85, "learning_rate": 2.2992164915166158e-05, "loss": 0.0061, "step": 366040 }, { "epoch": 1.85, "learning_rate": 2.298459722215215e-05, "loss": 0.0049, "step": 366050 }, { "epoch": 1.85, "learning_rate": 2.2977029529138138e-05, "loss": 0.0045, "step": 366060 }, { "epoch": 1.85, "learning_rate": 2.296946183612413e-05, "loss": 0.0051, "step": 366070 }, { "epoch": 1.85, "learning_rate": 2.2961894143110118e-05, "loss": 0.006, "step": 366080 }, { "epoch": 1.85, "learning_rate": 2.295432645009611e-05, "loss": 0.0051, "step": 366090 }, { "epoch": 1.85, "learning_rate": 2.2946758757082097e-05, "loss": 0.0056, "step": 366100 }, { "epoch": 1.85, "learning_rate": 2.293919106406809e-05, "loss": 0.0087, "step": 366110 }, { "epoch": 1.85, "learning_rate": 2.2931623371054077e-05, "loss": 0.0076, "step": 366120 }, { "epoch": 1.85, "learning_rate": 2.292405567804007e-05, "loss": 0.0091, "step": 366130 }, { "epoch": 1.85, "learning_rate": 2.2916487985026057e-05, "loss": 0.0043, "step": 366140 }, { "epoch": 1.85, "learning_rate": 2.2908920292012045e-05, "loss": 0.0055, "step": 366150 }, { "epoch": 1.85, "learning_rate": 2.2901352598998034e-05, "loss": 0.0061, "step": 366160 }, { "epoch": 1.85, "learning_rate": 2.2893784905984025e-05, "loss": 0.006, "step": 366170 }, { "epoch": 1.85, "learning_rate": 2.2886217212970013e-05, "loss": 0.0042, "step": 366180 }, { "epoch": 1.85, "learning_rate": 2.2878649519956005e-05, "loss": 0.0045, "step": 366190 }, { "epoch": 1.85, "learning_rate": 2.2871081826941993e-05, "loss": 0.0049, "step": 366200 }, { "epoch": 1.85, "learning_rate": 2.2863514133927985e-05, "loss": 0.0078, "step": 366210 }, { "epoch": 1.85, "learning_rate": 2.2855946440913973e-05, "loss": 0.007, "step": 366220 }, { "epoch": 1.85, "learning_rate": 2.2848378747899965e-05, "loss": 0.0053, "step": 366230 }, { "epoch": 1.85, "learning_rate": 2.2840811054885953e-05, "loss": 0.006, "step": 366240 }, { "epoch": 1.85, "learning_rate": 2.2833243361871944e-05, "loss": 0.0057, "step": 366250 }, { "epoch": 1.85, "learning_rate": 2.2825675668857933e-05, "loss": 0.0073, "step": 366260 }, { "epoch": 1.85, "learning_rate": 2.2818107975843924e-05, "loss": 0.0053, "step": 366270 }, { "epoch": 1.85, "learning_rate": 2.2810540282829912e-05, "loss": 0.005, "step": 366280 }, { "epoch": 1.85, "learning_rate": 2.2802972589815904e-05, "loss": 0.0056, "step": 366290 }, { "epoch": 1.85, "learning_rate": 2.2795404896801892e-05, "loss": 0.0051, "step": 366300 }, { "epoch": 1.85, "learning_rate": 2.2787837203787877e-05, "loss": 0.0057, "step": 366310 }, { "epoch": 1.85, "learning_rate": 2.278026951077387e-05, "loss": 0.0084, "step": 366320 }, { "epoch": 1.85, "learning_rate": 2.2772701817759857e-05, "loss": 0.005, "step": 366330 }, { "epoch": 1.85, "learning_rate": 2.276513412474585e-05, "loss": 0.0068, "step": 366340 }, { "epoch": 1.85, "learning_rate": 2.2757566431731837e-05, "loss": 0.0077, "step": 366350 }, { "epoch": 1.85, "learning_rate": 2.274999873871783e-05, "loss": 0.005, "step": 366360 }, { "epoch": 1.85, "learning_rate": 2.274243104570382e-05, "loss": 0.0065, "step": 366370 }, { "epoch": 1.85, "learning_rate": 2.2734863352689808e-05, "loss": 0.0048, "step": 366380 }, { "epoch": 1.85, "learning_rate": 2.27272956596758e-05, "loss": 0.0069, "step": 366390 }, { "epoch": 1.85, "learning_rate": 2.2719727966661788e-05, "loss": 0.0067, "step": 366400 }, { "epoch": 1.85, "learning_rate": 2.271216027364778e-05, "loss": 0.0062, "step": 366410 }, { "epoch": 1.85, "learning_rate": 2.2704592580633768e-05, "loss": 0.0051, "step": 366420 }, { "epoch": 1.85, "learning_rate": 2.269702488761976e-05, "loss": 0.0047, "step": 366430 }, { "epoch": 1.85, "learning_rate": 2.2689457194605748e-05, "loss": 0.0062, "step": 366440 }, { "epoch": 1.85, "learning_rate": 2.268188950159174e-05, "loss": 0.0053, "step": 366450 }, { "epoch": 1.85, "learning_rate": 2.2674321808577728e-05, "loss": 0.006, "step": 366460 }, { "epoch": 1.85, "learning_rate": 2.2666754115563712e-05, "loss": 0.0065, "step": 366470 }, { "epoch": 1.85, "learning_rate": 2.2659186422549704e-05, "loss": 0.0086, "step": 366480 }, { "epoch": 1.85, "learning_rate": 2.2651618729535692e-05, "loss": 0.0059, "step": 366490 }, { "epoch": 1.85, "learning_rate": 2.2644051036521684e-05, "loss": 0.0064, "step": 366500 }, { "epoch": 1.85, "learning_rate": 2.2636483343507672e-05, "loss": 0.0068, "step": 366510 }, { "epoch": 1.85, "learning_rate": 2.2628915650493664e-05, "loss": 0.0054, "step": 366520 }, { "epoch": 1.85, "learning_rate": 2.2621347957479652e-05, "loss": 0.0053, "step": 366530 }, { "epoch": 1.85, "learning_rate": 2.2613780264465643e-05, "loss": 0.0063, "step": 366540 }, { "epoch": 1.85, "learning_rate": 2.260621257145163e-05, "loss": 0.0059, "step": 366550 }, { "epoch": 1.85, "learning_rate": 2.2598644878437623e-05, "loss": 0.0059, "step": 366560 }, { "epoch": 1.85, "learning_rate": 2.259107718542361e-05, "loss": 0.005, "step": 366570 }, { "epoch": 1.85, "learning_rate": 2.2583509492409603e-05, "loss": 0.0065, "step": 366580 }, { "epoch": 1.85, "learning_rate": 2.257594179939559e-05, "loss": 0.0045, "step": 366590 }, { "epoch": 1.85, "learning_rate": 2.2568374106381583e-05, "loss": 0.0062, "step": 366600 }, { "epoch": 1.85, "learning_rate": 2.256080641336757e-05, "loss": 0.0068, "step": 366610 }, { "epoch": 1.85, "learning_rate": 2.255323872035356e-05, "loss": 0.0078, "step": 366620 }, { "epoch": 1.85, "learning_rate": 2.2545671027339548e-05, "loss": 0.0067, "step": 366630 }, { "epoch": 1.85, "learning_rate": 2.253810333432554e-05, "loss": 0.0056, "step": 366640 }, { "epoch": 1.85, "learning_rate": 2.2530535641311527e-05, "loss": 0.0059, "step": 366650 }, { "epoch": 1.85, "learning_rate": 2.252296794829752e-05, "loss": 0.008, "step": 366660 }, { "epoch": 1.85, "learning_rate": 2.2515400255283507e-05, "loss": 0.0044, "step": 366670 }, { "epoch": 1.85, "learning_rate": 2.25078325622695e-05, "loss": 0.0053, "step": 366680 }, { "epoch": 1.85, "learning_rate": 2.2500264869255487e-05, "loss": 0.0057, "step": 366690 }, { "epoch": 1.85, "learning_rate": 2.249269717624148e-05, "loss": 0.0053, "step": 366700 }, { "epoch": 1.85, "learning_rate": 2.2485129483227467e-05, "loss": 0.0041, "step": 366710 }, { "epoch": 1.85, "learning_rate": 2.247756179021346e-05, "loss": 0.0064, "step": 366720 }, { "epoch": 1.85, "learning_rate": 2.2469994097199447e-05, "loss": 0.007, "step": 366730 }, { "epoch": 1.85, "learning_rate": 2.246242640418544e-05, "loss": 0.0075, "step": 366740 }, { "epoch": 1.85, "learning_rate": 2.2454858711171427e-05, "loss": 0.007, "step": 366750 }, { "epoch": 1.85, "learning_rate": 2.2447291018157418e-05, "loss": 0.0063, "step": 366760 }, { "epoch": 1.85, "learning_rate": 2.2439723325143406e-05, "loss": 0.007, "step": 366770 }, { "epoch": 1.85, "learning_rate": 2.2432155632129395e-05, "loss": 0.0046, "step": 366780 }, { "epoch": 1.85, "learning_rate": 2.2424587939115383e-05, "loss": 0.0059, "step": 366790 }, { "epoch": 1.85, "learning_rate": 2.2417020246101374e-05, "loss": 0.0092, "step": 366800 }, { "epoch": 1.85, "learning_rate": 2.2409452553087363e-05, "loss": 0.0059, "step": 366810 }, { "epoch": 1.85, "learning_rate": 2.2401884860073354e-05, "loss": 0.0065, "step": 366820 }, { "epoch": 1.85, "learning_rate": 2.2394317167059342e-05, "loss": 0.0085, "step": 366830 }, { "epoch": 1.85, "learning_rate": 2.2386749474045334e-05, "loss": 0.0045, "step": 366840 }, { "epoch": 1.85, "learning_rate": 2.2379181781031322e-05, "loss": 0.0069, "step": 366850 }, { "epoch": 1.85, "learning_rate": 2.2371614088017314e-05, "loss": 0.0078, "step": 366860 }, { "epoch": 1.85, "learning_rate": 2.2364046395003302e-05, "loss": 0.0075, "step": 366870 }, { "epoch": 1.85, "learning_rate": 2.2356478701989294e-05, "loss": 0.0053, "step": 366880 }, { "epoch": 1.85, "learning_rate": 2.2348911008975282e-05, "loss": 0.0076, "step": 366890 }, { "epoch": 1.85, "learning_rate": 2.2341343315961274e-05, "loss": 0.0053, "step": 366900 }, { "epoch": 1.85, "learning_rate": 2.2333775622947262e-05, "loss": 0.0082, "step": 366910 }, { "epoch": 1.85, "learning_rate": 2.2326207929933253e-05, "loss": 0.0058, "step": 366920 }, { "epoch": 1.85, "learning_rate": 2.231864023691924e-05, "loss": 0.0041, "step": 366930 }, { "epoch": 1.85, "learning_rate": 2.231107254390523e-05, "loss": 0.0062, "step": 366940 }, { "epoch": 1.85, "learning_rate": 2.2303504850891218e-05, "loss": 0.0054, "step": 366950 }, { "epoch": 1.85, "learning_rate": 2.229593715787721e-05, "loss": 0.0057, "step": 366960 }, { "epoch": 1.85, "learning_rate": 2.2288369464863198e-05, "loss": 0.0066, "step": 366970 }, { "epoch": 1.85, "learning_rate": 2.228080177184919e-05, "loss": 0.0067, "step": 366980 }, { "epoch": 1.85, "learning_rate": 2.2273234078835178e-05, "loss": 0.0079, "step": 366990 }, { "epoch": 1.85, "learning_rate": 2.226566638582117e-05, "loss": 0.0065, "step": 367000 }, { "epoch": 1.85, "eval_cer": 0.9144217360968921, "eval_loss": 0.004412375390529633, "eval_runtime": 116.7639, "eval_samples_per_second": 17.129, "eval_steps_per_second": 4.282, "step": 367000 }, { "epoch": 1.85, "learning_rate": 2.2258098692807157e-05, "loss": 0.0051, "step": 367010 }, { "epoch": 1.85, "learning_rate": 2.225053099979315e-05, "loss": 0.0068, "step": 367020 }, { "epoch": 1.85, "learning_rate": 2.2242963306779137e-05, "loss": 0.0064, "step": 367030 }, { "epoch": 1.85, "learning_rate": 2.223539561376513e-05, "loss": 0.0049, "step": 367040 }, { "epoch": 1.85, "learning_rate": 2.2227827920751117e-05, "loss": 0.0059, "step": 367050 }, { "epoch": 1.85, "learning_rate": 2.222026022773711e-05, "loss": 0.0046, "step": 367060 }, { "epoch": 1.85, "learning_rate": 2.2212692534723097e-05, "loss": 0.0066, "step": 367070 }, { "epoch": 1.85, "learning_rate": 2.220512484170909e-05, "loss": 0.0048, "step": 367080 }, { "epoch": 1.85, "learning_rate": 2.2197557148695073e-05, "loss": 0.0056, "step": 367090 }, { "epoch": 1.85, "learning_rate": 2.2189989455681065e-05, "loss": 0.0052, "step": 367100 }, { "epoch": 1.85, "learning_rate": 2.2182421762667053e-05, "loss": 0.0046, "step": 367110 }, { "epoch": 1.85, "learning_rate": 2.2174854069653045e-05, "loss": 0.007, "step": 367120 }, { "epoch": 1.85, "learning_rate": 2.2167286376639033e-05, "loss": 0.0026, "step": 367130 }, { "epoch": 1.85, "learning_rate": 2.2159718683625025e-05, "loss": 0.0067, "step": 367140 }, { "epoch": 1.85, "learning_rate": 2.2152150990611013e-05, "loss": 0.007, "step": 367150 }, { "epoch": 1.85, "learning_rate": 2.2144583297597004e-05, "loss": 0.0064, "step": 367160 }, { "epoch": 1.85, "learning_rate": 2.2137015604582993e-05, "loss": 0.0058, "step": 367170 }, { "epoch": 1.85, "learning_rate": 2.2129447911568984e-05, "loss": 0.0055, "step": 367180 }, { "epoch": 1.85, "learning_rate": 2.2121880218554973e-05, "loss": 0.0045, "step": 367190 }, { "epoch": 1.85, "learning_rate": 2.2114312525540964e-05, "loss": 0.0054, "step": 367200 }, { "epoch": 1.85, "learning_rate": 2.2106744832526952e-05, "loss": 0.0062, "step": 367210 }, { "epoch": 1.85, "learning_rate": 2.2099177139512944e-05, "loss": 0.0056, "step": 367220 }, { "epoch": 1.85, "learning_rate": 2.2091609446498932e-05, "loss": 0.0058, "step": 367230 }, { "epoch": 1.85, "learning_rate": 2.2084041753484924e-05, "loss": 0.0061, "step": 367240 }, { "epoch": 1.85, "learning_rate": 2.207647406047091e-05, "loss": 0.0057, "step": 367250 }, { "epoch": 1.85, "learning_rate": 2.2068906367456897e-05, "loss": 0.0045, "step": 367260 }, { "epoch": 1.85, "learning_rate": 2.206133867444289e-05, "loss": 0.006, "step": 367270 }, { "epoch": 1.85, "learning_rate": 2.2053770981428877e-05, "loss": 0.0064, "step": 367280 }, { "epoch": 1.85, "learning_rate": 2.2046203288414868e-05, "loss": 0.0075, "step": 367290 }, { "epoch": 1.85, "learning_rate": 2.2038635595400856e-05, "loss": 0.0054, "step": 367300 }, { "epoch": 1.85, "learning_rate": 2.2031067902386848e-05, "loss": 0.0074, "step": 367310 }, { "epoch": 1.85, "learning_rate": 2.2023500209372836e-05, "loss": 0.0048, "step": 367320 }, { "epoch": 1.85, "learning_rate": 2.2015932516358828e-05, "loss": 0.0055, "step": 367330 }, { "epoch": 1.85, "learning_rate": 2.200836482334482e-05, "loss": 0.0049, "step": 367340 }, { "epoch": 1.85, "learning_rate": 2.2000797130330808e-05, "loss": 0.0054, "step": 367350 }, { "epoch": 1.85, "learning_rate": 2.19932294373168e-05, "loss": 0.005, "step": 367360 }, { "epoch": 1.85, "learning_rate": 2.1985661744302788e-05, "loss": 0.0059, "step": 367370 }, { "epoch": 1.85, "learning_rate": 2.197809405128878e-05, "loss": 0.0068, "step": 367380 }, { "epoch": 1.85, "learning_rate": 2.1970526358274767e-05, "loss": 0.005, "step": 367390 }, { "epoch": 1.85, "learning_rate": 2.196295866526076e-05, "loss": 0.0064, "step": 367400 }, { "epoch": 1.85, "learning_rate": 2.1955390972246744e-05, "loss": 0.0073, "step": 367410 }, { "epoch": 1.85, "learning_rate": 2.1947823279232732e-05, "loss": 0.0054, "step": 367420 }, { "epoch": 1.85, "learning_rate": 2.1940255586218724e-05, "loss": 0.0049, "step": 367430 }, { "epoch": 1.85, "learning_rate": 2.1932687893204712e-05, "loss": 0.0059, "step": 367440 }, { "epoch": 1.85, "learning_rate": 2.1925120200190703e-05, "loss": 0.0067, "step": 367450 }, { "epoch": 1.85, "learning_rate": 2.1917552507176692e-05, "loss": 0.0062, "step": 367460 }, { "epoch": 1.85, "learning_rate": 2.1909984814162683e-05, "loss": 0.0061, "step": 367470 }, { "epoch": 1.85, "learning_rate": 2.190241712114867e-05, "loss": 0.0052, "step": 367480 }, { "epoch": 1.85, "learning_rate": 2.1894849428134663e-05, "loss": 0.0086, "step": 367490 }, { "epoch": 1.85, "learning_rate": 2.188728173512065e-05, "loss": 0.0057, "step": 367500 }, { "epoch": 1.85, "learning_rate": 2.1879714042106643e-05, "loss": 0.0056, "step": 367510 }, { "epoch": 1.85, "learning_rate": 2.187214634909263e-05, "loss": 0.0032, "step": 367520 }, { "epoch": 1.85, "learning_rate": 2.1864578656078623e-05, "loss": 0.0067, "step": 367530 }, { "epoch": 1.85, "learning_rate": 2.185701096306461e-05, "loss": 0.0082, "step": 367540 }, { "epoch": 1.85, "learning_rate": 2.1849443270050603e-05, "loss": 0.0057, "step": 367550 }, { "epoch": 1.85, "learning_rate": 2.184187557703659e-05, "loss": 0.0056, "step": 367560 }, { "epoch": 1.85, "learning_rate": 2.183430788402258e-05, "loss": 0.0061, "step": 367570 }, { "epoch": 1.85, "learning_rate": 2.1826740191008567e-05, "loss": 0.0051, "step": 367580 }, { "epoch": 1.85, "learning_rate": 2.181917249799456e-05, "loss": 0.0055, "step": 367590 }, { "epoch": 1.85, "learning_rate": 2.1811604804980547e-05, "loss": 0.0038, "step": 367600 }, { "epoch": 1.85, "learning_rate": 2.180403711196654e-05, "loss": 0.006, "step": 367610 }, { "epoch": 1.85, "learning_rate": 2.1796469418952527e-05, "loss": 0.0061, "step": 367620 }, { "epoch": 1.85, "learning_rate": 2.178890172593852e-05, "loss": 0.0061, "step": 367630 }, { "epoch": 1.85, "learning_rate": 2.1781334032924507e-05, "loss": 0.0063, "step": 367640 }, { "epoch": 1.85, "learning_rate": 2.17737663399105e-05, "loss": 0.0063, "step": 367650 }, { "epoch": 1.85, "learning_rate": 2.1766198646896487e-05, "loss": 0.0059, "step": 367660 }, { "epoch": 1.85, "learning_rate": 2.1758630953882478e-05, "loss": 0.0058, "step": 367670 }, { "epoch": 1.85, "learning_rate": 2.1751063260868466e-05, "loss": 0.0075, "step": 367680 }, { "epoch": 1.86, "learning_rate": 2.1743495567854458e-05, "loss": 0.0063, "step": 367690 }, { "epoch": 1.86, "learning_rate": 2.1735927874840446e-05, "loss": 0.0061, "step": 367700 }, { "epoch": 1.86, "learning_rate": 2.1728360181826438e-05, "loss": 0.0069, "step": 367710 }, { "epoch": 1.86, "learning_rate": 2.1720792488812423e-05, "loss": 0.0046, "step": 367720 }, { "epoch": 1.86, "learning_rate": 2.1713224795798414e-05, "loss": 0.0086, "step": 367730 }, { "epoch": 1.86, "learning_rate": 2.1705657102784402e-05, "loss": 0.006, "step": 367740 }, { "epoch": 1.86, "learning_rate": 2.1698089409770394e-05, "loss": 0.0046, "step": 367750 }, { "epoch": 1.86, "learning_rate": 2.1690521716756382e-05, "loss": 0.0046, "step": 367760 }, { "epoch": 1.86, "learning_rate": 2.1682954023742374e-05, "loss": 0.006, "step": 367770 }, { "epoch": 1.86, "learning_rate": 2.1675386330728362e-05, "loss": 0.0077, "step": 367780 }, { "epoch": 1.86, "learning_rate": 2.1667818637714354e-05, "loss": 0.0052, "step": 367790 }, { "epoch": 1.86, "learning_rate": 2.1660250944700342e-05, "loss": 0.0042, "step": 367800 }, { "epoch": 1.86, "learning_rate": 2.1652683251686334e-05, "loss": 0.0085, "step": 367810 }, { "epoch": 1.86, "learning_rate": 2.1645115558672322e-05, "loss": 0.0065, "step": 367820 }, { "epoch": 1.86, "learning_rate": 2.1637547865658313e-05, "loss": 0.0078, "step": 367830 }, { "epoch": 1.86, "learning_rate": 2.16299801726443e-05, "loss": 0.0047, "step": 367840 }, { "epoch": 1.86, "learning_rate": 2.1622412479630293e-05, "loss": 0.0054, "step": 367850 }, { "epoch": 1.86, "learning_rate": 2.161484478661628e-05, "loss": 0.0052, "step": 367860 }, { "epoch": 1.86, "learning_rate": 2.1607277093602273e-05, "loss": 0.0059, "step": 367870 }, { "epoch": 1.86, "learning_rate": 2.1599709400588258e-05, "loss": 0.006, "step": 367880 }, { "epoch": 1.86, "learning_rate": 2.159214170757425e-05, "loss": 0.0062, "step": 367890 }, { "epoch": 1.86, "learning_rate": 2.1584574014560238e-05, "loss": 0.0046, "step": 367900 }, { "epoch": 1.86, "learning_rate": 2.157700632154623e-05, "loss": 0.0047, "step": 367910 }, { "epoch": 1.86, "learning_rate": 2.1569438628532218e-05, "loss": 0.0072, "step": 367920 }, { "epoch": 1.86, "learning_rate": 2.156187093551821e-05, "loss": 0.0063, "step": 367930 }, { "epoch": 1.86, "learning_rate": 2.1554303242504197e-05, "loss": 0.0066, "step": 367940 }, { "epoch": 1.86, "learning_rate": 2.154673554949019e-05, "loss": 0.0046, "step": 367950 }, { "epoch": 1.86, "learning_rate": 2.1539167856476177e-05, "loss": 0.0076, "step": 367960 }, { "epoch": 1.86, "learning_rate": 2.153160016346217e-05, "loss": 0.0077, "step": 367970 }, { "epoch": 1.86, "learning_rate": 2.1524032470448157e-05, "loss": 0.0058, "step": 367980 }, { "epoch": 1.86, "learning_rate": 2.151646477743415e-05, "loss": 0.0042, "step": 367990 }, { "epoch": 1.86, "learning_rate": 2.1508897084420137e-05, "loss": 0.0072, "step": 368000 }, { "epoch": 1.86, "eval_cer": 0.9144285288697699, "eval_loss": 0.004368205089122057, "eval_runtime": 116.793, "eval_samples_per_second": 17.124, "eval_steps_per_second": 4.281, "step": 368000 }, { "epoch": 1.86, "learning_rate": 2.150132939140613e-05, "loss": 0.0076, "step": 368010 }, { "epoch": 1.86, "learning_rate": 2.1493761698392117e-05, "loss": 0.0044, "step": 368020 }, { "epoch": 1.86, "learning_rate": 2.1486194005378108e-05, "loss": 0.0057, "step": 368030 }, { "epoch": 1.86, "learning_rate": 2.1478626312364093e-05, "loss": 0.0048, "step": 368040 }, { "epoch": 1.86, "learning_rate": 2.1471058619350085e-05, "loss": 0.0039, "step": 368050 }, { "epoch": 1.86, "learning_rate": 2.1463490926336073e-05, "loss": 0.0054, "step": 368060 }, { "epoch": 1.86, "learning_rate": 2.1455923233322065e-05, "loss": 0.0038, "step": 368070 }, { "epoch": 1.86, "learning_rate": 2.1448355540308053e-05, "loss": 0.0057, "step": 368080 }, { "epoch": 1.86, "learning_rate": 2.1440787847294044e-05, "loss": 0.0068, "step": 368090 }, { "epoch": 1.86, "learning_rate": 2.1433220154280033e-05, "loss": 0.0078, "step": 368100 }, { "epoch": 1.86, "learning_rate": 2.1425652461266024e-05, "loss": 0.0053, "step": 368110 }, { "epoch": 1.86, "learning_rate": 2.1418084768252012e-05, "loss": 0.0062, "step": 368120 }, { "epoch": 1.86, "learning_rate": 2.1410517075238004e-05, "loss": 0.0109, "step": 368130 }, { "epoch": 1.86, "learning_rate": 2.1402949382223992e-05, "loss": 0.0045, "step": 368140 }, { "epoch": 1.86, "learning_rate": 2.1395381689209984e-05, "loss": 0.0061, "step": 368150 }, { "epoch": 1.86, "learning_rate": 2.1387813996195972e-05, "loss": 0.006, "step": 368160 }, { "epoch": 1.86, "learning_rate": 2.1380246303181964e-05, "loss": 0.0053, "step": 368170 }, { "epoch": 1.86, "learning_rate": 2.1372678610167952e-05, "loss": 0.0046, "step": 368180 }, { "epoch": 1.86, "learning_rate": 2.1365110917153937e-05, "loss": 0.0041, "step": 368190 }, { "epoch": 1.86, "learning_rate": 2.135754322413993e-05, "loss": 0.0054, "step": 368200 }, { "epoch": 1.86, "learning_rate": 2.1349975531125917e-05, "loss": 0.005, "step": 368210 }, { "epoch": 1.86, "learning_rate": 2.1342407838111908e-05, "loss": 0.0082, "step": 368220 }, { "epoch": 1.86, "learning_rate": 2.1334840145097896e-05, "loss": 0.0054, "step": 368230 }, { "epoch": 1.86, "learning_rate": 2.1327272452083888e-05, "loss": 0.0047, "step": 368240 }, { "epoch": 1.86, "learning_rate": 2.1319704759069876e-05, "loss": 0.0059, "step": 368250 }, { "epoch": 1.86, "learning_rate": 2.1312137066055868e-05, "loss": 0.0063, "step": 368260 }, { "epoch": 1.86, "learning_rate": 2.1304569373041856e-05, "loss": 0.0102, "step": 368270 }, { "epoch": 1.86, "learning_rate": 2.1297001680027848e-05, "loss": 0.0049, "step": 368280 }, { "epoch": 1.86, "learning_rate": 2.1289433987013836e-05, "loss": 0.0054, "step": 368290 }, { "epoch": 1.86, "learning_rate": 2.1281866293999827e-05, "loss": 0.0052, "step": 368300 }, { "epoch": 1.86, "learning_rate": 2.127429860098582e-05, "loss": 0.0069, "step": 368310 }, { "epoch": 1.86, "learning_rate": 2.1266730907971807e-05, "loss": 0.0042, "step": 368320 }, { "epoch": 1.86, "learning_rate": 2.12591632149578e-05, "loss": 0.0044, "step": 368330 }, { "epoch": 1.86, "learning_rate": 2.1251595521943787e-05, "loss": 0.0074, "step": 368340 }, { "epoch": 1.86, "learning_rate": 2.1244027828929772e-05, "loss": 0.0058, "step": 368350 }, { "epoch": 1.86, "learning_rate": 2.1236460135915764e-05, "loss": 0.0065, "step": 368360 }, { "epoch": 1.86, "learning_rate": 2.1228892442901752e-05, "loss": 0.0042, "step": 368370 }, { "epoch": 1.86, "learning_rate": 2.1221324749887743e-05, "loss": 0.0044, "step": 368380 }, { "epoch": 1.86, "learning_rate": 2.121375705687373e-05, "loss": 0.0063, "step": 368390 }, { "epoch": 1.86, "learning_rate": 2.1206189363859723e-05, "loss": 0.0054, "step": 368400 }, { "epoch": 1.86, "learning_rate": 2.119862167084571e-05, "loss": 0.0068, "step": 368410 }, { "epoch": 1.86, "learning_rate": 2.1191053977831703e-05, "loss": 0.008, "step": 368420 }, { "epoch": 1.86, "learning_rate": 2.118348628481769e-05, "loss": 0.0068, "step": 368430 }, { "epoch": 1.86, "learning_rate": 2.1175918591803683e-05, "loss": 0.0058, "step": 368440 }, { "epoch": 1.86, "learning_rate": 2.116835089878967e-05, "loss": 0.0059, "step": 368450 }, { "epoch": 1.86, "learning_rate": 2.1160783205775663e-05, "loss": 0.0046, "step": 368460 }, { "epoch": 1.86, "learning_rate": 2.115321551276165e-05, "loss": 0.0037, "step": 368470 }, { "epoch": 1.86, "learning_rate": 2.1145647819747642e-05, "loss": 0.0074, "step": 368480 }, { "epoch": 1.86, "learning_rate": 2.113808012673363e-05, "loss": 0.0065, "step": 368490 }, { "epoch": 1.86, "learning_rate": 2.1130512433719622e-05, "loss": 0.0057, "step": 368500 }, { "epoch": 1.86, "learning_rate": 2.1122944740705607e-05, "loss": 0.0054, "step": 368510 }, { "epoch": 1.86, "learning_rate": 2.11153770476916e-05, "loss": 0.0053, "step": 368520 }, { "epoch": 1.86, "learning_rate": 2.1107809354677587e-05, "loss": 0.0057, "step": 368530 }, { "epoch": 1.86, "learning_rate": 2.110024166166358e-05, "loss": 0.0053, "step": 368540 }, { "epoch": 1.86, "learning_rate": 2.1092673968649567e-05, "loss": 0.0069, "step": 368550 }, { "epoch": 1.86, "learning_rate": 2.108510627563556e-05, "loss": 0.005, "step": 368560 }, { "epoch": 1.86, "learning_rate": 2.1077538582621547e-05, "loss": 0.0062, "step": 368570 }, { "epoch": 1.86, "learning_rate": 2.1069970889607538e-05, "loss": 0.0071, "step": 368580 }, { "epoch": 1.86, "learning_rate": 2.1062403196593526e-05, "loss": 0.0073, "step": 368590 }, { "epoch": 1.86, "learning_rate": 2.1054835503579518e-05, "loss": 0.0055, "step": 368600 }, { "epoch": 1.86, "learning_rate": 2.1047267810565506e-05, "loss": 0.0046, "step": 368610 }, { "epoch": 1.86, "learning_rate": 2.1039700117551498e-05, "loss": 0.0074, "step": 368620 }, { "epoch": 1.86, "learning_rate": 2.1032132424537486e-05, "loss": 0.0064, "step": 368630 }, { "epoch": 1.86, "learning_rate": 2.1024564731523478e-05, "loss": 0.0052, "step": 368640 }, { "epoch": 1.86, "learning_rate": 2.1016997038509466e-05, "loss": 0.0062, "step": 368650 }, { "epoch": 1.86, "learning_rate": 2.1009429345495458e-05, "loss": 0.0063, "step": 368660 }, { "epoch": 1.86, "learning_rate": 2.1001861652481442e-05, "loss": 0.0049, "step": 368670 }, { "epoch": 1.86, "learning_rate": 2.0994293959467434e-05, "loss": 0.005, "step": 368680 }, { "epoch": 1.86, "learning_rate": 2.0986726266453422e-05, "loss": 0.0046, "step": 368690 }, { "epoch": 1.86, "learning_rate": 2.0979158573439414e-05, "loss": 0.0067, "step": 368700 }, { "epoch": 1.86, "learning_rate": 2.0971590880425402e-05, "loss": 0.0067, "step": 368710 }, { "epoch": 1.86, "learning_rate": 2.0964023187411394e-05, "loss": 0.0053, "step": 368720 }, { "epoch": 1.86, "learning_rate": 2.0956455494397382e-05, "loss": 0.005, "step": 368730 }, { "epoch": 1.86, "learning_rate": 2.0948887801383373e-05, "loss": 0.0048, "step": 368740 }, { "epoch": 1.86, "learning_rate": 2.094132010836936e-05, "loss": 0.0051, "step": 368750 }, { "epoch": 1.86, "learning_rate": 2.0933752415355353e-05, "loss": 0.0065, "step": 368760 }, { "epoch": 1.86, "learning_rate": 2.092618472234134e-05, "loss": 0.0068, "step": 368770 }, { "epoch": 1.86, "learning_rate": 2.0918617029327333e-05, "loss": 0.0065, "step": 368780 }, { "epoch": 1.86, "learning_rate": 2.091104933631332e-05, "loss": 0.0066, "step": 368790 }, { "epoch": 1.86, "learning_rate": 2.0903481643299313e-05, "loss": 0.0049, "step": 368800 }, { "epoch": 1.86, "learning_rate": 2.08959139502853e-05, "loss": 0.0052, "step": 368810 }, { "epoch": 1.86, "learning_rate": 2.088834625727129e-05, "loss": 0.0043, "step": 368820 }, { "epoch": 1.86, "learning_rate": 2.0880778564257278e-05, "loss": 0.0056, "step": 368830 }, { "epoch": 1.86, "learning_rate": 2.087321087124327e-05, "loss": 0.0045, "step": 368840 }, { "epoch": 1.86, "learning_rate": 2.0865643178229257e-05, "loss": 0.0057, "step": 368850 }, { "epoch": 1.86, "learning_rate": 2.085807548521525e-05, "loss": 0.0052, "step": 368860 }, { "epoch": 1.86, "learning_rate": 2.0850507792201237e-05, "loss": 0.0077, "step": 368870 }, { "epoch": 1.86, "learning_rate": 2.084294009918723e-05, "loss": 0.0053, "step": 368880 }, { "epoch": 1.86, "learning_rate": 2.0835372406173217e-05, "loss": 0.007, "step": 368890 }, { "epoch": 1.86, "learning_rate": 2.082780471315921e-05, "loss": 0.0057, "step": 368900 }, { "epoch": 1.86, "learning_rate": 2.0820237020145197e-05, "loss": 0.0061, "step": 368910 }, { "epoch": 1.86, "learning_rate": 2.081266932713119e-05, "loss": 0.0074, "step": 368920 }, { "epoch": 1.86, "learning_rate": 2.0805101634117177e-05, "loss": 0.0055, "step": 368930 }, { "epoch": 1.86, "learning_rate": 2.079753394110317e-05, "loss": 0.0057, "step": 368940 }, { "epoch": 1.86, "learning_rate": 2.0789966248089157e-05, "loss": 0.0044, "step": 368950 }, { "epoch": 1.86, "learning_rate": 2.0782398555075148e-05, "loss": 0.0061, "step": 368960 }, { "epoch": 1.86, "learning_rate": 2.0774830862061136e-05, "loss": 0.0043, "step": 368970 }, { "epoch": 1.86, "learning_rate": 2.076726316904712e-05, "loss": 0.0084, "step": 368980 }, { "epoch": 1.86, "learning_rate": 2.0759695476033113e-05, "loss": 0.0047, "step": 368990 }, { "epoch": 1.86, "learning_rate": 2.07521277830191e-05, "loss": 0.008, "step": 369000 }, { "epoch": 1.86, "eval_cer": 0.9144450256039017, "eval_loss": 0.0044240448623895645, "eval_runtime": 116.7122, "eval_samples_per_second": 17.136, "eval_steps_per_second": 4.284, "step": 369000 }, { "epoch": 1.86, "learning_rate": 2.0744560090005093e-05, "loss": 0.0053, "step": 369010 }, { "epoch": 1.86, "learning_rate": 2.0736992396991084e-05, "loss": 0.0047, "step": 369020 }, { "epoch": 1.86, "learning_rate": 2.0729424703977072e-05, "loss": 0.0054, "step": 369030 }, { "epoch": 1.86, "learning_rate": 2.0721857010963064e-05, "loss": 0.0058, "step": 369040 }, { "epoch": 1.86, "learning_rate": 2.0714289317949052e-05, "loss": 0.0055, "step": 369050 }, { "epoch": 1.86, "learning_rate": 2.0706721624935044e-05, "loss": 0.0067, "step": 369060 }, { "epoch": 1.86, "learning_rate": 2.0699153931921032e-05, "loss": 0.0061, "step": 369070 }, { "epoch": 1.86, "learning_rate": 2.0691586238907024e-05, "loss": 0.0068, "step": 369080 }, { "epoch": 1.86, "learning_rate": 2.0684018545893012e-05, "loss": 0.0059, "step": 369090 }, { "epoch": 1.86, "learning_rate": 2.0676450852879004e-05, "loss": 0.0069, "step": 369100 }, { "epoch": 1.86, "learning_rate": 2.0668883159864992e-05, "loss": 0.006, "step": 369110 }, { "epoch": 1.86, "learning_rate": 2.0661315466850983e-05, "loss": 0.0063, "step": 369120 }, { "epoch": 1.86, "learning_rate": 2.065374777383697e-05, "loss": 0.0104, "step": 369130 }, { "epoch": 1.86, "learning_rate": 2.0646180080822956e-05, "loss": 0.0061, "step": 369140 }, { "epoch": 1.86, "learning_rate": 2.0638612387808948e-05, "loss": 0.0047, "step": 369150 }, { "epoch": 1.86, "learning_rate": 2.0631044694794936e-05, "loss": 0.0112, "step": 369160 }, { "epoch": 1.86, "learning_rate": 2.0623477001780928e-05, "loss": 0.0056, "step": 369170 }, { "epoch": 1.86, "learning_rate": 2.0615909308766916e-05, "loss": 0.0059, "step": 369180 }, { "epoch": 1.86, "learning_rate": 2.0608341615752908e-05, "loss": 0.005, "step": 369190 }, { "epoch": 1.86, "learning_rate": 2.0600773922738896e-05, "loss": 0.0068, "step": 369200 }, { "epoch": 1.86, "learning_rate": 2.0593206229724887e-05, "loss": 0.0113, "step": 369210 }, { "epoch": 1.86, "learning_rate": 2.0585638536710876e-05, "loss": 0.0063, "step": 369220 }, { "epoch": 1.86, "learning_rate": 2.0578070843696867e-05, "loss": 0.0059, "step": 369230 }, { "epoch": 1.86, "learning_rate": 2.0570503150682856e-05, "loss": 0.0064, "step": 369240 }, { "epoch": 1.86, "learning_rate": 2.0562935457668847e-05, "loss": 0.0059, "step": 369250 }, { "epoch": 1.86, "learning_rate": 2.0555367764654835e-05, "loss": 0.0045, "step": 369260 }, { "epoch": 1.86, "learning_rate": 2.0547800071640827e-05, "loss": 0.0057, "step": 369270 }, { "epoch": 1.86, "learning_rate": 2.054023237862682e-05, "loss": 0.0059, "step": 369280 }, { "epoch": 1.86, "learning_rate": 2.0532664685612803e-05, "loss": 0.006, "step": 369290 }, { "epoch": 1.86, "learning_rate": 2.052509699259879e-05, "loss": 0.0066, "step": 369300 }, { "epoch": 1.86, "learning_rate": 2.0517529299584783e-05, "loss": 0.0061, "step": 369310 }, { "epoch": 1.86, "learning_rate": 2.050996160657077e-05, "loss": 0.0063, "step": 369320 }, { "epoch": 1.86, "learning_rate": 2.0502393913556763e-05, "loss": 0.0086, "step": 369330 }, { "epoch": 1.86, "learning_rate": 2.049482622054275e-05, "loss": 0.0049, "step": 369340 }, { "epoch": 1.86, "learning_rate": 2.0487258527528743e-05, "loss": 0.0045, "step": 369350 }, { "epoch": 1.86, "learning_rate": 2.047969083451473e-05, "loss": 0.0048, "step": 369360 }, { "epoch": 1.86, "learning_rate": 2.0472123141500723e-05, "loss": 0.0133, "step": 369370 }, { "epoch": 1.86, "learning_rate": 2.046455544848671e-05, "loss": 0.006, "step": 369380 }, { "epoch": 1.86, "learning_rate": 2.0456987755472703e-05, "loss": 0.0063, "step": 369390 }, { "epoch": 1.86, "learning_rate": 2.044942006245869e-05, "loss": 0.008, "step": 369400 }, { "epoch": 1.86, "learning_rate": 2.0441852369444682e-05, "loss": 0.0049, "step": 369410 }, { "epoch": 1.86, "learning_rate": 2.043428467643067e-05, "loss": 0.0055, "step": 369420 }, { "epoch": 1.86, "learning_rate": 2.0426716983416662e-05, "loss": 0.0044, "step": 369430 }, { "epoch": 1.86, "learning_rate": 2.041914929040265e-05, "loss": 0.005, "step": 369440 }, { "epoch": 1.86, "learning_rate": 2.041158159738864e-05, "loss": 0.0033, "step": 369450 }, { "epoch": 1.86, "learning_rate": 2.0404013904374627e-05, "loss": 0.0059, "step": 369460 }, { "epoch": 1.86, "learning_rate": 2.039644621136062e-05, "loss": 0.0047, "step": 369470 }, { "epoch": 1.86, "learning_rate": 2.0388878518346607e-05, "loss": 0.0069, "step": 369480 }, { "epoch": 1.86, "learning_rate": 2.0381310825332598e-05, "loss": 0.0075, "step": 369490 }, { "epoch": 1.86, "learning_rate": 2.0373743132318586e-05, "loss": 0.0051, "step": 369500 }, { "epoch": 1.86, "learning_rate": 2.0366175439304578e-05, "loss": 0.0049, "step": 369510 }, { "epoch": 1.86, "learning_rate": 2.0358607746290566e-05, "loss": 0.007, "step": 369520 }, { "epoch": 1.86, "learning_rate": 2.0351040053276558e-05, "loss": 0.0048, "step": 369530 }, { "epoch": 1.86, "learning_rate": 2.0343472360262546e-05, "loss": 0.0064, "step": 369540 }, { "epoch": 1.86, "learning_rate": 2.0335904667248538e-05, "loss": 0.0065, "step": 369550 }, { "epoch": 1.86, "learning_rate": 2.0328336974234526e-05, "loss": 0.0068, "step": 369560 }, { "epoch": 1.86, "learning_rate": 2.0320769281220518e-05, "loss": 0.0053, "step": 369570 }, { "epoch": 1.86, "learning_rate": 2.0313201588206506e-05, "loss": 0.006, "step": 369580 }, { "epoch": 1.86, "learning_rate": 2.0305633895192497e-05, "loss": 0.0044, "step": 369590 }, { "epoch": 1.86, "learning_rate": 2.0298066202178486e-05, "loss": 0.0049, "step": 369600 }, { "epoch": 1.86, "learning_rate": 2.0290498509164474e-05, "loss": 0.0043, "step": 369610 }, { "epoch": 1.86, "learning_rate": 2.0282930816150462e-05, "loss": 0.0067, "step": 369620 }, { "epoch": 1.86, "learning_rate": 2.0275363123136454e-05, "loss": 0.0068, "step": 369630 }, { "epoch": 1.86, "learning_rate": 2.0267795430122442e-05, "loss": 0.0067, "step": 369640 }, { "epoch": 1.86, "learning_rate": 2.0260227737108433e-05, "loss": 0.0059, "step": 369650 }, { "epoch": 1.86, "learning_rate": 2.0252660044094422e-05, "loss": 0.0065, "step": 369660 }, { "epoch": 1.87, "learning_rate": 2.0245092351080413e-05, "loss": 0.0085, "step": 369670 }, { "epoch": 1.87, "learning_rate": 2.02375246580664e-05, "loss": 0.0072, "step": 369680 }, { "epoch": 1.87, "learning_rate": 2.0229956965052393e-05, "loss": 0.0045, "step": 369690 }, { "epoch": 1.87, "learning_rate": 2.022238927203838e-05, "loss": 0.0046, "step": 369700 }, { "epoch": 1.87, "learning_rate": 2.0214821579024373e-05, "loss": 0.0068, "step": 369710 }, { "epoch": 1.87, "learning_rate": 2.020725388601036e-05, "loss": 0.0068, "step": 369720 }, { "epoch": 1.87, "learning_rate": 2.0199686192996353e-05, "loss": 0.0054, "step": 369730 }, { "epoch": 1.87, "learning_rate": 2.019211849998234e-05, "loss": 0.0056, "step": 369740 }, { "epoch": 1.87, "learning_rate": 2.0184550806968333e-05, "loss": 0.0053, "step": 369750 }, { "epoch": 1.87, "learning_rate": 2.017698311395432e-05, "loss": 0.0069, "step": 369760 }, { "epoch": 1.87, "learning_rate": 2.016941542094031e-05, "loss": 0.0059, "step": 369770 }, { "epoch": 1.87, "learning_rate": 2.0161847727926297e-05, "loss": 0.0049, "step": 369780 }, { "epoch": 1.87, "learning_rate": 2.015428003491229e-05, "loss": 0.006, "step": 369790 }, { "epoch": 1.87, "learning_rate": 2.0146712341898277e-05, "loss": 0.0046, "step": 369800 }, { "epoch": 1.87, "learning_rate": 2.013914464888427e-05, "loss": 0.0059, "step": 369810 }, { "epoch": 1.87, "learning_rate": 2.0131576955870257e-05, "loss": 0.007, "step": 369820 }, { "epoch": 1.87, "learning_rate": 2.012400926285625e-05, "loss": 0.0055, "step": 369830 }, { "epoch": 1.87, "learning_rate": 2.0116441569842237e-05, "loss": 0.0064, "step": 369840 }, { "epoch": 1.87, "learning_rate": 2.010887387682823e-05, "loss": 0.0043, "step": 369850 }, { "epoch": 1.87, "learning_rate": 2.0101306183814217e-05, "loss": 0.005, "step": 369860 }, { "epoch": 1.87, "learning_rate": 2.0093738490800208e-05, "loss": 0.0058, "step": 369870 }, { "epoch": 1.87, "learning_rate": 2.0086170797786196e-05, "loss": 0.0063, "step": 369880 }, { "epoch": 1.87, "learning_rate": 2.0078603104772188e-05, "loss": 0.007, "step": 369890 }, { "epoch": 1.87, "learning_rate": 2.0071035411758176e-05, "loss": 0.0058, "step": 369900 }, { "epoch": 1.87, "learning_rate": 2.0063467718744168e-05, "loss": 0.0045, "step": 369910 }, { "epoch": 1.87, "learning_rate": 2.0055900025730153e-05, "loss": 0.0061, "step": 369920 }, { "epoch": 1.87, "learning_rate": 2.004833233271614e-05, "loss": 0.0067, "step": 369930 }, { "epoch": 1.87, "learning_rate": 2.0040764639702132e-05, "loss": 0.005, "step": 369940 }, { "epoch": 1.87, "learning_rate": 2.003319694668812e-05, "loss": 0.0042, "step": 369950 }, { "epoch": 1.87, "learning_rate": 2.0025629253674112e-05, "loss": 0.0084, "step": 369960 }, { "epoch": 1.87, "learning_rate": 2.00180615606601e-05, "loss": 0.007, "step": 369970 }, { "epoch": 1.87, "learning_rate": 2.0010493867646092e-05, "loss": 0.0052, "step": 369980 }, { "epoch": 1.87, "learning_rate": 2.0002926174632084e-05, "loss": 0.0055, "step": 369990 }, { "epoch": 1.87, "learning_rate": 1.9995358481618072e-05, "loss": 0.0046, "step": 370000 }, { "epoch": 1.87, "eval_cer": 0.9144246472852683, "eval_loss": 0.004436591174453497, "eval_runtime": 116.7427, "eval_samples_per_second": 17.132, "eval_steps_per_second": 4.283, "step": 370000 }, { "epoch": 1.87, "learning_rate": 1.9987790788604064e-05, "loss": 0.0047, "step": 370010 }, { "epoch": 1.87, "learning_rate": 1.9980223095590052e-05, "loss": 0.0077, "step": 370020 }, { "epoch": 1.87, "learning_rate": 1.9972655402576043e-05, "loss": 0.0039, "step": 370030 }, { "epoch": 1.87, "learning_rate": 1.996508770956203e-05, "loss": 0.0071, "step": 370040 }, { "epoch": 1.87, "learning_rate": 1.9957520016548023e-05, "loss": 0.0044, "step": 370050 }, { "epoch": 1.87, "learning_rate": 1.994995232353401e-05, "loss": 0.0049, "step": 370060 }, { "epoch": 1.87, "learning_rate": 1.9942384630520003e-05, "loss": 0.0055, "step": 370070 }, { "epoch": 1.87, "learning_rate": 1.9934816937505988e-05, "loss": 0.0046, "step": 370080 }, { "epoch": 1.87, "learning_rate": 1.9927249244491976e-05, "loss": 0.0043, "step": 370090 }, { "epoch": 1.87, "learning_rate": 1.9919681551477968e-05, "loss": 0.0069, "step": 370100 }, { "epoch": 1.87, "learning_rate": 1.9912113858463956e-05, "loss": 0.005, "step": 370110 }, { "epoch": 1.87, "learning_rate": 1.9904546165449948e-05, "loss": 0.007, "step": 370120 }, { "epoch": 1.87, "learning_rate": 1.9896978472435936e-05, "loss": 0.005, "step": 370130 }, { "epoch": 1.87, "learning_rate": 1.9889410779421927e-05, "loss": 0.0073, "step": 370140 }, { "epoch": 1.87, "learning_rate": 1.9881843086407916e-05, "loss": 0.0052, "step": 370150 }, { "epoch": 1.87, "learning_rate": 1.9874275393393907e-05, "loss": 0.0056, "step": 370160 }, { "epoch": 1.87, "learning_rate": 1.9866707700379895e-05, "loss": 0.006, "step": 370170 }, { "epoch": 1.87, "learning_rate": 1.9859140007365887e-05, "loss": 0.0049, "step": 370180 }, { "epoch": 1.87, "learning_rate": 1.9851572314351875e-05, "loss": 0.0052, "step": 370190 }, { "epoch": 1.87, "learning_rate": 1.9844004621337867e-05, "loss": 0.0072, "step": 370200 }, { "epoch": 1.87, "learning_rate": 1.9836436928323855e-05, "loss": 0.005, "step": 370210 }, { "epoch": 1.87, "learning_rate": 1.9828869235309847e-05, "loss": 0.0041, "step": 370220 }, { "epoch": 1.87, "learning_rate": 1.9821301542295835e-05, "loss": 0.0062, "step": 370230 }, { "epoch": 1.87, "learning_rate": 1.9813733849281823e-05, "loss": 0.0067, "step": 370240 }, { "epoch": 1.87, "learning_rate": 1.980616615626781e-05, "loss": 0.0079, "step": 370250 }, { "epoch": 1.87, "learning_rate": 1.9798598463253803e-05, "loss": 0.0051, "step": 370260 }, { "epoch": 1.87, "learning_rate": 1.979103077023979e-05, "loss": 0.0054, "step": 370270 }, { "epoch": 1.87, "learning_rate": 1.9783463077225783e-05, "loss": 0.0046, "step": 370280 }, { "epoch": 1.87, "learning_rate": 1.977589538421177e-05, "loss": 0.0056, "step": 370290 }, { "epoch": 1.87, "learning_rate": 1.9768327691197763e-05, "loss": 0.0058, "step": 370300 }, { "epoch": 1.87, "learning_rate": 1.976075999818375e-05, "loss": 0.0048, "step": 370310 }, { "epoch": 1.87, "learning_rate": 1.9753192305169742e-05, "loss": 0.0044, "step": 370320 }, { "epoch": 1.87, "learning_rate": 1.974562461215573e-05, "loss": 0.0067, "step": 370330 }, { "epoch": 1.87, "learning_rate": 1.9738056919141722e-05, "loss": 0.0066, "step": 370340 }, { "epoch": 1.87, "learning_rate": 1.973048922612771e-05, "loss": 0.0056, "step": 370350 }, { "epoch": 1.87, "learning_rate": 1.9722921533113702e-05, "loss": 0.0064, "step": 370360 }, { "epoch": 1.87, "learning_rate": 1.971535384009969e-05, "loss": 0.0044, "step": 370370 }, { "epoch": 1.87, "learning_rate": 1.9707786147085682e-05, "loss": 0.0058, "step": 370380 }, { "epoch": 1.87, "learning_rate": 1.9700218454071667e-05, "loss": 0.0077, "step": 370390 }, { "epoch": 1.87, "learning_rate": 1.969265076105766e-05, "loss": 0.0057, "step": 370400 }, { "epoch": 1.87, "learning_rate": 1.9685083068043647e-05, "loss": 0.006, "step": 370410 }, { "epoch": 1.87, "learning_rate": 1.9677515375029638e-05, "loss": 0.0039, "step": 370420 }, { "epoch": 1.87, "learning_rate": 1.9669947682015626e-05, "loss": 0.0059, "step": 370430 }, { "epoch": 1.87, "learning_rate": 1.9662379989001618e-05, "loss": 0.0069, "step": 370440 }, { "epoch": 1.87, "learning_rate": 1.9654812295987606e-05, "loss": 0.007, "step": 370450 }, { "epoch": 1.87, "learning_rate": 1.9647244602973598e-05, "loss": 0.0086, "step": 370460 }, { "epoch": 1.87, "learning_rate": 1.9639676909959586e-05, "loss": 0.0069, "step": 370470 }, { "epoch": 1.87, "learning_rate": 1.9632109216945578e-05, "loss": 0.0049, "step": 370480 }, { "epoch": 1.87, "learning_rate": 1.9624541523931566e-05, "loss": 0.0074, "step": 370490 }, { "epoch": 1.87, "learning_rate": 1.9616973830917557e-05, "loss": 0.0054, "step": 370500 }, { "epoch": 1.87, "learning_rate": 1.9609406137903546e-05, "loss": 0.0056, "step": 370510 }, { "epoch": 1.87, "learning_rate": 1.9601838444889537e-05, "loss": 0.0051, "step": 370520 }, { "epoch": 1.87, "learning_rate": 1.9594270751875525e-05, "loss": 0.0051, "step": 370530 }, { "epoch": 1.87, "learning_rate": 1.9586703058861517e-05, "loss": 0.0053, "step": 370540 }, { "epoch": 1.87, "learning_rate": 1.9579135365847502e-05, "loss": 0.0052, "step": 370550 }, { "epoch": 1.87, "learning_rate": 1.9571567672833494e-05, "loss": 0.0054, "step": 370560 }, { "epoch": 1.87, "learning_rate": 1.9563999979819482e-05, "loss": 0.0054, "step": 370570 }, { "epoch": 1.87, "learning_rate": 1.9556432286805473e-05, "loss": 0.006, "step": 370580 }, { "epoch": 1.87, "learning_rate": 1.954886459379146e-05, "loss": 0.0061, "step": 370590 }, { "epoch": 1.87, "learning_rate": 1.9541296900777453e-05, "loss": 0.0066, "step": 370600 }, { "epoch": 1.87, "learning_rate": 1.953372920776344e-05, "loss": 0.0068, "step": 370610 }, { "epoch": 1.87, "learning_rate": 1.9526161514749433e-05, "loss": 0.004, "step": 370620 }, { "epoch": 1.87, "learning_rate": 1.951859382173542e-05, "loss": 0.0069, "step": 370630 }, { "epoch": 1.87, "learning_rate": 1.9511026128721413e-05, "loss": 0.0063, "step": 370640 }, { "epoch": 1.87, "learning_rate": 1.95034584357074e-05, "loss": 0.0071, "step": 370650 }, { "epoch": 1.87, "learning_rate": 1.9495890742693393e-05, "loss": 0.0065, "step": 370660 }, { "epoch": 1.87, "learning_rate": 1.948832304967938e-05, "loss": 0.0064, "step": 370670 }, { "epoch": 1.87, "learning_rate": 1.9480755356665372e-05, "loss": 0.0063, "step": 370680 }, { "epoch": 1.87, "learning_rate": 1.947318766365136e-05, "loss": 0.0066, "step": 370690 }, { "epoch": 1.87, "learning_rate": 1.9465619970637352e-05, "loss": 0.0071, "step": 370700 }, { "epoch": 1.87, "learning_rate": 1.9458052277623337e-05, "loss": 0.0045, "step": 370710 }, { "epoch": 1.87, "learning_rate": 1.945048458460933e-05, "loss": 0.0067, "step": 370720 }, { "epoch": 1.87, "learning_rate": 1.9442916891595317e-05, "loss": 0.0051, "step": 370730 }, { "epoch": 1.87, "learning_rate": 1.943534919858131e-05, "loss": 0.0063, "step": 370740 }, { "epoch": 1.87, "learning_rate": 1.9427781505567297e-05, "loss": 0.0051, "step": 370750 }, { "epoch": 1.87, "learning_rate": 1.942021381255329e-05, "loss": 0.0067, "step": 370760 }, { "epoch": 1.87, "learning_rate": 1.9412646119539277e-05, "loss": 0.0039, "step": 370770 }, { "epoch": 1.87, "learning_rate": 1.9405078426525268e-05, "loss": 0.0065, "step": 370780 }, { "epoch": 1.87, "learning_rate": 1.9397510733511256e-05, "loss": 0.0055, "step": 370790 }, { "epoch": 1.87, "learning_rate": 1.9389943040497248e-05, "loss": 0.0066, "step": 370800 }, { "epoch": 1.87, "learning_rate": 1.9382375347483236e-05, "loss": 0.0062, "step": 370810 }, { "epoch": 1.87, "learning_rate": 1.9374807654469228e-05, "loss": 0.0048, "step": 370820 }, { "epoch": 1.87, "learning_rate": 1.9367239961455216e-05, "loss": 0.0055, "step": 370830 }, { "epoch": 1.87, "learning_rate": 1.9359672268441208e-05, "loss": 0.0062, "step": 370840 }, { "epoch": 1.87, "learning_rate": 1.9352104575427196e-05, "loss": 0.0074, "step": 370850 }, { "epoch": 1.87, "learning_rate": 1.9344536882413188e-05, "loss": 0.0052, "step": 370860 }, { "epoch": 1.87, "learning_rate": 1.9336969189399172e-05, "loss": 0.0056, "step": 370870 }, { "epoch": 1.87, "learning_rate": 1.932940149638516e-05, "loss": 0.0074, "step": 370880 }, { "epoch": 1.87, "learning_rate": 1.9321833803371152e-05, "loss": 0.0064, "step": 370890 }, { "epoch": 1.87, "learning_rate": 1.931426611035714e-05, "loss": 0.0054, "step": 370900 }, { "epoch": 1.87, "learning_rate": 1.9306698417343132e-05, "loss": 0.0053, "step": 370910 }, { "epoch": 1.87, "learning_rate": 1.929913072432912e-05, "loss": 0.005, "step": 370920 }, { "epoch": 1.87, "learning_rate": 1.9291563031315112e-05, "loss": 0.0099, "step": 370930 }, { "epoch": 1.87, "learning_rate": 1.92839953383011e-05, "loss": 0.0077, "step": 370940 }, { "epoch": 1.87, "learning_rate": 1.927642764528709e-05, "loss": 0.0049, "step": 370950 }, { "epoch": 1.87, "learning_rate": 1.9268859952273083e-05, "loss": 0.0057, "step": 370960 }, { "epoch": 1.87, "learning_rate": 1.926129225925907e-05, "loss": 0.0056, "step": 370970 }, { "epoch": 1.87, "learning_rate": 1.9253724566245063e-05, "loss": 0.0049, "step": 370980 }, { "epoch": 1.87, "learning_rate": 1.924615687323105e-05, "loss": 0.0048, "step": 370990 }, { "epoch": 1.87, "learning_rate": 1.9238589180217043e-05, "loss": 0.0069, "step": 371000 }, { "epoch": 1.87, "eval_cer": 0.9144450256039017, "eval_loss": 0.004348627291619778, "eval_runtime": 116.6791, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 371000 }, { "epoch": 1.87, "learning_rate": 1.923102148720303e-05, "loss": 0.0046, "step": 371010 }, { "epoch": 1.87, "learning_rate": 1.9223453794189016e-05, "loss": 0.0054, "step": 371020 }, { "epoch": 1.87, "learning_rate": 1.9215886101175008e-05, "loss": 0.0062, "step": 371030 }, { "epoch": 1.87, "learning_rate": 1.9208318408160996e-05, "loss": 0.0049, "step": 371040 }, { "epoch": 1.87, "learning_rate": 1.9200750715146987e-05, "loss": 0.0048, "step": 371050 }, { "epoch": 1.87, "learning_rate": 1.9193183022132976e-05, "loss": 0.0059, "step": 371060 }, { "epoch": 1.87, "learning_rate": 1.9185615329118967e-05, "loss": 0.0032, "step": 371070 }, { "epoch": 1.87, "learning_rate": 1.9178047636104955e-05, "loss": 0.0069, "step": 371080 }, { "epoch": 1.87, "learning_rate": 1.9170479943090947e-05, "loss": 0.0071, "step": 371090 }, { "epoch": 1.87, "learning_rate": 1.9162912250076935e-05, "loss": 0.0053, "step": 371100 }, { "epoch": 1.87, "learning_rate": 1.9155344557062927e-05, "loss": 0.0069, "step": 371110 }, { "epoch": 1.87, "learning_rate": 1.9147776864048915e-05, "loss": 0.0068, "step": 371120 }, { "epoch": 1.87, "learning_rate": 1.9140209171034907e-05, "loss": 0.0045, "step": 371130 }, { "epoch": 1.87, "learning_rate": 1.9132641478020895e-05, "loss": 0.007, "step": 371140 }, { "epoch": 1.87, "learning_rate": 1.9125073785006887e-05, "loss": 0.0056, "step": 371150 }, { "epoch": 1.87, "learning_rate": 1.9117506091992875e-05, "loss": 0.0048, "step": 371160 }, { "epoch": 1.87, "learning_rate": 1.9109938398978866e-05, "loss": 0.0057, "step": 371170 }, { "epoch": 1.87, "learning_rate": 1.910237070596485e-05, "loss": 0.0044, "step": 371180 }, { "epoch": 1.87, "learning_rate": 1.9094803012950843e-05, "loss": 0.0068, "step": 371190 }, { "epoch": 1.87, "learning_rate": 1.908723531993683e-05, "loss": 0.0061, "step": 371200 }, { "epoch": 1.87, "learning_rate": 1.9079667626922823e-05, "loss": 0.007, "step": 371210 }, { "epoch": 1.87, "learning_rate": 1.907209993390881e-05, "loss": 0.0048, "step": 371220 }, { "epoch": 1.87, "learning_rate": 1.9064532240894802e-05, "loss": 0.0073, "step": 371230 }, { "epoch": 1.87, "learning_rate": 1.905696454788079e-05, "loss": 0.0074, "step": 371240 }, { "epoch": 1.87, "learning_rate": 1.9049396854866782e-05, "loss": 0.0087, "step": 371250 }, { "epoch": 1.87, "learning_rate": 1.904182916185277e-05, "loss": 0.0052, "step": 371260 }, { "epoch": 1.87, "learning_rate": 1.9034261468838762e-05, "loss": 0.0068, "step": 371270 }, { "epoch": 1.87, "learning_rate": 1.902669377582475e-05, "loss": 0.0055, "step": 371280 }, { "epoch": 1.87, "learning_rate": 1.9019126082810742e-05, "loss": 0.0033, "step": 371290 }, { "epoch": 1.87, "learning_rate": 1.901155838979673e-05, "loss": 0.0047, "step": 371300 }, { "epoch": 1.87, "learning_rate": 1.9003990696782722e-05, "loss": 0.0054, "step": 371310 }, { "epoch": 1.87, "learning_rate": 1.899642300376871e-05, "loss": 0.0065, "step": 371320 }, { "epoch": 1.87, "learning_rate": 1.89888553107547e-05, "loss": 0.0046, "step": 371330 }, { "epoch": 1.87, "learning_rate": 1.8981287617740686e-05, "loss": 0.0058, "step": 371340 }, { "epoch": 1.87, "learning_rate": 1.8973719924726678e-05, "loss": 0.0055, "step": 371350 }, { "epoch": 1.87, "learning_rate": 1.8966152231712666e-05, "loss": 0.0062, "step": 371360 }, { "epoch": 1.87, "learning_rate": 1.8958584538698658e-05, "loss": 0.0058, "step": 371370 }, { "epoch": 1.87, "learning_rate": 1.8951016845684646e-05, "loss": 0.0064, "step": 371380 }, { "epoch": 1.87, "learning_rate": 1.8943449152670638e-05, "loss": 0.0063, "step": 371390 }, { "epoch": 1.87, "learning_rate": 1.8935881459656626e-05, "loss": 0.0049, "step": 371400 }, { "epoch": 1.87, "learning_rate": 1.8928313766642617e-05, "loss": 0.0054, "step": 371410 }, { "epoch": 1.87, "learning_rate": 1.8920746073628606e-05, "loss": 0.0066, "step": 371420 }, { "epoch": 1.87, "learning_rate": 1.8913178380614597e-05, "loss": 0.0055, "step": 371430 }, { "epoch": 1.87, "learning_rate": 1.8905610687600586e-05, "loss": 0.0062, "step": 371440 }, { "epoch": 1.87, "learning_rate": 1.8898042994586577e-05, "loss": 0.0049, "step": 371450 }, { "epoch": 1.87, "learning_rate": 1.8890475301572565e-05, "loss": 0.0058, "step": 371460 }, { "epoch": 1.87, "learning_rate": 1.8882907608558557e-05, "loss": 0.0056, "step": 371470 }, { "epoch": 1.87, "learning_rate": 1.8875339915544545e-05, "loss": 0.005, "step": 371480 }, { "epoch": 1.87, "learning_rate": 1.8867772222530533e-05, "loss": 0.0057, "step": 371490 }, { "epoch": 1.87, "learning_rate": 1.886020452951652e-05, "loss": 0.0094, "step": 371500 }, { "epoch": 1.87, "learning_rate": 1.8852636836502513e-05, "loss": 0.0107, "step": 371510 }, { "epoch": 1.87, "learning_rate": 1.88450691434885e-05, "loss": 0.0045, "step": 371520 }, { "epoch": 1.87, "learning_rate": 1.8837501450474493e-05, "loss": 0.006, "step": 371530 }, { "epoch": 1.87, "learning_rate": 1.882993375746048e-05, "loss": 0.0068, "step": 371540 }, { "epoch": 1.87, "learning_rate": 1.8822366064446473e-05, "loss": 0.0079, "step": 371550 }, { "epoch": 1.87, "learning_rate": 1.881479837143246e-05, "loss": 0.0045, "step": 371560 }, { "epoch": 1.87, "learning_rate": 1.8807230678418453e-05, "loss": 0.0041, "step": 371570 }, { "epoch": 1.87, "learning_rate": 1.879966298540444e-05, "loss": 0.0059, "step": 371580 }, { "epoch": 1.87, "learning_rate": 1.8792095292390433e-05, "loss": 0.0046, "step": 371590 }, { "epoch": 1.87, "learning_rate": 1.878452759937642e-05, "loss": 0.0053, "step": 371600 }, { "epoch": 1.87, "learning_rate": 1.8776959906362412e-05, "loss": 0.0045, "step": 371610 }, { "epoch": 1.87, "learning_rate": 1.87693922133484e-05, "loss": 0.0053, "step": 371620 }, { "epoch": 1.87, "learning_rate": 1.8761824520334392e-05, "loss": 0.0049, "step": 371630 }, { "epoch": 1.87, "learning_rate": 1.875425682732038e-05, "loss": 0.0071, "step": 371640 }, { "epoch": 1.88, "learning_rate": 1.874668913430637e-05, "loss": 0.0051, "step": 371650 }, { "epoch": 1.88, "learning_rate": 1.873912144129236e-05, "loss": 0.004, "step": 371660 }, { "epoch": 1.88, "learning_rate": 1.873155374827835e-05, "loss": 0.0063, "step": 371670 }, { "epoch": 1.88, "learning_rate": 1.872398605526434e-05, "loss": 0.0059, "step": 371680 }, { "epoch": 1.88, "learning_rate": 1.8716418362250328e-05, "loss": 0.0069, "step": 371690 }, { "epoch": 1.88, "learning_rate": 1.8708850669236316e-05, "loss": 0.0046, "step": 371700 }, { "epoch": 1.88, "learning_rate": 1.8701282976222308e-05, "loss": 0.0056, "step": 371710 }, { "epoch": 1.88, "learning_rate": 1.8693715283208296e-05, "loss": 0.0068, "step": 371720 }, { "epoch": 1.88, "learning_rate": 1.8686147590194288e-05, "loss": 0.0055, "step": 371730 }, { "epoch": 1.88, "learning_rate": 1.8678579897180276e-05, "loss": 0.0061, "step": 371740 }, { "epoch": 1.88, "learning_rate": 1.8671012204166268e-05, "loss": 0.0054, "step": 371750 }, { "epoch": 1.88, "learning_rate": 1.8663444511152256e-05, "loss": 0.0063, "step": 371760 }, { "epoch": 1.88, "learning_rate": 1.8655876818138244e-05, "loss": 0.0044, "step": 371770 }, { "epoch": 1.88, "learning_rate": 1.8648309125124232e-05, "loss": 0.009, "step": 371780 }, { "epoch": 1.88, "learning_rate": 1.8640741432110224e-05, "loss": 0.0083, "step": 371790 }, { "epoch": 1.88, "learning_rate": 1.8633173739096216e-05, "loss": 0.0165, "step": 371800 }, { "epoch": 1.88, "learning_rate": 1.8625606046082204e-05, "loss": 0.004, "step": 371810 }, { "epoch": 1.88, "learning_rate": 1.8618038353068195e-05, "loss": 0.0045, "step": 371820 }, { "epoch": 1.88, "learning_rate": 1.8610470660054184e-05, "loss": 0.0055, "step": 371830 }, { "epoch": 1.88, "learning_rate": 1.8602902967040175e-05, "loss": 0.0069, "step": 371840 }, { "epoch": 1.88, "learning_rate": 1.859533527402616e-05, "loss": 0.0052, "step": 371850 }, { "epoch": 1.88, "learning_rate": 1.8587767581012152e-05, "loss": 0.0053, "step": 371860 }, { "epoch": 1.88, "learning_rate": 1.858019988799814e-05, "loss": 0.0058, "step": 371870 }, { "epoch": 1.88, "learning_rate": 1.857263219498413e-05, "loss": 0.0056, "step": 371880 }, { "epoch": 1.88, "learning_rate": 1.856506450197012e-05, "loss": 0.0041, "step": 371890 }, { "epoch": 1.88, "learning_rate": 1.855749680895611e-05, "loss": 0.0062, "step": 371900 }, { "epoch": 1.88, "learning_rate": 1.85499291159421e-05, "loss": 0.0091, "step": 371910 }, { "epoch": 1.88, "learning_rate": 1.854236142292809e-05, "loss": 0.0052, "step": 371920 }, { "epoch": 1.88, "learning_rate": 1.853479372991408e-05, "loss": 0.0055, "step": 371930 }, { "epoch": 1.88, "learning_rate": 1.8527226036900068e-05, "loss": 0.007, "step": 371940 }, { "epoch": 1.88, "learning_rate": 1.851965834388606e-05, "loss": 0.0053, "step": 371950 }, { "epoch": 1.88, "learning_rate": 1.8512090650872047e-05, "loss": 0.0066, "step": 371960 }, { "epoch": 1.88, "learning_rate": 1.850452295785804e-05, "loss": 0.0068, "step": 371970 }, { "epoch": 1.88, "learning_rate": 1.8496955264844027e-05, "loss": 0.0047, "step": 371980 }, { "epoch": 1.88, "learning_rate": 1.848938757183002e-05, "loss": 0.006, "step": 371990 }, { "epoch": 1.88, "learning_rate": 1.8481819878816007e-05, "loss": 0.0052, "step": 372000 }, { "epoch": 1.88, "eval_cer": 0.914423676889143, "eval_loss": 0.004319104366004467, "eval_runtime": 116.6762, "eval_samples_per_second": 17.141, "eval_steps_per_second": 4.285, "step": 372000 }, { "epoch": 1.88, "learning_rate": 1.8474252185801995e-05, "loss": 0.0082, "step": 372010 }, { "epoch": 1.88, "learning_rate": 1.8466684492787987e-05, "loss": 0.0047, "step": 372020 }, { "epoch": 1.88, "learning_rate": 1.8459116799773975e-05, "loss": 0.0046, "step": 372030 }, { "epoch": 1.88, "learning_rate": 1.8451549106759967e-05, "loss": 0.0052, "step": 372040 }, { "epoch": 1.88, "learning_rate": 1.8443981413745955e-05, "loss": 0.005, "step": 372050 }, { "epoch": 1.88, "learning_rate": 1.8436413720731947e-05, "loss": 0.0072, "step": 372060 }, { "epoch": 1.88, "learning_rate": 1.8428846027717935e-05, "loss": 0.0044, "step": 372070 }, { "epoch": 1.88, "learning_rate": 1.8421278334703923e-05, "loss": 0.0104, "step": 372080 }, { "epoch": 1.88, "learning_rate": 1.8413710641689915e-05, "loss": 0.0045, "step": 372090 }, { "epoch": 1.88, "learning_rate": 1.8406142948675903e-05, "loss": 0.0161, "step": 372100 }, { "epoch": 1.88, "learning_rate": 1.8398575255661894e-05, "loss": 0.0056, "step": 372110 }, { "epoch": 1.88, "learning_rate": 1.8391007562647883e-05, "loss": 0.0065, "step": 372120 }, { "epoch": 1.88, "learning_rate": 1.8383439869633874e-05, "loss": 0.0052, "step": 372130 }, { "epoch": 1.88, "learning_rate": 1.8375872176619862e-05, "loss": 0.0055, "step": 372140 }, { "epoch": 1.88, "learning_rate": 1.8368304483605854e-05, "loss": 0.0057, "step": 372150 }, { "epoch": 1.88, "learning_rate": 1.8360736790591842e-05, "loss": 0.0057, "step": 372160 }, { "epoch": 1.88, "learning_rate": 1.835316909757783e-05, "loss": 0.0046, "step": 372170 }, { "epoch": 1.88, "learning_rate": 1.8345601404563822e-05, "loss": 0.006, "step": 372180 }, { "epoch": 1.88, "learning_rate": 1.833803371154981e-05, "loss": 0.0073, "step": 372190 }, { "epoch": 1.88, "learning_rate": 1.8330466018535802e-05, "loss": 0.0065, "step": 372200 }, { "epoch": 1.88, "learning_rate": 1.832289832552179e-05, "loss": 0.0045, "step": 372210 }, { "epoch": 1.88, "learning_rate": 1.8315330632507782e-05, "loss": 0.0055, "step": 372220 }, { "epoch": 1.88, "learning_rate": 1.830776293949377e-05, "loss": 0.0057, "step": 372230 }, { "epoch": 1.88, "learning_rate": 1.8300195246479758e-05, "loss": 0.0072, "step": 372240 }, { "epoch": 1.88, "learning_rate": 1.829262755346575e-05, "loss": 0.0058, "step": 372250 }, { "epoch": 1.88, "learning_rate": 1.8285059860451738e-05, "loss": 0.0052, "step": 372260 }, { "epoch": 1.88, "learning_rate": 1.827749216743773e-05, "loss": 0.0062, "step": 372270 }, { "epoch": 1.88, "learning_rate": 1.8269924474423718e-05, "loss": 0.0049, "step": 372280 }, { "epoch": 1.88, "learning_rate": 1.826235678140971e-05, "loss": 0.0054, "step": 372290 }, { "epoch": 1.88, "learning_rate": 1.8254789088395698e-05, "loss": 0.0044, "step": 372300 }, { "epoch": 1.88, "learning_rate": 1.824722139538169e-05, "loss": 0.0048, "step": 372310 }, { "epoch": 1.88, "learning_rate": 1.8239653702367678e-05, "loss": 0.007, "step": 372320 }, { "epoch": 1.88, "learning_rate": 1.8232086009353666e-05, "loss": 0.0065, "step": 372330 }, { "epoch": 1.88, "learning_rate": 1.8224518316339657e-05, "loss": 0.0048, "step": 372340 }, { "epoch": 1.88, "learning_rate": 1.8216950623325646e-05, "loss": 0.0063, "step": 372350 }, { "epoch": 1.88, "learning_rate": 1.8209382930311637e-05, "loss": 0.0089, "step": 372360 }, { "epoch": 1.88, "learning_rate": 1.8201815237297625e-05, "loss": 0.0054, "step": 372370 }, { "epoch": 1.88, "learning_rate": 1.8194247544283617e-05, "loss": 0.0057, "step": 372380 }, { "epoch": 1.88, "learning_rate": 1.8186679851269605e-05, "loss": 0.0048, "step": 372390 }, { "epoch": 1.88, "learning_rate": 1.8179112158255593e-05, "loss": 0.0066, "step": 372400 }, { "epoch": 1.88, "learning_rate": 1.8171544465241585e-05, "loss": 0.0072, "step": 372410 }, { "epoch": 1.88, "learning_rate": 1.8163976772227573e-05, "loss": 0.0058, "step": 372420 }, { "epoch": 1.88, "learning_rate": 1.8156409079213565e-05, "loss": 0.0051, "step": 372430 }, { "epoch": 1.88, "learning_rate": 1.8148841386199553e-05, "loss": 0.0044, "step": 372440 }, { "epoch": 1.88, "learning_rate": 1.8141273693185545e-05, "loss": 0.0075, "step": 372450 }, { "epoch": 1.88, "learning_rate": 1.8133706000171533e-05, "loss": 0.0039, "step": 372460 }, { "epoch": 1.88, "learning_rate": 1.8126138307157525e-05, "loss": 0.0068, "step": 372470 }, { "epoch": 1.88, "learning_rate": 1.8118570614143513e-05, "loss": 0.0055, "step": 372480 }, { "epoch": 1.88, "learning_rate": 1.81110029211295e-05, "loss": 0.0045, "step": 372490 }, { "epoch": 1.88, "learning_rate": 1.8103435228115493e-05, "loss": 0.0053, "step": 372500 }, { "epoch": 1.88, "learning_rate": 1.809586753510148e-05, "loss": 0.0059, "step": 372510 }, { "epoch": 1.88, "learning_rate": 1.8088299842087472e-05, "loss": 0.0071, "step": 372520 }, { "epoch": 1.88, "learning_rate": 1.808073214907346e-05, "loss": 0.0056, "step": 372530 }, { "epoch": 1.88, "learning_rate": 1.8073164456059452e-05, "loss": 0.0044, "step": 372540 }, { "epoch": 1.88, "learning_rate": 1.806559676304544e-05, "loss": 0.0078, "step": 372550 }, { "epoch": 1.88, "learning_rate": 1.805802907003143e-05, "loss": 0.0081, "step": 372560 }, { "epoch": 1.88, "learning_rate": 1.805046137701742e-05, "loss": 0.0048, "step": 372570 }, { "epoch": 1.88, "learning_rate": 1.804289368400341e-05, "loss": 0.0059, "step": 372580 }, { "epoch": 1.88, "learning_rate": 1.80353259909894e-05, "loss": 0.0039, "step": 372590 }, { "epoch": 1.88, "learning_rate": 1.802775829797539e-05, "loss": 0.005, "step": 372600 }, { "epoch": 1.88, "learning_rate": 1.802019060496138e-05, "loss": 0.0049, "step": 372610 }, { "epoch": 1.88, "learning_rate": 1.8012622911947368e-05, "loss": 0.0064, "step": 372620 }, { "epoch": 1.88, "learning_rate": 1.8005055218933356e-05, "loss": 0.0047, "step": 372630 }, { "epoch": 1.88, "learning_rate": 1.7997487525919348e-05, "loss": 0.0055, "step": 372640 }, { "epoch": 1.88, "learning_rate": 1.7989919832905336e-05, "loss": 0.0057, "step": 372650 }, { "epoch": 1.88, "learning_rate": 1.7982352139891328e-05, "loss": 0.0072, "step": 372660 }, { "epoch": 1.88, "learning_rate": 1.7974784446877316e-05, "loss": 0.0048, "step": 372670 }, { "epoch": 1.88, "learning_rate": 1.7967216753863308e-05, "loss": 0.0052, "step": 372680 }, { "epoch": 1.88, "learning_rate": 1.7959649060849296e-05, "loss": 0.0037, "step": 372690 }, { "epoch": 1.88, "learning_rate": 1.7952081367835287e-05, "loss": 0.0057, "step": 372700 }, { "epoch": 1.88, "learning_rate": 1.7944513674821272e-05, "loss": 0.004, "step": 372710 }, { "epoch": 1.88, "learning_rate": 1.7936945981807264e-05, "loss": 0.0043, "step": 372720 }, { "epoch": 1.88, "learning_rate": 1.7929378288793252e-05, "loss": 0.0063, "step": 372730 }, { "epoch": 1.88, "learning_rate": 1.7921810595779244e-05, "loss": 0.0068, "step": 372740 }, { "epoch": 1.88, "learning_rate": 1.7914242902765232e-05, "loss": 0.0064, "step": 372750 }, { "epoch": 1.88, "learning_rate": 1.7906675209751224e-05, "loss": 0.0071, "step": 372760 }, { "epoch": 1.88, "learning_rate": 1.7899107516737215e-05, "loss": 0.0064, "step": 372770 }, { "epoch": 1.88, "learning_rate": 1.7891539823723203e-05, "loss": 0.0056, "step": 372780 }, { "epoch": 1.88, "learning_rate": 1.788397213070919e-05, "loss": 0.0047, "step": 372790 }, { "epoch": 1.88, "learning_rate": 1.787640443769518e-05, "loss": 0.0042, "step": 372800 }, { "epoch": 1.88, "learning_rate": 1.786883674468117e-05, "loss": 0.0075, "step": 372810 }, { "epoch": 1.88, "learning_rate": 1.786126905166716e-05, "loss": 0.004, "step": 372820 }, { "epoch": 1.88, "learning_rate": 1.785370135865315e-05, "loss": 0.0065, "step": 372830 }, { "epoch": 1.88, "learning_rate": 1.784613366563914e-05, "loss": 0.0063, "step": 372840 }, { "epoch": 1.88, "learning_rate": 1.783856597262513e-05, "loss": 0.006, "step": 372850 }, { "epoch": 1.88, "learning_rate": 1.783099827961112e-05, "loss": 0.0049, "step": 372860 }, { "epoch": 1.88, "learning_rate": 1.7823430586597108e-05, "loss": 0.0045, "step": 372870 }, { "epoch": 1.88, "learning_rate": 1.78158628935831e-05, "loss": 0.0057, "step": 372880 }, { "epoch": 1.88, "learning_rate": 1.7808295200569087e-05, "loss": 0.0073, "step": 372890 }, { "epoch": 1.88, "learning_rate": 1.780072750755508e-05, "loss": 0.0043, "step": 372900 }, { "epoch": 1.88, "learning_rate": 1.7793159814541067e-05, "loss": 0.0058, "step": 372910 }, { "epoch": 1.88, "learning_rate": 1.778559212152706e-05, "loss": 0.0074, "step": 372920 }, { "epoch": 1.88, "learning_rate": 1.7778024428513047e-05, "loss": 0.0053, "step": 372930 }, { "epoch": 1.88, "learning_rate": 1.777045673549904e-05, "loss": 0.0078, "step": 372940 }, { "epoch": 1.88, "learning_rate": 1.7762889042485027e-05, "loss": 0.005, "step": 372950 }, { "epoch": 1.88, "learning_rate": 1.7755321349471015e-05, "loss": 0.0051, "step": 372960 }, { "epoch": 1.88, "learning_rate": 1.7747753656457007e-05, "loss": 0.0078, "step": 372970 }, { "epoch": 1.88, "learning_rate": 1.7740185963442995e-05, "loss": 0.006, "step": 372980 }, { "epoch": 1.88, "learning_rate": 1.7732618270428986e-05, "loss": 0.0034, "step": 372990 }, { "epoch": 1.88, "learning_rate": 1.7725050577414975e-05, "loss": 0.0082, "step": 373000 }, { "epoch": 1.88, "eval_cer": 0.9144353216426477, "eval_loss": 0.00432598264887929, "eval_runtime": 116.7735, "eval_samples_per_second": 17.127, "eval_steps_per_second": 4.282, "step": 373000 }, { "epoch": 1.88, "learning_rate": 1.7717482884400966e-05, "loss": 0.009, "step": 373010 }, { "epoch": 1.88, "learning_rate": 1.7709915191386954e-05, "loss": 0.0066, "step": 373020 }, { "epoch": 1.88, "learning_rate": 1.7702347498372943e-05, "loss": 0.0064, "step": 373030 }, { "epoch": 1.88, "learning_rate": 1.7694779805358934e-05, "loss": 0.0052, "step": 373040 }, { "epoch": 1.88, "learning_rate": 1.7687212112344923e-05, "loss": 0.01, "step": 373050 }, { "epoch": 1.88, "learning_rate": 1.7679644419330914e-05, "loss": 0.0044, "step": 373060 }, { "epoch": 1.88, "learning_rate": 1.7672076726316902e-05, "loss": 0.0077, "step": 373070 }, { "epoch": 1.88, "learning_rate": 1.7664509033302894e-05, "loss": 0.0049, "step": 373080 }, { "epoch": 1.88, "learning_rate": 1.7656941340288882e-05, "loss": 0.007, "step": 373090 }, { "epoch": 1.88, "learning_rate": 1.764937364727487e-05, "loss": 0.006, "step": 373100 }, { "epoch": 1.88, "learning_rate": 1.7641805954260862e-05, "loss": 0.0057, "step": 373110 }, { "epoch": 1.88, "learning_rate": 1.763423826124685e-05, "loss": 0.0048, "step": 373120 }, { "epoch": 1.88, "learning_rate": 1.7626670568232842e-05, "loss": 0.0064, "step": 373130 }, { "epoch": 1.88, "learning_rate": 1.761910287521883e-05, "loss": 0.0047, "step": 373140 }, { "epoch": 1.88, "learning_rate": 1.761153518220482e-05, "loss": 0.0072, "step": 373150 }, { "epoch": 1.88, "learning_rate": 1.760396748919081e-05, "loss": 0.0076, "step": 373160 }, { "epoch": 1.88, "learning_rate": 1.75963997961768e-05, "loss": 0.0067, "step": 373170 }, { "epoch": 1.88, "learning_rate": 1.758883210316279e-05, "loss": 0.0056, "step": 373180 }, { "epoch": 1.88, "learning_rate": 1.7581264410148778e-05, "loss": 0.0055, "step": 373190 }, { "epoch": 1.88, "learning_rate": 1.757369671713477e-05, "loss": 0.0044, "step": 373200 }, { "epoch": 1.88, "learning_rate": 1.7566129024120758e-05, "loss": 0.006, "step": 373210 }, { "epoch": 1.88, "learning_rate": 1.755856133110675e-05, "loss": 0.0072, "step": 373220 }, { "epoch": 1.88, "learning_rate": 1.7550993638092738e-05, "loss": 0.0051, "step": 373230 }, { "epoch": 1.88, "learning_rate": 1.754342594507873e-05, "loss": 0.0062, "step": 373240 }, { "epoch": 1.88, "learning_rate": 1.7535858252064717e-05, "loss": 0.0054, "step": 373250 }, { "epoch": 1.88, "learning_rate": 1.7528290559050706e-05, "loss": 0.0049, "step": 373260 }, { "epoch": 1.88, "learning_rate": 1.7520722866036697e-05, "loss": 0.0063, "step": 373270 }, { "epoch": 1.88, "learning_rate": 1.7513155173022685e-05, "loss": 0.007, "step": 373280 }, { "epoch": 1.88, "learning_rate": 1.7505587480008677e-05, "loss": 0.0078, "step": 373290 }, { "epoch": 1.88, "learning_rate": 1.7498019786994665e-05, "loss": 0.0065, "step": 373300 }, { "epoch": 1.88, "learning_rate": 1.7490452093980657e-05, "loss": 0.0074, "step": 373310 }, { "epoch": 1.88, "learning_rate": 1.7482884400966645e-05, "loss": 0.0038, "step": 373320 }, { "epoch": 1.88, "learning_rate": 1.7475316707952637e-05, "loss": 0.0068, "step": 373330 }, { "epoch": 1.88, "learning_rate": 1.7467749014938625e-05, "loss": 0.0052, "step": 373340 }, { "epoch": 1.88, "learning_rate": 1.7460181321924613e-05, "loss": 0.0068, "step": 373350 }, { "epoch": 1.88, "learning_rate": 1.7452613628910605e-05, "loss": 0.0049, "step": 373360 }, { "epoch": 1.88, "learning_rate": 1.7445045935896593e-05, "loss": 0.0066, "step": 373370 }, { "epoch": 1.88, "learning_rate": 1.7437478242882585e-05, "loss": 0.0049, "step": 373380 }, { "epoch": 1.88, "learning_rate": 1.7429910549868573e-05, "loss": 0.0058, "step": 373390 }, { "epoch": 1.88, "learning_rate": 1.7422342856854564e-05, "loss": 0.0051, "step": 373400 }, { "epoch": 1.88, "learning_rate": 1.7414775163840553e-05, "loss": 0.0069, "step": 373410 }, { "epoch": 1.88, "learning_rate": 1.740720747082654e-05, "loss": 0.0064, "step": 373420 }, { "epoch": 1.88, "learning_rate": 1.7399639777812532e-05, "loss": 0.0065, "step": 373430 }, { "epoch": 1.88, "learning_rate": 1.739207208479852e-05, "loss": 0.0067, "step": 373440 }, { "epoch": 1.88, "learning_rate": 1.7384504391784512e-05, "loss": 0.0053, "step": 373450 }, { "epoch": 1.88, "learning_rate": 1.73769366987705e-05, "loss": 0.0046, "step": 373460 }, { "epoch": 1.88, "learning_rate": 1.7369369005756492e-05, "loss": 0.0067, "step": 373470 }, { "epoch": 1.88, "learning_rate": 1.736180131274248e-05, "loss": 0.0057, "step": 373480 }, { "epoch": 1.88, "learning_rate": 1.7354233619728472e-05, "loss": 0.006, "step": 373490 }, { "epoch": 1.88, "learning_rate": 1.734666592671446e-05, "loss": 0.0041, "step": 373500 }, { "epoch": 1.88, "learning_rate": 1.733909823370045e-05, "loss": 0.0062, "step": 373510 }, { "epoch": 1.88, "learning_rate": 1.733153054068644e-05, "loss": 0.0064, "step": 373520 }, { "epoch": 1.88, "learning_rate": 1.7323962847672428e-05, "loss": 0.006, "step": 373530 }, { "epoch": 1.88, "learning_rate": 1.731639515465842e-05, "loss": 0.0067, "step": 373540 }, { "epoch": 1.88, "learning_rate": 1.7308827461644408e-05, "loss": 0.0062, "step": 373550 }, { "epoch": 1.88, "learning_rate": 1.73012597686304e-05, "loss": 0.0057, "step": 373560 }, { "epoch": 1.88, "learning_rate": 1.7293692075616388e-05, "loss": 0.0058, "step": 373570 }, { "epoch": 1.88, "learning_rate": 1.7286124382602376e-05, "loss": 0.0061, "step": 373580 }, { "epoch": 1.88, "learning_rate": 1.7278556689588364e-05, "loss": 0.005, "step": 373590 }, { "epoch": 1.88, "learning_rate": 1.7270988996574356e-05, "loss": 0.0078, "step": 373600 }, { "epoch": 1.88, "learning_rate": 1.7263421303560347e-05, "loss": 0.0081, "step": 373610 }, { "epoch": 1.88, "learning_rate": 1.7255853610546336e-05, "loss": 0.006, "step": 373620 }, { "epoch": 1.89, "learning_rate": 1.7248285917532327e-05, "loss": 0.0054, "step": 373630 }, { "epoch": 1.89, "learning_rate": 1.7240718224518316e-05, "loss": 0.0055, "step": 373640 }, { "epoch": 1.89, "learning_rate": 1.7233150531504304e-05, "loss": 0.0077, "step": 373650 }, { "epoch": 1.89, "learning_rate": 1.7225582838490292e-05, "loss": 0.0061, "step": 373660 }, { "epoch": 1.89, "learning_rate": 1.7218015145476284e-05, "loss": 0.0067, "step": 373670 }, { "epoch": 1.89, "learning_rate": 1.7210447452462272e-05, "loss": 0.0044, "step": 373680 }, { "epoch": 1.89, "learning_rate": 1.7202879759448263e-05, "loss": 0.0076, "step": 373690 }, { "epoch": 1.89, "learning_rate": 1.719531206643425e-05, "loss": 0.004, "step": 373700 }, { "epoch": 1.89, "learning_rate": 1.7187744373420243e-05, "loss": 0.0059, "step": 373710 }, { "epoch": 1.89, "learning_rate": 1.718017668040623e-05, "loss": 0.0082, "step": 373720 }, { "epoch": 1.89, "learning_rate": 1.717260898739222e-05, "loss": 0.0071, "step": 373730 }, { "epoch": 1.89, "learning_rate": 1.716504129437821e-05, "loss": 0.0061, "step": 373740 }, { "epoch": 1.89, "learning_rate": 1.71574736013642e-05, "loss": 0.0046, "step": 373750 }, { "epoch": 1.89, "learning_rate": 1.714990590835019e-05, "loss": 0.0051, "step": 373760 }, { "epoch": 1.89, "learning_rate": 1.714233821533618e-05, "loss": 0.005, "step": 373770 }, { "epoch": 1.89, "learning_rate": 1.713477052232217e-05, "loss": 0.0053, "step": 373780 }, { "epoch": 1.89, "learning_rate": 1.712720282930816e-05, "loss": 0.0062, "step": 373790 }, { "epoch": 1.89, "learning_rate": 1.711963513629415e-05, "loss": 0.0068, "step": 373800 }, { "epoch": 1.89, "learning_rate": 1.711206744328014e-05, "loss": 0.0082, "step": 373810 }, { "epoch": 1.89, "learning_rate": 1.7104499750266127e-05, "loss": 0.0077, "step": 373820 }, { "epoch": 1.89, "learning_rate": 1.709693205725212e-05, "loss": 0.0064, "step": 373830 }, { "epoch": 1.89, "learning_rate": 1.7089364364238107e-05, "loss": 0.0068, "step": 373840 }, { "epoch": 1.89, "learning_rate": 1.70817966712241e-05, "loss": 0.0057, "step": 373850 }, { "epoch": 1.89, "learning_rate": 1.7074228978210087e-05, "loss": 0.0046, "step": 373860 }, { "epoch": 1.89, "learning_rate": 1.706666128519608e-05, "loss": 0.0052, "step": 373870 }, { "epoch": 1.89, "learning_rate": 1.7059093592182067e-05, "loss": 0.0073, "step": 373880 }, { "epoch": 1.89, "learning_rate": 1.7051525899168055e-05, "loss": 0.005, "step": 373890 }, { "epoch": 1.89, "learning_rate": 1.7043958206154047e-05, "loss": 0.0065, "step": 373900 }, { "epoch": 1.89, "learning_rate": 1.7036390513140035e-05, "loss": 0.0049, "step": 373910 }, { "epoch": 1.89, "learning_rate": 1.7028822820126026e-05, "loss": 0.0044, "step": 373920 }, { "epoch": 1.89, "learning_rate": 1.7021255127112015e-05, "loss": 0.005, "step": 373930 }, { "epoch": 1.89, "learning_rate": 1.7013687434098006e-05, "loss": 0.0069, "step": 373940 }, { "epoch": 1.89, "learning_rate": 1.7006119741083994e-05, "loss": 0.0076, "step": 373950 }, { "epoch": 1.89, "learning_rate": 1.6998552048069986e-05, "loss": 0.0046, "step": 373960 }, { "epoch": 1.89, "learning_rate": 1.6990984355055974e-05, "loss": 0.0064, "step": 373970 }, { "epoch": 1.89, "learning_rate": 1.6983416662041962e-05, "loss": 0.0059, "step": 373980 }, { "epoch": 1.89, "learning_rate": 1.6975848969027954e-05, "loss": 0.0058, "step": 373990 }, { "epoch": 1.89, "learning_rate": 1.6968281276013942e-05, "loss": 0.005, "step": 374000 }, { "epoch": 1.89, "eval_cer": 0.9144294992658953, "eval_loss": 0.004294942133128643, "eval_runtime": 116.742, "eval_samples_per_second": 17.132, "eval_steps_per_second": 4.283, "step": 374000 }, { "epoch": 1.89, "learning_rate": 1.6960713582999934e-05, "loss": 0.0042, "step": 374010 }, { "epoch": 1.89, "learning_rate": 1.6953145889985922e-05, "loss": 0.0059, "step": 374020 }, { "epoch": 1.89, "learning_rate": 1.6945578196971914e-05, "loss": 0.0079, "step": 374030 }, { "epoch": 1.89, "learning_rate": 1.6938010503957902e-05, "loss": 0.0031, "step": 374040 }, { "epoch": 1.89, "learning_rate": 1.693044281094389e-05, "loss": 0.0058, "step": 374050 }, { "epoch": 1.89, "learning_rate": 1.6922875117929882e-05, "loss": 0.0061, "step": 374060 }, { "epoch": 1.89, "learning_rate": 1.691530742491587e-05, "loss": 0.0053, "step": 374070 }, { "epoch": 1.89, "learning_rate": 1.690773973190186e-05, "loss": 0.0054, "step": 374080 }, { "epoch": 1.89, "learning_rate": 1.690017203888785e-05, "loss": 0.0043, "step": 374090 }, { "epoch": 1.89, "learning_rate": 1.689260434587384e-05, "loss": 0.0077, "step": 374100 }, { "epoch": 1.89, "learning_rate": 1.688503665285983e-05, "loss": 0.0062, "step": 374110 }, { "epoch": 1.89, "learning_rate": 1.687746895984582e-05, "loss": 0.0052, "step": 374120 }, { "epoch": 1.89, "learning_rate": 1.686990126683181e-05, "loss": 0.0058, "step": 374130 }, { "epoch": 1.89, "learning_rate": 1.6862333573817798e-05, "loss": 0.0059, "step": 374140 }, { "epoch": 1.89, "learning_rate": 1.685476588080379e-05, "loss": 0.0068, "step": 374150 }, { "epoch": 1.89, "learning_rate": 1.6847198187789777e-05, "loss": 0.0053, "step": 374160 }, { "epoch": 1.89, "learning_rate": 1.683963049477577e-05, "loss": 0.005, "step": 374170 }, { "epoch": 1.89, "learning_rate": 1.6832062801761757e-05, "loss": 0.0045, "step": 374180 }, { "epoch": 1.89, "learning_rate": 1.682449510874775e-05, "loss": 0.0035, "step": 374190 }, { "epoch": 1.89, "learning_rate": 1.6816927415733737e-05, "loss": 0.0072, "step": 374200 }, { "epoch": 1.89, "learning_rate": 1.6809359722719725e-05, "loss": 0.0059, "step": 374210 }, { "epoch": 1.89, "learning_rate": 1.6801792029705717e-05, "loss": 0.0056, "step": 374220 }, { "epoch": 1.89, "learning_rate": 1.6794224336691705e-05, "loss": 0.0065, "step": 374230 }, { "epoch": 1.89, "learning_rate": 1.6786656643677697e-05, "loss": 0.0052, "step": 374240 }, { "epoch": 1.89, "learning_rate": 1.6779088950663685e-05, "loss": 0.0047, "step": 374250 }, { "epoch": 1.89, "learning_rate": 1.6771521257649677e-05, "loss": 0.0054, "step": 374260 }, { "epoch": 1.89, "learning_rate": 1.6763953564635665e-05, "loss": 0.006, "step": 374270 }, { "epoch": 1.89, "learning_rate": 1.6756385871621653e-05, "loss": 0.0059, "step": 374280 }, { "epoch": 1.89, "learning_rate": 1.6748818178607645e-05, "loss": 0.0045, "step": 374290 }, { "epoch": 1.89, "learning_rate": 1.6741250485593633e-05, "loss": 0.0076, "step": 374300 }, { "epoch": 1.89, "learning_rate": 1.6733682792579624e-05, "loss": 0.0044, "step": 374310 }, { "epoch": 1.89, "learning_rate": 1.6726115099565613e-05, "loss": 0.0056, "step": 374320 }, { "epoch": 1.89, "learning_rate": 1.6718547406551604e-05, "loss": 0.0053, "step": 374330 }, { "epoch": 1.89, "learning_rate": 1.6710979713537593e-05, "loss": 0.0071, "step": 374340 }, { "epoch": 1.89, "learning_rate": 1.6703412020523584e-05, "loss": 0.0051, "step": 374350 }, { "epoch": 1.89, "learning_rate": 1.6695844327509572e-05, "loss": 0.0064, "step": 374360 }, { "epoch": 1.89, "learning_rate": 1.668827663449556e-05, "loss": 0.006, "step": 374370 }, { "epoch": 1.89, "learning_rate": 1.6680708941481552e-05, "loss": 0.0049, "step": 374380 }, { "epoch": 1.89, "learning_rate": 1.667314124846754e-05, "loss": 0.0083, "step": 374390 }, { "epoch": 1.89, "learning_rate": 1.6665573555453532e-05, "loss": 0.004, "step": 374400 }, { "epoch": 1.89, "learning_rate": 1.665800586243952e-05, "loss": 0.0063, "step": 374410 }, { "epoch": 1.89, "learning_rate": 1.6650438169425512e-05, "loss": 0.0058, "step": 374420 }, { "epoch": 1.89, "learning_rate": 1.66428704764115e-05, "loss": 0.0054, "step": 374430 }, { "epoch": 1.89, "learning_rate": 1.6635302783397488e-05, "loss": 0.006, "step": 374440 }, { "epoch": 1.89, "learning_rate": 1.6627735090383476e-05, "loss": 0.0062, "step": 374450 }, { "epoch": 1.89, "learning_rate": 1.6620167397369468e-05, "loss": 0.0064, "step": 374460 }, { "epoch": 1.89, "learning_rate": 1.661259970435546e-05, "loss": 0.007, "step": 374470 }, { "epoch": 1.89, "learning_rate": 1.6605032011341448e-05, "loss": 0.0066, "step": 374480 }, { "epoch": 1.89, "learning_rate": 1.659746431832744e-05, "loss": 0.0079, "step": 374490 }, { "epoch": 1.89, "learning_rate": 1.6589896625313428e-05, "loss": 0.0062, "step": 374500 }, { "epoch": 1.89, "learning_rate": 1.658232893229942e-05, "loss": 0.0062, "step": 374510 }, { "epoch": 1.89, "learning_rate": 1.6574761239285404e-05, "loss": 0.0063, "step": 374520 }, { "epoch": 1.89, "learning_rate": 1.6567193546271396e-05, "loss": 0.0057, "step": 374530 }, { "epoch": 1.89, "learning_rate": 1.6559625853257384e-05, "loss": 0.0049, "step": 374540 }, { "epoch": 1.89, "learning_rate": 1.6552058160243376e-05, "loss": 0.0063, "step": 374550 }, { "epoch": 1.89, "learning_rate": 1.6544490467229364e-05, "loss": 0.0048, "step": 374560 }, { "epoch": 1.89, "learning_rate": 1.6536922774215355e-05, "loss": 0.0062, "step": 374570 }, { "epoch": 1.89, "learning_rate": 1.6529355081201347e-05, "loss": 0.0056, "step": 374580 }, { "epoch": 1.89, "learning_rate": 1.6521787388187335e-05, "loss": 0.0056, "step": 374590 }, { "epoch": 1.89, "learning_rate": 1.6514219695173323e-05, "loss": 0.0063, "step": 374600 }, { "epoch": 1.89, "learning_rate": 1.650665200215931e-05, "loss": 0.0079, "step": 374610 }, { "epoch": 1.89, "learning_rate": 1.6499084309145303e-05, "loss": 0.0066, "step": 374620 }, { "epoch": 1.89, "learning_rate": 1.649151661613129e-05, "loss": 0.0052, "step": 374630 }, { "epoch": 1.89, "learning_rate": 1.6483948923117283e-05, "loss": 0.0071, "step": 374640 }, { "epoch": 1.89, "learning_rate": 1.647638123010327e-05, "loss": 0.0079, "step": 374650 }, { "epoch": 1.89, "learning_rate": 1.6468813537089263e-05, "loss": 0.0065, "step": 374660 }, { "epoch": 1.89, "learning_rate": 1.646124584407525e-05, "loss": 0.0049, "step": 374670 }, { "epoch": 1.89, "learning_rate": 1.645367815106124e-05, "loss": 0.0061, "step": 374680 }, { "epoch": 1.89, "learning_rate": 1.644611045804723e-05, "loss": 0.005, "step": 374690 }, { "epoch": 1.89, "learning_rate": 1.643854276503322e-05, "loss": 0.0061, "step": 374700 }, { "epoch": 1.89, "learning_rate": 1.643097507201921e-05, "loss": 0.0047, "step": 374710 }, { "epoch": 1.89, "learning_rate": 1.64234073790052e-05, "loss": 0.0055, "step": 374720 }, { "epoch": 1.89, "learning_rate": 1.641583968599119e-05, "loss": 0.0053, "step": 374730 }, { "epoch": 1.89, "learning_rate": 1.640827199297718e-05, "loss": 0.0048, "step": 374740 }, { "epoch": 1.89, "learning_rate": 1.6400704299963167e-05, "loss": 0.0046, "step": 374750 }, { "epoch": 1.89, "learning_rate": 1.639313660694916e-05, "loss": 0.0041, "step": 374760 }, { "epoch": 1.89, "learning_rate": 1.6385568913935147e-05, "loss": 0.0056, "step": 374770 }, { "epoch": 1.89, "learning_rate": 1.637800122092114e-05, "loss": 0.0044, "step": 374780 }, { "epoch": 1.89, "learning_rate": 1.6370433527907127e-05, "loss": 0.0046, "step": 374790 }, { "epoch": 1.89, "learning_rate": 1.636286583489312e-05, "loss": 0.0075, "step": 374800 }, { "epoch": 1.89, "learning_rate": 1.6355298141879107e-05, "loss": 0.006, "step": 374810 }, { "epoch": 1.89, "learning_rate": 1.6347730448865098e-05, "loss": 0.0051, "step": 374820 }, { "epoch": 1.89, "learning_rate": 1.6340162755851086e-05, "loss": 0.0054, "step": 374830 }, { "epoch": 1.89, "learning_rate": 1.6332595062837075e-05, "loss": 0.0064, "step": 374840 }, { "epoch": 1.89, "learning_rate": 1.6325027369823066e-05, "loss": 0.0064, "step": 374850 }, { "epoch": 1.89, "learning_rate": 1.6317459676809054e-05, "loss": 0.007, "step": 374860 }, { "epoch": 1.89, "learning_rate": 1.6309891983795046e-05, "loss": 0.0051, "step": 374870 }, { "epoch": 1.89, "learning_rate": 1.6302324290781034e-05, "loss": 0.005, "step": 374880 }, { "epoch": 1.89, "learning_rate": 1.6294756597767026e-05, "loss": 0.0071, "step": 374890 }, { "epoch": 1.89, "learning_rate": 1.6287188904753014e-05, "loss": 0.0054, "step": 374900 }, { "epoch": 1.89, "learning_rate": 1.6279621211739002e-05, "loss": 0.0075, "step": 374910 }, { "epoch": 1.89, "learning_rate": 1.6272053518724994e-05, "loss": 0.0051, "step": 374920 }, { "epoch": 1.89, "learning_rate": 1.6264485825710982e-05, "loss": 0.0049, "step": 374930 }, { "epoch": 1.89, "learning_rate": 1.6256918132696974e-05, "loss": 0.0071, "step": 374940 }, { "epoch": 1.89, "learning_rate": 1.6249350439682962e-05, "loss": 0.0059, "step": 374950 }, { "epoch": 1.89, "learning_rate": 1.6241782746668954e-05, "loss": 0.005, "step": 374960 }, { "epoch": 1.89, "learning_rate": 1.6234215053654942e-05, "loss": 0.0062, "step": 374970 }, { "epoch": 1.89, "learning_rate": 1.6226647360640933e-05, "loss": 0.0058, "step": 374980 }, { "epoch": 1.89, "learning_rate": 1.621907966762692e-05, "loss": 0.0066, "step": 374990 }, { "epoch": 1.89, "learning_rate": 1.621151197461291e-05, "loss": 0.0035, "step": 375000 }, { "epoch": 1.89, "eval_cer": 0.9144246472852683, "eval_loss": 0.004302851855754852, "eval_runtime": 116.6099, "eval_samples_per_second": 17.151, "eval_steps_per_second": 4.288, "step": 375000 }, { "epoch": 1.89, "learning_rate": 1.62039442815989e-05, "loss": 0.0051, "step": 375010 }, { "epoch": 1.89, "learning_rate": 1.619637658858489e-05, "loss": 0.0057, "step": 375020 }, { "epoch": 1.89, "learning_rate": 1.618880889557088e-05, "loss": 0.0052, "step": 375030 }, { "epoch": 1.89, "learning_rate": 1.618124120255687e-05, "loss": 0.0053, "step": 375040 }, { "epoch": 1.89, "learning_rate": 1.617367350954286e-05, "loss": 0.0054, "step": 375050 }, { "epoch": 1.89, "learning_rate": 1.616610581652885e-05, "loss": 0.0044, "step": 375060 }, { "epoch": 1.89, "learning_rate": 1.6158538123514838e-05, "loss": 0.0039, "step": 375070 }, { "epoch": 1.89, "learning_rate": 1.615097043050083e-05, "loss": 0.0069, "step": 375080 }, { "epoch": 1.89, "learning_rate": 1.6143402737486817e-05, "loss": 0.0047, "step": 375090 }, { "epoch": 1.89, "learning_rate": 1.613583504447281e-05, "loss": 0.0051, "step": 375100 }, { "epoch": 1.89, "learning_rate": 1.6128267351458797e-05, "loss": 0.0064, "step": 375110 }, { "epoch": 1.89, "learning_rate": 1.612069965844479e-05, "loss": 0.0064, "step": 375120 }, { "epoch": 1.89, "learning_rate": 1.6113131965430777e-05, "loss": 0.0069, "step": 375130 }, { "epoch": 1.89, "learning_rate": 1.610556427241677e-05, "loss": 0.0057, "step": 375140 }, { "epoch": 1.89, "learning_rate": 1.6097996579402757e-05, "loss": 0.0064, "step": 375150 }, { "epoch": 1.89, "learning_rate": 1.6090428886388745e-05, "loss": 0.0045, "step": 375160 }, { "epoch": 1.89, "learning_rate": 1.6082861193374737e-05, "loss": 0.0057, "step": 375170 }, { "epoch": 1.89, "learning_rate": 1.6075293500360725e-05, "loss": 0.0056, "step": 375180 }, { "epoch": 1.89, "learning_rate": 1.6067725807346716e-05, "loss": 0.0059, "step": 375190 }, { "epoch": 1.89, "learning_rate": 1.6060158114332705e-05, "loss": 0.004, "step": 375200 }, { "epoch": 1.89, "learning_rate": 1.6052590421318696e-05, "loss": 0.0067, "step": 375210 }, { "epoch": 1.89, "learning_rate": 1.6045022728304685e-05, "loss": 0.0041, "step": 375220 }, { "epoch": 1.89, "learning_rate": 1.6037455035290673e-05, "loss": 0.0059, "step": 375230 }, { "epoch": 1.89, "learning_rate": 1.6029887342276664e-05, "loss": 0.0071, "step": 375240 }, { "epoch": 1.89, "learning_rate": 1.6022319649262653e-05, "loss": 0.0047, "step": 375250 }, { "epoch": 1.89, "learning_rate": 1.6014751956248644e-05, "loss": 0.0063, "step": 375260 }, { "epoch": 1.89, "learning_rate": 1.6007184263234632e-05, "loss": 0.0051, "step": 375270 }, { "epoch": 1.89, "learning_rate": 1.5999616570220624e-05, "loss": 0.0044, "step": 375280 }, { "epoch": 1.89, "learning_rate": 1.5992048877206612e-05, "loss": 0.0046, "step": 375290 }, { "epoch": 1.89, "learning_rate": 1.59844811841926e-05, "loss": 0.0056, "step": 375300 }, { "epoch": 1.89, "learning_rate": 1.5976913491178592e-05, "loss": 0.0068, "step": 375310 }, { "epoch": 1.89, "learning_rate": 1.596934579816458e-05, "loss": 0.0062, "step": 375320 }, { "epoch": 1.89, "learning_rate": 1.5961778105150572e-05, "loss": 0.006, "step": 375330 }, { "epoch": 1.89, "learning_rate": 1.595421041213656e-05, "loss": 0.0062, "step": 375340 }, { "epoch": 1.89, "learning_rate": 1.594664271912255e-05, "loss": 0.0052, "step": 375350 }, { "epoch": 1.89, "learning_rate": 1.593907502610854e-05, "loss": 0.0079, "step": 375360 }, { "epoch": 1.89, "learning_rate": 1.593150733309453e-05, "loss": 0.0071, "step": 375370 }, { "epoch": 1.89, "learning_rate": 1.5923939640080516e-05, "loss": 0.0059, "step": 375380 }, { "epoch": 1.89, "learning_rate": 1.5916371947066508e-05, "loss": 0.0042, "step": 375390 }, { "epoch": 1.89, "learning_rate": 1.5908804254052496e-05, "loss": 0.0058, "step": 375400 }, { "epoch": 1.89, "learning_rate": 1.5901236561038488e-05, "loss": 0.0061, "step": 375410 }, { "epoch": 1.89, "learning_rate": 1.5893668868024476e-05, "loss": 0.0058, "step": 375420 }, { "epoch": 1.89, "learning_rate": 1.5886101175010468e-05, "loss": 0.0049, "step": 375430 }, { "epoch": 1.89, "learning_rate": 1.587853348199646e-05, "loss": 0.0052, "step": 375440 }, { "epoch": 1.89, "learning_rate": 1.5870965788982447e-05, "loss": 0.0041, "step": 375450 }, { "epoch": 1.89, "learning_rate": 1.5863398095968436e-05, "loss": 0.0063, "step": 375460 }, { "epoch": 1.89, "learning_rate": 1.5855830402954424e-05, "loss": 0.005, "step": 375470 }, { "epoch": 1.89, "learning_rate": 1.5848262709940415e-05, "loss": 0.0061, "step": 375480 }, { "epoch": 1.89, "learning_rate": 1.5840695016926404e-05, "loss": 0.0067, "step": 375490 }, { "epoch": 1.89, "learning_rate": 1.5833127323912395e-05, "loss": 0.0048, "step": 375500 }, { "epoch": 1.89, "learning_rate": 1.5825559630898384e-05, "loss": 0.0054, "step": 375510 }, { "epoch": 1.89, "learning_rate": 1.5817991937884375e-05, "loss": 0.0052, "step": 375520 }, { "epoch": 1.89, "learning_rate": 1.5810424244870363e-05, "loss": 0.0053, "step": 375530 }, { "epoch": 1.89, "learning_rate": 1.580285655185635e-05, "loss": 0.0062, "step": 375540 }, { "epoch": 1.89, "learning_rate": 1.5795288858842343e-05, "loss": 0.0054, "step": 375550 }, { "epoch": 1.89, "learning_rate": 1.578772116582833e-05, "loss": 0.0073, "step": 375560 }, { "epoch": 1.89, "learning_rate": 1.5780153472814323e-05, "loss": 0.0057, "step": 375570 }, { "epoch": 1.89, "learning_rate": 1.577258577980031e-05, "loss": 0.0052, "step": 375580 }, { "epoch": 1.89, "learning_rate": 1.5765018086786303e-05, "loss": 0.004, "step": 375590 }, { "epoch": 1.89, "learning_rate": 1.575745039377229e-05, "loss": 0.0067, "step": 375600 }, { "epoch": 1.89, "learning_rate": 1.5749882700758283e-05, "loss": 0.0062, "step": 375610 }, { "epoch": 1.9, "learning_rate": 1.574231500774427e-05, "loss": 0.0053, "step": 375620 }, { "epoch": 1.9, "learning_rate": 1.573474731473026e-05, "loss": 0.0049, "step": 375630 }, { "epoch": 1.9, "learning_rate": 1.572717962171625e-05, "loss": 0.0058, "step": 375640 }, { "epoch": 1.9, "learning_rate": 1.571961192870224e-05, "loss": 0.005, "step": 375650 }, { "epoch": 1.9, "learning_rate": 1.571204423568823e-05, "loss": 0.0058, "step": 375660 }, { "epoch": 1.9, "learning_rate": 1.570447654267422e-05, "loss": 0.0064, "step": 375670 }, { "epoch": 1.9, "learning_rate": 1.569690884966021e-05, "loss": 0.0066, "step": 375680 }, { "epoch": 1.9, "learning_rate": 1.56893411566462e-05, "loss": 0.0049, "step": 375690 }, { "epoch": 1.9, "learning_rate": 1.5681773463632187e-05, "loss": 0.0051, "step": 375700 }, { "epoch": 1.9, "learning_rate": 1.567420577061818e-05, "loss": 0.0056, "step": 375710 }, { "epoch": 1.9, "learning_rate": 1.5666638077604167e-05, "loss": 0.0035, "step": 375720 }, { "epoch": 1.9, "learning_rate": 1.5659070384590158e-05, "loss": 0.0052, "step": 375730 }, { "epoch": 1.9, "learning_rate": 1.5651502691576146e-05, "loss": 0.0059, "step": 375740 }, { "epoch": 1.9, "learning_rate": 1.5643934998562138e-05, "loss": 0.0076, "step": 375750 }, { "epoch": 1.9, "learning_rate": 1.5636367305548126e-05, "loss": 0.0041, "step": 375760 }, { "epoch": 1.9, "learning_rate": 1.5628799612534114e-05, "loss": 0.0043, "step": 375770 }, { "epoch": 1.9, "learning_rate": 1.5621231919520106e-05, "loss": 0.0064, "step": 375780 }, { "epoch": 1.9, "learning_rate": 1.5613664226506094e-05, "loss": 0.0046, "step": 375790 }, { "epoch": 1.9, "learning_rate": 1.5606096533492086e-05, "loss": 0.0054, "step": 375800 }, { "epoch": 1.9, "learning_rate": 1.5598528840478074e-05, "loss": 0.0068, "step": 375810 }, { "epoch": 1.9, "learning_rate": 1.5590961147464066e-05, "loss": 0.0063, "step": 375820 }, { "epoch": 1.9, "learning_rate": 1.5583393454450054e-05, "loss": 0.0072, "step": 375830 }, { "epoch": 1.9, "learning_rate": 1.5575825761436046e-05, "loss": 0.0037, "step": 375840 }, { "epoch": 1.9, "learning_rate": 1.5568258068422034e-05, "loss": 0.0055, "step": 375850 }, { "epoch": 1.9, "learning_rate": 1.5560690375408022e-05, "loss": 0.0044, "step": 375860 }, { "epoch": 1.9, "learning_rate": 1.5553122682394014e-05, "loss": 0.0048, "step": 375870 }, { "epoch": 1.9, "learning_rate": 1.5545554989380002e-05, "loss": 0.0044, "step": 375880 }, { "epoch": 1.9, "learning_rate": 1.5537987296365993e-05, "loss": 0.0063, "step": 375890 }, { "epoch": 1.9, "learning_rate": 1.553041960335198e-05, "loss": 0.0047, "step": 375900 }, { "epoch": 1.9, "learning_rate": 1.5522851910337973e-05, "loss": 0.0063, "step": 375910 }, { "epoch": 1.9, "learning_rate": 1.551528421732396e-05, "loss": 0.0056, "step": 375920 }, { "epoch": 1.9, "learning_rate": 1.550771652430995e-05, "loss": 0.0064, "step": 375930 }, { "epoch": 1.9, "learning_rate": 1.550014883129594e-05, "loss": 0.0052, "step": 375940 }, { "epoch": 1.9, "learning_rate": 1.549258113828193e-05, "loss": 0.0049, "step": 375950 }, { "epoch": 1.9, "learning_rate": 1.548501344526792e-05, "loss": 0.005, "step": 375960 }, { "epoch": 1.9, "learning_rate": 1.547744575225391e-05, "loss": 0.0057, "step": 375970 }, { "epoch": 1.9, "learning_rate": 1.54698780592399e-05, "loss": 0.0068, "step": 375980 }, { "epoch": 1.9, "learning_rate": 1.546231036622589e-05, "loss": 0.0051, "step": 375990 }, { "epoch": 1.9, "learning_rate": 1.545474267321188e-05, "loss": 0.007, "step": 376000 }, { "epoch": 1.9, "eval_cer": 0.9144372624348985, "eval_loss": 0.00426588486880064, "eval_runtime": 116.7025, "eval_samples_per_second": 17.138, "eval_steps_per_second": 4.284, "step": 376000 }, { "epoch": 1.9, "learning_rate": 1.544717498019787e-05, "loss": 0.0051, "step": 376010 }, { "epoch": 1.9, "learning_rate": 1.5439607287183857e-05, "loss": 0.0062, "step": 376020 }, { "epoch": 1.9, "learning_rate": 1.543203959416985e-05, "loss": 0.007, "step": 376030 }, { "epoch": 1.9, "learning_rate": 1.5424471901155837e-05, "loss": 0.0059, "step": 376040 }, { "epoch": 1.9, "learning_rate": 1.541690420814183e-05, "loss": 0.0052, "step": 376050 }, { "epoch": 1.9, "learning_rate": 1.5409336515127817e-05, "loss": 0.0059, "step": 376060 }, { "epoch": 1.9, "learning_rate": 1.540176882211381e-05, "loss": 0.0059, "step": 376070 }, { "epoch": 1.9, "learning_rate": 1.5394201129099797e-05, "loss": 0.0055, "step": 376080 }, { "epoch": 1.9, "learning_rate": 1.5386633436085785e-05, "loss": 0.0061, "step": 376090 }, { "epoch": 1.9, "learning_rate": 1.5379065743071777e-05, "loss": 0.0052, "step": 376100 }, { "epoch": 1.9, "learning_rate": 1.5371498050057765e-05, "loss": 0.0053, "step": 376110 }, { "epoch": 1.9, "learning_rate": 1.5363930357043756e-05, "loss": 0.0046, "step": 376120 }, { "epoch": 1.9, "learning_rate": 1.5356362664029745e-05, "loss": 0.0064, "step": 376130 }, { "epoch": 1.9, "learning_rate": 1.5348794971015736e-05, "loss": 0.0044, "step": 376140 }, { "epoch": 1.9, "learning_rate": 1.5341227278001724e-05, "loss": 0.0044, "step": 376150 }, { "epoch": 1.9, "learning_rate": 1.5333659584987716e-05, "loss": 0.0042, "step": 376160 }, { "epoch": 1.9, "learning_rate": 1.5326091891973704e-05, "loss": 0.0039, "step": 376170 }, { "epoch": 1.9, "learning_rate": 1.5318524198959692e-05, "loss": 0.0047, "step": 376180 }, { "epoch": 1.9, "learning_rate": 1.5310956505945684e-05, "loss": 0.0049, "step": 376190 }, { "epoch": 1.9, "learning_rate": 1.5303388812931672e-05, "loss": 0.0053, "step": 376200 }, { "epoch": 1.9, "learning_rate": 1.5295821119917664e-05, "loss": 0.0056, "step": 376210 }, { "epoch": 1.9, "learning_rate": 1.5288253426903652e-05, "loss": 0.0061, "step": 376220 }, { "epoch": 1.9, "learning_rate": 1.5280685733889644e-05, "loss": 0.0065, "step": 376230 }, { "epoch": 1.9, "learning_rate": 1.5273118040875632e-05, "loss": 0.0102, "step": 376240 }, { "epoch": 1.9, "learning_rate": 1.526555034786162e-05, "loss": 0.0057, "step": 376250 }, { "epoch": 1.9, "learning_rate": 1.525798265484761e-05, "loss": 0.0055, "step": 376260 }, { "epoch": 1.9, "learning_rate": 1.52504149618336e-05, "loss": 0.005, "step": 376270 }, { "epoch": 1.9, "learning_rate": 1.524284726881959e-05, "loss": 0.0069, "step": 376280 }, { "epoch": 1.9, "learning_rate": 1.523527957580558e-05, "loss": 0.0043, "step": 376290 }, { "epoch": 1.9, "learning_rate": 1.522771188279157e-05, "loss": 0.0059, "step": 376300 }, { "epoch": 1.9, "learning_rate": 1.522014418977756e-05, "loss": 0.0059, "step": 376310 }, { "epoch": 1.9, "learning_rate": 1.5212576496763548e-05, "loss": 0.0053, "step": 376320 }, { "epoch": 1.9, "learning_rate": 1.5205008803749538e-05, "loss": 0.0053, "step": 376330 }, { "epoch": 1.9, "learning_rate": 1.5197441110735528e-05, "loss": 0.0055, "step": 376340 }, { "epoch": 1.9, "learning_rate": 1.5189873417721518e-05, "loss": 0.0096, "step": 376350 }, { "epoch": 1.9, "learning_rate": 1.5182305724707507e-05, "loss": 0.0047, "step": 376360 }, { "epoch": 1.9, "learning_rate": 1.5174738031693497e-05, "loss": 0.0077, "step": 376370 }, { "epoch": 1.9, "learning_rate": 1.5167170338679487e-05, "loss": 0.0059, "step": 376380 }, { "epoch": 1.9, "learning_rate": 1.5159602645665477e-05, "loss": 0.0048, "step": 376390 }, { "epoch": 1.9, "learning_rate": 1.5152034952651465e-05, "loss": 0.0047, "step": 376400 }, { "epoch": 1.9, "learning_rate": 1.5144467259637455e-05, "loss": 0.0052, "step": 376410 }, { "epoch": 1.9, "learning_rate": 1.5136899566623445e-05, "loss": 0.0065, "step": 376420 }, { "epoch": 1.9, "learning_rate": 1.5129331873609435e-05, "loss": 0.0057, "step": 376430 }, { "epoch": 1.9, "learning_rate": 1.5121764180595425e-05, "loss": 0.0065, "step": 376440 }, { "epoch": 1.9, "learning_rate": 1.5114196487581415e-05, "loss": 0.0052, "step": 376450 }, { "epoch": 1.9, "learning_rate": 1.5106628794567405e-05, "loss": 0.0064, "step": 376460 }, { "epoch": 1.9, "learning_rate": 1.5099061101553395e-05, "loss": 0.0043, "step": 376470 }, { "epoch": 1.9, "learning_rate": 1.5091493408539383e-05, "loss": 0.0062, "step": 376480 }, { "epoch": 1.9, "learning_rate": 1.5083925715525373e-05, "loss": 0.0058, "step": 376490 }, { "epoch": 1.9, "learning_rate": 1.5076358022511363e-05, "loss": 0.0042, "step": 376500 }, { "epoch": 1.9, "learning_rate": 1.5068790329497353e-05, "loss": 0.0052, "step": 376510 }, { "epoch": 1.9, "learning_rate": 1.5061222636483343e-05, "loss": 0.0057, "step": 376520 }, { "epoch": 1.9, "learning_rate": 1.5053654943469333e-05, "loss": 0.0062, "step": 376530 }, { "epoch": 1.9, "learning_rate": 1.5046087250455323e-05, "loss": 0.0065, "step": 376540 }, { "epoch": 1.9, "learning_rate": 1.5038519557441312e-05, "loss": 0.0051, "step": 376550 }, { "epoch": 1.9, "learning_rate": 1.50309518644273e-05, "loss": 0.005, "step": 376560 }, { "epoch": 1.9, "learning_rate": 1.502338417141329e-05, "loss": 0.0055, "step": 376570 }, { "epoch": 1.9, "learning_rate": 1.501581647839928e-05, "loss": 0.0056, "step": 376580 }, { "epoch": 1.9, "learning_rate": 1.500824878538527e-05, "loss": 0.004, "step": 376590 }, { "epoch": 1.9, "learning_rate": 1.500068109237126e-05, "loss": 0.0054, "step": 376600 }, { "epoch": 1.9, "learning_rate": 1.499311339935725e-05, "loss": 0.0044, "step": 376610 }, { "epoch": 1.9, "learning_rate": 1.498554570634324e-05, "loss": 0.0058, "step": 376620 }, { "epoch": 1.9, "learning_rate": 1.497797801332923e-05, "loss": 0.0052, "step": 376630 }, { "epoch": 1.9, "learning_rate": 1.4970410320315218e-05, "loss": 0.0049, "step": 376640 }, { "epoch": 1.9, "learning_rate": 1.4962842627301208e-05, "loss": 0.0058, "step": 376650 }, { "epoch": 1.9, "learning_rate": 1.4955274934287198e-05, "loss": 0.0054, "step": 376660 }, { "epoch": 1.9, "learning_rate": 1.4947707241273188e-05, "loss": 0.0058, "step": 376670 }, { "epoch": 1.9, "learning_rate": 1.4940139548259178e-05, "loss": 0.0055, "step": 376680 }, { "epoch": 1.9, "learning_rate": 1.4932571855245168e-05, "loss": 0.0069, "step": 376690 }, { "epoch": 1.9, "learning_rate": 1.4925004162231158e-05, "loss": 0.0054, "step": 376700 }, { "epoch": 1.9, "learning_rate": 1.4917436469217148e-05, "loss": 0.0048, "step": 376710 }, { "epoch": 1.9, "learning_rate": 1.4909868776203134e-05, "loss": 0.0048, "step": 376720 }, { "epoch": 1.9, "learning_rate": 1.4902301083189124e-05, "loss": 0.0055, "step": 376730 }, { "epoch": 1.9, "learning_rate": 1.4894733390175114e-05, "loss": 0.0057, "step": 376740 }, { "epoch": 1.9, "learning_rate": 1.4887165697161104e-05, "loss": 0.005, "step": 376750 }, { "epoch": 1.9, "learning_rate": 1.4879598004147096e-05, "loss": 0.0063, "step": 376760 }, { "epoch": 1.9, "learning_rate": 1.4872030311133085e-05, "loss": 0.0076, "step": 376770 }, { "epoch": 1.9, "learning_rate": 1.4864462618119075e-05, "loss": 0.0053, "step": 376780 }, { "epoch": 1.9, "learning_rate": 1.4856894925105065e-05, "loss": 0.0055, "step": 376790 }, { "epoch": 1.9, "learning_rate": 1.4849327232091052e-05, "loss": 0.0052, "step": 376800 }, { "epoch": 1.9, "learning_rate": 1.4841759539077042e-05, "loss": 0.0058, "step": 376810 }, { "epoch": 1.9, "learning_rate": 1.4834191846063032e-05, "loss": 0.005, "step": 376820 }, { "epoch": 1.9, "learning_rate": 1.4826624153049022e-05, "loss": 0.008, "step": 376830 }, { "epoch": 1.9, "learning_rate": 1.4819056460035011e-05, "loss": 0.0047, "step": 376840 }, { "epoch": 1.9, "learning_rate": 1.4811488767021001e-05, "loss": 0.0055, "step": 376850 }, { "epoch": 1.9, "learning_rate": 1.4803921074006991e-05, "loss": 0.0083, "step": 376860 }, { "epoch": 1.9, "learning_rate": 1.479635338099298e-05, "loss": 0.0069, "step": 376870 }, { "epoch": 1.9, "learning_rate": 1.478878568797897e-05, "loss": 0.0048, "step": 376880 }, { "epoch": 1.9, "learning_rate": 1.478121799496496e-05, "loss": 0.006, "step": 376890 }, { "epoch": 1.9, "learning_rate": 1.477365030195095e-05, "loss": 0.0044, "step": 376900 }, { "epoch": 1.9, "learning_rate": 1.4766082608936939e-05, "loss": 0.0079, "step": 376910 }, { "epoch": 1.9, "learning_rate": 1.4758514915922929e-05, "loss": 0.0053, "step": 376920 }, { "epoch": 1.9, "learning_rate": 1.4750947222908919e-05, "loss": 0.0064, "step": 376930 }, { "epoch": 1.9, "learning_rate": 1.4743379529894909e-05, "loss": 0.0052, "step": 376940 }, { "epoch": 1.9, "learning_rate": 1.4735811836880897e-05, "loss": 0.0055, "step": 376950 }, { "epoch": 1.9, "learning_rate": 1.4728244143866887e-05, "loss": 0.0059, "step": 376960 }, { "epoch": 1.9, "learning_rate": 1.4720676450852877e-05, "loss": 0.0049, "step": 376970 }, { "epoch": 1.9, "learning_rate": 1.4713108757838867e-05, "loss": 0.005, "step": 376980 }, { "epoch": 1.9, "learning_rate": 1.4705541064824857e-05, "loss": 0.0065, "step": 376990 }, { "epoch": 1.9, "learning_rate": 1.4697973371810847e-05, "loss": 0.0067, "step": 377000 }, { "epoch": 1.9, "eval_cer": 0.914438232831024, "eval_loss": 0.004278304520994425, "eval_runtime": 116.1202, "eval_samples_per_second": 17.224, "eval_steps_per_second": 4.306, "step": 377000 }, { "epoch": 1.9, "learning_rate": 1.4690405678796837e-05, "loss": 0.0054, "step": 377010 }, { "epoch": 1.9, "learning_rate": 1.4682837985782826e-05, "loss": 0.0067, "step": 377020 }, { "epoch": 1.9, "learning_rate": 1.4675270292768815e-05, "loss": 0.0035, "step": 377030 }, { "epoch": 1.9, "learning_rate": 1.4667702599754805e-05, "loss": 0.0054, "step": 377040 }, { "epoch": 1.9, "learning_rate": 1.4660134906740795e-05, "loss": 0.0046, "step": 377050 }, { "epoch": 1.9, "learning_rate": 1.4652567213726784e-05, "loss": 0.0062, "step": 377060 }, { "epoch": 1.9, "learning_rate": 1.4644999520712774e-05, "loss": 0.0048, "step": 377070 }, { "epoch": 1.9, "learning_rate": 1.4637431827698764e-05, "loss": 0.0047, "step": 377080 }, { "epoch": 1.9, "learning_rate": 1.4629864134684754e-05, "loss": 0.0055, "step": 377090 }, { "epoch": 1.9, "learning_rate": 1.4622296441670744e-05, "loss": 0.0066, "step": 377100 }, { "epoch": 1.9, "learning_rate": 1.4614728748656732e-05, "loss": 0.005, "step": 377110 }, { "epoch": 1.9, "learning_rate": 1.4607161055642722e-05, "loss": 0.0054, "step": 377120 }, { "epoch": 1.9, "learning_rate": 1.4599593362628712e-05, "loss": 0.0084, "step": 377130 }, { "epoch": 1.9, "learning_rate": 1.4592025669614702e-05, "loss": 0.0059, "step": 377140 }, { "epoch": 1.9, "learning_rate": 1.4584457976600692e-05, "loss": 0.0052, "step": 377150 }, { "epoch": 1.9, "learning_rate": 1.4576890283586682e-05, "loss": 0.0065, "step": 377160 }, { "epoch": 1.9, "learning_rate": 1.4569322590572672e-05, "loss": 0.0059, "step": 377170 }, { "epoch": 1.9, "learning_rate": 1.4561754897558662e-05, "loss": 0.0045, "step": 377180 }, { "epoch": 1.9, "learning_rate": 1.455418720454465e-05, "loss": 0.0083, "step": 377190 }, { "epoch": 1.9, "learning_rate": 1.454661951153064e-05, "loss": 0.007, "step": 377200 }, { "epoch": 1.9, "learning_rate": 1.453905181851663e-05, "loss": 0.0055, "step": 377210 }, { "epoch": 1.9, "learning_rate": 1.453148412550262e-05, "loss": 0.0081, "step": 377220 }, { "epoch": 1.9, "learning_rate": 1.452391643248861e-05, "loss": 0.0065, "step": 377230 }, { "epoch": 1.9, "learning_rate": 1.45163487394746e-05, "loss": 0.0076, "step": 377240 }, { "epoch": 1.9, "learning_rate": 1.450878104646059e-05, "loss": 0.0056, "step": 377250 }, { "epoch": 1.9, "learning_rate": 1.450121335344658e-05, "loss": 0.0068, "step": 377260 }, { "epoch": 1.9, "learning_rate": 1.4493645660432568e-05, "loss": 0.0073, "step": 377270 }, { "epoch": 1.9, "learning_rate": 1.4486077967418557e-05, "loss": 0.0083, "step": 377280 }, { "epoch": 1.9, "learning_rate": 1.4478510274404547e-05, "loss": 0.0058, "step": 377290 }, { "epoch": 1.9, "learning_rate": 1.4470942581390537e-05, "loss": 0.0064, "step": 377300 }, { "epoch": 1.9, "learning_rate": 1.4463374888376527e-05, "loss": 0.0052, "step": 377310 }, { "epoch": 1.9, "learning_rate": 1.4455807195362517e-05, "loss": 0.006, "step": 377320 }, { "epoch": 1.9, "learning_rate": 1.4448239502348507e-05, "loss": 0.0077, "step": 377330 }, { "epoch": 1.9, "learning_rate": 1.4440671809334497e-05, "loss": 0.0063, "step": 377340 }, { "epoch": 1.9, "learning_rate": 1.4433104116320485e-05, "loss": 0.0042, "step": 377350 }, { "epoch": 1.9, "learning_rate": 1.4425536423306475e-05, "loss": 0.0047, "step": 377360 }, { "epoch": 1.9, "learning_rate": 1.4417968730292465e-05, "loss": 0.0038, "step": 377370 }, { "epoch": 1.9, "learning_rate": 1.4410401037278455e-05, "loss": 0.0051, "step": 377380 }, { "epoch": 1.9, "learning_rate": 1.4402833344264445e-05, "loss": 0.0039, "step": 377390 }, { "epoch": 1.9, "learning_rate": 1.4395265651250435e-05, "loss": 0.0038, "step": 377400 }, { "epoch": 1.9, "learning_rate": 1.4387697958236425e-05, "loss": 0.0047, "step": 377410 }, { "epoch": 1.9, "learning_rate": 1.4380130265222413e-05, "loss": 0.006, "step": 377420 }, { "epoch": 1.9, "learning_rate": 1.4372562572208403e-05, "loss": 0.0039, "step": 377430 }, { "epoch": 1.9, "learning_rate": 1.4364994879194393e-05, "loss": 0.0058, "step": 377440 }, { "epoch": 1.9, "learning_rate": 1.4357427186180383e-05, "loss": 0.0046, "step": 377450 }, { "epoch": 1.9, "learning_rate": 1.4349859493166372e-05, "loss": 0.0064, "step": 377460 }, { "epoch": 1.9, "learning_rate": 1.4342291800152362e-05, "loss": 0.0051, "step": 377470 }, { "epoch": 1.9, "learning_rate": 1.4334724107138352e-05, "loss": 0.0056, "step": 377480 }, { "epoch": 1.9, "learning_rate": 1.4327156414124342e-05, "loss": 0.0068, "step": 377490 }, { "epoch": 1.9, "learning_rate": 1.431958872111033e-05, "loss": 0.0058, "step": 377500 }, { "epoch": 1.9, "learning_rate": 1.431202102809632e-05, "loss": 0.0063, "step": 377510 }, { "epoch": 1.9, "learning_rate": 1.430445333508231e-05, "loss": 0.0049, "step": 377520 }, { "epoch": 1.9, "learning_rate": 1.42968856420683e-05, "loss": 0.0058, "step": 377530 }, { "epoch": 1.9, "learning_rate": 1.428931794905429e-05, "loss": 0.0053, "step": 377540 }, { "epoch": 1.9, "learning_rate": 1.428175025604028e-05, "loss": 0.0036, "step": 377550 }, { "epoch": 1.9, "learning_rate": 1.427418256302627e-05, "loss": 0.006, "step": 377560 }, { "epoch": 1.9, "learning_rate": 1.426661487001226e-05, "loss": 0.007, "step": 377570 }, { "epoch": 1.9, "learning_rate": 1.4259047176998246e-05, "loss": 0.0068, "step": 377580 }, { "epoch": 1.9, "learning_rate": 1.4251479483984236e-05, "loss": 0.0052, "step": 377590 }, { "epoch": 1.91, "learning_rate": 1.4243911790970228e-05, "loss": 0.0048, "step": 377600 }, { "epoch": 1.91, "learning_rate": 1.4236344097956218e-05, "loss": 0.0057, "step": 377610 }, { "epoch": 1.91, "learning_rate": 1.4228776404942208e-05, "loss": 0.0043, "step": 377620 }, { "epoch": 1.91, "learning_rate": 1.4221208711928198e-05, "loss": 0.0073, "step": 377630 }, { "epoch": 1.91, "learning_rate": 1.4213641018914188e-05, "loss": 0.0061, "step": 377640 }, { "epoch": 1.91, "learning_rate": 1.4206073325900177e-05, "loss": 0.0057, "step": 377650 }, { "epoch": 1.91, "learning_rate": 1.4198505632886164e-05, "loss": 0.005, "step": 377660 }, { "epoch": 1.91, "learning_rate": 1.4190937939872154e-05, "loss": 0.0076, "step": 377670 }, { "epoch": 1.91, "learning_rate": 1.4183370246858144e-05, "loss": 0.0052, "step": 377680 }, { "epoch": 1.91, "learning_rate": 1.4175802553844134e-05, "loss": 0.0049, "step": 377690 }, { "epoch": 1.91, "learning_rate": 1.4168234860830124e-05, "loss": 0.0046, "step": 377700 }, { "epoch": 1.91, "learning_rate": 1.4160667167816114e-05, "loss": 0.0049, "step": 377710 }, { "epoch": 1.91, "learning_rate": 1.4153099474802103e-05, "loss": 0.0055, "step": 377720 }, { "epoch": 1.91, "learning_rate": 1.4145531781788095e-05, "loss": 0.0061, "step": 377730 }, { "epoch": 1.91, "learning_rate": 1.4137964088774082e-05, "loss": 0.0067, "step": 377740 }, { "epoch": 1.91, "learning_rate": 1.4130396395760071e-05, "loss": 0.0042, "step": 377750 }, { "epoch": 1.91, "learning_rate": 1.4122828702746061e-05, "loss": 0.0064, "step": 377760 }, { "epoch": 1.91, "learning_rate": 1.4115261009732051e-05, "loss": 0.0064, "step": 377770 }, { "epoch": 1.91, "learning_rate": 1.4107693316718041e-05, "loss": 0.0043, "step": 377780 }, { "epoch": 1.91, "learning_rate": 1.4100125623704031e-05, "loss": 0.0062, "step": 377790 }, { "epoch": 1.91, "learning_rate": 1.4092557930690021e-05, "loss": 0.0046, "step": 377800 }, { "epoch": 1.91, "learning_rate": 1.4084990237676011e-05, "loss": 0.0038, "step": 377810 }, { "epoch": 1.91, "learning_rate": 1.4077422544662e-05, "loss": 0.0044, "step": 377820 }, { "epoch": 1.91, "learning_rate": 1.4069854851647989e-05, "loss": 0.0046, "step": 377830 }, { "epoch": 1.91, "learning_rate": 1.4062287158633979e-05, "loss": 0.0045, "step": 377840 }, { "epoch": 1.91, "learning_rate": 1.4054719465619969e-05, "loss": 0.0054, "step": 377850 }, { "epoch": 1.91, "learning_rate": 1.4047151772605959e-05, "loss": 0.0057, "step": 377860 }, { "epoch": 1.91, "learning_rate": 1.4039584079591949e-05, "loss": 0.0057, "step": 377870 }, { "epoch": 1.91, "learning_rate": 1.4032016386577939e-05, "loss": 0.0059, "step": 377880 }, { "epoch": 1.91, "learning_rate": 1.4024448693563929e-05, "loss": 0.0071, "step": 377890 }, { "epoch": 1.91, "learning_rate": 1.4016881000549917e-05, "loss": 0.0063, "step": 377900 }, { "epoch": 1.91, "learning_rate": 1.4009313307535907e-05, "loss": 0.006, "step": 377910 }, { "epoch": 1.91, "learning_rate": 1.4001745614521897e-05, "loss": 0.0038, "step": 377920 }, { "epoch": 1.91, "learning_rate": 1.3994177921507887e-05, "loss": 0.0055, "step": 377930 }, { "epoch": 1.91, "learning_rate": 1.3986610228493876e-05, "loss": 0.0048, "step": 377940 }, { "epoch": 1.91, "learning_rate": 1.3979042535479866e-05, "loss": 0.0058, "step": 377950 }, { "epoch": 1.91, "learning_rate": 1.3971474842465856e-05, "loss": 0.0068, "step": 377960 }, { "epoch": 1.91, "learning_rate": 1.3963907149451844e-05, "loss": 0.006, "step": 377970 }, { "epoch": 1.91, "learning_rate": 1.3956339456437834e-05, "loss": 0.0067, "step": 377980 }, { "epoch": 1.91, "learning_rate": 1.3948771763423824e-05, "loss": 0.0065, "step": 377990 }, { "epoch": 1.91, "learning_rate": 1.3941204070409814e-05, "loss": 0.0045, "step": 378000 }, { "epoch": 1.91, "eval_cer": 0.9144217360968921, "eval_loss": 0.004249492194503546, "eval_runtime": 116.3497, "eval_samples_per_second": 17.19, "eval_steps_per_second": 4.297, "step": 378000 }, { "epoch": 1.91, "learning_rate": 1.3933636377395804e-05, "loss": 0.0053, "step": 378010 }, { "epoch": 1.91, "learning_rate": 1.3926068684381794e-05, "loss": 0.0053, "step": 378020 }, { "epoch": 1.91, "learning_rate": 1.3918500991367784e-05, "loss": 0.0052, "step": 378030 }, { "epoch": 1.91, "learning_rate": 1.3910933298353774e-05, "loss": 0.0063, "step": 378040 }, { "epoch": 1.91, "learning_rate": 1.3903365605339762e-05, "loss": 0.0061, "step": 378050 }, { "epoch": 1.91, "learning_rate": 1.3895797912325752e-05, "loss": 0.0051, "step": 378060 }, { "epoch": 1.91, "learning_rate": 1.3888230219311742e-05, "loss": 0.0091, "step": 378070 }, { "epoch": 1.91, "learning_rate": 1.3880662526297732e-05, "loss": 0.0054, "step": 378080 }, { "epoch": 1.91, "learning_rate": 1.3873094833283722e-05, "loss": 0.0048, "step": 378090 }, { "epoch": 1.91, "learning_rate": 1.3865527140269712e-05, "loss": 0.005, "step": 378100 }, { "epoch": 1.91, "learning_rate": 1.3857959447255702e-05, "loss": 0.007, "step": 378110 }, { "epoch": 1.91, "learning_rate": 1.3850391754241691e-05, "loss": 0.0059, "step": 378120 }, { "epoch": 1.91, "learning_rate": 1.384282406122768e-05, "loss": 0.0046, "step": 378130 }, { "epoch": 1.91, "learning_rate": 1.383525636821367e-05, "loss": 0.0055, "step": 378140 }, { "epoch": 1.91, "learning_rate": 1.382768867519966e-05, "loss": 0.0052, "step": 378150 }, { "epoch": 1.91, "learning_rate": 1.382012098218565e-05, "loss": 0.0064, "step": 378160 }, { "epoch": 1.91, "learning_rate": 1.381255328917164e-05, "loss": 0.0058, "step": 378170 }, { "epoch": 1.91, "learning_rate": 1.380498559615763e-05, "loss": 0.0061, "step": 378180 }, { "epoch": 1.91, "learning_rate": 1.379741790314362e-05, "loss": 0.0079, "step": 378190 }, { "epoch": 1.91, "learning_rate": 1.3789850210129609e-05, "loss": 0.0046, "step": 378200 }, { "epoch": 1.91, "learning_rate": 1.3782282517115597e-05, "loss": 0.0043, "step": 378210 }, { "epoch": 1.91, "learning_rate": 1.3774714824101587e-05, "loss": 0.0049, "step": 378220 }, { "epoch": 1.91, "learning_rate": 1.3767147131087577e-05, "loss": 0.0052, "step": 378230 }, { "epoch": 1.91, "learning_rate": 1.3759579438073567e-05, "loss": 0.0072, "step": 378240 }, { "epoch": 1.91, "learning_rate": 1.3752011745059557e-05, "loss": 0.0067, "step": 378250 }, { "epoch": 1.91, "learning_rate": 1.3744444052045547e-05, "loss": 0.0071, "step": 378260 }, { "epoch": 1.91, "learning_rate": 1.3736876359031537e-05, "loss": 0.0061, "step": 378270 }, { "epoch": 1.91, "learning_rate": 1.3729308666017527e-05, "loss": 0.0069, "step": 378280 }, { "epoch": 1.91, "learning_rate": 1.3721740973003515e-05, "loss": 0.0057, "step": 378290 }, { "epoch": 1.91, "learning_rate": 1.3714173279989505e-05, "loss": 0.0077, "step": 378300 }, { "epoch": 1.91, "learning_rate": 1.3706605586975495e-05, "loss": 0.0059, "step": 378310 }, { "epoch": 1.91, "learning_rate": 1.3699037893961485e-05, "loss": 0.0059, "step": 378320 }, { "epoch": 1.91, "learning_rate": 1.3691470200947475e-05, "loss": 0.0078, "step": 378330 }, { "epoch": 1.91, "learning_rate": 1.3683902507933464e-05, "loss": 0.0047, "step": 378340 }, { "epoch": 1.91, "learning_rate": 1.3676334814919454e-05, "loss": 0.0055, "step": 378350 }, { "epoch": 1.91, "learning_rate": 1.3668767121905444e-05, "loss": 0.005, "step": 378360 }, { "epoch": 1.91, "learning_rate": 1.3661199428891433e-05, "loss": 0.0049, "step": 378370 }, { "epoch": 1.91, "learning_rate": 1.3653631735877422e-05, "loss": 0.0061, "step": 378380 }, { "epoch": 1.91, "learning_rate": 1.3646064042863412e-05, "loss": 0.0061, "step": 378390 }, { "epoch": 1.91, "learning_rate": 1.3638496349849402e-05, "loss": 0.0057, "step": 378400 }, { "epoch": 1.91, "learning_rate": 1.3630928656835392e-05, "loss": 0.0059, "step": 378410 }, { "epoch": 1.91, "learning_rate": 1.3623360963821382e-05, "loss": 0.0053, "step": 378420 }, { "epoch": 1.91, "learning_rate": 1.3615793270807372e-05, "loss": 0.0063, "step": 378430 }, { "epoch": 1.91, "learning_rate": 1.3608225577793362e-05, "loss": 0.0048, "step": 378440 }, { "epoch": 1.91, "learning_rate": 1.360065788477935e-05, "loss": 0.0064, "step": 378450 }, { "epoch": 1.91, "learning_rate": 1.359309019176534e-05, "loss": 0.0049, "step": 378460 }, { "epoch": 1.91, "learning_rate": 1.358552249875133e-05, "loss": 0.0037, "step": 378470 }, { "epoch": 1.91, "learning_rate": 1.357795480573732e-05, "loss": 0.0048, "step": 378480 }, { "epoch": 1.91, "learning_rate": 1.357038711272331e-05, "loss": 0.007, "step": 378490 }, { "epoch": 1.91, "learning_rate": 1.35628194197093e-05, "loss": 0.0067, "step": 378500 }, { "epoch": 1.91, "learning_rate": 1.355525172669529e-05, "loss": 0.0047, "step": 378510 }, { "epoch": 1.91, "learning_rate": 1.3547684033681276e-05, "loss": 0.0065, "step": 378520 }, { "epoch": 1.91, "learning_rate": 1.3540116340667266e-05, "loss": 0.0059, "step": 378530 }, { "epoch": 1.91, "learning_rate": 1.3532548647653256e-05, "loss": 0.007, "step": 378540 }, { "epoch": 1.91, "learning_rate": 1.3524980954639246e-05, "loss": 0.0063, "step": 378550 }, { "epoch": 1.91, "learning_rate": 1.3517413261625236e-05, "loss": 0.0044, "step": 378560 }, { "epoch": 1.91, "learning_rate": 1.3509845568611227e-05, "loss": 0.006, "step": 378570 }, { "epoch": 1.91, "learning_rate": 1.3502277875597217e-05, "loss": 0.0049, "step": 378580 }, { "epoch": 1.91, "learning_rate": 1.3494710182583207e-05, "loss": 0.0052, "step": 378590 }, { "epoch": 1.91, "learning_rate": 1.3487142489569194e-05, "loss": 0.005, "step": 378600 }, { "epoch": 1.91, "learning_rate": 1.3479574796555184e-05, "loss": 0.0071, "step": 378610 }, { "epoch": 1.91, "learning_rate": 1.3472007103541174e-05, "loss": 0.0054, "step": 378620 }, { "epoch": 1.91, "learning_rate": 1.3464439410527163e-05, "loss": 0.0055, "step": 378630 }, { "epoch": 1.91, "learning_rate": 1.3456871717513153e-05, "loss": 0.0052, "step": 378640 }, { "epoch": 1.91, "learning_rate": 1.3449304024499143e-05, "loss": 0.0061, "step": 378650 }, { "epoch": 1.91, "learning_rate": 1.3441736331485133e-05, "loss": 0.0063, "step": 378660 }, { "epoch": 1.91, "learning_rate": 1.3434168638471123e-05, "loss": 0.0047, "step": 378670 }, { "epoch": 1.91, "learning_rate": 1.3426600945457111e-05, "loss": 0.0047, "step": 378680 }, { "epoch": 1.91, "learning_rate": 1.3419033252443101e-05, "loss": 0.008, "step": 378690 }, { "epoch": 1.91, "learning_rate": 1.3411465559429091e-05, "loss": 0.0057, "step": 378700 }, { "epoch": 1.91, "learning_rate": 1.3403897866415081e-05, "loss": 0.0062, "step": 378710 }, { "epoch": 1.91, "learning_rate": 1.3396330173401071e-05, "loss": 0.0079, "step": 378720 }, { "epoch": 1.91, "learning_rate": 1.3388762480387061e-05, "loss": 0.0066, "step": 378730 }, { "epoch": 1.91, "learning_rate": 1.338119478737305e-05, "loss": 0.0059, "step": 378740 }, { "epoch": 1.91, "learning_rate": 1.337362709435904e-05, "loss": 0.0065, "step": 378750 }, { "epoch": 1.91, "learning_rate": 1.3366059401345029e-05, "loss": 0.0071, "step": 378760 }, { "epoch": 1.91, "learning_rate": 1.3358491708331019e-05, "loss": 0.0051, "step": 378770 }, { "epoch": 1.91, "learning_rate": 1.3350924015317009e-05, "loss": 0.0043, "step": 378780 }, { "epoch": 1.91, "learning_rate": 1.3343356322302999e-05, "loss": 0.0058, "step": 378790 }, { "epoch": 1.91, "learning_rate": 1.3335788629288989e-05, "loss": 0.0055, "step": 378800 }, { "epoch": 1.91, "learning_rate": 1.3328220936274979e-05, "loss": 0.0047, "step": 378810 }, { "epoch": 1.91, "learning_rate": 1.3320653243260968e-05, "loss": 0.0063, "step": 378820 }, { "epoch": 1.91, "learning_rate": 1.3313085550246958e-05, "loss": 0.0051, "step": 378830 }, { "epoch": 1.91, "learning_rate": 1.3305517857232947e-05, "loss": 0.0048, "step": 378840 }, { "epoch": 1.91, "learning_rate": 1.3297950164218936e-05, "loss": 0.0058, "step": 378850 }, { "epoch": 1.91, "learning_rate": 1.3290382471204926e-05, "loss": 0.0037, "step": 378860 }, { "epoch": 1.91, "learning_rate": 1.3282814778190916e-05, "loss": 0.0055, "step": 378870 }, { "epoch": 1.91, "learning_rate": 1.3275247085176906e-05, "loss": 0.0085, "step": 378880 }, { "epoch": 1.91, "learning_rate": 1.3267679392162896e-05, "loss": 0.0065, "step": 378890 }, { "epoch": 1.91, "learning_rate": 1.3260111699148886e-05, "loss": 0.0074, "step": 378900 }, { "epoch": 1.91, "learning_rate": 1.3252544006134876e-05, "loss": 0.0061, "step": 378910 }, { "epoch": 1.91, "learning_rate": 1.3244976313120864e-05, "loss": 0.007, "step": 378920 }, { "epoch": 1.91, "learning_rate": 1.3237408620106854e-05, "loss": 0.0044, "step": 378930 }, { "epoch": 1.91, "learning_rate": 1.3229840927092844e-05, "loss": 0.0045, "step": 378940 }, { "epoch": 1.91, "learning_rate": 1.3222273234078834e-05, "loss": 0.0047, "step": 378950 }, { "epoch": 1.91, "learning_rate": 1.3214705541064824e-05, "loss": 0.0068, "step": 378960 }, { "epoch": 1.91, "learning_rate": 1.3207137848050814e-05, "loss": 0.005, "step": 378970 }, { "epoch": 1.91, "learning_rate": 1.3199570155036804e-05, "loss": 0.0047, "step": 378980 }, { "epoch": 1.91, "learning_rate": 1.3192002462022794e-05, "loss": 0.0045, "step": 378990 }, { "epoch": 1.91, "learning_rate": 1.3184434769008782e-05, "loss": 0.0051, "step": 379000 }, { "epoch": 1.91, "eval_cer": 0.9144149433240143, "eval_loss": 0.00423853425309062, "eval_runtime": 116.3136, "eval_samples_per_second": 17.195, "eval_steps_per_second": 4.299, "step": 379000 }, { "epoch": 1.91, "learning_rate": 1.3176867075994772e-05, "loss": 0.0044, "step": 379010 }, { "epoch": 1.91, "learning_rate": 1.3169299382980762e-05, "loss": 0.0048, "step": 379020 }, { "epoch": 1.91, "learning_rate": 1.3161731689966752e-05, "loss": 0.0064, "step": 379030 }, { "epoch": 1.91, "learning_rate": 1.3154163996952741e-05, "loss": 0.0069, "step": 379040 }, { "epoch": 1.91, "learning_rate": 1.3146596303938731e-05, "loss": 0.0046, "step": 379050 }, { "epoch": 1.91, "learning_rate": 1.3139028610924721e-05, "loss": 0.0054, "step": 379060 }, { "epoch": 1.91, "learning_rate": 1.313146091791071e-05, "loss": 0.0038, "step": 379070 }, { "epoch": 1.91, "learning_rate": 1.31238932248967e-05, "loss": 0.0042, "step": 379080 }, { "epoch": 1.91, "learning_rate": 1.311632553188269e-05, "loss": 0.0056, "step": 379090 }, { "epoch": 1.91, "learning_rate": 1.310875783886868e-05, "loss": 0.0079, "step": 379100 }, { "epoch": 1.91, "learning_rate": 1.3101190145854669e-05, "loss": 0.0066, "step": 379110 }, { "epoch": 1.91, "learning_rate": 1.3093622452840659e-05, "loss": 0.0059, "step": 379120 }, { "epoch": 1.91, "learning_rate": 1.3086054759826649e-05, "loss": 0.0054, "step": 379130 }, { "epoch": 1.91, "learning_rate": 1.3078487066812639e-05, "loss": 0.0039, "step": 379140 }, { "epoch": 1.91, "learning_rate": 1.3070919373798627e-05, "loss": 0.0061, "step": 379150 }, { "epoch": 1.91, "learning_rate": 1.3063351680784617e-05, "loss": 0.0048, "step": 379160 }, { "epoch": 1.91, "learning_rate": 1.3055783987770607e-05, "loss": 0.0057, "step": 379170 }, { "epoch": 1.91, "learning_rate": 1.3048216294756597e-05, "loss": 0.0061, "step": 379180 }, { "epoch": 1.91, "learning_rate": 1.3040648601742587e-05, "loss": 0.0043, "step": 379190 }, { "epoch": 1.91, "learning_rate": 1.3033080908728577e-05, "loss": 0.0042, "step": 379200 }, { "epoch": 1.91, "learning_rate": 1.3025513215714567e-05, "loss": 0.0041, "step": 379210 }, { "epoch": 1.91, "learning_rate": 1.3017945522700556e-05, "loss": 0.0074, "step": 379220 }, { "epoch": 1.91, "learning_rate": 1.3010377829686545e-05, "loss": 0.0056, "step": 379230 }, { "epoch": 1.91, "learning_rate": 1.3002810136672535e-05, "loss": 0.0048, "step": 379240 }, { "epoch": 1.91, "learning_rate": 1.2995242443658525e-05, "loss": 0.0044, "step": 379250 }, { "epoch": 1.91, "learning_rate": 1.2987674750644514e-05, "loss": 0.0051, "step": 379260 }, { "epoch": 1.91, "learning_rate": 1.2980107057630504e-05, "loss": 0.0061, "step": 379270 }, { "epoch": 1.91, "learning_rate": 1.2972539364616494e-05, "loss": 0.0045, "step": 379280 }, { "epoch": 1.91, "learning_rate": 1.2964971671602484e-05, "loss": 0.0048, "step": 379290 }, { "epoch": 1.91, "learning_rate": 1.2957403978588474e-05, "loss": 0.0051, "step": 379300 }, { "epoch": 1.91, "learning_rate": 1.2949836285574462e-05, "loss": 0.0049, "step": 379310 }, { "epoch": 1.91, "learning_rate": 1.2942268592560452e-05, "loss": 0.0056, "step": 379320 }, { "epoch": 1.91, "learning_rate": 1.2934700899546442e-05, "loss": 0.0067, "step": 379330 }, { "epoch": 1.91, "learning_rate": 1.2927133206532432e-05, "loss": 0.0064, "step": 379340 }, { "epoch": 1.91, "learning_rate": 1.2919565513518422e-05, "loss": 0.0048, "step": 379350 }, { "epoch": 1.91, "learning_rate": 1.2911997820504412e-05, "loss": 0.0061, "step": 379360 }, { "epoch": 1.91, "learning_rate": 1.2904430127490402e-05, "loss": 0.0046, "step": 379370 }, { "epoch": 1.91, "learning_rate": 1.2896862434476392e-05, "loss": 0.0062, "step": 379380 }, { "epoch": 1.91, "learning_rate": 1.2889294741462378e-05, "loss": 0.0053, "step": 379390 }, { "epoch": 1.91, "learning_rate": 1.2881727048448368e-05, "loss": 0.0068, "step": 379400 }, { "epoch": 1.91, "learning_rate": 1.287415935543436e-05, "loss": 0.008, "step": 379410 }, { "epoch": 1.91, "learning_rate": 1.286659166242035e-05, "loss": 0.0054, "step": 379420 }, { "epoch": 1.91, "learning_rate": 1.285902396940634e-05, "loss": 0.0045, "step": 379430 }, { "epoch": 1.91, "learning_rate": 1.285145627639233e-05, "loss": 0.0052, "step": 379440 }, { "epoch": 1.91, "learning_rate": 1.284388858337832e-05, "loss": 0.0047, "step": 379450 }, { "epoch": 1.91, "learning_rate": 1.283632089036431e-05, "loss": 0.0058, "step": 379460 }, { "epoch": 1.91, "learning_rate": 1.2828753197350296e-05, "loss": 0.0049, "step": 379470 }, { "epoch": 1.91, "learning_rate": 1.2821185504336286e-05, "loss": 0.0052, "step": 379480 }, { "epoch": 1.91, "learning_rate": 1.2813617811322276e-05, "loss": 0.0056, "step": 379490 }, { "epoch": 1.91, "learning_rate": 1.2806050118308266e-05, "loss": 0.0062, "step": 379500 }, { "epoch": 1.91, "learning_rate": 1.2798482425294255e-05, "loss": 0.0061, "step": 379510 }, { "epoch": 1.91, "learning_rate": 1.2790914732280245e-05, "loss": 0.0061, "step": 379520 }, { "epoch": 1.91, "learning_rate": 1.2783347039266235e-05, "loss": 0.005, "step": 379530 }, { "epoch": 1.91, "learning_rate": 1.2775779346252227e-05, "loss": 0.0083, "step": 379540 }, { "epoch": 1.91, "learning_rate": 1.2768211653238213e-05, "loss": 0.0064, "step": 379550 }, { "epoch": 1.91, "learning_rate": 1.2760643960224203e-05, "loss": 0.0057, "step": 379560 }, { "epoch": 1.91, "learning_rate": 1.2753076267210193e-05, "loss": 0.0053, "step": 379570 }, { "epoch": 1.92, "learning_rate": 1.2745508574196183e-05, "loss": 0.0066, "step": 379580 }, { "epoch": 1.92, "learning_rate": 1.2737940881182173e-05, "loss": 0.0065, "step": 379590 }, { "epoch": 1.92, "learning_rate": 1.2730373188168163e-05, "loss": 0.0053, "step": 379600 }, { "epoch": 1.92, "learning_rate": 1.2722805495154153e-05, "loss": 0.0049, "step": 379610 }, { "epoch": 1.92, "learning_rate": 1.2715237802140141e-05, "loss": 0.0047, "step": 379620 }, { "epoch": 1.92, "learning_rate": 1.2707670109126131e-05, "loss": 0.0066, "step": 379630 }, { "epoch": 1.92, "learning_rate": 1.2700102416112121e-05, "loss": 0.0059, "step": 379640 }, { "epoch": 1.92, "learning_rate": 1.2692534723098111e-05, "loss": 0.0046, "step": 379650 }, { "epoch": 1.92, "learning_rate": 1.26849670300841e-05, "loss": 0.004, "step": 379660 }, { "epoch": 1.92, "learning_rate": 1.267739933707009e-05, "loss": 0.0048, "step": 379670 }, { "epoch": 1.92, "learning_rate": 1.266983164405608e-05, "loss": 0.0051, "step": 379680 }, { "epoch": 1.92, "learning_rate": 1.266226395104207e-05, "loss": 0.0054, "step": 379690 }, { "epoch": 1.92, "learning_rate": 1.2654696258028059e-05, "loss": 0.0077, "step": 379700 }, { "epoch": 1.92, "learning_rate": 1.2647128565014049e-05, "loss": 0.0076, "step": 379710 }, { "epoch": 1.92, "learning_rate": 1.2639560872000039e-05, "loss": 0.0045, "step": 379720 }, { "epoch": 1.92, "learning_rate": 1.2631993178986028e-05, "loss": 0.0058, "step": 379730 }, { "epoch": 1.92, "learning_rate": 1.2624425485972018e-05, "loss": 0.006, "step": 379740 }, { "epoch": 1.92, "learning_rate": 1.2616857792958008e-05, "loss": 0.0077, "step": 379750 }, { "epoch": 1.92, "learning_rate": 1.2609290099943998e-05, "loss": 0.0067, "step": 379760 }, { "epoch": 1.92, "learning_rate": 1.2601722406929988e-05, "loss": 0.0066, "step": 379770 }, { "epoch": 1.92, "learning_rate": 1.2594154713915976e-05, "loss": 0.0063, "step": 379780 }, { "epoch": 1.92, "learning_rate": 1.2586587020901966e-05, "loss": 0.0049, "step": 379790 }, { "epoch": 1.92, "learning_rate": 1.2579019327887956e-05, "loss": 0.0064, "step": 379800 }, { "epoch": 1.92, "learning_rate": 1.2571451634873946e-05, "loss": 0.0052, "step": 379810 }, { "epoch": 1.92, "learning_rate": 1.2563883941859936e-05, "loss": 0.0072, "step": 379820 }, { "epoch": 1.92, "learning_rate": 1.2556316248845926e-05, "loss": 0.0061, "step": 379830 }, { "epoch": 1.92, "learning_rate": 1.2548748555831916e-05, "loss": 0.0057, "step": 379840 }, { "epoch": 1.92, "learning_rate": 1.2541180862817906e-05, "loss": 0.0062, "step": 379850 }, { "epoch": 1.92, "learning_rate": 1.2533613169803894e-05, "loss": 0.0075, "step": 379860 }, { "epoch": 1.92, "learning_rate": 1.2526045476789884e-05, "loss": 0.0047, "step": 379870 }, { "epoch": 1.92, "learning_rate": 1.2518477783775874e-05, "loss": 0.0049, "step": 379880 }, { "epoch": 1.92, "learning_rate": 1.2510910090761864e-05, "loss": 0.0059, "step": 379890 }, { "epoch": 1.92, "learning_rate": 1.2503342397747854e-05, "loss": 0.0085, "step": 379900 }, { "epoch": 1.92, "learning_rate": 1.2495774704733844e-05, "loss": 0.0054, "step": 379910 }, { "epoch": 1.92, "learning_rate": 1.2488207011719833e-05, "loss": 0.0053, "step": 379920 }, { "epoch": 1.92, "learning_rate": 1.2480639318705823e-05, "loss": 0.0058, "step": 379930 }, { "epoch": 1.92, "learning_rate": 1.2473071625691812e-05, "loss": 0.0087, "step": 379940 }, { "epoch": 1.92, "learning_rate": 1.2465503932677801e-05, "loss": 0.0052, "step": 379950 }, { "epoch": 1.92, "learning_rate": 1.2457936239663791e-05, "loss": 0.0074, "step": 379960 }, { "epoch": 1.92, "learning_rate": 1.2450368546649781e-05, "loss": 0.0063, "step": 379970 }, { "epoch": 1.92, "learning_rate": 1.2442800853635771e-05, "loss": 0.0072, "step": 379980 }, { "epoch": 1.92, "learning_rate": 1.2435233160621761e-05, "loss": 0.0043, "step": 379990 }, { "epoch": 1.92, "learning_rate": 1.2427665467607751e-05, "loss": 0.0057, "step": 380000 }, { "epoch": 1.92, "eval_cer": 0.9144217360968921, "eval_loss": 0.004196519032120705, "eval_runtime": 116.3652, "eval_samples_per_second": 17.187, "eval_steps_per_second": 4.297, "step": 380000 }, { "epoch": 1.92, "learning_rate": 1.2420097774593741e-05, "loss": 0.0058, "step": 380010 }, { "epoch": 1.92, "learning_rate": 1.241253008157973e-05, "loss": 0.0044, "step": 380020 }, { "epoch": 1.92, "learning_rate": 1.2404962388565719e-05, "loss": 0.0079, "step": 380030 }, { "epoch": 1.92, "learning_rate": 1.2397394695551709e-05, "loss": 0.0054, "step": 380040 }, { "epoch": 1.92, "learning_rate": 1.2389827002537699e-05, "loss": 0.0058, "step": 380050 }, { "epoch": 1.92, "learning_rate": 1.2382259309523689e-05, "loss": 0.0062, "step": 380060 }, { "epoch": 1.92, "learning_rate": 1.2374691616509679e-05, "loss": 0.0038, "step": 380070 }, { "epoch": 1.92, "learning_rate": 1.2367123923495669e-05, "loss": 0.0052, "step": 380080 }, { "epoch": 1.92, "learning_rate": 1.2359556230481659e-05, "loss": 0.0056, "step": 380090 }, { "epoch": 1.92, "learning_rate": 1.2351988537467647e-05, "loss": 0.006, "step": 380100 }, { "epoch": 1.92, "learning_rate": 1.2344420844453637e-05, "loss": 0.006, "step": 380110 }, { "epoch": 1.92, "learning_rate": 1.2336853151439627e-05, "loss": 0.0061, "step": 380120 }, { "epoch": 1.92, "learning_rate": 1.2329285458425617e-05, "loss": 0.0059, "step": 380130 }, { "epoch": 1.92, "learning_rate": 1.2321717765411606e-05, "loss": 0.0051, "step": 380140 }, { "epoch": 1.92, "learning_rate": 1.2314150072397596e-05, "loss": 0.0056, "step": 380150 }, { "epoch": 1.92, "learning_rate": 1.2306582379383586e-05, "loss": 0.0065, "step": 380160 }, { "epoch": 1.92, "learning_rate": 1.2299014686369574e-05, "loss": 0.005, "step": 380170 }, { "epoch": 1.92, "learning_rate": 1.2291446993355564e-05, "loss": 0.007, "step": 380180 }, { "epoch": 1.92, "learning_rate": 1.2283879300341554e-05, "loss": 0.0051, "step": 380190 }, { "epoch": 1.92, "learning_rate": 1.2276311607327544e-05, "loss": 0.0032, "step": 380200 }, { "epoch": 1.92, "learning_rate": 1.2268743914313534e-05, "loss": 0.0054, "step": 380210 }, { "epoch": 1.92, "learning_rate": 1.2261176221299524e-05, "loss": 0.0054, "step": 380220 }, { "epoch": 1.92, "learning_rate": 1.2253608528285514e-05, "loss": 0.0063, "step": 380230 }, { "epoch": 1.92, "learning_rate": 1.2246040835271504e-05, "loss": 0.0052, "step": 380240 }, { "epoch": 1.92, "learning_rate": 1.223847314225749e-05, "loss": 0.0054, "step": 380250 }, { "epoch": 1.92, "learning_rate": 1.2230905449243482e-05, "loss": 0.0061, "step": 380260 }, { "epoch": 1.92, "learning_rate": 1.2223337756229472e-05, "loss": 0.0068, "step": 380270 }, { "epoch": 1.92, "learning_rate": 1.2215770063215462e-05, "loss": 0.0058, "step": 380280 }, { "epoch": 1.92, "learning_rate": 1.2208202370201452e-05, "loss": 0.0066, "step": 380290 }, { "epoch": 1.92, "learning_rate": 1.2200634677187442e-05, "loss": 0.0049, "step": 380300 }, { "epoch": 1.92, "learning_rate": 1.2193066984173432e-05, "loss": 0.0045, "step": 380310 }, { "epoch": 1.92, "learning_rate": 1.2185499291159421e-05, "loss": 0.0056, "step": 380320 }, { "epoch": 1.92, "learning_rate": 1.2177931598145408e-05, "loss": 0.0054, "step": 380330 }, { "epoch": 1.92, "learning_rate": 1.2170363905131398e-05, "loss": 0.0053, "step": 380340 }, { "epoch": 1.92, "learning_rate": 1.2162796212117388e-05, "loss": 0.0082, "step": 380350 }, { "epoch": 1.92, "learning_rate": 1.2155228519103378e-05, "loss": 0.0056, "step": 380360 }, { "epoch": 1.92, "learning_rate": 1.2147660826089368e-05, "loss": 0.0053, "step": 380370 }, { "epoch": 1.92, "learning_rate": 1.214009313307536e-05, "loss": 0.0053, "step": 380380 }, { "epoch": 1.92, "learning_rate": 1.213252544006135e-05, "loss": 0.0072, "step": 380390 }, { "epoch": 1.92, "learning_rate": 1.2124957747047339e-05, "loss": 0.0092, "step": 380400 }, { "epoch": 1.92, "learning_rate": 1.2117390054033326e-05, "loss": 0.0049, "step": 380410 }, { "epoch": 1.92, "learning_rate": 1.2109822361019316e-05, "loss": 0.0046, "step": 380420 }, { "epoch": 1.92, "learning_rate": 1.2102254668005305e-05, "loss": 0.0075, "step": 380430 }, { "epoch": 1.92, "learning_rate": 1.2094686974991295e-05, "loss": 0.0057, "step": 380440 }, { "epoch": 1.92, "learning_rate": 1.2087119281977285e-05, "loss": 0.0052, "step": 380450 }, { "epoch": 1.92, "learning_rate": 1.2079551588963275e-05, "loss": 0.0064, "step": 380460 }, { "epoch": 1.92, "learning_rate": 1.2071983895949265e-05, "loss": 0.0042, "step": 380470 }, { "epoch": 1.92, "learning_rate": 1.2064416202935255e-05, "loss": 0.0061, "step": 380480 }, { "epoch": 1.92, "learning_rate": 1.2056848509921243e-05, "loss": 0.0066, "step": 380490 }, { "epoch": 1.92, "learning_rate": 1.2049280816907233e-05, "loss": 0.0046, "step": 380500 }, { "epoch": 1.92, "learning_rate": 1.2041713123893223e-05, "loss": 0.005, "step": 380510 }, { "epoch": 1.92, "learning_rate": 1.2034145430879213e-05, "loss": 0.0042, "step": 380520 }, { "epoch": 1.92, "learning_rate": 1.2026577737865203e-05, "loss": 0.0079, "step": 380530 }, { "epoch": 1.92, "learning_rate": 1.2019010044851193e-05, "loss": 0.006, "step": 380540 }, { "epoch": 1.92, "learning_rate": 1.2011442351837183e-05, "loss": 0.0095, "step": 380550 }, { "epoch": 1.92, "learning_rate": 1.2003874658823173e-05, "loss": 0.0063, "step": 380560 }, { "epoch": 1.92, "learning_rate": 1.199630696580916e-05, "loss": 0.0052, "step": 380570 }, { "epoch": 1.92, "learning_rate": 1.198873927279515e-05, "loss": 0.0061, "step": 380580 }, { "epoch": 1.92, "learning_rate": 1.198117157978114e-05, "loss": 0.0056, "step": 380590 }, { "epoch": 1.92, "learning_rate": 1.197360388676713e-05, "loss": 0.0058, "step": 380600 }, { "epoch": 1.92, "learning_rate": 1.196603619375312e-05, "loss": 0.0042, "step": 380610 }, { "epoch": 1.92, "learning_rate": 1.195846850073911e-05, "loss": 0.0054, "step": 380620 }, { "epoch": 1.92, "learning_rate": 1.19509008077251e-05, "loss": 0.0061, "step": 380630 }, { "epoch": 1.92, "learning_rate": 1.194333311471109e-05, "loss": 0.006, "step": 380640 }, { "epoch": 1.92, "learning_rate": 1.1935765421697078e-05, "loss": 0.0057, "step": 380650 }, { "epoch": 1.92, "learning_rate": 1.1928197728683068e-05, "loss": 0.0068, "step": 380660 }, { "epoch": 1.92, "learning_rate": 1.1920630035669058e-05, "loss": 0.0045, "step": 380670 }, { "epoch": 1.92, "learning_rate": 1.1913062342655048e-05, "loss": 0.0055, "step": 380680 }, { "epoch": 1.92, "learning_rate": 1.1905494649641038e-05, "loss": 0.0044, "step": 380690 }, { "epoch": 1.92, "learning_rate": 1.1897926956627028e-05, "loss": 0.0054, "step": 380700 }, { "epoch": 1.92, "learning_rate": 1.1890359263613018e-05, "loss": 0.0052, "step": 380710 }, { "epoch": 1.92, "learning_rate": 1.1882791570599006e-05, "loss": 0.0057, "step": 380720 }, { "epoch": 1.92, "learning_rate": 1.1875223877584996e-05, "loss": 0.0068, "step": 380730 }, { "epoch": 1.92, "learning_rate": 1.1867656184570986e-05, "loss": 0.0059, "step": 380740 }, { "epoch": 1.92, "learning_rate": 1.1860088491556976e-05, "loss": 0.0046, "step": 380750 }, { "epoch": 1.92, "learning_rate": 1.1852520798542966e-05, "loss": 0.0063, "step": 380760 }, { "epoch": 1.92, "learning_rate": 1.1844953105528956e-05, "loss": 0.0049, "step": 380770 }, { "epoch": 1.92, "learning_rate": 1.1837385412514946e-05, "loss": 0.0052, "step": 380780 }, { "epoch": 1.92, "learning_rate": 1.1829817719500936e-05, "loss": 0.0032, "step": 380790 }, { "epoch": 1.92, "learning_rate": 1.1822250026486924e-05, "loss": 0.006, "step": 380800 }, { "epoch": 1.92, "learning_rate": 1.1814682333472914e-05, "loss": 0.0055, "step": 380810 }, { "epoch": 1.92, "learning_rate": 1.1807114640458904e-05, "loss": 0.0082, "step": 380820 }, { "epoch": 1.92, "learning_rate": 1.1799546947444893e-05, "loss": 0.0071, "step": 380830 }, { "epoch": 1.92, "learning_rate": 1.1791979254430883e-05, "loss": 0.0036, "step": 380840 }, { "epoch": 1.92, "learning_rate": 1.1784411561416873e-05, "loss": 0.0057, "step": 380850 }, { "epoch": 1.92, "learning_rate": 1.1776843868402863e-05, "loss": 0.0057, "step": 380860 }, { "epoch": 1.92, "learning_rate": 1.1769276175388853e-05, "loss": 0.0058, "step": 380870 }, { "epoch": 1.92, "learning_rate": 1.1761708482374841e-05, "loss": 0.004, "step": 380880 }, { "epoch": 1.92, "learning_rate": 1.1754140789360831e-05, "loss": 0.0049, "step": 380890 }, { "epoch": 1.92, "learning_rate": 1.1746573096346821e-05, "loss": 0.0047, "step": 380900 }, { "epoch": 1.92, "learning_rate": 1.1739005403332811e-05, "loss": 0.0053, "step": 380910 }, { "epoch": 1.92, "learning_rate": 1.1731437710318801e-05, "loss": 0.0043, "step": 380920 }, { "epoch": 1.92, "learning_rate": 1.1723870017304791e-05, "loss": 0.0056, "step": 380930 }, { "epoch": 1.92, "learning_rate": 1.171630232429078e-05, "loss": 0.0054, "step": 380940 }, { "epoch": 1.92, "learning_rate": 1.170873463127677e-05, "loss": 0.0059, "step": 380950 }, { "epoch": 1.92, "learning_rate": 1.1701166938262759e-05, "loss": 0.0054, "step": 380960 }, { "epoch": 1.92, "learning_rate": 1.1693599245248749e-05, "loss": 0.0045, "step": 380970 }, { "epoch": 1.92, "learning_rate": 1.1686031552234739e-05, "loss": 0.0052, "step": 380980 }, { "epoch": 1.92, "learning_rate": 1.1678463859220729e-05, "loss": 0.0086, "step": 380990 }, { "epoch": 1.92, "learning_rate": 1.1670896166206719e-05, "loss": 0.0066, "step": 381000 }, { "epoch": 1.92, "eval_cer": 0.9144256176813937, "eval_loss": 0.004235303029417992, "eval_runtime": 116.578, "eval_samples_per_second": 17.156, "eval_steps_per_second": 4.289, "step": 381000 }, { "epoch": 1.92, "learning_rate": 1.1663328473192709e-05, "loss": 0.0058, "step": 381010 }, { "epoch": 1.92, "learning_rate": 1.1655760780178698e-05, "loss": 0.0065, "step": 381020 }, { "epoch": 1.92, "learning_rate": 1.1648193087164688e-05, "loss": 0.0102, "step": 381030 }, { "epoch": 1.92, "learning_rate": 1.1640625394150677e-05, "loss": 0.0047, "step": 381040 }, { "epoch": 1.92, "learning_rate": 1.1633057701136666e-05, "loss": 0.0055, "step": 381050 }, { "epoch": 1.92, "learning_rate": 1.1625490008122656e-05, "loss": 0.0044, "step": 381060 }, { "epoch": 1.92, "learning_rate": 1.1617922315108646e-05, "loss": 0.0046, "step": 381070 }, { "epoch": 1.92, "learning_rate": 1.1610354622094636e-05, "loss": 0.0051, "step": 381080 }, { "epoch": 1.92, "learning_rate": 1.1602786929080626e-05, "loss": 0.0061, "step": 381090 }, { "epoch": 1.92, "learning_rate": 1.1595219236066616e-05, "loss": 0.0056, "step": 381100 }, { "epoch": 1.92, "learning_rate": 1.1587651543052606e-05, "loss": 0.0068, "step": 381110 }, { "epoch": 1.92, "learning_rate": 1.1580083850038594e-05, "loss": 0.0079, "step": 381120 }, { "epoch": 1.92, "learning_rate": 1.1572516157024584e-05, "loss": 0.0066, "step": 381130 }, { "epoch": 1.92, "learning_rate": 1.1564948464010574e-05, "loss": 0.0048, "step": 381140 }, { "epoch": 1.92, "learning_rate": 1.1557380770996564e-05, "loss": 0.0063, "step": 381150 }, { "epoch": 1.92, "learning_rate": 1.1549813077982554e-05, "loss": 0.0066, "step": 381160 }, { "epoch": 1.92, "learning_rate": 1.1542245384968544e-05, "loss": 0.0069, "step": 381170 }, { "epoch": 1.92, "learning_rate": 1.1534677691954534e-05, "loss": 0.0074, "step": 381180 }, { "epoch": 1.92, "learning_rate": 1.1527109998940524e-05, "loss": 0.0068, "step": 381190 }, { "epoch": 1.92, "learning_rate": 1.151954230592651e-05, "loss": 0.0068, "step": 381200 }, { "epoch": 1.92, "learning_rate": 1.15119746129125e-05, "loss": 0.0046, "step": 381210 }, { "epoch": 1.92, "learning_rate": 1.150440691989849e-05, "loss": 0.0047, "step": 381220 }, { "epoch": 1.92, "learning_rate": 1.1496839226884482e-05, "loss": 0.004, "step": 381230 }, { "epoch": 1.92, "learning_rate": 1.1489271533870471e-05, "loss": 0.0055, "step": 381240 }, { "epoch": 1.92, "learning_rate": 1.1481703840856461e-05, "loss": 0.0061, "step": 381250 }, { "epoch": 1.92, "learning_rate": 1.1474136147842451e-05, "loss": 0.004, "step": 381260 }, { "epoch": 1.92, "learning_rate": 1.1466568454828438e-05, "loss": 0.0067, "step": 381270 }, { "epoch": 1.92, "learning_rate": 1.1459000761814428e-05, "loss": 0.0045, "step": 381280 }, { "epoch": 1.92, "learning_rate": 1.1451433068800418e-05, "loss": 0.0043, "step": 381290 }, { "epoch": 1.92, "learning_rate": 1.1443865375786408e-05, "loss": 0.0062, "step": 381300 }, { "epoch": 1.92, "learning_rate": 1.1436297682772397e-05, "loss": 0.0074, "step": 381310 }, { "epoch": 1.92, "learning_rate": 1.1428729989758387e-05, "loss": 0.0049, "step": 381320 }, { "epoch": 1.92, "learning_rate": 1.1421162296744377e-05, "loss": 0.0058, "step": 381330 }, { "epoch": 1.92, "learning_rate": 1.1413594603730367e-05, "loss": 0.0047, "step": 381340 }, { "epoch": 1.92, "learning_rate": 1.1406026910716355e-05, "loss": 0.0086, "step": 381350 }, { "epoch": 1.92, "learning_rate": 1.1398459217702345e-05, "loss": 0.005, "step": 381360 }, { "epoch": 1.92, "learning_rate": 1.1390891524688335e-05, "loss": 0.0063, "step": 381370 }, { "epoch": 1.92, "learning_rate": 1.1383323831674325e-05, "loss": 0.0046, "step": 381380 }, { "epoch": 1.92, "learning_rate": 1.1375756138660315e-05, "loss": 0.0048, "step": 381390 }, { "epoch": 1.92, "learning_rate": 1.1368188445646305e-05, "loss": 0.0072, "step": 381400 }, { "epoch": 1.92, "learning_rate": 1.1360620752632295e-05, "loss": 0.0079, "step": 381410 }, { "epoch": 1.92, "learning_rate": 1.1353053059618285e-05, "loss": 0.0064, "step": 381420 }, { "epoch": 1.92, "learning_rate": 1.1345485366604273e-05, "loss": 0.0069, "step": 381430 }, { "epoch": 1.92, "learning_rate": 1.1337917673590263e-05, "loss": 0.0054, "step": 381440 }, { "epoch": 1.92, "learning_rate": 1.1330349980576253e-05, "loss": 0.0058, "step": 381450 }, { "epoch": 1.92, "learning_rate": 1.1322782287562243e-05, "loss": 0.005, "step": 381460 }, { "epoch": 1.92, "learning_rate": 1.1315214594548233e-05, "loss": 0.0061, "step": 381470 }, { "epoch": 1.92, "learning_rate": 1.1307646901534223e-05, "loss": 0.0047, "step": 381480 }, { "epoch": 1.92, "learning_rate": 1.1300079208520212e-05, "loss": 0.0064, "step": 381490 }, { "epoch": 1.92, "learning_rate": 1.1292511515506202e-05, "loss": 0.0067, "step": 381500 }, { "epoch": 1.92, "learning_rate": 1.128494382249219e-05, "loss": 0.0059, "step": 381510 }, { "epoch": 1.92, "learning_rate": 1.127737612947818e-05, "loss": 0.0061, "step": 381520 }, { "epoch": 1.92, "learning_rate": 1.126980843646417e-05, "loss": 0.008, "step": 381530 }, { "epoch": 1.92, "learning_rate": 1.126224074345016e-05, "loss": 0.0051, "step": 381540 }, { "epoch": 1.92, "learning_rate": 1.125467305043615e-05, "loss": 0.0065, "step": 381550 }, { "epoch": 1.93, "learning_rate": 1.124710535742214e-05, "loss": 0.006, "step": 381560 }, { "epoch": 1.93, "learning_rate": 1.123953766440813e-05, "loss": 0.0067, "step": 381570 }, { "epoch": 1.93, "learning_rate": 1.123196997139412e-05, "loss": 0.0074, "step": 381580 }, { "epoch": 1.93, "learning_rate": 1.1224402278380108e-05, "loss": 0.0081, "step": 381590 }, { "epoch": 1.93, "learning_rate": 1.1216834585366098e-05, "loss": 0.0044, "step": 381600 }, { "epoch": 1.93, "learning_rate": 1.1209266892352088e-05, "loss": 0.0046, "step": 381610 }, { "epoch": 1.93, "learning_rate": 1.1201699199338078e-05, "loss": 0.005, "step": 381620 }, { "epoch": 1.93, "learning_rate": 1.1194131506324068e-05, "loss": 0.0068, "step": 381630 }, { "epoch": 1.93, "learning_rate": 1.1186563813310058e-05, "loss": 0.0054, "step": 381640 }, { "epoch": 1.93, "learning_rate": 1.1178996120296048e-05, "loss": 0.0058, "step": 381650 }, { "epoch": 1.93, "learning_rate": 1.1171428427282038e-05, "loss": 0.0062, "step": 381660 }, { "epoch": 1.93, "learning_rate": 1.1163860734268026e-05, "loss": 0.0052, "step": 381670 }, { "epoch": 1.93, "learning_rate": 1.1156293041254016e-05, "loss": 0.0046, "step": 381680 }, { "epoch": 1.93, "learning_rate": 1.1148725348240006e-05, "loss": 0.0052, "step": 381690 }, { "epoch": 1.93, "learning_rate": 1.1141157655225996e-05, "loss": 0.0079, "step": 381700 }, { "epoch": 1.93, "learning_rate": 1.1133589962211985e-05, "loss": 0.0053, "step": 381710 }, { "epoch": 1.93, "learning_rate": 1.1126022269197975e-05, "loss": 0.0056, "step": 381720 }, { "epoch": 1.93, "learning_rate": 1.1118454576183965e-05, "loss": 0.0057, "step": 381730 }, { "epoch": 1.93, "learning_rate": 1.1110886883169954e-05, "loss": 0.0048, "step": 381740 }, { "epoch": 1.93, "learning_rate": 1.1103319190155943e-05, "loss": 0.0042, "step": 381750 }, { "epoch": 1.93, "learning_rate": 1.1095751497141933e-05, "loss": 0.0058, "step": 381760 }, { "epoch": 1.93, "learning_rate": 1.1088183804127923e-05, "loss": 0.0059, "step": 381770 }, { "epoch": 1.93, "learning_rate": 1.1080616111113913e-05, "loss": 0.0073, "step": 381780 }, { "epoch": 1.93, "learning_rate": 1.1073048418099903e-05, "loss": 0.0073, "step": 381790 }, { "epoch": 1.93, "learning_rate": 1.1065480725085893e-05, "loss": 0.0043, "step": 381800 }, { "epoch": 1.93, "learning_rate": 1.1057913032071883e-05, "loss": 0.0096, "step": 381810 }, { "epoch": 1.93, "learning_rate": 1.1050345339057871e-05, "loss": 0.005, "step": 381820 }, { "epoch": 1.93, "learning_rate": 1.1042777646043861e-05, "loss": 0.0041, "step": 381830 }, { "epoch": 1.93, "learning_rate": 1.1035209953029851e-05, "loss": 0.0056, "step": 381840 }, { "epoch": 1.93, "learning_rate": 1.1027642260015841e-05, "loss": 0.0046, "step": 381850 }, { "epoch": 1.93, "learning_rate": 1.102007456700183e-05, "loss": 0.0044, "step": 381860 }, { "epoch": 1.93, "learning_rate": 1.101250687398782e-05, "loss": 0.0047, "step": 381870 }, { "epoch": 1.93, "learning_rate": 1.100493918097381e-05, "loss": 0.005, "step": 381880 }, { "epoch": 1.93, "learning_rate": 1.09973714879598e-05, "loss": 0.0059, "step": 381890 }, { "epoch": 1.93, "learning_rate": 1.0989803794945789e-05, "loss": 0.0068, "step": 381900 }, { "epoch": 1.93, "learning_rate": 1.0982236101931779e-05, "loss": 0.0049, "step": 381910 }, { "epoch": 1.93, "learning_rate": 1.0974668408917769e-05, "loss": 0.0044, "step": 381920 }, { "epoch": 1.93, "learning_rate": 1.0967100715903758e-05, "loss": 0.008, "step": 381930 }, { "epoch": 1.93, "learning_rate": 1.0959533022889748e-05, "loss": 0.0059, "step": 381940 }, { "epoch": 1.93, "learning_rate": 1.0951965329875738e-05, "loss": 0.0038, "step": 381950 }, { "epoch": 1.93, "learning_rate": 1.0944397636861728e-05, "loss": 0.0051, "step": 381960 }, { "epoch": 1.93, "learning_rate": 1.0936829943847718e-05, "loss": 0.0054, "step": 381970 }, { "epoch": 1.93, "learning_rate": 1.0929262250833706e-05, "loss": 0.0086, "step": 381980 }, { "epoch": 1.93, "learning_rate": 1.0921694557819696e-05, "loss": 0.0052, "step": 381990 }, { "epoch": 1.93, "learning_rate": 1.0914126864805686e-05, "loss": 0.0067, "step": 382000 }, { "epoch": 1.93, "eval_cer": 0.9144032985705095, "eval_loss": 0.004233332350850105, "eval_runtime": 116.331, "eval_samples_per_second": 17.192, "eval_steps_per_second": 4.298, "step": 382000 }, { "epoch": 1.93, "learning_rate": 1.0906559171791676e-05, "loss": 0.0065, "step": 382010 }, { "epoch": 1.93, "learning_rate": 1.0898991478777666e-05, "loss": 0.0067, "step": 382020 }, { "epoch": 1.93, "learning_rate": 1.0891423785763656e-05, "loss": 0.0071, "step": 382030 }, { "epoch": 1.93, "learning_rate": 1.0883856092749646e-05, "loss": 0.0059, "step": 382040 }, { "epoch": 1.93, "learning_rate": 1.0876288399735636e-05, "loss": 0.0059, "step": 382050 }, { "epoch": 1.93, "learning_rate": 1.0868720706721622e-05, "loss": 0.0075, "step": 382060 }, { "epoch": 1.93, "learning_rate": 1.0861153013707614e-05, "loss": 0.0048, "step": 382070 }, { "epoch": 1.93, "learning_rate": 1.0853585320693604e-05, "loss": 0.0072, "step": 382080 }, { "epoch": 1.93, "learning_rate": 1.0846017627679594e-05, "loss": 0.0054, "step": 382090 }, { "epoch": 1.93, "learning_rate": 1.0838449934665584e-05, "loss": 0.006, "step": 382100 }, { "epoch": 1.93, "learning_rate": 1.0830882241651574e-05, "loss": 0.0085, "step": 382110 }, { "epoch": 1.93, "learning_rate": 1.0823314548637563e-05, "loss": 0.0055, "step": 382120 }, { "epoch": 1.93, "learning_rate": 1.0815746855623553e-05, "loss": 0.0041, "step": 382130 }, { "epoch": 1.93, "learning_rate": 1.080817916260954e-05, "loss": 0.0053, "step": 382140 }, { "epoch": 1.93, "learning_rate": 1.080061146959553e-05, "loss": 0.0035, "step": 382150 }, { "epoch": 1.93, "learning_rate": 1.079304377658152e-05, "loss": 0.0043, "step": 382160 }, { "epoch": 1.93, "learning_rate": 1.078547608356751e-05, "loss": 0.0066, "step": 382170 }, { "epoch": 1.93, "learning_rate": 1.07779083905535e-05, "loss": 0.0049, "step": 382180 }, { "epoch": 1.93, "learning_rate": 1.077034069753949e-05, "loss": 0.005, "step": 382190 }, { "epoch": 1.93, "learning_rate": 1.0762773004525481e-05, "loss": 0.0054, "step": 382200 }, { "epoch": 1.93, "learning_rate": 1.0755205311511471e-05, "loss": 0.0072, "step": 382210 }, { "epoch": 1.93, "learning_rate": 1.0747637618497457e-05, "loss": 0.0045, "step": 382220 }, { "epoch": 1.93, "learning_rate": 1.0740069925483447e-05, "loss": 0.005, "step": 382230 }, { "epoch": 1.93, "learning_rate": 1.0732502232469437e-05, "loss": 0.0099, "step": 382240 }, { "epoch": 1.93, "learning_rate": 1.0724934539455427e-05, "loss": 0.0048, "step": 382250 }, { "epoch": 1.93, "learning_rate": 1.0717366846441417e-05, "loss": 0.0069, "step": 382260 }, { "epoch": 1.93, "learning_rate": 1.0709799153427407e-05, "loss": 0.0053, "step": 382270 }, { "epoch": 1.93, "learning_rate": 1.0702231460413397e-05, "loss": 0.0056, "step": 382280 }, { "epoch": 1.93, "learning_rate": 1.0694663767399385e-05, "loss": 0.0055, "step": 382290 }, { "epoch": 1.93, "learning_rate": 1.0687096074385375e-05, "loss": 0.0042, "step": 382300 }, { "epoch": 1.93, "learning_rate": 1.0679528381371365e-05, "loss": 0.0063, "step": 382310 }, { "epoch": 1.93, "learning_rate": 1.0671960688357355e-05, "loss": 0.0042, "step": 382320 }, { "epoch": 1.93, "learning_rate": 1.0664392995343345e-05, "loss": 0.0076, "step": 382330 }, { "epoch": 1.93, "learning_rate": 1.0656825302329335e-05, "loss": 0.006, "step": 382340 }, { "epoch": 1.93, "learning_rate": 1.0649257609315325e-05, "loss": 0.0054, "step": 382350 }, { "epoch": 1.93, "learning_rate": 1.0641689916301315e-05, "loss": 0.0044, "step": 382360 }, { "epoch": 1.93, "learning_rate": 1.0634122223287303e-05, "loss": 0.0074, "step": 382370 }, { "epoch": 1.93, "learning_rate": 1.0626554530273293e-05, "loss": 0.005, "step": 382380 }, { "epoch": 1.93, "learning_rate": 1.0618986837259283e-05, "loss": 0.0049, "step": 382390 }, { "epoch": 1.93, "learning_rate": 1.0611419144245273e-05, "loss": 0.0055, "step": 382400 }, { "epoch": 1.93, "learning_rate": 1.0603851451231262e-05, "loss": 0.0056, "step": 382410 }, { "epoch": 1.93, "learning_rate": 1.0596283758217252e-05, "loss": 0.0063, "step": 382420 }, { "epoch": 1.93, "learning_rate": 1.0588716065203242e-05, "loss": 0.0047, "step": 382430 }, { "epoch": 1.93, "learning_rate": 1.0581148372189232e-05, "loss": 0.0059, "step": 382440 }, { "epoch": 1.93, "learning_rate": 1.057358067917522e-05, "loss": 0.0059, "step": 382450 }, { "epoch": 1.93, "learning_rate": 1.056601298616121e-05, "loss": 0.0071, "step": 382460 }, { "epoch": 1.93, "learning_rate": 1.05584452931472e-05, "loss": 0.0071, "step": 382470 }, { "epoch": 1.93, "learning_rate": 1.055087760013319e-05, "loss": 0.0035, "step": 382480 }, { "epoch": 1.93, "learning_rate": 1.054330990711918e-05, "loss": 0.0061, "step": 382490 }, { "epoch": 1.93, "learning_rate": 1.053574221410517e-05, "loss": 0.0059, "step": 382500 }, { "epoch": 1.93, "learning_rate": 1.052817452109116e-05, "loss": 0.007, "step": 382510 }, { "epoch": 1.93, "learning_rate": 1.052060682807715e-05, "loss": 0.0069, "step": 382520 }, { "epoch": 1.93, "learning_rate": 1.0513039135063138e-05, "loss": 0.0043, "step": 382530 }, { "epoch": 1.93, "learning_rate": 1.0505471442049128e-05, "loss": 0.0041, "step": 382540 }, { "epoch": 1.93, "learning_rate": 1.0497903749035118e-05, "loss": 0.0048, "step": 382550 }, { "epoch": 1.93, "learning_rate": 1.0490336056021108e-05, "loss": 0.0055, "step": 382560 }, { "epoch": 1.93, "learning_rate": 1.0482768363007098e-05, "loss": 0.0065, "step": 382570 }, { "epoch": 1.93, "learning_rate": 1.0475200669993088e-05, "loss": 0.0079, "step": 382580 }, { "epoch": 1.93, "learning_rate": 1.0467632976979077e-05, "loss": 0.0053, "step": 382590 }, { "epoch": 1.93, "learning_rate": 1.0460065283965067e-05, "loss": 0.0044, "step": 382600 }, { "epoch": 1.93, "learning_rate": 1.0452497590951056e-05, "loss": 0.0052, "step": 382610 }, { "epoch": 1.93, "learning_rate": 1.0444929897937046e-05, "loss": 0.0059, "step": 382620 }, { "epoch": 1.93, "learning_rate": 1.0437362204923035e-05, "loss": 0.006, "step": 382630 }, { "epoch": 1.93, "learning_rate": 1.0429794511909025e-05, "loss": 0.0057, "step": 382640 }, { "epoch": 1.93, "learning_rate": 1.0422226818895015e-05, "loss": 0.0076, "step": 382650 }, { "epoch": 1.93, "learning_rate": 1.0414659125881005e-05, "loss": 0.0061, "step": 382660 }, { "epoch": 1.93, "learning_rate": 1.0407091432866995e-05, "loss": 0.006, "step": 382670 }, { "epoch": 1.93, "learning_rate": 1.0399523739852985e-05, "loss": 0.0087, "step": 382680 }, { "epoch": 1.93, "learning_rate": 1.0391956046838973e-05, "loss": 0.0045, "step": 382690 }, { "epoch": 1.93, "learning_rate": 1.0384388353824963e-05, "loss": 0.0098, "step": 382700 }, { "epoch": 1.93, "learning_rate": 1.0376820660810953e-05, "loss": 0.0071, "step": 382710 }, { "epoch": 1.93, "learning_rate": 1.0369252967796943e-05, "loss": 0.0084, "step": 382720 }, { "epoch": 1.93, "learning_rate": 1.0361685274782933e-05, "loss": 0.0049, "step": 382730 }, { "epoch": 1.93, "learning_rate": 1.0354117581768923e-05, "loss": 0.0049, "step": 382740 }, { "epoch": 1.93, "learning_rate": 1.0346549888754913e-05, "loss": 0.0058, "step": 382750 }, { "epoch": 1.93, "learning_rate": 1.0338982195740903e-05, "loss": 0.0052, "step": 382760 }, { "epoch": 1.93, "learning_rate": 1.033141450272689e-05, "loss": 0.0062, "step": 382770 }, { "epoch": 1.93, "learning_rate": 1.032384680971288e-05, "loss": 0.0063, "step": 382780 }, { "epoch": 1.93, "learning_rate": 1.031627911669887e-05, "loss": 0.0053, "step": 382790 }, { "epoch": 1.93, "learning_rate": 1.030871142368486e-05, "loss": 0.0045, "step": 382800 }, { "epoch": 1.93, "learning_rate": 1.030114373067085e-05, "loss": 0.0066, "step": 382810 }, { "epoch": 1.93, "learning_rate": 1.029357603765684e-05, "loss": 0.0041, "step": 382820 }, { "epoch": 1.93, "learning_rate": 1.028600834464283e-05, "loss": 0.0052, "step": 382830 }, { "epoch": 1.93, "learning_rate": 1.0278440651628819e-05, "loss": 0.0047, "step": 382840 }, { "epoch": 1.93, "learning_rate": 1.0270872958614808e-05, "loss": 0.0066, "step": 382850 }, { "epoch": 1.93, "learning_rate": 1.0263305265600798e-05, "loss": 0.0048, "step": 382860 }, { "epoch": 1.93, "learning_rate": 1.0255737572586788e-05, "loss": 0.0049, "step": 382870 }, { "epoch": 1.93, "learning_rate": 1.0248169879572778e-05, "loss": 0.0068, "step": 382880 }, { "epoch": 1.93, "learning_rate": 1.0240602186558768e-05, "loss": 0.0076, "step": 382890 }, { "epoch": 1.93, "learning_rate": 1.0233034493544758e-05, "loss": 0.0071, "step": 382900 }, { "epoch": 1.93, "learning_rate": 1.0225466800530748e-05, "loss": 0.0076, "step": 382910 }, { "epoch": 1.93, "learning_rate": 1.0217899107516736e-05, "loss": 0.0052, "step": 382920 }, { "epoch": 1.93, "learning_rate": 1.0210331414502726e-05, "loss": 0.0052, "step": 382930 }, { "epoch": 1.93, "learning_rate": 1.0202763721488716e-05, "loss": 0.0068, "step": 382940 }, { "epoch": 1.93, "learning_rate": 1.0195196028474706e-05, "loss": 0.0077, "step": 382950 }, { "epoch": 1.93, "learning_rate": 1.0187628335460696e-05, "loss": 0.0064, "step": 382960 }, { "epoch": 1.93, "learning_rate": 1.0180060642446686e-05, "loss": 0.0052, "step": 382970 }, { "epoch": 1.93, "learning_rate": 1.0172492949432676e-05, "loss": 0.0055, "step": 382980 }, { "epoch": 1.93, "learning_rate": 1.0164925256418666e-05, "loss": 0.006, "step": 382990 }, { "epoch": 1.93, "learning_rate": 1.0157357563404652e-05, "loss": 0.0059, "step": 383000 }, { "epoch": 1.93, "eval_cer": 0.9144265880775191, "eval_loss": 0.004191742278635502, "eval_runtime": 116.3481, "eval_samples_per_second": 17.19, "eval_steps_per_second": 4.297, "step": 383000 }, { "epoch": 1.93, "learning_rate": 1.0149789870390642e-05, "loss": 0.0063, "step": 383010 }, { "epoch": 1.93, "learning_rate": 1.0142222177376632e-05, "loss": 0.0046, "step": 383020 }, { "epoch": 1.93, "learning_rate": 1.0134654484362622e-05, "loss": 0.0064, "step": 383030 }, { "epoch": 1.93, "learning_rate": 1.0127086791348613e-05, "loss": 0.0064, "step": 383040 }, { "epoch": 1.93, "learning_rate": 1.0119519098334603e-05, "loss": 0.0057, "step": 383050 }, { "epoch": 1.93, "learning_rate": 1.0111951405320593e-05, "loss": 0.0048, "step": 383060 }, { "epoch": 1.93, "learning_rate": 1.0104383712306583e-05, "loss": 0.0055, "step": 383070 }, { "epoch": 1.93, "learning_rate": 1.009681601929257e-05, "loss": 0.0067, "step": 383080 }, { "epoch": 1.93, "learning_rate": 1.008924832627856e-05, "loss": 0.0062, "step": 383090 }, { "epoch": 1.93, "learning_rate": 1.008168063326455e-05, "loss": 0.0055, "step": 383100 }, { "epoch": 1.93, "learning_rate": 1.007411294025054e-05, "loss": 0.0048, "step": 383110 }, { "epoch": 1.93, "learning_rate": 1.006654524723653e-05, "loss": 0.0047, "step": 383120 }, { "epoch": 1.93, "learning_rate": 1.005897755422252e-05, "loss": 0.0055, "step": 383130 }, { "epoch": 1.93, "learning_rate": 1.0051409861208509e-05, "loss": 0.0057, "step": 383140 }, { "epoch": 1.93, "learning_rate": 1.0043842168194499e-05, "loss": 0.0059, "step": 383150 }, { "epoch": 1.93, "learning_rate": 1.0036274475180487e-05, "loss": 0.005, "step": 383160 }, { "epoch": 1.93, "learning_rate": 1.0028706782166477e-05, "loss": 0.0043, "step": 383170 }, { "epoch": 1.93, "learning_rate": 1.0021139089152467e-05, "loss": 0.0054, "step": 383180 }, { "epoch": 1.93, "learning_rate": 1.0013571396138457e-05, "loss": 0.0057, "step": 383190 }, { "epoch": 1.93, "learning_rate": 1.0006003703124447e-05, "loss": 0.0063, "step": 383200 }, { "epoch": 1.93, "learning_rate": 9.998436010110437e-06, "loss": 0.0059, "step": 383210 }, { "epoch": 1.93, "learning_rate": 9.990868317096427e-06, "loss": 0.0083, "step": 383220 }, { "epoch": 1.93, "learning_rate": 9.983300624082417e-06, "loss": 0.004, "step": 383230 }, { "epoch": 1.93, "learning_rate": 9.975732931068405e-06, "loss": 0.0071, "step": 383240 }, { "epoch": 1.93, "learning_rate": 9.968165238054395e-06, "loss": 0.0043, "step": 383250 }, { "epoch": 1.93, "learning_rate": 9.960597545040385e-06, "loss": 0.0045, "step": 383260 }, { "epoch": 1.93, "learning_rate": 9.953029852026375e-06, "loss": 0.0071, "step": 383270 }, { "epoch": 1.93, "learning_rate": 9.945462159012365e-06, "loss": 0.0075, "step": 383280 }, { "epoch": 1.93, "learning_rate": 9.937894465998354e-06, "loss": 0.0059, "step": 383290 }, { "epoch": 1.93, "learning_rate": 9.930326772984344e-06, "loss": 0.0062, "step": 383300 }, { "epoch": 1.93, "learning_rate": 9.922759079970334e-06, "loss": 0.0057, "step": 383310 }, { "epoch": 1.93, "learning_rate": 9.915191386956322e-06, "loss": 0.0051, "step": 383320 }, { "epoch": 1.93, "learning_rate": 9.907623693942312e-06, "loss": 0.0055, "step": 383330 }, { "epoch": 1.93, "learning_rate": 9.900056000928302e-06, "loss": 0.0058, "step": 383340 }, { "epoch": 1.93, "learning_rate": 9.892488307914292e-06, "loss": 0.0051, "step": 383350 }, { "epoch": 1.93, "learning_rate": 9.884920614900282e-06, "loss": 0.0057, "step": 383360 }, { "epoch": 1.93, "learning_rate": 9.877352921886272e-06, "loss": 0.0066, "step": 383370 }, { "epoch": 1.93, "learning_rate": 9.869785228872262e-06, "loss": 0.0049, "step": 383380 }, { "epoch": 1.93, "learning_rate": 9.86221753585825e-06, "loss": 0.0061, "step": 383390 }, { "epoch": 1.93, "learning_rate": 9.85464984284424e-06, "loss": 0.0039, "step": 383400 }, { "epoch": 1.93, "learning_rate": 9.84708214983023e-06, "loss": 0.0051, "step": 383410 }, { "epoch": 1.93, "learning_rate": 9.83951445681622e-06, "loss": 0.0043, "step": 383420 }, { "epoch": 1.93, "learning_rate": 9.83194676380221e-06, "loss": 0.0051, "step": 383430 }, { "epoch": 1.93, "learning_rate": 9.8243790707882e-06, "loss": 0.004, "step": 383440 }, { "epoch": 1.93, "learning_rate": 9.81681137777419e-06, "loss": 0.0047, "step": 383450 }, { "epoch": 1.93, "learning_rate": 9.80924368476018e-06, "loss": 0.0041, "step": 383460 }, { "epoch": 1.93, "learning_rate": 9.801675991746168e-06, "loss": 0.005, "step": 383470 }, { "epoch": 1.93, "learning_rate": 9.794108298732158e-06, "loss": 0.0055, "step": 383480 }, { "epoch": 1.93, "learning_rate": 9.786540605718148e-06, "loss": 0.0049, "step": 383490 }, { "epoch": 1.93, "learning_rate": 9.778972912704138e-06, "loss": 0.0054, "step": 383500 }, { "epoch": 1.93, "learning_rate": 9.771405219690127e-06, "loss": 0.0079, "step": 383510 }, { "epoch": 1.93, "learning_rate": 9.763837526676117e-06, "loss": 0.0044, "step": 383520 }, { "epoch": 1.93, "learning_rate": 9.756269833662107e-06, "loss": 0.0052, "step": 383530 }, { "epoch": 1.94, "learning_rate": 9.748702140648097e-06, "loss": 0.0059, "step": 383540 }, { "epoch": 1.94, "learning_rate": 9.741134447634085e-06, "loss": 0.006, "step": 383550 }, { "epoch": 1.94, "learning_rate": 9.733566754620075e-06, "loss": 0.0043, "step": 383560 }, { "epoch": 1.94, "learning_rate": 9.725999061606065e-06, "loss": 0.0065, "step": 383570 }, { "epoch": 1.94, "learning_rate": 9.718431368592055e-06, "loss": 0.005, "step": 383580 }, { "epoch": 1.94, "learning_rate": 9.710863675578045e-06, "loss": 0.0067, "step": 383590 }, { "epoch": 1.94, "learning_rate": 9.703295982564035e-06, "loss": 0.0065, "step": 383600 }, { "epoch": 1.94, "learning_rate": 9.695728289550025e-06, "loss": 0.0047, "step": 383610 }, { "epoch": 1.94, "learning_rate": 9.688160596536015e-06, "loss": 0.0043, "step": 383620 }, { "epoch": 1.94, "learning_rate": 9.680592903522003e-06, "loss": 0.005, "step": 383630 }, { "epoch": 1.94, "learning_rate": 9.673025210507993e-06, "loss": 0.0059, "step": 383640 }, { "epoch": 1.94, "learning_rate": 9.665457517493983e-06, "loss": 0.0063, "step": 383650 }, { "epoch": 1.94, "learning_rate": 9.657889824479973e-06, "loss": 0.006, "step": 383660 }, { "epoch": 1.94, "learning_rate": 9.650322131465963e-06, "loss": 0.0053, "step": 383670 }, { "epoch": 1.94, "learning_rate": 9.642754438451953e-06, "loss": 0.0049, "step": 383680 }, { "epoch": 1.94, "learning_rate": 9.635186745437942e-06, "loss": 0.0068, "step": 383690 }, { "epoch": 1.94, "learning_rate": 9.627619052423932e-06, "loss": 0.0036, "step": 383700 }, { "epoch": 1.94, "learning_rate": 9.62005135940992e-06, "loss": 0.0044, "step": 383710 }, { "epoch": 1.94, "learning_rate": 9.61248366639591e-06, "loss": 0.0053, "step": 383720 }, { "epoch": 1.94, "learning_rate": 9.6049159733819e-06, "loss": 0.0055, "step": 383730 }, { "epoch": 1.94, "learning_rate": 9.59734828036789e-06, "loss": 0.0056, "step": 383740 }, { "epoch": 1.94, "learning_rate": 9.58978058735388e-06, "loss": 0.0042, "step": 383750 }, { "epoch": 1.94, "learning_rate": 9.58221289433987e-06, "loss": 0.0057, "step": 383760 }, { "epoch": 1.94, "learning_rate": 9.57464520132586e-06, "loss": 0.0045, "step": 383770 }, { "epoch": 1.94, "learning_rate": 9.56707750831185e-06, "loss": 0.0056, "step": 383780 }, { "epoch": 1.94, "learning_rate": 9.559509815297838e-06, "loss": 0.0051, "step": 383790 }, { "epoch": 1.94, "learning_rate": 9.551942122283828e-06, "loss": 0.006, "step": 383800 }, { "epoch": 1.94, "learning_rate": 9.544374429269818e-06, "loss": 0.0075, "step": 383810 }, { "epoch": 1.94, "learning_rate": 9.536806736255808e-06, "loss": 0.0054, "step": 383820 }, { "epoch": 1.94, "learning_rate": 9.529239043241798e-06, "loss": 0.0052, "step": 383830 }, { "epoch": 1.94, "learning_rate": 9.521671350227788e-06, "loss": 0.0061, "step": 383840 }, { "epoch": 1.94, "learning_rate": 9.514103657213778e-06, "loss": 0.0046, "step": 383850 }, { "epoch": 1.94, "learning_rate": 9.506535964199768e-06, "loss": 0.0058, "step": 383860 }, { "epoch": 1.94, "learning_rate": 9.498968271185754e-06, "loss": 0.0048, "step": 383870 }, { "epoch": 1.94, "learning_rate": 9.491400578171746e-06, "loss": 0.0042, "step": 383880 }, { "epoch": 1.94, "learning_rate": 9.483832885157736e-06, "loss": 0.0055, "step": 383890 }, { "epoch": 1.94, "learning_rate": 9.476265192143726e-06, "loss": 0.0061, "step": 383900 }, { "epoch": 1.94, "learning_rate": 9.468697499129715e-06, "loss": 0.009, "step": 383910 }, { "epoch": 1.94, "learning_rate": 9.461129806115705e-06, "loss": 0.0062, "step": 383920 }, { "epoch": 1.94, "learning_rate": 9.453562113101695e-06, "loss": 0.005, "step": 383930 }, { "epoch": 1.94, "learning_rate": 9.445994420087682e-06, "loss": 0.0058, "step": 383940 }, { "epoch": 1.94, "learning_rate": 9.438426727073672e-06, "loss": 0.0078, "step": 383950 }, { "epoch": 1.94, "learning_rate": 9.430859034059662e-06, "loss": 0.0058, "step": 383960 }, { "epoch": 1.94, "learning_rate": 9.423291341045652e-06, "loss": 0.0057, "step": 383970 }, { "epoch": 1.94, "learning_rate": 9.415723648031641e-06, "loss": 0.0046, "step": 383980 }, { "epoch": 1.94, "learning_rate": 9.408155955017631e-06, "loss": 0.0062, "step": 383990 }, { "epoch": 1.94, "learning_rate": 9.400588262003621e-06, "loss": 0.0047, "step": 384000 }, { "epoch": 1.94, "eval_cer": 0.9144159137201398, "eval_loss": 0.004220431204885244, "eval_runtime": 116.4383, "eval_samples_per_second": 17.176, "eval_steps_per_second": 4.294, "step": 384000 }, { "epoch": 1.94, "learning_rate": 9.393020568989613e-06, "loss": 0.0066, "step": 384010 }, { "epoch": 1.94, "learning_rate": 9.3854528759756e-06, "loss": 0.0059, "step": 384020 }, { "epoch": 1.94, "learning_rate": 9.37788518296159e-06, "loss": 0.0034, "step": 384030 }, { "epoch": 1.94, "learning_rate": 9.37031748994758e-06, "loss": 0.0055, "step": 384040 }, { "epoch": 1.94, "learning_rate": 9.36274979693357e-06, "loss": 0.0049, "step": 384050 }, { "epoch": 1.94, "learning_rate": 9.355182103919559e-06, "loss": 0.0035, "step": 384060 }, { "epoch": 1.94, "learning_rate": 9.347614410905549e-06, "loss": 0.0055, "step": 384070 }, { "epoch": 1.94, "learning_rate": 9.340046717891539e-06, "loss": 0.0041, "step": 384080 }, { "epoch": 1.94, "learning_rate": 9.332479024877529e-06, "loss": 0.005, "step": 384090 }, { "epoch": 1.94, "learning_rate": 9.324911331863519e-06, "loss": 0.0058, "step": 384100 }, { "epoch": 1.94, "learning_rate": 9.317343638849509e-06, "loss": 0.0052, "step": 384110 }, { "epoch": 1.94, "learning_rate": 9.309775945835497e-06, "loss": 0.0056, "step": 384120 }, { "epoch": 1.94, "learning_rate": 9.302208252821487e-06, "loss": 0.0062, "step": 384130 }, { "epoch": 1.94, "learning_rate": 9.294640559807477e-06, "loss": 0.0073, "step": 384140 }, { "epoch": 1.94, "learning_rate": 9.287072866793467e-06, "loss": 0.0071, "step": 384150 }, { "epoch": 1.94, "learning_rate": 9.279505173779457e-06, "loss": 0.0048, "step": 384160 }, { "epoch": 1.94, "learning_rate": 9.271937480765446e-06, "loss": 0.0054, "step": 384170 }, { "epoch": 1.94, "learning_rate": 9.264369787751436e-06, "loss": 0.007, "step": 384180 }, { "epoch": 1.94, "learning_rate": 9.256802094737426e-06, "loss": 0.0053, "step": 384190 }, { "epoch": 1.94, "learning_rate": 9.249234401723414e-06, "loss": 0.0051, "step": 384200 }, { "epoch": 1.94, "learning_rate": 9.241666708709404e-06, "loss": 0.0057, "step": 384210 }, { "epoch": 1.94, "learning_rate": 9.234099015695394e-06, "loss": 0.0054, "step": 384220 }, { "epoch": 1.94, "learning_rate": 9.226531322681384e-06, "loss": 0.0039, "step": 384230 }, { "epoch": 1.94, "learning_rate": 9.218963629667374e-06, "loss": 0.0054, "step": 384240 }, { "epoch": 1.94, "learning_rate": 9.211395936653364e-06, "loss": 0.0042, "step": 384250 }, { "epoch": 1.94, "learning_rate": 9.203828243639354e-06, "loss": 0.0073, "step": 384260 }, { "epoch": 1.94, "learning_rate": 9.196260550625344e-06, "loss": 0.0076, "step": 384270 }, { "epoch": 1.94, "learning_rate": 9.188692857611332e-06, "loss": 0.0051, "step": 384280 }, { "epoch": 1.94, "learning_rate": 9.181125164597322e-06, "loss": 0.0066, "step": 384290 }, { "epoch": 1.94, "learning_rate": 9.173557471583312e-06, "loss": 0.0052, "step": 384300 }, { "epoch": 1.94, "learning_rate": 9.165989778569302e-06, "loss": 0.004, "step": 384310 }, { "epoch": 1.94, "learning_rate": 9.158422085555292e-06, "loss": 0.0066, "step": 384320 }, { "epoch": 1.94, "learning_rate": 9.150854392541282e-06, "loss": 0.0052, "step": 384330 }, { "epoch": 1.94, "learning_rate": 9.143286699527272e-06, "loss": 0.0047, "step": 384340 }, { "epoch": 1.94, "learning_rate": 9.135719006513261e-06, "loss": 0.006, "step": 384350 }, { "epoch": 1.94, "learning_rate": 9.12815131349925e-06, "loss": 0.0048, "step": 384360 }, { "epoch": 1.94, "learning_rate": 9.12058362048524e-06, "loss": 0.006, "step": 384370 }, { "epoch": 1.94, "learning_rate": 9.11301592747123e-06, "loss": 0.0055, "step": 384380 }, { "epoch": 1.94, "learning_rate": 9.10544823445722e-06, "loss": 0.0052, "step": 384390 }, { "epoch": 1.94, "learning_rate": 9.097880541443208e-06, "loss": 0.0067, "step": 384400 }, { "epoch": 1.94, "learning_rate": 9.090312848429198e-06, "loss": 0.004, "step": 384410 }, { "epoch": 1.94, "learning_rate": 9.082745155415187e-06, "loss": 0.0062, "step": 384420 }, { "epoch": 1.94, "learning_rate": 9.075177462401179e-06, "loss": 0.0058, "step": 384430 }, { "epoch": 1.94, "learning_rate": 9.067609769387167e-06, "loss": 0.0055, "step": 384440 }, { "epoch": 1.94, "learning_rate": 9.060042076373157e-06, "loss": 0.0067, "step": 384450 }, { "epoch": 1.94, "learning_rate": 9.052474383359147e-06, "loss": 0.0056, "step": 384460 }, { "epoch": 1.94, "learning_rate": 9.044906690345135e-06, "loss": 0.0041, "step": 384470 }, { "epoch": 1.94, "learning_rate": 9.037338997331125e-06, "loss": 0.0043, "step": 384480 }, { "epoch": 1.94, "learning_rate": 9.029771304317115e-06, "loss": 0.0047, "step": 384490 }, { "epoch": 1.94, "learning_rate": 9.022203611303105e-06, "loss": 0.0062, "step": 384500 }, { "epoch": 1.94, "learning_rate": 9.014635918289095e-06, "loss": 0.0053, "step": 384510 }, { "epoch": 1.94, "learning_rate": 9.007068225275085e-06, "loss": 0.0064, "step": 384520 }, { "epoch": 1.94, "learning_rate": 8.999500532261075e-06, "loss": 0.0056, "step": 384530 }, { "epoch": 1.94, "learning_rate": 8.991932839247065e-06, "loss": 0.0057, "step": 384540 }, { "epoch": 1.94, "learning_rate": 8.984365146233053e-06, "loss": 0.0083, "step": 384550 }, { "epoch": 1.94, "learning_rate": 8.976797453219043e-06, "loss": 0.0074, "step": 384560 }, { "epoch": 1.94, "learning_rate": 8.969229760205033e-06, "loss": 0.004, "step": 384570 }, { "epoch": 1.94, "learning_rate": 8.961662067191023e-06, "loss": 0.0054, "step": 384580 }, { "epoch": 1.94, "learning_rate": 8.954094374177013e-06, "loss": 0.0074, "step": 384590 }, { "epoch": 1.94, "learning_rate": 8.946526681163003e-06, "loss": 0.0044, "step": 384600 }, { "epoch": 1.94, "learning_rate": 8.938958988148992e-06, "loss": 0.0072, "step": 384610 }, { "epoch": 1.94, "learning_rate": 8.931391295134982e-06, "loss": 0.0057, "step": 384620 }, { "epoch": 1.94, "learning_rate": 8.92382360212097e-06, "loss": 0.0056, "step": 384630 }, { "epoch": 1.94, "learning_rate": 8.91625590910696e-06, "loss": 0.0046, "step": 384640 }, { "epoch": 1.94, "learning_rate": 8.90868821609295e-06, "loss": 0.0042, "step": 384650 }, { "epoch": 1.94, "learning_rate": 8.90112052307894e-06, "loss": 0.0053, "step": 384660 }, { "epoch": 1.94, "learning_rate": 8.89355283006493e-06, "loss": 0.0053, "step": 384670 }, { "epoch": 1.94, "learning_rate": 8.88598513705092e-06, "loss": 0.0058, "step": 384680 }, { "epoch": 1.94, "learning_rate": 8.87841744403691e-06, "loss": 0.0053, "step": 384690 }, { "epoch": 1.94, "learning_rate": 8.8708497510229e-06, "loss": 0.0072, "step": 384700 }, { "epoch": 1.94, "learning_rate": 8.863282058008888e-06, "loss": 0.0055, "step": 384710 }, { "epoch": 1.94, "learning_rate": 8.855714364994878e-06, "loss": 0.0063, "step": 384720 }, { "epoch": 1.94, "learning_rate": 8.848146671980868e-06, "loss": 0.0064, "step": 384730 }, { "epoch": 1.94, "learning_rate": 8.840578978966858e-06, "loss": 0.0066, "step": 384740 }, { "epoch": 1.94, "learning_rate": 8.833011285952848e-06, "loss": 0.0059, "step": 384750 }, { "epoch": 1.94, "learning_rate": 8.825443592938838e-06, "loss": 0.0049, "step": 384760 }, { "epoch": 1.94, "learning_rate": 8.817875899924828e-06, "loss": 0.007, "step": 384770 }, { "epoch": 1.94, "learning_rate": 8.810308206910818e-06, "loss": 0.0046, "step": 384780 }, { "epoch": 1.94, "learning_rate": 8.802740513896806e-06, "loss": 0.0057, "step": 384790 }, { "epoch": 1.94, "learning_rate": 8.795172820882796e-06, "loss": 0.0062, "step": 384800 }, { "epoch": 1.94, "learning_rate": 8.787605127868786e-06, "loss": 0.0076, "step": 384810 }, { "epoch": 1.94, "learning_rate": 8.780037434854776e-06, "loss": 0.0067, "step": 384820 }, { "epoch": 1.94, "learning_rate": 8.772469741840764e-06, "loss": 0.0071, "step": 384830 }, { "epoch": 1.94, "learning_rate": 8.764902048826754e-06, "loss": 0.0048, "step": 384840 }, { "epoch": 1.94, "learning_rate": 8.757334355812745e-06, "loss": 0.0088, "step": 384850 }, { "epoch": 1.94, "learning_rate": 8.749766662798735e-06, "loss": 0.0055, "step": 384860 }, { "epoch": 1.94, "learning_rate": 8.742198969784723e-06, "loss": 0.0062, "step": 384870 }, { "epoch": 1.94, "learning_rate": 8.734631276770713e-06, "loss": 0.0078, "step": 384880 }, { "epoch": 1.94, "learning_rate": 8.727063583756703e-06, "loss": 0.0059, "step": 384890 }, { "epoch": 1.94, "learning_rate": 8.719495890742693e-06, "loss": 0.0042, "step": 384900 }, { "epoch": 1.94, "learning_rate": 8.711928197728681e-06, "loss": 0.0059, "step": 384910 }, { "epoch": 1.94, "learning_rate": 8.704360504714671e-06, "loss": 0.0047, "step": 384920 }, { "epoch": 1.94, "learning_rate": 8.696792811700661e-06, "loss": 0.0088, "step": 384930 }, { "epoch": 1.94, "learning_rate": 8.689225118686651e-06, "loss": 0.0042, "step": 384940 }, { "epoch": 1.94, "learning_rate": 8.681657425672641e-06, "loss": 0.0049, "step": 384950 }, { "epoch": 1.94, "learning_rate": 8.674089732658631e-06, "loss": 0.007, "step": 384960 }, { "epoch": 1.94, "learning_rate": 8.66652203964462e-06, "loss": 0.0054, "step": 384970 }, { "epoch": 1.94, "learning_rate": 8.65895434663061e-06, "loss": 0.0049, "step": 384980 }, { "epoch": 1.94, "learning_rate": 8.651386653616599e-06, "loss": 0.0048, "step": 384990 }, { "epoch": 1.94, "learning_rate": 8.643818960602589e-06, "loss": 0.0064, "step": 385000 }, { "epoch": 1.94, "eval_cer": 0.914423676889143, "eval_loss": 0.0041769566014409065, "eval_runtime": 116.103, "eval_samples_per_second": 17.226, "eval_steps_per_second": 4.307, "step": 385000 }, { "epoch": 1.94, "learning_rate": 8.636251267588579e-06, "loss": 0.0061, "step": 385010 }, { "epoch": 1.94, "learning_rate": 8.628683574574569e-06, "loss": 0.0048, "step": 385020 }, { "epoch": 1.94, "learning_rate": 8.621115881560559e-06, "loss": 0.0053, "step": 385030 }, { "epoch": 1.94, "learning_rate": 8.613548188546549e-06, "loss": 0.0046, "step": 385040 }, { "epoch": 1.94, "learning_rate": 8.605980495532538e-06, "loss": 0.0047, "step": 385050 }, { "epoch": 1.94, "learning_rate": 8.598412802518527e-06, "loss": 0.0063, "step": 385060 }, { "epoch": 1.94, "learning_rate": 8.590845109504517e-06, "loss": 0.0051, "step": 385070 }, { "epoch": 1.94, "learning_rate": 8.583277416490506e-06, "loss": 0.0051, "step": 385080 }, { "epoch": 1.94, "learning_rate": 8.575709723476496e-06, "loss": 0.0059, "step": 385090 }, { "epoch": 1.94, "learning_rate": 8.568142030462486e-06, "loss": 0.005, "step": 385100 }, { "epoch": 1.94, "learning_rate": 8.560574337448476e-06, "loss": 0.0055, "step": 385110 }, { "epoch": 1.94, "learning_rate": 8.553006644434466e-06, "loss": 0.0067, "step": 385120 }, { "epoch": 1.94, "learning_rate": 8.545438951420456e-06, "loss": 0.005, "step": 385130 }, { "epoch": 1.94, "learning_rate": 8.537871258406444e-06, "loss": 0.0048, "step": 385140 }, { "epoch": 1.94, "learning_rate": 8.530303565392434e-06, "loss": 0.0049, "step": 385150 }, { "epoch": 1.94, "learning_rate": 8.522735872378424e-06, "loss": 0.0049, "step": 385160 }, { "epoch": 1.94, "learning_rate": 8.515168179364414e-06, "loss": 0.0073, "step": 385170 }, { "epoch": 1.94, "learning_rate": 8.507600486350404e-06, "loss": 0.0051, "step": 385180 }, { "epoch": 1.94, "learning_rate": 8.500032793336394e-06, "loss": 0.0057, "step": 385190 }, { "epoch": 1.94, "learning_rate": 8.492465100322384e-06, "loss": 0.0069, "step": 385200 }, { "epoch": 1.94, "learning_rate": 8.484897407308374e-06, "loss": 0.0054, "step": 385210 }, { "epoch": 1.94, "learning_rate": 8.477329714294362e-06, "loss": 0.007, "step": 385220 }, { "epoch": 1.94, "learning_rate": 8.469762021280352e-06, "loss": 0.0066, "step": 385230 }, { "epoch": 1.94, "learning_rate": 8.462194328266342e-06, "loss": 0.0054, "step": 385240 }, { "epoch": 1.94, "learning_rate": 8.454626635252332e-06, "loss": 0.0066, "step": 385250 }, { "epoch": 1.94, "learning_rate": 8.44705894223832e-06, "loss": 0.0072, "step": 385260 }, { "epoch": 1.94, "learning_rate": 8.439491249224311e-06, "loss": 0.0062, "step": 385270 }, { "epoch": 1.94, "learning_rate": 8.431923556210301e-06, "loss": 0.0062, "step": 385280 }, { "epoch": 1.94, "learning_rate": 8.424355863196291e-06, "loss": 0.0041, "step": 385290 }, { "epoch": 1.94, "learning_rate": 8.41678817018228e-06, "loss": 0.0063, "step": 385300 }, { "epoch": 1.94, "learning_rate": 8.40922047716827e-06, "loss": 0.0042, "step": 385310 }, { "epoch": 1.94, "learning_rate": 8.40165278415426e-06, "loss": 0.0039, "step": 385320 }, { "epoch": 1.94, "learning_rate": 8.39408509114025e-06, "loss": 0.0041, "step": 385330 }, { "epoch": 1.94, "learning_rate": 8.386517398126237e-06, "loss": 0.0061, "step": 385340 }, { "epoch": 1.94, "learning_rate": 8.378949705112227e-06, "loss": 0.0078, "step": 385350 }, { "epoch": 1.94, "learning_rate": 8.371382012098217e-06, "loss": 0.0052, "step": 385360 }, { "epoch": 1.94, "learning_rate": 8.363814319084207e-06, "loss": 0.0114, "step": 385370 }, { "epoch": 1.94, "learning_rate": 8.356246626070197e-06, "loss": 0.0044, "step": 385380 }, { "epoch": 1.94, "learning_rate": 8.348678933056187e-06, "loss": 0.0052, "step": 385390 }, { "epoch": 1.94, "learning_rate": 8.341111240042177e-06, "loss": 0.0046, "step": 385400 }, { "epoch": 1.94, "learning_rate": 8.333543547028167e-06, "loss": 0.0042, "step": 385410 }, { "epoch": 1.94, "learning_rate": 8.325975854014155e-06, "loss": 0.0053, "step": 385420 }, { "epoch": 1.94, "learning_rate": 8.318408161000145e-06, "loss": 0.0042, "step": 385430 }, { "epoch": 1.94, "learning_rate": 8.310840467986135e-06, "loss": 0.0059, "step": 385440 }, { "epoch": 1.94, "learning_rate": 8.303272774972125e-06, "loss": 0.0039, "step": 385450 }, { "epoch": 1.94, "learning_rate": 8.295705081958115e-06, "loss": 0.0059, "step": 385460 }, { "epoch": 1.94, "learning_rate": 8.288137388944105e-06, "loss": 0.0046, "step": 385470 }, { "epoch": 1.94, "learning_rate": 8.280569695930095e-06, "loss": 0.0064, "step": 385480 }, { "epoch": 1.94, "learning_rate": 8.273002002916084e-06, "loss": 0.0048, "step": 385490 }, { "epoch": 1.94, "learning_rate": 8.265434309902073e-06, "loss": 0.0052, "step": 385500 }, { "epoch": 1.94, "learning_rate": 8.257866616888063e-06, "loss": 0.0079, "step": 385510 }, { "epoch": 1.94, "learning_rate": 8.250298923874052e-06, "loss": 0.0059, "step": 385520 }, { "epoch": 1.95, "learning_rate": 8.242731230860042e-06, "loss": 0.0047, "step": 385530 }, { "epoch": 1.95, "learning_rate": 8.235163537846032e-06, "loss": 0.0067, "step": 385540 }, { "epoch": 1.95, "learning_rate": 8.227595844832022e-06, "loss": 0.0055, "step": 385550 }, { "epoch": 1.95, "learning_rate": 8.220028151818012e-06, "loss": 0.0094, "step": 385560 }, { "epoch": 1.95, "learning_rate": 8.212460458804e-06, "loss": 0.0041, "step": 385570 }, { "epoch": 1.95, "learning_rate": 8.20489276578999e-06, "loss": 0.006, "step": 385580 }, { "epoch": 1.95, "learning_rate": 8.19732507277598e-06, "loss": 0.0053, "step": 385590 }, { "epoch": 1.95, "learning_rate": 8.18975737976197e-06, "loss": 0.0062, "step": 385600 }, { "epoch": 1.95, "learning_rate": 8.18218968674796e-06, "loss": 0.0064, "step": 385610 }, { "epoch": 1.95, "learning_rate": 8.17462199373395e-06, "loss": 0.0062, "step": 385620 }, { "epoch": 1.95, "learning_rate": 8.16705430071994e-06, "loss": 0.0054, "step": 385630 }, { "epoch": 1.95, "learning_rate": 8.15948660770593e-06, "loss": 0.0053, "step": 385640 }, { "epoch": 1.95, "learning_rate": 8.151918914691918e-06, "loss": 0.0042, "step": 385650 }, { "epoch": 1.95, "learning_rate": 8.144351221677908e-06, "loss": 0.0062, "step": 385660 }, { "epoch": 1.95, "learning_rate": 8.136783528663898e-06, "loss": 0.0057, "step": 385670 }, { "epoch": 1.95, "learning_rate": 8.129215835649888e-06, "loss": 0.0061, "step": 385680 }, { "epoch": 1.95, "learning_rate": 8.121648142635878e-06, "loss": 0.0056, "step": 385690 }, { "epoch": 1.95, "learning_rate": 8.114080449621868e-06, "loss": 0.0077, "step": 385700 }, { "epoch": 1.95, "learning_rate": 8.106512756607857e-06, "loss": 0.0064, "step": 385710 }, { "epoch": 1.95, "learning_rate": 8.098945063593847e-06, "loss": 0.0086, "step": 385720 }, { "epoch": 1.95, "learning_rate": 8.091377370579836e-06, "loss": 0.0047, "step": 385730 }, { "epoch": 1.95, "learning_rate": 8.083809677565825e-06, "loss": 0.0047, "step": 385740 }, { "epoch": 1.95, "learning_rate": 8.076241984551815e-06, "loss": 0.005, "step": 385750 }, { "epoch": 1.95, "learning_rate": 8.068674291537805e-06, "loss": 0.0047, "step": 385760 }, { "epoch": 1.95, "learning_rate": 8.061106598523794e-06, "loss": 0.0064, "step": 385770 }, { "epoch": 1.95, "learning_rate": 8.053538905509783e-06, "loss": 0.0057, "step": 385780 }, { "epoch": 1.95, "learning_rate": 8.045971212495773e-06, "loss": 0.0045, "step": 385790 }, { "epoch": 1.95, "learning_rate": 8.038403519481763e-06, "loss": 0.0048, "step": 385800 }, { "epoch": 1.95, "learning_rate": 8.030835826467753e-06, "loss": 0.0065, "step": 385810 }, { "epoch": 1.95, "learning_rate": 8.023268133453743e-06, "loss": 0.0064, "step": 385820 }, { "epoch": 1.95, "learning_rate": 8.015700440439733e-06, "loss": 0.0065, "step": 385830 }, { "epoch": 1.95, "learning_rate": 8.008132747425723e-06, "loss": 0.0061, "step": 385840 }, { "epoch": 1.95, "learning_rate": 8.000565054411711e-06, "loss": 0.0058, "step": 385850 }, { "epoch": 1.95, "learning_rate": 7.992997361397701e-06, "loss": 0.0066, "step": 385860 }, { "epoch": 1.95, "learning_rate": 7.985429668383691e-06, "loss": 0.0061, "step": 385870 }, { "epoch": 1.95, "learning_rate": 7.977861975369681e-06, "loss": 0.0045, "step": 385880 }, { "epoch": 1.95, "learning_rate": 7.97029428235567e-06, "loss": 0.0059, "step": 385890 }, { "epoch": 1.95, "learning_rate": 7.96272658934166e-06, "loss": 0.0068, "step": 385900 }, { "epoch": 1.95, "learning_rate": 7.95515889632765e-06, "loss": 0.006, "step": 385910 }, { "epoch": 1.95, "learning_rate": 7.94759120331364e-06, "loss": 0.0061, "step": 385920 }, { "epoch": 1.95, "learning_rate": 7.940023510299629e-06, "loss": 0.0059, "step": 385930 }, { "epoch": 1.95, "learning_rate": 7.932455817285619e-06, "loss": 0.0046, "step": 385940 }, { "epoch": 1.95, "learning_rate": 7.924888124271609e-06, "loss": 0.0049, "step": 385950 }, { "epoch": 1.95, "learning_rate": 7.917320431257598e-06, "loss": 0.0063, "step": 385960 }, { "epoch": 1.95, "learning_rate": 7.909752738243588e-06, "loss": 0.0065, "step": 385970 }, { "epoch": 1.95, "learning_rate": 7.902185045229578e-06, "loss": 0.0048, "step": 385980 }, { "epoch": 1.95, "learning_rate": 7.894617352215568e-06, "loss": 0.0071, "step": 385990 }, { "epoch": 1.95, "learning_rate": 7.887049659201558e-06, "loss": 0.0072, "step": 386000 }, { "epoch": 1.95, "eval_cer": 0.9144178545123905, "eval_loss": 0.0041864411905407906, "eval_runtime": 116.4755, "eval_samples_per_second": 17.171, "eval_steps_per_second": 4.293, "step": 386000 }, { "epoch": 1.95, "learning_rate": 7.879481966187546e-06, "loss": 0.006, "step": 386010 }, { "epoch": 1.95, "learning_rate": 7.871914273173536e-06, "loss": 0.0031, "step": 386020 }, { "epoch": 1.95, "learning_rate": 7.864346580159526e-06, "loss": 0.0065, "step": 386030 }, { "epoch": 1.95, "learning_rate": 7.856778887145516e-06, "loss": 0.0066, "step": 386040 }, { "epoch": 1.95, "learning_rate": 7.849211194131506e-06, "loss": 0.0056, "step": 386050 }, { "epoch": 1.95, "learning_rate": 7.841643501117496e-06, "loss": 0.0035, "step": 386060 }, { "epoch": 1.95, "learning_rate": 7.834075808103486e-06, "loss": 0.0078, "step": 386070 }, { "epoch": 1.95, "learning_rate": 7.826508115089476e-06, "loss": 0.0037, "step": 386080 }, { "epoch": 1.95, "learning_rate": 7.818940422075464e-06, "loss": 0.0078, "step": 386090 }, { "epoch": 1.95, "learning_rate": 7.811372729061454e-06, "loss": 0.0063, "step": 386100 }, { "epoch": 1.95, "learning_rate": 7.803805036047444e-06, "loss": 0.0043, "step": 386110 }, { "epoch": 1.95, "learning_rate": 7.796237343033434e-06, "loss": 0.0041, "step": 386120 }, { "epoch": 1.95, "learning_rate": 7.788669650019424e-06, "loss": 0.0053, "step": 386130 }, { "epoch": 1.95, "learning_rate": 7.781101957005414e-06, "loss": 0.0045, "step": 386140 }, { "epoch": 1.95, "learning_rate": 7.773534263991403e-06, "loss": 0.0076, "step": 386150 }, { "epoch": 1.95, "learning_rate": 7.765966570977392e-06, "loss": 0.0047, "step": 386160 }, { "epoch": 1.95, "learning_rate": 7.758398877963382e-06, "loss": 0.0044, "step": 386170 }, { "epoch": 1.95, "learning_rate": 7.750831184949371e-06, "loss": 0.0069, "step": 386180 }, { "epoch": 1.95, "learning_rate": 7.743263491935361e-06, "loss": 0.0048, "step": 386190 }, { "epoch": 1.95, "learning_rate": 7.73569579892135e-06, "loss": 0.0064, "step": 386200 }, { "epoch": 1.95, "learning_rate": 7.72812810590734e-06, "loss": 0.0078, "step": 386210 }, { "epoch": 1.95, "learning_rate": 7.72056041289333e-06, "loss": 0.0056, "step": 386220 }, { "epoch": 1.95, "learning_rate": 7.71299271987932e-06, "loss": 0.0061, "step": 386230 }, { "epoch": 1.95, "learning_rate": 7.70542502686531e-06, "loss": 0.0058, "step": 386240 }, { "epoch": 1.95, "learning_rate": 7.6978573338513e-06, "loss": 0.0057, "step": 386250 }, { "epoch": 1.95, "learning_rate": 7.690289640837289e-06, "loss": 0.0061, "step": 386260 }, { "epoch": 1.95, "learning_rate": 7.682721947823279e-06, "loss": 0.0064, "step": 386270 }, { "epoch": 1.95, "learning_rate": 7.675154254809267e-06, "loss": 0.0056, "step": 386280 }, { "epoch": 1.95, "learning_rate": 7.667586561795257e-06, "loss": 0.004, "step": 386290 }, { "epoch": 1.95, "learning_rate": 7.660018868781247e-06, "loss": 0.0053, "step": 386300 }, { "epoch": 1.95, "learning_rate": 7.652451175767237e-06, "loss": 0.0055, "step": 386310 }, { "epoch": 1.95, "learning_rate": 7.644883482753227e-06, "loss": 0.0043, "step": 386320 }, { "epoch": 1.95, "learning_rate": 7.637315789739217e-06, "loss": 0.0044, "step": 386330 }, { "epoch": 1.95, "learning_rate": 7.629748096725207e-06, "loss": 0.0053, "step": 386340 }, { "epoch": 1.95, "learning_rate": 7.622180403711197e-06, "loss": 0.0067, "step": 386350 }, { "epoch": 1.95, "learning_rate": 7.614612710697186e-06, "loss": 0.0038, "step": 386360 }, { "epoch": 1.95, "learning_rate": 7.607045017683176e-06, "loss": 0.0078, "step": 386370 }, { "epoch": 1.95, "learning_rate": 7.5994773246691655e-06, "loss": 0.0069, "step": 386380 }, { "epoch": 1.95, "learning_rate": 7.591909631655155e-06, "loss": 0.0039, "step": 386390 }, { "epoch": 1.95, "learning_rate": 7.584341938641144e-06, "loss": 0.0051, "step": 386400 }, { "epoch": 1.95, "learning_rate": 7.5767742456271335e-06, "loss": 0.0045, "step": 386410 }, { "epoch": 1.95, "learning_rate": 7.569206552613124e-06, "loss": 0.0058, "step": 386420 }, { "epoch": 1.95, "learning_rate": 7.561638859599114e-06, "loss": 0.0065, "step": 386430 }, { "epoch": 1.95, "learning_rate": 7.5540711665851024e-06, "loss": 0.0077, "step": 386440 }, { "epoch": 1.95, "learning_rate": 7.546503473571092e-06, "loss": 0.0068, "step": 386450 }, { "epoch": 1.95, "learning_rate": 7.538935780557082e-06, "loss": 0.007, "step": 386460 }, { "epoch": 1.95, "learning_rate": 7.531368087543072e-06, "loss": 0.0057, "step": 386470 }, { "epoch": 1.95, "learning_rate": 7.523800394529061e-06, "loss": 0.0055, "step": 386480 }, { "epoch": 1.95, "learning_rate": 7.516232701515051e-06, "loss": 0.0064, "step": 386490 }, { "epoch": 1.95, "learning_rate": 7.508665008501041e-06, "loss": 0.0051, "step": 386500 }, { "epoch": 1.95, "learning_rate": 7.501097315487031e-06, "loss": 0.0053, "step": 386510 }, { "epoch": 1.95, "learning_rate": 7.49352962247302e-06, "loss": 0.006, "step": 386520 }, { "epoch": 1.95, "learning_rate": 7.48596192945901e-06, "loss": 0.0047, "step": 386530 }, { "epoch": 1.95, "learning_rate": 7.478394236445e-06, "loss": 0.0046, "step": 386540 }, { "epoch": 1.95, "learning_rate": 7.47082654343099e-06, "loss": 0.0085, "step": 386550 }, { "epoch": 1.95, "learning_rate": 7.463258850416979e-06, "loss": 0.0081, "step": 386560 }, { "epoch": 1.95, "learning_rate": 7.455691157402969e-06, "loss": 0.0066, "step": 386570 }, { "epoch": 1.95, "learning_rate": 7.448123464388959e-06, "loss": 0.0055, "step": 386580 }, { "epoch": 1.95, "learning_rate": 7.440555771374949e-06, "loss": 0.0063, "step": 386590 }, { "epoch": 1.95, "learning_rate": 7.432988078360938e-06, "loss": 0.0069, "step": 386600 }, { "epoch": 1.95, "learning_rate": 7.4254203853469276e-06, "loss": 0.0048, "step": 386610 }, { "epoch": 1.95, "learning_rate": 7.4178526923329175e-06, "loss": 0.0061, "step": 386620 }, { "epoch": 1.95, "learning_rate": 7.410284999318907e-06, "loss": 0.006, "step": 386630 }, { "epoch": 1.95, "learning_rate": 7.4027173063048965e-06, "loss": 0.0071, "step": 386640 }, { "epoch": 1.95, "learning_rate": 7.395149613290886e-06, "loss": 0.0062, "step": 386650 }, { "epoch": 1.95, "learning_rate": 7.387581920276876e-06, "loss": 0.0053, "step": 386660 }, { "epoch": 1.95, "learning_rate": 7.380014227262865e-06, "loss": 0.0051, "step": 386670 }, { "epoch": 1.95, "learning_rate": 7.372446534248855e-06, "loss": 0.0045, "step": 386680 }, { "epoch": 1.95, "learning_rate": 7.364878841234845e-06, "loss": 0.0063, "step": 386690 }, { "epoch": 1.95, "learning_rate": 7.357311148220835e-06, "loss": 0.0064, "step": 386700 }, { "epoch": 1.95, "learning_rate": 7.349743455206824e-06, "loss": 0.0046, "step": 386710 }, { "epoch": 1.95, "learning_rate": 7.342175762192814e-06, "loss": 0.006, "step": 386720 }, { "epoch": 1.95, "learning_rate": 7.334608069178804e-06, "loss": 0.005, "step": 386730 }, { "epoch": 1.95, "learning_rate": 7.327040376164794e-06, "loss": 0.0049, "step": 386740 }, { "epoch": 1.95, "learning_rate": 7.319472683150783e-06, "loss": 0.0064, "step": 386750 }, { "epoch": 1.95, "learning_rate": 7.311904990136773e-06, "loss": 0.0085, "step": 386760 }, { "epoch": 1.95, "learning_rate": 7.304337297122763e-06, "loss": 0.0057, "step": 386770 }, { "epoch": 1.95, "learning_rate": 7.296769604108753e-06, "loss": 0.0048, "step": 386780 }, { "epoch": 1.95, "learning_rate": 7.289201911094742e-06, "loss": 0.007, "step": 386790 }, { "epoch": 1.95, "learning_rate": 7.281634218080732e-06, "loss": 0.005, "step": 386800 }, { "epoch": 1.95, "learning_rate": 7.274066525066722e-06, "loss": 0.0066, "step": 386810 }, { "epoch": 1.95, "learning_rate": 7.2664988320527115e-06, "loss": 0.0057, "step": 386820 }, { "epoch": 1.95, "learning_rate": 7.2589311390387e-06, "loss": 0.0047, "step": 386830 }, { "epoch": 1.95, "learning_rate": 7.2513634460246905e-06, "loss": 0.0047, "step": 386840 }, { "epoch": 1.95, "learning_rate": 7.24379575301068e-06, "loss": 0.0058, "step": 386850 }, { "epoch": 1.95, "learning_rate": 7.23622805999667e-06, "loss": 0.0035, "step": 386860 }, { "epoch": 1.95, "learning_rate": 7.2286603669826585e-06, "loss": 0.0056, "step": 386870 }, { "epoch": 1.95, "learning_rate": 7.2210926739686484e-06, "loss": 0.0049, "step": 386880 }, { "epoch": 1.95, "learning_rate": 7.213524980954638e-06, "loss": 0.0056, "step": 386890 }, { "epoch": 1.95, "learning_rate": 7.205957287940628e-06, "loss": 0.0032, "step": 386900 }, { "epoch": 1.95, "learning_rate": 7.198389594926617e-06, "loss": 0.0052, "step": 386910 }, { "epoch": 1.95, "learning_rate": 7.190821901912607e-06, "loss": 0.0089, "step": 386920 }, { "epoch": 1.95, "learning_rate": 7.183254208898597e-06, "loss": 0.0062, "step": 386930 }, { "epoch": 1.95, "learning_rate": 7.175686515884587e-06, "loss": 0.0066, "step": 386940 }, { "epoch": 1.95, "learning_rate": 7.168118822870576e-06, "loss": 0.0051, "step": 386950 }, { "epoch": 1.95, "learning_rate": 7.160551129856566e-06, "loss": 0.0056, "step": 386960 }, { "epoch": 1.95, "learning_rate": 7.152983436842556e-06, "loss": 0.0069, "step": 386970 }, { "epoch": 1.95, "learning_rate": 7.145415743828546e-06, "loss": 0.0072, "step": 386980 }, { "epoch": 1.95, "learning_rate": 7.137848050814535e-06, "loss": 0.0047, "step": 386990 }, { "epoch": 1.95, "learning_rate": 7.130280357800525e-06, "loss": 0.0078, "step": 387000 }, { "epoch": 1.95, "eval_cer": 0.9144052393627603, "eval_loss": 0.004187974147498608, "eval_runtime": 116.3794, "eval_samples_per_second": 17.185, "eval_steps_per_second": 4.296, "step": 387000 }, { "epoch": 1.95, "learning_rate": 7.122712664786515e-06, "loss": 0.0064, "step": 387010 }, { "epoch": 1.95, "learning_rate": 7.115144971772505e-06, "loss": 0.009, "step": 387020 }, { "epoch": 1.95, "learning_rate": 7.107577278758494e-06, "loss": 0.0104, "step": 387030 }, { "epoch": 1.95, "learning_rate": 7.100009585744484e-06, "loss": 0.0053, "step": 387040 }, { "epoch": 1.95, "learning_rate": 7.0924418927304736e-06, "loss": 0.005, "step": 387050 }, { "epoch": 1.95, "learning_rate": 7.0848741997164635e-06, "loss": 0.0054, "step": 387060 }, { "epoch": 1.95, "learning_rate": 7.0773065067024526e-06, "loss": 0.0062, "step": 387070 }, { "epoch": 1.95, "learning_rate": 7.0697388136884425e-06, "loss": 0.0057, "step": 387080 }, { "epoch": 1.95, "learning_rate": 7.062171120674432e-06, "loss": 0.0062, "step": 387090 }, { "epoch": 1.95, "learning_rate": 7.054603427660422e-06, "loss": 0.0059, "step": 387100 }, { "epoch": 1.95, "learning_rate": 7.047035734646411e-06, "loss": 0.0053, "step": 387110 }, { "epoch": 1.95, "learning_rate": 7.039468041632401e-06, "loss": 0.0077, "step": 387120 }, { "epoch": 1.95, "learning_rate": 7.031900348618391e-06, "loss": 0.0051, "step": 387130 }, { "epoch": 1.95, "learning_rate": 7.024332655604381e-06, "loss": 0.005, "step": 387140 }, { "epoch": 1.95, "learning_rate": 7.01676496259037e-06, "loss": 0.0045, "step": 387150 }, { "epoch": 1.95, "learning_rate": 7.00919726957636e-06, "loss": 0.0102, "step": 387160 }, { "epoch": 1.95, "learning_rate": 7.00162957656235e-06, "loss": 0.0043, "step": 387170 }, { "epoch": 1.95, "learning_rate": 6.994061883548339e-06, "loss": 0.0058, "step": 387180 }, { "epoch": 1.95, "learning_rate": 6.986494190534329e-06, "loss": 0.0056, "step": 387190 }, { "epoch": 1.95, "learning_rate": 6.978926497520319e-06, "loss": 0.007, "step": 387200 }, { "epoch": 1.95, "learning_rate": 6.971358804506309e-06, "loss": 0.0069, "step": 387210 }, { "epoch": 1.95, "learning_rate": 6.963791111492298e-06, "loss": 0.0061, "step": 387220 }, { "epoch": 1.95, "learning_rate": 6.956223418478288e-06, "loss": 0.0051, "step": 387230 }, { "epoch": 1.95, "learning_rate": 6.948655725464278e-06, "loss": 0.0054, "step": 387240 }, { "epoch": 1.95, "learning_rate": 6.941088032450268e-06, "loss": 0.0044, "step": 387250 }, { "epoch": 1.95, "learning_rate": 6.933520339436256e-06, "loss": 0.0064, "step": 387260 }, { "epoch": 1.95, "learning_rate": 6.9259526464222466e-06, "loss": 0.008, "step": 387270 }, { "epoch": 1.95, "learning_rate": 6.9183849534082365e-06, "loss": 0.0053, "step": 387280 }, { "epoch": 1.95, "learning_rate": 6.910817260394226e-06, "loss": 0.0046, "step": 387290 }, { "epoch": 1.95, "learning_rate": 6.903249567380215e-06, "loss": 0.0086, "step": 387300 }, { "epoch": 1.95, "learning_rate": 6.8956818743662045e-06, "loss": 0.0052, "step": 387310 }, { "epoch": 1.95, "learning_rate": 6.8881141813521944e-06, "loss": 0.0047, "step": 387320 }, { "epoch": 1.95, "learning_rate": 6.880546488338185e-06, "loss": 0.0064, "step": 387330 }, { "epoch": 1.95, "learning_rate": 6.872978795324173e-06, "loss": 0.0135, "step": 387340 }, { "epoch": 1.95, "learning_rate": 6.865411102310163e-06, "loss": 0.0059, "step": 387350 }, { "epoch": 1.95, "learning_rate": 6.857843409296153e-06, "loss": 0.0055, "step": 387360 }, { "epoch": 1.95, "learning_rate": 6.850275716282143e-06, "loss": 0.0048, "step": 387370 }, { "epoch": 1.95, "learning_rate": 6.842708023268132e-06, "loss": 0.0052, "step": 387380 }, { "epoch": 1.95, "learning_rate": 6.835140330254122e-06, "loss": 0.0053, "step": 387390 }, { "epoch": 1.95, "learning_rate": 6.827572637240112e-06, "loss": 0.0065, "step": 387400 }, { "epoch": 1.95, "learning_rate": 6.820004944226102e-06, "loss": 0.0057, "step": 387410 }, { "epoch": 1.95, "learning_rate": 6.812437251212091e-06, "loss": 0.0046, "step": 387420 }, { "epoch": 1.95, "learning_rate": 6.804869558198081e-06, "loss": 0.0048, "step": 387430 }, { "epoch": 1.95, "learning_rate": 6.797301865184071e-06, "loss": 0.007, "step": 387440 }, { "epoch": 1.95, "learning_rate": 6.789734172170061e-06, "loss": 0.0045, "step": 387450 }, { "epoch": 1.95, "learning_rate": 6.78216647915605e-06, "loss": 0.0055, "step": 387460 }, { "epoch": 1.95, "learning_rate": 6.77459878614204e-06, "loss": 0.0051, "step": 387470 }, { "epoch": 1.95, "learning_rate": 6.76703109312803e-06, "loss": 0.0065, "step": 387480 }, { "epoch": 1.95, "learning_rate": 6.7594634001140196e-06, "loss": 0.0063, "step": 387490 }, { "epoch": 1.95, "learning_rate": 6.751895707100009e-06, "loss": 0.0068, "step": 387500 }, { "epoch": 1.96, "learning_rate": 6.7443280140859986e-06, "loss": 0.0063, "step": 387510 }, { "epoch": 1.96, "learning_rate": 6.7367603210719885e-06, "loss": 0.0071, "step": 387520 }, { "epoch": 1.96, "learning_rate": 6.729192628057978e-06, "loss": 0.0046, "step": 387530 }, { "epoch": 1.96, "learning_rate": 6.7216249350439674e-06, "loss": 0.0058, "step": 387540 }, { "epoch": 1.96, "learning_rate": 6.714057242029957e-06, "loss": 0.0061, "step": 387550 }, { "epoch": 1.96, "learning_rate": 6.706489549015947e-06, "loss": 0.0057, "step": 387560 }, { "epoch": 1.96, "learning_rate": 6.698921856001937e-06, "loss": 0.0054, "step": 387570 }, { "epoch": 1.96, "learning_rate": 6.691354162987926e-06, "loss": 0.0098, "step": 387580 }, { "epoch": 1.96, "learning_rate": 6.683786469973916e-06, "loss": 0.0052, "step": 387590 }, { "epoch": 1.96, "learning_rate": 6.676218776959906e-06, "loss": 0.0053, "step": 387600 }, { "epoch": 1.96, "learning_rate": 6.668651083945896e-06, "loss": 0.005, "step": 387610 }, { "epoch": 1.96, "learning_rate": 6.661083390931885e-06, "loss": 0.006, "step": 387620 }, { "epoch": 1.96, "learning_rate": 6.653515697917875e-06, "loss": 0.0075, "step": 387630 }, { "epoch": 1.96, "learning_rate": 6.645948004903865e-06, "loss": 0.0061, "step": 387640 }, { "epoch": 1.96, "learning_rate": 6.638380311889855e-06, "loss": 0.006, "step": 387650 }, { "epoch": 1.96, "learning_rate": 6.630812618875844e-06, "loss": 0.0057, "step": 387660 }, { "epoch": 1.96, "learning_rate": 6.623244925861834e-06, "loss": 0.0054, "step": 387670 }, { "epoch": 1.96, "learning_rate": 6.615677232847824e-06, "loss": 0.0065, "step": 387680 }, { "epoch": 1.96, "learning_rate": 6.608109539833814e-06, "loss": 0.0045, "step": 387690 }, { "epoch": 1.96, "learning_rate": 6.600541846819803e-06, "loss": 0.0087, "step": 387700 }, { "epoch": 1.96, "learning_rate": 6.5929741538057926e-06, "loss": 0.0064, "step": 387710 }, { "epoch": 1.96, "learning_rate": 6.5854064607917825e-06, "loss": 0.0054, "step": 387720 }, { "epoch": 1.96, "learning_rate": 6.577838767777771e-06, "loss": 0.005, "step": 387730 }, { "epoch": 1.96, "learning_rate": 6.570271074763761e-06, "loss": 0.0056, "step": 387740 }, { "epoch": 1.96, "learning_rate": 6.562703381749751e-06, "loss": 0.0062, "step": 387750 }, { "epoch": 1.96, "learning_rate": 6.555135688735741e-06, "loss": 0.0042, "step": 387760 }, { "epoch": 1.96, "learning_rate": 6.5475679957217295e-06, "loss": 0.0063, "step": 387770 }, { "epoch": 1.96, "learning_rate": 6.540000302707719e-06, "loss": 0.0058, "step": 387780 }, { "epoch": 1.96, "learning_rate": 6.532432609693709e-06, "loss": 0.0052, "step": 387790 }, { "epoch": 1.96, "learning_rate": 6.524864916679699e-06, "loss": 0.0052, "step": 387800 }, { "epoch": 1.96, "learning_rate": 6.517297223665688e-06, "loss": 0.0064, "step": 387810 }, { "epoch": 1.96, "learning_rate": 6.509729530651678e-06, "loss": 0.0049, "step": 387820 }, { "epoch": 1.96, "learning_rate": 6.502161837637668e-06, "loss": 0.0046, "step": 387830 }, { "epoch": 1.96, "learning_rate": 6.494594144623658e-06, "loss": 0.0063, "step": 387840 }, { "epoch": 1.96, "learning_rate": 6.487026451609647e-06, "loss": 0.0056, "step": 387850 }, { "epoch": 1.96, "learning_rate": 6.479458758595637e-06, "loss": 0.0058, "step": 387860 }, { "epoch": 1.96, "learning_rate": 6.471891065581627e-06, "loss": 0.0054, "step": 387870 }, { "epoch": 1.96, "learning_rate": 6.464323372567617e-06, "loss": 0.0052, "step": 387880 }, { "epoch": 1.96, "learning_rate": 6.456755679553606e-06, "loss": 0.0037, "step": 387890 }, { "epoch": 1.96, "learning_rate": 6.449187986539596e-06, "loss": 0.0057, "step": 387900 }, { "epoch": 1.96, "learning_rate": 6.441620293525586e-06, "loss": 0.0055, "step": 387910 }, { "epoch": 1.96, "learning_rate": 6.434052600511576e-06, "loss": 0.0061, "step": 387920 }, { "epoch": 1.96, "learning_rate": 6.426484907497565e-06, "loss": 0.0045, "step": 387930 }, { "epoch": 1.96, "learning_rate": 6.418917214483555e-06, "loss": 0.0056, "step": 387940 }, { "epoch": 1.96, "learning_rate": 6.4113495214695446e-06, "loss": 0.0064, "step": 387950 }, { "epoch": 1.96, "learning_rate": 6.4037818284555345e-06, "loss": 0.007, "step": 387960 }, { "epoch": 1.96, "learning_rate": 6.3962141354415235e-06, "loss": 0.0054, "step": 387970 }, { "epoch": 1.96, "learning_rate": 6.3886464424275134e-06, "loss": 0.0063, "step": 387980 }, { "epoch": 1.96, "learning_rate": 6.381078749413503e-06, "loss": 0.0051, "step": 387990 }, { "epoch": 1.96, "learning_rate": 6.373511056399493e-06, "loss": 0.0051, "step": 388000 }, { "epoch": 1.96, "eval_cer": 0.9144062097588856, "eval_loss": 0.004157001152634621, "eval_runtime": 116.3242, "eval_samples_per_second": 17.193, "eval_steps_per_second": 4.298, "step": 388000 }, { "epoch": 1.96, "learning_rate": 6.365943363385482e-06, "loss": 0.0045, "step": 388010 }, { "epoch": 1.96, "learning_rate": 6.358375670371472e-06, "loss": 0.0044, "step": 388020 }, { "epoch": 1.96, "learning_rate": 6.350807977357462e-06, "loss": 0.0038, "step": 388030 }, { "epoch": 1.96, "learning_rate": 6.343240284343452e-06, "loss": 0.0045, "step": 388040 }, { "epoch": 1.96, "learning_rate": 6.335672591329441e-06, "loss": 0.0068, "step": 388050 }, { "epoch": 1.96, "learning_rate": 6.328104898315431e-06, "loss": 0.0055, "step": 388060 }, { "epoch": 1.96, "learning_rate": 6.320537205301421e-06, "loss": 0.0046, "step": 388070 }, { "epoch": 1.96, "learning_rate": 6.312969512287411e-06, "loss": 0.0059, "step": 388080 }, { "epoch": 1.96, "learning_rate": 6.3054018192734e-06, "loss": 0.0055, "step": 388090 }, { "epoch": 1.96, "learning_rate": 6.29783412625939e-06, "loss": 0.0043, "step": 388100 }, { "epoch": 1.96, "learning_rate": 6.29026643324538e-06, "loss": 0.0087, "step": 388110 }, { "epoch": 1.96, "learning_rate": 6.28269874023137e-06, "loss": 0.0042, "step": 388120 }, { "epoch": 1.96, "learning_rate": 6.275131047217359e-06, "loss": 0.0067, "step": 388130 }, { "epoch": 1.96, "learning_rate": 6.267563354203349e-06, "loss": 0.0049, "step": 388140 }, { "epoch": 1.96, "learning_rate": 6.2599956611893386e-06, "loss": 0.0064, "step": 388150 }, { "epoch": 1.96, "learning_rate": 6.2524279681753285e-06, "loss": 0.0044, "step": 388160 }, { "epoch": 1.96, "learning_rate": 6.2448602751613176e-06, "loss": 0.0061, "step": 388170 }, { "epoch": 1.96, "learning_rate": 6.2372925821473075e-06, "loss": 0.0056, "step": 388180 }, { "epoch": 1.96, "learning_rate": 6.229724889133297e-06, "loss": 0.0066, "step": 388190 }, { "epoch": 1.96, "learning_rate": 6.222157196119287e-06, "loss": 0.0063, "step": 388200 }, { "epoch": 1.96, "learning_rate": 6.2145895031052755e-06, "loss": 0.0067, "step": 388210 }, { "epoch": 1.96, "learning_rate": 6.207021810091265e-06, "loss": 0.0051, "step": 388220 }, { "epoch": 1.96, "learning_rate": 6.199454117077255e-06, "loss": 0.0056, "step": 388230 }, { "epoch": 1.96, "learning_rate": 6.191886424063246e-06, "loss": 0.0041, "step": 388240 }, { "epoch": 1.96, "learning_rate": 6.184318731049234e-06, "loss": 0.0064, "step": 388250 }, { "epoch": 1.96, "learning_rate": 6.176751038035224e-06, "loss": 0.0047, "step": 388260 }, { "epoch": 1.96, "learning_rate": 6.169183345021214e-06, "loss": 0.0041, "step": 388270 }, { "epoch": 1.96, "learning_rate": 6.161615652007203e-06, "loss": 0.0046, "step": 388280 }, { "epoch": 1.96, "learning_rate": 6.154047958993193e-06, "loss": 0.006, "step": 388290 }, { "epoch": 1.96, "learning_rate": 6.146480265979183e-06, "loss": 0.0046, "step": 388300 }, { "epoch": 1.96, "learning_rate": 6.138912572965173e-06, "loss": 0.0055, "step": 388310 }, { "epoch": 1.96, "learning_rate": 6.131344879951162e-06, "loss": 0.0048, "step": 388320 }, { "epoch": 1.96, "learning_rate": 6.123777186937152e-06, "loss": 0.0052, "step": 388330 }, { "epoch": 1.96, "learning_rate": 6.116209493923142e-06, "loss": 0.0073, "step": 388340 }, { "epoch": 1.96, "learning_rate": 6.108641800909132e-06, "loss": 0.0053, "step": 388350 }, { "epoch": 1.96, "learning_rate": 6.101074107895121e-06, "loss": 0.0083, "step": 388360 }, { "epoch": 1.96, "learning_rate": 6.093506414881111e-06, "loss": 0.0052, "step": 388370 }, { "epoch": 1.96, "learning_rate": 6.085938721867101e-06, "loss": 0.006, "step": 388380 }, { "epoch": 1.96, "learning_rate": 6.0783710288530906e-06, "loss": 0.006, "step": 388390 }, { "epoch": 1.96, "learning_rate": 6.07080333583908e-06, "loss": 0.0056, "step": 388400 }, { "epoch": 1.96, "learning_rate": 6.0632356428250695e-06, "loss": 0.0059, "step": 388410 }, { "epoch": 1.96, "learning_rate": 6.0556679498110594e-06, "loss": 0.0063, "step": 388420 }, { "epoch": 1.96, "learning_rate": 6.048100256797049e-06, "loss": 0.0048, "step": 388430 }, { "epoch": 1.96, "learning_rate": 6.040532563783038e-06, "loss": 0.0043, "step": 388440 }, { "epoch": 1.96, "learning_rate": 6.032964870769028e-06, "loss": 0.0055, "step": 388450 }, { "epoch": 1.96, "learning_rate": 6.025397177755018e-06, "loss": 0.005, "step": 388460 }, { "epoch": 1.96, "learning_rate": 6.017829484741008e-06, "loss": 0.0081, "step": 388470 }, { "epoch": 1.96, "learning_rate": 6.010261791726997e-06, "loss": 0.0058, "step": 388480 }, { "epoch": 1.96, "learning_rate": 6.002694098712987e-06, "loss": 0.005, "step": 388490 }, { "epoch": 1.96, "learning_rate": 5.995126405698977e-06, "loss": 0.0051, "step": 388500 }, { "epoch": 1.96, "learning_rate": 5.987558712684967e-06, "loss": 0.0041, "step": 388510 }, { "epoch": 1.96, "learning_rate": 5.979991019670956e-06, "loss": 0.0066, "step": 388520 }, { "epoch": 1.96, "learning_rate": 5.972423326656946e-06, "loss": 0.0069, "step": 388530 }, { "epoch": 1.96, "learning_rate": 5.964855633642936e-06, "loss": 0.0059, "step": 388540 }, { "epoch": 1.96, "learning_rate": 5.957287940628926e-06, "loss": 0.0057, "step": 388550 }, { "epoch": 1.96, "learning_rate": 5.949720247614915e-06, "loss": 0.0051, "step": 388560 }, { "epoch": 1.96, "learning_rate": 5.942152554600905e-06, "loss": 0.0074, "step": 388570 }, { "epoch": 1.96, "learning_rate": 5.934584861586895e-06, "loss": 0.006, "step": 388580 }, { "epoch": 1.96, "learning_rate": 5.9270171685728846e-06, "loss": 0.0054, "step": 388590 }, { "epoch": 1.96, "learning_rate": 5.919449475558874e-06, "loss": 0.0057, "step": 388600 }, { "epoch": 1.96, "learning_rate": 5.9118817825448636e-06, "loss": 0.006, "step": 388610 }, { "epoch": 1.96, "learning_rate": 5.9043140895308535e-06, "loss": 0.0064, "step": 388620 }, { "epoch": 1.96, "learning_rate": 5.896746396516843e-06, "loss": 0.005, "step": 388630 }, { "epoch": 1.96, "learning_rate": 5.889178703502832e-06, "loss": 0.0055, "step": 388640 }, { "epoch": 1.96, "learning_rate": 5.8816110104888215e-06, "loss": 0.0056, "step": 388650 }, { "epoch": 1.96, "learning_rate": 5.874043317474812e-06, "loss": 0.005, "step": 388660 }, { "epoch": 1.96, "learning_rate": 5.866475624460802e-06, "loss": 0.0056, "step": 388670 }, { "epoch": 1.96, "learning_rate": 5.85890793144679e-06, "loss": 0.0049, "step": 388680 }, { "epoch": 1.96, "learning_rate": 5.85134023843278e-06, "loss": 0.0056, "step": 388690 }, { "epoch": 1.96, "learning_rate": 5.84377254541877e-06, "loss": 0.0057, "step": 388700 }, { "epoch": 1.96, "learning_rate": 5.83620485240476e-06, "loss": 0.0063, "step": 388710 }, { "epoch": 1.96, "learning_rate": 5.828637159390749e-06, "loss": 0.0065, "step": 388720 }, { "epoch": 1.96, "learning_rate": 5.821069466376739e-06, "loss": 0.0069, "step": 388730 }, { "epoch": 1.96, "learning_rate": 5.813501773362729e-06, "loss": 0.0043, "step": 388740 }, { "epoch": 1.96, "learning_rate": 5.805934080348719e-06, "loss": 0.0052, "step": 388750 }, { "epoch": 1.96, "learning_rate": 5.798366387334708e-06, "loss": 0.0057, "step": 388760 }, { "epoch": 1.96, "learning_rate": 5.790798694320698e-06, "loss": 0.005, "step": 388770 }, { "epoch": 1.96, "learning_rate": 5.783231001306688e-06, "loss": 0.0072, "step": 388780 }, { "epoch": 1.96, "learning_rate": 5.775663308292678e-06, "loss": 0.0047, "step": 388790 }, { "epoch": 1.96, "learning_rate": 5.768095615278667e-06, "loss": 0.0054, "step": 388800 }, { "epoch": 1.96, "learning_rate": 5.760527922264657e-06, "loss": 0.0054, "step": 388810 }, { "epoch": 1.96, "learning_rate": 5.752960229250647e-06, "loss": 0.0069, "step": 388820 }, { "epoch": 1.96, "learning_rate": 5.745392536236636e-06, "loss": 0.0042, "step": 388830 }, { "epoch": 1.96, "learning_rate": 5.737824843222626e-06, "loss": 0.0058, "step": 388840 }, { "epoch": 1.96, "learning_rate": 5.7302571502086155e-06, "loss": 0.0049, "step": 388850 }, { "epoch": 1.96, "learning_rate": 5.7226894571946054e-06, "loss": 0.0053, "step": 388860 }, { "epoch": 1.96, "learning_rate": 5.7151217641805945e-06, "loss": 0.006, "step": 388870 }, { "epoch": 1.96, "learning_rate": 5.7075540711665844e-06, "loss": 0.0043, "step": 388880 }, { "epoch": 1.96, "learning_rate": 5.699986378152574e-06, "loss": 0.007, "step": 388890 }, { "epoch": 1.96, "learning_rate": 5.692418685138564e-06, "loss": 0.0046, "step": 388900 }, { "epoch": 1.96, "learning_rate": 5.684850992124553e-06, "loss": 0.0047, "step": 388910 }, { "epoch": 1.96, "learning_rate": 5.677283299110543e-06, "loss": 0.0061, "step": 388920 }, { "epoch": 1.96, "learning_rate": 5.669715606096533e-06, "loss": 0.0048, "step": 388930 }, { "epoch": 1.96, "learning_rate": 5.662147913082523e-06, "loss": 0.0055, "step": 388940 }, { "epoch": 1.96, "learning_rate": 5.654580220068512e-06, "loss": 0.0066, "step": 388950 }, { "epoch": 1.96, "learning_rate": 5.647012527054502e-06, "loss": 0.0067, "step": 388960 }, { "epoch": 1.96, "learning_rate": 5.639444834040492e-06, "loss": 0.0048, "step": 388970 }, { "epoch": 1.96, "learning_rate": 5.631877141026482e-06, "loss": 0.0047, "step": 388980 }, { "epoch": 1.96, "learning_rate": 5.624309448012471e-06, "loss": 0.0049, "step": 388990 }, { "epoch": 1.96, "learning_rate": 5.616741754998461e-06, "loss": 0.0048, "step": 389000 }, { "epoch": 1.96, "eval_cer": 0.9143994169860079, "eval_loss": 0.004172166809439659, "eval_runtime": 116.4331, "eval_samples_per_second": 17.177, "eval_steps_per_second": 4.294, "step": 389000 }, { "epoch": 1.96, "learning_rate": 5.609174061984451e-06, "loss": 0.0074, "step": 389010 }, { "epoch": 1.96, "learning_rate": 5.601606368970441e-06, "loss": 0.009, "step": 389020 }, { "epoch": 1.96, "learning_rate": 5.59403867595643e-06, "loss": 0.0077, "step": 389030 }, { "epoch": 1.96, "learning_rate": 5.58647098294242e-06, "loss": 0.0045, "step": 389040 }, { "epoch": 1.96, "learning_rate": 5.5789032899284096e-06, "loss": 0.0046, "step": 389050 }, { "epoch": 1.96, "learning_rate": 5.5713355969143995e-06, "loss": 0.0067, "step": 389060 }, { "epoch": 1.96, "learning_rate": 5.563767903900388e-06, "loss": 0.0034, "step": 389070 }, { "epoch": 1.96, "learning_rate": 5.5562002108863784e-06, "loss": 0.0074, "step": 389080 }, { "epoch": 1.96, "learning_rate": 5.548632517872368e-06, "loss": 0.0076, "step": 389090 }, { "epoch": 1.96, "learning_rate": 5.541064824858358e-06, "loss": 0.0057, "step": 389100 }, { "epoch": 1.96, "learning_rate": 5.5334971318443465e-06, "loss": 0.0057, "step": 389110 }, { "epoch": 1.96, "learning_rate": 5.525929438830336e-06, "loss": 0.0073, "step": 389120 }, { "epoch": 1.96, "learning_rate": 5.518361745816326e-06, "loss": 0.0064, "step": 389130 }, { "epoch": 1.96, "learning_rate": 5.510794052802317e-06, "loss": 0.0055, "step": 389140 }, { "epoch": 1.96, "learning_rate": 5.503226359788305e-06, "loss": 0.0052, "step": 389150 }, { "epoch": 1.96, "learning_rate": 5.495658666774295e-06, "loss": 0.0055, "step": 389160 }, { "epoch": 1.96, "learning_rate": 5.488090973760285e-06, "loss": 0.0061, "step": 389170 }, { "epoch": 1.96, "learning_rate": 5.480523280746275e-06, "loss": 0.0041, "step": 389180 }, { "epoch": 1.96, "learning_rate": 5.472955587732264e-06, "loss": 0.0062, "step": 389190 }, { "epoch": 1.96, "learning_rate": 5.465387894718254e-06, "loss": 0.0064, "step": 389200 }, { "epoch": 1.96, "learning_rate": 5.457820201704244e-06, "loss": 0.006, "step": 389210 }, { "epoch": 1.96, "learning_rate": 5.450252508690234e-06, "loss": 0.0065, "step": 389220 }, { "epoch": 1.96, "learning_rate": 5.442684815676223e-06, "loss": 0.0058, "step": 389230 }, { "epoch": 1.96, "learning_rate": 5.435117122662213e-06, "loss": 0.0061, "step": 389240 }, { "epoch": 1.96, "learning_rate": 5.427549429648203e-06, "loss": 0.0042, "step": 389250 }, { "epoch": 1.96, "learning_rate": 5.419981736634193e-06, "loss": 0.0056, "step": 389260 }, { "epoch": 1.96, "learning_rate": 5.412414043620182e-06, "loss": 0.0052, "step": 389270 }, { "epoch": 1.96, "learning_rate": 5.404846350606172e-06, "loss": 0.0053, "step": 389280 }, { "epoch": 1.96, "learning_rate": 5.3972786575921615e-06, "loss": 0.0048, "step": 389290 }, { "epoch": 1.96, "learning_rate": 5.3897109645781514e-06, "loss": 0.006, "step": 389300 }, { "epoch": 1.96, "learning_rate": 5.3821432715641405e-06, "loss": 0.0043, "step": 389310 }, { "epoch": 1.96, "learning_rate": 5.3745755785501304e-06, "loss": 0.005, "step": 389320 }, { "epoch": 1.96, "learning_rate": 5.36700788553612e-06, "loss": 0.0061, "step": 389330 }, { "epoch": 1.96, "learning_rate": 5.35944019252211e-06, "loss": 0.0056, "step": 389340 }, { "epoch": 1.96, "learning_rate": 5.351872499508099e-06, "loss": 0.0041, "step": 389350 }, { "epoch": 1.96, "learning_rate": 5.344304806494089e-06, "loss": 0.0062, "step": 389360 }, { "epoch": 1.96, "learning_rate": 5.336737113480079e-06, "loss": 0.0051, "step": 389370 }, { "epoch": 1.96, "learning_rate": 5.329169420466068e-06, "loss": 0.0051, "step": 389380 }, { "epoch": 1.96, "learning_rate": 5.321601727452058e-06, "loss": 0.0067, "step": 389390 }, { "epoch": 1.96, "learning_rate": 5.314034034438048e-06, "loss": 0.0049, "step": 389400 }, { "epoch": 1.96, "learning_rate": 5.306466341424038e-06, "loss": 0.0088, "step": 389410 }, { "epoch": 1.96, "learning_rate": 5.298898648410027e-06, "loss": 0.004, "step": 389420 }, { "epoch": 1.96, "learning_rate": 5.291330955396017e-06, "loss": 0.0057, "step": 389430 }, { "epoch": 1.96, "learning_rate": 5.283763262382007e-06, "loss": 0.0057, "step": 389440 }, { "epoch": 1.96, "learning_rate": 5.276195569367997e-06, "loss": 0.0056, "step": 389450 }, { "epoch": 1.96, "learning_rate": 5.268627876353986e-06, "loss": 0.0054, "step": 389460 }, { "epoch": 1.96, "learning_rate": 5.261060183339976e-06, "loss": 0.0039, "step": 389470 }, { "epoch": 1.96, "learning_rate": 5.253492490325966e-06, "loss": 0.0092, "step": 389480 }, { "epoch": 1.97, "learning_rate": 5.2459247973119556e-06, "loss": 0.0053, "step": 389490 }, { "epoch": 1.97, "learning_rate": 5.238357104297945e-06, "loss": 0.0059, "step": 389500 }, { "epoch": 1.97, "learning_rate": 5.2307894112839345e-06, "loss": 0.0048, "step": 389510 }, { "epoch": 1.97, "learning_rate": 5.2232217182699244e-06, "loss": 0.0042, "step": 389520 }, { "epoch": 1.97, "learning_rate": 5.215654025255914e-06, "loss": 0.0058, "step": 389530 }, { "epoch": 1.97, "learning_rate": 5.208086332241903e-06, "loss": 0.0055, "step": 389540 }, { "epoch": 1.97, "learning_rate": 5.2005186392278925e-06, "loss": 0.0027, "step": 389550 }, { "epoch": 1.97, "learning_rate": 5.192950946213883e-06, "loss": 0.0036, "step": 389560 }, { "epoch": 1.97, "learning_rate": 5.185383253199873e-06, "loss": 0.0067, "step": 389570 }, { "epoch": 1.97, "learning_rate": 5.177815560185861e-06, "loss": 0.0056, "step": 389580 }, { "epoch": 1.97, "learning_rate": 5.170247867171851e-06, "loss": 0.0058, "step": 389590 }, { "epoch": 1.97, "learning_rate": 5.162680174157841e-06, "loss": 0.005, "step": 389600 }, { "epoch": 1.97, "learning_rate": 5.155112481143831e-06, "loss": 0.0068, "step": 389610 }, { "epoch": 1.97, "learning_rate": 5.14754478812982e-06, "loss": 0.0055, "step": 389620 }, { "epoch": 1.97, "learning_rate": 5.13997709511581e-06, "loss": 0.0063, "step": 389630 }, { "epoch": 1.97, "learning_rate": 5.1324094021018e-06, "loss": 0.0062, "step": 389640 }, { "epoch": 1.97, "learning_rate": 5.12484170908779e-06, "loss": 0.0073, "step": 389650 }, { "epoch": 1.97, "learning_rate": 5.117274016073779e-06, "loss": 0.0058, "step": 389660 }, { "epoch": 1.97, "learning_rate": 5.109706323059769e-06, "loss": 0.0063, "step": 389670 }, { "epoch": 1.97, "learning_rate": 5.102138630045759e-06, "loss": 0.0029, "step": 389680 }, { "epoch": 1.97, "learning_rate": 5.094570937031749e-06, "loss": 0.0052, "step": 389690 }, { "epoch": 1.97, "learning_rate": 5.087003244017738e-06, "loss": 0.0054, "step": 389700 }, { "epoch": 1.97, "learning_rate": 5.079435551003728e-06, "loss": 0.0052, "step": 389710 }, { "epoch": 1.97, "learning_rate": 5.071867857989718e-06, "loss": 0.0059, "step": 389720 }, { "epoch": 1.97, "learning_rate": 5.0643001649757075e-06, "loss": 0.0059, "step": 389730 }, { "epoch": 1.97, "learning_rate": 5.056732471961697e-06, "loss": 0.0072, "step": 389740 }, { "epoch": 1.97, "learning_rate": 5.0491647789476865e-06, "loss": 0.0055, "step": 389750 }, { "epoch": 1.97, "learning_rate": 5.0415970859336764e-06, "loss": 0.0045, "step": 389760 }, { "epoch": 1.97, "learning_rate": 5.034029392919666e-06, "loss": 0.0055, "step": 389770 }, { "epoch": 1.97, "learning_rate": 5.026461699905655e-06, "loss": 0.0048, "step": 389780 }, { "epoch": 1.97, "learning_rate": 5.018894006891645e-06, "loss": 0.0064, "step": 389790 }, { "epoch": 1.97, "learning_rate": 5.011326313877635e-06, "loss": 0.006, "step": 389800 }, { "epoch": 1.97, "learning_rate": 5.003758620863625e-06, "loss": 0.007, "step": 389810 }, { "epoch": 1.97, "learning_rate": 4.996190927849614e-06, "loss": 0.0051, "step": 389820 }, { "epoch": 1.97, "learning_rate": 4.988623234835604e-06, "loss": 0.0056, "step": 389830 }, { "epoch": 1.97, "learning_rate": 4.981055541821594e-06, "loss": 0.0048, "step": 389840 }, { "epoch": 1.97, "learning_rate": 4.973487848807584e-06, "loss": 0.0042, "step": 389850 }, { "epoch": 1.97, "learning_rate": 4.965920155793573e-06, "loss": 0.0072, "step": 389860 }, { "epoch": 1.97, "learning_rate": 4.958352462779563e-06, "loss": 0.0049, "step": 389870 }, { "epoch": 1.97, "learning_rate": 4.950784769765553e-06, "loss": 0.0052, "step": 389880 }, { "epoch": 1.97, "learning_rate": 4.943217076751543e-06, "loss": 0.0042, "step": 389890 }, { "epoch": 1.97, "learning_rate": 4.935649383737532e-06, "loss": 0.0076, "step": 389900 }, { "epoch": 1.97, "learning_rate": 4.928081690723522e-06, "loss": 0.0056, "step": 389910 }, { "epoch": 1.97, "learning_rate": 4.920513997709512e-06, "loss": 0.0062, "step": 389920 }, { "epoch": 1.97, "learning_rate": 4.912946304695501e-06, "loss": 0.0061, "step": 389930 }, { "epoch": 1.97, "learning_rate": 4.905378611681491e-06, "loss": 0.0058, "step": 389940 }, { "epoch": 1.97, "learning_rate": 4.8978109186674805e-06, "loss": 0.0058, "step": 389950 }, { "epoch": 1.97, "learning_rate": 4.8902432256534704e-06, "loss": 0.0066, "step": 389960 }, { "epoch": 1.97, "learning_rate": 4.882675532639459e-06, "loss": 0.0056, "step": 389970 }, { "epoch": 1.97, "learning_rate": 4.875107839625449e-06, "loss": 0.0048, "step": 389980 }, { "epoch": 1.97, "learning_rate": 4.867540146611439e-06, "loss": 0.0068, "step": 389990 }, { "epoch": 1.97, "learning_rate": 4.859972453597429e-06, "loss": 0.0059, "step": 390000 }, { "epoch": 1.97, "eval_cer": 0.9143955354015062, "eval_loss": 0.004140438511967659, "eval_runtime": 116.3675, "eval_samples_per_second": 17.187, "eval_steps_per_second": 4.297, "step": 390000 }, { "epoch": 1.97, "learning_rate": 4.8524047605834175e-06, "loss": 0.0059, "step": 390010 }, { "epoch": 1.97, "learning_rate": 4.844837067569407e-06, "loss": 0.0046, "step": 390020 }, { "epoch": 1.97, "learning_rate": 4.837269374555397e-06, "loss": 0.0049, "step": 390030 }, { "epoch": 1.97, "learning_rate": 4.829701681541387e-06, "loss": 0.0064, "step": 390040 }, { "epoch": 1.97, "learning_rate": 4.822133988527376e-06, "loss": 0.0044, "step": 390050 }, { "epoch": 1.97, "learning_rate": 4.814566295513366e-06, "loss": 0.0058, "step": 390060 }, { "epoch": 1.97, "learning_rate": 4.806998602499356e-06, "loss": 0.0054, "step": 390070 }, { "epoch": 1.97, "learning_rate": 4.799430909485346e-06, "loss": 0.0064, "step": 390080 }, { "epoch": 1.97, "learning_rate": 4.791863216471335e-06, "loss": 0.0052, "step": 390090 }, { "epoch": 1.97, "learning_rate": 4.784295523457325e-06, "loss": 0.0053, "step": 390100 }, { "epoch": 1.97, "learning_rate": 4.776727830443315e-06, "loss": 0.0043, "step": 390110 }, { "epoch": 1.97, "learning_rate": 4.769160137429305e-06, "loss": 0.0048, "step": 390120 }, { "epoch": 1.97, "learning_rate": 4.761592444415294e-06, "loss": 0.0045, "step": 390130 }, { "epoch": 1.97, "learning_rate": 4.754024751401284e-06, "loss": 0.0033, "step": 390140 }, { "epoch": 1.97, "learning_rate": 4.746457058387274e-06, "loss": 0.0094, "step": 390150 }, { "epoch": 1.97, "learning_rate": 4.738889365373264e-06, "loss": 0.0056, "step": 390160 }, { "epoch": 1.97, "learning_rate": 4.731321672359253e-06, "loss": 0.0068, "step": 390170 }, { "epoch": 1.97, "learning_rate": 4.723753979345243e-06, "loss": 0.0084, "step": 390180 }, { "epoch": 1.97, "learning_rate": 4.7161862863312325e-06, "loss": 0.0051, "step": 390190 }, { "epoch": 1.97, "learning_rate": 4.7086185933172224e-06, "loss": 0.0047, "step": 390200 }, { "epoch": 1.97, "learning_rate": 4.7010509003032115e-06, "loss": 0.0095, "step": 390210 }, { "epoch": 1.97, "learning_rate": 4.693483207289201e-06, "loss": 0.0061, "step": 390220 }, { "epoch": 1.97, "learning_rate": 4.685915514275191e-06, "loss": 0.006, "step": 390230 }, { "epoch": 1.97, "learning_rate": 4.67834782126118e-06, "loss": 0.0035, "step": 390240 }, { "epoch": 1.97, "learning_rate": 4.67078012824717e-06, "loss": 0.0049, "step": 390250 }, { "epoch": 1.97, "learning_rate": 4.66321243523316e-06, "loss": 0.0071, "step": 390260 }, { "epoch": 1.97, "learning_rate": 4.65564474221915e-06, "loss": 0.0063, "step": 390270 }, { "epoch": 1.97, "learning_rate": 4.648077049205139e-06, "loss": 0.006, "step": 390280 }, { "epoch": 1.97, "learning_rate": 4.640509356191129e-06, "loss": 0.0044, "step": 390290 }, { "epoch": 1.97, "learning_rate": 4.632941663177119e-06, "loss": 0.0045, "step": 390300 }, { "epoch": 1.97, "learning_rate": 4.625373970163109e-06, "loss": 0.0066, "step": 390310 }, { "epoch": 1.97, "learning_rate": 4.617806277149098e-06, "loss": 0.0052, "step": 390320 }, { "epoch": 1.97, "learning_rate": 4.610238584135088e-06, "loss": 0.0048, "step": 390330 }, { "epoch": 1.97, "learning_rate": 4.602670891121078e-06, "loss": 0.0059, "step": 390340 }, { "epoch": 1.97, "learning_rate": 4.595103198107068e-06, "loss": 0.0058, "step": 390350 }, { "epoch": 1.97, "learning_rate": 4.587535505093057e-06, "loss": 0.0054, "step": 390360 }, { "epoch": 1.97, "learning_rate": 4.579967812079047e-06, "loss": 0.0065, "step": 390370 }, { "epoch": 1.97, "learning_rate": 4.572400119065037e-06, "loss": 0.0063, "step": 390380 }, { "epoch": 1.97, "learning_rate": 4.5648324260510265e-06, "loss": 0.0057, "step": 390390 }, { "epoch": 1.97, "learning_rate": 4.557264733037016e-06, "loss": 0.0058, "step": 390400 }, { "epoch": 1.97, "learning_rate": 4.5496970400230055e-06, "loss": 0.0055, "step": 390410 }, { "epoch": 1.97, "learning_rate": 4.5421293470089954e-06, "loss": 0.0079, "step": 390420 }, { "epoch": 1.97, "learning_rate": 4.534561653994985e-06, "loss": 0.0052, "step": 390430 }, { "epoch": 1.97, "learning_rate": 4.526993960980974e-06, "loss": 0.0042, "step": 390440 }, { "epoch": 1.97, "learning_rate": 4.5194262679669635e-06, "loss": 0.0043, "step": 390450 }, { "epoch": 1.97, "learning_rate": 4.511858574952953e-06, "loss": 0.0058, "step": 390460 }, { "epoch": 1.97, "learning_rate": 4.504290881938943e-06, "loss": 0.0055, "step": 390470 }, { "epoch": 1.97, "learning_rate": 4.496723188924933e-06, "loss": 0.0058, "step": 390480 }, { "epoch": 1.97, "learning_rate": 4.489155495910922e-06, "loss": 0.0099, "step": 390490 }, { "epoch": 1.97, "learning_rate": 4.481587802896912e-06, "loss": 0.0068, "step": 390500 }, { "epoch": 1.97, "learning_rate": 4.474020109882902e-06, "loss": 0.0059, "step": 390510 }, { "epoch": 1.97, "learning_rate": 4.466452416868892e-06, "loss": 0.0052, "step": 390520 }, { "epoch": 1.97, "learning_rate": 4.458884723854881e-06, "loss": 0.0053, "step": 390530 }, { "epoch": 1.97, "learning_rate": 4.451317030840871e-06, "loss": 0.0045, "step": 390540 }, { "epoch": 1.97, "learning_rate": 4.443749337826861e-06, "loss": 0.0046, "step": 390550 }, { "epoch": 1.97, "learning_rate": 4.436181644812851e-06, "loss": 0.0071, "step": 390560 }, { "epoch": 1.97, "learning_rate": 4.42861395179884e-06, "loss": 0.0071, "step": 390570 }, { "epoch": 1.97, "learning_rate": 4.42104625878483e-06, "loss": 0.0059, "step": 390580 }, { "epoch": 1.97, "learning_rate": 4.41347856577082e-06, "loss": 0.0036, "step": 390590 }, { "epoch": 1.97, "learning_rate": 4.40591087275681e-06, "loss": 0.0047, "step": 390600 }, { "epoch": 1.97, "learning_rate": 4.398343179742799e-06, "loss": 0.004, "step": 390610 }, { "epoch": 1.97, "learning_rate": 4.390775486728789e-06, "loss": 0.0074, "step": 390620 }, { "epoch": 1.97, "learning_rate": 4.3832077937147785e-06, "loss": 0.0056, "step": 390630 }, { "epoch": 1.97, "learning_rate": 4.3756401007007684e-06, "loss": 0.0057, "step": 390640 }, { "epoch": 1.97, "learning_rate": 4.3680724076867575e-06, "loss": 0.0057, "step": 390650 }, { "epoch": 1.97, "learning_rate": 4.360504714672747e-06, "loss": 0.0053, "step": 390660 }, { "epoch": 1.97, "learning_rate": 4.3529370216587365e-06, "loss": 0.0062, "step": 390670 }, { "epoch": 1.97, "learning_rate": 4.345369328644727e-06, "loss": 0.0043, "step": 390680 }, { "epoch": 1.97, "learning_rate": 4.337801635630716e-06, "loss": 0.0089, "step": 390690 }, { "epoch": 1.97, "learning_rate": 4.330233942616706e-06, "loss": 0.0051, "step": 390700 }, { "epoch": 1.97, "learning_rate": 4.322666249602695e-06, "loss": 0.0059, "step": 390710 }, { "epoch": 1.97, "learning_rate": 4.315098556588685e-06, "loss": 0.0051, "step": 390720 }, { "epoch": 1.97, "learning_rate": 4.307530863574675e-06, "loss": 0.0055, "step": 390730 }, { "epoch": 1.97, "learning_rate": 4.299963170560665e-06, "loss": 0.0056, "step": 390740 }, { "epoch": 1.97, "learning_rate": 4.292395477546654e-06, "loss": 0.0047, "step": 390750 }, { "epoch": 1.97, "learning_rate": 4.284827784532644e-06, "loss": 0.0071, "step": 390760 }, { "epoch": 1.97, "learning_rate": 4.277260091518634e-06, "loss": 0.0052, "step": 390770 }, { "epoch": 1.97, "learning_rate": 4.269692398504624e-06, "loss": 0.0046, "step": 390780 }, { "epoch": 1.97, "learning_rate": 4.262124705490613e-06, "loss": 0.0056, "step": 390790 }, { "epoch": 1.97, "learning_rate": 4.254557012476603e-06, "loss": 0.0088, "step": 390800 }, { "epoch": 1.97, "learning_rate": 4.246989319462593e-06, "loss": 0.0038, "step": 390810 }, { "epoch": 1.97, "learning_rate": 4.239421626448583e-06, "loss": 0.0046, "step": 390820 }, { "epoch": 1.97, "learning_rate": 4.231853933434572e-06, "loss": 0.0093, "step": 390830 }, { "epoch": 1.97, "learning_rate": 4.224286240420562e-06, "loss": 0.0093, "step": 390840 }, { "epoch": 1.97, "learning_rate": 4.2167185474065515e-06, "loss": 0.0056, "step": 390850 }, { "epoch": 1.97, "learning_rate": 4.2091508543925414e-06, "loss": 0.0048, "step": 390860 }, { "epoch": 1.97, "learning_rate": 4.2015831613785305e-06, "loss": 0.0055, "step": 390870 }, { "epoch": 1.97, "learning_rate": 4.19401546836452e-06, "loss": 0.0041, "step": 390880 }, { "epoch": 1.97, "learning_rate": 4.18644777535051e-06, "loss": 0.0059, "step": 390890 }, { "epoch": 1.97, "learning_rate": 4.1788800823365e-06, "loss": 0.007, "step": 390900 }, { "epoch": 1.97, "learning_rate": 4.171312389322489e-06, "loss": 0.0055, "step": 390910 }, { "epoch": 1.97, "learning_rate": 4.163744696308479e-06, "loss": 0.0055, "step": 390920 }, { "epoch": 1.97, "learning_rate": 4.156177003294468e-06, "loss": 0.0071, "step": 390930 }, { "epoch": 1.97, "learning_rate": 4.148609310280458e-06, "loss": 0.0044, "step": 390940 }, { "epoch": 1.97, "learning_rate": 4.141041617266448e-06, "loss": 0.007, "step": 390950 }, { "epoch": 1.97, "learning_rate": 4.133473924252438e-06, "loss": 0.0038, "step": 390960 }, { "epoch": 1.97, "learning_rate": 4.125906231238427e-06, "loss": 0.0057, "step": 390970 }, { "epoch": 1.97, "learning_rate": 4.118338538224417e-06, "loss": 0.005, "step": 390980 }, { "epoch": 1.97, "learning_rate": 4.110770845210407e-06, "loss": 0.0062, "step": 390990 }, { "epoch": 1.97, "learning_rate": 4.103203152196396e-06, "loss": 0.0061, "step": 391000 }, { "epoch": 1.97, "eval_cer": 0.9144003873821333, "eval_loss": 0.00414480222389102, "eval_runtime": 116.2164, "eval_samples_per_second": 17.209, "eval_steps_per_second": 4.302, "step": 391000 }, { "epoch": 1.97, "learning_rate": 4.095635459182386e-06, "loss": 0.0084, "step": 391010 }, { "epoch": 1.97, "learning_rate": 4.088067766168376e-06, "loss": 0.0054, "step": 391020 }, { "epoch": 1.97, "learning_rate": 4.080500073154366e-06, "loss": 0.0064, "step": 391030 }, { "epoch": 1.97, "learning_rate": 4.072932380140355e-06, "loss": 0.0057, "step": 391040 }, { "epoch": 1.97, "learning_rate": 4.065364687126345e-06, "loss": 0.0049, "step": 391050 }, { "epoch": 1.97, "learning_rate": 4.057796994112335e-06, "loss": 0.0048, "step": 391060 }, { "epoch": 1.97, "learning_rate": 4.0502293010983245e-06, "loss": 0.0054, "step": 391070 }, { "epoch": 1.97, "learning_rate": 4.042661608084314e-06, "loss": 0.004, "step": 391080 }, { "epoch": 1.97, "learning_rate": 4.0350939150703035e-06, "loss": 0.0058, "step": 391090 }, { "epoch": 1.97, "learning_rate": 4.027526222056293e-06, "loss": 0.0046, "step": 391100 }, { "epoch": 1.97, "learning_rate": 4.019958529042283e-06, "loss": 0.0063, "step": 391110 }, { "epoch": 1.97, "learning_rate": 4.012390836028272e-06, "loss": 0.0045, "step": 391120 }, { "epoch": 1.97, "learning_rate": 4.004823143014262e-06, "loss": 0.0058, "step": 391130 }, { "epoch": 1.97, "learning_rate": 3.997255450000251e-06, "loss": 0.0054, "step": 391140 }, { "epoch": 1.97, "learning_rate": 3.989687756986241e-06, "loss": 0.0035, "step": 391150 }, { "epoch": 1.97, "learning_rate": 3.982120063972231e-06, "loss": 0.0049, "step": 391160 }, { "epoch": 1.97, "learning_rate": 3.974552370958221e-06, "loss": 0.0056, "step": 391170 }, { "epoch": 1.97, "learning_rate": 3.96698467794421e-06, "loss": 0.0053, "step": 391180 }, { "epoch": 1.97, "learning_rate": 3.9594169849302e-06, "loss": 0.0054, "step": 391190 }, { "epoch": 1.97, "learning_rate": 3.95184929191619e-06, "loss": 0.0049, "step": 391200 }, { "epoch": 1.97, "learning_rate": 3.94428159890218e-06, "loss": 0.006, "step": 391210 }, { "epoch": 1.97, "learning_rate": 3.936713905888169e-06, "loss": 0.0052, "step": 391220 }, { "epoch": 1.97, "learning_rate": 3.929146212874159e-06, "loss": 0.0053, "step": 391230 }, { "epoch": 1.97, "learning_rate": 3.921578519860149e-06, "loss": 0.0072, "step": 391240 }, { "epoch": 1.97, "learning_rate": 3.914010826846139e-06, "loss": 0.0052, "step": 391250 }, { "epoch": 1.97, "learning_rate": 3.906443133832128e-06, "loss": 0.0064, "step": 391260 }, { "epoch": 1.97, "learning_rate": 3.898875440818118e-06, "loss": 0.0041, "step": 391270 }, { "epoch": 1.97, "learning_rate": 3.891307747804108e-06, "loss": 0.0048, "step": 391280 }, { "epoch": 1.97, "learning_rate": 3.8837400547900975e-06, "loss": 0.0046, "step": 391290 }, { "epoch": 1.97, "learning_rate": 3.876172361776087e-06, "loss": 0.0065, "step": 391300 }, { "epoch": 1.97, "learning_rate": 3.8686046687620765e-06, "loss": 0.0061, "step": 391310 }, { "epoch": 1.97, "learning_rate": 3.861036975748066e-06, "loss": 0.0092, "step": 391320 }, { "epoch": 1.97, "learning_rate": 3.853469282734056e-06, "loss": 0.0039, "step": 391330 }, { "epoch": 1.97, "learning_rate": 3.845901589720045e-06, "loss": 0.0042, "step": 391340 }, { "epoch": 1.97, "learning_rate": 3.838333896706035e-06, "loss": 0.0051, "step": 391350 }, { "epoch": 1.97, "learning_rate": 3.830766203692024e-06, "loss": 0.0053, "step": 391360 }, { "epoch": 1.97, "learning_rate": 3.823198510678014e-06, "loss": 0.0039, "step": 391370 }, { "epoch": 1.97, "learning_rate": 3.815630817664004e-06, "loss": 0.0054, "step": 391380 }, { "epoch": 1.97, "learning_rate": 3.808063124649994e-06, "loss": 0.0062, "step": 391390 }, { "epoch": 1.97, "learning_rate": 3.8004954316359836e-06, "loss": 0.0057, "step": 391400 }, { "epoch": 1.97, "learning_rate": 3.7929277386219735e-06, "loss": 0.0047, "step": 391410 }, { "epoch": 1.97, "learning_rate": 3.785360045607963e-06, "loss": 0.0054, "step": 391420 }, { "epoch": 1.97, "learning_rate": 3.777792352593953e-06, "loss": 0.006, "step": 391430 }, { "epoch": 1.97, "learning_rate": 3.7702246595799424e-06, "loss": 0.0035, "step": 391440 }, { "epoch": 1.97, "learning_rate": 3.7626569665659323e-06, "loss": 0.0038, "step": 391450 }, { "epoch": 1.97, "learning_rate": 3.7550892735519214e-06, "loss": 0.0053, "step": 391460 }, { "epoch": 1.98, "learning_rate": 3.7475215805379117e-06, "loss": 0.0053, "step": 391470 }, { "epoch": 1.98, "learning_rate": 3.7399538875239008e-06, "loss": 0.0048, "step": 391480 }, { "epoch": 1.98, "learning_rate": 3.7323861945098907e-06, "loss": 0.0047, "step": 391490 }, { "epoch": 1.98, "learning_rate": 3.72481850149588e-06, "loss": 0.0091, "step": 391500 }, { "epoch": 1.98, "learning_rate": 3.71725080848187e-06, "loss": 0.0053, "step": 391510 }, { "epoch": 1.98, "learning_rate": 3.7096831154678596e-06, "loss": 0.0064, "step": 391520 }, { "epoch": 1.98, "learning_rate": 3.702115422453849e-06, "loss": 0.0049, "step": 391530 }, { "epoch": 1.98, "learning_rate": 3.694547729439839e-06, "loss": 0.0063, "step": 391540 }, { "epoch": 1.98, "learning_rate": 3.6869800364258285e-06, "loss": 0.0049, "step": 391550 }, { "epoch": 1.98, "learning_rate": 3.6794123434118184e-06, "loss": 0.0054, "step": 391560 }, { "epoch": 1.98, "learning_rate": 3.671844650397808e-06, "loss": 0.0055, "step": 391570 }, { "epoch": 1.98, "learning_rate": 3.6642769573837978e-06, "loss": 0.0064, "step": 391580 }, { "epoch": 1.98, "learning_rate": 3.6567092643697873e-06, "loss": 0.0055, "step": 391590 }, { "epoch": 1.98, "learning_rate": 3.649141571355777e-06, "loss": 0.0051, "step": 391600 }, { "epoch": 1.98, "learning_rate": 3.6415738783417667e-06, "loss": 0.004, "step": 391610 }, { "epoch": 1.98, "learning_rate": 3.6340061853277566e-06, "loss": 0.0051, "step": 391620 }, { "epoch": 1.98, "learning_rate": 3.626438492313746e-06, "loss": 0.0081, "step": 391630 }, { "epoch": 1.98, "learning_rate": 3.618870799299736e-06, "loss": 0.009, "step": 391640 }, { "epoch": 1.98, "learning_rate": 3.6113031062857255e-06, "loss": 0.0033, "step": 391650 }, { "epoch": 1.98, "learning_rate": 3.6037354132717154e-06, "loss": 0.006, "step": 391660 }, { "epoch": 1.98, "learning_rate": 3.5961677202577045e-06, "loss": 0.0046, "step": 391670 }, { "epoch": 1.98, "learning_rate": 3.588600027243695e-06, "loss": 0.0057, "step": 391680 }, { "epoch": 1.98, "learning_rate": 3.581032334229684e-06, "loss": 0.0076, "step": 391690 }, { "epoch": 1.98, "learning_rate": 3.5734646412156738e-06, "loss": 0.0063, "step": 391700 }, { "epoch": 1.98, "learning_rate": 3.5658969482016633e-06, "loss": 0.0055, "step": 391710 }, { "epoch": 1.98, "learning_rate": 3.558329255187653e-06, "loss": 0.005, "step": 391720 }, { "epoch": 1.98, "learning_rate": 3.5507615621736427e-06, "loss": 0.0072, "step": 391730 }, { "epoch": 1.98, "learning_rate": 3.5431938691596326e-06, "loss": 0.0058, "step": 391740 }, { "epoch": 1.98, "learning_rate": 3.535626176145622e-06, "loss": 0.0039, "step": 391750 }, { "epoch": 1.98, "learning_rate": 3.528058483131612e-06, "loss": 0.0067, "step": 391760 }, { "epoch": 1.98, "learning_rate": 3.5204907901176015e-06, "loss": 0.0043, "step": 391770 }, { "epoch": 1.98, "learning_rate": 3.5129230971035914e-06, "loss": 0.0057, "step": 391780 }, { "epoch": 1.98, "learning_rate": 3.505355404089581e-06, "loss": 0.0087, "step": 391790 }, { "epoch": 1.98, "learning_rate": 3.4977877110755708e-06, "loss": 0.0045, "step": 391800 }, { "epoch": 1.98, "learning_rate": 3.4902200180615603e-06, "loss": 0.0046, "step": 391810 }, { "epoch": 1.98, "learning_rate": 3.48265232504755e-06, "loss": 0.0051, "step": 391820 }, { "epoch": 1.98, "learning_rate": 3.4750846320335397e-06, "loss": 0.006, "step": 391830 }, { "epoch": 1.98, "learning_rate": 3.4675169390195296e-06, "loss": 0.0066, "step": 391840 }, { "epoch": 1.98, "learning_rate": 3.459949246005519e-06, "loss": 0.0051, "step": 391850 }, { "epoch": 1.98, "learning_rate": 3.452381552991509e-06, "loss": 0.0046, "step": 391860 }, { "epoch": 1.98, "learning_rate": 3.4448138599774985e-06, "loss": 0.009, "step": 391870 }, { "epoch": 1.98, "learning_rate": 3.4372461669634884e-06, "loss": 0.0059, "step": 391880 }, { "epoch": 1.98, "learning_rate": 3.429678473949478e-06, "loss": 0.0049, "step": 391890 }, { "epoch": 1.98, "learning_rate": 3.422110780935468e-06, "loss": 0.0061, "step": 391900 }, { "epoch": 1.98, "learning_rate": 3.414543087921457e-06, "loss": 0.0063, "step": 391910 }, { "epoch": 1.98, "learning_rate": 3.406975394907447e-06, "loss": 0.008, "step": 391920 }, { "epoch": 1.98, "learning_rate": 3.3994077018934363e-06, "loss": 0.0062, "step": 391930 }, { "epoch": 1.98, "learning_rate": 3.391840008879426e-06, "loss": 0.0052, "step": 391940 }, { "epoch": 1.98, "learning_rate": 3.3842723158654157e-06, "loss": 0.0044, "step": 391950 }, { "epoch": 1.98, "learning_rate": 3.3767046228514056e-06, "loss": 0.0078, "step": 391960 }, { "epoch": 1.98, "learning_rate": 3.369136929837395e-06, "loss": 0.0048, "step": 391970 }, { "epoch": 1.98, "learning_rate": 3.361569236823385e-06, "loss": 0.0071, "step": 391980 }, { "epoch": 1.98, "learning_rate": 3.3540015438093745e-06, "loss": 0.004, "step": 391990 }, { "epoch": 1.98, "learning_rate": 3.3464338507953644e-06, "loss": 0.0048, "step": 392000 }, { "epoch": 1.98, "eval_cer": 0.9144130025317635, "eval_loss": 0.004128037486225367, "eval_runtime": 116.0593, "eval_samples_per_second": 17.233, "eval_steps_per_second": 4.308, "step": 392000 }, { "epoch": 1.98, "learning_rate": 3.338866157781354e-06, "loss": 0.0077, "step": 392010 }, { "epoch": 1.98, "learning_rate": 3.331298464767344e-06, "loss": 0.0051, "step": 392020 }, { "epoch": 1.98, "learning_rate": 3.3237307717533333e-06, "loss": 0.004, "step": 392030 }, { "epoch": 1.98, "learning_rate": 3.316163078739323e-06, "loss": 0.0056, "step": 392040 }, { "epoch": 1.98, "learning_rate": 3.3085953857253127e-06, "loss": 0.0052, "step": 392050 }, { "epoch": 1.98, "learning_rate": 3.3010276927113026e-06, "loss": 0.0064, "step": 392060 }, { "epoch": 1.98, "learning_rate": 3.293459999697292e-06, "loss": 0.0061, "step": 392070 }, { "epoch": 1.98, "learning_rate": 3.2858923066832816e-06, "loss": 0.0061, "step": 392080 }, { "epoch": 1.98, "learning_rate": 3.2783246136692715e-06, "loss": 0.0051, "step": 392090 }, { "epoch": 1.98, "learning_rate": 3.270756920655261e-06, "loss": 0.0055, "step": 392100 }, { "epoch": 1.98, "learning_rate": 3.263189227641251e-06, "loss": 0.005, "step": 392110 }, { "epoch": 1.98, "learning_rate": 3.25562153462724e-06, "loss": 0.0054, "step": 392120 }, { "epoch": 1.98, "learning_rate": 3.2480538416132303e-06, "loss": 0.004, "step": 392130 }, { "epoch": 1.98, "learning_rate": 3.2404861485992194e-06, "loss": 0.0061, "step": 392140 }, { "epoch": 1.98, "learning_rate": 3.2329184555852093e-06, "loss": 0.0055, "step": 392150 }, { "epoch": 1.98, "learning_rate": 3.2253507625711988e-06, "loss": 0.0042, "step": 392160 }, { "epoch": 1.98, "learning_rate": 3.2177830695571887e-06, "loss": 0.01, "step": 392170 }, { "epoch": 1.98, "learning_rate": 3.210215376543178e-06, "loss": 0.0038, "step": 392180 }, { "epoch": 1.98, "learning_rate": 3.202647683529168e-06, "loss": 0.0051, "step": 392190 }, { "epoch": 1.98, "learning_rate": 3.1950799905151576e-06, "loss": 0.0054, "step": 392200 }, { "epoch": 1.98, "learning_rate": 3.1875122975011475e-06, "loss": 0.0056, "step": 392210 }, { "epoch": 1.98, "learning_rate": 3.179944604487137e-06, "loss": 0.0052, "step": 392220 }, { "epoch": 1.98, "learning_rate": 3.172376911473127e-06, "loss": 0.004, "step": 392230 }, { "epoch": 1.98, "learning_rate": 3.1648092184591164e-06, "loss": 0.0033, "step": 392240 }, { "epoch": 1.98, "learning_rate": 3.1572415254451063e-06, "loss": 0.0056, "step": 392250 }, { "epoch": 1.98, "learning_rate": 3.1496738324310958e-06, "loss": 0.0044, "step": 392260 }, { "epoch": 1.98, "learning_rate": 3.1421061394170857e-06, "loss": 0.005, "step": 392270 }, { "epoch": 1.98, "learning_rate": 3.134538446403075e-06, "loss": 0.0049, "step": 392280 }, { "epoch": 1.98, "learning_rate": 3.126970753389065e-06, "loss": 0.0052, "step": 392290 }, { "epoch": 1.98, "learning_rate": 3.1194030603750546e-06, "loss": 0.0047, "step": 392300 }, { "epoch": 1.98, "learning_rate": 3.1118353673610445e-06, "loss": 0.0059, "step": 392310 }, { "epoch": 1.98, "learning_rate": 3.104267674347034e-06, "loss": 0.0068, "step": 392320 }, { "epoch": 1.98, "learning_rate": 3.096699981333024e-06, "loss": 0.0064, "step": 392330 }, { "epoch": 1.98, "learning_rate": 3.0891322883190134e-06, "loss": 0.0061, "step": 392340 }, { "epoch": 1.98, "learning_rate": 3.0815645953050033e-06, "loss": 0.0046, "step": 392350 }, { "epoch": 1.98, "learning_rate": 3.0739969022909924e-06, "loss": 0.0095, "step": 392360 }, { "epoch": 1.98, "learning_rate": 3.0664292092769827e-06, "loss": 0.0051, "step": 392370 }, { "epoch": 1.98, "learning_rate": 3.0588615162629718e-06, "loss": 0.0036, "step": 392380 }, { "epoch": 1.98, "learning_rate": 3.0512938232489617e-06, "loss": 0.0042, "step": 392390 }, { "epoch": 1.98, "learning_rate": 3.043726130234951e-06, "loss": 0.0054, "step": 392400 }, { "epoch": 1.98, "learning_rate": 3.036158437220941e-06, "loss": 0.0077, "step": 392410 }, { "epoch": 1.98, "learning_rate": 3.0285907442069306e-06, "loss": 0.0063, "step": 392420 }, { "epoch": 1.98, "learning_rate": 3.0210230511929205e-06, "loss": 0.0034, "step": 392430 }, { "epoch": 1.98, "learning_rate": 3.01345535817891e-06, "loss": 0.0081, "step": 392440 }, { "epoch": 1.98, "learning_rate": 3.0058876651649e-06, "loss": 0.0055, "step": 392450 }, { "epoch": 1.98, "learning_rate": 2.9983199721508894e-06, "loss": 0.0056, "step": 392460 }, { "epoch": 1.98, "learning_rate": 2.9907522791368793e-06, "loss": 0.0046, "step": 392470 }, { "epoch": 1.98, "learning_rate": 2.9831845861228688e-06, "loss": 0.0063, "step": 392480 }, { "epoch": 1.98, "learning_rate": 2.9756168931088587e-06, "loss": 0.0078, "step": 392490 }, { "epoch": 1.98, "learning_rate": 2.968049200094848e-06, "loss": 0.0049, "step": 392500 }, { "epoch": 1.98, "learning_rate": 2.960481507080838e-06, "loss": 0.0044, "step": 392510 }, { "epoch": 1.98, "learning_rate": 2.9529138140668276e-06, "loss": 0.0063, "step": 392520 }, { "epoch": 1.98, "learning_rate": 2.9453461210528175e-06, "loss": 0.0051, "step": 392530 }, { "epoch": 1.98, "learning_rate": 2.937778428038807e-06, "loss": 0.0075, "step": 392540 }, { "epoch": 1.98, "learning_rate": 2.930210735024797e-06, "loss": 0.0053, "step": 392550 }, { "epoch": 1.98, "learning_rate": 2.9226430420107864e-06, "loss": 0.0042, "step": 392560 }, { "epoch": 1.98, "learning_rate": 2.9150753489967763e-06, "loss": 0.0062, "step": 392570 }, { "epoch": 1.98, "learning_rate": 2.9075076559827658e-06, "loss": 0.0094, "step": 392580 }, { "epoch": 1.98, "learning_rate": 2.8999399629687557e-06, "loss": 0.004, "step": 392590 }, { "epoch": 1.98, "learning_rate": 2.8923722699547448e-06, "loss": 0.0071, "step": 392600 }, { "epoch": 1.98, "learning_rate": 2.8848045769407347e-06, "loss": 0.0082, "step": 392610 }, { "epoch": 1.98, "learning_rate": 2.877236883926724e-06, "loss": 0.0052, "step": 392620 }, { "epoch": 1.98, "learning_rate": 2.8696691909127136e-06, "loss": 0.0043, "step": 392630 }, { "epoch": 1.98, "learning_rate": 2.8621014978987036e-06, "loss": 0.004, "step": 392640 }, { "epoch": 1.98, "learning_rate": 2.854533804884693e-06, "loss": 0.0063, "step": 392650 }, { "epoch": 1.98, "learning_rate": 2.846966111870683e-06, "loss": 0.0045, "step": 392660 }, { "epoch": 1.98, "learning_rate": 2.8393984188566725e-06, "loss": 0.0035, "step": 392670 }, { "epoch": 1.98, "learning_rate": 2.8318307258426624e-06, "loss": 0.0055, "step": 392680 }, { "epoch": 1.98, "learning_rate": 2.824263032828652e-06, "loss": 0.0048, "step": 392690 }, { "epoch": 1.98, "learning_rate": 2.8166953398146418e-06, "loss": 0.006, "step": 392700 }, { "epoch": 1.98, "learning_rate": 2.8091276468006313e-06, "loss": 0.0047, "step": 392710 }, { "epoch": 1.98, "learning_rate": 2.801559953786621e-06, "loss": 0.0072, "step": 392720 }, { "epoch": 1.98, "learning_rate": 2.7939922607726107e-06, "loss": 0.0072, "step": 392730 }, { "epoch": 1.98, "learning_rate": 2.7864245677586006e-06, "loss": 0.0058, "step": 392740 }, { "epoch": 1.98, "learning_rate": 2.77885687474459e-06, "loss": 0.0055, "step": 392750 }, { "epoch": 1.98, "learning_rate": 2.77128918173058e-06, "loss": 0.0057, "step": 392760 }, { "epoch": 1.98, "learning_rate": 2.7637214887165695e-06, "loss": 0.0065, "step": 392770 }, { "epoch": 1.98, "learning_rate": 2.7561537957025594e-06, "loss": 0.0039, "step": 392780 }, { "epoch": 1.98, "learning_rate": 2.7485861026885484e-06, "loss": 0.0066, "step": 392790 }, { "epoch": 1.98, "learning_rate": 2.7410184096745388e-06, "loss": 0.0073, "step": 392800 }, { "epoch": 1.98, "learning_rate": 2.733450716660528e-06, "loss": 0.0041, "step": 392810 }, { "epoch": 1.98, "learning_rate": 2.7258830236465178e-06, "loss": 0.0048, "step": 392820 }, { "epoch": 1.98, "learning_rate": 2.7183153306325072e-06, "loss": 0.0054, "step": 392830 }, { "epoch": 1.98, "learning_rate": 2.710747637618497e-06, "loss": 0.005, "step": 392840 }, { "epoch": 1.98, "learning_rate": 2.7031799446044866e-06, "loss": 0.0046, "step": 392850 }, { "epoch": 1.98, "learning_rate": 2.6956122515904766e-06, "loss": 0.0054, "step": 392860 }, { "epoch": 1.98, "learning_rate": 2.688044558576466e-06, "loss": 0.005, "step": 392870 }, { "epoch": 1.98, "learning_rate": 2.680476865562456e-06, "loss": 0.0038, "step": 392880 }, { "epoch": 1.98, "learning_rate": 2.6729091725484455e-06, "loss": 0.0049, "step": 392890 }, { "epoch": 1.98, "learning_rate": 2.6653414795344354e-06, "loss": 0.0053, "step": 392900 }, { "epoch": 1.98, "learning_rate": 2.657773786520425e-06, "loss": 0.006, "step": 392910 }, { "epoch": 1.98, "learning_rate": 2.6502060935064148e-06, "loss": 0.0067, "step": 392920 }, { "epoch": 1.98, "learning_rate": 2.6426384004924043e-06, "loss": 0.0068, "step": 392930 }, { "epoch": 1.98, "learning_rate": 2.635070707478394e-06, "loss": 0.0044, "step": 392940 }, { "epoch": 1.98, "learning_rate": 2.6275030144643837e-06, "loss": 0.0058, "step": 392950 }, { "epoch": 1.98, "learning_rate": 2.6199353214503736e-06, "loss": 0.0042, "step": 392960 }, { "epoch": 1.98, "learning_rate": 2.612367628436363e-06, "loss": 0.0049, "step": 392970 }, { "epoch": 1.98, "learning_rate": 2.604799935422353e-06, "loss": 0.005, "step": 392980 }, { "epoch": 1.98, "learning_rate": 2.5972322424083425e-06, "loss": 0.0045, "step": 392990 }, { "epoch": 1.98, "learning_rate": 2.5896645493943324e-06, "loss": 0.0069, "step": 393000 }, { "epoch": 1.98, "eval_cer": 0.9144188249085159, "eval_loss": 0.004126059357076883, "eval_runtime": 116.0572, "eval_samples_per_second": 17.233, "eval_steps_per_second": 4.308, "step": 393000 }, { "epoch": 1.98, "learning_rate": 2.582096856380322e-06, "loss": 0.0053, "step": 393010 }, { "epoch": 1.98, "learning_rate": 2.5745291633663118e-06, "loss": 0.01, "step": 393020 }, { "epoch": 1.98, "learning_rate": 2.566961470352301e-06, "loss": 0.005, "step": 393030 }, { "epoch": 1.98, "learning_rate": 2.559393777338291e-06, "loss": 0.0069, "step": 393040 }, { "epoch": 1.98, "learning_rate": 2.5518260843242802e-06, "loss": 0.0043, "step": 393050 }, { "epoch": 1.98, "learning_rate": 2.54425839131027e-06, "loss": 0.0065, "step": 393060 }, { "epoch": 1.98, "learning_rate": 2.5366906982962596e-06, "loss": 0.0053, "step": 393070 }, { "epoch": 1.98, "learning_rate": 2.5291230052822496e-06, "loss": 0.0051, "step": 393080 }, { "epoch": 1.98, "learning_rate": 2.521555312268239e-06, "loss": 0.0072, "step": 393090 }, { "epoch": 1.98, "learning_rate": 2.513987619254229e-06, "loss": 0.005, "step": 393100 }, { "epoch": 1.98, "learning_rate": 2.5064199262402185e-06, "loss": 0.005, "step": 393110 }, { "epoch": 1.98, "learning_rate": 2.4988522332262084e-06, "loss": 0.006, "step": 393120 }, { "epoch": 1.98, "learning_rate": 2.491284540212198e-06, "loss": 0.005, "step": 393130 }, { "epoch": 1.98, "learning_rate": 2.4837168471981878e-06, "loss": 0.0049, "step": 393140 }, { "epoch": 1.98, "learning_rate": 2.4761491541841773e-06, "loss": 0.0053, "step": 393150 }, { "epoch": 1.98, "learning_rate": 2.4685814611701667e-06, "loss": 0.0042, "step": 393160 }, { "epoch": 1.98, "learning_rate": 2.4610137681561567e-06, "loss": 0.0057, "step": 393170 }, { "epoch": 1.98, "learning_rate": 2.453446075142146e-06, "loss": 0.0075, "step": 393180 }, { "epoch": 1.98, "learning_rate": 2.445878382128136e-06, "loss": 0.0069, "step": 393190 }, { "epoch": 1.98, "learning_rate": 2.4383106891141256e-06, "loss": 0.0038, "step": 393200 }, { "epoch": 1.98, "learning_rate": 2.4307429961001155e-06, "loss": 0.0048, "step": 393210 }, { "epoch": 1.98, "learning_rate": 2.423175303086105e-06, "loss": 0.007, "step": 393220 }, { "epoch": 1.98, "learning_rate": 2.415607610072095e-06, "loss": 0.0049, "step": 393230 }, { "epoch": 1.98, "learning_rate": 2.408039917058084e-06, "loss": 0.0062, "step": 393240 }, { "epoch": 1.98, "learning_rate": 2.4004722240440743e-06, "loss": 0.0051, "step": 393250 }, { "epoch": 1.98, "learning_rate": 2.3929045310300633e-06, "loss": 0.0052, "step": 393260 }, { "epoch": 1.98, "learning_rate": 2.3853368380160532e-06, "loss": 0.0055, "step": 393270 }, { "epoch": 1.98, "learning_rate": 2.3777691450020427e-06, "loss": 0.0047, "step": 393280 }, { "epoch": 1.98, "learning_rate": 2.3702014519880327e-06, "loss": 0.0045, "step": 393290 }, { "epoch": 1.98, "learning_rate": 2.362633758974022e-06, "loss": 0.0048, "step": 393300 }, { "epoch": 1.98, "learning_rate": 2.355066065960012e-06, "loss": 0.0052, "step": 393310 }, { "epoch": 1.98, "learning_rate": 2.3474983729460015e-06, "loss": 0.0064, "step": 393320 }, { "epoch": 1.98, "learning_rate": 2.3399306799319915e-06, "loss": 0.0075, "step": 393330 }, { "epoch": 1.98, "learning_rate": 2.3323629869179814e-06, "loss": 0.0049, "step": 393340 }, { "epoch": 1.98, "learning_rate": 2.324795293903971e-06, "loss": 0.0092, "step": 393350 }, { "epoch": 1.98, "learning_rate": 2.3172276008899608e-06, "loss": 0.0072, "step": 393360 }, { "epoch": 1.98, "learning_rate": 2.3096599078759503e-06, "loss": 0.0064, "step": 393370 }, { "epoch": 1.98, "learning_rate": 2.3020922148619397e-06, "loss": 0.008, "step": 393380 }, { "epoch": 1.98, "learning_rate": 2.2945245218479297e-06, "loss": 0.0091, "step": 393390 }, { "epoch": 1.98, "learning_rate": 2.286956828833919e-06, "loss": 0.0048, "step": 393400 }, { "epoch": 1.98, "learning_rate": 2.279389135819909e-06, "loss": 0.0055, "step": 393410 }, { "epoch": 1.98, "learning_rate": 2.2718214428058986e-06, "loss": 0.0047, "step": 393420 }, { "epoch": 1.98, "learning_rate": 2.2642537497918885e-06, "loss": 0.0053, "step": 393430 }, { "epoch": 1.98, "learning_rate": 2.256686056777878e-06, "loss": 0.0059, "step": 393440 }, { "epoch": 1.98, "learning_rate": 2.2491183637638674e-06, "loss": 0.0043, "step": 393450 }, { "epoch": 1.99, "learning_rate": 2.2415506707498574e-06, "loss": 0.006, "step": 393460 }, { "epoch": 1.99, "learning_rate": 2.233982977735847e-06, "loss": 0.0056, "step": 393470 }, { "epoch": 1.99, "learning_rate": 2.2264152847218363e-06, "loss": 0.0046, "step": 393480 }, { "epoch": 1.99, "learning_rate": 2.2188475917078262e-06, "loss": 0.0063, "step": 393490 }, { "epoch": 1.99, "learning_rate": 2.2112798986938157e-06, "loss": 0.0049, "step": 393500 }, { "epoch": 1.99, "learning_rate": 2.2037122056798057e-06, "loss": 0.0059, "step": 393510 }, { "epoch": 1.99, "learning_rate": 2.196144512665795e-06, "loss": 0.0071, "step": 393520 }, { "epoch": 1.99, "learning_rate": 2.188576819651785e-06, "loss": 0.0075, "step": 393530 }, { "epoch": 1.99, "learning_rate": 2.1810091266377745e-06, "loss": 0.0065, "step": 393540 }, { "epoch": 1.99, "learning_rate": 2.1734414336237645e-06, "loss": 0.007, "step": 393550 }, { "epoch": 1.99, "learning_rate": 2.165873740609754e-06, "loss": 0.007, "step": 393560 }, { "epoch": 1.99, "learning_rate": 2.158306047595744e-06, "loss": 0.0054, "step": 393570 }, { "epoch": 1.99, "learning_rate": 2.1507383545817333e-06, "loss": 0.0037, "step": 393580 }, { "epoch": 1.99, "learning_rate": 2.143170661567723e-06, "loss": 0.005, "step": 393590 }, { "epoch": 1.99, "learning_rate": 2.1356029685537127e-06, "loss": 0.0076, "step": 393600 }, { "epoch": 1.99, "learning_rate": 2.1280352755397022e-06, "loss": 0.0066, "step": 393610 }, { "epoch": 1.99, "learning_rate": 2.120467582525692e-06, "loss": 0.0054, "step": 393620 }, { "epoch": 1.99, "learning_rate": 2.1128998895116816e-06, "loss": 0.0048, "step": 393630 }, { "epoch": 1.99, "learning_rate": 2.1053321964976716e-06, "loss": 0.0085, "step": 393640 }, { "epoch": 1.99, "learning_rate": 2.097764503483661e-06, "loss": 0.0042, "step": 393650 }, { "epoch": 1.99, "learning_rate": 2.090196810469651e-06, "loss": 0.0063, "step": 393660 }, { "epoch": 1.99, "learning_rate": 2.0826291174556404e-06, "loss": 0.0067, "step": 393670 }, { "epoch": 1.99, "learning_rate": 2.0750614244416304e-06, "loss": 0.0048, "step": 393680 }, { "epoch": 1.99, "learning_rate": 2.06749373142762e-06, "loss": 0.0066, "step": 393690 }, { "epoch": 1.99, "learning_rate": 2.0599260384136098e-06, "loss": 0.0069, "step": 393700 }, { "epoch": 1.99, "learning_rate": 2.0523583453995992e-06, "loss": 0.0059, "step": 393710 }, { "epoch": 1.99, "learning_rate": 2.0447906523855887e-06, "loss": 0.0066, "step": 393720 }, { "epoch": 1.99, "learning_rate": 2.0372229593715787e-06, "loss": 0.007, "step": 393730 }, { "epoch": 1.99, "learning_rate": 2.029655266357568e-06, "loss": 0.0072, "step": 393740 }, { "epoch": 1.99, "learning_rate": 2.022087573343558e-06, "loss": 0.0047, "step": 393750 }, { "epoch": 1.99, "learning_rate": 2.0145198803295475e-06, "loss": 0.0066, "step": 393760 }, { "epoch": 1.99, "learning_rate": 2.0069521873155375e-06, "loss": 0.0054, "step": 393770 }, { "epoch": 1.99, "learning_rate": 1.999384494301527e-06, "loss": 0.0057, "step": 393780 }, { "epoch": 1.99, "learning_rate": 1.991816801287517e-06, "loss": 0.0039, "step": 393790 }, { "epoch": 1.99, "learning_rate": 1.9842491082735063e-06, "loss": 0.005, "step": 393800 }, { "epoch": 1.99, "learning_rate": 1.9766814152594963e-06, "loss": 0.0051, "step": 393810 }, { "epoch": 1.99, "learning_rate": 1.9691137222454857e-06, "loss": 0.006, "step": 393820 }, { "epoch": 1.99, "learning_rate": 1.9615460292314752e-06, "loss": 0.0049, "step": 393830 }, { "epoch": 1.99, "learning_rate": 1.953978336217465e-06, "loss": 0.0051, "step": 393840 }, { "epoch": 1.99, "learning_rate": 1.9464106432034546e-06, "loss": 0.0055, "step": 393850 }, { "epoch": 1.99, "learning_rate": 1.9388429501894446e-06, "loss": 0.0036, "step": 393860 }, { "epoch": 1.99, "learning_rate": 1.931275257175434e-06, "loss": 0.0066, "step": 393870 }, { "epoch": 1.99, "learning_rate": 1.923707564161424e-06, "loss": 0.0051, "step": 393880 }, { "epoch": 1.99, "learning_rate": 1.9161398711474134e-06, "loss": 0.0059, "step": 393890 }, { "epoch": 1.99, "learning_rate": 1.9085721781334034e-06, "loss": 0.0053, "step": 393900 }, { "epoch": 1.99, "learning_rate": 1.9010044851193928e-06, "loss": 0.007, "step": 393910 }, { "epoch": 1.99, "learning_rate": 1.8934367921053825e-06, "loss": 0.0079, "step": 393920 }, { "epoch": 1.99, "learning_rate": 1.8858690990913722e-06, "loss": 0.0077, "step": 393930 }, { "epoch": 1.99, "learning_rate": 1.878301406077362e-06, "loss": 0.0078, "step": 393940 }, { "epoch": 1.99, "learning_rate": 1.8707337130633517e-06, "loss": 0.006, "step": 393950 }, { "epoch": 1.99, "learning_rate": 1.8631660200493414e-06, "loss": 0.0053, "step": 393960 }, { "epoch": 1.99, "learning_rate": 1.855598327035331e-06, "loss": 0.0037, "step": 393970 }, { "epoch": 1.99, "learning_rate": 1.8480306340213203e-06, "loss": 0.0062, "step": 393980 }, { "epoch": 1.99, "learning_rate": 1.84046294100731e-06, "loss": 0.006, "step": 393990 }, { "epoch": 1.99, "learning_rate": 1.8328952479932997e-06, "loss": 0.0053, "step": 394000 }, { "epoch": 1.99, "eval_cer": 0.9144168841162651, "eval_loss": 0.004111087881028652, "eval_runtime": 116.0484, "eval_samples_per_second": 17.234, "eval_steps_per_second": 4.309, "step": 394000 }, { "epoch": 1.99, "learning_rate": 1.8253275549792894e-06, "loss": 0.0062, "step": 394010 }, { "epoch": 1.99, "learning_rate": 1.8177598619652791e-06, "loss": 0.0054, "step": 394020 }, { "epoch": 1.99, "learning_rate": 1.8101921689512688e-06, "loss": 0.0059, "step": 394030 }, { "epoch": 1.99, "learning_rate": 1.8026244759372585e-06, "loss": 0.005, "step": 394040 }, { "epoch": 1.99, "learning_rate": 1.7950567829232482e-06, "loss": 0.0062, "step": 394050 }, { "epoch": 1.99, "learning_rate": 1.787489089909238e-06, "loss": 0.0051, "step": 394060 }, { "epoch": 1.99, "learning_rate": 1.7799213968952276e-06, "loss": 0.0051, "step": 394070 }, { "epoch": 1.99, "learning_rate": 1.7723537038812173e-06, "loss": 0.0047, "step": 394080 }, { "epoch": 1.99, "learning_rate": 1.764786010867207e-06, "loss": 0.0046, "step": 394090 }, { "epoch": 1.99, "learning_rate": 1.7572183178531965e-06, "loss": 0.0053, "step": 394100 }, { "epoch": 1.99, "learning_rate": 1.7496506248391862e-06, "loss": 0.0046, "step": 394110 }, { "epoch": 1.99, "learning_rate": 1.742082931825176e-06, "loss": 0.0062, "step": 394120 }, { "epoch": 1.99, "learning_rate": 1.7345152388111656e-06, "loss": 0.0045, "step": 394130 }, { "epoch": 1.99, "learning_rate": 1.7269475457971553e-06, "loss": 0.006, "step": 394140 }, { "epoch": 1.99, "learning_rate": 1.719379852783145e-06, "loss": 0.0057, "step": 394150 }, { "epoch": 1.99, "learning_rate": 1.7118121597691347e-06, "loss": 0.0055, "step": 394160 }, { "epoch": 1.99, "learning_rate": 1.7042444667551244e-06, "loss": 0.0048, "step": 394170 }, { "epoch": 1.99, "learning_rate": 1.6966767737411141e-06, "loss": 0.0041, "step": 394180 }, { "epoch": 1.99, "learning_rate": 1.6891090807271038e-06, "loss": 0.0071, "step": 394190 }, { "epoch": 1.99, "learning_rate": 1.6815413877130935e-06, "loss": 0.0059, "step": 394200 }, { "epoch": 1.99, "learning_rate": 1.673973694699083e-06, "loss": 0.0045, "step": 394210 }, { "epoch": 1.99, "learning_rate": 1.6664060016850727e-06, "loss": 0.0053, "step": 394220 }, { "epoch": 1.99, "learning_rate": 1.6588383086710624e-06, "loss": 0.0075, "step": 394230 }, { "epoch": 1.99, "learning_rate": 1.6512706156570521e-06, "loss": 0.0047, "step": 394240 }, { "epoch": 1.99, "learning_rate": 1.6437029226430418e-06, "loss": 0.0053, "step": 394250 }, { "epoch": 1.99, "learning_rate": 1.6361352296290315e-06, "loss": 0.0046, "step": 394260 }, { "epoch": 1.99, "learning_rate": 1.6285675366150212e-06, "loss": 0.0049, "step": 394270 }, { "epoch": 1.99, "learning_rate": 1.620999843601011e-06, "loss": 0.007, "step": 394280 }, { "epoch": 1.99, "learning_rate": 1.6134321505870006e-06, "loss": 0.0071, "step": 394290 }, { "epoch": 1.99, "learning_rate": 1.6058644575729903e-06, "loss": 0.0059, "step": 394300 }, { "epoch": 1.99, "learning_rate": 1.59829676455898e-06, "loss": 0.0046, "step": 394310 }, { "epoch": 1.99, "learning_rate": 1.5907290715449697e-06, "loss": 0.0058, "step": 394320 }, { "epoch": 1.99, "learning_rate": 1.5831613785309592e-06, "loss": 0.0063, "step": 394330 }, { "epoch": 1.99, "learning_rate": 1.575593685516949e-06, "loss": 0.005, "step": 394340 }, { "epoch": 1.99, "learning_rate": 1.5680259925029386e-06, "loss": 0.0046, "step": 394350 }, { "epoch": 1.99, "learning_rate": 1.5604582994889283e-06, "loss": 0.0044, "step": 394360 }, { "epoch": 1.99, "learning_rate": 1.552890606474918e-06, "loss": 0.005, "step": 394370 }, { "epoch": 1.99, "learning_rate": 1.5453229134609077e-06, "loss": 0.0063, "step": 394380 }, { "epoch": 1.99, "learning_rate": 1.5377552204468974e-06, "loss": 0.0064, "step": 394390 }, { "epoch": 1.99, "learning_rate": 1.5301875274328871e-06, "loss": 0.0061, "step": 394400 }, { "epoch": 1.99, "learning_rate": 1.5226198344188768e-06, "loss": 0.0071, "step": 394410 }, { "epoch": 1.99, "learning_rate": 1.5150521414048665e-06, "loss": 0.006, "step": 394420 }, { "epoch": 1.99, "learning_rate": 1.5074844483908562e-06, "loss": 0.0063, "step": 394430 }, { "epoch": 1.99, "learning_rate": 1.499916755376846e-06, "loss": 0.0037, "step": 394440 }, { "epoch": 1.99, "learning_rate": 1.4923490623628354e-06, "loss": 0.0047, "step": 394450 }, { "epoch": 1.99, "learning_rate": 1.4847813693488251e-06, "loss": 0.0053, "step": 394460 }, { "epoch": 1.99, "learning_rate": 1.4772136763348148e-06, "loss": 0.0051, "step": 394470 }, { "epoch": 1.99, "learning_rate": 1.4696459833208045e-06, "loss": 0.005, "step": 394480 }, { "epoch": 1.99, "learning_rate": 1.4620782903067942e-06, "loss": 0.0075, "step": 394490 }, { "epoch": 1.99, "learning_rate": 1.454510597292784e-06, "loss": 0.0063, "step": 394500 }, { "epoch": 1.99, "learning_rate": 1.4469429042787736e-06, "loss": 0.0043, "step": 394510 }, { "epoch": 1.99, "learning_rate": 1.4393752112647631e-06, "loss": 0.0044, "step": 394520 }, { "epoch": 1.99, "learning_rate": 1.4318075182507528e-06, "loss": 0.0048, "step": 394530 }, { "epoch": 1.99, "learning_rate": 1.4242398252367423e-06, "loss": 0.0061, "step": 394540 }, { "epoch": 1.99, "learning_rate": 1.416672132222732e-06, "loss": 0.007, "step": 394550 }, { "epoch": 1.99, "learning_rate": 1.4091044392087217e-06, "loss": 0.0042, "step": 394560 }, { "epoch": 1.99, "learning_rate": 1.4015367461947114e-06, "loss": 0.0042, "step": 394570 }, { "epoch": 1.99, "learning_rate": 1.3939690531807011e-06, "loss": 0.005, "step": 394580 }, { "epoch": 1.99, "learning_rate": 1.3864013601666908e-06, "loss": 0.0062, "step": 394590 }, { "epoch": 1.99, "learning_rate": 1.3788336671526805e-06, "loss": 0.0074, "step": 394600 }, { "epoch": 1.99, "learning_rate": 1.3712659741386702e-06, "loss": 0.0055, "step": 394610 }, { "epoch": 1.99, "learning_rate": 1.36369828112466e-06, "loss": 0.0052, "step": 394620 }, { "epoch": 1.99, "learning_rate": 1.3561305881106496e-06, "loss": 0.004, "step": 394630 }, { "epoch": 1.99, "learning_rate": 1.3485628950966393e-06, "loss": 0.0093, "step": 394640 }, { "epoch": 1.99, "learning_rate": 1.340995202082629e-06, "loss": 0.0063, "step": 394650 }, { "epoch": 1.99, "learning_rate": 1.3334275090686185e-06, "loss": 0.0048, "step": 394660 }, { "epoch": 1.99, "learning_rate": 1.3258598160546082e-06, "loss": 0.0072, "step": 394670 }, { "epoch": 1.99, "learning_rate": 1.318292123040598e-06, "loss": 0.0054, "step": 394680 }, { "epoch": 1.99, "learning_rate": 1.3107244300265876e-06, "loss": 0.0043, "step": 394690 }, { "epoch": 1.99, "learning_rate": 1.3031567370125773e-06, "loss": 0.0046, "step": 394700 }, { "epoch": 1.99, "learning_rate": 1.295589043998567e-06, "loss": 0.0046, "step": 394710 }, { "epoch": 1.99, "learning_rate": 1.2880213509845567e-06, "loss": 0.0069, "step": 394720 }, { "epoch": 1.99, "learning_rate": 1.2804536579705464e-06, "loss": 0.0058, "step": 394730 }, { "epoch": 1.99, "learning_rate": 1.2728859649565361e-06, "loss": 0.0044, "step": 394740 }, { "epoch": 1.99, "learning_rate": 1.2653182719425258e-06, "loss": 0.0052, "step": 394750 }, { "epoch": 1.99, "learning_rate": 1.2577505789285155e-06, "loss": 0.0067, "step": 394760 }, { "epoch": 1.99, "learning_rate": 1.2501828859145052e-06, "loss": 0.0053, "step": 394770 }, { "epoch": 1.99, "learning_rate": 1.2426151929004947e-06, "loss": 0.0084, "step": 394780 }, { "epoch": 1.99, "learning_rate": 1.2350474998864844e-06, "loss": 0.0058, "step": 394790 }, { "epoch": 1.99, "learning_rate": 1.2274798068724741e-06, "loss": 0.0066, "step": 394800 }, { "epoch": 1.99, "learning_rate": 1.2199121138584638e-06, "loss": 0.0061, "step": 394810 }, { "epoch": 1.99, "learning_rate": 1.2123444208444535e-06, "loss": 0.0048, "step": 394820 }, { "epoch": 1.99, "learning_rate": 1.2047767278304432e-06, "loss": 0.0051, "step": 394830 }, { "epoch": 1.99, "learning_rate": 1.197209034816433e-06, "loss": 0.0089, "step": 394840 }, { "epoch": 1.99, "learning_rate": 1.1896413418024226e-06, "loss": 0.0069, "step": 394850 }, { "epoch": 1.99, "learning_rate": 1.1820736487884123e-06, "loss": 0.0043, "step": 394860 }, { "epoch": 1.99, "learning_rate": 1.174505955774402e-06, "loss": 0.0074, "step": 394870 }, { "epoch": 1.99, "learning_rate": 1.1669382627603917e-06, "loss": 0.0052, "step": 394880 }, { "epoch": 1.99, "learning_rate": 1.1593705697463812e-06, "loss": 0.0048, "step": 394890 }, { "epoch": 1.99, "learning_rate": 1.151802876732371e-06, "loss": 0.0045, "step": 394900 }, { "epoch": 1.99, "learning_rate": 1.1442351837183606e-06, "loss": 0.0047, "step": 394910 }, { "epoch": 1.99, "learning_rate": 1.1366674907043503e-06, "loss": 0.0048, "step": 394920 }, { "epoch": 1.99, "learning_rate": 1.12909979769034e-06, "loss": 0.0046, "step": 394930 }, { "epoch": 1.99, "learning_rate": 1.1215321046763295e-06, "loss": 0.0046, "step": 394940 }, { "epoch": 1.99, "learning_rate": 1.1139644116623192e-06, "loss": 0.0043, "step": 394950 }, { "epoch": 1.99, "learning_rate": 1.106396718648309e-06, "loss": 0.0062, "step": 394960 }, { "epoch": 1.99, "learning_rate": 1.0988290256342986e-06, "loss": 0.0056, "step": 394970 }, { "epoch": 1.99, "learning_rate": 1.0912613326202883e-06, "loss": 0.0034, "step": 394980 }, { "epoch": 1.99, "learning_rate": 1.083693639606278e-06, "loss": 0.0043, "step": 394990 }, { "epoch": 1.99, "learning_rate": 1.0761259465922677e-06, "loss": 0.0048, "step": 395000 }, { "epoch": 1.99, "eval_cer": 0.9144168841162651, "eval_loss": 0.004111517686396837, "eval_runtime": 115.9763, "eval_samples_per_second": 17.245, "eval_steps_per_second": 4.311, "step": 395000 }, { "epoch": 1.99, "learning_rate": 1.0685582535782574e-06, "loss": 0.0043, "step": 395010 }, { "epoch": 1.99, "learning_rate": 1.0609905605642471e-06, "loss": 0.0083, "step": 395020 }, { "epoch": 1.99, "learning_rate": 1.0534228675502368e-06, "loss": 0.0055, "step": 395030 }, { "epoch": 1.99, "learning_rate": 1.0458551745362265e-06, "loss": 0.0054, "step": 395040 }, { "epoch": 1.99, "learning_rate": 1.0382874815222162e-06, "loss": 0.0062, "step": 395050 }, { "epoch": 1.99, "learning_rate": 1.0307197885082057e-06, "loss": 0.0048, "step": 395060 }, { "epoch": 1.99, "learning_rate": 1.0231520954941954e-06, "loss": 0.0065, "step": 395070 }, { "epoch": 1.99, "learning_rate": 1.0155844024801851e-06, "loss": 0.0055, "step": 395080 }, { "epoch": 1.99, "learning_rate": 1.0080167094661748e-06, "loss": 0.0058, "step": 395090 }, { "epoch": 1.99, "learning_rate": 1.0004490164521645e-06, "loss": 0.0066, "step": 395100 }, { "epoch": 1.99, "learning_rate": 9.928813234381542e-07, "loss": 0.0042, "step": 395110 }, { "epoch": 1.99, "learning_rate": 9.85313630424144e-07, "loss": 0.0051, "step": 395120 }, { "epoch": 1.99, "learning_rate": 9.777459374101336e-07, "loss": 0.0048, "step": 395130 }, { "epoch": 1.99, "learning_rate": 9.701782443961233e-07, "loss": 0.0041, "step": 395140 }, { "epoch": 1.99, "learning_rate": 9.62610551382113e-07, "loss": 0.0046, "step": 395150 }, { "epoch": 1.99, "learning_rate": 9.550428583681027e-07, "loss": 0.0058, "step": 395160 }, { "epoch": 1.99, "learning_rate": 9.474751653540923e-07, "loss": 0.0049, "step": 395170 }, { "epoch": 1.99, "learning_rate": 9.39907472340082e-07, "loss": 0.0058, "step": 395180 }, { "epoch": 1.99, "learning_rate": 9.323397793260717e-07, "loss": 0.0057, "step": 395190 }, { "epoch": 1.99, "learning_rate": 9.247720863120612e-07, "loss": 0.0089, "step": 395200 }, { "epoch": 1.99, "learning_rate": 9.172043932980509e-07, "loss": 0.006, "step": 395210 }, { "epoch": 1.99, "learning_rate": 9.096367002840406e-07, "loss": 0.005, "step": 395220 }, { "epoch": 1.99, "learning_rate": 9.020690072700303e-07, "loss": 0.0051, "step": 395230 }, { "epoch": 1.99, "learning_rate": 8.9450131425602e-07, "loss": 0.006, "step": 395240 }, { "epoch": 1.99, "learning_rate": 8.869336212420096e-07, "loss": 0.0049, "step": 395250 }, { "epoch": 1.99, "learning_rate": 8.793659282279993e-07, "loss": 0.0057, "step": 395260 }, { "epoch": 1.99, "learning_rate": 8.71798235213989e-07, "loss": 0.0048, "step": 395270 }, { "epoch": 1.99, "learning_rate": 8.642305421999787e-07, "loss": 0.004, "step": 395280 }, { "epoch": 1.99, "learning_rate": 8.566628491859684e-07, "loss": 0.0033, "step": 395290 }, { "epoch": 1.99, "learning_rate": 8.490951561719581e-07, "loss": 0.0053, "step": 395300 }, { "epoch": 1.99, "learning_rate": 8.415274631579477e-07, "loss": 0.0056, "step": 395310 }, { "epoch": 1.99, "learning_rate": 8.339597701439374e-07, "loss": 0.0054, "step": 395320 }, { "epoch": 1.99, "learning_rate": 8.263920771299271e-07, "loss": 0.0045, "step": 395330 }, { "epoch": 1.99, "learning_rate": 8.188243841159168e-07, "loss": 0.0059, "step": 395340 }, { "epoch": 1.99, "learning_rate": 8.112566911019065e-07, "loss": 0.0061, "step": 395350 }, { "epoch": 1.99, "learning_rate": 8.036889980878962e-07, "loss": 0.005, "step": 395360 }, { "epoch": 1.99, "learning_rate": 7.961213050738858e-07, "loss": 0.0051, "step": 395370 }, { "epoch": 1.99, "learning_rate": 7.885536120598755e-07, "loss": 0.0066, "step": 395380 }, { "epoch": 1.99, "learning_rate": 7.809859190458652e-07, "loss": 0.0048, "step": 395390 }, { "epoch": 1.99, "learning_rate": 7.734182260318549e-07, "loss": 0.0054, "step": 395400 }, { "epoch": 1.99, "learning_rate": 7.658505330178446e-07, "loss": 0.0068, "step": 395410 }, { "epoch": 1.99, "learning_rate": 7.582828400038343e-07, "loss": 0.0089, "step": 395420 }, { "epoch": 1.99, "learning_rate": 7.507151469898239e-07, "loss": 0.0066, "step": 395430 }, { "epoch": 2.0, "learning_rate": 7.431474539758136e-07, "loss": 0.0056, "step": 395440 }, { "epoch": 2.0, "learning_rate": 7.355797609618033e-07, "loss": 0.0045, "step": 395450 }, { "epoch": 2.0, "learning_rate": 7.28012067947793e-07, "loss": 0.0056, "step": 395460 }, { "epoch": 2.0, "learning_rate": 7.204443749337827e-07, "loss": 0.0042, "step": 395470 }, { "epoch": 2.0, "learning_rate": 7.128766819197722e-07, "loss": 0.0059, "step": 395480 }, { "epoch": 2.0, "learning_rate": 7.053089889057619e-07, "loss": 0.008, "step": 395490 }, { "epoch": 2.0, "learning_rate": 6.977412958917516e-07, "loss": 0.0062, "step": 395500 }, { "epoch": 2.0, "learning_rate": 6.901736028777413e-07, "loss": 0.0062, "step": 395510 }, { "epoch": 2.0, "learning_rate": 6.82605909863731e-07, "loss": 0.0042, "step": 395520 }, { "epoch": 2.0, "learning_rate": 6.750382168497206e-07, "loss": 0.004, "step": 395530 }, { "epoch": 2.0, "learning_rate": 6.674705238357103e-07, "loss": 0.0054, "step": 395540 }, { "epoch": 2.0, "learning_rate": 6.599028308217e-07, "loss": 0.0066, "step": 395550 }, { "epoch": 2.0, "learning_rate": 6.523351378076897e-07, "loss": 0.0051, "step": 395560 }, { "epoch": 2.0, "learning_rate": 6.447674447936794e-07, "loss": 0.0068, "step": 395570 }, { "epoch": 2.0, "learning_rate": 6.371997517796691e-07, "loss": 0.0058, "step": 395580 }, { "epoch": 2.0, "learning_rate": 6.296320587656587e-07, "loss": 0.0053, "step": 395590 }, { "epoch": 2.0, "learning_rate": 6.220643657516484e-07, "loss": 0.0043, "step": 395600 }, { "epoch": 2.0, "learning_rate": 6.144966727376381e-07, "loss": 0.0056, "step": 395610 }, { "epoch": 2.0, "learning_rate": 6.069289797236278e-07, "loss": 0.0036, "step": 395620 }, { "epoch": 2.0, "learning_rate": 5.993612867096175e-07, "loss": 0.0052, "step": 395630 }, { "epoch": 2.0, "learning_rate": 5.917935936956072e-07, "loss": 0.0069, "step": 395640 }, { "epoch": 2.0, "learning_rate": 5.842259006815968e-07, "loss": 0.0048, "step": 395650 }, { "epoch": 2.0, "learning_rate": 5.766582076675865e-07, "loss": 0.0064, "step": 395660 }, { "epoch": 2.0, "learning_rate": 5.690905146535762e-07, "loss": 0.005, "step": 395670 }, { "epoch": 2.0, "learning_rate": 5.615228216395658e-07, "loss": 0.0061, "step": 395680 }, { "epoch": 2.0, "learning_rate": 5.539551286255555e-07, "loss": 0.0051, "step": 395690 }, { "epoch": 2.0, "learning_rate": 5.463874356115452e-07, "loss": 0.0065, "step": 395700 }, { "epoch": 2.0, "learning_rate": 5.388197425975349e-07, "loss": 0.0054, "step": 395710 }, { "epoch": 2.0, "learning_rate": 5.312520495835246e-07, "loss": 0.0042, "step": 395720 }, { "epoch": 2.0, "learning_rate": 5.236843565695142e-07, "loss": 0.0079, "step": 395730 }, { "epoch": 2.0, "learning_rate": 5.161166635555039e-07, "loss": 0.0063, "step": 395740 }, { "epoch": 2.0, "learning_rate": 5.085489705414936e-07, "loss": 0.0047, "step": 395750 }, { "epoch": 2.0, "learning_rate": 5.009812775274833e-07, "loss": 0.0086, "step": 395760 }, { "epoch": 2.0, "learning_rate": 4.93413584513473e-07, "loss": 0.0062, "step": 395770 }, { "epoch": 2.0, "learning_rate": 4.858458914994627e-07, "loss": 0.0044, "step": 395780 }, { "epoch": 2.0, "learning_rate": 4.782781984854523e-07, "loss": 0.0036, "step": 395790 }, { "epoch": 2.0, "learning_rate": 4.70710505471442e-07, "loss": 0.0067, "step": 395800 }, { "epoch": 2.0, "learning_rate": 4.631428124574317e-07, "loss": 0.0058, "step": 395810 }, { "epoch": 2.0, "learning_rate": 4.5557511944342136e-07, "loss": 0.0068, "step": 395820 }, { "epoch": 2.0, "learning_rate": 4.48007426429411e-07, "loss": 0.0067, "step": 395830 }, { "epoch": 2.0, "learning_rate": 4.404397334154007e-07, "loss": 0.0083, "step": 395840 }, { "epoch": 2.0, "learning_rate": 4.328720404013904e-07, "loss": 0.005, "step": 395850 }, { "epoch": 2.0, "learning_rate": 4.2530434738738006e-07, "loss": 0.006, "step": 395860 }, { "epoch": 2.0, "learning_rate": 4.1773665437336976e-07, "loss": 0.0043, "step": 395870 }, { "epoch": 2.0, "learning_rate": 4.1016896135935946e-07, "loss": 0.0056, "step": 395880 }, { "epoch": 2.0, "learning_rate": 4.026012683453491e-07, "loss": 0.0065, "step": 395890 }, { "epoch": 2.0, "learning_rate": 3.950335753313388e-07, "loss": 0.0047, "step": 395900 }, { "epoch": 2.0, "learning_rate": 3.8746588231732846e-07, "loss": 0.0051, "step": 395910 }, { "epoch": 2.0, "learning_rate": 3.7989818930331816e-07, "loss": 0.0048, "step": 395920 }, { "epoch": 2.0, "learning_rate": 3.7233049628930786e-07, "loss": 0.0056, "step": 395930 }, { "epoch": 2.0, "learning_rate": 3.647628032752975e-07, "loss": 0.0061, "step": 395940 }, { "epoch": 2.0, "learning_rate": 3.5719511026128716e-07, "loss": 0.004, "step": 395950 }, { "epoch": 2.0, "learning_rate": 3.4962741724727686e-07, "loss": 0.0052, "step": 395960 }, { "epoch": 2.0, "learning_rate": 3.420597242332665e-07, "loss": 0.0054, "step": 395970 }, { "epoch": 2.0, "learning_rate": 3.344920312192562e-07, "loss": 0.0061, "step": 395980 }, { "epoch": 2.0, "learning_rate": 3.269243382052459e-07, "loss": 0.005, "step": 395990 }, { "epoch": 2.0, "learning_rate": 3.1935664519123556e-07, "loss": 0.0044, "step": 396000 }, { "epoch": 2.0, "eval_cer": 0.9144159137201398, "eval_loss": 0.004107584245502949, "eval_runtime": 116.1979, "eval_samples_per_second": 17.212, "eval_steps_per_second": 4.303, "step": 396000 }, { "epoch": 2.0, "learning_rate": 3.1178895217722526e-07, "loss": 0.0042, "step": 396010 }, { "epoch": 2.0, "learning_rate": 3.0422125916321496e-07, "loss": 0.0065, "step": 396020 }, { "epoch": 2.0, "learning_rate": 2.966535661492046e-07, "loss": 0.0079, "step": 396030 }, { "epoch": 2.0, "learning_rate": 2.890858731351943e-07, "loss": 0.0049, "step": 396040 }, { "epoch": 2.0, "learning_rate": 2.8151818012118396e-07, "loss": 0.0066, "step": 396050 }, { "epoch": 2.0, "learning_rate": 2.7395048710717366e-07, "loss": 0.0055, "step": 396060 }, { "epoch": 2.0, "learning_rate": 2.663827940931633e-07, "loss": 0.0048, "step": 396070 }, { "epoch": 2.0, "learning_rate": 2.58815101079153e-07, "loss": 0.0059, "step": 396080 }, { "epoch": 2.0, "learning_rate": 2.512474080651427e-07, "loss": 0.0055, "step": 396090 }, { "epoch": 2.0, "learning_rate": 2.4367971505113236e-07, "loss": 0.0039, "step": 396100 }, { "epoch": 2.0, "learning_rate": 2.3611202203712206e-07, "loss": 0.0043, "step": 396110 }, { "epoch": 2.0, "learning_rate": 2.285443290231117e-07, "loss": 0.0069, "step": 396120 }, { "epoch": 2.0, "learning_rate": 2.2097663600910138e-07, "loss": 0.0048, "step": 396130 }, { "epoch": 2.0, "learning_rate": 2.1340894299509105e-07, "loss": 0.0041, "step": 396140 }, { "epoch": 2.0, "learning_rate": 2.0584124998108076e-07, "loss": 0.0069, "step": 396150 }, { "epoch": 2.0, "learning_rate": 1.9827355696707043e-07, "loss": 0.0048, "step": 396160 }, { "epoch": 2.0, "learning_rate": 1.907058639530601e-07, "loss": 0.0061, "step": 396170 }, { "epoch": 2.0, "learning_rate": 1.831381709390498e-07, "loss": 0.0049, "step": 396180 }, { "epoch": 2.0, "learning_rate": 1.7557047792503945e-07, "loss": 0.0058, "step": 396190 }, { "epoch": 2.0, "learning_rate": 1.6800278491102913e-07, "loss": 0.0052, "step": 396200 }, { "epoch": 2.0, "learning_rate": 1.604350918970188e-07, "loss": 0.0048, "step": 396210 }, { "epoch": 2.0, "learning_rate": 1.528673988830085e-07, "loss": 0.0044, "step": 396220 }, { "epoch": 2.0, "learning_rate": 1.4529970586899818e-07, "loss": 0.0069, "step": 396230 }, { "epoch": 2.0, "learning_rate": 1.3773201285498785e-07, "loss": 0.0053, "step": 396240 }, { "epoch": 2.0, "learning_rate": 1.3016431984097753e-07, "loss": 0.0071, "step": 396250 }, { "epoch": 2.0, "learning_rate": 1.225966268269672e-07, "loss": 0.0066, "step": 396260 }, { "epoch": 2.0, "learning_rate": 1.1502893381295688e-07, "loss": 0.0054, "step": 396270 }, { "epoch": 2.0, "learning_rate": 1.0746124079894656e-07, "loss": 0.006, "step": 396280 }, { "epoch": 2.0, "learning_rate": 9.989354778493625e-08, "loss": 0.0061, "step": 396290 }, { "epoch": 2.0, "learning_rate": 9.232585477092593e-08, "loss": 0.0059, "step": 396300 }, { "epoch": 2.0, "learning_rate": 8.47581617569156e-08, "loss": 0.0049, "step": 396310 }, { "epoch": 2.0, "learning_rate": 7.719046874290528e-08, "loss": 0.0063, "step": 396320 }, { "epoch": 2.0, "learning_rate": 6.962277572889495e-08, "loss": 0.0069, "step": 396330 }, { "epoch": 2.0, "learning_rate": 6.205508271488464e-08, "loss": 0.0054, "step": 396340 }, { "epoch": 2.0, "learning_rate": 5.4487389700874314e-08, "loss": 0.0046, "step": 396350 }, { "epoch": 2.0, "learning_rate": 4.6919696686863995e-08, "loss": 0.0044, "step": 396360 }, { "epoch": 2.0, "learning_rate": 3.935200367285367e-08, "loss": 0.0049, "step": 396370 }, { "epoch": 2.0, "learning_rate": 3.178431065884335e-08, "loss": 0.0076, "step": 396380 }, { "epoch": 2.0, "learning_rate": 2.421661764483303e-08, "loss": 0.0049, "step": 396390 }, { "epoch": 2.0, "learning_rate": 1.6648924630822707e-08, "loss": 0.007, "step": 396400 }, { "epoch": 2.0, "learning_rate": 9.081231616812386e-09, "loss": 0.0071, "step": 396410 }, { "epoch": 2.0, "learning_rate": 1.5135386028020643e-09, "loss": 0.0046, "step": 396420 }, { "epoch": 2.0, "step": 396422, "total_flos": 1.969031441954304e+18, "train_loss": 0.013614018808192265, "train_runtime": 415192.129, "train_samples_per_second": 30.553, "train_steps_per_second": 0.955 } ], "max_steps": 396422, "num_train_epochs": 2, "total_flos": 1.969031441954304e+18, "trial_name": null, "trial_params": null }