{ "best_metric": 0.9197731329793244, "best_model_checkpoint": "./models/bart-base-spelling-nl-2m/checkpoint-158000", "epoch": 1.9999935457845905, "global_step": 309874, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 0.00029999031864564305, "loss": 4.6156, "step": 10 }, { "epoch": 0.0, "learning_rate": 0.00029998063729128613, "loss": 1.343, "step": 20 }, { "epoch": 0.0, "learning_rate": 0.0002999709559369292, "loss": 1.0206, "step": 30 }, { "epoch": 0.0, "learning_rate": 0.00029996127458257224, "loss": 0.9534, "step": 40 }, { "epoch": 0.0, "learning_rate": 0.0002999515932282153, "loss": 0.8341, "step": 50 }, { "epoch": 0.0, "learning_rate": 0.0002999419118738584, "loss": 0.7678, "step": 60 }, { "epoch": 0.0, "learning_rate": 0.0002999322305195014, "loss": 0.7105, "step": 70 }, { "epoch": 0.0, "learning_rate": 0.0002999225491651445, "loss": 0.699, "step": 80 }, { "epoch": 0.0, "learning_rate": 0.0002999128678107876, "loss": 0.6662, "step": 90 }, { "epoch": 0.0, "learning_rate": 0.00029990318645643066, "loss": 0.6317, "step": 100 }, { "epoch": 0.0, "learning_rate": 0.0002998935051020737, "loss": 0.622, "step": 110 }, { "epoch": 0.0, "learning_rate": 0.00029988382374771677, "loss": 0.6266, "step": 120 }, { "epoch": 0.0, "learning_rate": 0.00029987414239335985, "loss": 0.5759, "step": 130 }, { "epoch": 0.0, "learning_rate": 0.00029986446103900293, "loss": 0.5915, "step": 140 }, { "epoch": 0.0, "learning_rate": 0.000299854779684646, "loss": 0.5852, "step": 150 }, { "epoch": 0.0, "learning_rate": 0.0002998450983302891, "loss": 0.5174, "step": 160 }, { "epoch": 0.0, "learning_rate": 0.00029983541697593217, "loss": 0.5193, "step": 170 }, { "epoch": 0.0, "learning_rate": 0.0002998257356215752, "loss": 0.5252, "step": 180 }, { "epoch": 0.0, "learning_rate": 0.0002998160542672183, "loss": 0.5231, "step": 190 }, { "epoch": 0.0, "learning_rate": 0.00029980637291286135, "loss": 0.5039, "step": 200 }, { "epoch": 0.0, "learning_rate": 0.0002997966915585044, "loss": 0.5046, "step": 210 }, { "epoch": 0.0, "learning_rate": 0.00029978701020414746, "loss": 0.4904, "step": 220 }, { "epoch": 0.0, "learning_rate": 0.00029977732884979054, "loss": 0.4778, "step": 230 }, { "epoch": 0.0, "learning_rate": 0.0002997676474954336, "loss": 0.4769, "step": 240 }, { "epoch": 0.0, "learning_rate": 0.00029975796614107664, "loss": 0.4826, "step": 250 }, { "epoch": 0.0, "learning_rate": 0.0002997482847867197, "loss": 0.4792, "step": 260 }, { "epoch": 0.0, "learning_rate": 0.0002997386034323628, "loss": 0.4771, "step": 270 }, { "epoch": 0.0, "learning_rate": 0.0002997289220780059, "loss": 0.4732, "step": 280 }, { "epoch": 0.0, "learning_rate": 0.00029971924072364896, "loss": 0.4576, "step": 290 }, { "epoch": 0.0, "learning_rate": 0.00029970955936929204, "loss": 0.4423, "step": 300 }, { "epoch": 0.0, "learning_rate": 0.00029969987801493507, "loss": 0.4416, "step": 310 }, { "epoch": 0.0, "learning_rate": 0.00029969019666057815, "loss": 0.448, "step": 320 }, { "epoch": 0.0, "learning_rate": 0.00029968051530622123, "loss": 0.4101, "step": 330 }, { "epoch": 0.0, "learning_rate": 0.00029967083395186425, "loss": 0.4048, "step": 340 }, { "epoch": 0.0, "learning_rate": 0.00029966115259750733, "loss": 0.4128, "step": 350 }, { "epoch": 0.0, "learning_rate": 0.0002996514712431504, "loss": 0.4237, "step": 360 }, { "epoch": 0.0, "learning_rate": 0.0002996417898887935, "loss": 0.3986, "step": 370 }, { "epoch": 0.0, "learning_rate": 0.00029963210853443657, "loss": 0.433, "step": 380 }, { "epoch": 0.0, "learning_rate": 0.0002996224271800796, "loss": 0.3928, "step": 390 }, { "epoch": 0.0, "learning_rate": 0.0002996127458257227, "loss": 0.3997, "step": 400 }, { "epoch": 0.0, "learning_rate": 0.00029960306447136576, "loss": 0.3833, "step": 410 }, { "epoch": 0.0, "learning_rate": 0.00029959338311700884, "loss": 0.3819, "step": 420 }, { "epoch": 0.0, "learning_rate": 0.0002995837017626519, "loss": 0.3894, "step": 430 }, { "epoch": 0.0, "learning_rate": 0.00029957402040829494, "loss": 0.3804, "step": 440 }, { "epoch": 0.0, "learning_rate": 0.000299564339053938, "loss": 0.3933, "step": 450 }, { "epoch": 0.0, "learning_rate": 0.0002995546576995811, "loss": 0.3748, "step": 460 }, { "epoch": 0.0, "learning_rate": 0.00029954497634522413, "loss": 0.3799, "step": 470 }, { "epoch": 0.0, "learning_rate": 0.0002995352949908672, "loss": 0.3612, "step": 480 }, { "epoch": 0.0, "learning_rate": 0.0002995256136365103, "loss": 0.392, "step": 490 }, { "epoch": 0.0, "learning_rate": 0.00029951593228215337, "loss": 0.3791, "step": 500 }, { "epoch": 0.0, "learning_rate": 0.00029950625092779645, "loss": 0.3663, "step": 510 }, { "epoch": 0.0, "learning_rate": 0.0002994965695734395, "loss": 0.3514, "step": 520 }, { "epoch": 0.0, "learning_rate": 0.00029948688821908255, "loss": 0.3595, "step": 530 }, { "epoch": 0.0, "learning_rate": 0.00029947720686472563, "loss": 0.3605, "step": 540 }, { "epoch": 0.0, "learning_rate": 0.0002994675255103687, "loss": 0.3555, "step": 550 }, { "epoch": 0.0, "learning_rate": 0.0002994578441560118, "loss": 0.3563, "step": 560 }, { "epoch": 0.0, "learning_rate": 0.00029944816280165487, "loss": 0.3481, "step": 570 }, { "epoch": 0.0, "learning_rate": 0.0002994384814472979, "loss": 0.3557, "step": 580 }, { "epoch": 0.0, "learning_rate": 0.000299428800092941, "loss": 0.3522, "step": 590 }, { "epoch": 0.0, "learning_rate": 0.00029941911873858406, "loss": 0.3563, "step": 600 }, { "epoch": 0.0, "learning_rate": 0.0002994094373842271, "loss": 0.3507, "step": 610 }, { "epoch": 0.0, "learning_rate": 0.00029939975602987016, "loss": 0.3356, "step": 620 }, { "epoch": 0.0, "learning_rate": 0.00029939007467551324, "loss": 0.3457, "step": 630 }, { "epoch": 0.0, "learning_rate": 0.0002993803933211563, "loss": 0.3522, "step": 640 }, { "epoch": 0.0, "learning_rate": 0.0002993707119667994, "loss": 0.3329, "step": 650 }, { "epoch": 0.0, "learning_rate": 0.0002993610306124425, "loss": 0.3286, "step": 660 }, { "epoch": 0.0, "learning_rate": 0.0002993513492580855, "loss": 0.3394, "step": 670 }, { "epoch": 0.0, "learning_rate": 0.0002993416679037286, "loss": 0.3201, "step": 680 }, { "epoch": 0.0, "learning_rate": 0.00029933198654937167, "loss": 0.3277, "step": 690 }, { "epoch": 0.0, "learning_rate": 0.00029932230519501475, "loss": 0.3332, "step": 700 }, { "epoch": 0.0, "learning_rate": 0.00029931262384065777, "loss": 0.314, "step": 710 }, { "epoch": 0.0, "learning_rate": 0.00029930294248630085, "loss": 0.3204, "step": 720 }, { "epoch": 0.0, "learning_rate": 0.00029929326113194393, "loss": 0.3157, "step": 730 }, { "epoch": 0.0, "learning_rate": 0.00029928357977758696, "loss": 0.313, "step": 740 }, { "epoch": 0.0, "learning_rate": 0.00029927389842323004, "loss": 0.3161, "step": 750 }, { "epoch": 0.0, "learning_rate": 0.0002992642170688731, "loss": 0.3139, "step": 760 }, { "epoch": 0.0, "learning_rate": 0.0002992545357145162, "loss": 0.3181, "step": 770 }, { "epoch": 0.01, "learning_rate": 0.0002992448543601593, "loss": 0.3069, "step": 780 }, { "epoch": 0.01, "learning_rate": 0.00029923517300580236, "loss": 0.3001, "step": 790 }, { "epoch": 0.01, "learning_rate": 0.00029922549165144544, "loss": 0.3222, "step": 800 }, { "epoch": 0.01, "learning_rate": 0.00029921581029708846, "loss": 0.3097, "step": 810 }, { "epoch": 0.01, "learning_rate": 0.00029920612894273154, "loss": 0.3168, "step": 820 }, { "epoch": 0.01, "learning_rate": 0.0002991964475883746, "loss": 0.3012, "step": 830 }, { "epoch": 0.01, "learning_rate": 0.00029918676623401765, "loss": 0.2954, "step": 840 }, { "epoch": 0.01, "learning_rate": 0.0002991770848796607, "loss": 0.305, "step": 850 }, { "epoch": 0.01, "learning_rate": 0.0002991674035253038, "loss": 0.3022, "step": 860 }, { "epoch": 0.01, "learning_rate": 0.0002991577221709469, "loss": 0.2964, "step": 870 }, { "epoch": 0.01, "learning_rate": 0.0002991480408165899, "loss": 0.287, "step": 880 }, { "epoch": 0.01, "learning_rate": 0.000299138359462233, "loss": 0.3079, "step": 890 }, { "epoch": 0.01, "learning_rate": 0.00029912867810787607, "loss": 0.2928, "step": 900 }, { "epoch": 0.01, "learning_rate": 0.00029911899675351915, "loss": 0.301, "step": 910 }, { "epoch": 0.01, "learning_rate": 0.00029910931539916223, "loss": 0.2889, "step": 920 }, { "epoch": 0.01, "learning_rate": 0.0002990996340448053, "loss": 0.2932, "step": 930 }, { "epoch": 0.01, "learning_rate": 0.0002990899526904484, "loss": 0.3026, "step": 940 }, { "epoch": 0.01, "learning_rate": 0.0002990802713360914, "loss": 0.2827, "step": 950 }, { "epoch": 0.01, "learning_rate": 0.0002990705899817345, "loss": 0.2945, "step": 960 }, { "epoch": 0.01, "learning_rate": 0.0002990609086273776, "loss": 0.2753, "step": 970 }, { "epoch": 0.01, "learning_rate": 0.0002990512272730206, "loss": 0.2733, "step": 980 }, { "epoch": 0.01, "learning_rate": 0.0002990415459186637, "loss": 0.2932, "step": 990 }, { "epoch": 0.01, "learning_rate": 0.00029903186456430676, "loss": 0.277, "step": 1000 }, { "epoch": 0.01, "eval_cer": 0.9206128121116258, "eval_loss": 0.2336636185646057, "eval_runtime": 119.7068, "eval_samples_per_second": 16.707, "eval_steps_per_second": 4.177, "step": 1000 }, { "epoch": 0.01, "learning_rate": 0.00029902218320994984, "loss": 0.2856, "step": 1010 }, { "epoch": 0.01, "learning_rate": 0.00029901250185559287, "loss": 0.2949, "step": 1020 }, { "epoch": 0.01, "learning_rate": 0.00029900282050123595, "loss": 0.295, "step": 1030 }, { "epoch": 0.01, "learning_rate": 0.000298993139146879, "loss": 0.2615, "step": 1040 }, { "epoch": 0.01, "learning_rate": 0.0002989834577925221, "loss": 0.2862, "step": 1050 }, { "epoch": 0.01, "learning_rate": 0.0002989737764381652, "loss": 0.2766, "step": 1060 }, { "epoch": 0.01, "learning_rate": 0.00029896409508380826, "loss": 0.2733, "step": 1070 }, { "epoch": 0.01, "learning_rate": 0.0002989544137294513, "loss": 0.2808, "step": 1080 }, { "epoch": 0.01, "learning_rate": 0.00029894473237509437, "loss": 0.2812, "step": 1090 }, { "epoch": 0.01, "learning_rate": 0.00029893505102073745, "loss": 0.2724, "step": 1100 }, { "epoch": 0.01, "learning_rate": 0.0002989253696663805, "loss": 0.2764, "step": 1110 }, { "epoch": 0.01, "learning_rate": 0.00029891568831202356, "loss": 0.2796, "step": 1120 }, { "epoch": 0.01, "learning_rate": 0.00029890600695766663, "loss": 0.2724, "step": 1130 }, { "epoch": 0.01, "learning_rate": 0.0002988963256033097, "loss": 0.2541, "step": 1140 }, { "epoch": 0.01, "learning_rate": 0.0002988866442489528, "loss": 0.2541, "step": 1150 }, { "epoch": 0.01, "learning_rate": 0.0002988769628945958, "loss": 0.2694, "step": 1160 }, { "epoch": 0.01, "learning_rate": 0.0002988672815402389, "loss": 0.2667, "step": 1170 }, { "epoch": 0.01, "learning_rate": 0.000298857600185882, "loss": 0.2663, "step": 1180 }, { "epoch": 0.01, "learning_rate": 0.00029884791883152506, "loss": 0.2622, "step": 1190 }, { "epoch": 0.01, "learning_rate": 0.00029883823747716814, "loss": 0.2689, "step": 1200 }, { "epoch": 0.01, "learning_rate": 0.00029882855612281116, "loss": 0.2575, "step": 1210 }, { "epoch": 0.01, "learning_rate": 0.00029881887476845424, "loss": 0.2625, "step": 1220 }, { "epoch": 0.01, "learning_rate": 0.0002988091934140973, "loss": 0.2727, "step": 1230 }, { "epoch": 0.01, "learning_rate": 0.00029879951205974035, "loss": 0.2649, "step": 1240 }, { "epoch": 0.01, "learning_rate": 0.00029878983070538343, "loss": 0.2687, "step": 1250 }, { "epoch": 0.01, "learning_rate": 0.0002987801493510265, "loss": 0.262, "step": 1260 }, { "epoch": 0.01, "learning_rate": 0.0002987704679966696, "loss": 0.2517, "step": 1270 }, { "epoch": 0.01, "learning_rate": 0.00029876078664231267, "loss": 0.2721, "step": 1280 }, { "epoch": 0.01, "learning_rate": 0.00029875110528795575, "loss": 0.2573, "step": 1290 }, { "epoch": 0.01, "learning_rate": 0.0002987414239335988, "loss": 0.2716, "step": 1300 }, { "epoch": 0.01, "learning_rate": 0.00029873174257924185, "loss": 0.2558, "step": 1310 }, { "epoch": 0.01, "learning_rate": 0.00029872206122488493, "loss": 0.2672, "step": 1320 }, { "epoch": 0.01, "learning_rate": 0.000298712379870528, "loss": 0.2624, "step": 1330 }, { "epoch": 0.01, "learning_rate": 0.0002987026985161711, "loss": 0.2629, "step": 1340 }, { "epoch": 0.01, "learning_rate": 0.0002986930171618141, "loss": 0.2537, "step": 1350 }, { "epoch": 0.01, "learning_rate": 0.0002986833358074572, "loss": 0.2608, "step": 1360 }, { "epoch": 0.01, "learning_rate": 0.0002986736544531003, "loss": 0.2553, "step": 1370 }, { "epoch": 0.01, "learning_rate": 0.0002986639730987433, "loss": 0.2651, "step": 1380 }, { "epoch": 0.01, "learning_rate": 0.0002986542917443864, "loss": 0.2504, "step": 1390 }, { "epoch": 0.01, "learning_rate": 0.00029864461039002946, "loss": 0.2465, "step": 1400 }, { "epoch": 0.01, "learning_rate": 0.00029863492903567254, "loss": 0.2565, "step": 1410 }, { "epoch": 0.01, "learning_rate": 0.0002986252476813156, "loss": 0.2687, "step": 1420 }, { "epoch": 0.01, "learning_rate": 0.0002986155663269587, "loss": 0.2671, "step": 1430 }, { "epoch": 0.01, "learning_rate": 0.00029860588497260173, "loss": 0.2442, "step": 1440 }, { "epoch": 0.01, "learning_rate": 0.0002985962036182448, "loss": 0.2556, "step": 1450 }, { "epoch": 0.01, "learning_rate": 0.0002985865222638879, "loss": 0.2609, "step": 1460 }, { "epoch": 0.01, "learning_rate": 0.00029857684090953097, "loss": 0.2459, "step": 1470 }, { "epoch": 0.01, "learning_rate": 0.000298567159555174, "loss": 0.2409, "step": 1480 }, { "epoch": 0.01, "learning_rate": 0.0002985574782008171, "loss": 0.2457, "step": 1490 }, { "epoch": 0.01, "learning_rate": 0.00029854779684646015, "loss": 0.2614, "step": 1500 }, { "epoch": 0.01, "learning_rate": 0.0002985381154921032, "loss": 0.2455, "step": 1510 }, { "epoch": 0.01, "learning_rate": 0.00029852843413774626, "loss": 0.2352, "step": 1520 }, { "epoch": 0.01, "learning_rate": 0.00029851875278338934, "loss": 0.243, "step": 1530 }, { "epoch": 0.01, "learning_rate": 0.0002985090714290324, "loss": 0.2383, "step": 1540 }, { "epoch": 0.01, "learning_rate": 0.0002984993900746755, "loss": 0.2359, "step": 1550 }, { "epoch": 0.01, "learning_rate": 0.0002984897087203186, "loss": 0.2542, "step": 1560 }, { "epoch": 0.01, "learning_rate": 0.00029848002736596166, "loss": 0.2485, "step": 1570 }, { "epoch": 0.01, "learning_rate": 0.0002984703460116047, "loss": 0.2399, "step": 1580 }, { "epoch": 0.01, "learning_rate": 0.00029846066465724776, "loss": 0.2427, "step": 1590 }, { "epoch": 0.01, "learning_rate": 0.00029845098330289084, "loss": 0.2422, "step": 1600 }, { "epoch": 0.01, "learning_rate": 0.00029844130194853387, "loss": 0.2327, "step": 1610 }, { "epoch": 0.01, "learning_rate": 0.00029843162059417695, "loss": 0.24, "step": 1620 }, { "epoch": 0.01, "learning_rate": 0.00029842193923982003, "loss": 0.2288, "step": 1630 }, { "epoch": 0.01, "learning_rate": 0.0002984122578854631, "loss": 0.2422, "step": 1640 }, { "epoch": 0.01, "learning_rate": 0.00029840257653110613, "loss": 0.2256, "step": 1650 }, { "epoch": 0.01, "learning_rate": 0.0002983928951767492, "loss": 0.2395, "step": 1660 }, { "epoch": 0.01, "learning_rate": 0.0002983832138223923, "loss": 0.2367, "step": 1670 }, { "epoch": 0.01, "learning_rate": 0.0002983735324680354, "loss": 0.2373, "step": 1680 }, { "epoch": 0.01, "learning_rate": 0.00029836385111367845, "loss": 0.2324, "step": 1690 }, { "epoch": 0.01, "learning_rate": 0.00029835416975932153, "loss": 0.2337, "step": 1700 }, { "epoch": 0.01, "learning_rate": 0.0002983444884049646, "loss": 0.2105, "step": 1710 }, { "epoch": 0.01, "learning_rate": 0.00029833480705060764, "loss": 0.2311, "step": 1720 }, { "epoch": 0.01, "learning_rate": 0.0002983251256962507, "loss": 0.2334, "step": 1730 }, { "epoch": 0.01, "learning_rate": 0.0002983154443418938, "loss": 0.2551, "step": 1740 }, { "epoch": 0.01, "learning_rate": 0.0002983057629875368, "loss": 0.2379, "step": 1750 }, { "epoch": 0.01, "learning_rate": 0.0002982960816331799, "loss": 0.2399, "step": 1760 }, { "epoch": 0.01, "learning_rate": 0.000298286400278823, "loss": 0.2271, "step": 1770 }, { "epoch": 0.01, "learning_rate": 0.00029827671892446606, "loss": 0.2369, "step": 1780 }, { "epoch": 0.01, "learning_rate": 0.0002982670375701091, "loss": 0.2296, "step": 1790 }, { "epoch": 0.01, "learning_rate": 0.00029825735621575217, "loss": 0.2223, "step": 1800 }, { "epoch": 0.01, "learning_rate": 0.00029824767486139525, "loss": 0.2359, "step": 1810 }, { "epoch": 0.01, "learning_rate": 0.00029823799350703833, "loss": 0.2307, "step": 1820 }, { "epoch": 0.01, "learning_rate": 0.0002982283121526814, "loss": 0.2218, "step": 1830 }, { "epoch": 0.01, "learning_rate": 0.0002982186307983245, "loss": 0.2424, "step": 1840 }, { "epoch": 0.01, "learning_rate": 0.0002982089494439675, "loss": 0.2239, "step": 1850 }, { "epoch": 0.01, "learning_rate": 0.0002981992680896106, "loss": 0.224, "step": 1860 }, { "epoch": 0.01, "learning_rate": 0.00029818958673525367, "loss": 0.2339, "step": 1870 }, { "epoch": 0.01, "learning_rate": 0.0002981799053808967, "loss": 0.2185, "step": 1880 }, { "epoch": 0.01, "learning_rate": 0.0002981702240265398, "loss": 0.2397, "step": 1890 }, { "epoch": 0.01, "learning_rate": 0.00029816054267218286, "loss": 0.2466, "step": 1900 }, { "epoch": 0.01, "learning_rate": 0.00029815086131782594, "loss": 0.2206, "step": 1910 }, { "epoch": 0.01, "learning_rate": 0.000298141179963469, "loss": 0.2361, "step": 1920 }, { "epoch": 0.01, "learning_rate": 0.00029813149860911204, "loss": 0.221, "step": 1930 }, { "epoch": 0.01, "learning_rate": 0.0002981218172547551, "loss": 0.205, "step": 1940 }, { "epoch": 0.01, "learning_rate": 0.0002981121359003982, "loss": 0.2301, "step": 1950 }, { "epoch": 0.01, "learning_rate": 0.0002981024545460413, "loss": 0.2227, "step": 1960 }, { "epoch": 0.01, "learning_rate": 0.00029809277319168436, "loss": 0.2191, "step": 1970 }, { "epoch": 0.01, "learning_rate": 0.00029808309183732744, "loss": 0.217, "step": 1980 }, { "epoch": 0.01, "learning_rate": 0.00029807341048297047, "loss": 0.2146, "step": 1990 }, { "epoch": 0.01, "learning_rate": 0.00029806372912861355, "loss": 0.2349, "step": 2000 }, { "epoch": 0.01, "eval_cer": 0.9204428878092871, "eval_loss": 0.1756814867258072, "eval_runtime": 120.0499, "eval_samples_per_second": 16.66, "eval_steps_per_second": 4.165, "step": 2000 }, { "epoch": 0.01, "learning_rate": 0.00029805404777425657, "loss": 0.2146, "step": 2010 }, { "epoch": 0.01, "learning_rate": 0.00029804436641989965, "loss": 0.2262, "step": 2020 }, { "epoch": 0.01, "learning_rate": 0.00029803468506554273, "loss": 0.2296, "step": 2030 }, { "epoch": 0.01, "learning_rate": 0.0002980250037111858, "loss": 0.2168, "step": 2040 }, { "epoch": 0.01, "learning_rate": 0.0002980153223568289, "loss": 0.2247, "step": 2050 }, { "epoch": 0.01, "learning_rate": 0.00029800564100247197, "loss": 0.2219, "step": 2060 }, { "epoch": 0.01, "learning_rate": 0.000297995959648115, "loss": 0.2259, "step": 2070 }, { "epoch": 0.01, "learning_rate": 0.0002979862782937581, "loss": 0.2176, "step": 2080 }, { "epoch": 0.01, "learning_rate": 0.00029797659693940116, "loss": 0.22, "step": 2090 }, { "epoch": 0.01, "learning_rate": 0.00029796691558504424, "loss": 0.2176, "step": 2100 }, { "epoch": 0.01, "learning_rate": 0.0002979572342306873, "loss": 0.2179, "step": 2110 }, { "epoch": 0.01, "learning_rate": 0.00029794755287633034, "loss": 0.2146, "step": 2120 }, { "epoch": 0.01, "learning_rate": 0.0002979378715219734, "loss": 0.2029, "step": 2130 }, { "epoch": 0.01, "learning_rate": 0.0002979281901676165, "loss": 0.2322, "step": 2140 }, { "epoch": 0.01, "learning_rate": 0.0002979185088132595, "loss": 0.2138, "step": 2150 }, { "epoch": 0.01, "learning_rate": 0.0002979088274589026, "loss": 0.2083, "step": 2160 }, { "epoch": 0.01, "learning_rate": 0.0002978991461045457, "loss": 0.2172, "step": 2170 }, { "epoch": 0.01, "learning_rate": 0.00029788946475018877, "loss": 0.2299, "step": 2180 }, { "epoch": 0.01, "learning_rate": 0.00029787978339583185, "loss": 0.2178, "step": 2190 }, { "epoch": 0.01, "learning_rate": 0.0002978701020414749, "loss": 0.2136, "step": 2200 }, { "epoch": 0.01, "learning_rate": 0.00029786042068711795, "loss": 0.2081, "step": 2210 }, { "epoch": 0.01, "learning_rate": 0.00029785073933276103, "loss": 0.2113, "step": 2220 }, { "epoch": 0.01, "learning_rate": 0.0002978410579784041, "loss": 0.2195, "step": 2230 }, { "epoch": 0.01, "learning_rate": 0.0002978313766240472, "loss": 0.2239, "step": 2240 }, { "epoch": 0.01, "learning_rate": 0.0002978216952696902, "loss": 0.2077, "step": 2250 }, { "epoch": 0.01, "learning_rate": 0.0002978120139153333, "loss": 0.2167, "step": 2260 }, { "epoch": 0.01, "learning_rate": 0.0002978023325609764, "loss": 0.2048, "step": 2270 }, { "epoch": 0.01, "learning_rate": 0.0002977926512066194, "loss": 0.2235, "step": 2280 }, { "epoch": 0.01, "learning_rate": 0.0002977829698522625, "loss": 0.2353, "step": 2290 }, { "epoch": 0.01, "learning_rate": 0.00029777328849790556, "loss": 0.2184, "step": 2300 }, { "epoch": 0.01, "learning_rate": 0.00029776360714354864, "loss": 0.2137, "step": 2310 }, { "epoch": 0.01, "learning_rate": 0.0002977539257891917, "loss": 0.2075, "step": 2320 }, { "epoch": 0.02, "learning_rate": 0.0002977442444348348, "loss": 0.1974, "step": 2330 }, { "epoch": 0.02, "learning_rate": 0.0002977345630804779, "loss": 0.1973, "step": 2340 }, { "epoch": 0.02, "learning_rate": 0.0002977248817261209, "loss": 0.2029, "step": 2350 }, { "epoch": 0.02, "learning_rate": 0.000297715200371764, "loss": 0.2081, "step": 2360 }, { "epoch": 0.02, "learning_rate": 0.00029770551901740707, "loss": 0.217, "step": 2370 }, { "epoch": 0.02, "learning_rate": 0.00029769583766305015, "loss": 0.1976, "step": 2380 }, { "epoch": 0.02, "learning_rate": 0.00029768615630869317, "loss": 0.2072, "step": 2390 }, { "epoch": 0.02, "learning_rate": 0.00029767647495433625, "loss": 0.204, "step": 2400 }, { "epoch": 0.02, "learning_rate": 0.00029766679359997933, "loss": 0.2068, "step": 2410 }, { "epoch": 0.02, "learning_rate": 0.00029765711224562236, "loss": 0.1977, "step": 2420 }, { "epoch": 0.02, "learning_rate": 0.00029764743089126544, "loss": 0.2093, "step": 2430 }, { "epoch": 0.02, "learning_rate": 0.0002976377495369085, "loss": 0.2053, "step": 2440 }, { "epoch": 0.02, "learning_rate": 0.0002976280681825516, "loss": 0.2134, "step": 2450 }, { "epoch": 0.02, "learning_rate": 0.0002976183868281947, "loss": 0.2036, "step": 2460 }, { "epoch": 0.02, "learning_rate": 0.00029760870547383775, "loss": 0.2059, "step": 2470 }, { "epoch": 0.02, "learning_rate": 0.00029759902411948083, "loss": 0.202, "step": 2480 }, { "epoch": 0.02, "learning_rate": 0.00029758934276512386, "loss": 0.1888, "step": 2490 }, { "epoch": 0.02, "learning_rate": 0.00029757966141076694, "loss": 0.2163, "step": 2500 }, { "epoch": 0.02, "learning_rate": 0.00029756998005641, "loss": 0.2155, "step": 2510 }, { "epoch": 0.02, "learning_rate": 0.00029756029870205305, "loss": 0.1994, "step": 2520 }, { "epoch": 0.02, "learning_rate": 0.0002975506173476961, "loss": 0.2103, "step": 2530 }, { "epoch": 0.02, "learning_rate": 0.0002975409359933392, "loss": 0.2211, "step": 2540 }, { "epoch": 0.02, "learning_rate": 0.0002975312546389823, "loss": 0.2132, "step": 2550 }, { "epoch": 0.02, "learning_rate": 0.0002975215732846253, "loss": 0.2035, "step": 2560 }, { "epoch": 0.02, "learning_rate": 0.0002975118919302684, "loss": 0.2082, "step": 2570 }, { "epoch": 0.02, "learning_rate": 0.00029750221057591147, "loss": 0.2018, "step": 2580 }, { "epoch": 0.02, "learning_rate": 0.00029749252922155455, "loss": 0.197, "step": 2590 }, { "epoch": 0.02, "learning_rate": 0.00029748284786719763, "loss": 0.1911, "step": 2600 }, { "epoch": 0.02, "learning_rate": 0.0002974731665128407, "loss": 0.1997, "step": 2610 }, { "epoch": 0.02, "learning_rate": 0.00029746348515848373, "loss": 0.203, "step": 2620 }, { "epoch": 0.02, "learning_rate": 0.0002974538038041268, "loss": 0.2004, "step": 2630 }, { "epoch": 0.02, "learning_rate": 0.0002974441224497699, "loss": 0.1991, "step": 2640 }, { "epoch": 0.02, "learning_rate": 0.0002974344410954129, "loss": 0.1913, "step": 2650 }, { "epoch": 0.02, "learning_rate": 0.000297424759741056, "loss": 0.1939, "step": 2660 }, { "epoch": 0.02, "learning_rate": 0.0002974150783866991, "loss": 0.2052, "step": 2670 }, { "epoch": 0.02, "learning_rate": 0.00029740539703234216, "loss": 0.1933, "step": 2680 }, { "epoch": 0.02, "learning_rate": 0.00029739571567798524, "loss": 0.2108, "step": 2690 }, { "epoch": 0.02, "learning_rate": 0.00029738603432362826, "loss": 0.2009, "step": 2700 }, { "epoch": 0.02, "learning_rate": 0.00029737635296927134, "loss": 0.1924, "step": 2710 }, { "epoch": 0.02, "learning_rate": 0.0002973666716149144, "loss": 0.1862, "step": 2720 }, { "epoch": 0.02, "learning_rate": 0.0002973569902605575, "loss": 0.1983, "step": 2730 }, { "epoch": 0.02, "learning_rate": 0.0002973473089062006, "loss": 0.1993, "step": 2740 }, { "epoch": 0.02, "learning_rate": 0.00029733762755184366, "loss": 0.1986, "step": 2750 }, { "epoch": 0.02, "learning_rate": 0.0002973279461974867, "loss": 0.2015, "step": 2760 }, { "epoch": 0.02, "learning_rate": 0.00029731826484312977, "loss": 0.2058, "step": 2770 }, { "epoch": 0.02, "learning_rate": 0.00029730858348877285, "loss": 0.2012, "step": 2780 }, { "epoch": 0.02, "learning_rate": 0.0002972989021344159, "loss": 0.2021, "step": 2790 }, { "epoch": 0.02, "learning_rate": 0.00029728922078005895, "loss": 0.1987, "step": 2800 }, { "epoch": 0.02, "learning_rate": 0.00029727953942570203, "loss": 0.1999, "step": 2810 }, { "epoch": 0.02, "learning_rate": 0.0002972698580713451, "loss": 0.1976, "step": 2820 }, { "epoch": 0.02, "learning_rate": 0.0002972601767169882, "loss": 0.2014, "step": 2830 }, { "epoch": 0.02, "learning_rate": 0.0002972504953626312, "loss": 0.1955, "step": 2840 }, { "epoch": 0.02, "learning_rate": 0.0002972408140082743, "loss": 0.216, "step": 2850 }, { "epoch": 0.02, "learning_rate": 0.0002972311326539174, "loss": 0.2178, "step": 2860 }, { "epoch": 0.02, "learning_rate": 0.00029722145129956046, "loss": 0.1887, "step": 2870 }, { "epoch": 0.02, "learning_rate": 0.00029721176994520354, "loss": 0.1936, "step": 2880 }, { "epoch": 0.02, "learning_rate": 0.00029720208859084656, "loss": 0.1834, "step": 2890 }, { "epoch": 0.02, "learning_rate": 0.00029719240723648964, "loss": 0.1873, "step": 2900 }, { "epoch": 0.02, "learning_rate": 0.0002971827258821327, "loss": 0.2133, "step": 2910 }, { "epoch": 0.02, "learning_rate": 0.00029717304452777575, "loss": 0.1958, "step": 2920 }, { "epoch": 0.02, "learning_rate": 0.00029716336317341883, "loss": 0.1991, "step": 2930 }, { "epoch": 0.02, "learning_rate": 0.0002971536818190619, "loss": 0.188, "step": 2940 }, { "epoch": 0.02, "learning_rate": 0.000297144000464705, "loss": 0.1802, "step": 2950 }, { "epoch": 0.02, "learning_rate": 0.00029713431911034807, "loss": 0.1936, "step": 2960 }, { "epoch": 0.02, "learning_rate": 0.00029712463775599115, "loss": 0.1866, "step": 2970 }, { "epoch": 0.02, "learning_rate": 0.0002971149564016342, "loss": 0.1826, "step": 2980 }, { "epoch": 0.02, "learning_rate": 0.00029710527504727725, "loss": 0.196, "step": 2990 }, { "epoch": 0.02, "learning_rate": 0.00029709559369292033, "loss": 0.1929, "step": 3000 }, { "epoch": 0.02, "eval_cer": 0.9204690995367755, "eval_loss": 0.14816394448280334, "eval_runtime": 120.365, "eval_samples_per_second": 16.616, "eval_steps_per_second": 4.154, "step": 3000 }, { "epoch": 0.02, "learning_rate": 0.0002970859123385634, "loss": 0.1944, "step": 3010 }, { "epoch": 0.02, "learning_rate": 0.00029707623098420644, "loss": 0.1924, "step": 3020 }, { "epoch": 0.02, "learning_rate": 0.0002970665496298495, "loss": 0.1789, "step": 3030 }, { "epoch": 0.02, "learning_rate": 0.0002970568682754926, "loss": 0.1865, "step": 3040 }, { "epoch": 0.02, "learning_rate": 0.0002970471869211356, "loss": 0.1836, "step": 3050 }, { "epoch": 0.02, "learning_rate": 0.0002970375055667787, "loss": 0.2035, "step": 3060 }, { "epoch": 0.02, "learning_rate": 0.0002970278242124218, "loss": 0.1871, "step": 3070 }, { "epoch": 0.02, "learning_rate": 0.00029701814285806486, "loss": 0.1853, "step": 3080 }, { "epoch": 0.02, "learning_rate": 0.00029700846150370794, "loss": 0.1796, "step": 3090 }, { "epoch": 0.02, "learning_rate": 0.000296998780149351, "loss": 0.1727, "step": 3100 }, { "epoch": 0.02, "learning_rate": 0.0002969890987949941, "loss": 0.1846, "step": 3110 }, { "epoch": 0.02, "learning_rate": 0.00029697941744063713, "loss": 0.1907, "step": 3120 }, { "epoch": 0.02, "learning_rate": 0.0002969697360862802, "loss": 0.189, "step": 3130 }, { "epoch": 0.02, "learning_rate": 0.0002969600547319233, "loss": 0.185, "step": 3140 }, { "epoch": 0.02, "learning_rate": 0.00029695037337756637, "loss": 0.192, "step": 3150 }, { "epoch": 0.02, "learning_rate": 0.0002969406920232094, "loss": 0.1885, "step": 3160 }, { "epoch": 0.02, "learning_rate": 0.0002969310106688525, "loss": 0.1976, "step": 3170 }, { "epoch": 0.02, "learning_rate": 0.00029692132931449555, "loss": 0.194, "step": 3180 }, { "epoch": 0.02, "learning_rate": 0.0002969116479601386, "loss": 0.1877, "step": 3190 }, { "epoch": 0.02, "learning_rate": 0.00029690196660578166, "loss": 0.1863, "step": 3200 }, { "epoch": 0.02, "learning_rate": 0.00029689228525142474, "loss": 0.192, "step": 3210 }, { "epoch": 0.02, "learning_rate": 0.0002968826038970678, "loss": 0.1788, "step": 3220 }, { "epoch": 0.02, "learning_rate": 0.0002968729225427109, "loss": 0.174, "step": 3230 }, { "epoch": 0.02, "learning_rate": 0.000296863241188354, "loss": 0.1919, "step": 3240 }, { "epoch": 0.02, "learning_rate": 0.00029685355983399706, "loss": 0.181, "step": 3250 }, { "epoch": 0.02, "learning_rate": 0.0002968438784796401, "loss": 0.1869, "step": 3260 }, { "epoch": 0.02, "learning_rate": 0.00029683419712528316, "loss": 0.1874, "step": 3270 }, { "epoch": 0.02, "learning_rate": 0.00029682451577092624, "loss": 0.1993, "step": 3280 }, { "epoch": 0.02, "learning_rate": 0.00029681483441656927, "loss": 0.1709, "step": 3290 }, { "epoch": 0.02, "learning_rate": 0.00029680515306221235, "loss": 0.1963, "step": 3300 }, { "epoch": 0.02, "learning_rate": 0.00029679547170785543, "loss": 0.1749, "step": 3310 }, { "epoch": 0.02, "learning_rate": 0.0002967857903534985, "loss": 0.1753, "step": 3320 }, { "epoch": 0.02, "learning_rate": 0.00029677610899914153, "loss": 0.1761, "step": 3330 }, { "epoch": 0.02, "learning_rate": 0.0002967664276447846, "loss": 0.174, "step": 3340 }, { "epoch": 0.02, "learning_rate": 0.0002967567462904277, "loss": 0.1839, "step": 3350 }, { "epoch": 0.02, "learning_rate": 0.00029674706493607077, "loss": 0.187, "step": 3360 }, { "epoch": 0.02, "learning_rate": 0.00029673738358171385, "loss": 0.1938, "step": 3370 }, { "epoch": 0.02, "learning_rate": 0.00029672770222735693, "loss": 0.1758, "step": 3380 }, { "epoch": 0.02, "learning_rate": 0.00029671802087299996, "loss": 0.1819, "step": 3390 }, { "epoch": 0.02, "learning_rate": 0.00029670833951864304, "loss": 0.1855, "step": 3400 }, { "epoch": 0.02, "learning_rate": 0.0002966986581642861, "loss": 0.1851, "step": 3410 }, { "epoch": 0.02, "learning_rate": 0.00029668897680992914, "loss": 0.1934, "step": 3420 }, { "epoch": 0.02, "learning_rate": 0.0002966792954555722, "loss": 0.1875, "step": 3430 }, { "epoch": 0.02, "learning_rate": 0.0002966696141012153, "loss": 0.1727, "step": 3440 }, { "epoch": 0.02, "learning_rate": 0.0002966599327468584, "loss": 0.1789, "step": 3450 }, { "epoch": 0.02, "learning_rate": 0.0002966502513925014, "loss": 0.1786, "step": 3460 }, { "epoch": 0.02, "learning_rate": 0.0002966405700381445, "loss": 0.1708, "step": 3470 }, { "epoch": 0.02, "learning_rate": 0.00029663088868378757, "loss": 0.1784, "step": 3480 }, { "epoch": 0.02, "learning_rate": 0.00029662120732943065, "loss": 0.1866, "step": 3490 }, { "epoch": 0.02, "learning_rate": 0.0002966115259750737, "loss": 0.1944, "step": 3500 }, { "epoch": 0.02, "learning_rate": 0.0002966018446207168, "loss": 0.1765, "step": 3510 }, { "epoch": 0.02, "learning_rate": 0.0002965921632663599, "loss": 0.1748, "step": 3520 }, { "epoch": 0.02, "learning_rate": 0.0002965824819120029, "loss": 0.1763, "step": 3530 }, { "epoch": 0.02, "learning_rate": 0.000296572800557646, "loss": 0.1897, "step": 3540 }, { "epoch": 0.02, "learning_rate": 0.00029656311920328907, "loss": 0.1747, "step": 3550 }, { "epoch": 0.02, "learning_rate": 0.0002965534378489321, "loss": 0.1931, "step": 3560 }, { "epoch": 0.02, "learning_rate": 0.0002965437564945752, "loss": 0.1789, "step": 3570 }, { "epoch": 0.02, "learning_rate": 0.00029653407514021826, "loss": 0.186, "step": 3580 }, { "epoch": 0.02, "learning_rate": 0.00029652439378586134, "loss": 0.1809, "step": 3590 }, { "epoch": 0.02, "learning_rate": 0.00029651471243150436, "loss": 0.1753, "step": 3600 }, { "epoch": 0.02, "learning_rate": 0.00029650503107714744, "loss": 0.1699, "step": 3610 }, { "epoch": 0.02, "learning_rate": 0.0002964953497227905, "loss": 0.1679, "step": 3620 }, { "epoch": 0.02, "learning_rate": 0.0002964856683684336, "loss": 0.1782, "step": 3630 }, { "epoch": 0.02, "learning_rate": 0.0002964759870140767, "loss": 0.1892, "step": 3640 }, { "epoch": 0.02, "learning_rate": 0.00029646630565971976, "loss": 0.1684, "step": 3650 }, { "epoch": 0.02, "learning_rate": 0.0002964566243053628, "loss": 0.1747, "step": 3660 }, { "epoch": 0.02, "learning_rate": 0.00029644694295100587, "loss": 0.1767, "step": 3670 }, { "epoch": 0.02, "learning_rate": 0.00029643726159664895, "loss": 0.1824, "step": 3680 }, { "epoch": 0.02, "learning_rate": 0.00029642758024229197, "loss": 0.1768, "step": 3690 }, { "epoch": 0.02, "learning_rate": 0.00029641789888793505, "loss": 0.1783, "step": 3700 }, { "epoch": 0.02, "learning_rate": 0.00029640821753357813, "loss": 0.1656, "step": 3710 }, { "epoch": 0.02, "learning_rate": 0.0002963985361792212, "loss": 0.1845, "step": 3720 }, { "epoch": 0.02, "learning_rate": 0.0002963888548248643, "loss": 0.1875, "step": 3730 }, { "epoch": 0.02, "learning_rate": 0.0002963791734705073, "loss": 0.1781, "step": 3740 }, { "epoch": 0.02, "learning_rate": 0.0002963694921161504, "loss": 0.1837, "step": 3750 }, { "epoch": 0.02, "learning_rate": 0.0002963598107617935, "loss": 0.1742, "step": 3760 }, { "epoch": 0.02, "learning_rate": 0.00029635012940743656, "loss": 0.175, "step": 3770 }, { "epoch": 0.02, "learning_rate": 0.00029634044805307964, "loss": 0.1749, "step": 3780 }, { "epoch": 0.02, "learning_rate": 0.00029633076669872266, "loss": 0.1729, "step": 3790 }, { "epoch": 0.02, "learning_rate": 0.00029632108534436574, "loss": 0.1797, "step": 3800 }, { "epoch": 0.02, "learning_rate": 0.0002963114039900088, "loss": 0.1908, "step": 3810 }, { "epoch": 0.02, "learning_rate": 0.00029630172263565185, "loss": 0.1965, "step": 3820 }, { "epoch": 0.02, "learning_rate": 0.0002962920412812949, "loss": 0.1661, "step": 3830 }, { "epoch": 0.02, "learning_rate": 0.000296282359926938, "loss": 0.1709, "step": 3840 }, { "epoch": 0.02, "learning_rate": 0.0002962726785725811, "loss": 0.1792, "step": 3850 }, { "epoch": 0.02, "learning_rate": 0.00029626299721822417, "loss": 0.1721, "step": 3860 }, { "epoch": 0.02, "learning_rate": 0.00029625331586386725, "loss": 0.1671, "step": 3870 }, { "epoch": 0.03, "learning_rate": 0.00029624363450951027, "loss": 0.1652, "step": 3880 }, { "epoch": 0.03, "learning_rate": 0.00029623395315515335, "loss": 0.1718, "step": 3890 }, { "epoch": 0.03, "learning_rate": 0.00029622427180079643, "loss": 0.1702, "step": 3900 }, { "epoch": 0.03, "learning_rate": 0.0002962145904464395, "loss": 0.1709, "step": 3910 }, { "epoch": 0.03, "learning_rate": 0.0002962049090920826, "loss": 0.1673, "step": 3920 }, { "epoch": 0.03, "learning_rate": 0.0002961952277377256, "loss": 0.1748, "step": 3930 }, { "epoch": 0.03, "learning_rate": 0.0002961855463833687, "loss": 0.1646, "step": 3940 }, { "epoch": 0.03, "learning_rate": 0.0002961758650290118, "loss": 0.1815, "step": 3950 }, { "epoch": 0.03, "learning_rate": 0.0002961661836746548, "loss": 0.1857, "step": 3960 }, { "epoch": 0.03, "learning_rate": 0.0002961565023202979, "loss": 0.1643, "step": 3970 }, { "epoch": 0.03, "learning_rate": 0.00029614682096594096, "loss": 0.1717, "step": 3980 }, { "epoch": 0.03, "learning_rate": 0.00029613713961158404, "loss": 0.1698, "step": 3990 }, { "epoch": 0.03, "learning_rate": 0.0002961274582572271, "loss": 0.1686, "step": 4000 }, { "epoch": 0.03, "eval_cer": 0.9202214439046436, "eval_loss": 0.13143764436244965, "eval_runtime": 120.5794, "eval_samples_per_second": 16.587, "eval_steps_per_second": 4.147, "step": 4000 }, { "epoch": 0.03, "learning_rate": 0.0002961177769028702, "loss": 0.1757, "step": 4010 }, { "epoch": 0.03, "learning_rate": 0.0002961080955485132, "loss": 0.1865, "step": 4020 }, { "epoch": 0.03, "learning_rate": 0.0002960984141941563, "loss": 0.1712, "step": 4030 }, { "epoch": 0.03, "learning_rate": 0.0002960887328397994, "loss": 0.1643, "step": 4040 }, { "epoch": 0.03, "learning_rate": 0.00029607905148544246, "loss": 0.1675, "step": 4050 }, { "epoch": 0.03, "learning_rate": 0.0002960693701310855, "loss": 0.1717, "step": 4060 }, { "epoch": 0.03, "learning_rate": 0.00029605968877672857, "loss": 0.1708, "step": 4070 }, { "epoch": 0.03, "learning_rate": 0.00029605000742237165, "loss": 0.1727, "step": 4080 }, { "epoch": 0.03, "learning_rate": 0.0002960403260680147, "loss": 0.1726, "step": 4090 }, { "epoch": 0.03, "learning_rate": 0.00029603064471365776, "loss": 0.1588, "step": 4100 }, { "epoch": 0.03, "learning_rate": 0.00029602096335930083, "loss": 0.168, "step": 4110 }, { "epoch": 0.03, "learning_rate": 0.0002960112820049439, "loss": 0.1642, "step": 4120 }, { "epoch": 0.03, "learning_rate": 0.000296001600650587, "loss": 0.1704, "step": 4130 }, { "epoch": 0.03, "learning_rate": 0.0002959919192962301, "loss": 0.163, "step": 4140 }, { "epoch": 0.03, "learning_rate": 0.00029598223794187315, "loss": 0.1668, "step": 4150 }, { "epoch": 0.03, "learning_rate": 0.0002959725565875162, "loss": 0.1732, "step": 4160 }, { "epoch": 0.03, "learning_rate": 0.00029596287523315926, "loss": 0.1665, "step": 4170 }, { "epoch": 0.03, "learning_rate": 0.00029595319387880234, "loss": 0.1528, "step": 4180 }, { "epoch": 0.03, "learning_rate": 0.00029594351252444536, "loss": 0.1749, "step": 4190 }, { "epoch": 0.03, "learning_rate": 0.00029593383117008844, "loss": 0.1748, "step": 4200 }, { "epoch": 0.03, "learning_rate": 0.0002959241498157315, "loss": 0.1636, "step": 4210 }, { "epoch": 0.03, "learning_rate": 0.0002959144684613746, "loss": 0.1548, "step": 4220 }, { "epoch": 0.03, "learning_rate": 0.00029590478710701763, "loss": 0.1783, "step": 4230 }, { "epoch": 0.03, "learning_rate": 0.0002958951057526607, "loss": 0.1676, "step": 4240 }, { "epoch": 0.03, "learning_rate": 0.0002958854243983038, "loss": 0.1716, "step": 4250 }, { "epoch": 0.03, "learning_rate": 0.00029587574304394687, "loss": 0.1813, "step": 4260 }, { "epoch": 0.03, "learning_rate": 0.00029586606168958995, "loss": 0.177, "step": 4270 }, { "epoch": 0.03, "learning_rate": 0.00029585638033523303, "loss": 0.1679, "step": 4280 }, { "epoch": 0.03, "learning_rate": 0.0002958466989808761, "loss": 0.1675, "step": 4290 }, { "epoch": 0.03, "learning_rate": 0.00029583701762651913, "loss": 0.1704, "step": 4300 }, { "epoch": 0.03, "learning_rate": 0.0002958273362721622, "loss": 0.1601, "step": 4310 }, { "epoch": 0.03, "learning_rate": 0.0002958176549178053, "loss": 0.1704, "step": 4320 }, { "epoch": 0.03, "learning_rate": 0.0002958079735634483, "loss": 0.1524, "step": 4330 }, { "epoch": 0.03, "learning_rate": 0.0002957982922090914, "loss": 0.1649, "step": 4340 }, { "epoch": 0.03, "learning_rate": 0.0002957886108547345, "loss": 0.1678, "step": 4350 }, { "epoch": 0.03, "learning_rate": 0.00029577892950037756, "loss": 0.165, "step": 4360 }, { "epoch": 0.03, "learning_rate": 0.0002957692481460206, "loss": 0.1678, "step": 4370 }, { "epoch": 0.03, "learning_rate": 0.00029575956679166366, "loss": 0.1698, "step": 4380 }, { "epoch": 0.03, "learning_rate": 0.00029574988543730674, "loss": 0.1609, "step": 4390 }, { "epoch": 0.03, "learning_rate": 0.0002957402040829498, "loss": 0.1747, "step": 4400 }, { "epoch": 0.03, "learning_rate": 0.0002957305227285929, "loss": 0.1796, "step": 4410 }, { "epoch": 0.03, "learning_rate": 0.000295720841374236, "loss": 0.1647, "step": 4420 }, { "epoch": 0.03, "learning_rate": 0.000295711160019879, "loss": 0.1547, "step": 4430 }, { "epoch": 0.03, "learning_rate": 0.0002957014786655221, "loss": 0.1632, "step": 4440 }, { "epoch": 0.03, "learning_rate": 0.00029569179731116517, "loss": 0.1606, "step": 4450 }, { "epoch": 0.03, "learning_rate": 0.0002956821159568082, "loss": 0.1676, "step": 4460 }, { "epoch": 0.03, "learning_rate": 0.0002956724346024513, "loss": 0.1658, "step": 4470 }, { "epoch": 0.03, "learning_rate": 0.00029566275324809435, "loss": 0.1724, "step": 4480 }, { "epoch": 0.03, "learning_rate": 0.00029565307189373743, "loss": 0.165, "step": 4490 }, { "epoch": 0.03, "learning_rate": 0.0002956433905393805, "loss": 0.1719, "step": 4500 }, { "epoch": 0.03, "learning_rate": 0.00029563370918502354, "loss": 0.166, "step": 4510 }, { "epoch": 0.03, "learning_rate": 0.0002956240278306666, "loss": 0.1635, "step": 4520 }, { "epoch": 0.03, "learning_rate": 0.0002956143464763097, "loss": 0.1696, "step": 4530 }, { "epoch": 0.03, "learning_rate": 0.0002956046651219528, "loss": 0.1781, "step": 4540 }, { "epoch": 0.03, "learning_rate": 0.00029559498376759586, "loss": 0.1605, "step": 4550 }, { "epoch": 0.03, "learning_rate": 0.00029558530241323894, "loss": 0.1701, "step": 4560 }, { "epoch": 0.03, "learning_rate": 0.00029557562105888196, "loss": 0.1613, "step": 4570 }, { "epoch": 0.03, "learning_rate": 0.00029556593970452504, "loss": 0.1563, "step": 4580 }, { "epoch": 0.03, "learning_rate": 0.0002955562583501681, "loss": 0.1591, "step": 4590 }, { "epoch": 0.03, "learning_rate": 0.00029554657699581115, "loss": 0.1609, "step": 4600 }, { "epoch": 0.03, "learning_rate": 0.00029553689564145423, "loss": 0.1613, "step": 4610 }, { "epoch": 0.03, "learning_rate": 0.0002955272142870973, "loss": 0.1668, "step": 4620 }, { "epoch": 0.03, "learning_rate": 0.0002955175329327404, "loss": 0.168, "step": 4630 }, { "epoch": 0.03, "learning_rate": 0.00029550785157838347, "loss": 0.1668, "step": 4640 }, { "epoch": 0.03, "learning_rate": 0.0002954981702240265, "loss": 0.1656, "step": 4650 }, { "epoch": 0.03, "learning_rate": 0.0002954884888696696, "loss": 0.1467, "step": 4660 }, { "epoch": 0.03, "learning_rate": 0.00029547880751531265, "loss": 0.1548, "step": 4670 }, { "epoch": 0.03, "learning_rate": 0.00029546912616095573, "loss": 0.1574, "step": 4680 }, { "epoch": 0.03, "learning_rate": 0.0002954594448065988, "loss": 0.1495, "step": 4690 }, { "epoch": 0.03, "learning_rate": 0.00029544976345224184, "loss": 0.1575, "step": 4700 }, { "epoch": 0.03, "learning_rate": 0.0002954400820978849, "loss": 0.1592, "step": 4710 }, { "epoch": 0.03, "learning_rate": 0.000295430400743528, "loss": 0.1645, "step": 4720 }, { "epoch": 0.03, "learning_rate": 0.000295420719389171, "loss": 0.1587, "step": 4730 }, { "epoch": 0.03, "learning_rate": 0.0002954110380348141, "loss": 0.1636, "step": 4740 }, { "epoch": 0.03, "learning_rate": 0.0002954013566804572, "loss": 0.1643, "step": 4750 }, { "epoch": 0.03, "learning_rate": 0.00029539167532610026, "loss": 0.1487, "step": 4760 }, { "epoch": 0.03, "learning_rate": 0.00029538199397174334, "loss": 0.1581, "step": 4770 }, { "epoch": 0.03, "learning_rate": 0.0002953723126173864, "loss": 0.1535, "step": 4780 }, { "epoch": 0.03, "learning_rate": 0.00029536263126302945, "loss": 0.1745, "step": 4790 }, { "epoch": 0.03, "learning_rate": 0.00029535294990867253, "loss": 0.1581, "step": 4800 }, { "epoch": 0.03, "learning_rate": 0.0002953432685543156, "loss": 0.1652, "step": 4810 }, { "epoch": 0.03, "learning_rate": 0.0002953335871999587, "loss": 0.1545, "step": 4820 }, { "epoch": 0.03, "learning_rate": 0.0002953239058456017, "loss": 0.1679, "step": 4830 }, { "epoch": 0.03, "learning_rate": 0.0002953142244912448, "loss": 0.1594, "step": 4840 }, { "epoch": 0.03, "learning_rate": 0.00029530454313688787, "loss": 0.1421, "step": 4850 }, { "epoch": 0.03, "learning_rate": 0.0002952948617825309, "loss": 0.1492, "step": 4860 }, { "epoch": 0.03, "learning_rate": 0.000295285180428174, "loss": 0.1579, "step": 4870 }, { "epoch": 0.03, "learning_rate": 0.00029527549907381706, "loss": 0.1519, "step": 4880 }, { "epoch": 0.03, "learning_rate": 0.00029526581771946014, "loss": 0.1515, "step": 4890 }, { "epoch": 0.03, "learning_rate": 0.0002952561363651032, "loss": 0.1607, "step": 4900 }, { "epoch": 0.03, "learning_rate": 0.0002952464550107463, "loss": 0.165, "step": 4910 }, { "epoch": 0.03, "learning_rate": 0.0002952367736563894, "loss": 0.1546, "step": 4920 }, { "epoch": 0.03, "learning_rate": 0.0002952270923020324, "loss": 0.1613, "step": 4930 }, { "epoch": 0.03, "learning_rate": 0.0002952174109476755, "loss": 0.1442, "step": 4940 }, { "epoch": 0.03, "learning_rate": 0.00029520772959331856, "loss": 0.1547, "step": 4950 }, { "epoch": 0.03, "learning_rate": 0.00029519804823896164, "loss": 0.1483, "step": 4960 }, { "epoch": 0.03, "learning_rate": 0.00029518836688460467, "loss": 0.1528, "step": 4970 }, { "epoch": 0.03, "learning_rate": 0.00029517868553024775, "loss": 0.1709, "step": 4980 }, { "epoch": 0.03, "learning_rate": 0.0002951690041758908, "loss": 0.1527, "step": 4990 }, { "epoch": 0.03, "learning_rate": 0.00029515932282153385, "loss": 0.1435, "step": 5000 }, { "epoch": 0.03, "eval_cer": 0.9202720596542764, "eval_loss": 0.11752115935087204, "eval_runtime": 120.5405, "eval_samples_per_second": 16.592, "eval_steps_per_second": 4.148, "step": 5000 }, { "epoch": 0.03, "learning_rate": 0.00029514964146717693, "loss": 0.1587, "step": 5010 }, { "epoch": 0.03, "learning_rate": 0.00029513996011282, "loss": 0.1598, "step": 5020 }, { "epoch": 0.03, "learning_rate": 0.0002951302787584631, "loss": 0.1555, "step": 5030 }, { "epoch": 0.03, "learning_rate": 0.00029512059740410617, "loss": 0.1445, "step": 5040 }, { "epoch": 0.03, "learning_rate": 0.00029511091604974925, "loss": 0.1461, "step": 5050 }, { "epoch": 0.03, "learning_rate": 0.00029510123469539233, "loss": 0.1512, "step": 5060 }, { "epoch": 0.03, "learning_rate": 0.00029509155334103536, "loss": 0.1567, "step": 5070 }, { "epoch": 0.03, "learning_rate": 0.00029508187198667844, "loss": 0.1444, "step": 5080 }, { "epoch": 0.03, "learning_rate": 0.0002950721906323215, "loss": 0.1479, "step": 5090 }, { "epoch": 0.03, "learning_rate": 0.00029506250927796454, "loss": 0.1521, "step": 5100 }, { "epoch": 0.03, "learning_rate": 0.0002950528279236076, "loss": 0.1399, "step": 5110 }, { "epoch": 0.03, "learning_rate": 0.0002950431465692507, "loss": 0.1568, "step": 5120 }, { "epoch": 0.03, "learning_rate": 0.0002950334652148938, "loss": 0.1437, "step": 5130 }, { "epoch": 0.03, "learning_rate": 0.0002950237838605368, "loss": 0.1578, "step": 5140 }, { "epoch": 0.03, "learning_rate": 0.0002950141025061799, "loss": 0.1373, "step": 5150 }, { "epoch": 0.03, "learning_rate": 0.00029500442115182297, "loss": 0.1526, "step": 5160 }, { "epoch": 0.03, "learning_rate": 0.00029499473979746605, "loss": 0.1635, "step": 5170 }, { "epoch": 0.03, "learning_rate": 0.0002949850584431091, "loss": 0.1476, "step": 5180 }, { "epoch": 0.03, "learning_rate": 0.0002949753770887522, "loss": 0.1721, "step": 5190 }, { "epoch": 0.03, "learning_rate": 0.00029496569573439523, "loss": 0.1519, "step": 5200 }, { "epoch": 0.03, "learning_rate": 0.0002949560143800383, "loss": 0.1522, "step": 5210 }, { "epoch": 0.03, "learning_rate": 0.0002949463330256814, "loss": 0.1545, "step": 5220 }, { "epoch": 0.03, "learning_rate": 0.0002949366516713244, "loss": 0.1531, "step": 5230 }, { "epoch": 0.03, "learning_rate": 0.0002949269703169675, "loss": 0.1531, "step": 5240 }, { "epoch": 0.03, "learning_rate": 0.0002949172889626106, "loss": 0.1446, "step": 5250 }, { "epoch": 0.03, "learning_rate": 0.00029490760760825366, "loss": 0.1454, "step": 5260 }, { "epoch": 0.03, "learning_rate": 0.00029489792625389674, "loss": 0.1457, "step": 5270 }, { "epoch": 0.03, "learning_rate": 0.00029488824489953976, "loss": 0.1523, "step": 5280 }, { "epoch": 0.03, "learning_rate": 0.00029487856354518284, "loss": 0.1594, "step": 5290 }, { "epoch": 0.03, "learning_rate": 0.0002948688821908259, "loss": 0.1423, "step": 5300 }, { "epoch": 0.03, "learning_rate": 0.000294859200836469, "loss": 0.1493, "step": 5310 }, { "epoch": 0.03, "learning_rate": 0.0002948495194821121, "loss": 0.1573, "step": 5320 }, { "epoch": 0.03, "learning_rate": 0.00029483983812775516, "loss": 0.1592, "step": 5330 }, { "epoch": 0.03, "learning_rate": 0.0002948301567733982, "loss": 0.1715, "step": 5340 }, { "epoch": 0.03, "learning_rate": 0.00029482047541904127, "loss": 0.138, "step": 5350 }, { "epoch": 0.03, "learning_rate": 0.00029481079406468435, "loss": 0.1524, "step": 5360 }, { "epoch": 0.03, "learning_rate": 0.00029480111271032737, "loss": 0.1443, "step": 5370 }, { "epoch": 0.03, "learning_rate": 0.00029479143135597045, "loss": 0.1384, "step": 5380 }, { "epoch": 0.03, "learning_rate": 0.00029478175000161353, "loss": 0.1533, "step": 5390 }, { "epoch": 0.03, "learning_rate": 0.0002947720686472566, "loss": 0.1419, "step": 5400 }, { "epoch": 0.03, "learning_rate": 0.0002947623872928997, "loss": 0.1362, "step": 5410 }, { "epoch": 0.03, "learning_rate": 0.0002947527059385427, "loss": 0.1451, "step": 5420 }, { "epoch": 0.04, "learning_rate": 0.0002947430245841858, "loss": 0.1496, "step": 5430 }, { "epoch": 0.04, "learning_rate": 0.0002947333432298289, "loss": 0.1457, "step": 5440 }, { "epoch": 0.04, "learning_rate": 0.00029472366187547195, "loss": 0.1553, "step": 5450 }, { "epoch": 0.04, "learning_rate": 0.00029471398052111503, "loss": 0.1477, "step": 5460 }, { "epoch": 0.04, "learning_rate": 0.00029470429916675806, "loss": 0.1456, "step": 5470 }, { "epoch": 0.04, "learning_rate": 0.00029469461781240114, "loss": 0.1504, "step": 5480 }, { "epoch": 0.04, "learning_rate": 0.0002946849364580442, "loss": 0.144, "step": 5490 }, { "epoch": 0.04, "learning_rate": 0.00029467525510368725, "loss": 0.1527, "step": 5500 }, { "epoch": 0.04, "learning_rate": 0.0002946655737493303, "loss": 0.1424, "step": 5510 }, { "epoch": 0.04, "learning_rate": 0.0002946558923949734, "loss": 0.1421, "step": 5520 }, { "epoch": 0.04, "learning_rate": 0.0002946462110406165, "loss": 0.1441, "step": 5530 }, { "epoch": 0.04, "learning_rate": 0.00029463652968625956, "loss": 0.1489, "step": 5540 }, { "epoch": 0.04, "learning_rate": 0.00029462684833190264, "loss": 0.143, "step": 5550 }, { "epoch": 0.04, "learning_rate": 0.00029461716697754567, "loss": 0.1462, "step": 5560 }, { "epoch": 0.04, "learning_rate": 0.00029460748562318875, "loss": 0.1505, "step": 5570 }, { "epoch": 0.04, "learning_rate": 0.00029459780426883183, "loss": 0.1619, "step": 5580 }, { "epoch": 0.04, "learning_rate": 0.0002945881229144749, "loss": 0.1587, "step": 5590 }, { "epoch": 0.04, "learning_rate": 0.00029457844156011794, "loss": 0.1495, "step": 5600 }, { "epoch": 0.04, "learning_rate": 0.000294568760205761, "loss": 0.1498, "step": 5610 }, { "epoch": 0.04, "learning_rate": 0.0002945590788514041, "loss": 0.1476, "step": 5620 }, { "epoch": 0.04, "learning_rate": 0.0002945493974970471, "loss": 0.1599, "step": 5630 }, { "epoch": 0.04, "learning_rate": 0.0002945397161426902, "loss": 0.1463, "step": 5640 }, { "epoch": 0.04, "learning_rate": 0.0002945300347883333, "loss": 0.1478, "step": 5650 }, { "epoch": 0.04, "learning_rate": 0.00029452035343397636, "loss": 0.1506, "step": 5660 }, { "epoch": 0.04, "learning_rate": 0.00029451067207961944, "loss": 0.1525, "step": 5670 }, { "epoch": 0.04, "learning_rate": 0.0002945009907252625, "loss": 0.1511, "step": 5680 }, { "epoch": 0.04, "learning_rate": 0.0002944913093709056, "loss": 0.1454, "step": 5690 }, { "epoch": 0.04, "learning_rate": 0.0002944816280165486, "loss": 0.158, "step": 5700 }, { "epoch": 0.04, "learning_rate": 0.0002944719466621917, "loss": 0.1532, "step": 5710 }, { "epoch": 0.04, "learning_rate": 0.0002944622653078348, "loss": 0.1466, "step": 5720 }, { "epoch": 0.04, "learning_rate": 0.00029445258395347786, "loss": 0.1484, "step": 5730 }, { "epoch": 0.04, "learning_rate": 0.0002944429025991209, "loss": 0.1447, "step": 5740 }, { "epoch": 0.04, "learning_rate": 0.00029443322124476397, "loss": 0.1752, "step": 5750 }, { "epoch": 0.04, "learning_rate": 0.00029442353989040705, "loss": 0.154, "step": 5760 }, { "epoch": 0.04, "learning_rate": 0.0002944138585360501, "loss": 0.1467, "step": 5770 }, { "epoch": 0.04, "learning_rate": 0.00029440417718169315, "loss": 0.1485, "step": 5780 }, { "epoch": 0.04, "learning_rate": 0.00029439449582733623, "loss": 0.1538, "step": 5790 }, { "epoch": 0.04, "learning_rate": 0.0002943848144729793, "loss": 0.1539, "step": 5800 }, { "epoch": 0.04, "learning_rate": 0.0002943751331186224, "loss": 0.15, "step": 5810 }, { "epoch": 0.04, "learning_rate": 0.0002943654517642655, "loss": 0.1469, "step": 5820 }, { "epoch": 0.04, "learning_rate": 0.00029435577040990855, "loss": 0.1423, "step": 5830 }, { "epoch": 0.04, "learning_rate": 0.0002943460890555516, "loss": 0.1426, "step": 5840 }, { "epoch": 0.04, "learning_rate": 0.00029433640770119466, "loss": 0.1513, "step": 5850 }, { "epoch": 0.04, "learning_rate": 0.00029432672634683774, "loss": 0.1474, "step": 5860 }, { "epoch": 0.04, "learning_rate": 0.00029431704499248076, "loss": 0.1476, "step": 5870 }, { "epoch": 0.04, "learning_rate": 0.00029430736363812384, "loss": 0.1538, "step": 5880 }, { "epoch": 0.04, "learning_rate": 0.0002942976822837669, "loss": 0.1421, "step": 5890 }, { "epoch": 0.04, "learning_rate": 0.00029428800092941, "loss": 0.1368, "step": 5900 }, { "epoch": 0.04, "learning_rate": 0.00029427831957505303, "loss": 0.1442, "step": 5910 }, { "epoch": 0.04, "learning_rate": 0.0002942686382206961, "loss": 0.1365, "step": 5920 }, { "epoch": 0.04, "learning_rate": 0.0002942589568663392, "loss": 0.1462, "step": 5930 }, { "epoch": 0.04, "learning_rate": 0.00029424927551198227, "loss": 0.1438, "step": 5940 }, { "epoch": 0.04, "learning_rate": 0.00029423959415762535, "loss": 0.1495, "step": 5950 }, { "epoch": 0.04, "learning_rate": 0.00029422991280326843, "loss": 0.1427, "step": 5960 }, { "epoch": 0.04, "learning_rate": 0.0002942202314489115, "loss": 0.1476, "step": 5970 }, { "epoch": 0.04, "learning_rate": 0.00029421055009455453, "loss": 0.1562, "step": 5980 }, { "epoch": 0.04, "learning_rate": 0.0002942008687401976, "loss": 0.1451, "step": 5990 }, { "epoch": 0.04, "learning_rate": 0.00029419118738584064, "loss": 0.1505, "step": 6000 }, { "epoch": 0.04, "eval_cer": 0.9203606372161338, "eval_loss": 0.1086047813296318, "eval_runtime": 120.5193, "eval_samples_per_second": 16.595, "eval_steps_per_second": 4.149, "step": 6000 }, { "epoch": 0.04, "learning_rate": 0.0002941815060314837, "loss": 0.1335, "step": 6010 }, { "epoch": 0.04, "learning_rate": 0.0002941718246771268, "loss": 0.1449, "step": 6020 }, { "epoch": 0.04, "learning_rate": 0.0002941621433227699, "loss": 0.1478, "step": 6030 }, { "epoch": 0.04, "learning_rate": 0.00029415246196841296, "loss": 0.159, "step": 6040 }, { "epoch": 0.04, "learning_rate": 0.000294142780614056, "loss": 0.1473, "step": 6050 }, { "epoch": 0.04, "learning_rate": 0.00029413309925969906, "loss": 0.1431, "step": 6060 }, { "epoch": 0.04, "learning_rate": 0.00029412341790534214, "loss": 0.1511, "step": 6070 }, { "epoch": 0.04, "learning_rate": 0.0002941137365509852, "loss": 0.1466, "step": 6080 }, { "epoch": 0.04, "learning_rate": 0.0002941040551966283, "loss": 0.1526, "step": 6090 }, { "epoch": 0.04, "learning_rate": 0.0002940943738422714, "loss": 0.1464, "step": 6100 }, { "epoch": 0.04, "learning_rate": 0.0002940846924879144, "loss": 0.155, "step": 6110 }, { "epoch": 0.04, "learning_rate": 0.0002940750111335575, "loss": 0.1405, "step": 6120 }, { "epoch": 0.04, "learning_rate": 0.00029406532977920057, "loss": 0.1549, "step": 6130 }, { "epoch": 0.04, "learning_rate": 0.0002940556484248436, "loss": 0.1439, "step": 6140 }, { "epoch": 0.04, "learning_rate": 0.0002940459670704867, "loss": 0.1446, "step": 6150 }, { "epoch": 0.04, "learning_rate": 0.00029403628571612975, "loss": 0.1538, "step": 6160 }, { "epoch": 0.04, "learning_rate": 0.00029402660436177283, "loss": 0.1401, "step": 6170 }, { "epoch": 0.04, "learning_rate": 0.0002940169230074159, "loss": 0.1451, "step": 6180 }, { "epoch": 0.04, "learning_rate": 0.00029400724165305894, "loss": 0.1303, "step": 6190 }, { "epoch": 0.04, "learning_rate": 0.000293997560298702, "loss": 0.1395, "step": 6200 }, { "epoch": 0.04, "learning_rate": 0.0002939878789443451, "loss": 0.1384, "step": 6210 }, { "epoch": 0.04, "learning_rate": 0.0002939781975899882, "loss": 0.1402, "step": 6220 }, { "epoch": 0.04, "learning_rate": 0.00029396851623563126, "loss": 0.1452, "step": 6230 }, { "epoch": 0.04, "learning_rate": 0.0002939588348812743, "loss": 0.1342, "step": 6240 }, { "epoch": 0.04, "learning_rate": 0.00029394915352691736, "loss": 0.1362, "step": 6250 }, { "epoch": 0.04, "learning_rate": 0.00029393947217256044, "loss": 0.1499, "step": 6260 }, { "epoch": 0.04, "learning_rate": 0.00029392979081820347, "loss": 0.1445, "step": 6270 }, { "epoch": 0.04, "learning_rate": 0.00029392010946384655, "loss": 0.1339, "step": 6280 }, { "epoch": 0.04, "learning_rate": 0.00029391042810948963, "loss": 0.1372, "step": 6290 }, { "epoch": 0.04, "learning_rate": 0.0002939007467551327, "loss": 0.1323, "step": 6300 }, { "epoch": 0.04, "learning_rate": 0.0002938910654007758, "loss": 0.1459, "step": 6310 }, { "epoch": 0.04, "learning_rate": 0.00029388138404641887, "loss": 0.1472, "step": 6320 }, { "epoch": 0.04, "learning_rate": 0.0002938717026920619, "loss": 0.144, "step": 6330 }, { "epoch": 0.04, "learning_rate": 0.00029386202133770497, "loss": 0.1399, "step": 6340 }, { "epoch": 0.04, "learning_rate": 0.00029385233998334805, "loss": 0.1411, "step": 6350 }, { "epoch": 0.04, "learning_rate": 0.00029384265862899113, "loss": 0.1462, "step": 6360 }, { "epoch": 0.04, "learning_rate": 0.0002938329772746342, "loss": 0.1461, "step": 6370 }, { "epoch": 0.04, "learning_rate": 0.00029382329592027724, "loss": 0.1473, "step": 6380 }, { "epoch": 0.04, "learning_rate": 0.0002938136145659203, "loss": 0.1478, "step": 6390 }, { "epoch": 0.04, "learning_rate": 0.00029380393321156334, "loss": 0.1348, "step": 6400 }, { "epoch": 0.04, "learning_rate": 0.0002937942518572064, "loss": 0.1443, "step": 6410 }, { "epoch": 0.04, "learning_rate": 0.0002937845705028495, "loss": 0.148, "step": 6420 }, { "epoch": 0.04, "learning_rate": 0.0002937748891484926, "loss": 0.1411, "step": 6430 }, { "epoch": 0.04, "learning_rate": 0.00029376520779413566, "loss": 0.1418, "step": 6440 }, { "epoch": 0.04, "learning_rate": 0.00029375552643977874, "loss": 0.1392, "step": 6450 }, { "epoch": 0.04, "learning_rate": 0.0002937458450854218, "loss": 0.1498, "step": 6460 }, { "epoch": 0.04, "learning_rate": 0.00029373616373106485, "loss": 0.1484, "step": 6470 }, { "epoch": 0.04, "learning_rate": 0.0002937264823767079, "loss": 0.1362, "step": 6480 }, { "epoch": 0.04, "learning_rate": 0.000293716801022351, "loss": 0.1456, "step": 6490 }, { "epoch": 0.04, "learning_rate": 0.0002937071196679941, "loss": 0.1453, "step": 6500 }, { "epoch": 0.04, "learning_rate": 0.0002936974383136371, "loss": 0.1413, "step": 6510 }, { "epoch": 0.04, "learning_rate": 0.0002936877569592802, "loss": 0.1515, "step": 6520 }, { "epoch": 0.04, "learning_rate": 0.00029367807560492327, "loss": 0.143, "step": 6530 }, { "epoch": 0.04, "learning_rate": 0.0002936683942505663, "loss": 0.1395, "step": 6540 }, { "epoch": 0.04, "learning_rate": 0.0002936587128962094, "loss": 0.1388, "step": 6550 }, { "epoch": 0.04, "learning_rate": 0.00029364903154185246, "loss": 0.1405, "step": 6560 }, { "epoch": 0.04, "learning_rate": 0.00029363935018749554, "loss": 0.1428, "step": 6570 }, { "epoch": 0.04, "learning_rate": 0.0002936296688331386, "loss": 0.1373, "step": 6580 }, { "epoch": 0.04, "learning_rate": 0.0002936199874787817, "loss": 0.1329, "step": 6590 }, { "epoch": 0.04, "learning_rate": 0.0002936103061244248, "loss": 0.1354, "step": 6600 }, { "epoch": 0.04, "learning_rate": 0.0002936006247700678, "loss": 0.1373, "step": 6610 }, { "epoch": 0.04, "learning_rate": 0.0002935909434157109, "loss": 0.1326, "step": 6620 }, { "epoch": 0.04, "learning_rate": 0.00029358126206135396, "loss": 0.1493, "step": 6630 }, { "epoch": 0.04, "learning_rate": 0.000293571580706997, "loss": 0.1384, "step": 6640 }, { "epoch": 0.04, "learning_rate": 0.00029356189935264007, "loss": 0.134, "step": 6650 }, { "epoch": 0.04, "learning_rate": 0.00029355221799828315, "loss": 0.1398, "step": 6660 }, { "epoch": 0.04, "learning_rate": 0.0002935425366439262, "loss": 0.1439, "step": 6670 }, { "epoch": 0.04, "learning_rate": 0.00029353285528956925, "loss": 0.1395, "step": 6680 }, { "epoch": 0.04, "learning_rate": 0.00029352317393521233, "loss": 0.1417, "step": 6690 }, { "epoch": 0.04, "learning_rate": 0.0002935134925808554, "loss": 0.14, "step": 6700 }, { "epoch": 0.04, "learning_rate": 0.0002935038112264985, "loss": 0.148, "step": 6710 }, { "epoch": 0.04, "learning_rate": 0.00029349412987214157, "loss": 0.1517, "step": 6720 }, { "epoch": 0.04, "learning_rate": 0.00029348444851778465, "loss": 0.1478, "step": 6730 }, { "epoch": 0.04, "learning_rate": 0.00029347476716342773, "loss": 0.1413, "step": 6740 }, { "epoch": 0.04, "learning_rate": 0.00029346508580907076, "loss": 0.1348, "step": 6750 }, { "epoch": 0.04, "learning_rate": 0.00029345540445471384, "loss": 0.128, "step": 6760 }, { "epoch": 0.04, "learning_rate": 0.0002934457231003569, "loss": 0.1242, "step": 6770 }, { "epoch": 0.04, "learning_rate": 0.00029343604174599994, "loss": 0.1384, "step": 6780 }, { "epoch": 0.04, "learning_rate": 0.000293426360391643, "loss": 0.1522, "step": 6790 }, { "epoch": 0.04, "learning_rate": 0.0002934166790372861, "loss": 0.1375, "step": 6800 }, { "epoch": 0.04, "learning_rate": 0.0002934069976829292, "loss": 0.1435, "step": 6810 }, { "epoch": 0.04, "learning_rate": 0.0002933973163285722, "loss": 0.1282, "step": 6820 }, { "epoch": 0.04, "learning_rate": 0.0002933876349742153, "loss": 0.1349, "step": 6830 }, { "epoch": 0.04, "learning_rate": 0.00029337795361985837, "loss": 0.1427, "step": 6840 }, { "epoch": 0.04, "learning_rate": 0.00029336827226550145, "loss": 0.1346, "step": 6850 }, { "epoch": 0.04, "learning_rate": 0.0002933585909111445, "loss": 0.1294, "step": 6860 }, { "epoch": 0.04, "learning_rate": 0.0002933489095567876, "loss": 0.1475, "step": 6870 }, { "epoch": 0.04, "learning_rate": 0.00029333922820243063, "loss": 0.1376, "step": 6880 }, { "epoch": 0.04, "learning_rate": 0.0002933295468480737, "loss": 0.1389, "step": 6890 }, { "epoch": 0.04, "learning_rate": 0.0002933198654937168, "loss": 0.1385, "step": 6900 }, { "epoch": 0.04, "learning_rate": 0.0002933101841393598, "loss": 0.132, "step": 6910 }, { "epoch": 0.04, "learning_rate": 0.0002933005027850029, "loss": 0.1271, "step": 6920 }, { "epoch": 0.04, "learning_rate": 0.000293290821430646, "loss": 0.1367, "step": 6930 }, { "epoch": 0.04, "learning_rate": 0.00029328114007628905, "loss": 0.149, "step": 6940 }, { "epoch": 0.04, "learning_rate": 0.00029327145872193213, "loss": 0.1377, "step": 6950 }, { "epoch": 0.04, "learning_rate": 0.00029326177736757516, "loss": 0.1376, "step": 6960 }, { "epoch": 0.04, "learning_rate": 0.00029325209601321824, "loss": 0.1402, "step": 6970 }, { "epoch": 0.05, "learning_rate": 0.0002932424146588613, "loss": 0.1444, "step": 6980 }, { "epoch": 0.05, "learning_rate": 0.0002932327333045044, "loss": 0.1421, "step": 6990 }, { "epoch": 0.05, "learning_rate": 0.0002932230519501475, "loss": 0.1438, "step": 7000 }, { "epoch": 0.05, "eval_cer": 0.9203208676985651, "eval_loss": 0.09841650724411011, "eval_runtime": 120.3287, "eval_samples_per_second": 16.621, "eval_steps_per_second": 4.155, "step": 7000 }, { "epoch": 0.05, "learning_rate": 0.0002932133705957905, "loss": 0.1261, "step": 7010 }, { "epoch": 0.05, "learning_rate": 0.0002932036892414336, "loss": 0.1343, "step": 7020 }, { "epoch": 0.05, "learning_rate": 0.00029319400788707666, "loss": 0.1392, "step": 7030 }, { "epoch": 0.05, "learning_rate": 0.0002931843265327197, "loss": 0.1348, "step": 7040 }, { "epoch": 0.05, "learning_rate": 0.00029317464517836277, "loss": 0.1412, "step": 7050 }, { "epoch": 0.05, "learning_rate": 0.00029316496382400585, "loss": 0.1379, "step": 7060 }, { "epoch": 0.05, "learning_rate": 0.00029315528246964893, "loss": 0.1321, "step": 7070 }, { "epoch": 0.05, "learning_rate": 0.000293145601115292, "loss": 0.1372, "step": 7080 }, { "epoch": 0.05, "learning_rate": 0.0002931359197609351, "loss": 0.1428, "step": 7090 }, { "epoch": 0.05, "learning_rate": 0.0002931262384065781, "loss": 0.1326, "step": 7100 }, { "epoch": 0.05, "learning_rate": 0.0002931165570522212, "loss": 0.1317, "step": 7110 }, { "epoch": 0.05, "learning_rate": 0.0002931068756978643, "loss": 0.1363, "step": 7120 }, { "epoch": 0.05, "learning_rate": 0.00029309719434350735, "loss": 0.1345, "step": 7130 }, { "epoch": 0.05, "learning_rate": 0.00029308751298915043, "loss": 0.1292, "step": 7140 }, { "epoch": 0.05, "learning_rate": 0.00029307783163479346, "loss": 0.1308, "step": 7150 }, { "epoch": 0.05, "learning_rate": 0.00029306815028043654, "loss": 0.1367, "step": 7160 }, { "epoch": 0.05, "learning_rate": 0.0002930584689260796, "loss": 0.1389, "step": 7170 }, { "epoch": 0.05, "learning_rate": 0.00029304878757172264, "loss": 0.1341, "step": 7180 }, { "epoch": 0.05, "learning_rate": 0.0002930391062173657, "loss": 0.1278, "step": 7190 }, { "epoch": 0.05, "learning_rate": 0.0002930294248630088, "loss": 0.1542, "step": 7200 }, { "epoch": 0.05, "learning_rate": 0.0002930197435086519, "loss": 0.1322, "step": 7210 }, { "epoch": 0.05, "learning_rate": 0.00029301006215429496, "loss": 0.1383, "step": 7220 }, { "epoch": 0.05, "learning_rate": 0.00029300038079993804, "loss": 0.1471, "step": 7230 }, { "epoch": 0.05, "learning_rate": 0.00029299069944558107, "loss": 0.142, "step": 7240 }, { "epoch": 0.05, "learning_rate": 0.00029298101809122415, "loss": 0.1319, "step": 7250 }, { "epoch": 0.05, "learning_rate": 0.00029297133673686723, "loss": 0.1375, "step": 7260 }, { "epoch": 0.05, "learning_rate": 0.0002929616553825103, "loss": 0.1252, "step": 7270 }, { "epoch": 0.05, "learning_rate": 0.00029295197402815333, "loss": 0.1299, "step": 7280 }, { "epoch": 0.05, "learning_rate": 0.0002929422926737964, "loss": 0.1458, "step": 7290 }, { "epoch": 0.05, "learning_rate": 0.0002929326113194395, "loss": 0.1378, "step": 7300 }, { "epoch": 0.05, "learning_rate": 0.0002929229299650825, "loss": 0.139, "step": 7310 }, { "epoch": 0.05, "learning_rate": 0.0002929132486107256, "loss": 0.1283, "step": 7320 }, { "epoch": 0.05, "learning_rate": 0.0002929035672563687, "loss": 0.1338, "step": 7330 }, { "epoch": 0.05, "learning_rate": 0.00029289388590201176, "loss": 0.1248, "step": 7340 }, { "epoch": 0.05, "learning_rate": 0.00029288420454765484, "loss": 0.1316, "step": 7350 }, { "epoch": 0.05, "learning_rate": 0.0002928745231932979, "loss": 0.1321, "step": 7360 }, { "epoch": 0.05, "learning_rate": 0.000292864841838941, "loss": 0.131, "step": 7370 }, { "epoch": 0.05, "learning_rate": 0.000292855160484584, "loss": 0.1313, "step": 7380 }, { "epoch": 0.05, "learning_rate": 0.0002928454791302271, "loss": 0.1424, "step": 7390 }, { "epoch": 0.05, "learning_rate": 0.0002928357977758702, "loss": 0.1266, "step": 7400 }, { "epoch": 0.05, "learning_rate": 0.0002928261164215132, "loss": 0.1284, "step": 7410 }, { "epoch": 0.05, "learning_rate": 0.0002928164350671563, "loss": 0.1332, "step": 7420 }, { "epoch": 0.05, "learning_rate": 0.00029280675371279937, "loss": 0.1358, "step": 7430 }, { "epoch": 0.05, "learning_rate": 0.00029279707235844245, "loss": 0.122, "step": 7440 }, { "epoch": 0.05, "learning_rate": 0.0002927873910040855, "loss": 0.1325, "step": 7450 }, { "epoch": 0.05, "learning_rate": 0.00029277770964972855, "loss": 0.1434, "step": 7460 }, { "epoch": 0.05, "learning_rate": 0.00029276802829537163, "loss": 0.1273, "step": 7470 }, { "epoch": 0.05, "learning_rate": 0.0002927583469410147, "loss": 0.1311, "step": 7480 }, { "epoch": 0.05, "learning_rate": 0.0002927486655866578, "loss": 0.1464, "step": 7490 }, { "epoch": 0.05, "learning_rate": 0.00029273898423230087, "loss": 0.1308, "step": 7500 }, { "epoch": 0.05, "learning_rate": 0.00029272930287794395, "loss": 0.1379, "step": 7510 }, { "epoch": 0.05, "learning_rate": 0.000292719621523587, "loss": 0.1346, "step": 7520 }, { "epoch": 0.05, "learning_rate": 0.00029270994016923006, "loss": 0.1377, "step": 7530 }, { "epoch": 0.05, "learning_rate": 0.00029270025881487314, "loss": 0.1296, "step": 7540 }, { "epoch": 0.05, "learning_rate": 0.00029269057746051616, "loss": 0.1384, "step": 7550 }, { "epoch": 0.05, "learning_rate": 0.00029268089610615924, "loss": 0.1259, "step": 7560 }, { "epoch": 0.05, "learning_rate": 0.0002926712147518023, "loss": 0.1289, "step": 7570 }, { "epoch": 0.05, "learning_rate": 0.0002926615333974454, "loss": 0.1312, "step": 7580 }, { "epoch": 0.05, "learning_rate": 0.00029265185204308843, "loss": 0.1331, "step": 7590 }, { "epoch": 0.05, "learning_rate": 0.0002926421706887315, "loss": 0.1336, "step": 7600 }, { "epoch": 0.05, "learning_rate": 0.0002926324893343746, "loss": 0.136, "step": 7610 }, { "epoch": 0.05, "learning_rate": 0.00029262280798001767, "loss": 0.1287, "step": 7620 }, { "epoch": 0.05, "learning_rate": 0.00029261312662566075, "loss": 0.1359, "step": 7630 }, { "epoch": 0.05, "learning_rate": 0.00029260344527130383, "loss": 0.1299, "step": 7640 }, { "epoch": 0.05, "learning_rate": 0.00029259376391694685, "loss": 0.1235, "step": 7650 }, { "epoch": 0.05, "learning_rate": 0.00029258408256258993, "loss": 0.1242, "step": 7660 }, { "epoch": 0.05, "learning_rate": 0.000292574401208233, "loss": 0.1304, "step": 7670 }, { "epoch": 0.05, "learning_rate": 0.00029256471985387604, "loss": 0.1341, "step": 7680 }, { "epoch": 0.05, "learning_rate": 0.0002925550384995191, "loss": 0.1333, "step": 7690 }, { "epoch": 0.05, "learning_rate": 0.0002925453571451622, "loss": 0.1355, "step": 7700 }, { "epoch": 0.05, "learning_rate": 0.0002925356757908053, "loss": 0.1384, "step": 7710 }, { "epoch": 0.05, "learning_rate": 0.00029252599443644836, "loss": 0.1281, "step": 7720 }, { "epoch": 0.05, "learning_rate": 0.0002925163130820914, "loss": 0.1317, "step": 7730 }, { "epoch": 0.05, "learning_rate": 0.00029250663172773446, "loss": 0.1337, "step": 7740 }, { "epoch": 0.05, "learning_rate": 0.00029249695037337754, "loss": 0.1392, "step": 7750 }, { "epoch": 0.05, "learning_rate": 0.0002924872690190206, "loss": 0.1284, "step": 7760 }, { "epoch": 0.05, "learning_rate": 0.0002924775876646637, "loss": 0.1259, "step": 7770 }, { "epoch": 0.05, "learning_rate": 0.00029246790631030673, "loss": 0.1305, "step": 7780 }, { "epoch": 0.05, "learning_rate": 0.0002924582249559498, "loss": 0.1325, "step": 7790 }, { "epoch": 0.05, "learning_rate": 0.0002924485436015929, "loss": 0.1327, "step": 7800 }, { "epoch": 0.05, "learning_rate": 0.0002924388622472359, "loss": 0.1305, "step": 7810 }, { "epoch": 0.05, "learning_rate": 0.000292429180892879, "loss": 0.1284, "step": 7820 }, { "epoch": 0.05, "learning_rate": 0.00029241949953852207, "loss": 0.131, "step": 7830 }, { "epoch": 0.05, "learning_rate": 0.00029240981818416515, "loss": 0.1227, "step": 7840 }, { "epoch": 0.05, "learning_rate": 0.00029240013682980823, "loss": 0.1229, "step": 7850 }, { "epoch": 0.05, "learning_rate": 0.0002923904554754513, "loss": 0.139, "step": 7860 }, { "epoch": 0.05, "learning_rate": 0.00029238077412109434, "loss": 0.137, "step": 7870 }, { "epoch": 0.05, "learning_rate": 0.0002923710927667374, "loss": 0.1292, "step": 7880 }, { "epoch": 0.05, "learning_rate": 0.0002923614114123805, "loss": 0.1209, "step": 7890 }, { "epoch": 0.05, "learning_rate": 0.0002923517300580236, "loss": 0.1206, "step": 7900 }, { "epoch": 0.05, "learning_rate": 0.00029234204870366666, "loss": 0.1245, "step": 7910 }, { "epoch": 0.05, "learning_rate": 0.0002923323673493097, "loss": 0.1208, "step": 7920 }, { "epoch": 0.05, "learning_rate": 0.00029232268599495276, "loss": 0.1367, "step": 7930 }, { "epoch": 0.05, "learning_rate": 0.00029231300464059584, "loss": 0.1284, "step": 7940 }, { "epoch": 0.05, "learning_rate": 0.00029230332328623887, "loss": 0.1203, "step": 7950 }, { "epoch": 0.05, "learning_rate": 0.00029229364193188195, "loss": 0.1426, "step": 7960 }, { "epoch": 0.05, "learning_rate": 0.000292283960577525, "loss": 0.1313, "step": 7970 }, { "epoch": 0.05, "learning_rate": 0.0002922742792231681, "loss": 0.1297, "step": 7980 }, { "epoch": 0.05, "learning_rate": 0.0002922645978688112, "loss": 0.1345, "step": 7990 }, { "epoch": 0.05, "learning_rate": 0.00029225491651445427, "loss": 0.1362, "step": 8000 }, { "epoch": 0.05, "eval_cer": 0.9203235792565811, "eval_loss": 0.09412429481744766, "eval_runtime": 120.4163, "eval_samples_per_second": 16.609, "eval_steps_per_second": 4.152, "step": 8000 }, { "epoch": 0.05, "learning_rate": 0.0002922452351600973, "loss": 0.1282, "step": 8010 }, { "epoch": 0.05, "learning_rate": 0.00029223555380574037, "loss": 0.1346, "step": 8020 }, { "epoch": 0.05, "learning_rate": 0.00029222587245138345, "loss": 0.1372, "step": 8030 }, { "epoch": 0.05, "learning_rate": 0.00029221619109702653, "loss": 0.1296, "step": 8040 }, { "epoch": 0.05, "learning_rate": 0.00029220650974266956, "loss": 0.1306, "step": 8050 }, { "epoch": 0.05, "learning_rate": 0.00029219682838831264, "loss": 0.1472, "step": 8060 }, { "epoch": 0.05, "learning_rate": 0.0002921871470339557, "loss": 0.1274, "step": 8070 }, { "epoch": 0.05, "learning_rate": 0.00029217746567959874, "loss": 0.1247, "step": 8080 }, { "epoch": 0.05, "learning_rate": 0.0002921677843252418, "loss": 0.1447, "step": 8090 }, { "epoch": 0.05, "learning_rate": 0.0002921581029708849, "loss": 0.1404, "step": 8100 }, { "epoch": 0.05, "learning_rate": 0.000292148421616528, "loss": 0.126, "step": 8110 }, { "epoch": 0.05, "learning_rate": 0.00029213874026217106, "loss": 0.1356, "step": 8120 }, { "epoch": 0.05, "learning_rate": 0.00029212905890781414, "loss": 0.1206, "step": 8130 }, { "epoch": 0.05, "learning_rate": 0.0002921193775534572, "loss": 0.132, "step": 8140 }, { "epoch": 0.05, "learning_rate": 0.00029210969619910025, "loss": 0.1217, "step": 8150 }, { "epoch": 0.05, "learning_rate": 0.0002921000148447433, "loss": 0.1342, "step": 8160 }, { "epoch": 0.05, "learning_rate": 0.0002920903334903864, "loss": 0.1156, "step": 8170 }, { "epoch": 0.05, "learning_rate": 0.00029208065213602943, "loss": 0.1298, "step": 8180 }, { "epoch": 0.05, "learning_rate": 0.0002920709707816725, "loss": 0.1287, "step": 8190 }, { "epoch": 0.05, "learning_rate": 0.0002920612894273156, "loss": 0.1279, "step": 8200 }, { "epoch": 0.05, "learning_rate": 0.00029205160807295867, "loss": 0.1285, "step": 8210 }, { "epoch": 0.05, "learning_rate": 0.0002920419267186017, "loss": 0.1315, "step": 8220 }, { "epoch": 0.05, "learning_rate": 0.0002920322453642448, "loss": 0.1204, "step": 8230 }, { "epoch": 0.05, "learning_rate": 0.00029202256400988786, "loss": 0.125, "step": 8240 }, { "epoch": 0.05, "learning_rate": 0.00029201288265553094, "loss": 0.1237, "step": 8250 }, { "epoch": 0.05, "learning_rate": 0.000292003201301174, "loss": 0.1432, "step": 8260 }, { "epoch": 0.05, "learning_rate": 0.0002919935199468171, "loss": 0.1284, "step": 8270 }, { "epoch": 0.05, "learning_rate": 0.0002919838385924602, "loss": 0.13, "step": 8280 }, { "epoch": 0.05, "learning_rate": 0.0002919741572381032, "loss": 0.1318, "step": 8290 }, { "epoch": 0.05, "learning_rate": 0.0002919644758837463, "loss": 0.128, "step": 8300 }, { "epoch": 0.05, "learning_rate": 0.00029195479452938936, "loss": 0.1307, "step": 8310 }, { "epoch": 0.05, "learning_rate": 0.0002919451131750324, "loss": 0.1311, "step": 8320 }, { "epoch": 0.05, "learning_rate": 0.00029193543182067547, "loss": 0.1209, "step": 8330 }, { "epoch": 0.05, "learning_rate": 0.00029192575046631855, "loss": 0.1346, "step": 8340 }, { "epoch": 0.05, "learning_rate": 0.0002919160691119616, "loss": 0.1222, "step": 8350 }, { "epoch": 0.05, "learning_rate": 0.00029190638775760465, "loss": 0.1243, "step": 8360 }, { "epoch": 0.05, "learning_rate": 0.00029189670640324773, "loss": 0.1249, "step": 8370 }, { "epoch": 0.05, "learning_rate": 0.0002918870250488908, "loss": 0.1351, "step": 8380 }, { "epoch": 0.05, "learning_rate": 0.0002918773436945339, "loss": 0.1447, "step": 8390 }, { "epoch": 0.05, "learning_rate": 0.00029186766234017697, "loss": 0.143, "step": 8400 }, { "epoch": 0.05, "learning_rate": 0.00029185798098582005, "loss": 0.1344, "step": 8410 }, { "epoch": 0.05, "learning_rate": 0.0002918482996314631, "loss": 0.117, "step": 8420 }, { "epoch": 0.05, "learning_rate": 0.00029183861827710616, "loss": 0.1292, "step": 8430 }, { "epoch": 0.05, "learning_rate": 0.00029182893692274923, "loss": 0.1385, "step": 8440 }, { "epoch": 0.05, "learning_rate": 0.00029181925556839226, "loss": 0.1363, "step": 8450 }, { "epoch": 0.05, "learning_rate": 0.00029180957421403534, "loss": 0.1302, "step": 8460 }, { "epoch": 0.05, "learning_rate": 0.0002917998928596784, "loss": 0.1254, "step": 8470 }, { "epoch": 0.05, "learning_rate": 0.0002917902115053215, "loss": 0.129, "step": 8480 }, { "epoch": 0.05, "learning_rate": 0.0002917805301509646, "loss": 0.1159, "step": 8490 }, { "epoch": 0.05, "learning_rate": 0.0002917708487966076, "loss": 0.1278, "step": 8500 }, { "epoch": 0.05, "learning_rate": 0.0002917611674422507, "loss": 0.1308, "step": 8510 }, { "epoch": 0.05, "learning_rate": 0.00029175148608789376, "loss": 0.1204, "step": 8520 }, { "epoch": 0.06, "learning_rate": 0.00029174180473353684, "loss": 0.1307, "step": 8530 }, { "epoch": 0.06, "learning_rate": 0.0002917321233791799, "loss": 0.1383, "step": 8540 }, { "epoch": 0.06, "learning_rate": 0.000291722442024823, "loss": 0.1287, "step": 8550 }, { "epoch": 0.06, "learning_rate": 0.00029171276067046603, "loss": 0.1343, "step": 8560 }, { "epoch": 0.06, "learning_rate": 0.0002917030793161091, "loss": 0.1179, "step": 8570 }, { "epoch": 0.06, "learning_rate": 0.00029169339796175214, "loss": 0.124, "step": 8580 }, { "epoch": 0.06, "learning_rate": 0.0002916837166073952, "loss": 0.1261, "step": 8590 }, { "epoch": 0.06, "learning_rate": 0.0002916740352530383, "loss": 0.1152, "step": 8600 }, { "epoch": 0.06, "learning_rate": 0.0002916643538986814, "loss": 0.1229, "step": 8610 }, { "epoch": 0.06, "learning_rate": 0.00029165467254432445, "loss": 0.1166, "step": 8620 }, { "epoch": 0.06, "learning_rate": 0.00029164499118996753, "loss": 0.1296, "step": 8630 }, { "epoch": 0.06, "learning_rate": 0.00029163530983561056, "loss": 0.1257, "step": 8640 }, { "epoch": 0.06, "learning_rate": 0.00029162562848125364, "loss": 0.138, "step": 8650 }, { "epoch": 0.06, "learning_rate": 0.0002916159471268967, "loss": 0.1365, "step": 8660 }, { "epoch": 0.06, "learning_rate": 0.0002916062657725398, "loss": 0.1164, "step": 8670 }, { "epoch": 0.06, "learning_rate": 0.0002915965844181829, "loss": 0.1351, "step": 8680 }, { "epoch": 0.06, "learning_rate": 0.0002915869030638259, "loss": 0.1285, "step": 8690 }, { "epoch": 0.06, "learning_rate": 0.000291577221709469, "loss": 0.1225, "step": 8700 }, { "epoch": 0.06, "learning_rate": 0.00029156754035511206, "loss": 0.1274, "step": 8710 }, { "epoch": 0.06, "learning_rate": 0.0002915578590007551, "loss": 0.1229, "step": 8720 }, { "epoch": 0.06, "learning_rate": 0.00029154817764639817, "loss": 0.1333, "step": 8730 }, { "epoch": 0.06, "learning_rate": 0.00029153849629204125, "loss": 0.1284, "step": 8740 }, { "epoch": 0.06, "learning_rate": 0.00029152881493768433, "loss": 0.1239, "step": 8750 }, { "epoch": 0.06, "learning_rate": 0.0002915191335833274, "loss": 0.1329, "step": 8760 }, { "epoch": 0.06, "learning_rate": 0.0002915094522289705, "loss": 0.1271, "step": 8770 }, { "epoch": 0.06, "learning_rate": 0.0002914997708746135, "loss": 0.122, "step": 8780 }, { "epoch": 0.06, "learning_rate": 0.0002914900895202566, "loss": 0.1344, "step": 8790 }, { "epoch": 0.06, "learning_rate": 0.0002914804081658997, "loss": 0.12, "step": 8800 }, { "epoch": 0.06, "learning_rate": 0.00029147072681154275, "loss": 0.1229, "step": 8810 }, { "epoch": 0.06, "learning_rate": 0.0002914610454571858, "loss": 0.1309, "step": 8820 }, { "epoch": 0.06, "learning_rate": 0.00029145136410282886, "loss": 0.1243, "step": 8830 }, { "epoch": 0.06, "learning_rate": 0.00029144168274847194, "loss": 0.1253, "step": 8840 }, { "epoch": 0.06, "learning_rate": 0.00029143200139411496, "loss": 0.1226, "step": 8850 }, { "epoch": 0.06, "learning_rate": 0.00029142232003975804, "loss": 0.1384, "step": 8860 }, { "epoch": 0.06, "learning_rate": 0.0002914126386854011, "loss": 0.1259, "step": 8870 }, { "epoch": 0.06, "learning_rate": 0.0002914029573310442, "loss": 0.119, "step": 8880 }, { "epoch": 0.06, "learning_rate": 0.0002913932759766873, "loss": 0.1297, "step": 8890 }, { "epoch": 0.06, "learning_rate": 0.00029138359462233036, "loss": 0.1283, "step": 8900 }, { "epoch": 0.06, "learning_rate": 0.00029137391326797344, "loss": 0.1276, "step": 8910 }, { "epoch": 0.06, "learning_rate": 0.00029136423191361647, "loss": 0.1265, "step": 8920 }, { "epoch": 0.06, "learning_rate": 0.00029135455055925955, "loss": 0.1229, "step": 8930 }, { "epoch": 0.06, "learning_rate": 0.00029134486920490263, "loss": 0.1367, "step": 8940 }, { "epoch": 0.06, "learning_rate": 0.0002913351878505457, "loss": 0.1156, "step": 8950 }, { "epoch": 0.06, "learning_rate": 0.00029132550649618873, "loss": 0.1181, "step": 8960 }, { "epoch": 0.06, "learning_rate": 0.0002913158251418318, "loss": 0.1173, "step": 8970 }, { "epoch": 0.06, "learning_rate": 0.0002913061437874749, "loss": 0.1178, "step": 8980 }, { "epoch": 0.06, "learning_rate": 0.0002912964624331179, "loss": 0.1138, "step": 8990 }, { "epoch": 0.06, "learning_rate": 0.000291286781078761, "loss": 0.1207, "step": 9000 }, { "epoch": 0.06, "eval_cer": 0.9200921929725455, "eval_loss": 0.08904129266738892, "eval_runtime": 120.7527, "eval_samples_per_second": 16.563, "eval_steps_per_second": 4.141, "step": 9000 }, { "epoch": 0.06, "learning_rate": 0.0002912770997244041, "loss": 0.1224, "step": 9010 }, { "epoch": 0.06, "learning_rate": 0.00029126741837004716, "loss": 0.1263, "step": 9020 }, { "epoch": 0.06, "learning_rate": 0.00029125773701569024, "loss": 0.1122, "step": 9030 }, { "epoch": 0.06, "learning_rate": 0.0002912480556613333, "loss": 0.1397, "step": 9040 }, { "epoch": 0.06, "learning_rate": 0.0002912383743069764, "loss": 0.1378, "step": 9050 }, { "epoch": 0.06, "learning_rate": 0.0002912286929526194, "loss": 0.13, "step": 9060 }, { "epoch": 0.06, "learning_rate": 0.0002912190115982625, "loss": 0.1289, "step": 9070 }, { "epoch": 0.06, "learning_rate": 0.0002912093302439056, "loss": 0.1193, "step": 9080 }, { "epoch": 0.06, "learning_rate": 0.0002911996488895486, "loss": 0.121, "step": 9090 }, { "epoch": 0.06, "learning_rate": 0.0002911899675351917, "loss": 0.1117, "step": 9100 }, { "epoch": 0.06, "learning_rate": 0.00029118028618083477, "loss": 0.1257, "step": 9110 }, { "epoch": 0.06, "learning_rate": 0.00029117060482647785, "loss": 0.1286, "step": 9120 }, { "epoch": 0.06, "learning_rate": 0.0002911609234721209, "loss": 0.1253, "step": 9130 }, { "epoch": 0.06, "learning_rate": 0.00029115124211776395, "loss": 0.1231, "step": 9140 }, { "epoch": 0.06, "learning_rate": 0.00029114156076340703, "loss": 0.1191, "step": 9150 }, { "epoch": 0.06, "learning_rate": 0.0002911318794090501, "loss": 0.1254, "step": 9160 }, { "epoch": 0.06, "learning_rate": 0.0002911221980546932, "loss": 0.1206, "step": 9170 }, { "epoch": 0.06, "learning_rate": 0.00029111251670033627, "loss": 0.1197, "step": 9180 }, { "epoch": 0.06, "learning_rate": 0.0002911028353459793, "loss": 0.1212, "step": 9190 }, { "epoch": 0.06, "learning_rate": 0.0002910931539916224, "loss": 0.1221, "step": 9200 }, { "epoch": 0.06, "learning_rate": 0.00029108347263726546, "loss": 0.1264, "step": 9210 }, { "epoch": 0.06, "learning_rate": 0.0002910737912829085, "loss": 0.1127, "step": 9220 }, { "epoch": 0.06, "learning_rate": 0.00029106410992855156, "loss": 0.1353, "step": 9230 }, { "epoch": 0.06, "learning_rate": 0.00029105442857419464, "loss": 0.118, "step": 9240 }, { "epoch": 0.06, "learning_rate": 0.0002910447472198377, "loss": 0.1233, "step": 9250 }, { "epoch": 0.06, "learning_rate": 0.0002910350658654808, "loss": 0.1133, "step": 9260 }, { "epoch": 0.06, "learning_rate": 0.00029102538451112383, "loss": 0.1122, "step": 9270 }, { "epoch": 0.06, "learning_rate": 0.0002910157031567669, "loss": 0.1188, "step": 9280 }, { "epoch": 0.06, "learning_rate": 0.00029100602180241, "loss": 0.1215, "step": 9290 }, { "epoch": 0.06, "learning_rate": 0.00029099634044805307, "loss": 0.1203, "step": 9300 }, { "epoch": 0.06, "learning_rate": 0.00029098665909369615, "loss": 0.1171, "step": 9310 }, { "epoch": 0.06, "learning_rate": 0.0002909769777393392, "loss": 0.1298, "step": 9320 }, { "epoch": 0.06, "learning_rate": 0.00029096729638498225, "loss": 0.1149, "step": 9330 }, { "epoch": 0.06, "learning_rate": 0.00029095761503062533, "loss": 0.1204, "step": 9340 }, { "epoch": 0.06, "learning_rate": 0.0002909479336762684, "loss": 0.1112, "step": 9350 }, { "epoch": 0.06, "learning_rate": 0.00029093825232191144, "loss": 0.1196, "step": 9360 }, { "epoch": 0.06, "learning_rate": 0.0002909285709675545, "loss": 0.1193, "step": 9370 }, { "epoch": 0.06, "learning_rate": 0.0002909188896131976, "loss": 0.1165, "step": 9380 }, { "epoch": 0.06, "learning_rate": 0.0002909092082588407, "loss": 0.1229, "step": 9390 }, { "epoch": 0.06, "learning_rate": 0.00029089952690448376, "loss": 0.1221, "step": 9400 }, { "epoch": 0.06, "learning_rate": 0.0002908898455501268, "loss": 0.1232, "step": 9410 }, { "epoch": 0.06, "learning_rate": 0.00029088016419576986, "loss": 0.113, "step": 9420 }, { "epoch": 0.06, "learning_rate": 0.00029087048284141294, "loss": 0.1181, "step": 9430 }, { "epoch": 0.06, "learning_rate": 0.000290860801487056, "loss": 0.1147, "step": 9440 }, { "epoch": 0.06, "learning_rate": 0.0002908511201326991, "loss": 0.1206, "step": 9450 }, { "epoch": 0.06, "learning_rate": 0.0002908414387783421, "loss": 0.1307, "step": 9460 }, { "epoch": 0.06, "learning_rate": 0.0002908317574239852, "loss": 0.1103, "step": 9470 }, { "epoch": 0.06, "learning_rate": 0.0002908220760696283, "loss": 0.1193, "step": 9480 }, { "epoch": 0.06, "learning_rate": 0.0002908123947152713, "loss": 0.112, "step": 9490 }, { "epoch": 0.06, "learning_rate": 0.0002908027133609144, "loss": 0.1163, "step": 9500 }, { "epoch": 0.06, "learning_rate": 0.00029079303200655747, "loss": 0.112, "step": 9510 }, { "epoch": 0.06, "learning_rate": 0.00029078335065220055, "loss": 0.1215, "step": 9520 }, { "epoch": 0.06, "learning_rate": 0.00029077366929784363, "loss": 0.1113, "step": 9530 }, { "epoch": 0.06, "learning_rate": 0.0002907639879434867, "loss": 0.1199, "step": 9540 }, { "epoch": 0.06, "learning_rate": 0.00029075430658912974, "loss": 0.1195, "step": 9550 }, { "epoch": 0.06, "learning_rate": 0.0002907446252347728, "loss": 0.1104, "step": 9560 }, { "epoch": 0.06, "learning_rate": 0.0002907349438804159, "loss": 0.1064, "step": 9570 }, { "epoch": 0.06, "learning_rate": 0.000290725262526059, "loss": 0.1188, "step": 9580 }, { "epoch": 0.06, "learning_rate": 0.000290715581171702, "loss": 0.1191, "step": 9590 }, { "epoch": 0.06, "learning_rate": 0.0002907058998173451, "loss": 0.1127, "step": 9600 }, { "epoch": 0.06, "learning_rate": 0.00029069621846298816, "loss": 0.1081, "step": 9610 }, { "epoch": 0.06, "learning_rate": 0.0002906865371086312, "loss": 0.1121, "step": 9620 }, { "epoch": 0.06, "learning_rate": 0.00029067685575427427, "loss": 0.1163, "step": 9630 }, { "epoch": 0.06, "learning_rate": 0.00029066717439991735, "loss": 0.1198, "step": 9640 }, { "epoch": 0.06, "learning_rate": 0.0002906574930455604, "loss": 0.1142, "step": 9650 }, { "epoch": 0.06, "learning_rate": 0.0002906478116912035, "loss": 0.1139, "step": 9660 }, { "epoch": 0.06, "learning_rate": 0.0002906381303368466, "loss": 0.1096, "step": 9670 }, { "epoch": 0.06, "learning_rate": 0.00029062844898248967, "loss": 0.1076, "step": 9680 }, { "epoch": 0.06, "learning_rate": 0.0002906187676281327, "loss": 0.1236, "step": 9690 }, { "epoch": 0.06, "learning_rate": 0.00029060908627377577, "loss": 0.1202, "step": 9700 }, { "epoch": 0.06, "learning_rate": 0.00029059940491941885, "loss": 0.1304, "step": 9710 }, { "epoch": 0.06, "learning_rate": 0.00029058972356506193, "loss": 0.115, "step": 9720 }, { "epoch": 0.06, "learning_rate": 0.00029058004221070496, "loss": 0.1073, "step": 9730 }, { "epoch": 0.06, "learning_rate": 0.00029057036085634804, "loss": 0.1184, "step": 9740 }, { "epoch": 0.06, "learning_rate": 0.0002905606795019911, "loss": 0.1168, "step": 9750 }, { "epoch": 0.06, "learning_rate": 0.00029055099814763414, "loss": 0.1299, "step": 9760 }, { "epoch": 0.06, "learning_rate": 0.0002905413167932772, "loss": 0.1141, "step": 9770 }, { "epoch": 0.06, "learning_rate": 0.0002905316354389203, "loss": 0.1167, "step": 9780 }, { "epoch": 0.06, "learning_rate": 0.0002905219540845634, "loss": 0.1216, "step": 9790 }, { "epoch": 0.06, "learning_rate": 0.00029051227273020646, "loss": 0.1187, "step": 9800 }, { "epoch": 0.06, "learning_rate": 0.00029050259137584954, "loss": 0.129, "step": 9810 }, { "epoch": 0.06, "learning_rate": 0.0002904929100214926, "loss": 0.1273, "step": 9820 }, { "epoch": 0.06, "learning_rate": 0.00029048322866713565, "loss": 0.1172, "step": 9830 }, { "epoch": 0.06, "learning_rate": 0.0002904735473127787, "loss": 0.1277, "step": 9840 }, { "epoch": 0.06, "learning_rate": 0.0002904638659584218, "loss": 0.121, "step": 9850 }, { "epoch": 0.06, "learning_rate": 0.00029045418460406483, "loss": 0.1226, "step": 9860 }, { "epoch": 0.06, "learning_rate": 0.0002904445032497079, "loss": 0.1169, "step": 9870 }, { "epoch": 0.06, "learning_rate": 0.000290434821895351, "loss": 0.1157, "step": 9880 }, { "epoch": 0.06, "learning_rate": 0.00029042514054099407, "loss": 0.1224, "step": 9890 }, { "epoch": 0.06, "learning_rate": 0.0002904154591866371, "loss": 0.1175, "step": 9900 }, { "epoch": 0.06, "learning_rate": 0.0002904057778322802, "loss": 0.1297, "step": 9910 }, { "epoch": 0.06, "learning_rate": 0.00029039609647792326, "loss": 0.1127, "step": 9920 }, { "epoch": 0.06, "learning_rate": 0.00029038641512356633, "loss": 0.1217, "step": 9930 }, { "epoch": 0.06, "learning_rate": 0.0002903767337692094, "loss": 0.1264, "step": 9940 }, { "epoch": 0.06, "learning_rate": 0.0002903670524148525, "loss": 0.1153, "step": 9950 }, { "epoch": 0.06, "learning_rate": 0.0002903573710604956, "loss": 0.1199, "step": 9960 }, { "epoch": 0.06, "learning_rate": 0.0002903476897061386, "loss": 0.1229, "step": 9970 }, { "epoch": 0.06, "learning_rate": 0.0002903380083517817, "loss": 0.1257, "step": 9980 }, { "epoch": 0.06, "learning_rate": 0.0002903283269974247, "loss": 0.1215, "step": 9990 }, { "epoch": 0.06, "learning_rate": 0.0002903186456430678, "loss": 0.108, "step": 10000 }, { "epoch": 0.06, "eval_cer": 0.9202810981809965, "eval_loss": 0.08496131747961044, "eval_runtime": 120.7005, "eval_samples_per_second": 16.57, "eval_steps_per_second": 4.142, "step": 10000 }, { "epoch": 0.06, "learning_rate": 0.00029030896428871086, "loss": 0.1288, "step": 10010 }, { "epoch": 0.06, "learning_rate": 0.00029029928293435394, "loss": 0.1277, "step": 10020 }, { "epoch": 0.06, "learning_rate": 0.000290289601579997, "loss": 0.1249, "step": 10030 }, { "epoch": 0.06, "learning_rate": 0.00029027992022564005, "loss": 0.1236, "step": 10040 }, { "epoch": 0.06, "learning_rate": 0.00029027023887128313, "loss": 0.1177, "step": 10050 }, { "epoch": 0.06, "learning_rate": 0.0002902605575169262, "loss": 0.1177, "step": 10060 }, { "epoch": 0.06, "learning_rate": 0.0002902508761625693, "loss": 0.1067, "step": 10070 }, { "epoch": 0.07, "learning_rate": 0.00029024119480821237, "loss": 0.1173, "step": 10080 }, { "epoch": 0.07, "learning_rate": 0.00029023151345385545, "loss": 0.1194, "step": 10090 }, { "epoch": 0.07, "learning_rate": 0.0002902218320994985, "loss": 0.1133, "step": 10100 }, { "epoch": 0.07, "learning_rate": 0.00029021215074514155, "loss": 0.1167, "step": 10110 }, { "epoch": 0.07, "learning_rate": 0.00029020246939078463, "loss": 0.119, "step": 10120 }, { "epoch": 0.07, "learning_rate": 0.00029019278803642766, "loss": 0.1302, "step": 10130 }, { "epoch": 0.07, "learning_rate": 0.00029018310668207074, "loss": 0.117, "step": 10140 }, { "epoch": 0.07, "learning_rate": 0.0002901734253277138, "loss": 0.1096, "step": 10150 }, { "epoch": 0.07, "learning_rate": 0.0002901637439733569, "loss": 0.1137, "step": 10160 }, { "epoch": 0.07, "learning_rate": 0.000290154062619, "loss": 0.1066, "step": 10170 }, { "epoch": 0.07, "learning_rate": 0.000290144381264643, "loss": 0.1131, "step": 10180 }, { "epoch": 0.07, "learning_rate": 0.0002901346999102861, "loss": 0.1181, "step": 10190 }, { "epoch": 0.07, "learning_rate": 0.00029012501855592916, "loss": 0.1111, "step": 10200 }, { "epoch": 0.07, "learning_rate": 0.00029011533720157224, "loss": 0.1074, "step": 10210 }, { "epoch": 0.07, "learning_rate": 0.0002901056558472153, "loss": 0.1192, "step": 10220 }, { "epoch": 0.07, "learning_rate": 0.00029009597449285835, "loss": 0.123, "step": 10230 }, { "epoch": 0.07, "learning_rate": 0.00029008629313850143, "loss": 0.1196, "step": 10240 }, { "epoch": 0.07, "learning_rate": 0.0002900766117841445, "loss": 0.1151, "step": 10250 }, { "epoch": 0.07, "learning_rate": 0.00029006693042978753, "loss": 0.1218, "step": 10260 }, { "epoch": 0.07, "learning_rate": 0.0002900572490754306, "loss": 0.1234, "step": 10270 }, { "epoch": 0.07, "learning_rate": 0.0002900475677210737, "loss": 0.1194, "step": 10280 }, { "epoch": 0.07, "learning_rate": 0.0002900378863667168, "loss": 0.1171, "step": 10290 }, { "epoch": 0.07, "learning_rate": 0.00029002820501235985, "loss": 0.122, "step": 10300 }, { "epoch": 0.07, "learning_rate": 0.00029001852365800293, "loss": 0.1293, "step": 10310 }, { "epoch": 0.07, "learning_rate": 0.00029000884230364596, "loss": 0.1249, "step": 10320 }, { "epoch": 0.07, "learning_rate": 0.00028999916094928904, "loss": 0.1106, "step": 10330 }, { "epoch": 0.07, "learning_rate": 0.0002899894795949321, "loss": 0.111, "step": 10340 }, { "epoch": 0.07, "learning_rate": 0.0002899797982405752, "loss": 0.1155, "step": 10350 }, { "epoch": 0.07, "learning_rate": 0.0002899701168862183, "loss": 0.1093, "step": 10360 }, { "epoch": 0.07, "learning_rate": 0.0002899604355318613, "loss": 0.1148, "step": 10370 }, { "epoch": 0.07, "learning_rate": 0.0002899507541775044, "loss": 0.1198, "step": 10380 }, { "epoch": 0.07, "learning_rate": 0.0002899410728231474, "loss": 0.1193, "step": 10390 }, { "epoch": 0.07, "learning_rate": 0.0002899313914687905, "loss": 0.1049, "step": 10400 }, { "epoch": 0.07, "learning_rate": 0.00028992171011443357, "loss": 0.1124, "step": 10410 }, { "epoch": 0.07, "learning_rate": 0.00028991202876007665, "loss": 0.1122, "step": 10420 }, { "epoch": 0.07, "learning_rate": 0.00028990234740571973, "loss": 0.1122, "step": 10430 }, { "epoch": 0.07, "learning_rate": 0.0002898926660513628, "loss": 0.114, "step": 10440 }, { "epoch": 0.07, "learning_rate": 0.00028988298469700583, "loss": 0.1279, "step": 10450 }, { "epoch": 0.07, "learning_rate": 0.0002898733033426489, "loss": 0.1215, "step": 10460 }, { "epoch": 0.07, "learning_rate": 0.000289863621988292, "loss": 0.1143, "step": 10470 }, { "epoch": 0.07, "learning_rate": 0.00028985394063393507, "loss": 0.1178, "step": 10480 }, { "epoch": 0.07, "learning_rate": 0.00028984425927957815, "loss": 0.1145, "step": 10490 }, { "epoch": 0.07, "learning_rate": 0.0002898345779252212, "loss": 0.1103, "step": 10500 }, { "epoch": 0.07, "learning_rate": 0.00028982489657086426, "loss": 0.1113, "step": 10510 }, { "epoch": 0.07, "learning_rate": 0.00028981521521650734, "loss": 0.1196, "step": 10520 }, { "epoch": 0.07, "learning_rate": 0.00028980553386215036, "loss": 0.1134, "step": 10530 }, { "epoch": 0.07, "learning_rate": 0.00028979585250779344, "loss": 0.1102, "step": 10540 }, { "epoch": 0.07, "learning_rate": 0.0002897861711534365, "loss": 0.1164, "step": 10550 }, { "epoch": 0.07, "learning_rate": 0.0002897764897990796, "loss": 0.1105, "step": 10560 }, { "epoch": 0.07, "learning_rate": 0.0002897668084447227, "loss": 0.117, "step": 10570 }, { "epoch": 0.07, "learning_rate": 0.00028975712709036576, "loss": 0.1184, "step": 10580 }, { "epoch": 0.07, "learning_rate": 0.0002897474457360088, "loss": 0.106, "step": 10590 }, { "epoch": 0.07, "learning_rate": 0.00028973776438165187, "loss": 0.1166, "step": 10600 }, { "epoch": 0.07, "learning_rate": 0.00028972808302729495, "loss": 0.1231, "step": 10610 }, { "epoch": 0.07, "learning_rate": 0.00028971840167293803, "loss": 0.1099, "step": 10620 }, { "epoch": 0.07, "learning_rate": 0.00028970872031858105, "loss": 0.1197, "step": 10630 }, { "epoch": 0.07, "learning_rate": 0.00028969903896422413, "loss": 0.1077, "step": 10640 }, { "epoch": 0.07, "learning_rate": 0.0002896893576098672, "loss": 0.1333, "step": 10650 }, { "epoch": 0.07, "learning_rate": 0.00028967967625551024, "loss": 0.1157, "step": 10660 }, { "epoch": 0.07, "learning_rate": 0.0002896699949011533, "loss": 0.1154, "step": 10670 }, { "epoch": 0.07, "learning_rate": 0.0002896603135467964, "loss": 0.1191, "step": 10680 }, { "epoch": 0.07, "learning_rate": 0.0002896506321924395, "loss": 0.1076, "step": 10690 }, { "epoch": 0.07, "learning_rate": 0.00028964095083808256, "loss": 0.1175, "step": 10700 }, { "epoch": 0.07, "learning_rate": 0.00028963126948372564, "loss": 0.1108, "step": 10710 }, { "epoch": 0.07, "learning_rate": 0.0002896215881293687, "loss": 0.1103, "step": 10720 }, { "epoch": 0.07, "learning_rate": 0.00028961190677501174, "loss": 0.1112, "step": 10730 }, { "epoch": 0.07, "learning_rate": 0.0002896022254206548, "loss": 0.1196, "step": 10740 }, { "epoch": 0.07, "learning_rate": 0.0002895925440662979, "loss": 0.1198, "step": 10750 }, { "epoch": 0.07, "learning_rate": 0.000289582862711941, "loss": 0.1203, "step": 10760 }, { "epoch": 0.07, "learning_rate": 0.000289573181357584, "loss": 0.1255, "step": 10770 }, { "epoch": 0.07, "learning_rate": 0.0002895635000032271, "loss": 0.1105, "step": 10780 }, { "epoch": 0.07, "learning_rate": 0.00028955381864887017, "loss": 0.1034, "step": 10790 }, { "epoch": 0.07, "learning_rate": 0.0002895441372945132, "loss": 0.1062, "step": 10800 }, { "epoch": 0.07, "learning_rate": 0.00028953445594015627, "loss": 0.1156, "step": 10810 }, { "epoch": 0.07, "learning_rate": 0.00028952477458579935, "loss": 0.1167, "step": 10820 }, { "epoch": 0.07, "learning_rate": 0.00028951509323144243, "loss": 0.1108, "step": 10830 }, { "epoch": 0.07, "learning_rate": 0.0002895054118770855, "loss": 0.1143, "step": 10840 }, { "epoch": 0.07, "learning_rate": 0.0002894957305227286, "loss": 0.1137, "step": 10850 }, { "epoch": 0.07, "learning_rate": 0.00028948604916837167, "loss": 0.1101, "step": 10860 }, { "epoch": 0.07, "learning_rate": 0.0002894763678140147, "loss": 0.11, "step": 10870 }, { "epoch": 0.07, "learning_rate": 0.0002894666864596578, "loss": 0.1036, "step": 10880 }, { "epoch": 0.07, "learning_rate": 0.00028945700510530086, "loss": 0.1133, "step": 10890 }, { "epoch": 0.07, "learning_rate": 0.0002894473237509439, "loss": 0.1183, "step": 10900 }, { "epoch": 0.07, "learning_rate": 0.00028943764239658696, "loss": 0.111, "step": 10910 }, { "epoch": 0.07, "learning_rate": 0.00028942796104223004, "loss": 0.1195, "step": 10920 }, { "epoch": 0.07, "learning_rate": 0.0002894182796878731, "loss": 0.1145, "step": 10930 }, { "epoch": 0.07, "learning_rate": 0.00028940859833351615, "loss": 0.1164, "step": 10940 }, { "epoch": 0.07, "learning_rate": 0.0002893989169791592, "loss": 0.1166, "step": 10950 }, { "epoch": 0.07, "learning_rate": 0.0002893892356248023, "loss": 0.1019, "step": 10960 }, { "epoch": 0.07, "learning_rate": 0.0002893795542704454, "loss": 0.1066, "step": 10970 }, { "epoch": 0.07, "learning_rate": 0.00028936987291608847, "loss": 0.1175, "step": 10980 }, { "epoch": 0.07, "learning_rate": 0.00028936019156173155, "loss": 0.1139, "step": 10990 }, { "epoch": 0.07, "learning_rate": 0.00028935051020737457, "loss": 0.1142, "step": 11000 }, { "epoch": 0.07, "eval_cer": 0.920128347079426, "eval_loss": 0.07976210117340088, "eval_runtime": 120.34, "eval_samples_per_second": 16.62, "eval_steps_per_second": 4.155, "step": 11000 }, { "epoch": 0.07, "learning_rate": 0.00028934082885301765, "loss": 0.1083, "step": 11010 }, { "epoch": 0.07, "learning_rate": 0.00028933114749866073, "loss": 0.1146, "step": 11020 }, { "epoch": 0.07, "learning_rate": 0.00028932146614430376, "loss": 0.1131, "step": 11030 }, { "epoch": 0.07, "learning_rate": 0.00028931178478994684, "loss": 0.1171, "step": 11040 }, { "epoch": 0.07, "learning_rate": 0.0002893021034355899, "loss": 0.1049, "step": 11050 }, { "epoch": 0.07, "learning_rate": 0.000289292422081233, "loss": 0.1213, "step": 11060 }, { "epoch": 0.07, "learning_rate": 0.0002892827407268761, "loss": 0.1202, "step": 11070 }, { "epoch": 0.07, "learning_rate": 0.0002892730593725191, "loss": 0.1142, "step": 11080 }, { "epoch": 0.07, "learning_rate": 0.0002892633780181622, "loss": 0.1154, "step": 11090 }, { "epoch": 0.07, "learning_rate": 0.00028925369666380526, "loss": 0.1266, "step": 11100 }, { "epoch": 0.07, "learning_rate": 0.00028924401530944834, "loss": 0.1064, "step": 11110 }, { "epoch": 0.07, "learning_rate": 0.0002892343339550914, "loss": 0.1048, "step": 11120 }, { "epoch": 0.07, "learning_rate": 0.0002892246526007345, "loss": 0.1167, "step": 11130 }, { "epoch": 0.07, "learning_rate": 0.0002892149712463775, "loss": 0.1051, "step": 11140 }, { "epoch": 0.07, "learning_rate": 0.0002892052898920206, "loss": 0.1121, "step": 11150 }, { "epoch": 0.07, "learning_rate": 0.0002891956085376637, "loss": 0.1068, "step": 11160 }, { "epoch": 0.07, "learning_rate": 0.0002891859271833067, "loss": 0.1137, "step": 11170 }, { "epoch": 0.07, "learning_rate": 0.0002891762458289498, "loss": 0.1107, "step": 11180 }, { "epoch": 0.07, "learning_rate": 0.00028916656447459287, "loss": 0.1118, "step": 11190 }, { "epoch": 0.07, "learning_rate": 0.00028915688312023595, "loss": 0.1275, "step": 11200 }, { "epoch": 0.07, "learning_rate": 0.00028914720176587903, "loss": 0.1006, "step": 11210 }, { "epoch": 0.07, "learning_rate": 0.00028913752041152206, "loss": 0.1065, "step": 11220 }, { "epoch": 0.07, "learning_rate": 0.00028912783905716514, "loss": 0.1061, "step": 11230 }, { "epoch": 0.07, "learning_rate": 0.0002891181577028082, "loss": 0.1058, "step": 11240 }, { "epoch": 0.07, "learning_rate": 0.0002891084763484513, "loss": 0.1008, "step": 11250 }, { "epoch": 0.07, "learning_rate": 0.0002890987949940944, "loss": 0.1071, "step": 11260 }, { "epoch": 0.07, "learning_rate": 0.0002890891136397374, "loss": 0.1137, "step": 11270 }, { "epoch": 0.07, "learning_rate": 0.0002890794322853805, "loss": 0.1134, "step": 11280 }, { "epoch": 0.07, "learning_rate": 0.00028906975093102356, "loss": 0.1041, "step": 11290 }, { "epoch": 0.07, "learning_rate": 0.0002890600695766666, "loss": 0.1209, "step": 11300 }, { "epoch": 0.07, "learning_rate": 0.00028905038822230967, "loss": 0.1086, "step": 11310 }, { "epoch": 0.07, "learning_rate": 0.00028904070686795275, "loss": 0.1082, "step": 11320 }, { "epoch": 0.07, "learning_rate": 0.0002890310255135958, "loss": 0.1062, "step": 11330 }, { "epoch": 0.07, "learning_rate": 0.0002890213441592389, "loss": 0.111, "step": 11340 }, { "epoch": 0.07, "learning_rate": 0.000289011662804882, "loss": 0.1112, "step": 11350 }, { "epoch": 0.07, "learning_rate": 0.000289001981450525, "loss": 0.1177, "step": 11360 }, { "epoch": 0.07, "learning_rate": 0.0002889923000961681, "loss": 0.1056, "step": 11370 }, { "epoch": 0.07, "learning_rate": 0.00028898261874181117, "loss": 0.1022, "step": 11380 }, { "epoch": 0.07, "learning_rate": 0.00028897293738745425, "loss": 0.1045, "step": 11390 }, { "epoch": 0.07, "learning_rate": 0.0002889632560330973, "loss": 0.1075, "step": 11400 }, { "epoch": 0.07, "learning_rate": 0.00028895357467874036, "loss": 0.1036, "step": 11410 }, { "epoch": 0.07, "learning_rate": 0.00028894389332438343, "loss": 0.1022, "step": 11420 }, { "epoch": 0.07, "learning_rate": 0.00028893421197002646, "loss": 0.1255, "step": 11430 }, { "epoch": 0.07, "learning_rate": 0.00028892453061566954, "loss": 0.1036, "step": 11440 }, { "epoch": 0.07, "learning_rate": 0.0002889148492613126, "loss": 0.1194, "step": 11450 }, { "epoch": 0.07, "learning_rate": 0.0002889051679069557, "loss": 0.1103, "step": 11460 }, { "epoch": 0.07, "learning_rate": 0.0002888954865525988, "loss": 0.1209, "step": 11470 }, { "epoch": 0.07, "learning_rate": 0.00028888580519824186, "loss": 0.114, "step": 11480 }, { "epoch": 0.07, "learning_rate": 0.00028887612384388494, "loss": 0.1153, "step": 11490 }, { "epoch": 0.07, "learning_rate": 0.00028886644248952796, "loss": 0.1126, "step": 11500 }, { "epoch": 0.07, "learning_rate": 0.00028885676113517104, "loss": 0.1131, "step": 11510 }, { "epoch": 0.07, "learning_rate": 0.0002888470797808141, "loss": 0.1094, "step": 11520 }, { "epoch": 0.07, "learning_rate": 0.0002888373984264572, "loss": 0.1006, "step": 11530 }, { "epoch": 0.07, "learning_rate": 0.00028882771707210023, "loss": 0.1115, "step": 11540 }, { "epoch": 0.07, "learning_rate": 0.0002888180357177433, "loss": 0.1005, "step": 11550 }, { "epoch": 0.07, "learning_rate": 0.0002888083543633864, "loss": 0.1102, "step": 11560 }, { "epoch": 0.07, "learning_rate": 0.0002887986730090294, "loss": 0.0981, "step": 11570 }, { "epoch": 0.07, "learning_rate": 0.0002887889916546725, "loss": 0.1029, "step": 11580 }, { "epoch": 0.07, "learning_rate": 0.0002887793103003156, "loss": 0.1115, "step": 11590 }, { "epoch": 0.07, "learning_rate": 0.00028876962894595865, "loss": 0.1028, "step": 11600 }, { "epoch": 0.07, "learning_rate": 0.00028875994759160173, "loss": 0.1053, "step": 11610 }, { "epoch": 0.07, "learning_rate": 0.0002887502662372448, "loss": 0.1137, "step": 11620 }, { "epoch": 0.08, "learning_rate": 0.0002887405848828879, "loss": 0.1059, "step": 11630 }, { "epoch": 0.08, "learning_rate": 0.0002887309035285309, "loss": 0.1125, "step": 11640 }, { "epoch": 0.08, "learning_rate": 0.000288721222174174, "loss": 0.1039, "step": 11650 }, { "epoch": 0.08, "learning_rate": 0.0002887115408198171, "loss": 0.1143, "step": 11660 }, { "epoch": 0.08, "learning_rate": 0.0002887018594654601, "loss": 0.1081, "step": 11670 }, { "epoch": 0.08, "learning_rate": 0.0002886921781111032, "loss": 0.1031, "step": 11680 }, { "epoch": 0.08, "learning_rate": 0.00028868249675674626, "loss": 0.0974, "step": 11690 }, { "epoch": 0.08, "learning_rate": 0.00028867281540238934, "loss": 0.1086, "step": 11700 }, { "epoch": 0.08, "learning_rate": 0.00028866313404803237, "loss": 0.1157, "step": 11710 }, { "epoch": 0.08, "learning_rate": 0.00028865345269367545, "loss": 0.104, "step": 11720 }, { "epoch": 0.08, "learning_rate": 0.00028864377133931853, "loss": 0.1155, "step": 11730 }, { "epoch": 0.08, "learning_rate": 0.0002886340899849616, "loss": 0.1152, "step": 11740 }, { "epoch": 0.08, "learning_rate": 0.0002886244086306047, "loss": 0.1047, "step": 11750 }, { "epoch": 0.08, "learning_rate": 0.00028861472727624777, "loss": 0.107, "step": 11760 }, { "epoch": 0.08, "learning_rate": 0.0002886050459218908, "loss": 0.1107, "step": 11770 }, { "epoch": 0.08, "learning_rate": 0.0002885953645675339, "loss": 0.1163, "step": 11780 }, { "epoch": 0.08, "learning_rate": 0.00028858568321317695, "loss": 0.1133, "step": 11790 }, { "epoch": 0.08, "learning_rate": 0.00028857600185882, "loss": 0.1188, "step": 11800 }, { "epoch": 0.08, "learning_rate": 0.00028856632050446306, "loss": 0.1077, "step": 11810 }, { "epoch": 0.08, "learning_rate": 0.00028855663915010614, "loss": 0.1058, "step": 11820 }, { "epoch": 0.08, "learning_rate": 0.0002885469577957492, "loss": 0.11, "step": 11830 }, { "epoch": 0.08, "learning_rate": 0.0002885372764413923, "loss": 0.1238, "step": 11840 }, { "epoch": 0.08, "learning_rate": 0.0002885275950870353, "loss": 0.1099, "step": 11850 }, { "epoch": 0.08, "learning_rate": 0.0002885179137326784, "loss": 0.108, "step": 11860 }, { "epoch": 0.08, "learning_rate": 0.0002885082323783215, "loss": 0.113, "step": 11870 }, { "epoch": 0.08, "learning_rate": 0.00028849855102396456, "loss": 0.1078, "step": 11880 }, { "epoch": 0.08, "learning_rate": 0.00028848886966960764, "loss": 0.109, "step": 11890 }, { "epoch": 0.08, "learning_rate": 0.0002884791883152507, "loss": 0.1145, "step": 11900 }, { "epoch": 0.08, "learning_rate": 0.00028846950696089375, "loss": 0.1139, "step": 11910 }, { "epoch": 0.08, "learning_rate": 0.00028845982560653683, "loss": 0.1083, "step": 11920 }, { "epoch": 0.08, "learning_rate": 0.0002884501442521799, "loss": 0.1032, "step": 11930 }, { "epoch": 0.08, "learning_rate": 0.00028844046289782293, "loss": 0.0933, "step": 11940 }, { "epoch": 0.08, "learning_rate": 0.000288430781543466, "loss": 0.1059, "step": 11950 }, { "epoch": 0.08, "learning_rate": 0.0002884211001891091, "loss": 0.1007, "step": 11960 }, { "epoch": 0.08, "learning_rate": 0.00028841141883475217, "loss": 0.1074, "step": 11970 }, { "epoch": 0.08, "learning_rate": 0.00028840173748039525, "loss": 0.1127, "step": 11980 }, { "epoch": 0.08, "learning_rate": 0.0002883920561260383, "loss": 0.1007, "step": 11990 }, { "epoch": 0.08, "learning_rate": 0.00028838237477168136, "loss": 0.1081, "step": 12000 }, { "epoch": 0.08, "eval_cer": 0.920316348435205, "eval_loss": 0.07571277767419815, "eval_runtime": 120.2448, "eval_samples_per_second": 16.633, "eval_steps_per_second": 4.158, "step": 12000 }, { "epoch": 0.08, "learning_rate": 0.00028837269341732444, "loss": 0.1088, "step": 12010 }, { "epoch": 0.08, "learning_rate": 0.0002883630120629675, "loss": 0.111, "step": 12020 }, { "epoch": 0.08, "learning_rate": 0.0002883533307086106, "loss": 0.1104, "step": 12030 }, { "epoch": 0.08, "learning_rate": 0.0002883436493542536, "loss": 0.1104, "step": 12040 }, { "epoch": 0.08, "learning_rate": 0.0002883339679998967, "loss": 0.1076, "step": 12050 }, { "epoch": 0.08, "learning_rate": 0.0002883242866455398, "loss": 0.1234, "step": 12060 }, { "epoch": 0.08, "learning_rate": 0.0002883146052911828, "loss": 0.1044, "step": 12070 }, { "epoch": 0.08, "learning_rate": 0.0002883049239368259, "loss": 0.1194, "step": 12080 }, { "epoch": 0.08, "learning_rate": 0.00028829524258246897, "loss": 0.1128, "step": 12090 }, { "epoch": 0.08, "learning_rate": 0.00028828556122811205, "loss": 0.1037, "step": 12100 }, { "epoch": 0.08, "learning_rate": 0.00028827587987375513, "loss": 0.1062, "step": 12110 }, { "epoch": 0.08, "learning_rate": 0.0002882661985193982, "loss": 0.1088, "step": 12120 }, { "epoch": 0.08, "learning_rate": 0.00028825651716504123, "loss": 0.1076, "step": 12130 }, { "epoch": 0.08, "learning_rate": 0.0002882468358106843, "loss": 0.116, "step": 12140 }, { "epoch": 0.08, "learning_rate": 0.0002882371544563274, "loss": 0.1093, "step": 12150 }, { "epoch": 0.08, "learning_rate": 0.00028822747310197047, "loss": 0.1039, "step": 12160 }, { "epoch": 0.08, "learning_rate": 0.0002882177917476135, "loss": 0.1146, "step": 12170 }, { "epoch": 0.08, "learning_rate": 0.0002882081103932566, "loss": 0.1074, "step": 12180 }, { "epoch": 0.08, "learning_rate": 0.00028819842903889966, "loss": 0.1046, "step": 12190 }, { "epoch": 0.08, "learning_rate": 0.0002881887476845427, "loss": 0.1088, "step": 12200 }, { "epoch": 0.08, "learning_rate": 0.00028817906633018576, "loss": 0.11, "step": 12210 }, { "epoch": 0.08, "learning_rate": 0.00028816938497582884, "loss": 0.1105, "step": 12220 }, { "epoch": 0.08, "learning_rate": 0.0002881597036214719, "loss": 0.1048, "step": 12230 }, { "epoch": 0.08, "learning_rate": 0.000288150022267115, "loss": 0.1145, "step": 12240 }, { "epoch": 0.08, "learning_rate": 0.0002881403409127581, "loss": 0.1006, "step": 12250 }, { "epoch": 0.08, "learning_rate": 0.00028813065955840116, "loss": 0.0995, "step": 12260 }, { "epoch": 0.08, "learning_rate": 0.0002881209782040442, "loss": 0.1108, "step": 12270 }, { "epoch": 0.08, "learning_rate": 0.00028811129684968727, "loss": 0.1227, "step": 12280 }, { "epoch": 0.08, "learning_rate": 0.00028810161549533035, "loss": 0.1099, "step": 12290 }, { "epoch": 0.08, "learning_rate": 0.0002880919341409734, "loss": 0.1059, "step": 12300 }, { "epoch": 0.08, "learning_rate": 0.00028808225278661645, "loss": 0.1061, "step": 12310 }, { "epoch": 0.08, "learning_rate": 0.00028807257143225953, "loss": 0.112, "step": 12320 }, { "epoch": 0.08, "learning_rate": 0.0002880628900779026, "loss": 0.1048, "step": 12330 }, { "epoch": 0.08, "learning_rate": 0.00028805320872354564, "loss": 0.1037, "step": 12340 }, { "epoch": 0.08, "learning_rate": 0.0002880435273691887, "loss": 0.1008, "step": 12350 }, { "epoch": 0.08, "learning_rate": 0.0002880338460148318, "loss": 0.0988, "step": 12360 }, { "epoch": 0.08, "learning_rate": 0.0002880241646604749, "loss": 0.11, "step": 12370 }, { "epoch": 0.08, "learning_rate": 0.00028801448330611796, "loss": 0.1127, "step": 12380 }, { "epoch": 0.08, "learning_rate": 0.00028800480195176104, "loss": 0.1076, "step": 12390 }, { "epoch": 0.08, "learning_rate": 0.0002879951205974041, "loss": 0.1037, "step": 12400 }, { "epoch": 0.08, "learning_rate": 0.00028798543924304714, "loss": 0.1055, "step": 12410 }, { "epoch": 0.08, "learning_rate": 0.0002879757578886902, "loss": 0.1052, "step": 12420 }, { "epoch": 0.08, "learning_rate": 0.0002879660765343333, "loss": 0.0989, "step": 12430 }, { "epoch": 0.08, "learning_rate": 0.0002879563951799763, "loss": 0.1195, "step": 12440 }, { "epoch": 0.08, "learning_rate": 0.0002879467138256194, "loss": 0.1037, "step": 12450 }, { "epoch": 0.08, "learning_rate": 0.0002879370324712625, "loss": 0.1097, "step": 12460 }, { "epoch": 0.08, "learning_rate": 0.00028792735111690557, "loss": 0.1202, "step": 12470 }, { "epoch": 0.08, "learning_rate": 0.0002879176697625486, "loss": 0.1073, "step": 12480 }, { "epoch": 0.08, "learning_rate": 0.00028790798840819167, "loss": 0.1054, "step": 12490 }, { "epoch": 0.08, "learning_rate": 0.00028789830705383475, "loss": 0.0992, "step": 12500 }, { "epoch": 0.08, "learning_rate": 0.00028788862569947783, "loss": 0.1095, "step": 12510 }, { "epoch": 0.08, "learning_rate": 0.0002878789443451209, "loss": 0.1057, "step": 12520 }, { "epoch": 0.08, "learning_rate": 0.000287869262990764, "loss": 0.1009, "step": 12530 }, { "epoch": 0.08, "learning_rate": 0.00028785958163640707, "loss": 0.1088, "step": 12540 }, { "epoch": 0.08, "learning_rate": 0.0002878499002820501, "loss": 0.1106, "step": 12550 }, { "epoch": 0.08, "learning_rate": 0.0002878402189276932, "loss": 0.1064, "step": 12560 }, { "epoch": 0.08, "learning_rate": 0.0002878305375733362, "loss": 0.1094, "step": 12570 }, { "epoch": 0.08, "learning_rate": 0.0002878208562189793, "loss": 0.1145, "step": 12580 }, { "epoch": 0.08, "learning_rate": 0.00028781117486462236, "loss": 0.1088, "step": 12590 }, { "epoch": 0.08, "learning_rate": 0.00028780149351026544, "loss": 0.1171, "step": 12600 }, { "epoch": 0.08, "learning_rate": 0.0002877918121559085, "loss": 0.101, "step": 12610 }, { "epoch": 0.08, "learning_rate": 0.00028778213080155155, "loss": 0.1133, "step": 12620 }, { "epoch": 0.08, "learning_rate": 0.0002877724494471946, "loss": 0.1089, "step": 12630 }, { "epoch": 0.08, "learning_rate": 0.0002877627680928377, "loss": 0.1027, "step": 12640 }, { "epoch": 0.08, "learning_rate": 0.0002877530867384808, "loss": 0.1025, "step": 12650 }, { "epoch": 0.08, "learning_rate": 0.00028774340538412387, "loss": 0.1063, "step": 12660 }, { "epoch": 0.08, "learning_rate": 0.00028773372402976695, "loss": 0.1088, "step": 12670 }, { "epoch": 0.08, "learning_rate": 0.00028772404267540997, "loss": 0.1023, "step": 12680 }, { "epoch": 0.08, "learning_rate": 0.00028771436132105305, "loss": 0.1077, "step": 12690 }, { "epoch": 0.08, "learning_rate": 0.00028770467996669613, "loss": 0.1099, "step": 12700 }, { "epoch": 0.08, "learning_rate": 0.00028769499861233916, "loss": 0.1072, "step": 12710 }, { "epoch": 0.08, "learning_rate": 0.00028768531725798224, "loss": 0.106, "step": 12720 }, { "epoch": 0.08, "learning_rate": 0.0002876756359036253, "loss": 0.1086, "step": 12730 }, { "epoch": 0.08, "learning_rate": 0.0002876659545492684, "loss": 0.1094, "step": 12740 }, { "epoch": 0.08, "learning_rate": 0.0002876562731949115, "loss": 0.1035, "step": 12750 }, { "epoch": 0.08, "learning_rate": 0.0002876465918405545, "loss": 0.1051, "step": 12760 }, { "epoch": 0.08, "learning_rate": 0.0002876369104861976, "loss": 0.1097, "step": 12770 }, { "epoch": 0.08, "learning_rate": 0.00028762722913184066, "loss": 0.1026, "step": 12780 }, { "epoch": 0.08, "learning_rate": 0.00028761754777748374, "loss": 0.1115, "step": 12790 }, { "epoch": 0.08, "learning_rate": 0.0002876078664231268, "loss": 0.1126, "step": 12800 }, { "epoch": 0.08, "learning_rate": 0.00028759818506876985, "loss": 0.1075, "step": 12810 }, { "epoch": 0.08, "learning_rate": 0.0002875885037144129, "loss": 0.1071, "step": 12820 }, { "epoch": 0.08, "learning_rate": 0.000287578822360056, "loss": 0.1042, "step": 12830 }, { "epoch": 0.08, "learning_rate": 0.00028756914100569903, "loss": 0.1119, "step": 12840 }, { "epoch": 0.08, "learning_rate": 0.0002875594596513421, "loss": 0.1126, "step": 12850 }, { "epoch": 0.08, "learning_rate": 0.0002875497782969852, "loss": 0.1006, "step": 12860 }, { "epoch": 0.08, "learning_rate": 0.00028754009694262827, "loss": 0.1066, "step": 12870 }, { "epoch": 0.08, "learning_rate": 0.00028753041558827135, "loss": 0.1041, "step": 12880 }, { "epoch": 0.08, "learning_rate": 0.00028752073423391443, "loss": 0.1031, "step": 12890 }, { "epoch": 0.08, "learning_rate": 0.00028751105287955746, "loss": 0.1085, "step": 12900 }, { "epoch": 0.08, "learning_rate": 0.00028750137152520053, "loss": 0.1102, "step": 12910 }, { "epoch": 0.08, "learning_rate": 0.0002874916901708436, "loss": 0.0984, "step": 12920 }, { "epoch": 0.08, "learning_rate": 0.0002874820088164867, "loss": 0.0965, "step": 12930 }, { "epoch": 0.08, "learning_rate": 0.0002874723274621298, "loss": 0.1145, "step": 12940 }, { "epoch": 0.08, "learning_rate": 0.0002874626461077728, "loss": 0.1155, "step": 12950 }, { "epoch": 0.08, "learning_rate": 0.0002874529647534159, "loss": 0.1136, "step": 12960 }, { "epoch": 0.08, "learning_rate": 0.00028744328339905896, "loss": 0.1069, "step": 12970 }, { "epoch": 0.08, "learning_rate": 0.000287433602044702, "loss": 0.1121, "step": 12980 }, { "epoch": 0.08, "learning_rate": 0.00028742392069034506, "loss": 0.1005, "step": 12990 }, { "epoch": 0.08, "learning_rate": 0.00028741423933598814, "loss": 0.0987, "step": 13000 }, { "epoch": 0.08, "eval_cer": 0.9200958083832336, "eval_loss": 0.07392711937427521, "eval_runtime": 120.3312, "eval_samples_per_second": 16.621, "eval_steps_per_second": 4.155, "step": 13000 }, { "epoch": 0.08, "learning_rate": 0.0002874045579816312, "loss": 0.1149, "step": 13010 }, { "epoch": 0.08, "learning_rate": 0.0002873948766272743, "loss": 0.1011, "step": 13020 }, { "epoch": 0.08, "learning_rate": 0.0002873851952729174, "loss": 0.1136, "step": 13030 }, { "epoch": 0.08, "learning_rate": 0.0002873755139185604, "loss": 0.1109, "step": 13040 }, { "epoch": 0.08, "learning_rate": 0.0002873658325642035, "loss": 0.1117, "step": 13050 }, { "epoch": 0.08, "learning_rate": 0.00028735615120984657, "loss": 0.1051, "step": 13060 }, { "epoch": 0.08, "learning_rate": 0.00028734646985548965, "loss": 0.1075, "step": 13070 }, { "epoch": 0.08, "learning_rate": 0.0002873367885011327, "loss": 0.1025, "step": 13080 }, { "epoch": 0.08, "learning_rate": 0.00028732710714677575, "loss": 0.0982, "step": 13090 }, { "epoch": 0.08, "learning_rate": 0.00028731742579241883, "loss": 0.1047, "step": 13100 }, { "epoch": 0.08, "learning_rate": 0.00028730774443806186, "loss": 0.1087, "step": 13110 }, { "epoch": 0.08, "learning_rate": 0.00028729806308370494, "loss": 0.1004, "step": 13120 }, { "epoch": 0.08, "learning_rate": 0.000287288381729348, "loss": 0.1101, "step": 13130 }, { "epoch": 0.08, "learning_rate": 0.0002872787003749911, "loss": 0.1023, "step": 13140 }, { "epoch": 0.08, "learning_rate": 0.0002872690190206342, "loss": 0.111, "step": 13150 }, { "epoch": 0.08, "learning_rate": 0.00028725933766627726, "loss": 0.1117, "step": 13160 }, { "epoch": 0.09, "learning_rate": 0.00028724965631192034, "loss": 0.1172, "step": 13170 }, { "epoch": 0.09, "learning_rate": 0.00028723997495756336, "loss": 0.1033, "step": 13180 }, { "epoch": 0.09, "learning_rate": 0.00028723029360320644, "loss": 0.1043, "step": 13190 }, { "epoch": 0.09, "learning_rate": 0.0002872206122488495, "loss": 0.1074, "step": 13200 }, { "epoch": 0.09, "learning_rate": 0.00028721093089449255, "loss": 0.1021, "step": 13210 }, { "epoch": 0.09, "learning_rate": 0.00028720124954013563, "loss": 0.0979, "step": 13220 }, { "epoch": 0.09, "learning_rate": 0.0002871915681857787, "loss": 0.1012, "step": 13230 }, { "epoch": 0.09, "learning_rate": 0.0002871818868314218, "loss": 0.0964, "step": 13240 }, { "epoch": 0.09, "learning_rate": 0.0002871722054770648, "loss": 0.1136, "step": 13250 }, { "epoch": 0.09, "learning_rate": 0.0002871625241227079, "loss": 0.1072, "step": 13260 }, { "epoch": 0.09, "learning_rate": 0.000287152842768351, "loss": 0.1078, "step": 13270 }, { "epoch": 0.09, "learning_rate": 0.00028714316141399405, "loss": 0.1058, "step": 13280 }, { "epoch": 0.09, "learning_rate": 0.00028713348005963713, "loss": 0.0991, "step": 13290 }, { "epoch": 0.09, "learning_rate": 0.0002871237987052802, "loss": 0.1021, "step": 13300 }, { "epoch": 0.09, "learning_rate": 0.0002871141173509233, "loss": 0.1068, "step": 13310 }, { "epoch": 0.09, "learning_rate": 0.0002871044359965663, "loss": 0.1028, "step": 13320 }, { "epoch": 0.09, "learning_rate": 0.0002870947546422094, "loss": 0.1019, "step": 13330 }, { "epoch": 0.09, "learning_rate": 0.0002870850732878525, "loss": 0.0967, "step": 13340 }, { "epoch": 0.09, "learning_rate": 0.0002870753919334955, "loss": 0.1013, "step": 13350 }, { "epoch": 0.09, "learning_rate": 0.0002870657105791386, "loss": 0.1055, "step": 13360 }, { "epoch": 0.09, "learning_rate": 0.00028705602922478166, "loss": 0.0909, "step": 13370 }, { "epoch": 0.09, "learning_rate": 0.00028704634787042474, "loss": 0.1077, "step": 13380 }, { "epoch": 0.09, "learning_rate": 0.00028703666651606777, "loss": 0.1056, "step": 13390 }, { "epoch": 0.09, "learning_rate": 0.00028702698516171085, "loss": 0.0997, "step": 13400 }, { "epoch": 0.09, "learning_rate": 0.00028701730380735393, "loss": 0.0975, "step": 13410 }, { "epoch": 0.09, "learning_rate": 0.000287007622452997, "loss": 0.0976, "step": 13420 }, { "epoch": 0.09, "learning_rate": 0.0002869979410986401, "loss": 0.1058, "step": 13430 }, { "epoch": 0.09, "learning_rate": 0.00028698825974428317, "loss": 0.101, "step": 13440 }, { "epoch": 0.09, "learning_rate": 0.0002869785783899262, "loss": 0.1106, "step": 13450 }, { "epoch": 0.09, "learning_rate": 0.0002869688970355693, "loss": 0.0943, "step": 13460 }, { "epoch": 0.09, "learning_rate": 0.00028695921568121235, "loss": 0.1046, "step": 13470 }, { "epoch": 0.09, "learning_rate": 0.0002869495343268554, "loss": 0.1279, "step": 13480 }, { "epoch": 0.09, "learning_rate": 0.00028693985297249846, "loss": 0.1141, "step": 13490 }, { "epoch": 0.09, "learning_rate": 0.00028693017161814154, "loss": 0.1097, "step": 13500 }, { "epoch": 0.09, "learning_rate": 0.0002869204902637846, "loss": 0.1144, "step": 13510 }, { "epoch": 0.09, "learning_rate": 0.0002869108089094277, "loss": 0.1093, "step": 13520 }, { "epoch": 0.09, "learning_rate": 0.0002869011275550707, "loss": 0.1072, "step": 13530 }, { "epoch": 0.09, "learning_rate": 0.0002868914462007138, "loss": 0.1045, "step": 13540 }, { "epoch": 0.09, "learning_rate": 0.0002868817648463569, "loss": 0.1038, "step": 13550 }, { "epoch": 0.09, "learning_rate": 0.00028687208349199996, "loss": 0.1176, "step": 13560 }, { "epoch": 0.09, "learning_rate": 0.00028686240213764304, "loss": 0.1019, "step": 13570 }, { "epoch": 0.09, "learning_rate": 0.00028685272078328607, "loss": 0.1171, "step": 13580 }, { "epoch": 0.09, "learning_rate": 0.00028684303942892915, "loss": 0.1281, "step": 13590 }, { "epoch": 0.09, "learning_rate": 0.00028683335807457223, "loss": 0.1104, "step": 13600 }, { "epoch": 0.09, "learning_rate": 0.00028682367672021525, "loss": 0.1136, "step": 13610 }, { "epoch": 0.09, "learning_rate": 0.00028681399536585833, "loss": 0.1009, "step": 13620 }, { "epoch": 0.09, "learning_rate": 0.0002868043140115014, "loss": 0.1042, "step": 13630 }, { "epoch": 0.09, "learning_rate": 0.0002867946326571445, "loss": 0.1112, "step": 13640 }, { "epoch": 0.09, "learning_rate": 0.00028678495130278757, "loss": 0.1037, "step": 13650 }, { "epoch": 0.09, "learning_rate": 0.00028677526994843065, "loss": 0.106, "step": 13660 }, { "epoch": 0.09, "learning_rate": 0.0002867655885940737, "loss": 0.1124, "step": 13670 }, { "epoch": 0.09, "learning_rate": 0.00028675590723971676, "loss": 0.1055, "step": 13680 }, { "epoch": 0.09, "learning_rate": 0.00028674622588535984, "loss": 0.1024, "step": 13690 }, { "epoch": 0.09, "learning_rate": 0.0002867365445310029, "loss": 0.1022, "step": 13700 }, { "epoch": 0.09, "learning_rate": 0.000286726863176646, "loss": 0.0967, "step": 13710 }, { "epoch": 0.09, "learning_rate": 0.000286717181822289, "loss": 0.1016, "step": 13720 }, { "epoch": 0.09, "learning_rate": 0.0002867075004679321, "loss": 0.0918, "step": 13730 }, { "epoch": 0.09, "learning_rate": 0.0002866978191135752, "loss": 0.0949, "step": 13740 }, { "epoch": 0.09, "learning_rate": 0.0002866881377592182, "loss": 0.1166, "step": 13750 }, { "epoch": 0.09, "learning_rate": 0.0002866784564048613, "loss": 0.1115, "step": 13760 }, { "epoch": 0.09, "learning_rate": 0.00028666877505050437, "loss": 0.1073, "step": 13770 }, { "epoch": 0.09, "learning_rate": 0.00028665909369614745, "loss": 0.1031, "step": 13780 }, { "epoch": 0.09, "learning_rate": 0.0002866494123417905, "loss": 0.105, "step": 13790 }, { "epoch": 0.09, "learning_rate": 0.0002866397309874336, "loss": 0.1006, "step": 13800 }, { "epoch": 0.09, "learning_rate": 0.00028663004963307663, "loss": 0.1089, "step": 13810 }, { "epoch": 0.09, "learning_rate": 0.0002866203682787197, "loss": 0.1081, "step": 13820 }, { "epoch": 0.09, "learning_rate": 0.0002866106869243628, "loss": 0.1045, "step": 13830 }, { "epoch": 0.09, "learning_rate": 0.00028660100557000587, "loss": 0.0947, "step": 13840 }, { "epoch": 0.09, "learning_rate": 0.0002865913242156489, "loss": 0.1136, "step": 13850 }, { "epoch": 0.09, "learning_rate": 0.000286581642861292, "loss": 0.1049, "step": 13860 }, { "epoch": 0.09, "learning_rate": 0.00028657196150693506, "loss": 0.1044, "step": 13870 }, { "epoch": 0.09, "learning_rate": 0.0002865622801525781, "loss": 0.111, "step": 13880 }, { "epoch": 0.09, "learning_rate": 0.00028655259879822116, "loss": 0.1042, "step": 13890 }, { "epoch": 0.09, "learning_rate": 0.00028654291744386424, "loss": 0.106, "step": 13900 }, { "epoch": 0.09, "learning_rate": 0.0002865332360895073, "loss": 0.1027, "step": 13910 }, { "epoch": 0.09, "learning_rate": 0.0002865235547351504, "loss": 0.1079, "step": 13920 }, { "epoch": 0.09, "learning_rate": 0.0002865138733807935, "loss": 0.1066, "step": 13930 }, { "epoch": 0.09, "learning_rate": 0.00028650419202643656, "loss": 0.1073, "step": 13940 }, { "epoch": 0.09, "learning_rate": 0.0002864945106720796, "loss": 0.1035, "step": 13950 }, { "epoch": 0.09, "learning_rate": 0.00028648482931772267, "loss": 0.1221, "step": 13960 }, { "epoch": 0.09, "learning_rate": 0.00028647514796336575, "loss": 0.1062, "step": 13970 }, { "epoch": 0.09, "learning_rate": 0.00028646546660900877, "loss": 0.1043, "step": 13980 }, { "epoch": 0.09, "learning_rate": 0.00028645578525465185, "loss": 0.1011, "step": 13990 }, { "epoch": 0.09, "learning_rate": 0.00028644610390029493, "loss": 0.1103, "step": 14000 }, { "epoch": 0.09, "eval_cer": 0.9202286747260197, "eval_loss": 0.07276194542646408, "eval_runtime": 120.2789, "eval_samples_per_second": 16.628, "eval_steps_per_second": 4.157, "step": 14000 }, { "epoch": 0.09, "learning_rate": 0.000286436422545938, "loss": 0.1069, "step": 14010 }, { "epoch": 0.09, "learning_rate": 0.00028642674119158104, "loss": 0.1014, "step": 14020 }, { "epoch": 0.09, "learning_rate": 0.0002864170598372241, "loss": 0.1042, "step": 14030 }, { "epoch": 0.09, "learning_rate": 0.0002864073784828672, "loss": 0.1031, "step": 14040 }, { "epoch": 0.09, "learning_rate": 0.0002863976971285103, "loss": 0.1017, "step": 14050 }, { "epoch": 0.09, "learning_rate": 0.00028638801577415336, "loss": 0.1092, "step": 14060 }, { "epoch": 0.09, "learning_rate": 0.00028637833441979644, "loss": 0.139, "step": 14070 }, { "epoch": 0.09, "learning_rate": 0.0002863686530654395, "loss": 0.1212, "step": 14080 }, { "epoch": 0.09, "learning_rate": 0.00028635897171108254, "loss": 0.1001, "step": 14090 }, { "epoch": 0.09, "learning_rate": 0.0002863492903567256, "loss": 0.1005, "step": 14100 }, { "epoch": 0.09, "learning_rate": 0.0002863396090023687, "loss": 0.0959, "step": 14110 }, { "epoch": 0.09, "learning_rate": 0.0002863299276480117, "loss": 0.1051, "step": 14120 }, { "epoch": 0.09, "learning_rate": 0.0002863202462936548, "loss": 0.101, "step": 14130 }, { "epoch": 0.09, "learning_rate": 0.0002863105649392979, "loss": 0.0959, "step": 14140 }, { "epoch": 0.09, "learning_rate": 0.00028630088358494097, "loss": 0.1032, "step": 14150 }, { "epoch": 0.09, "learning_rate": 0.000286291202230584, "loss": 0.0946, "step": 14160 }, { "epoch": 0.09, "learning_rate": 0.00028628152087622707, "loss": 0.104, "step": 14170 }, { "epoch": 0.09, "learning_rate": 0.00028627183952187015, "loss": 0.1004, "step": 14180 }, { "epoch": 0.09, "learning_rate": 0.00028626215816751323, "loss": 0.1112, "step": 14190 }, { "epoch": 0.09, "learning_rate": 0.0002862524768131563, "loss": 0.1029, "step": 14200 }, { "epoch": 0.09, "learning_rate": 0.0002862427954587994, "loss": 0.101, "step": 14210 }, { "epoch": 0.09, "learning_rate": 0.0002862331141044424, "loss": 0.1008, "step": 14220 }, { "epoch": 0.09, "learning_rate": 0.0002862234327500855, "loss": 0.0969, "step": 14230 }, { "epoch": 0.09, "learning_rate": 0.0002862137513957286, "loss": 0.1021, "step": 14240 }, { "epoch": 0.09, "learning_rate": 0.0002862040700413716, "loss": 0.1099, "step": 14250 }, { "epoch": 0.09, "learning_rate": 0.0002861943886870147, "loss": 0.1084, "step": 14260 }, { "epoch": 0.09, "learning_rate": 0.00028618470733265776, "loss": 0.1078, "step": 14270 }, { "epoch": 0.09, "learning_rate": 0.00028617502597830084, "loss": 0.1011, "step": 14280 }, { "epoch": 0.09, "learning_rate": 0.0002861653446239439, "loss": 0.1044, "step": 14290 }, { "epoch": 0.09, "learning_rate": 0.00028615566326958695, "loss": 0.1026, "step": 14300 }, { "epoch": 0.09, "learning_rate": 0.00028614598191523, "loss": 0.101, "step": 14310 }, { "epoch": 0.09, "learning_rate": 0.0002861363005608731, "loss": 0.1053, "step": 14320 }, { "epoch": 0.09, "learning_rate": 0.0002861266192065162, "loss": 0.0979, "step": 14330 }, { "epoch": 0.09, "learning_rate": 0.00028611693785215926, "loss": 0.1103, "step": 14340 }, { "epoch": 0.09, "learning_rate": 0.00028610725649780234, "loss": 0.1124, "step": 14350 }, { "epoch": 0.09, "learning_rate": 0.00028609757514344537, "loss": 0.1092, "step": 14360 }, { "epoch": 0.09, "learning_rate": 0.00028608789378908845, "loss": 0.1079, "step": 14370 }, { "epoch": 0.09, "learning_rate": 0.0002860782124347315, "loss": 0.0947, "step": 14380 }, { "epoch": 0.09, "learning_rate": 0.00028606853108037456, "loss": 0.1024, "step": 14390 }, { "epoch": 0.09, "learning_rate": 0.00028605884972601763, "loss": 0.1067, "step": 14400 }, { "epoch": 0.09, "learning_rate": 0.0002860491683716607, "loss": 0.1036, "step": 14410 }, { "epoch": 0.09, "learning_rate": 0.0002860394870173038, "loss": 0.1066, "step": 14420 }, { "epoch": 0.09, "learning_rate": 0.0002860298056629469, "loss": 0.1053, "step": 14430 }, { "epoch": 0.09, "learning_rate": 0.0002860201243085899, "loss": 0.1058, "step": 14440 }, { "epoch": 0.09, "learning_rate": 0.000286010442954233, "loss": 0.1182, "step": 14450 }, { "epoch": 0.09, "learning_rate": 0.00028600076159987606, "loss": 0.1034, "step": 14460 }, { "epoch": 0.09, "learning_rate": 0.00028599108024551914, "loss": 0.1111, "step": 14470 }, { "epoch": 0.09, "learning_rate": 0.0002859813988911622, "loss": 0.099, "step": 14480 }, { "epoch": 0.09, "learning_rate": 0.00028597171753680524, "loss": 0.1009, "step": 14490 }, { "epoch": 0.09, "learning_rate": 0.0002859620361824483, "loss": 0.0996, "step": 14500 }, { "epoch": 0.09, "learning_rate": 0.0002859523548280914, "loss": 0.0919, "step": 14510 }, { "epoch": 0.09, "learning_rate": 0.00028594267347373443, "loss": 0.099, "step": 14520 }, { "epoch": 0.09, "learning_rate": 0.0002859329921193775, "loss": 0.1008, "step": 14530 }, { "epoch": 0.09, "learning_rate": 0.0002859233107650206, "loss": 0.0936, "step": 14540 }, { "epoch": 0.09, "learning_rate": 0.00028591362941066367, "loss": 0.0996, "step": 14550 }, { "epoch": 0.09, "learning_rate": 0.00028590394805630675, "loss": 0.0957, "step": 14560 }, { "epoch": 0.09, "learning_rate": 0.00028589426670194983, "loss": 0.0986, "step": 14570 }, { "epoch": 0.09, "learning_rate": 0.00028588458534759285, "loss": 0.1045, "step": 14580 }, { "epoch": 0.09, "learning_rate": 0.00028587490399323593, "loss": 0.1011, "step": 14590 }, { "epoch": 0.09, "learning_rate": 0.000285865222638879, "loss": 0.0972, "step": 14600 }, { "epoch": 0.09, "learning_rate": 0.0002858555412845221, "loss": 0.1052, "step": 14610 }, { "epoch": 0.09, "learning_rate": 0.0002858458599301651, "loss": 0.1155, "step": 14620 }, { "epoch": 0.09, "learning_rate": 0.0002858361785758082, "loss": 0.0995, "step": 14630 }, { "epoch": 0.09, "learning_rate": 0.0002858264972214513, "loss": 0.1212, "step": 14640 }, { "epoch": 0.09, "learning_rate": 0.0002858168158670943, "loss": 0.1033, "step": 14650 }, { "epoch": 0.09, "learning_rate": 0.0002858071345127374, "loss": 0.1007, "step": 14660 }, { "epoch": 0.09, "learning_rate": 0.00028579745315838046, "loss": 0.0987, "step": 14670 }, { "epoch": 0.09, "learning_rate": 0.00028578777180402354, "loss": 0.1038, "step": 14680 }, { "epoch": 0.09, "learning_rate": 0.0002857780904496666, "loss": 0.1036, "step": 14690 }, { "epoch": 0.09, "learning_rate": 0.0002857684090953097, "loss": 0.0976, "step": 14700 }, { "epoch": 0.09, "learning_rate": 0.0002857587277409528, "loss": 0.106, "step": 14710 }, { "epoch": 0.1, "learning_rate": 0.0002857490463865958, "loss": 0.1001, "step": 14720 }, { "epoch": 0.1, "learning_rate": 0.0002857393650322389, "loss": 0.0998, "step": 14730 }, { "epoch": 0.1, "learning_rate": 0.00028572968367788197, "loss": 0.0958, "step": 14740 }, { "epoch": 0.1, "learning_rate": 0.00028572000232352505, "loss": 0.1017, "step": 14750 }, { "epoch": 0.1, "learning_rate": 0.0002857103209691681, "loss": 0.0914, "step": 14760 }, { "epoch": 0.1, "learning_rate": 0.00028570063961481115, "loss": 0.0973, "step": 14770 }, { "epoch": 0.1, "learning_rate": 0.00028569095826045423, "loss": 0.1059, "step": 14780 }, { "epoch": 0.1, "learning_rate": 0.00028568127690609726, "loss": 0.087, "step": 14790 }, { "epoch": 0.1, "learning_rate": 0.00028567159555174034, "loss": 0.0975, "step": 14800 }, { "epoch": 0.1, "learning_rate": 0.0002856619141973834, "loss": 0.0959, "step": 14810 }, { "epoch": 0.1, "learning_rate": 0.0002856522328430265, "loss": 0.1045, "step": 14820 }, { "epoch": 0.1, "learning_rate": 0.0002856425514886696, "loss": 0.1027, "step": 14830 }, { "epoch": 0.1, "learning_rate": 0.00028563287013431266, "loss": 0.1016, "step": 14840 }, { "epoch": 0.1, "learning_rate": 0.00028562318877995574, "loss": 0.1028, "step": 14850 }, { "epoch": 0.1, "learning_rate": 0.00028561350742559876, "loss": 0.1035, "step": 14860 }, { "epoch": 0.1, "learning_rate": 0.00028560382607124184, "loss": 0.0938, "step": 14870 }, { "epoch": 0.1, "learning_rate": 0.0002855941447168849, "loss": 0.106, "step": 14880 }, { "epoch": 0.1, "learning_rate": 0.00028558446336252795, "loss": 0.1043, "step": 14890 }, { "epoch": 0.1, "learning_rate": 0.00028557478200817103, "loss": 0.0851, "step": 14900 }, { "epoch": 0.1, "learning_rate": 0.0002855651006538141, "loss": 0.0939, "step": 14910 }, { "epoch": 0.1, "learning_rate": 0.0002855554192994572, "loss": 0.0974, "step": 14920 }, { "epoch": 0.1, "learning_rate": 0.0002855457379451002, "loss": 0.0912, "step": 14930 }, { "epoch": 0.1, "learning_rate": 0.0002855360565907433, "loss": 0.0976, "step": 14940 }, { "epoch": 0.1, "learning_rate": 0.0002855263752363864, "loss": 0.0929, "step": 14950 }, { "epoch": 0.1, "learning_rate": 0.00028551669388202945, "loss": 0.0936, "step": 14960 }, { "epoch": 0.1, "learning_rate": 0.00028550701252767253, "loss": 0.0907, "step": 14970 }, { "epoch": 0.1, "learning_rate": 0.0002854973311733156, "loss": 0.0955, "step": 14980 }, { "epoch": 0.1, "learning_rate": 0.00028548764981895864, "loss": 0.1038, "step": 14990 }, { "epoch": 0.1, "learning_rate": 0.0002854779684646017, "loss": 0.0961, "step": 15000 }, { "epoch": 0.1, "eval_cer": 0.920247655632132, "eval_loss": 0.06776795536279678, "eval_runtime": 120.3481, "eval_samples_per_second": 16.618, "eval_steps_per_second": 4.155, "step": 15000 }, { "epoch": 0.1, "learning_rate": 0.0002854682871102448, "loss": 0.0853, "step": 15010 }, { "epoch": 0.1, "learning_rate": 0.0002854586057558878, "loss": 0.0897, "step": 15020 }, { "epoch": 0.1, "learning_rate": 0.0002854489244015309, "loss": 0.0973, "step": 15030 }, { "epoch": 0.1, "learning_rate": 0.000285439243047174, "loss": 0.1026, "step": 15040 }, { "epoch": 0.1, "learning_rate": 0.00028542956169281706, "loss": 0.1108, "step": 15050 }, { "epoch": 0.1, "learning_rate": 0.00028541988033846014, "loss": 0.1114, "step": 15060 }, { "epoch": 0.1, "learning_rate": 0.00028541019898410317, "loss": 0.1023, "step": 15070 }, { "epoch": 0.1, "learning_rate": 0.00028540051762974625, "loss": 0.0959, "step": 15080 }, { "epoch": 0.1, "learning_rate": 0.00028539083627538933, "loss": 0.0984, "step": 15090 }, { "epoch": 0.1, "learning_rate": 0.0002853811549210324, "loss": 0.0919, "step": 15100 }, { "epoch": 0.1, "learning_rate": 0.0002853714735666755, "loss": 0.1085, "step": 15110 }, { "epoch": 0.1, "learning_rate": 0.00028536179221231857, "loss": 0.1042, "step": 15120 }, { "epoch": 0.1, "learning_rate": 0.0002853521108579616, "loss": 0.1105, "step": 15130 }, { "epoch": 0.1, "learning_rate": 0.00028534242950360467, "loss": 0.0926, "step": 15140 }, { "epoch": 0.1, "learning_rate": 0.00028533274814924775, "loss": 0.0997, "step": 15150 }, { "epoch": 0.1, "learning_rate": 0.0002853230667948908, "loss": 0.0958, "step": 15160 }, { "epoch": 0.1, "learning_rate": 0.00028531338544053386, "loss": 0.101, "step": 15170 }, { "epoch": 0.1, "learning_rate": 0.00028530370408617694, "loss": 0.1052, "step": 15180 }, { "epoch": 0.1, "learning_rate": 0.00028529402273182, "loss": 0.0912, "step": 15190 }, { "epoch": 0.1, "learning_rate": 0.0002852843413774631, "loss": 0.1009, "step": 15200 }, { "epoch": 0.1, "learning_rate": 0.0002852746600231061, "loss": 0.0997, "step": 15210 }, { "epoch": 0.1, "learning_rate": 0.0002852649786687492, "loss": 0.0946, "step": 15220 }, { "epoch": 0.1, "learning_rate": 0.0002852552973143923, "loss": 0.0972, "step": 15230 }, { "epoch": 0.1, "learning_rate": 0.00028524561596003536, "loss": 0.1068, "step": 15240 }, { "epoch": 0.1, "learning_rate": 0.00028523593460567844, "loss": 0.1036, "step": 15250 }, { "epoch": 0.1, "learning_rate": 0.00028522625325132147, "loss": 0.0936, "step": 15260 }, { "epoch": 0.1, "learning_rate": 0.00028521657189696455, "loss": 0.0935, "step": 15270 }, { "epoch": 0.1, "learning_rate": 0.0002852068905426076, "loss": 0.0956, "step": 15280 }, { "epoch": 0.1, "learning_rate": 0.00028519720918825065, "loss": 0.1018, "step": 15290 }, { "epoch": 0.1, "learning_rate": 0.00028518752783389373, "loss": 0.0972, "step": 15300 }, { "epoch": 0.1, "learning_rate": 0.0002851778464795368, "loss": 0.1001, "step": 15310 }, { "epoch": 0.1, "learning_rate": 0.0002851681651251799, "loss": 0.0963, "step": 15320 }, { "epoch": 0.1, "learning_rate": 0.00028515848377082297, "loss": 0.1074, "step": 15330 }, { "epoch": 0.1, "learning_rate": 0.00028514880241646605, "loss": 0.0972, "step": 15340 }, { "epoch": 0.1, "learning_rate": 0.0002851391210621091, "loss": 0.0921, "step": 15350 }, { "epoch": 0.1, "learning_rate": 0.00028512943970775216, "loss": 0.0981, "step": 15360 }, { "epoch": 0.1, "learning_rate": 0.00028511975835339524, "loss": 0.103, "step": 15370 }, { "epoch": 0.1, "learning_rate": 0.0002851100769990383, "loss": 0.0917, "step": 15380 }, { "epoch": 0.1, "learning_rate": 0.00028510039564468134, "loss": 0.0997, "step": 15390 }, { "epoch": 0.1, "learning_rate": 0.0002850907142903244, "loss": 0.0978, "step": 15400 }, { "epoch": 0.1, "learning_rate": 0.0002850810329359675, "loss": 0.1009, "step": 15410 }, { "epoch": 0.1, "learning_rate": 0.0002850713515816105, "loss": 0.0993, "step": 15420 }, { "epoch": 0.1, "learning_rate": 0.0002850616702272536, "loss": 0.1005, "step": 15430 }, { "epoch": 0.1, "learning_rate": 0.0002850519888728967, "loss": 0.0921, "step": 15440 }, { "epoch": 0.1, "learning_rate": 0.00028504230751853977, "loss": 0.0853, "step": 15450 }, { "epoch": 0.1, "learning_rate": 0.00028503262616418285, "loss": 0.1108, "step": 15460 }, { "epoch": 0.1, "learning_rate": 0.0002850229448098259, "loss": 0.1126, "step": 15470 }, { "epoch": 0.1, "learning_rate": 0.000285013263455469, "loss": 0.1089, "step": 15480 }, { "epoch": 0.1, "learning_rate": 0.00028500358210111203, "loss": 0.099, "step": 15490 }, { "epoch": 0.1, "learning_rate": 0.0002849939007467551, "loss": 0.0974, "step": 15500 }, { "epoch": 0.1, "learning_rate": 0.0002849842193923982, "loss": 0.0993, "step": 15510 }, { "epoch": 0.1, "learning_rate": 0.00028497453803804127, "loss": 0.0981, "step": 15520 }, { "epoch": 0.1, "learning_rate": 0.0002849648566836843, "loss": 0.0908, "step": 15530 }, { "epoch": 0.1, "learning_rate": 0.0002849551753293274, "loss": 0.1029, "step": 15540 }, { "epoch": 0.1, "learning_rate": 0.00028494549397497046, "loss": 0.0925, "step": 15550 }, { "epoch": 0.1, "learning_rate": 0.0002849358126206135, "loss": 0.1004, "step": 15560 }, { "epoch": 0.1, "learning_rate": 0.00028492613126625656, "loss": 0.0998, "step": 15570 }, { "epoch": 0.1, "learning_rate": 0.00028491644991189964, "loss": 0.1028, "step": 15580 }, { "epoch": 0.1, "learning_rate": 0.0002849067685575427, "loss": 0.0997, "step": 15590 }, { "epoch": 0.1, "learning_rate": 0.0002848970872031858, "loss": 0.0942, "step": 15600 }, { "epoch": 0.1, "learning_rate": 0.0002848874058488289, "loss": 0.0996, "step": 15610 }, { "epoch": 0.1, "learning_rate": 0.00028487772449447196, "loss": 0.0999, "step": 15620 }, { "epoch": 0.1, "learning_rate": 0.000284868043140115, "loss": 0.09, "step": 15630 }, { "epoch": 0.1, "learning_rate": 0.00028485836178575807, "loss": 0.0962, "step": 15640 }, { "epoch": 0.1, "learning_rate": 0.00028484868043140115, "loss": 0.0972, "step": 15650 }, { "epoch": 0.1, "learning_rate": 0.00028483899907704417, "loss": 0.0863, "step": 15660 }, { "epoch": 0.1, "learning_rate": 0.00028482931772268725, "loss": 0.0994, "step": 15670 }, { "epoch": 0.1, "learning_rate": 0.00028481963636833033, "loss": 0.101, "step": 15680 }, { "epoch": 0.1, "learning_rate": 0.0002848099550139734, "loss": 0.0956, "step": 15690 }, { "epoch": 0.1, "learning_rate": 0.00028480027365961644, "loss": 0.0891, "step": 15700 }, { "epoch": 0.1, "learning_rate": 0.0002847905923052595, "loss": 0.0925, "step": 15710 }, { "epoch": 0.1, "learning_rate": 0.0002847809109509026, "loss": 0.0992, "step": 15720 }, { "epoch": 0.1, "learning_rate": 0.0002847712295965457, "loss": 0.0942, "step": 15730 }, { "epoch": 0.1, "learning_rate": 0.00028476154824218875, "loss": 0.1007, "step": 15740 }, { "epoch": 0.1, "learning_rate": 0.00028475186688783183, "loss": 0.0996, "step": 15750 }, { "epoch": 0.1, "learning_rate": 0.00028474218553347486, "loss": 0.1, "step": 15760 }, { "epoch": 0.1, "learning_rate": 0.00028473250417911794, "loss": 0.1066, "step": 15770 }, { "epoch": 0.1, "learning_rate": 0.000284722822824761, "loss": 0.107, "step": 15780 }, { "epoch": 0.1, "learning_rate": 0.00028471314147040405, "loss": 0.0939, "step": 15790 }, { "epoch": 0.1, "learning_rate": 0.0002847034601160471, "loss": 0.1056, "step": 15800 }, { "epoch": 0.1, "learning_rate": 0.0002846937787616902, "loss": 0.099, "step": 15810 }, { "epoch": 0.1, "learning_rate": 0.0002846840974073333, "loss": 0.0986, "step": 15820 }, { "epoch": 0.1, "learning_rate": 0.00028467441605297636, "loss": 0.1002, "step": 15830 }, { "epoch": 0.1, "learning_rate": 0.0002846647346986194, "loss": 0.106, "step": 15840 }, { "epoch": 0.1, "learning_rate": 0.00028465505334426247, "loss": 0.1035, "step": 15850 }, { "epoch": 0.1, "learning_rate": 0.00028464537198990555, "loss": 0.1059, "step": 15860 }, { "epoch": 0.1, "learning_rate": 0.00028463569063554863, "loss": 0.0931, "step": 15870 }, { "epoch": 0.1, "learning_rate": 0.0002846260092811917, "loss": 0.0956, "step": 15880 }, { "epoch": 0.1, "learning_rate": 0.0002846163279268348, "loss": 0.1004, "step": 15890 }, { "epoch": 0.1, "learning_rate": 0.0002846066465724778, "loss": 0.0895, "step": 15900 }, { "epoch": 0.1, "learning_rate": 0.0002845969652181209, "loss": 0.0894, "step": 15910 }, { "epoch": 0.1, "learning_rate": 0.000284587283863764, "loss": 0.0906, "step": 15920 }, { "epoch": 0.1, "learning_rate": 0.000284577602509407, "loss": 0.0971, "step": 15930 }, { "epoch": 0.1, "learning_rate": 0.0002845679211550501, "loss": 0.0994, "step": 15940 }, { "epoch": 0.1, "learning_rate": 0.00028455823980069316, "loss": 0.0999, "step": 15950 }, { "epoch": 0.1, "learning_rate": 0.00028454855844633624, "loss": 0.1041, "step": 15960 }, { "epoch": 0.1, "learning_rate": 0.0002845388770919793, "loss": 0.1059, "step": 15970 }, { "epoch": 0.1, "learning_rate": 0.00028452919573762234, "loss": 0.106, "step": 15980 }, { "epoch": 0.1, "learning_rate": 0.0002845195143832654, "loss": 0.0953, "step": 15990 }, { "epoch": 0.1, "learning_rate": 0.0002845098330289085, "loss": 0.0976, "step": 16000 }, { "epoch": 0.1, "eval_cer": 0.9202431363687719, "eval_loss": 0.06717900186777115, "eval_runtime": 120.6812, "eval_samples_per_second": 16.573, "eval_steps_per_second": 4.143, "step": 16000 }, { "epoch": 0.1, "learning_rate": 0.0002845001516745516, "loss": 0.0971, "step": 16010 }, { "epoch": 0.1, "learning_rate": 0.00028449047032019466, "loss": 0.1026, "step": 16020 }, { "epoch": 0.1, "learning_rate": 0.0002844807889658377, "loss": 0.0891, "step": 16030 }, { "epoch": 0.1, "learning_rate": 0.00028447110761148077, "loss": 0.1018, "step": 16040 }, { "epoch": 0.1, "learning_rate": 0.00028446142625712385, "loss": 0.1035, "step": 16050 }, { "epoch": 0.1, "learning_rate": 0.0002844517449027669, "loss": 0.1053, "step": 16060 }, { "epoch": 0.1, "learning_rate": 0.00028444206354840995, "loss": 0.0942, "step": 16070 }, { "epoch": 0.1, "learning_rate": 0.00028443238219405303, "loss": 0.0926, "step": 16080 }, { "epoch": 0.1, "learning_rate": 0.0002844227008396961, "loss": 0.1007, "step": 16090 }, { "epoch": 0.1, "learning_rate": 0.0002844130194853392, "loss": 0.102, "step": 16100 }, { "epoch": 0.1, "learning_rate": 0.0002844033381309823, "loss": 0.0927, "step": 16110 }, { "epoch": 0.1, "learning_rate": 0.0002843936567766253, "loss": 0.0997, "step": 16120 }, { "epoch": 0.1, "learning_rate": 0.0002843839754222684, "loss": 0.0954, "step": 16130 }, { "epoch": 0.1, "learning_rate": 0.00028437429406791146, "loss": 0.1012, "step": 16140 }, { "epoch": 0.1, "learning_rate": 0.00028436461271355454, "loss": 0.0955, "step": 16150 }, { "epoch": 0.1, "learning_rate": 0.00028435493135919756, "loss": 0.1029, "step": 16160 }, { "epoch": 0.1, "learning_rate": 0.00028434525000484064, "loss": 0.0899, "step": 16170 }, { "epoch": 0.1, "learning_rate": 0.0002843355686504837, "loss": 0.1038, "step": 16180 }, { "epoch": 0.1, "learning_rate": 0.00028432588729612675, "loss": 0.0971, "step": 16190 }, { "epoch": 0.1, "learning_rate": 0.00028431620594176983, "loss": 0.111, "step": 16200 }, { "epoch": 0.1, "learning_rate": 0.0002843065245874129, "loss": 0.0914, "step": 16210 }, { "epoch": 0.1, "learning_rate": 0.000284296843233056, "loss": 0.0933, "step": 16220 }, { "epoch": 0.1, "learning_rate": 0.00028428716187869907, "loss": 0.0908, "step": 16230 }, { "epoch": 0.1, "learning_rate": 0.00028427748052434215, "loss": 0.0858, "step": 16240 }, { "epoch": 0.1, "learning_rate": 0.00028426779916998523, "loss": 0.0952, "step": 16250 }, { "epoch": 0.1, "learning_rate": 0.00028425811781562825, "loss": 0.089, "step": 16260 }, { "epoch": 0.11, "learning_rate": 0.00028424843646127133, "loss": 0.0954, "step": 16270 }, { "epoch": 0.11, "learning_rate": 0.0002842387551069144, "loss": 0.0928, "step": 16280 }, { "epoch": 0.11, "learning_rate": 0.0002842290737525575, "loss": 0.0905, "step": 16290 }, { "epoch": 0.11, "learning_rate": 0.0002842193923982005, "loss": 0.1, "step": 16300 }, { "epoch": 0.11, "learning_rate": 0.0002842097110438436, "loss": 0.0976, "step": 16310 }, { "epoch": 0.11, "learning_rate": 0.0002842000296894867, "loss": 0.0956, "step": 16320 }, { "epoch": 0.11, "learning_rate": 0.0002841903483351297, "loss": 0.1034, "step": 16330 }, { "epoch": 0.11, "learning_rate": 0.0002841806669807728, "loss": 0.0926, "step": 16340 }, { "epoch": 0.11, "learning_rate": 0.00028417098562641586, "loss": 0.102, "step": 16350 }, { "epoch": 0.11, "learning_rate": 0.00028416130427205894, "loss": 0.0967, "step": 16360 }, { "epoch": 0.11, "learning_rate": 0.000284151622917702, "loss": 0.0974, "step": 16370 }, { "epoch": 0.11, "learning_rate": 0.0002841419415633451, "loss": 0.0878, "step": 16380 }, { "epoch": 0.11, "learning_rate": 0.0002841322602089882, "loss": 0.0982, "step": 16390 }, { "epoch": 0.11, "learning_rate": 0.0002841225788546312, "loss": 0.0962, "step": 16400 }, { "epoch": 0.11, "learning_rate": 0.0002841128975002743, "loss": 0.0977, "step": 16410 }, { "epoch": 0.11, "learning_rate": 0.00028410321614591737, "loss": 0.0946, "step": 16420 }, { "epoch": 0.11, "learning_rate": 0.0002840935347915604, "loss": 0.1005, "step": 16430 }, { "epoch": 0.11, "learning_rate": 0.0002840838534372035, "loss": 0.0946, "step": 16440 }, { "epoch": 0.11, "learning_rate": 0.00028407417208284655, "loss": 0.1006, "step": 16450 }, { "epoch": 0.11, "learning_rate": 0.00028406449072848963, "loss": 0.1001, "step": 16460 }, { "epoch": 0.11, "learning_rate": 0.00028405480937413266, "loss": 0.099, "step": 16470 }, { "epoch": 0.11, "learning_rate": 0.00028404512801977574, "loss": 0.094, "step": 16480 }, { "epoch": 0.11, "learning_rate": 0.0002840354466654188, "loss": 0.0894, "step": 16490 }, { "epoch": 0.11, "learning_rate": 0.0002840257653110619, "loss": 0.0975, "step": 16500 }, { "epoch": 0.11, "learning_rate": 0.000284016083956705, "loss": 0.0951, "step": 16510 }, { "epoch": 0.11, "learning_rate": 0.00028400640260234806, "loss": 0.0971, "step": 16520 }, { "epoch": 0.11, "learning_rate": 0.00028399672124799114, "loss": 0.0979, "step": 16530 }, { "epoch": 0.11, "learning_rate": 0.00028398703989363416, "loss": 0.0917, "step": 16540 }, { "epoch": 0.11, "learning_rate": 0.00028397735853927724, "loss": 0.0933, "step": 16550 }, { "epoch": 0.11, "learning_rate": 0.00028396767718492027, "loss": 0.0916, "step": 16560 }, { "epoch": 0.11, "learning_rate": 0.00028395799583056335, "loss": 0.0933, "step": 16570 }, { "epoch": 0.11, "learning_rate": 0.00028394831447620643, "loss": 0.1018, "step": 16580 }, { "epoch": 0.11, "learning_rate": 0.0002839386331218495, "loss": 0.0857, "step": 16590 }, { "epoch": 0.11, "learning_rate": 0.0002839289517674926, "loss": 0.0895, "step": 16600 }, { "epoch": 0.11, "learning_rate": 0.0002839192704131356, "loss": 0.0986, "step": 16610 }, { "epoch": 0.11, "learning_rate": 0.0002839095890587787, "loss": 0.0917, "step": 16620 }, { "epoch": 0.11, "learning_rate": 0.00028389990770442177, "loss": 0.0929, "step": 16630 }, { "epoch": 0.11, "learning_rate": 0.00028389022635006485, "loss": 0.0973, "step": 16640 }, { "epoch": 0.11, "learning_rate": 0.00028388054499570793, "loss": 0.0982, "step": 16650 }, { "epoch": 0.11, "learning_rate": 0.000283870863641351, "loss": 0.1178, "step": 16660 }, { "epoch": 0.11, "learning_rate": 0.00028386118228699404, "loss": 0.094, "step": 16670 }, { "epoch": 0.11, "learning_rate": 0.0002838515009326371, "loss": 0.0945, "step": 16680 }, { "epoch": 0.11, "learning_rate": 0.0002838418195782802, "loss": 0.1011, "step": 16690 }, { "epoch": 0.11, "learning_rate": 0.0002838321382239232, "loss": 0.1004, "step": 16700 }, { "epoch": 0.11, "learning_rate": 0.0002838224568695663, "loss": 0.0913, "step": 16710 }, { "epoch": 0.11, "learning_rate": 0.0002838127755152094, "loss": 0.1008, "step": 16720 }, { "epoch": 0.11, "learning_rate": 0.00028380309416085246, "loss": 0.1036, "step": 16730 }, { "epoch": 0.11, "learning_rate": 0.00028379341280649554, "loss": 0.0951, "step": 16740 }, { "epoch": 0.11, "learning_rate": 0.00028378373145213857, "loss": 0.1009, "step": 16750 }, { "epoch": 0.11, "learning_rate": 0.00028377405009778165, "loss": 0.0869, "step": 16760 }, { "epoch": 0.11, "learning_rate": 0.0002837643687434247, "loss": 0.0986, "step": 16770 }, { "epoch": 0.11, "learning_rate": 0.0002837546873890678, "loss": 0.0959, "step": 16780 }, { "epoch": 0.11, "learning_rate": 0.0002837450060347109, "loss": 0.0997, "step": 16790 }, { "epoch": 0.11, "learning_rate": 0.0002837353246803539, "loss": 0.0886, "step": 16800 }, { "epoch": 0.11, "learning_rate": 0.000283725643325997, "loss": 0.0863, "step": 16810 }, { "epoch": 0.11, "learning_rate": 0.00028371596197164007, "loss": 0.095, "step": 16820 }, { "epoch": 0.11, "learning_rate": 0.0002837062806172831, "loss": 0.085, "step": 16830 }, { "epoch": 0.11, "learning_rate": 0.0002836965992629262, "loss": 0.0993, "step": 16840 }, { "epoch": 0.11, "learning_rate": 0.00028368691790856926, "loss": 0.0941, "step": 16850 }, { "epoch": 0.11, "learning_rate": 0.00028367723655421234, "loss": 0.0962, "step": 16860 }, { "epoch": 0.11, "learning_rate": 0.0002836675551998554, "loss": 0.099, "step": 16870 }, { "epoch": 0.11, "learning_rate": 0.0002836578738454985, "loss": 0.0865, "step": 16880 }, { "epoch": 0.11, "learning_rate": 0.0002836481924911415, "loss": 0.0984, "step": 16890 }, { "epoch": 0.11, "learning_rate": 0.0002836385111367846, "loss": 0.0927, "step": 16900 }, { "epoch": 0.11, "learning_rate": 0.0002836288297824277, "loss": 0.0898, "step": 16910 }, { "epoch": 0.11, "learning_rate": 0.00028361914842807076, "loss": 0.091, "step": 16920 }, { "epoch": 0.11, "learning_rate": 0.00028360946707371384, "loss": 0.0903, "step": 16930 }, { "epoch": 0.11, "learning_rate": 0.00028359978571935687, "loss": 0.0881, "step": 16940 }, { "epoch": 0.11, "learning_rate": 0.00028359010436499995, "loss": 0.0926, "step": 16950 }, { "epoch": 0.11, "learning_rate": 0.00028358042301064297, "loss": 0.0982, "step": 16960 }, { "epoch": 0.11, "learning_rate": 0.00028357074165628605, "loss": 0.0906, "step": 16970 }, { "epoch": 0.11, "learning_rate": 0.00028356106030192913, "loss": 0.0915, "step": 16980 }, { "epoch": 0.11, "learning_rate": 0.0002835513789475722, "loss": 0.0924, "step": 16990 }, { "epoch": 0.11, "learning_rate": 0.0002835416975932153, "loss": 0.0949, "step": 17000 }, { "epoch": 0.11, "eval_cer": 0.9201943283244831, "eval_loss": 0.06401708722114563, "eval_runtime": 120.4041, "eval_samples_per_second": 16.611, "eval_steps_per_second": 4.153, "step": 17000 }, { "epoch": 0.11, "learning_rate": 0.00028353201623885837, "loss": 0.1014, "step": 17010 }, { "epoch": 0.11, "learning_rate": 0.00028352233488450145, "loss": 0.0924, "step": 17020 }, { "epoch": 0.11, "learning_rate": 0.0002835126535301445, "loss": 0.0964, "step": 17030 }, { "epoch": 0.11, "learning_rate": 0.00028350297217578756, "loss": 0.0907, "step": 17040 }, { "epoch": 0.11, "learning_rate": 0.00028349329082143064, "loss": 0.1097, "step": 17050 }, { "epoch": 0.11, "learning_rate": 0.0002834836094670737, "loss": 0.0916, "step": 17060 }, { "epoch": 0.11, "learning_rate": 0.00028347392811271674, "loss": 0.0922, "step": 17070 }, { "epoch": 0.11, "learning_rate": 0.0002834642467583598, "loss": 0.0875, "step": 17080 }, { "epoch": 0.11, "learning_rate": 0.0002834545654040029, "loss": 0.0863, "step": 17090 }, { "epoch": 0.11, "learning_rate": 0.0002834448840496459, "loss": 0.1121, "step": 17100 }, { "epoch": 0.11, "learning_rate": 0.000283435202695289, "loss": 0.0921, "step": 17110 }, { "epoch": 0.11, "learning_rate": 0.0002834255213409321, "loss": 0.0899, "step": 17120 }, { "epoch": 0.11, "learning_rate": 0.00028341583998657517, "loss": 0.0917, "step": 17130 }, { "epoch": 0.11, "learning_rate": 0.00028340615863221825, "loss": 0.092, "step": 17140 }, { "epoch": 0.11, "learning_rate": 0.0002833964772778613, "loss": 0.0889, "step": 17150 }, { "epoch": 0.11, "learning_rate": 0.0002833867959235044, "loss": 0.0928, "step": 17160 }, { "epoch": 0.11, "learning_rate": 0.00028337711456914743, "loss": 0.0906, "step": 17170 }, { "epoch": 0.11, "learning_rate": 0.0002833674332147905, "loss": 0.0987, "step": 17180 }, { "epoch": 0.11, "learning_rate": 0.0002833577518604336, "loss": 0.0935, "step": 17190 }, { "epoch": 0.11, "learning_rate": 0.0002833480705060766, "loss": 0.1067, "step": 17200 }, { "epoch": 0.11, "learning_rate": 0.0002833383891517197, "loss": 0.0941, "step": 17210 }, { "epoch": 0.11, "learning_rate": 0.0002833287077973628, "loss": 0.0891, "step": 17220 }, { "epoch": 0.11, "learning_rate": 0.0002833190264430058, "loss": 0.0937, "step": 17230 }, { "epoch": 0.11, "learning_rate": 0.0002833093450886489, "loss": 0.1014, "step": 17240 }, { "epoch": 0.11, "learning_rate": 0.00028329966373429196, "loss": 0.0965, "step": 17250 }, { "epoch": 0.11, "learning_rate": 0.00028328998237993504, "loss": 0.0962, "step": 17260 }, { "epoch": 0.11, "learning_rate": 0.0002832803010255781, "loss": 0.1005, "step": 17270 }, { "epoch": 0.11, "learning_rate": 0.0002832706196712212, "loss": 0.0978, "step": 17280 }, { "epoch": 0.11, "learning_rate": 0.0002832609383168643, "loss": 0.099, "step": 17290 }, { "epoch": 0.11, "learning_rate": 0.0002832512569625073, "loss": 0.0997, "step": 17300 }, { "epoch": 0.11, "learning_rate": 0.0002832415756081504, "loss": 0.0924, "step": 17310 }, { "epoch": 0.11, "learning_rate": 0.00028323189425379346, "loss": 0.0928, "step": 17320 }, { "epoch": 0.11, "learning_rate": 0.00028322221289943654, "loss": 0.0959, "step": 17330 }, { "epoch": 0.11, "learning_rate": 0.00028321253154507957, "loss": 0.0911, "step": 17340 }, { "epoch": 0.11, "learning_rate": 0.00028320285019072265, "loss": 0.1007, "step": 17350 }, { "epoch": 0.11, "learning_rate": 0.00028319316883636573, "loss": 0.0861, "step": 17360 }, { "epoch": 0.11, "learning_rate": 0.00028318348748200876, "loss": 0.0894, "step": 17370 }, { "epoch": 0.11, "learning_rate": 0.00028317380612765183, "loss": 0.0874, "step": 17380 }, { "epoch": 0.11, "learning_rate": 0.0002831641247732949, "loss": 0.1041, "step": 17390 }, { "epoch": 0.11, "learning_rate": 0.000283154443418938, "loss": 0.0932, "step": 17400 }, { "epoch": 0.11, "learning_rate": 0.0002831447620645811, "loss": 0.0876, "step": 17410 }, { "epoch": 0.11, "learning_rate": 0.00028313508071022415, "loss": 0.0971, "step": 17420 }, { "epoch": 0.11, "learning_rate": 0.00028312539935586723, "loss": 0.0878, "step": 17430 }, { "epoch": 0.11, "learning_rate": 0.00028311571800151026, "loss": 0.0911, "step": 17440 }, { "epoch": 0.11, "learning_rate": 0.00028310603664715334, "loss": 0.0871, "step": 17450 }, { "epoch": 0.11, "learning_rate": 0.0002830963552927964, "loss": 0.0888, "step": 17460 }, { "epoch": 0.11, "learning_rate": 0.00028308667393843944, "loss": 0.0856, "step": 17470 }, { "epoch": 0.11, "learning_rate": 0.0002830769925840825, "loss": 0.0913, "step": 17480 }, { "epoch": 0.11, "learning_rate": 0.0002830673112297256, "loss": 0.0973, "step": 17490 }, { "epoch": 0.11, "learning_rate": 0.0002830576298753687, "loss": 0.0857, "step": 17500 }, { "epoch": 0.11, "learning_rate": 0.0002830479485210117, "loss": 0.1043, "step": 17510 }, { "epoch": 0.11, "learning_rate": 0.0002830382671666548, "loss": 0.0951, "step": 17520 }, { "epoch": 0.11, "learning_rate": 0.00028302858581229787, "loss": 0.1021, "step": 17530 }, { "epoch": 0.11, "learning_rate": 0.00028301890445794095, "loss": 0.0907, "step": 17540 }, { "epoch": 0.11, "learning_rate": 0.00028300922310358403, "loss": 0.0894, "step": 17550 }, { "epoch": 0.11, "learning_rate": 0.0002829995417492271, "loss": 0.1018, "step": 17560 }, { "epoch": 0.11, "learning_rate": 0.00028298986039487013, "loss": 0.0914, "step": 17570 }, { "epoch": 0.11, "learning_rate": 0.0002829801790405132, "loss": 0.0827, "step": 17580 }, { "epoch": 0.11, "learning_rate": 0.0002829704976861563, "loss": 0.1096, "step": 17590 }, { "epoch": 0.11, "learning_rate": 0.0002829608163317993, "loss": 0.1036, "step": 17600 }, { "epoch": 0.11, "learning_rate": 0.0002829511349774424, "loss": 0.1066, "step": 17610 }, { "epoch": 0.11, "learning_rate": 0.0002829414536230855, "loss": 0.0907, "step": 17620 }, { "epoch": 0.11, "learning_rate": 0.00028293177226872856, "loss": 0.0906, "step": 17630 }, { "epoch": 0.11, "learning_rate": 0.00028292209091437164, "loss": 0.0943, "step": 17640 }, { "epoch": 0.11, "learning_rate": 0.00028291240956001466, "loss": 0.0983, "step": 17650 }, { "epoch": 0.11, "learning_rate": 0.00028290272820565774, "loss": 0.1, "step": 17660 }, { "epoch": 0.11, "learning_rate": 0.0002828930468513008, "loss": 0.0911, "step": 17670 }, { "epoch": 0.11, "learning_rate": 0.0002828833654969439, "loss": 0.0865, "step": 17680 }, { "epoch": 0.11, "learning_rate": 0.000282873684142587, "loss": 0.0978, "step": 17690 }, { "epoch": 0.11, "learning_rate": 0.00028286400278823006, "loss": 0.0998, "step": 17700 }, { "epoch": 0.11, "learning_rate": 0.0002828543214338731, "loss": 0.0952, "step": 17710 }, { "epoch": 0.11, "learning_rate": 0.00028284464007951617, "loss": 0.0994, "step": 17720 }, { "epoch": 0.11, "learning_rate": 0.00028283495872515925, "loss": 0.0895, "step": 17730 }, { "epoch": 0.11, "learning_rate": 0.0002828252773708023, "loss": 0.0916, "step": 17740 }, { "epoch": 0.11, "learning_rate": 0.00028281559601644535, "loss": 0.0995, "step": 17750 }, { "epoch": 0.11, "learning_rate": 0.00028280591466208843, "loss": 0.0827, "step": 17760 }, { "epoch": 0.11, "learning_rate": 0.0002827962333077315, "loss": 0.0811, "step": 17770 }, { "epoch": 0.11, "learning_rate": 0.0002827865519533746, "loss": 0.0821, "step": 17780 }, { "epoch": 0.11, "learning_rate": 0.0002827768705990176, "loss": 0.0881, "step": 17790 }, { "epoch": 0.11, "learning_rate": 0.0002827671892446607, "loss": 0.0891, "step": 17800 }, { "epoch": 0.11, "learning_rate": 0.0002827575078903038, "loss": 0.0851, "step": 17810 }, { "epoch": 0.12, "learning_rate": 0.00028274782653594686, "loss": 0.0837, "step": 17820 }, { "epoch": 0.12, "learning_rate": 0.00028273814518158994, "loss": 0.0888, "step": 17830 }, { "epoch": 0.12, "learning_rate": 0.00028272846382723296, "loss": 0.0865, "step": 17840 }, { "epoch": 0.12, "learning_rate": 0.00028271878247287604, "loss": 0.0865, "step": 17850 }, { "epoch": 0.12, "learning_rate": 0.0002827091011185191, "loss": 0.0948, "step": 17860 }, { "epoch": 0.12, "learning_rate": 0.00028269941976416215, "loss": 0.0955, "step": 17870 }, { "epoch": 0.12, "learning_rate": 0.00028268973840980523, "loss": 0.0923, "step": 17880 }, { "epoch": 0.12, "learning_rate": 0.0002826800570554483, "loss": 0.0914, "step": 17890 }, { "epoch": 0.12, "learning_rate": 0.0002826703757010914, "loss": 0.095, "step": 17900 }, { "epoch": 0.12, "learning_rate": 0.00028266069434673447, "loss": 0.0963, "step": 17910 }, { "epoch": 0.12, "learning_rate": 0.00028265101299237755, "loss": 0.0986, "step": 17920 }, { "epoch": 0.12, "learning_rate": 0.0002826413316380206, "loss": 0.105, "step": 17930 }, { "epoch": 0.12, "learning_rate": 0.00028263165028366365, "loss": 0.0948, "step": 17940 }, { "epoch": 0.12, "learning_rate": 0.00028262196892930673, "loss": 0.1032, "step": 17950 }, { "epoch": 0.12, "learning_rate": 0.0002826122875749498, "loss": 0.0888, "step": 17960 }, { "epoch": 0.12, "learning_rate": 0.00028260260622059284, "loss": 0.1002, "step": 17970 }, { "epoch": 0.12, "learning_rate": 0.0002825929248662359, "loss": 0.0967, "step": 17980 }, { "epoch": 0.12, "learning_rate": 0.000282583243511879, "loss": 0.0935, "step": 17990 }, { "epoch": 0.12, "learning_rate": 0.000282573562157522, "loss": 0.1026, "step": 18000 }, { "epoch": 0.12, "eval_cer": 0.9202557903061801, "eval_loss": 0.06353824585676193, "eval_runtime": 120.4302, "eval_samples_per_second": 16.607, "eval_steps_per_second": 4.152, "step": 18000 }, { "epoch": 0.12, "learning_rate": 0.0002825638808031651, "loss": 0.092, "step": 18010 }, { "epoch": 0.12, "learning_rate": 0.0002825541994488082, "loss": 0.0913, "step": 18020 }, { "epoch": 0.12, "learning_rate": 0.00028254451809445126, "loss": 0.097, "step": 18030 }, { "epoch": 0.12, "learning_rate": 0.00028253483674009434, "loss": 0.1017, "step": 18040 }, { "epoch": 0.12, "learning_rate": 0.0002825251553857374, "loss": 0.1009, "step": 18050 }, { "epoch": 0.12, "learning_rate": 0.0002825154740313805, "loss": 0.0962, "step": 18060 }, { "epoch": 0.12, "learning_rate": 0.00028250579267702353, "loss": 0.0942, "step": 18070 }, { "epoch": 0.12, "learning_rate": 0.0002824961113226666, "loss": 0.0949, "step": 18080 }, { "epoch": 0.12, "learning_rate": 0.0002824864299683097, "loss": 0.1029, "step": 18090 }, { "epoch": 0.12, "learning_rate": 0.00028247674861395277, "loss": 0.1035, "step": 18100 }, { "epoch": 0.12, "learning_rate": 0.0002824670672595958, "loss": 0.0965, "step": 18110 }, { "epoch": 0.12, "learning_rate": 0.00028245738590523887, "loss": 0.0962, "step": 18120 }, { "epoch": 0.12, "learning_rate": 0.00028244770455088195, "loss": 0.088, "step": 18130 }, { "epoch": 0.12, "learning_rate": 0.000282438023196525, "loss": 0.0988, "step": 18140 }, { "epoch": 0.12, "learning_rate": 0.00028242834184216806, "loss": 0.0946, "step": 18150 }, { "epoch": 0.12, "learning_rate": 0.00028241866048781114, "loss": 0.0929, "step": 18160 }, { "epoch": 0.12, "learning_rate": 0.0002824089791334542, "loss": 0.09, "step": 18170 }, { "epoch": 0.12, "learning_rate": 0.0002823992977790973, "loss": 0.0985, "step": 18180 }, { "epoch": 0.12, "learning_rate": 0.0002823896164247404, "loss": 0.0932, "step": 18190 }, { "epoch": 0.12, "learning_rate": 0.00028237993507038346, "loss": 0.094, "step": 18200 }, { "epoch": 0.12, "learning_rate": 0.0002823702537160265, "loss": 0.098, "step": 18210 }, { "epoch": 0.12, "learning_rate": 0.00028236057236166956, "loss": 0.1014, "step": 18220 }, { "epoch": 0.12, "learning_rate": 0.00028235089100731264, "loss": 0.096, "step": 18230 }, { "epoch": 0.12, "learning_rate": 0.00028234120965295567, "loss": 0.0929, "step": 18240 }, { "epoch": 0.12, "learning_rate": 0.00028233152829859875, "loss": 0.0936, "step": 18250 }, { "epoch": 0.12, "learning_rate": 0.0002823218469442418, "loss": 0.0903, "step": 18260 }, { "epoch": 0.12, "learning_rate": 0.0002823121655898849, "loss": 0.0991, "step": 18270 }, { "epoch": 0.12, "learning_rate": 0.00028230248423552793, "loss": 0.0946, "step": 18280 }, { "epoch": 0.12, "learning_rate": 0.000282292802881171, "loss": 0.0826, "step": 18290 }, { "epoch": 0.12, "learning_rate": 0.0002822831215268141, "loss": 0.0882, "step": 18300 }, { "epoch": 0.12, "learning_rate": 0.00028227344017245717, "loss": 0.0983, "step": 18310 }, { "epoch": 0.12, "learning_rate": 0.00028226375881810025, "loss": 0.0921, "step": 18320 }, { "epoch": 0.12, "learning_rate": 0.00028225407746374333, "loss": 0.0873, "step": 18330 }, { "epoch": 0.12, "learning_rate": 0.0002822443961093864, "loss": 0.0965, "step": 18340 }, { "epoch": 0.12, "learning_rate": 0.00028223471475502944, "loss": 0.0926, "step": 18350 }, { "epoch": 0.12, "learning_rate": 0.0002822250334006725, "loss": 0.0923, "step": 18360 }, { "epoch": 0.12, "learning_rate": 0.00028221535204631554, "loss": 0.0907, "step": 18370 }, { "epoch": 0.12, "learning_rate": 0.0002822056706919586, "loss": 0.0938, "step": 18380 }, { "epoch": 0.12, "learning_rate": 0.0002821959893376017, "loss": 0.0832, "step": 18390 }, { "epoch": 0.12, "learning_rate": 0.0002821863079832448, "loss": 0.09, "step": 18400 }, { "epoch": 0.12, "learning_rate": 0.00028217662662888786, "loss": 0.0877, "step": 18410 }, { "epoch": 0.12, "learning_rate": 0.0002821669452745309, "loss": 0.0963, "step": 18420 }, { "epoch": 0.12, "learning_rate": 0.00028215726392017397, "loss": 0.0967, "step": 18430 }, { "epoch": 0.12, "learning_rate": 0.00028214758256581705, "loss": 0.0871, "step": 18440 }, { "epoch": 0.12, "learning_rate": 0.0002821379012114601, "loss": 0.0901, "step": 18450 }, { "epoch": 0.12, "learning_rate": 0.0002821282198571032, "loss": 0.0924, "step": 18460 }, { "epoch": 0.12, "learning_rate": 0.0002821185385027463, "loss": 0.0951, "step": 18470 }, { "epoch": 0.12, "learning_rate": 0.0002821088571483893, "loss": 0.0811, "step": 18480 }, { "epoch": 0.12, "learning_rate": 0.0002820991757940324, "loss": 0.0957, "step": 18490 }, { "epoch": 0.12, "learning_rate": 0.00028208949443967547, "loss": 0.0866, "step": 18500 }, { "epoch": 0.12, "learning_rate": 0.0002820798130853185, "loss": 0.0875, "step": 18510 }, { "epoch": 0.12, "learning_rate": 0.0002820701317309616, "loss": 0.0944, "step": 18520 }, { "epoch": 0.12, "learning_rate": 0.00028206045037660466, "loss": 0.0905, "step": 18530 }, { "epoch": 0.12, "learning_rate": 0.00028205076902224774, "loss": 0.0974, "step": 18540 }, { "epoch": 0.12, "learning_rate": 0.0002820410876678908, "loss": 0.0958, "step": 18550 }, { "epoch": 0.12, "learning_rate": 0.00028203140631353384, "loss": 0.0816, "step": 18560 }, { "epoch": 0.12, "learning_rate": 0.0002820217249591769, "loss": 0.0899, "step": 18570 }, { "epoch": 0.12, "learning_rate": 0.00028201204360482, "loss": 0.0881, "step": 18580 }, { "epoch": 0.12, "learning_rate": 0.0002820023622504631, "loss": 0.0823, "step": 18590 }, { "epoch": 0.12, "learning_rate": 0.00028199268089610616, "loss": 0.0909, "step": 18600 }, { "epoch": 0.12, "learning_rate": 0.0002819829995417492, "loss": 0.0881, "step": 18610 }, { "epoch": 0.12, "learning_rate": 0.00028197331818739227, "loss": 0.1171, "step": 18620 }, { "epoch": 0.12, "learning_rate": 0.00028196363683303535, "loss": 0.1105, "step": 18630 }, { "epoch": 0.12, "learning_rate": 0.00028195395547867837, "loss": 0.098, "step": 18640 }, { "epoch": 0.12, "learning_rate": 0.00028194427412432145, "loss": 0.099, "step": 18650 }, { "epoch": 0.12, "learning_rate": 0.00028193459276996453, "loss": 0.0884, "step": 18660 }, { "epoch": 0.12, "learning_rate": 0.0002819249114156076, "loss": 0.0907, "step": 18670 }, { "epoch": 0.12, "learning_rate": 0.0002819152300612507, "loss": 0.0944, "step": 18680 }, { "epoch": 0.12, "learning_rate": 0.00028190554870689377, "loss": 0.0934, "step": 18690 }, { "epoch": 0.12, "learning_rate": 0.0002818958673525368, "loss": 0.0949, "step": 18700 }, { "epoch": 0.12, "learning_rate": 0.0002818861859981799, "loss": 0.0893, "step": 18710 }, { "epoch": 0.12, "learning_rate": 0.00028187650464382295, "loss": 0.0894, "step": 18720 }, { "epoch": 0.12, "learning_rate": 0.00028186682328946603, "loss": 0.0959, "step": 18730 }, { "epoch": 0.12, "learning_rate": 0.0002818571419351091, "loss": 0.1003, "step": 18740 }, { "epoch": 0.12, "learning_rate": 0.00028184746058075214, "loss": 0.0946, "step": 18750 }, { "epoch": 0.12, "learning_rate": 0.0002818377792263952, "loss": 0.0904, "step": 18760 }, { "epoch": 0.12, "learning_rate": 0.00028182809787203825, "loss": 0.0956, "step": 18770 }, { "epoch": 0.12, "learning_rate": 0.0002818184165176813, "loss": 0.092, "step": 18780 }, { "epoch": 0.12, "learning_rate": 0.0002818087351633244, "loss": 0.0924, "step": 18790 }, { "epoch": 0.12, "learning_rate": 0.0002817990538089675, "loss": 0.0845, "step": 18800 }, { "epoch": 0.12, "learning_rate": 0.00028178937245461056, "loss": 0.0935, "step": 18810 }, { "epoch": 0.12, "learning_rate": 0.00028177969110025364, "loss": 0.0915, "step": 18820 }, { "epoch": 0.12, "learning_rate": 0.0002817700097458967, "loss": 0.0903, "step": 18830 }, { "epoch": 0.12, "learning_rate": 0.00028176032839153975, "loss": 0.0943, "step": 18840 }, { "epoch": 0.12, "learning_rate": 0.00028175064703718283, "loss": 0.0873, "step": 18850 }, { "epoch": 0.12, "learning_rate": 0.0002817409656828259, "loss": 0.0861, "step": 18860 }, { "epoch": 0.12, "learning_rate": 0.000281731284328469, "loss": 0.0841, "step": 18870 }, { "epoch": 0.12, "learning_rate": 0.000281721602974112, "loss": 0.0964, "step": 18880 }, { "epoch": 0.12, "learning_rate": 0.0002817119216197551, "loss": 0.0873, "step": 18890 }, { "epoch": 0.12, "learning_rate": 0.0002817022402653982, "loss": 0.0849, "step": 18900 }, { "epoch": 0.12, "learning_rate": 0.0002816925589110412, "loss": 0.091, "step": 18910 }, { "epoch": 0.12, "learning_rate": 0.0002816828775566843, "loss": 0.0938, "step": 18920 }, { "epoch": 0.12, "learning_rate": 0.00028167319620232736, "loss": 0.0951, "step": 18930 }, { "epoch": 0.12, "learning_rate": 0.00028166351484797044, "loss": 0.096, "step": 18940 }, { "epoch": 0.12, "learning_rate": 0.0002816538334936135, "loss": 0.0972, "step": 18950 }, { "epoch": 0.12, "learning_rate": 0.0002816441521392566, "loss": 0.0955, "step": 18960 }, { "epoch": 0.12, "learning_rate": 0.0002816344707848997, "loss": 0.0916, "step": 18970 }, { "epoch": 0.12, "learning_rate": 0.0002816247894305427, "loss": 0.1013, "step": 18980 }, { "epoch": 0.12, "learning_rate": 0.0002816151080761858, "loss": 0.0868, "step": 18990 }, { "epoch": 0.12, "learning_rate": 0.00028160542672182886, "loss": 0.1049, "step": 19000 }, { "epoch": 0.12, "eval_cer": 0.9201301547847701, "eval_loss": 0.061801835894584656, "eval_runtime": 120.5064, "eval_samples_per_second": 16.597, "eval_steps_per_second": 4.149, "step": 19000 }, { "epoch": 0.12, "learning_rate": 0.0002815957453674719, "loss": 0.0817, "step": 19010 }, { "epoch": 0.12, "learning_rate": 0.00028158606401311497, "loss": 0.087, "step": 19020 }, { "epoch": 0.12, "learning_rate": 0.00028157638265875805, "loss": 0.0936, "step": 19030 }, { "epoch": 0.12, "learning_rate": 0.00028156670130440113, "loss": 0.0906, "step": 19040 }, { "epoch": 0.12, "learning_rate": 0.00028155701995004415, "loss": 0.0897, "step": 19050 }, { "epoch": 0.12, "learning_rate": 0.00028154733859568723, "loss": 0.0822, "step": 19060 }, { "epoch": 0.12, "learning_rate": 0.0002815376572413303, "loss": 0.0894, "step": 19070 }, { "epoch": 0.12, "learning_rate": 0.0002815279758869734, "loss": 0.0967, "step": 19080 }, { "epoch": 0.12, "learning_rate": 0.0002815182945326165, "loss": 0.0817, "step": 19090 }, { "epoch": 0.12, "learning_rate": 0.00028150861317825955, "loss": 0.0874, "step": 19100 }, { "epoch": 0.12, "learning_rate": 0.00028149893182390263, "loss": 0.0824, "step": 19110 }, { "epoch": 0.12, "learning_rate": 0.00028148925046954566, "loss": 0.0837, "step": 19120 }, { "epoch": 0.12, "learning_rate": 0.00028147956911518874, "loss": 0.0946, "step": 19130 }, { "epoch": 0.12, "learning_rate": 0.0002814698877608318, "loss": 0.0835, "step": 19140 }, { "epoch": 0.12, "learning_rate": 0.00028146020640647484, "loss": 0.0969, "step": 19150 }, { "epoch": 0.12, "learning_rate": 0.0002814505250521179, "loss": 0.0824, "step": 19160 }, { "epoch": 0.12, "learning_rate": 0.000281440843697761, "loss": 0.087, "step": 19170 }, { "epoch": 0.12, "learning_rate": 0.0002814311623434041, "loss": 0.0855, "step": 19180 }, { "epoch": 0.12, "learning_rate": 0.0002814214809890471, "loss": 0.0852, "step": 19190 }, { "epoch": 0.12, "learning_rate": 0.0002814117996346902, "loss": 0.0853, "step": 19200 }, { "epoch": 0.12, "learning_rate": 0.00028140211828033327, "loss": 0.0883, "step": 19210 }, { "epoch": 0.12, "learning_rate": 0.00028139243692597635, "loss": 0.0913, "step": 19220 }, { "epoch": 0.12, "learning_rate": 0.00028138275557161943, "loss": 0.0953, "step": 19230 }, { "epoch": 0.12, "learning_rate": 0.0002813730742172625, "loss": 0.0886, "step": 19240 }, { "epoch": 0.12, "learning_rate": 0.00028136339286290553, "loss": 0.0885, "step": 19250 }, { "epoch": 0.12, "learning_rate": 0.0002813537115085486, "loss": 0.0913, "step": 19260 }, { "epoch": 0.12, "learning_rate": 0.0002813440301541917, "loss": 0.0874, "step": 19270 }, { "epoch": 0.12, "learning_rate": 0.0002813343487998347, "loss": 0.0911, "step": 19280 }, { "epoch": 0.12, "learning_rate": 0.0002813246674454778, "loss": 0.0937, "step": 19290 }, { "epoch": 0.12, "learning_rate": 0.0002813149860911209, "loss": 0.0878, "step": 19300 }, { "epoch": 0.12, "learning_rate": 0.00028130530473676396, "loss": 0.0914, "step": 19310 }, { "epoch": 0.12, "learning_rate": 0.00028129562338240704, "loss": 0.094, "step": 19320 }, { "epoch": 0.12, "learning_rate": 0.00028128594202805006, "loss": 0.0918, "step": 19330 }, { "epoch": 0.12, "learning_rate": 0.00028127626067369314, "loss": 0.0973, "step": 19340 }, { "epoch": 0.12, "learning_rate": 0.0002812665793193362, "loss": 0.0961, "step": 19350 }, { "epoch": 0.12, "learning_rate": 0.0002812568979649793, "loss": 0.092, "step": 19360 }, { "epoch": 0.13, "learning_rate": 0.0002812472166106224, "loss": 0.0907, "step": 19370 }, { "epoch": 0.13, "learning_rate": 0.0002812375352562654, "loss": 0.0929, "step": 19380 }, { "epoch": 0.13, "learning_rate": 0.0002812278539019085, "loss": 0.1038, "step": 19390 }, { "epoch": 0.13, "learning_rate": 0.00028121817254755157, "loss": 0.1033, "step": 19400 }, { "epoch": 0.13, "learning_rate": 0.0002812084911931946, "loss": 0.0982, "step": 19410 }, { "epoch": 0.13, "learning_rate": 0.0002811988098388377, "loss": 0.0934, "step": 19420 }, { "epoch": 0.13, "learning_rate": 0.00028118912848448075, "loss": 0.0902, "step": 19430 }, { "epoch": 0.13, "learning_rate": 0.00028117944713012383, "loss": 0.0876, "step": 19440 }, { "epoch": 0.13, "learning_rate": 0.0002811697657757669, "loss": 0.0883, "step": 19450 }, { "epoch": 0.13, "learning_rate": 0.00028116008442141, "loss": 0.0987, "step": 19460 }, { "epoch": 0.13, "learning_rate": 0.000281150403067053, "loss": 0.0868, "step": 19470 }, { "epoch": 0.13, "learning_rate": 0.0002811407217126961, "loss": 0.0942, "step": 19480 }, { "epoch": 0.13, "learning_rate": 0.0002811310403583392, "loss": 0.0883, "step": 19490 }, { "epoch": 0.13, "learning_rate": 0.00028112135900398226, "loss": 0.0852, "step": 19500 }, { "epoch": 0.13, "learning_rate": 0.00028111167764962534, "loss": 0.0836, "step": 19510 }, { "epoch": 0.13, "learning_rate": 0.00028110199629526836, "loss": 0.0858, "step": 19520 }, { "epoch": 0.13, "learning_rate": 0.00028109231494091144, "loss": 0.0841, "step": 19530 }, { "epoch": 0.13, "learning_rate": 0.0002810826335865545, "loss": 0.0911, "step": 19540 }, { "epoch": 0.13, "learning_rate": 0.00028107295223219755, "loss": 0.0891, "step": 19550 }, { "epoch": 0.13, "learning_rate": 0.00028106327087784063, "loss": 0.091, "step": 19560 }, { "epoch": 0.13, "learning_rate": 0.0002810535895234837, "loss": 0.0977, "step": 19570 }, { "epoch": 0.13, "learning_rate": 0.0002810439081691268, "loss": 0.0923, "step": 19580 }, { "epoch": 0.13, "learning_rate": 0.00028103422681476987, "loss": 0.0925, "step": 19590 }, { "epoch": 0.13, "learning_rate": 0.00028102454546041295, "loss": 0.089, "step": 19600 }, { "epoch": 0.13, "learning_rate": 0.00028101486410605597, "loss": 0.091, "step": 19610 }, { "epoch": 0.13, "learning_rate": 0.00028100518275169905, "loss": 0.0954, "step": 19620 }, { "epoch": 0.13, "learning_rate": 0.00028099550139734213, "loss": 0.0941, "step": 19630 }, { "epoch": 0.13, "learning_rate": 0.0002809858200429852, "loss": 0.0894, "step": 19640 }, { "epoch": 0.13, "learning_rate": 0.00028097613868862824, "loss": 0.0888, "step": 19650 }, { "epoch": 0.13, "learning_rate": 0.0002809664573342713, "loss": 0.0767, "step": 19660 }, { "epoch": 0.13, "learning_rate": 0.0002809567759799144, "loss": 0.0934, "step": 19670 }, { "epoch": 0.13, "learning_rate": 0.0002809470946255574, "loss": 0.0837, "step": 19680 }, { "epoch": 0.13, "learning_rate": 0.0002809374132712005, "loss": 0.0877, "step": 19690 }, { "epoch": 0.13, "learning_rate": 0.0002809277319168436, "loss": 0.0977, "step": 19700 }, { "epoch": 0.13, "learning_rate": 0.00028091805056248666, "loss": 0.0953, "step": 19710 }, { "epoch": 0.13, "learning_rate": 0.00028090836920812974, "loss": 0.0901, "step": 19720 }, { "epoch": 0.13, "learning_rate": 0.0002808986878537728, "loss": 0.0872, "step": 19730 }, { "epoch": 0.13, "learning_rate": 0.0002808890064994159, "loss": 0.094, "step": 19740 }, { "epoch": 0.13, "learning_rate": 0.0002808793251450589, "loss": 0.0804, "step": 19750 }, { "epoch": 0.13, "learning_rate": 0.000280869643790702, "loss": 0.0929, "step": 19760 }, { "epoch": 0.13, "learning_rate": 0.0002808599624363451, "loss": 0.0794, "step": 19770 }, { "epoch": 0.13, "learning_rate": 0.0002808502810819881, "loss": 0.0907, "step": 19780 }, { "epoch": 0.13, "learning_rate": 0.0002808405997276312, "loss": 0.0979, "step": 19790 }, { "epoch": 0.13, "learning_rate": 0.00028083091837327427, "loss": 0.0928, "step": 19800 }, { "epoch": 0.13, "learning_rate": 0.00028082123701891735, "loss": 0.0865, "step": 19810 }, { "epoch": 0.13, "learning_rate": 0.0002808115556645604, "loss": 0.1105, "step": 19820 }, { "epoch": 0.13, "learning_rate": 0.00028080187431020346, "loss": 0.088, "step": 19830 }, { "epoch": 0.13, "learning_rate": 0.00028079219295584654, "loss": 0.0871, "step": 19840 }, { "epoch": 0.13, "learning_rate": 0.0002807825116014896, "loss": 0.0994, "step": 19850 }, { "epoch": 0.13, "learning_rate": 0.0002807728302471327, "loss": 0.0874, "step": 19860 }, { "epoch": 0.13, "learning_rate": 0.0002807631488927758, "loss": 0.0849, "step": 19870 }, { "epoch": 0.13, "learning_rate": 0.00028075346753841886, "loss": 0.0859, "step": 19880 }, { "epoch": 0.13, "learning_rate": 0.0002807437861840619, "loss": 0.0839, "step": 19890 }, { "epoch": 0.13, "learning_rate": 0.00028073410482970496, "loss": 0.0876, "step": 19900 }, { "epoch": 0.13, "learning_rate": 0.00028072442347534804, "loss": 0.0905, "step": 19910 }, { "epoch": 0.13, "learning_rate": 0.00028071474212099107, "loss": 0.0839, "step": 19920 }, { "epoch": 0.13, "learning_rate": 0.00028070506076663415, "loss": 0.0942, "step": 19930 }, { "epoch": 0.13, "learning_rate": 0.0002806953794122772, "loss": 0.0983, "step": 19940 }, { "epoch": 0.13, "learning_rate": 0.0002806856980579203, "loss": 0.0908, "step": 19950 }, { "epoch": 0.13, "learning_rate": 0.00028067601670356333, "loss": 0.0869, "step": 19960 }, { "epoch": 0.13, "learning_rate": 0.0002806663353492064, "loss": 0.098, "step": 19970 }, { "epoch": 0.13, "learning_rate": 0.0002806566539948495, "loss": 0.0949, "step": 19980 }, { "epoch": 0.13, "learning_rate": 0.00028064697264049257, "loss": 0.0903, "step": 19990 }, { "epoch": 0.13, "learning_rate": 0.00028063729128613565, "loss": 0.0893, "step": 20000 }, { "epoch": 0.13, "eval_cer": 0.9201129815840018, "eval_loss": 0.0617336705327034, "eval_runtime": 120.5228, "eval_samples_per_second": 16.594, "eval_steps_per_second": 4.149, "step": 20000 }, { "epoch": 0.13, "learning_rate": 0.00028062760993177873, "loss": 0.0877, "step": 20010 }, { "epoch": 0.13, "learning_rate": 0.00028061792857742176, "loss": 0.0923, "step": 20020 }, { "epoch": 0.13, "learning_rate": 0.00028060824722306484, "loss": 0.0889, "step": 20030 }, { "epoch": 0.13, "learning_rate": 0.0002805985658687079, "loss": 0.0913, "step": 20040 }, { "epoch": 0.13, "learning_rate": 0.00028058888451435094, "loss": 0.096, "step": 20050 }, { "epoch": 0.13, "learning_rate": 0.000280579203159994, "loss": 0.0952, "step": 20060 }, { "epoch": 0.13, "learning_rate": 0.0002805695218056371, "loss": 0.0936, "step": 20070 }, { "epoch": 0.13, "learning_rate": 0.0002805598404512802, "loss": 0.0893, "step": 20080 }, { "epoch": 0.13, "learning_rate": 0.00028055015909692326, "loss": 0.0956, "step": 20090 }, { "epoch": 0.13, "learning_rate": 0.0002805404777425663, "loss": 0.0822, "step": 20100 }, { "epoch": 0.13, "learning_rate": 0.00028053079638820937, "loss": 0.0889, "step": 20110 }, { "epoch": 0.13, "learning_rate": 0.00028052111503385245, "loss": 0.0948, "step": 20120 }, { "epoch": 0.13, "learning_rate": 0.0002805114336794955, "loss": 0.0932, "step": 20130 }, { "epoch": 0.13, "learning_rate": 0.0002805017523251386, "loss": 0.0903, "step": 20140 }, { "epoch": 0.13, "learning_rate": 0.00028049207097078163, "loss": 0.0974, "step": 20150 }, { "epoch": 0.13, "learning_rate": 0.0002804823896164247, "loss": 0.0844, "step": 20160 }, { "epoch": 0.13, "learning_rate": 0.0002804727082620678, "loss": 0.0987, "step": 20170 }, { "epoch": 0.13, "learning_rate": 0.0002804630269077108, "loss": 0.0943, "step": 20180 }, { "epoch": 0.13, "learning_rate": 0.0002804533455533539, "loss": 0.0893, "step": 20190 }, { "epoch": 0.13, "learning_rate": 0.000280443664198997, "loss": 0.0872, "step": 20200 }, { "epoch": 0.13, "learning_rate": 0.00028043398284464005, "loss": 0.0928, "step": 20210 }, { "epoch": 0.13, "learning_rate": 0.00028042430149028313, "loss": 0.0956, "step": 20220 }, { "epoch": 0.13, "learning_rate": 0.0002804146201359262, "loss": 0.0847, "step": 20230 }, { "epoch": 0.13, "learning_rate": 0.00028040493878156924, "loss": 0.0894, "step": 20240 }, { "epoch": 0.13, "learning_rate": 0.0002803952574272123, "loss": 0.0932, "step": 20250 }, { "epoch": 0.13, "learning_rate": 0.0002803855760728554, "loss": 0.0895, "step": 20260 }, { "epoch": 0.13, "learning_rate": 0.0002803758947184985, "loss": 0.0924, "step": 20270 }, { "epoch": 0.13, "learning_rate": 0.00028036621336414156, "loss": 0.0878, "step": 20280 }, { "epoch": 0.13, "learning_rate": 0.0002803565320097846, "loss": 0.082, "step": 20290 }, { "epoch": 0.13, "learning_rate": 0.00028034685065542766, "loss": 0.0905, "step": 20300 }, { "epoch": 0.13, "learning_rate": 0.00028033716930107074, "loss": 0.0831, "step": 20310 }, { "epoch": 0.13, "learning_rate": 0.00028032748794671377, "loss": 0.0863, "step": 20320 }, { "epoch": 0.13, "learning_rate": 0.00028031780659235685, "loss": 0.0847, "step": 20330 }, { "epoch": 0.13, "learning_rate": 0.00028030812523799993, "loss": 0.0892, "step": 20340 }, { "epoch": 0.13, "learning_rate": 0.000280298443883643, "loss": 0.0942, "step": 20350 }, { "epoch": 0.13, "learning_rate": 0.0002802887625292861, "loss": 0.0878, "step": 20360 }, { "epoch": 0.13, "learning_rate": 0.00028027908117492917, "loss": 0.0905, "step": 20370 }, { "epoch": 0.13, "learning_rate": 0.0002802693998205722, "loss": 0.0888, "step": 20380 }, { "epoch": 0.13, "learning_rate": 0.0002802597184662153, "loss": 0.0854, "step": 20390 }, { "epoch": 0.13, "learning_rate": 0.00028025003711185835, "loss": 0.0857, "step": 20400 }, { "epoch": 0.13, "learning_rate": 0.00028024035575750143, "loss": 0.0841, "step": 20410 }, { "epoch": 0.13, "learning_rate": 0.00028023067440314446, "loss": 0.0917, "step": 20420 }, { "epoch": 0.13, "learning_rate": 0.00028022099304878754, "loss": 0.0919, "step": 20430 }, { "epoch": 0.13, "learning_rate": 0.0002802113116944306, "loss": 0.095, "step": 20440 }, { "epoch": 0.13, "learning_rate": 0.00028020163034007364, "loss": 0.0873, "step": 20450 }, { "epoch": 0.13, "learning_rate": 0.0002801919489857167, "loss": 0.0891, "step": 20460 }, { "epoch": 0.13, "learning_rate": 0.0002801822676313598, "loss": 0.081, "step": 20470 }, { "epoch": 0.13, "learning_rate": 0.0002801725862770029, "loss": 0.088, "step": 20480 }, { "epoch": 0.13, "learning_rate": 0.00028016290492264596, "loss": 0.0876, "step": 20490 }, { "epoch": 0.13, "learning_rate": 0.00028015322356828904, "loss": 0.0932, "step": 20500 }, { "epoch": 0.13, "learning_rate": 0.0002801435422139321, "loss": 0.1059, "step": 20510 }, { "epoch": 0.13, "learning_rate": 0.00028013386085957515, "loss": 0.0906, "step": 20520 }, { "epoch": 0.13, "learning_rate": 0.00028012417950521823, "loss": 0.0893, "step": 20530 }, { "epoch": 0.13, "learning_rate": 0.0002801144981508613, "loss": 0.0891, "step": 20540 }, { "epoch": 0.13, "learning_rate": 0.00028010481679650433, "loss": 0.0956, "step": 20550 }, { "epoch": 0.13, "learning_rate": 0.0002800951354421474, "loss": 0.0828, "step": 20560 }, { "epoch": 0.13, "learning_rate": 0.0002800854540877905, "loss": 0.0866, "step": 20570 }, { "epoch": 0.13, "learning_rate": 0.0002800757727334336, "loss": 0.0918, "step": 20580 }, { "epoch": 0.13, "learning_rate": 0.0002800660913790766, "loss": 0.0956, "step": 20590 }, { "epoch": 0.13, "learning_rate": 0.0002800564100247197, "loss": 0.1036, "step": 20600 }, { "epoch": 0.13, "learning_rate": 0.00028004672867036276, "loss": 0.0942, "step": 20610 }, { "epoch": 0.13, "learning_rate": 0.00028003704731600584, "loss": 0.0904, "step": 20620 }, { "epoch": 0.13, "learning_rate": 0.0002800273659616489, "loss": 0.0893, "step": 20630 }, { "epoch": 0.13, "learning_rate": 0.000280017684607292, "loss": 0.0894, "step": 20640 }, { "epoch": 0.13, "learning_rate": 0.0002800080032529351, "loss": 0.0861, "step": 20650 }, { "epoch": 0.13, "learning_rate": 0.0002799983218985781, "loss": 0.0985, "step": 20660 }, { "epoch": 0.13, "learning_rate": 0.0002799886405442212, "loss": 0.0885, "step": 20670 }, { "epoch": 0.13, "learning_rate": 0.00027997895918986426, "loss": 0.0958, "step": 20680 }, { "epoch": 0.13, "learning_rate": 0.0002799692778355073, "loss": 0.0909, "step": 20690 }, { "epoch": 0.13, "learning_rate": 0.00027995959648115037, "loss": 0.0896, "step": 20700 }, { "epoch": 0.13, "learning_rate": 0.00027994991512679345, "loss": 0.0867, "step": 20710 }, { "epoch": 0.13, "learning_rate": 0.00027994023377243653, "loss": 0.0924, "step": 20720 }, { "epoch": 0.13, "learning_rate": 0.00027993055241807955, "loss": 0.0919, "step": 20730 }, { "epoch": 0.13, "learning_rate": 0.00027992087106372263, "loss": 0.0937, "step": 20740 }, { "epoch": 0.13, "learning_rate": 0.0002799111897093657, "loss": 0.0841, "step": 20750 }, { "epoch": 0.13, "learning_rate": 0.0002799015083550088, "loss": 0.0913, "step": 20760 }, { "epoch": 0.13, "learning_rate": 0.00027989182700065187, "loss": 0.0917, "step": 20770 }, { "epoch": 0.13, "learning_rate": 0.00027988214564629495, "loss": 0.0824, "step": 20780 }, { "epoch": 0.13, "learning_rate": 0.000279872464291938, "loss": 0.0915, "step": 20790 }, { "epoch": 0.13, "learning_rate": 0.00027986278293758106, "loss": 0.0903, "step": 20800 }, { "epoch": 0.13, "learning_rate": 0.00027985310158322414, "loss": 0.0961, "step": 20810 }, { "epoch": 0.13, "learning_rate": 0.00027984342022886716, "loss": 0.0852, "step": 20820 }, { "epoch": 0.13, "learning_rate": 0.00027983373887451024, "loss": 0.0901, "step": 20830 }, { "epoch": 0.13, "learning_rate": 0.0002798240575201533, "loss": 0.0975, "step": 20840 }, { "epoch": 0.13, "learning_rate": 0.0002798143761657964, "loss": 0.1021, "step": 20850 }, { "epoch": 0.13, "learning_rate": 0.0002798046948114395, "loss": 0.0892, "step": 20860 }, { "epoch": 0.13, "learning_rate": 0.0002797950134570825, "loss": 0.0838, "step": 20870 }, { "epoch": 0.13, "learning_rate": 0.0002797853321027256, "loss": 0.0859, "step": 20880 }, { "epoch": 0.13, "learning_rate": 0.00027977565074836867, "loss": 0.0897, "step": 20890 }, { "epoch": 0.13, "learning_rate": 0.00027976596939401175, "loss": 0.0892, "step": 20900 }, { "epoch": 0.13, "learning_rate": 0.00027975628803965483, "loss": 0.0871, "step": 20910 }, { "epoch": 0.14, "learning_rate": 0.0002797466066852979, "loss": 0.085, "step": 20920 }, { "epoch": 0.14, "learning_rate": 0.00027973692533094093, "loss": 0.0877, "step": 20930 }, { "epoch": 0.14, "learning_rate": 0.000279727243976584, "loss": 0.0885, "step": 20940 }, { "epoch": 0.14, "learning_rate": 0.00027971756262222704, "loss": 0.0845, "step": 20950 }, { "epoch": 0.14, "learning_rate": 0.0002797078812678701, "loss": 0.0914, "step": 20960 }, { "epoch": 0.14, "learning_rate": 0.0002796981999135132, "loss": 0.0927, "step": 20970 }, { "epoch": 0.14, "learning_rate": 0.0002796885185591563, "loss": 0.0908, "step": 20980 }, { "epoch": 0.14, "learning_rate": 0.00027967883720479936, "loss": 0.0919, "step": 20990 }, { "epoch": 0.14, "learning_rate": 0.00027966915585044244, "loss": 0.0834, "step": 21000 }, { "epoch": 0.14, "eval_cer": 0.9202223477573156, "eval_loss": 0.05823448300361633, "eval_runtime": 120.3243, "eval_samples_per_second": 16.622, "eval_steps_per_second": 4.155, "step": 21000 }, { "epoch": 0.14, "learning_rate": 0.00027965947449608546, "loss": 0.0809, "step": 21010 }, { "epoch": 0.14, "learning_rate": 0.00027964979314172854, "loss": 0.0962, "step": 21020 }, { "epoch": 0.14, "learning_rate": 0.0002796401117873716, "loss": 0.0888, "step": 21030 }, { "epoch": 0.14, "learning_rate": 0.0002796304304330147, "loss": 0.1118, "step": 21040 }, { "epoch": 0.14, "learning_rate": 0.0002796207490786578, "loss": 0.0849, "step": 21050 }, { "epoch": 0.14, "learning_rate": 0.0002796110677243008, "loss": 0.0872, "step": 21060 }, { "epoch": 0.14, "learning_rate": 0.0002796013863699439, "loss": 0.0928, "step": 21070 }, { "epoch": 0.14, "learning_rate": 0.00027959170501558697, "loss": 0.0871, "step": 21080 }, { "epoch": 0.14, "learning_rate": 0.00027958202366123, "loss": 0.0832, "step": 21090 }, { "epoch": 0.14, "learning_rate": 0.00027957234230687307, "loss": 0.0811, "step": 21100 }, { "epoch": 0.14, "learning_rate": 0.00027956266095251615, "loss": 0.0977, "step": 21110 }, { "epoch": 0.14, "learning_rate": 0.00027955297959815923, "loss": 0.0911, "step": 21120 }, { "epoch": 0.14, "learning_rate": 0.0002795432982438023, "loss": 0.0842, "step": 21130 }, { "epoch": 0.14, "learning_rate": 0.0002795336168894454, "loss": 0.0876, "step": 21140 }, { "epoch": 0.14, "learning_rate": 0.0002795239355350884, "loss": 0.0853, "step": 21150 }, { "epoch": 0.14, "learning_rate": 0.0002795142541807315, "loss": 0.0926, "step": 21160 }, { "epoch": 0.14, "learning_rate": 0.0002795045728263746, "loss": 0.0926, "step": 21170 }, { "epoch": 0.14, "learning_rate": 0.00027949489147201766, "loss": 0.0858, "step": 21180 }, { "epoch": 0.14, "learning_rate": 0.0002794852101176607, "loss": 0.0838, "step": 21190 }, { "epoch": 0.14, "learning_rate": 0.00027947552876330376, "loss": 0.0829, "step": 21200 }, { "epoch": 0.14, "learning_rate": 0.00027946584740894684, "loss": 0.0883, "step": 21210 }, { "epoch": 0.14, "learning_rate": 0.00027945616605458987, "loss": 0.0827, "step": 21220 }, { "epoch": 0.14, "learning_rate": 0.00027944648470023295, "loss": 0.0829, "step": 21230 }, { "epoch": 0.14, "learning_rate": 0.000279436803345876, "loss": 0.0826, "step": 21240 }, { "epoch": 0.14, "learning_rate": 0.0002794271219915191, "loss": 0.0762, "step": 21250 }, { "epoch": 0.14, "learning_rate": 0.0002794174406371622, "loss": 0.0883, "step": 21260 }, { "epoch": 0.14, "learning_rate": 0.00027940775928280527, "loss": 0.095, "step": 21270 }, { "epoch": 0.14, "learning_rate": 0.00027939807792844835, "loss": 0.0813, "step": 21280 }, { "epoch": 0.14, "learning_rate": 0.00027938839657409137, "loss": 0.0904, "step": 21290 }, { "epoch": 0.14, "learning_rate": 0.00027937871521973445, "loss": 0.0799, "step": 21300 }, { "epoch": 0.14, "learning_rate": 0.00027936903386537753, "loss": 0.0824, "step": 21310 }, { "epoch": 0.14, "learning_rate": 0.0002793593525110206, "loss": 0.0868, "step": 21320 }, { "epoch": 0.14, "learning_rate": 0.00027934967115666364, "loss": 0.0898, "step": 21330 }, { "epoch": 0.14, "learning_rate": 0.0002793399898023067, "loss": 0.0923, "step": 21340 }, { "epoch": 0.14, "learning_rate": 0.0002793303084479498, "loss": 0.0995, "step": 21350 }, { "epoch": 0.14, "learning_rate": 0.0002793206270935928, "loss": 0.0846, "step": 21360 }, { "epoch": 0.14, "learning_rate": 0.0002793109457392359, "loss": 0.0831, "step": 21370 }, { "epoch": 0.14, "learning_rate": 0.000279301264384879, "loss": 0.0853, "step": 21380 }, { "epoch": 0.14, "learning_rate": 0.00027929158303052206, "loss": 0.0807, "step": 21390 }, { "epoch": 0.14, "learning_rate": 0.00027928190167616514, "loss": 0.0855, "step": 21400 }, { "epoch": 0.14, "learning_rate": 0.0002792722203218082, "loss": 0.0817, "step": 21410 }, { "epoch": 0.14, "learning_rate": 0.0002792625389674513, "loss": 0.0828, "step": 21420 }, { "epoch": 0.14, "learning_rate": 0.0002792528576130943, "loss": 0.079, "step": 21430 }, { "epoch": 0.14, "learning_rate": 0.0002792431762587374, "loss": 0.0984, "step": 21440 }, { "epoch": 0.14, "learning_rate": 0.0002792334949043805, "loss": 0.0875, "step": 21450 }, { "epoch": 0.14, "learning_rate": 0.0002792238135500235, "loss": 0.0795, "step": 21460 }, { "epoch": 0.14, "learning_rate": 0.0002792141321956666, "loss": 0.088, "step": 21470 }, { "epoch": 0.14, "learning_rate": 0.00027920445084130967, "loss": 0.0871, "step": 21480 }, { "epoch": 0.14, "learning_rate": 0.00027919476948695275, "loss": 0.0846, "step": 21490 }, { "epoch": 0.14, "learning_rate": 0.0002791850881325958, "loss": 0.0867, "step": 21500 }, { "epoch": 0.14, "learning_rate": 0.00027917540677823886, "loss": 0.0869, "step": 21510 }, { "epoch": 0.14, "learning_rate": 0.00027916572542388194, "loss": 0.082, "step": 21520 }, { "epoch": 0.14, "learning_rate": 0.000279156044069525, "loss": 0.0821, "step": 21530 }, { "epoch": 0.14, "learning_rate": 0.0002791463627151681, "loss": 0.0959, "step": 21540 }, { "epoch": 0.14, "learning_rate": 0.0002791366813608112, "loss": 0.0878, "step": 21550 }, { "epoch": 0.14, "learning_rate": 0.0002791270000064542, "loss": 0.0863, "step": 21560 }, { "epoch": 0.14, "learning_rate": 0.0002791173186520973, "loss": 0.0894, "step": 21570 }, { "epoch": 0.14, "learning_rate": 0.00027910763729774036, "loss": 0.0915, "step": 21580 }, { "epoch": 0.14, "learning_rate": 0.0002790979559433834, "loss": 0.0836, "step": 21590 }, { "epoch": 0.14, "learning_rate": 0.00027908827458902647, "loss": 0.0846, "step": 21600 }, { "epoch": 0.14, "learning_rate": 0.00027907859323466955, "loss": 0.0864, "step": 21610 }, { "epoch": 0.14, "learning_rate": 0.0002790689118803126, "loss": 0.0886, "step": 21620 }, { "epoch": 0.14, "learning_rate": 0.0002790592305259557, "loss": 0.0809, "step": 21630 }, { "epoch": 0.14, "learning_rate": 0.00027904954917159873, "loss": 0.0842, "step": 21640 }, { "epoch": 0.14, "learning_rate": 0.0002790398678172418, "loss": 0.0854, "step": 21650 }, { "epoch": 0.14, "learning_rate": 0.0002790301864628849, "loss": 0.0841, "step": 21660 }, { "epoch": 0.14, "learning_rate": 0.00027902050510852797, "loss": 0.0806, "step": 21670 }, { "epoch": 0.14, "learning_rate": 0.00027901082375417105, "loss": 0.094, "step": 21680 }, { "epoch": 0.14, "learning_rate": 0.00027900114239981413, "loss": 0.0861, "step": 21690 }, { "epoch": 0.14, "learning_rate": 0.00027899146104545716, "loss": 0.0838, "step": 21700 }, { "epoch": 0.14, "learning_rate": 0.00027898177969110023, "loss": 0.091, "step": 21710 }, { "epoch": 0.14, "learning_rate": 0.0002789720983367433, "loss": 0.0874, "step": 21720 }, { "epoch": 0.14, "learning_rate": 0.00027896241698238634, "loss": 0.0942, "step": 21730 }, { "epoch": 0.14, "learning_rate": 0.0002789527356280294, "loss": 0.0922, "step": 21740 }, { "epoch": 0.14, "learning_rate": 0.0002789430542736725, "loss": 0.0884, "step": 21750 }, { "epoch": 0.14, "learning_rate": 0.0002789333729193156, "loss": 0.0837, "step": 21760 }, { "epoch": 0.14, "learning_rate": 0.00027892369156495866, "loss": 0.0817, "step": 21770 }, { "epoch": 0.14, "learning_rate": 0.0002789140102106017, "loss": 0.0761, "step": 21780 }, { "epoch": 0.14, "learning_rate": 0.00027890432885624476, "loss": 0.0959, "step": 21790 }, { "epoch": 0.14, "learning_rate": 0.00027889464750188784, "loss": 0.0828, "step": 21800 }, { "epoch": 0.14, "learning_rate": 0.0002788849661475309, "loss": 0.0794, "step": 21810 }, { "epoch": 0.14, "learning_rate": 0.000278875284793174, "loss": 0.0823, "step": 21820 }, { "epoch": 0.14, "learning_rate": 0.00027886560343881703, "loss": 0.0945, "step": 21830 }, { "epoch": 0.14, "learning_rate": 0.0002788559220844601, "loss": 0.0778, "step": 21840 }, { "epoch": 0.14, "learning_rate": 0.0002788462407301032, "loss": 0.0832, "step": 21850 }, { "epoch": 0.14, "learning_rate": 0.0002788365593757462, "loss": 0.086, "step": 21860 }, { "epoch": 0.14, "learning_rate": 0.0002788268780213893, "loss": 0.0821, "step": 21870 }, { "epoch": 0.14, "learning_rate": 0.0002788171966670324, "loss": 0.0882, "step": 21880 }, { "epoch": 0.14, "learning_rate": 0.00027880751531267545, "loss": 0.0738, "step": 21890 }, { "epoch": 0.14, "learning_rate": 0.00027879783395831853, "loss": 0.083, "step": 21900 }, { "epoch": 0.14, "learning_rate": 0.0002787881526039616, "loss": 0.086, "step": 21910 }, { "epoch": 0.14, "learning_rate": 0.00027877847124960464, "loss": 0.0844, "step": 21920 }, { "epoch": 0.14, "learning_rate": 0.0002787687898952477, "loss": 0.0889, "step": 21930 }, { "epoch": 0.14, "learning_rate": 0.0002787591085408908, "loss": 0.0853, "step": 21940 }, { "epoch": 0.14, "learning_rate": 0.0002787494271865339, "loss": 0.0814, "step": 21950 }, { "epoch": 0.14, "learning_rate": 0.0002787397458321769, "loss": 0.0881, "step": 21960 }, { "epoch": 0.14, "learning_rate": 0.00027873006447782, "loss": 0.0802, "step": 21970 }, { "epoch": 0.14, "learning_rate": 0.00027872038312346306, "loss": 0.0876, "step": 21980 }, { "epoch": 0.14, "learning_rate": 0.0002787107017691061, "loss": 0.1003, "step": 21990 }, { "epoch": 0.14, "learning_rate": 0.00027870102041474917, "loss": 0.0815, "step": 22000 }, { "epoch": 0.14, "eval_cer": 0.9202078861145633, "eval_loss": 0.05837943032383919, "eval_runtime": 120.4265, "eval_samples_per_second": 16.608, "eval_steps_per_second": 4.152, "step": 22000 }, { "epoch": 0.14, "learning_rate": 0.00027869133906039225, "loss": 0.0908, "step": 22010 }, { "epoch": 0.14, "learning_rate": 0.00027868165770603533, "loss": 0.0827, "step": 22020 }, { "epoch": 0.14, "learning_rate": 0.0002786719763516784, "loss": 0.0863, "step": 22030 }, { "epoch": 0.14, "learning_rate": 0.0002786622949973215, "loss": 0.0861, "step": 22040 }, { "epoch": 0.14, "learning_rate": 0.00027865261364296457, "loss": 0.0893, "step": 22050 }, { "epoch": 0.14, "learning_rate": 0.0002786429322886076, "loss": 0.0987, "step": 22060 }, { "epoch": 0.14, "learning_rate": 0.0002786332509342507, "loss": 0.0806, "step": 22070 }, { "epoch": 0.14, "learning_rate": 0.00027862356957989375, "loss": 0.0958, "step": 22080 }, { "epoch": 0.14, "learning_rate": 0.00027861388822553683, "loss": 0.0992, "step": 22090 }, { "epoch": 0.14, "learning_rate": 0.00027860420687117986, "loss": 0.0949, "step": 22100 }, { "epoch": 0.14, "learning_rate": 0.00027859452551682294, "loss": 0.0819, "step": 22110 }, { "epoch": 0.14, "learning_rate": 0.000278584844162466, "loss": 0.0935, "step": 22120 }, { "epoch": 0.14, "learning_rate": 0.00027857516280810904, "loss": 0.0851, "step": 22130 }, { "epoch": 0.14, "learning_rate": 0.0002785654814537521, "loss": 0.0844, "step": 22140 }, { "epoch": 0.14, "learning_rate": 0.0002785558000993952, "loss": 0.0854, "step": 22150 }, { "epoch": 0.14, "learning_rate": 0.0002785461187450383, "loss": 0.079, "step": 22160 }, { "epoch": 0.14, "learning_rate": 0.00027853643739068136, "loss": 0.0878, "step": 22170 }, { "epoch": 0.14, "learning_rate": 0.00027852675603632444, "loss": 0.0863, "step": 22180 }, { "epoch": 0.14, "learning_rate": 0.0002785170746819675, "loss": 0.0834, "step": 22190 }, { "epoch": 0.14, "learning_rate": 0.00027850739332761055, "loss": 0.0865, "step": 22200 }, { "epoch": 0.14, "learning_rate": 0.00027849771197325363, "loss": 0.0854, "step": 22210 }, { "epoch": 0.14, "learning_rate": 0.0002784880306188967, "loss": 0.0752, "step": 22220 }, { "epoch": 0.14, "learning_rate": 0.00027847834926453973, "loss": 0.0943, "step": 22230 }, { "epoch": 0.14, "learning_rate": 0.0002784686679101828, "loss": 0.0914, "step": 22240 }, { "epoch": 0.14, "learning_rate": 0.0002784589865558259, "loss": 0.0916, "step": 22250 }, { "epoch": 0.14, "learning_rate": 0.00027844930520146897, "loss": 0.0776, "step": 22260 }, { "epoch": 0.14, "learning_rate": 0.000278439623847112, "loss": 0.0932, "step": 22270 }, { "epoch": 0.14, "learning_rate": 0.0002784299424927551, "loss": 0.0895, "step": 22280 }, { "epoch": 0.14, "learning_rate": 0.00027842026113839816, "loss": 0.0972, "step": 22290 }, { "epoch": 0.14, "learning_rate": 0.00027841057978404124, "loss": 0.0865, "step": 22300 }, { "epoch": 0.14, "learning_rate": 0.0002784008984296843, "loss": 0.0883, "step": 22310 }, { "epoch": 0.14, "learning_rate": 0.0002783912170753274, "loss": 0.0872, "step": 22320 }, { "epoch": 0.14, "learning_rate": 0.0002783815357209704, "loss": 0.1006, "step": 22330 }, { "epoch": 0.14, "learning_rate": 0.0002783718543666135, "loss": 0.0807, "step": 22340 }, { "epoch": 0.14, "learning_rate": 0.0002783621730122566, "loss": 0.0862, "step": 22350 }, { "epoch": 0.14, "learning_rate": 0.0002783524916578996, "loss": 0.091, "step": 22360 }, { "epoch": 0.14, "learning_rate": 0.0002783428103035427, "loss": 0.0831, "step": 22370 }, { "epoch": 0.14, "learning_rate": 0.00027833312894918577, "loss": 0.0741, "step": 22380 }, { "epoch": 0.14, "learning_rate": 0.00027832344759482885, "loss": 0.0913, "step": 22390 }, { "epoch": 0.14, "learning_rate": 0.00027831376624047193, "loss": 0.0852, "step": 22400 }, { "epoch": 0.14, "learning_rate": 0.00027830408488611495, "loss": 0.0787, "step": 22410 }, { "epoch": 0.14, "learning_rate": 0.00027829440353175803, "loss": 0.0924, "step": 22420 }, { "epoch": 0.14, "learning_rate": 0.0002782847221774011, "loss": 0.0769, "step": 22430 }, { "epoch": 0.14, "learning_rate": 0.0002782750408230442, "loss": 0.0869, "step": 22440 }, { "epoch": 0.14, "learning_rate": 0.00027826535946868727, "loss": 0.0888, "step": 22450 }, { "epoch": 0.14, "learning_rate": 0.00027825567811433035, "loss": 0.0938, "step": 22460 }, { "epoch": 0.15, "learning_rate": 0.0002782459967599734, "loss": 0.0889, "step": 22470 }, { "epoch": 0.15, "learning_rate": 0.00027823631540561646, "loss": 0.0837, "step": 22480 }, { "epoch": 0.15, "learning_rate": 0.00027822663405125954, "loss": 0.0864, "step": 22490 }, { "epoch": 0.15, "learning_rate": 0.00027821695269690256, "loss": 0.0951, "step": 22500 }, { "epoch": 0.15, "learning_rate": 0.00027820727134254564, "loss": 0.0865, "step": 22510 }, { "epoch": 0.15, "learning_rate": 0.0002781975899881887, "loss": 0.0865, "step": 22520 }, { "epoch": 0.15, "learning_rate": 0.0002781879086338318, "loss": 0.085, "step": 22530 }, { "epoch": 0.15, "learning_rate": 0.0002781782272794749, "loss": 0.0851, "step": 22540 }, { "epoch": 0.15, "learning_rate": 0.0002781685459251179, "loss": 0.0882, "step": 22550 }, { "epoch": 0.15, "learning_rate": 0.000278158864570761, "loss": 0.0921, "step": 22560 }, { "epoch": 0.15, "learning_rate": 0.00027814918321640407, "loss": 0.0955, "step": 22570 }, { "epoch": 0.15, "learning_rate": 0.00027813950186204715, "loss": 0.0897, "step": 22580 }, { "epoch": 0.15, "learning_rate": 0.0002781298205076902, "loss": 0.0882, "step": 22590 }, { "epoch": 0.15, "learning_rate": 0.00027812013915333325, "loss": 0.0851, "step": 22600 }, { "epoch": 0.15, "learning_rate": 0.00027811045779897633, "loss": 0.0875, "step": 22610 }, { "epoch": 0.15, "learning_rate": 0.0002781007764446194, "loss": 0.0901, "step": 22620 }, { "epoch": 0.15, "learning_rate": 0.00027809109509026244, "loss": 0.0803, "step": 22630 }, { "epoch": 0.15, "learning_rate": 0.0002780814137359055, "loss": 0.0953, "step": 22640 }, { "epoch": 0.15, "learning_rate": 0.0002780717323815486, "loss": 0.0928, "step": 22650 }, { "epoch": 0.15, "learning_rate": 0.0002780620510271917, "loss": 0.0852, "step": 22660 }, { "epoch": 0.15, "learning_rate": 0.00027805236967283476, "loss": 0.0895, "step": 22670 }, { "epoch": 0.15, "learning_rate": 0.00027804268831847784, "loss": 0.0824, "step": 22680 }, { "epoch": 0.15, "learning_rate": 0.00027803300696412086, "loss": 0.0882, "step": 22690 }, { "epoch": 0.15, "learning_rate": 0.00027802332560976394, "loss": 0.0834, "step": 22700 }, { "epoch": 0.15, "learning_rate": 0.000278013644255407, "loss": 0.0839, "step": 22710 }, { "epoch": 0.15, "learning_rate": 0.0002780039629010501, "loss": 0.0845, "step": 22720 }, { "epoch": 0.15, "learning_rate": 0.0002779942815466932, "loss": 0.0868, "step": 22730 }, { "epoch": 0.15, "learning_rate": 0.0002779846001923362, "loss": 0.0835, "step": 22740 }, { "epoch": 0.15, "learning_rate": 0.0002779749188379793, "loss": 0.0873, "step": 22750 }, { "epoch": 0.15, "learning_rate": 0.0002779652374836223, "loss": 0.0964, "step": 22760 }, { "epoch": 0.15, "learning_rate": 0.0002779555561292654, "loss": 0.0862, "step": 22770 }, { "epoch": 0.15, "learning_rate": 0.00027794587477490847, "loss": 0.0854, "step": 22780 }, { "epoch": 0.15, "learning_rate": 0.00027793619342055155, "loss": 0.0942, "step": 22790 }, { "epoch": 0.15, "learning_rate": 0.00027792651206619463, "loss": 0.0959, "step": 22800 }, { "epoch": 0.15, "learning_rate": 0.0002779168307118377, "loss": 0.0846, "step": 22810 }, { "epoch": 0.15, "learning_rate": 0.0002779071493574808, "loss": 0.083, "step": 22820 }, { "epoch": 0.15, "learning_rate": 0.0002778974680031238, "loss": 0.091, "step": 22830 }, { "epoch": 0.15, "learning_rate": 0.0002778877866487669, "loss": 0.0762, "step": 22840 }, { "epoch": 0.15, "learning_rate": 0.00027787810529441, "loss": 0.0788, "step": 22850 }, { "epoch": 0.15, "learning_rate": 0.00027786842394005306, "loss": 0.0962, "step": 22860 }, { "epoch": 0.15, "learning_rate": 0.0002778587425856961, "loss": 0.0805, "step": 22870 }, { "epoch": 0.15, "learning_rate": 0.00027784906123133916, "loss": 0.0905, "step": 22880 }, { "epoch": 0.15, "learning_rate": 0.00027783937987698224, "loss": 0.0842, "step": 22890 }, { "epoch": 0.15, "learning_rate": 0.00027782969852262527, "loss": 0.0782, "step": 22900 }, { "epoch": 0.15, "learning_rate": 0.00027782001716826835, "loss": 0.0891, "step": 22910 }, { "epoch": 0.15, "learning_rate": 0.0002778103358139114, "loss": 0.0791, "step": 22920 }, { "epoch": 0.15, "learning_rate": 0.0002778006544595545, "loss": 0.0859, "step": 22930 }, { "epoch": 0.15, "learning_rate": 0.0002777909731051976, "loss": 0.0843, "step": 22940 }, { "epoch": 0.15, "learning_rate": 0.00027778129175084067, "loss": 0.0767, "step": 22950 }, { "epoch": 0.15, "learning_rate": 0.00027777161039648375, "loss": 0.0834, "step": 22960 }, { "epoch": 0.15, "learning_rate": 0.00027776192904212677, "loss": 0.0858, "step": 22970 }, { "epoch": 0.15, "learning_rate": 0.00027775224768776985, "loss": 0.0829, "step": 22980 }, { "epoch": 0.15, "learning_rate": 0.00027774256633341293, "loss": 0.096, "step": 22990 }, { "epoch": 0.15, "learning_rate": 0.00027773288497905596, "loss": 0.0801, "step": 23000 }, { "epoch": 0.15, "eval_cer": 0.9202295785786917, "eval_loss": 0.06064927205443382, "eval_runtime": 120.4894, "eval_samples_per_second": 16.599, "eval_steps_per_second": 4.15, "step": 23000 }, { "epoch": 0.15, "learning_rate": 0.00027772320362469904, "loss": 0.0825, "step": 23010 }, { "epoch": 0.15, "learning_rate": 0.0002777135222703421, "loss": 0.0786, "step": 23020 }, { "epoch": 0.15, "learning_rate": 0.0002777038409159852, "loss": 0.0859, "step": 23030 }, { "epoch": 0.15, "learning_rate": 0.0002776941595616282, "loss": 0.0909, "step": 23040 }, { "epoch": 0.15, "learning_rate": 0.0002776844782072713, "loss": 0.0806, "step": 23050 }, { "epoch": 0.15, "learning_rate": 0.0002776747968529144, "loss": 0.0754, "step": 23060 }, { "epoch": 0.15, "learning_rate": 0.00027766511549855746, "loss": 0.0807, "step": 23070 }, { "epoch": 0.15, "learning_rate": 0.00027765543414420054, "loss": 0.0853, "step": 23080 }, { "epoch": 0.15, "learning_rate": 0.0002776457527898436, "loss": 0.0819, "step": 23090 }, { "epoch": 0.15, "learning_rate": 0.0002776360714354867, "loss": 0.0742, "step": 23100 }, { "epoch": 0.15, "learning_rate": 0.0002776263900811297, "loss": 0.0853, "step": 23110 }, { "epoch": 0.15, "learning_rate": 0.0002776167087267728, "loss": 0.0893, "step": 23120 }, { "epoch": 0.15, "learning_rate": 0.0002776070273724159, "loss": 0.0786, "step": 23130 }, { "epoch": 0.15, "learning_rate": 0.0002775973460180589, "loss": 0.0899, "step": 23140 }, { "epoch": 0.15, "learning_rate": 0.000277587664663702, "loss": 0.0777, "step": 23150 }, { "epoch": 0.15, "learning_rate": 0.00027757798330934507, "loss": 0.0835, "step": 23160 }, { "epoch": 0.15, "learning_rate": 0.00027756830195498815, "loss": 0.0871, "step": 23170 }, { "epoch": 0.15, "learning_rate": 0.0002775586206006312, "loss": 0.084, "step": 23180 }, { "epoch": 0.15, "learning_rate": 0.00027754893924627426, "loss": 0.0844, "step": 23190 }, { "epoch": 0.15, "learning_rate": 0.00027753925789191733, "loss": 0.0889, "step": 23200 }, { "epoch": 0.15, "learning_rate": 0.0002775295765375604, "loss": 0.0907, "step": 23210 }, { "epoch": 0.15, "learning_rate": 0.0002775198951832035, "loss": 0.0862, "step": 23220 }, { "epoch": 0.15, "learning_rate": 0.0002775102138288466, "loss": 0.0866, "step": 23230 }, { "epoch": 0.15, "learning_rate": 0.0002775005324744896, "loss": 0.0837, "step": 23240 }, { "epoch": 0.15, "learning_rate": 0.0002774908511201327, "loss": 0.0837, "step": 23250 }, { "epoch": 0.15, "learning_rate": 0.00027748116976577576, "loss": 0.0831, "step": 23260 }, { "epoch": 0.15, "learning_rate": 0.0002774714884114188, "loss": 0.0838, "step": 23270 }, { "epoch": 0.15, "learning_rate": 0.00027746180705706186, "loss": 0.084, "step": 23280 }, { "epoch": 0.15, "learning_rate": 0.00027745212570270494, "loss": 0.0949, "step": 23290 }, { "epoch": 0.15, "learning_rate": 0.000277442444348348, "loss": 0.0867, "step": 23300 }, { "epoch": 0.15, "learning_rate": 0.0002774327629939911, "loss": 0.0979, "step": 23310 }, { "epoch": 0.15, "learning_rate": 0.00027742308163963413, "loss": 0.0777, "step": 23320 }, { "epoch": 0.15, "learning_rate": 0.0002774134002852772, "loss": 0.0789, "step": 23330 }, { "epoch": 0.15, "learning_rate": 0.0002774037189309203, "loss": 0.0872, "step": 23340 }, { "epoch": 0.15, "learning_rate": 0.00027739403757656337, "loss": 0.0829, "step": 23350 }, { "epoch": 0.15, "learning_rate": 0.00027738435622220645, "loss": 0.0835, "step": 23360 }, { "epoch": 0.15, "learning_rate": 0.0002773746748678495, "loss": 0.087, "step": 23370 }, { "epoch": 0.15, "learning_rate": 0.00027736499351349255, "loss": 0.1009, "step": 23380 }, { "epoch": 0.15, "learning_rate": 0.00027735531215913563, "loss": 0.09, "step": 23390 }, { "epoch": 0.15, "learning_rate": 0.00027734563080477866, "loss": 0.0763, "step": 23400 }, { "epoch": 0.15, "learning_rate": 0.00027733594945042174, "loss": 0.0835, "step": 23410 }, { "epoch": 0.15, "learning_rate": 0.0002773262680960648, "loss": 0.0953, "step": 23420 }, { "epoch": 0.15, "learning_rate": 0.0002773165867417079, "loss": 0.0795, "step": 23430 }, { "epoch": 0.15, "learning_rate": 0.000277306905387351, "loss": 0.0847, "step": 23440 }, { "epoch": 0.15, "learning_rate": 0.00027729722403299406, "loss": 0.084, "step": 23450 }, { "epoch": 0.15, "learning_rate": 0.0002772875426786371, "loss": 0.0885, "step": 23460 }, { "epoch": 0.15, "learning_rate": 0.00027727786132428016, "loss": 0.0782, "step": 23470 }, { "epoch": 0.15, "learning_rate": 0.00027726817996992324, "loss": 0.0843, "step": 23480 }, { "epoch": 0.15, "learning_rate": 0.0002772584986155663, "loss": 0.1056, "step": 23490 }, { "epoch": 0.15, "learning_rate": 0.0002772488172612094, "loss": 0.0892, "step": 23500 }, { "epoch": 0.15, "learning_rate": 0.00027723913590685243, "loss": 0.0827, "step": 23510 }, { "epoch": 0.15, "learning_rate": 0.0002772294545524955, "loss": 0.0775, "step": 23520 }, { "epoch": 0.15, "learning_rate": 0.0002772197731981386, "loss": 0.0886, "step": 23530 }, { "epoch": 0.15, "learning_rate": 0.0002772100918437816, "loss": 0.0802, "step": 23540 }, { "epoch": 0.15, "learning_rate": 0.0002772004104894247, "loss": 0.0841, "step": 23550 }, { "epoch": 0.15, "learning_rate": 0.0002771907291350678, "loss": 0.0892, "step": 23560 }, { "epoch": 0.15, "learning_rate": 0.00027718104778071085, "loss": 0.0921, "step": 23570 }, { "epoch": 0.15, "learning_rate": 0.00027717136642635393, "loss": 0.0875, "step": 23580 }, { "epoch": 0.15, "learning_rate": 0.000277161685071997, "loss": 0.0791, "step": 23590 }, { "epoch": 0.15, "learning_rate": 0.00027715200371764004, "loss": 0.0801, "step": 23600 }, { "epoch": 0.15, "learning_rate": 0.0002771423223632831, "loss": 0.0805, "step": 23610 }, { "epoch": 0.15, "learning_rate": 0.0002771326410089262, "loss": 0.0831, "step": 23620 }, { "epoch": 0.15, "learning_rate": 0.0002771229596545693, "loss": 0.0806, "step": 23630 }, { "epoch": 0.15, "learning_rate": 0.0002771132783002123, "loss": 0.0813, "step": 23640 }, { "epoch": 0.15, "learning_rate": 0.0002771035969458554, "loss": 0.08, "step": 23650 }, { "epoch": 0.15, "learning_rate": 0.00027709391559149846, "loss": 0.0829, "step": 23660 }, { "epoch": 0.15, "learning_rate": 0.0002770842342371415, "loss": 0.0822, "step": 23670 }, { "epoch": 0.15, "learning_rate": 0.00027707455288278457, "loss": 0.0754, "step": 23680 }, { "epoch": 0.15, "learning_rate": 0.00027706487152842765, "loss": 0.0773, "step": 23690 }, { "epoch": 0.15, "learning_rate": 0.00027705519017407073, "loss": 0.0754, "step": 23700 }, { "epoch": 0.15, "learning_rate": 0.0002770455088197138, "loss": 0.0874, "step": 23710 }, { "epoch": 0.15, "learning_rate": 0.0002770358274653569, "loss": 0.0813, "step": 23720 }, { "epoch": 0.15, "learning_rate": 0.00027702614611099997, "loss": 0.0836, "step": 23730 }, { "epoch": 0.15, "learning_rate": 0.000277016464756643, "loss": 0.085, "step": 23740 }, { "epoch": 0.15, "learning_rate": 0.00027700678340228607, "loss": 0.0947, "step": 23750 }, { "epoch": 0.15, "learning_rate": 0.00027699710204792915, "loss": 0.0881, "step": 23760 }, { "epoch": 0.15, "learning_rate": 0.0002769874206935722, "loss": 0.0918, "step": 23770 }, { "epoch": 0.15, "learning_rate": 0.00027697773933921526, "loss": 0.0887, "step": 23780 }, { "epoch": 0.15, "learning_rate": 0.00027696805798485834, "loss": 0.0871, "step": 23790 }, { "epoch": 0.15, "learning_rate": 0.0002769583766305014, "loss": 0.0891, "step": 23800 }, { "epoch": 0.15, "learning_rate": 0.00027694869527614444, "loss": 0.0802, "step": 23810 }, { "epoch": 0.15, "learning_rate": 0.0002769390139217875, "loss": 0.0794, "step": 23820 }, { "epoch": 0.15, "learning_rate": 0.0002769293325674306, "loss": 0.099, "step": 23830 }, { "epoch": 0.15, "learning_rate": 0.0002769196512130737, "loss": 0.0877, "step": 23840 }, { "epoch": 0.15, "learning_rate": 0.00027690996985871676, "loss": 0.076, "step": 23850 }, { "epoch": 0.15, "learning_rate": 0.00027690028850435984, "loss": 0.0859, "step": 23860 }, { "epoch": 0.15, "learning_rate": 0.0002768906071500029, "loss": 0.0943, "step": 23870 }, { "epoch": 0.15, "learning_rate": 0.00027688092579564595, "loss": 0.0795, "step": 23880 }, { "epoch": 0.15, "learning_rate": 0.00027687124444128903, "loss": 0.0917, "step": 23890 }, { "epoch": 0.15, "learning_rate": 0.0002768615630869321, "loss": 0.0919, "step": 23900 }, { "epoch": 0.15, "learning_rate": 0.00027685188173257513, "loss": 0.0935, "step": 23910 }, { "epoch": 0.15, "learning_rate": 0.0002768422003782182, "loss": 0.0776, "step": 23920 }, { "epoch": 0.15, "learning_rate": 0.0002768325190238613, "loss": 0.0901, "step": 23930 }, { "epoch": 0.15, "learning_rate": 0.00027682283766950437, "loss": 0.0854, "step": 23940 }, { "epoch": 0.15, "learning_rate": 0.0002768131563151474, "loss": 0.0786, "step": 23950 }, { "epoch": 0.15, "learning_rate": 0.0002768034749607905, "loss": 0.0867, "step": 23960 }, { "epoch": 0.15, "learning_rate": 0.00027679379360643356, "loss": 0.0776, "step": 23970 }, { "epoch": 0.15, "learning_rate": 0.00027678411225207664, "loss": 0.0895, "step": 23980 }, { "epoch": 0.15, "learning_rate": 0.0002767744308977197, "loss": 0.0833, "step": 23990 }, { "epoch": 0.15, "learning_rate": 0.0002767647495433628, "loss": 0.0764, "step": 24000 }, { "epoch": 0.15, "eval_cer": 0.920127443226754, "eval_loss": 0.05912618711590767, "eval_runtime": 120.5476, "eval_samples_per_second": 16.591, "eval_steps_per_second": 4.148, "step": 24000 }, { "epoch": 0.15, "learning_rate": 0.0002767550681890058, "loss": 0.089, "step": 24010 }, { "epoch": 0.16, "learning_rate": 0.0002767453868346489, "loss": 0.0763, "step": 24020 }, { "epoch": 0.16, "learning_rate": 0.000276735705480292, "loss": 0.1077, "step": 24030 }, { "epoch": 0.16, "learning_rate": 0.000276726024125935, "loss": 0.084, "step": 24040 }, { "epoch": 0.16, "learning_rate": 0.0002767163427715781, "loss": 0.0774, "step": 24050 }, { "epoch": 0.16, "learning_rate": 0.00027670666141722117, "loss": 0.0827, "step": 24060 }, { "epoch": 0.16, "learning_rate": 0.00027669698006286425, "loss": 0.0831, "step": 24070 }, { "epoch": 0.16, "learning_rate": 0.0002766872987085073, "loss": 0.0865, "step": 24080 }, { "epoch": 0.16, "learning_rate": 0.00027667761735415035, "loss": 0.0803, "step": 24090 }, { "epoch": 0.16, "learning_rate": 0.00027666793599979343, "loss": 0.0828, "step": 24100 }, { "epoch": 0.16, "learning_rate": 0.0002766582546454365, "loss": 0.0902, "step": 24110 }, { "epoch": 0.16, "learning_rate": 0.0002766485732910796, "loss": 0.0817, "step": 24120 }, { "epoch": 0.16, "learning_rate": 0.00027663889193672267, "loss": 0.0863, "step": 24130 }, { "epoch": 0.16, "learning_rate": 0.0002766292105823657, "loss": 0.0878, "step": 24140 }, { "epoch": 0.16, "learning_rate": 0.0002766195292280088, "loss": 0.0832, "step": 24150 }, { "epoch": 0.16, "learning_rate": 0.00027660984787365186, "loss": 0.0952, "step": 24160 }, { "epoch": 0.16, "learning_rate": 0.0002766001665192949, "loss": 0.1014, "step": 24170 }, { "epoch": 0.16, "learning_rate": 0.00027659048516493796, "loss": 0.0823, "step": 24180 }, { "epoch": 0.16, "learning_rate": 0.00027658080381058104, "loss": 0.0901, "step": 24190 }, { "epoch": 0.16, "learning_rate": 0.0002765711224562241, "loss": 0.0863, "step": 24200 }, { "epoch": 0.16, "learning_rate": 0.0002765614411018672, "loss": 0.0839, "step": 24210 }, { "epoch": 0.16, "learning_rate": 0.0002765517597475102, "loss": 0.0868, "step": 24220 }, { "epoch": 0.16, "learning_rate": 0.0002765420783931533, "loss": 0.0877, "step": 24230 }, { "epoch": 0.16, "learning_rate": 0.0002765323970387964, "loss": 0.0801, "step": 24240 }, { "epoch": 0.16, "learning_rate": 0.00027652271568443947, "loss": 0.0874, "step": 24250 }, { "epoch": 0.16, "learning_rate": 0.00027651303433008255, "loss": 0.0953, "step": 24260 }, { "epoch": 0.16, "learning_rate": 0.0002765033529757256, "loss": 0.0825, "step": 24270 }, { "epoch": 0.16, "learning_rate": 0.00027649367162136865, "loss": 0.0843, "step": 24280 }, { "epoch": 0.16, "learning_rate": 0.00027648399026701173, "loss": 0.085, "step": 24290 }, { "epoch": 0.16, "learning_rate": 0.0002764743089126548, "loss": 0.0968, "step": 24300 }, { "epoch": 0.16, "learning_rate": 0.00027646462755829784, "loss": 0.0835, "step": 24310 }, { "epoch": 0.16, "learning_rate": 0.0002764549462039409, "loss": 0.0902, "step": 24320 }, { "epoch": 0.16, "learning_rate": 0.000276445264849584, "loss": 0.0896, "step": 24330 }, { "epoch": 0.16, "learning_rate": 0.0002764355834952271, "loss": 0.0869, "step": 24340 }, { "epoch": 0.16, "learning_rate": 0.00027642590214087016, "loss": 0.0846, "step": 24350 }, { "epoch": 0.16, "learning_rate": 0.0002764162207865132, "loss": 0.0834, "step": 24360 }, { "epoch": 0.16, "learning_rate": 0.00027640653943215626, "loss": 0.0743, "step": 24370 }, { "epoch": 0.16, "learning_rate": 0.00027639685807779934, "loss": 0.0856, "step": 24380 }, { "epoch": 0.16, "learning_rate": 0.0002763871767234424, "loss": 0.0804, "step": 24390 }, { "epoch": 0.16, "learning_rate": 0.0002763774953690855, "loss": 0.0856, "step": 24400 }, { "epoch": 0.16, "learning_rate": 0.0002763678140147285, "loss": 0.0962, "step": 24410 }, { "epoch": 0.16, "learning_rate": 0.0002763581326603716, "loss": 0.0898, "step": 24420 }, { "epoch": 0.16, "learning_rate": 0.0002763484513060147, "loss": 0.0944, "step": 24430 }, { "epoch": 0.16, "learning_rate": 0.0002763387699516577, "loss": 0.0858, "step": 24440 }, { "epoch": 0.16, "learning_rate": 0.0002763290885973008, "loss": 0.0812, "step": 24450 }, { "epoch": 0.16, "learning_rate": 0.00027631940724294387, "loss": 0.084, "step": 24460 }, { "epoch": 0.16, "learning_rate": 0.00027630972588858695, "loss": 0.0755, "step": 24470 }, { "epoch": 0.16, "learning_rate": 0.00027630004453423003, "loss": 0.085, "step": 24480 }, { "epoch": 0.16, "learning_rate": 0.0002762903631798731, "loss": 0.0766, "step": 24490 }, { "epoch": 0.16, "learning_rate": 0.00027628068182551614, "loss": 0.0846, "step": 24500 }, { "epoch": 0.16, "learning_rate": 0.0002762710004711592, "loss": 0.0878, "step": 24510 }, { "epoch": 0.16, "learning_rate": 0.0002762613191168023, "loss": 0.0907, "step": 24520 }, { "epoch": 0.16, "learning_rate": 0.0002762516377624454, "loss": 0.0784, "step": 24530 }, { "epoch": 0.16, "learning_rate": 0.0002762419564080884, "loss": 0.0869, "step": 24540 }, { "epoch": 0.16, "learning_rate": 0.0002762322750537315, "loss": 0.0841, "step": 24550 }, { "epoch": 0.16, "learning_rate": 0.00027622259369937456, "loss": 0.0877, "step": 24560 }, { "epoch": 0.16, "learning_rate": 0.0002762129123450176, "loss": 0.0771, "step": 24570 }, { "epoch": 0.16, "learning_rate": 0.00027620323099066067, "loss": 0.0892, "step": 24580 }, { "epoch": 0.16, "learning_rate": 0.00027619354963630375, "loss": 0.0895, "step": 24590 }, { "epoch": 0.16, "learning_rate": 0.0002761838682819468, "loss": 0.089, "step": 24600 }, { "epoch": 0.16, "learning_rate": 0.0002761741869275899, "loss": 0.0774, "step": 24610 }, { "epoch": 0.16, "learning_rate": 0.000276164505573233, "loss": 0.0892, "step": 24620 }, { "epoch": 0.16, "learning_rate": 0.00027615482421887606, "loss": 0.0756, "step": 24630 }, { "epoch": 0.16, "learning_rate": 0.0002761451428645191, "loss": 0.0872, "step": 24640 }, { "epoch": 0.16, "learning_rate": 0.00027613546151016217, "loss": 0.1005, "step": 24650 }, { "epoch": 0.16, "learning_rate": 0.00027612578015580525, "loss": 0.0867, "step": 24660 }, { "epoch": 0.16, "learning_rate": 0.00027611609880144833, "loss": 0.0829, "step": 24670 }, { "epoch": 0.16, "learning_rate": 0.00027610641744709136, "loss": 0.0862, "step": 24680 }, { "epoch": 0.16, "learning_rate": 0.00027609673609273443, "loss": 0.0864, "step": 24690 }, { "epoch": 0.16, "learning_rate": 0.0002760870547383775, "loss": 0.0763, "step": 24700 }, { "epoch": 0.16, "learning_rate": 0.00027607737338402054, "loss": 0.0859, "step": 24710 }, { "epoch": 0.16, "learning_rate": 0.0002760676920296636, "loss": 0.0757, "step": 24720 }, { "epoch": 0.16, "learning_rate": 0.0002760580106753067, "loss": 0.088, "step": 24730 }, { "epoch": 0.16, "learning_rate": 0.0002760483293209498, "loss": 0.0835, "step": 24740 }, { "epoch": 0.16, "learning_rate": 0.00027603864796659286, "loss": 0.0874, "step": 24750 }, { "epoch": 0.16, "learning_rate": 0.00027602896661223594, "loss": 0.0854, "step": 24760 }, { "epoch": 0.16, "learning_rate": 0.000276019285257879, "loss": 0.074, "step": 24770 }, { "epoch": 0.16, "learning_rate": 0.00027600960390352204, "loss": 0.0841, "step": 24780 }, { "epoch": 0.16, "learning_rate": 0.0002759999225491651, "loss": 0.0771, "step": 24790 }, { "epoch": 0.16, "learning_rate": 0.0002759902411948082, "loss": 0.0853, "step": 24800 }, { "epoch": 0.16, "learning_rate": 0.00027598055984045123, "loss": 0.0791, "step": 24810 }, { "epoch": 0.16, "learning_rate": 0.0002759708784860943, "loss": 0.0776, "step": 24820 }, { "epoch": 0.16, "learning_rate": 0.0002759611971317374, "loss": 0.0794, "step": 24830 }, { "epoch": 0.16, "learning_rate": 0.00027595151577738047, "loss": 0.0813, "step": 24840 }, { "epoch": 0.16, "learning_rate": 0.0002759418344230235, "loss": 0.0743, "step": 24850 }, { "epoch": 0.16, "learning_rate": 0.0002759321530686666, "loss": 0.0851, "step": 24860 }, { "epoch": 0.16, "learning_rate": 0.00027592247171430965, "loss": 0.0773, "step": 24870 }, { "epoch": 0.16, "learning_rate": 0.00027591279035995273, "loss": 0.0703, "step": 24880 }, { "epoch": 0.16, "learning_rate": 0.0002759031090055958, "loss": 0.0789, "step": 24890 }, { "epoch": 0.16, "learning_rate": 0.0002758934276512389, "loss": 0.0783, "step": 24900 }, { "epoch": 0.16, "learning_rate": 0.000275883746296882, "loss": 0.0737, "step": 24910 }, { "epoch": 0.16, "learning_rate": 0.000275874064942525, "loss": 0.0856, "step": 24920 }, { "epoch": 0.16, "learning_rate": 0.0002758643835881681, "loss": 0.0797, "step": 24930 }, { "epoch": 0.16, "learning_rate": 0.0002758547022338111, "loss": 0.0841, "step": 24940 }, { "epoch": 0.16, "learning_rate": 0.0002758450208794542, "loss": 0.0802, "step": 24950 }, { "epoch": 0.16, "learning_rate": 0.00027583533952509726, "loss": 0.0742, "step": 24960 }, { "epoch": 0.16, "learning_rate": 0.00027582565817074034, "loss": 0.0802, "step": 24970 }, { "epoch": 0.16, "learning_rate": 0.0002758159768163834, "loss": 0.0788, "step": 24980 }, { "epoch": 0.16, "learning_rate": 0.00027580629546202645, "loss": 0.0785, "step": 24990 }, { "epoch": 0.16, "learning_rate": 0.00027579661410766953, "loss": 0.0779, "step": 25000 }, { "epoch": 0.16, "eval_cer": 0.9200786351824652, "eval_loss": 0.055601075291633606, "eval_runtime": 120.6339, "eval_samples_per_second": 16.579, "eval_steps_per_second": 4.145, "step": 25000 }, { "epoch": 0.16, "learning_rate": 0.0002757869327533126, "loss": 0.0794, "step": 25010 }, { "epoch": 0.16, "learning_rate": 0.0002757772513989557, "loss": 0.0827, "step": 25020 }, { "epoch": 0.16, "learning_rate": 0.00027576757004459877, "loss": 0.082, "step": 25030 }, { "epoch": 0.16, "learning_rate": 0.00027575788869024185, "loss": 0.0755, "step": 25040 }, { "epoch": 0.16, "learning_rate": 0.0002757482073358849, "loss": 0.0875, "step": 25050 }, { "epoch": 0.16, "learning_rate": 0.00027573852598152795, "loss": 0.0743, "step": 25060 }, { "epoch": 0.16, "learning_rate": 0.00027572884462717103, "loss": 0.084, "step": 25070 }, { "epoch": 0.16, "learning_rate": 0.00027571916327281406, "loss": 0.079, "step": 25080 }, { "epoch": 0.16, "learning_rate": 0.00027570948191845714, "loss": 0.0709, "step": 25090 }, { "epoch": 0.16, "learning_rate": 0.0002756998005641002, "loss": 0.0891, "step": 25100 }, { "epoch": 0.16, "learning_rate": 0.0002756901192097433, "loss": 0.0788, "step": 25110 }, { "epoch": 0.16, "learning_rate": 0.0002756804378553864, "loss": 0.0821, "step": 25120 }, { "epoch": 0.16, "learning_rate": 0.0002756707565010294, "loss": 0.0805, "step": 25130 }, { "epoch": 0.16, "learning_rate": 0.0002756610751466725, "loss": 0.0893, "step": 25140 }, { "epoch": 0.16, "learning_rate": 0.00027565139379231556, "loss": 0.0821, "step": 25150 }, { "epoch": 0.16, "learning_rate": 0.00027564171243795864, "loss": 0.084, "step": 25160 }, { "epoch": 0.16, "learning_rate": 0.0002756320310836017, "loss": 0.0861, "step": 25170 }, { "epoch": 0.16, "learning_rate": 0.00027562234972924475, "loss": 0.0722, "step": 25180 }, { "epoch": 0.16, "learning_rate": 0.00027561266837488783, "loss": 0.0849, "step": 25190 }, { "epoch": 0.16, "learning_rate": 0.0002756029870205309, "loss": 0.0809, "step": 25200 }, { "epoch": 0.16, "learning_rate": 0.00027559330566617393, "loss": 0.0845, "step": 25210 }, { "epoch": 0.16, "learning_rate": 0.000275583624311817, "loss": 0.0745, "step": 25220 }, { "epoch": 0.16, "learning_rate": 0.0002755739429574601, "loss": 0.0786, "step": 25230 }, { "epoch": 0.16, "learning_rate": 0.00027556426160310317, "loss": 0.09, "step": 25240 }, { "epoch": 0.16, "learning_rate": 0.00027555458024874625, "loss": 0.0857, "step": 25250 }, { "epoch": 0.16, "learning_rate": 0.00027554489889438933, "loss": 0.0831, "step": 25260 }, { "epoch": 0.16, "learning_rate": 0.00027553521754003236, "loss": 0.0783, "step": 25270 }, { "epoch": 0.16, "learning_rate": 0.00027552553618567544, "loss": 0.0744, "step": 25280 }, { "epoch": 0.16, "learning_rate": 0.0002755158548313185, "loss": 0.0801, "step": 25290 }, { "epoch": 0.16, "learning_rate": 0.0002755061734769616, "loss": 0.0843, "step": 25300 }, { "epoch": 0.16, "learning_rate": 0.0002754964921226047, "loss": 0.0846, "step": 25310 }, { "epoch": 0.16, "learning_rate": 0.0002754868107682477, "loss": 0.0823, "step": 25320 }, { "epoch": 0.16, "learning_rate": 0.0002754771294138908, "loss": 0.0865, "step": 25330 }, { "epoch": 0.16, "learning_rate": 0.0002754674480595338, "loss": 0.0809, "step": 25340 }, { "epoch": 0.16, "learning_rate": 0.0002754577667051769, "loss": 0.0823, "step": 25350 }, { "epoch": 0.16, "learning_rate": 0.00027544808535081997, "loss": 0.074, "step": 25360 }, { "epoch": 0.16, "learning_rate": 0.00027543840399646305, "loss": 0.0783, "step": 25370 }, { "epoch": 0.16, "learning_rate": 0.00027542872264210613, "loss": 0.0785, "step": 25380 }, { "epoch": 0.16, "learning_rate": 0.0002754190412877492, "loss": 0.0791, "step": 25390 }, { "epoch": 0.16, "learning_rate": 0.0002754093599333923, "loss": 0.09, "step": 25400 }, { "epoch": 0.16, "learning_rate": 0.0002753996785790353, "loss": 0.0897, "step": 25410 }, { "epoch": 0.16, "learning_rate": 0.0002753899972246784, "loss": 0.0906, "step": 25420 }, { "epoch": 0.16, "learning_rate": 0.00027538031587032147, "loss": 0.0755, "step": 25430 }, { "epoch": 0.16, "learning_rate": 0.00027537063451596455, "loss": 0.0797, "step": 25440 }, { "epoch": 0.16, "learning_rate": 0.0002753609531616076, "loss": 0.0794, "step": 25450 }, { "epoch": 0.16, "learning_rate": 0.00027535127180725066, "loss": 0.0806, "step": 25460 }, { "epoch": 0.16, "learning_rate": 0.00027534159045289374, "loss": 0.0858, "step": 25470 }, { "epoch": 0.16, "learning_rate": 0.00027533190909853676, "loss": 0.0756, "step": 25480 }, { "epoch": 0.16, "learning_rate": 0.00027532222774417984, "loss": 0.0768, "step": 25490 }, { "epoch": 0.16, "learning_rate": 0.0002753125463898229, "loss": 0.0827, "step": 25500 }, { "epoch": 0.16, "learning_rate": 0.000275302865035466, "loss": 0.086, "step": 25510 }, { "epoch": 0.16, "learning_rate": 0.0002752931836811091, "loss": 0.077, "step": 25520 }, { "epoch": 0.16, "learning_rate": 0.00027528350232675216, "loss": 0.081, "step": 25530 }, { "epoch": 0.16, "learning_rate": 0.00027527382097239524, "loss": 0.0796, "step": 25540 }, { "epoch": 0.16, "learning_rate": 0.00027526413961803827, "loss": 0.0907, "step": 25550 }, { "epoch": 0.16, "learning_rate": 0.00027525445826368135, "loss": 0.0859, "step": 25560 }, { "epoch": 0.17, "learning_rate": 0.0002752447769093244, "loss": 0.0851, "step": 25570 }, { "epoch": 0.17, "learning_rate": 0.00027523509555496745, "loss": 0.0849, "step": 25580 }, { "epoch": 0.17, "learning_rate": 0.00027522541420061053, "loss": 0.0801, "step": 25590 }, { "epoch": 0.17, "learning_rate": 0.0002752157328462536, "loss": 0.0787, "step": 25600 }, { "epoch": 0.17, "learning_rate": 0.0002752060514918967, "loss": 0.0805, "step": 25610 }, { "epoch": 0.17, "learning_rate": 0.0002751963701375397, "loss": 0.0807, "step": 25620 }, { "epoch": 0.17, "learning_rate": 0.0002751866887831828, "loss": 0.0777, "step": 25630 }, { "epoch": 0.17, "learning_rate": 0.0002751770074288259, "loss": 0.0858, "step": 25640 }, { "epoch": 0.17, "learning_rate": 0.00027516732607446896, "loss": 0.0756, "step": 25650 }, { "epoch": 0.17, "learning_rate": 0.00027515764472011204, "loss": 0.081, "step": 25660 }, { "epoch": 0.17, "learning_rate": 0.0002751479633657551, "loss": 0.0802, "step": 25670 }, { "epoch": 0.17, "learning_rate": 0.0002751382820113982, "loss": 0.0764, "step": 25680 }, { "epoch": 0.17, "learning_rate": 0.0002751286006570412, "loss": 0.0846, "step": 25690 }, { "epoch": 0.17, "learning_rate": 0.0002751189193026843, "loss": 0.0765, "step": 25700 }, { "epoch": 0.17, "learning_rate": 0.0002751092379483274, "loss": 0.0857, "step": 25710 }, { "epoch": 0.17, "learning_rate": 0.0002750995565939704, "loss": 0.0816, "step": 25720 }, { "epoch": 0.17, "learning_rate": 0.0002750898752396135, "loss": 0.0754, "step": 25730 }, { "epoch": 0.17, "learning_rate": 0.00027508019388525657, "loss": 0.0789, "step": 25740 }, { "epoch": 0.17, "learning_rate": 0.00027507051253089965, "loss": 0.081, "step": 25750 }, { "epoch": 0.17, "learning_rate": 0.00027506083117654267, "loss": 0.0821, "step": 25760 }, { "epoch": 0.17, "learning_rate": 0.00027505114982218575, "loss": 0.074, "step": 25770 }, { "epoch": 0.17, "learning_rate": 0.00027504146846782883, "loss": 0.078, "step": 25780 }, { "epoch": 0.17, "learning_rate": 0.0002750317871134719, "loss": 0.0847, "step": 25790 }, { "epoch": 0.17, "learning_rate": 0.000275022105759115, "loss": 0.0789, "step": 25800 }, { "epoch": 0.17, "learning_rate": 0.00027501242440475807, "loss": 0.0776, "step": 25810 }, { "epoch": 0.17, "learning_rate": 0.0002750027430504011, "loss": 0.0773, "step": 25820 }, { "epoch": 0.17, "learning_rate": 0.0002749930616960442, "loss": 0.0928, "step": 25830 }, { "epoch": 0.17, "learning_rate": 0.00027498338034168726, "loss": 0.0805, "step": 25840 }, { "epoch": 0.17, "learning_rate": 0.0002749736989873303, "loss": 0.0892, "step": 25850 }, { "epoch": 0.17, "learning_rate": 0.00027496401763297336, "loss": 0.0801, "step": 25860 }, { "epoch": 0.17, "learning_rate": 0.00027495433627861644, "loss": 0.0929, "step": 25870 }, { "epoch": 0.17, "learning_rate": 0.0002749446549242595, "loss": 0.085, "step": 25880 }, { "epoch": 0.17, "learning_rate": 0.0002749349735699026, "loss": 0.0845, "step": 25890 }, { "epoch": 0.17, "learning_rate": 0.0002749252922155456, "loss": 0.0766, "step": 25900 }, { "epoch": 0.17, "learning_rate": 0.0002749156108611887, "loss": 0.0809, "step": 25910 }, { "epoch": 0.17, "learning_rate": 0.0002749059295068318, "loss": 0.0844, "step": 25920 }, { "epoch": 0.17, "learning_rate": 0.00027489624815247487, "loss": 0.085, "step": 25930 }, { "epoch": 0.17, "learning_rate": 0.00027488656679811795, "loss": 0.0703, "step": 25940 }, { "epoch": 0.17, "learning_rate": 0.00027487688544376097, "loss": 0.0917, "step": 25950 }, { "epoch": 0.17, "learning_rate": 0.00027486720408940405, "loss": 0.0807, "step": 25960 }, { "epoch": 0.17, "learning_rate": 0.00027485752273504713, "loss": 0.0723, "step": 25970 }, { "epoch": 0.17, "learning_rate": 0.00027484784138069016, "loss": 0.0756, "step": 25980 }, { "epoch": 0.17, "learning_rate": 0.00027483816002633324, "loss": 0.079, "step": 25990 }, { "epoch": 0.17, "learning_rate": 0.0002748284786719763, "loss": 0.0839, "step": 26000 }, { "epoch": 0.17, "eval_cer": 0.920187097503107, "eval_loss": 0.05482678487896919, "eval_runtime": 120.4443, "eval_samples_per_second": 16.605, "eval_steps_per_second": 4.151, "step": 26000 }, { "epoch": 0.17, "learning_rate": 0.0002748187973176194, "loss": 0.0831, "step": 26010 }, { "epoch": 0.17, "learning_rate": 0.0002748091159632625, "loss": 0.0743, "step": 26020 }, { "epoch": 0.17, "learning_rate": 0.00027479943460890555, "loss": 0.0838, "step": 26030 }, { "epoch": 0.17, "learning_rate": 0.0002747897532545486, "loss": 0.0825, "step": 26040 }, { "epoch": 0.17, "learning_rate": 0.00027478007190019166, "loss": 0.0739, "step": 26050 }, { "epoch": 0.17, "learning_rate": 0.00027477039054583474, "loss": 0.0756, "step": 26060 }, { "epoch": 0.17, "learning_rate": 0.0002747607091914778, "loss": 0.0819, "step": 26070 }, { "epoch": 0.17, "learning_rate": 0.0002747510278371209, "loss": 0.0735, "step": 26080 }, { "epoch": 0.17, "learning_rate": 0.0002747413464827639, "loss": 0.0777, "step": 26090 }, { "epoch": 0.17, "learning_rate": 0.000274731665128407, "loss": 0.0859, "step": 26100 }, { "epoch": 0.17, "learning_rate": 0.0002747219837740501, "loss": 0.072, "step": 26110 }, { "epoch": 0.17, "learning_rate": 0.0002747123024196931, "loss": 0.0829, "step": 26120 }, { "epoch": 0.17, "learning_rate": 0.0002747026210653362, "loss": 0.0791, "step": 26130 }, { "epoch": 0.17, "learning_rate": 0.00027469293971097927, "loss": 0.0851, "step": 26140 }, { "epoch": 0.17, "learning_rate": 0.00027468325835662235, "loss": 0.0768, "step": 26150 }, { "epoch": 0.17, "learning_rate": 0.00027467357700226543, "loss": 0.0778, "step": 26160 }, { "epoch": 0.17, "learning_rate": 0.0002746638956479085, "loss": 0.0812, "step": 26170 }, { "epoch": 0.17, "learning_rate": 0.00027465421429355153, "loss": 0.0753, "step": 26180 }, { "epoch": 0.17, "learning_rate": 0.0002746445329391946, "loss": 0.0906, "step": 26190 }, { "epoch": 0.17, "learning_rate": 0.0002746348515848377, "loss": 0.0908, "step": 26200 }, { "epoch": 0.17, "learning_rate": 0.0002746251702304808, "loss": 0.0823, "step": 26210 }, { "epoch": 0.17, "learning_rate": 0.0002746154888761238, "loss": 0.0855, "step": 26220 }, { "epoch": 0.17, "learning_rate": 0.0002746058075217669, "loss": 0.0875, "step": 26230 }, { "epoch": 0.17, "learning_rate": 0.00027459612616740996, "loss": 0.0872, "step": 26240 }, { "epoch": 0.17, "learning_rate": 0.000274586444813053, "loss": 0.0768, "step": 26250 }, { "epoch": 0.17, "learning_rate": 0.00027457676345869606, "loss": 0.0801, "step": 26260 }, { "epoch": 0.17, "learning_rate": 0.00027456708210433914, "loss": 0.0858, "step": 26270 }, { "epoch": 0.17, "learning_rate": 0.0002745574007499822, "loss": 0.081, "step": 26280 }, { "epoch": 0.17, "learning_rate": 0.0002745477193956253, "loss": 0.086, "step": 26290 }, { "epoch": 0.17, "learning_rate": 0.0002745380380412684, "loss": 0.0765, "step": 26300 }, { "epoch": 0.17, "learning_rate": 0.00027452835668691146, "loss": 0.0692, "step": 26310 }, { "epoch": 0.17, "learning_rate": 0.0002745186753325545, "loss": 0.0889, "step": 26320 }, { "epoch": 0.17, "learning_rate": 0.00027450899397819757, "loss": 0.0822, "step": 26330 }, { "epoch": 0.17, "learning_rate": 0.00027449931262384065, "loss": 0.0715, "step": 26340 }, { "epoch": 0.17, "learning_rate": 0.0002744896312694837, "loss": 0.0917, "step": 26350 }, { "epoch": 0.17, "learning_rate": 0.00027447994991512675, "loss": 0.076, "step": 26360 }, { "epoch": 0.17, "learning_rate": 0.00027447026856076983, "loss": 0.0844, "step": 26370 }, { "epoch": 0.17, "learning_rate": 0.0002744605872064129, "loss": 0.0737, "step": 26380 }, { "epoch": 0.17, "learning_rate": 0.00027445090585205594, "loss": 0.086, "step": 26390 }, { "epoch": 0.17, "learning_rate": 0.000274441224497699, "loss": 0.0738, "step": 26400 }, { "epoch": 0.17, "learning_rate": 0.0002744315431433421, "loss": 0.0801, "step": 26410 }, { "epoch": 0.17, "learning_rate": 0.0002744218617889852, "loss": 0.0762, "step": 26420 }, { "epoch": 0.17, "learning_rate": 0.00027441218043462826, "loss": 0.0787, "step": 26430 }, { "epoch": 0.17, "learning_rate": 0.00027440249908027134, "loss": 0.0816, "step": 26440 }, { "epoch": 0.17, "learning_rate": 0.0002743928177259144, "loss": 0.0835, "step": 26450 }, { "epoch": 0.17, "learning_rate": 0.00027438313637155744, "loss": 0.0803, "step": 26460 }, { "epoch": 0.17, "learning_rate": 0.0002743734550172005, "loss": 0.0749, "step": 26470 }, { "epoch": 0.17, "learning_rate": 0.0002743637736628436, "loss": 0.0834, "step": 26480 }, { "epoch": 0.17, "learning_rate": 0.00027435409230848663, "loss": 0.08, "step": 26490 }, { "epoch": 0.17, "learning_rate": 0.0002743444109541297, "loss": 0.0812, "step": 26500 }, { "epoch": 0.17, "learning_rate": 0.0002743347295997728, "loss": 0.0787, "step": 26510 }, { "epoch": 0.17, "learning_rate": 0.00027432504824541587, "loss": 0.0733, "step": 26520 }, { "epoch": 0.17, "learning_rate": 0.0002743153668910589, "loss": 0.0841, "step": 26530 }, { "epoch": 0.17, "learning_rate": 0.000274305685536702, "loss": 0.0779, "step": 26540 }, { "epoch": 0.17, "learning_rate": 0.00027429600418234505, "loss": 0.0809, "step": 26550 }, { "epoch": 0.17, "learning_rate": 0.00027428632282798813, "loss": 0.0848, "step": 26560 }, { "epoch": 0.17, "learning_rate": 0.0002742766414736312, "loss": 0.0786, "step": 26570 }, { "epoch": 0.17, "learning_rate": 0.0002742669601192743, "loss": 0.0825, "step": 26580 }, { "epoch": 0.17, "learning_rate": 0.0002742572787649173, "loss": 0.08, "step": 26590 }, { "epoch": 0.17, "learning_rate": 0.0002742475974105604, "loss": 0.0862, "step": 26600 }, { "epoch": 0.17, "learning_rate": 0.0002742379160562035, "loss": 0.0827, "step": 26610 }, { "epoch": 0.17, "learning_rate": 0.0002742282347018465, "loss": 0.0763, "step": 26620 }, { "epoch": 0.17, "learning_rate": 0.0002742185533474896, "loss": 0.0829, "step": 26630 }, { "epoch": 0.17, "learning_rate": 0.00027420887199313266, "loss": 0.0751, "step": 26640 }, { "epoch": 0.17, "learning_rate": 0.00027419919063877574, "loss": 0.0729, "step": 26650 }, { "epoch": 0.17, "learning_rate": 0.0002741895092844188, "loss": 0.0825, "step": 26660 }, { "epoch": 0.17, "learning_rate": 0.00027417982793006185, "loss": 0.0695, "step": 26670 }, { "epoch": 0.17, "learning_rate": 0.00027417014657570493, "loss": 0.0834, "step": 26680 }, { "epoch": 0.17, "learning_rate": 0.000274160465221348, "loss": 0.0731, "step": 26690 }, { "epoch": 0.17, "learning_rate": 0.0002741507838669911, "loss": 0.0814, "step": 26700 }, { "epoch": 0.17, "learning_rate": 0.00027414110251263417, "loss": 0.0836, "step": 26710 }, { "epoch": 0.17, "learning_rate": 0.0002741314211582772, "loss": 0.0917, "step": 26720 }, { "epoch": 0.17, "learning_rate": 0.0002741217398039203, "loss": 0.0819, "step": 26730 }, { "epoch": 0.17, "learning_rate": 0.00027411205844956335, "loss": 0.0858, "step": 26740 }, { "epoch": 0.17, "learning_rate": 0.0002741023770952064, "loss": 0.0969, "step": 26750 }, { "epoch": 0.17, "learning_rate": 0.00027409269574084946, "loss": 0.0806, "step": 26760 }, { "epoch": 0.17, "learning_rate": 0.00027408301438649254, "loss": 0.0853, "step": 26770 }, { "epoch": 0.17, "learning_rate": 0.0002740733330321356, "loss": 0.0944, "step": 26780 }, { "epoch": 0.17, "learning_rate": 0.0002740636516777787, "loss": 0.0825, "step": 26790 }, { "epoch": 0.17, "learning_rate": 0.0002740539703234218, "loss": 0.0841, "step": 26800 }, { "epoch": 0.17, "learning_rate": 0.0002740442889690648, "loss": 0.0775, "step": 26810 }, { "epoch": 0.17, "learning_rate": 0.0002740346076147079, "loss": 0.0874, "step": 26820 }, { "epoch": 0.17, "learning_rate": 0.00027402492626035096, "loss": 0.0888, "step": 26830 }, { "epoch": 0.17, "learning_rate": 0.00027401524490599404, "loss": 0.0874, "step": 26840 }, { "epoch": 0.17, "learning_rate": 0.0002740055635516371, "loss": 0.0806, "step": 26850 }, { "epoch": 0.17, "learning_rate": 0.00027399588219728015, "loss": 0.0848, "step": 26860 }, { "epoch": 0.17, "learning_rate": 0.00027398620084292323, "loss": 0.0849, "step": 26870 }, { "epoch": 0.17, "learning_rate": 0.0002739765194885663, "loss": 0.0748, "step": 26880 }, { "epoch": 0.17, "learning_rate": 0.00027396683813420933, "loss": 0.0871, "step": 26890 }, { "epoch": 0.17, "learning_rate": 0.0002739571567798524, "loss": 0.0712, "step": 26900 }, { "epoch": 0.17, "learning_rate": 0.0002739474754254955, "loss": 0.0749, "step": 26910 }, { "epoch": 0.17, "learning_rate": 0.00027393779407113857, "loss": 0.0809, "step": 26920 }, { "epoch": 0.17, "learning_rate": 0.00027392811271678165, "loss": 0.093, "step": 26930 }, { "epoch": 0.17, "learning_rate": 0.00027391843136242473, "loss": 0.0829, "step": 26940 }, { "epoch": 0.17, "learning_rate": 0.00027390875000806776, "loss": 0.0739, "step": 26950 }, { "epoch": 0.17, "learning_rate": 0.00027389906865371084, "loss": 0.0842, "step": 26960 }, { "epoch": 0.17, "learning_rate": 0.0002738893872993539, "loss": 0.0819, "step": 26970 }, { "epoch": 0.17, "learning_rate": 0.000273879705944997, "loss": 0.0789, "step": 26980 }, { "epoch": 0.17, "learning_rate": 0.00027387002459064, "loss": 0.0716, "step": 26990 }, { "epoch": 0.17, "learning_rate": 0.0002738603432362831, "loss": 0.0811, "step": 27000 }, { "epoch": 0.17, "eval_cer": 0.9201509433962264, "eval_loss": 0.053227175027132034, "eval_runtime": 120.4018, "eval_samples_per_second": 16.611, "eval_steps_per_second": 4.153, "step": 27000 }, { "epoch": 0.17, "learning_rate": 0.0002738506618819262, "loss": 0.0779, "step": 27010 }, { "epoch": 0.17, "learning_rate": 0.0002738409805275692, "loss": 0.0745, "step": 27020 }, { "epoch": 0.17, "learning_rate": 0.0002738312991732123, "loss": 0.0749, "step": 27030 }, { "epoch": 0.17, "learning_rate": 0.00027382161781885537, "loss": 0.0808, "step": 27040 }, { "epoch": 0.17, "learning_rate": 0.00027381193646449845, "loss": 0.0819, "step": 27050 }, { "epoch": 0.17, "learning_rate": 0.0002738022551101415, "loss": 0.0769, "step": 27060 }, { "epoch": 0.17, "learning_rate": 0.0002737925737557846, "loss": 0.0761, "step": 27070 }, { "epoch": 0.17, "learning_rate": 0.0002737828924014277, "loss": 0.0797, "step": 27080 }, { "epoch": 0.17, "learning_rate": 0.0002737732110470707, "loss": 0.0828, "step": 27090 }, { "epoch": 0.17, "learning_rate": 0.0002737635296927138, "loss": 0.0703, "step": 27100 }, { "epoch": 0.17, "learning_rate": 0.00027375384833835687, "loss": 0.0821, "step": 27110 }, { "epoch": 0.18, "learning_rate": 0.00027374416698399995, "loss": 0.0785, "step": 27120 }, { "epoch": 0.18, "learning_rate": 0.000273734485629643, "loss": 0.0789, "step": 27130 }, { "epoch": 0.18, "learning_rate": 0.00027372480427528606, "loss": 0.0783, "step": 27140 }, { "epoch": 0.18, "learning_rate": 0.00027371512292092914, "loss": 0.0768, "step": 27150 }, { "epoch": 0.18, "learning_rate": 0.00027370544156657216, "loss": 0.0781, "step": 27160 }, { "epoch": 0.18, "learning_rate": 0.00027369576021221524, "loss": 0.078, "step": 27170 }, { "epoch": 0.18, "learning_rate": 0.0002736860788578583, "loss": 0.0853, "step": 27180 }, { "epoch": 0.18, "learning_rate": 0.0002736763975035014, "loss": 0.0755, "step": 27190 }, { "epoch": 0.18, "learning_rate": 0.0002736667161491445, "loss": 0.0833, "step": 27200 }, { "epoch": 0.18, "learning_rate": 0.00027365703479478756, "loss": 0.0771, "step": 27210 }, { "epoch": 0.18, "learning_rate": 0.00027364735344043064, "loss": 0.0918, "step": 27220 }, { "epoch": 0.18, "learning_rate": 0.00027363767208607367, "loss": 0.0806, "step": 27230 }, { "epoch": 0.18, "learning_rate": 0.00027362799073171675, "loss": 0.0797, "step": 27240 }, { "epoch": 0.18, "learning_rate": 0.0002736183093773598, "loss": 0.0776, "step": 27250 }, { "epoch": 0.18, "learning_rate": 0.00027360862802300285, "loss": 0.0858, "step": 27260 }, { "epoch": 0.18, "learning_rate": 0.00027359894666864593, "loss": 0.0947, "step": 27270 }, { "epoch": 0.18, "learning_rate": 0.000273589265314289, "loss": 0.0747, "step": 27280 }, { "epoch": 0.18, "learning_rate": 0.0002735795839599321, "loss": 0.077, "step": 27290 }, { "epoch": 0.18, "learning_rate": 0.0002735699026055751, "loss": 0.0754, "step": 27300 }, { "epoch": 0.18, "learning_rate": 0.0002735602212512182, "loss": 0.0749, "step": 27310 }, { "epoch": 0.18, "learning_rate": 0.0002735505398968613, "loss": 0.0684, "step": 27320 }, { "epoch": 0.18, "learning_rate": 0.00027354085854250436, "loss": 0.0828, "step": 27330 }, { "epoch": 0.18, "learning_rate": 0.00027353117718814744, "loss": 0.0797, "step": 27340 }, { "epoch": 0.18, "learning_rate": 0.0002735214958337905, "loss": 0.0794, "step": 27350 }, { "epoch": 0.18, "learning_rate": 0.00027351181447943354, "loss": 0.0773, "step": 27360 }, { "epoch": 0.18, "learning_rate": 0.0002735021331250766, "loss": 0.0813, "step": 27370 }, { "epoch": 0.18, "learning_rate": 0.0002734924517707197, "loss": 0.0784, "step": 27380 }, { "epoch": 0.18, "learning_rate": 0.0002734827704163627, "loss": 0.0845, "step": 27390 }, { "epoch": 0.18, "learning_rate": 0.0002734730890620058, "loss": 0.0761, "step": 27400 }, { "epoch": 0.18, "learning_rate": 0.0002734634077076489, "loss": 0.0854, "step": 27410 }, { "epoch": 0.18, "learning_rate": 0.00027345372635329197, "loss": 0.0752, "step": 27420 }, { "epoch": 0.18, "learning_rate": 0.00027344404499893505, "loss": 0.0779, "step": 27430 }, { "epoch": 0.18, "learning_rate": 0.00027343436364457807, "loss": 0.0785, "step": 27440 }, { "epoch": 0.18, "learning_rate": 0.00027342468229022115, "loss": 0.0779, "step": 27450 }, { "epoch": 0.18, "learning_rate": 0.00027341500093586423, "loss": 0.0951, "step": 27460 }, { "epoch": 0.18, "learning_rate": 0.0002734053195815073, "loss": 0.0843, "step": 27470 }, { "epoch": 0.18, "learning_rate": 0.0002733956382271504, "loss": 0.0827, "step": 27480 }, { "epoch": 0.18, "learning_rate": 0.00027338595687279347, "loss": 0.0877, "step": 27490 }, { "epoch": 0.18, "learning_rate": 0.0002733762755184365, "loss": 0.0796, "step": 27500 }, { "epoch": 0.18, "learning_rate": 0.0002733665941640796, "loss": 0.0841, "step": 27510 }, { "epoch": 0.18, "learning_rate": 0.00027335691280972265, "loss": 0.0837, "step": 27520 }, { "epoch": 0.18, "learning_rate": 0.0002733472314553657, "loss": 0.0779, "step": 27530 }, { "epoch": 0.18, "learning_rate": 0.00027333755010100876, "loss": 0.0806, "step": 27540 }, { "epoch": 0.18, "learning_rate": 0.00027332786874665184, "loss": 0.081, "step": 27550 }, { "epoch": 0.18, "learning_rate": 0.0002733181873922949, "loss": 0.0768, "step": 27560 }, { "epoch": 0.18, "learning_rate": 0.000273308506037938, "loss": 0.0863, "step": 27570 }, { "epoch": 0.18, "learning_rate": 0.000273298824683581, "loss": 0.0853, "step": 27580 }, { "epoch": 0.18, "learning_rate": 0.0002732891433292241, "loss": 0.0769, "step": 27590 }, { "epoch": 0.18, "learning_rate": 0.0002732794619748672, "loss": 0.0859, "step": 27600 }, { "epoch": 0.18, "learning_rate": 0.00027326978062051026, "loss": 0.0886, "step": 27610 }, { "epoch": 0.18, "learning_rate": 0.00027326009926615334, "loss": 0.0889, "step": 27620 }, { "epoch": 0.18, "learning_rate": 0.00027325041791179637, "loss": 0.0818, "step": 27630 }, { "epoch": 0.18, "learning_rate": 0.00027324073655743945, "loss": 0.0787, "step": 27640 }, { "epoch": 0.18, "learning_rate": 0.00027323105520308253, "loss": 0.0778, "step": 27650 }, { "epoch": 0.18, "learning_rate": 0.00027322137384872556, "loss": 0.0811, "step": 27660 }, { "epoch": 0.18, "learning_rate": 0.00027321169249436863, "loss": 0.0693, "step": 27670 }, { "epoch": 0.18, "learning_rate": 0.0002732020111400117, "loss": 0.076, "step": 27680 }, { "epoch": 0.18, "learning_rate": 0.0002731923297856548, "loss": 0.0781, "step": 27690 }, { "epoch": 0.18, "learning_rate": 0.0002731826484312979, "loss": 0.0887, "step": 27700 }, { "epoch": 0.18, "learning_rate": 0.00027317296707694095, "loss": 0.0725, "step": 27710 }, { "epoch": 0.18, "learning_rate": 0.000273163285722584, "loss": 0.0751, "step": 27720 }, { "epoch": 0.18, "learning_rate": 0.00027315360436822706, "loss": 0.0814, "step": 27730 }, { "epoch": 0.18, "learning_rate": 0.00027314392301387014, "loss": 0.0779, "step": 27740 }, { "epoch": 0.18, "learning_rate": 0.0002731342416595132, "loss": 0.0761, "step": 27750 }, { "epoch": 0.18, "learning_rate": 0.00027312456030515624, "loss": 0.0833, "step": 27760 }, { "epoch": 0.18, "learning_rate": 0.0002731148789507993, "loss": 0.0798, "step": 27770 }, { "epoch": 0.18, "learning_rate": 0.0002731051975964424, "loss": 0.0674, "step": 27780 }, { "epoch": 0.18, "learning_rate": 0.00027309551624208543, "loss": 0.0888, "step": 27790 }, { "epoch": 0.18, "learning_rate": 0.0002730858348877285, "loss": 0.0796, "step": 27800 }, { "epoch": 0.18, "learning_rate": 0.0002730761535333716, "loss": 0.0758, "step": 27810 }, { "epoch": 0.18, "learning_rate": 0.00027306647217901467, "loss": 0.0817, "step": 27820 }, { "epoch": 0.18, "learning_rate": 0.00027305679082465775, "loss": 0.0794, "step": 27830 }, { "epoch": 0.18, "learning_rate": 0.00027304710947030083, "loss": 0.0787, "step": 27840 }, { "epoch": 0.18, "learning_rate": 0.0002730374281159439, "loss": 0.074, "step": 27850 }, { "epoch": 0.18, "learning_rate": 0.00027302774676158693, "loss": 0.0822, "step": 27860 }, { "epoch": 0.18, "learning_rate": 0.00027301806540723, "loss": 0.0654, "step": 27870 }, { "epoch": 0.18, "learning_rate": 0.0002730083840528731, "loss": 0.075, "step": 27880 }, { "epoch": 0.18, "learning_rate": 0.0002729987026985162, "loss": 0.0814, "step": 27890 }, { "epoch": 0.18, "learning_rate": 0.0002729890213441592, "loss": 0.0844, "step": 27900 }, { "epoch": 0.18, "learning_rate": 0.0002729793399898023, "loss": 0.0843, "step": 27910 }, { "epoch": 0.18, "learning_rate": 0.00027296965863544536, "loss": 0.0772, "step": 27920 }, { "epoch": 0.18, "learning_rate": 0.0002729599772810884, "loss": 0.0782, "step": 27930 }, { "epoch": 0.18, "learning_rate": 0.00027295029592673146, "loss": 0.0783, "step": 27940 }, { "epoch": 0.18, "learning_rate": 0.00027294061457237454, "loss": 0.0855, "step": 27950 }, { "epoch": 0.18, "learning_rate": 0.0002729309332180176, "loss": 0.0796, "step": 27960 }, { "epoch": 0.18, "learning_rate": 0.0002729212518636607, "loss": 0.0756, "step": 27970 }, { "epoch": 0.18, "learning_rate": 0.0002729115705093038, "loss": 0.0781, "step": 27980 }, { "epoch": 0.18, "learning_rate": 0.00027290188915494686, "loss": 0.0796, "step": 27990 }, { "epoch": 0.18, "learning_rate": 0.0002728922078005899, "loss": 0.0817, "step": 28000 }, { "epoch": 0.18, "eval_cer": 0.9201979437351712, "eval_loss": 0.053717296570539474, "eval_runtime": 120.3699, "eval_samples_per_second": 16.615, "eval_steps_per_second": 4.154, "step": 28000 }, { "epoch": 0.18, "learning_rate": 0.00027288252644623297, "loss": 0.0819, "step": 28010 }, { "epoch": 0.18, "learning_rate": 0.00027287284509187605, "loss": 0.0742, "step": 28020 }, { "epoch": 0.18, "learning_rate": 0.0002728631637375191, "loss": 0.0732, "step": 28030 }, { "epoch": 0.18, "learning_rate": 0.00027285348238316215, "loss": 0.081, "step": 28040 }, { "epoch": 0.18, "learning_rate": 0.00027284380102880523, "loss": 0.0746, "step": 28050 }, { "epoch": 0.18, "learning_rate": 0.0002728341196744483, "loss": 0.081, "step": 28060 }, { "epoch": 0.18, "learning_rate": 0.00027282443832009134, "loss": 0.0778, "step": 28070 }, { "epoch": 0.18, "learning_rate": 0.0002728147569657344, "loss": 0.0768, "step": 28080 }, { "epoch": 0.18, "learning_rate": 0.0002728050756113775, "loss": 0.0745, "step": 28090 }, { "epoch": 0.18, "learning_rate": 0.0002727953942570206, "loss": 0.0773, "step": 28100 }, { "epoch": 0.18, "learning_rate": 0.00027278571290266366, "loss": 0.0875, "step": 28110 }, { "epoch": 0.18, "learning_rate": 0.00027277603154830674, "loss": 0.0791, "step": 28120 }, { "epoch": 0.18, "learning_rate": 0.00027276635019394976, "loss": 0.0788, "step": 28130 }, { "epoch": 0.18, "learning_rate": 0.00027275666883959284, "loss": 0.0736, "step": 28140 }, { "epoch": 0.18, "learning_rate": 0.0002727469874852359, "loss": 0.0827, "step": 28150 }, { "epoch": 0.18, "learning_rate": 0.00027273730613087895, "loss": 0.0776, "step": 28160 }, { "epoch": 0.18, "learning_rate": 0.00027272762477652203, "loss": 0.075, "step": 28170 }, { "epoch": 0.18, "learning_rate": 0.0002727179434221651, "loss": 0.0919, "step": 28180 }, { "epoch": 0.18, "learning_rate": 0.0002727082620678082, "loss": 0.0821, "step": 28190 }, { "epoch": 0.18, "learning_rate": 0.00027269858071345127, "loss": 0.0789, "step": 28200 }, { "epoch": 0.18, "learning_rate": 0.0002726888993590943, "loss": 0.0772, "step": 28210 }, { "epoch": 0.18, "learning_rate": 0.0002726792180047374, "loss": 0.0771, "step": 28220 }, { "epoch": 0.18, "learning_rate": 0.00027266953665038045, "loss": 0.0711, "step": 28230 }, { "epoch": 0.18, "learning_rate": 0.00027265985529602353, "loss": 0.0816, "step": 28240 }, { "epoch": 0.18, "learning_rate": 0.0002726501739416666, "loss": 0.0687, "step": 28250 }, { "epoch": 0.18, "learning_rate": 0.0002726404925873097, "loss": 0.0809, "step": 28260 }, { "epoch": 0.18, "learning_rate": 0.0002726308112329527, "loss": 0.0729, "step": 28270 }, { "epoch": 0.18, "learning_rate": 0.0002726211298785958, "loss": 0.0775, "step": 28280 }, { "epoch": 0.18, "learning_rate": 0.0002726114485242389, "loss": 0.0865, "step": 28290 }, { "epoch": 0.18, "learning_rate": 0.0002726017671698819, "loss": 0.0814, "step": 28300 }, { "epoch": 0.18, "learning_rate": 0.000272592085815525, "loss": 0.0798, "step": 28310 }, { "epoch": 0.18, "learning_rate": 0.00027258240446116806, "loss": 0.0732, "step": 28320 }, { "epoch": 0.18, "learning_rate": 0.00027257272310681114, "loss": 0.0769, "step": 28330 }, { "epoch": 0.18, "learning_rate": 0.0002725630417524542, "loss": 0.0745, "step": 28340 }, { "epoch": 0.18, "learning_rate": 0.00027255336039809725, "loss": 0.0775, "step": 28350 }, { "epoch": 0.18, "learning_rate": 0.00027254367904374033, "loss": 0.0753, "step": 28360 }, { "epoch": 0.18, "learning_rate": 0.0002725339976893834, "loss": 0.0876, "step": 28370 }, { "epoch": 0.18, "learning_rate": 0.0002725243163350265, "loss": 0.08, "step": 28380 }, { "epoch": 0.18, "learning_rate": 0.00027251463498066957, "loss": 0.068, "step": 28390 }, { "epoch": 0.18, "learning_rate": 0.0002725049536263126, "loss": 0.0776, "step": 28400 }, { "epoch": 0.18, "learning_rate": 0.00027249527227195567, "loss": 0.0744, "step": 28410 }, { "epoch": 0.18, "learning_rate": 0.00027248559091759875, "loss": 0.0809, "step": 28420 }, { "epoch": 0.18, "learning_rate": 0.0002724759095632418, "loss": 0.083, "step": 28430 }, { "epoch": 0.18, "learning_rate": 0.00027246622820888486, "loss": 0.0825, "step": 28440 }, { "epoch": 0.18, "learning_rate": 0.00027245654685452794, "loss": 0.0816, "step": 28450 }, { "epoch": 0.18, "learning_rate": 0.000272446865500171, "loss": 0.0747, "step": 28460 }, { "epoch": 0.18, "learning_rate": 0.0002724371841458141, "loss": 0.0783, "step": 28470 }, { "epoch": 0.18, "learning_rate": 0.0002724275027914572, "loss": 0.0781, "step": 28480 }, { "epoch": 0.18, "learning_rate": 0.0002724178214371002, "loss": 0.0797, "step": 28490 }, { "epoch": 0.18, "learning_rate": 0.0002724081400827433, "loss": 0.0757, "step": 28500 }, { "epoch": 0.18, "learning_rate": 0.00027239845872838636, "loss": 0.0729, "step": 28510 }, { "epoch": 0.18, "learning_rate": 0.00027238877737402944, "loss": 0.0818, "step": 28520 }, { "epoch": 0.18, "learning_rate": 0.00027237909601967247, "loss": 0.0791, "step": 28530 }, { "epoch": 0.18, "learning_rate": 0.00027236941466531555, "loss": 0.0792, "step": 28540 }, { "epoch": 0.18, "learning_rate": 0.0002723597333109586, "loss": 0.0747, "step": 28550 }, { "epoch": 0.18, "learning_rate": 0.00027235005195660165, "loss": 0.077, "step": 28560 }, { "epoch": 0.18, "learning_rate": 0.00027234037060224473, "loss": 0.0883, "step": 28570 }, { "epoch": 0.18, "learning_rate": 0.0002723306892478878, "loss": 0.0691, "step": 28580 }, { "epoch": 0.18, "learning_rate": 0.0002723210078935309, "loss": 0.0784, "step": 28590 }, { "epoch": 0.18, "learning_rate": 0.00027231132653917397, "loss": 0.0868, "step": 28600 }, { "epoch": 0.18, "learning_rate": 0.00027230164518481705, "loss": 0.0763, "step": 28610 }, { "epoch": 0.18, "learning_rate": 0.00027229196383046013, "loss": 0.0785, "step": 28620 }, { "epoch": 0.18, "learning_rate": 0.00027228228247610316, "loss": 0.072, "step": 28630 }, { "epoch": 0.18, "learning_rate": 0.00027227260112174624, "loss": 0.0868, "step": 28640 }, { "epoch": 0.18, "learning_rate": 0.0002722629197673893, "loss": 0.0797, "step": 28650 }, { "epoch": 0.18, "learning_rate": 0.0002722532384130324, "loss": 0.0797, "step": 28660 }, { "epoch": 0.19, "learning_rate": 0.0002722435570586754, "loss": 0.0763, "step": 28670 }, { "epoch": 0.19, "learning_rate": 0.0002722338757043185, "loss": 0.0912, "step": 28680 }, { "epoch": 0.19, "learning_rate": 0.0002722241943499616, "loss": 0.078, "step": 28690 }, { "epoch": 0.19, "learning_rate": 0.0002722145129956046, "loss": 0.0954, "step": 28700 }, { "epoch": 0.19, "learning_rate": 0.0002722048316412477, "loss": 0.0721, "step": 28710 }, { "epoch": 0.19, "learning_rate": 0.00027219515028689077, "loss": 0.0746, "step": 28720 }, { "epoch": 0.19, "learning_rate": 0.00027218546893253385, "loss": 0.0763, "step": 28730 }, { "epoch": 0.19, "learning_rate": 0.0002721757875781769, "loss": 0.0749, "step": 28740 }, { "epoch": 0.19, "learning_rate": 0.00027216610622382, "loss": 0.0769, "step": 28750 }, { "epoch": 0.19, "learning_rate": 0.0002721564248694631, "loss": 0.076, "step": 28760 }, { "epoch": 0.19, "learning_rate": 0.0002721467435151061, "loss": 0.0794, "step": 28770 }, { "epoch": 0.19, "learning_rate": 0.0002721370621607492, "loss": 0.0742, "step": 28780 }, { "epoch": 0.19, "learning_rate": 0.00027212738080639227, "loss": 0.0766, "step": 28790 }, { "epoch": 0.19, "learning_rate": 0.0002721176994520353, "loss": 0.0746, "step": 28800 }, { "epoch": 0.19, "learning_rate": 0.0002721080180976784, "loss": 0.078, "step": 28810 }, { "epoch": 0.19, "learning_rate": 0.00027209833674332146, "loss": 0.0838, "step": 28820 }, { "epoch": 0.19, "learning_rate": 0.00027208865538896454, "loss": 0.076, "step": 28830 }, { "epoch": 0.19, "learning_rate": 0.00027207897403460756, "loss": 0.0832, "step": 28840 }, { "epoch": 0.19, "learning_rate": 0.00027206929268025064, "loss": 0.0815, "step": 28850 }, { "epoch": 0.19, "learning_rate": 0.0002720596113258937, "loss": 0.0901, "step": 28860 }, { "epoch": 0.19, "learning_rate": 0.0002720499299715368, "loss": 0.0766, "step": 28870 }, { "epoch": 0.19, "learning_rate": 0.0002720402486171799, "loss": 0.0735, "step": 28880 }, { "epoch": 0.19, "learning_rate": 0.00027203056726282296, "loss": 0.0751, "step": 28890 }, { "epoch": 0.19, "learning_rate": 0.00027202088590846604, "loss": 0.0845, "step": 28900 }, { "epoch": 0.19, "learning_rate": 0.00027201120455410907, "loss": 0.0843, "step": 28910 }, { "epoch": 0.19, "learning_rate": 0.00027200152319975215, "loss": 0.0805, "step": 28920 }, { "epoch": 0.19, "learning_rate": 0.00027199184184539517, "loss": 0.0756, "step": 28930 }, { "epoch": 0.19, "learning_rate": 0.00027198216049103825, "loss": 0.0776, "step": 28940 }, { "epoch": 0.19, "learning_rate": 0.00027197247913668133, "loss": 0.0888, "step": 28950 }, { "epoch": 0.19, "learning_rate": 0.0002719627977823244, "loss": 0.0812, "step": 28960 }, { "epoch": 0.19, "learning_rate": 0.0002719531164279675, "loss": 0.0766, "step": 28970 }, { "epoch": 0.19, "learning_rate": 0.0002719434350736105, "loss": 0.0796, "step": 28980 }, { "epoch": 0.19, "learning_rate": 0.0002719337537192536, "loss": 0.0813, "step": 28990 }, { "epoch": 0.19, "learning_rate": 0.0002719240723648967, "loss": 0.0809, "step": 29000 }, { "epoch": 0.19, "eval_cer": 0.9201111738786578, "eval_loss": 0.052740730345249176, "eval_runtime": 120.2847, "eval_samples_per_second": 16.627, "eval_steps_per_second": 4.157, "step": 29000 }, { "epoch": 0.19, "learning_rate": 0.00027191439101053975, "loss": 0.0852, "step": 29010 }, { "epoch": 0.19, "learning_rate": 0.00027190470965618283, "loss": 0.075, "step": 29020 }, { "epoch": 0.19, "learning_rate": 0.0002718950283018259, "loss": 0.0823, "step": 29030 }, { "epoch": 0.19, "learning_rate": 0.00027188534694746894, "loss": 0.0825, "step": 29040 }, { "epoch": 0.19, "learning_rate": 0.000271875665593112, "loss": 0.0711, "step": 29050 }, { "epoch": 0.19, "learning_rate": 0.0002718659842387551, "loss": 0.0705, "step": 29060 }, { "epoch": 0.19, "learning_rate": 0.0002718563028843981, "loss": 0.0979, "step": 29070 }, { "epoch": 0.19, "learning_rate": 0.0002718466215300412, "loss": 0.0734, "step": 29080 }, { "epoch": 0.19, "learning_rate": 0.0002718369401756843, "loss": 0.0762, "step": 29090 }, { "epoch": 0.19, "learning_rate": 0.00027182725882132736, "loss": 0.0731, "step": 29100 }, { "epoch": 0.19, "learning_rate": 0.00027181757746697044, "loss": 0.0786, "step": 29110 }, { "epoch": 0.19, "learning_rate": 0.00027180789611261347, "loss": 0.0737, "step": 29120 }, { "epoch": 0.19, "learning_rate": 0.00027179821475825655, "loss": 0.0719, "step": 29130 }, { "epoch": 0.19, "learning_rate": 0.00027178853340389963, "loss": 0.0713, "step": 29140 }, { "epoch": 0.19, "learning_rate": 0.0002717788520495427, "loss": 0.0765, "step": 29150 }, { "epoch": 0.19, "learning_rate": 0.0002717691706951858, "loss": 0.0749, "step": 29160 }, { "epoch": 0.19, "learning_rate": 0.0002717594893408288, "loss": 0.0789, "step": 29170 }, { "epoch": 0.19, "learning_rate": 0.0002717498079864719, "loss": 0.0747, "step": 29180 }, { "epoch": 0.19, "learning_rate": 0.000271740126632115, "loss": 0.0769, "step": 29190 }, { "epoch": 0.19, "learning_rate": 0.000271730445277758, "loss": 0.0768, "step": 29200 }, { "epoch": 0.19, "learning_rate": 0.0002717207639234011, "loss": 0.0799, "step": 29210 }, { "epoch": 0.19, "learning_rate": 0.00027171108256904416, "loss": 0.0719, "step": 29220 }, { "epoch": 0.19, "learning_rate": 0.00027170140121468724, "loss": 0.0848, "step": 29230 }, { "epoch": 0.19, "learning_rate": 0.0002716917198603303, "loss": 0.0782, "step": 29240 }, { "epoch": 0.19, "learning_rate": 0.0002716820385059734, "loss": 0.0922, "step": 29250 }, { "epoch": 0.19, "learning_rate": 0.0002716723571516164, "loss": 0.0744, "step": 29260 }, { "epoch": 0.19, "learning_rate": 0.0002716626757972595, "loss": 0.0815, "step": 29270 }, { "epoch": 0.19, "learning_rate": 0.0002716529944429026, "loss": 0.0841, "step": 29280 }, { "epoch": 0.19, "learning_rate": 0.00027164331308854566, "loss": 0.0812, "step": 29290 }, { "epoch": 0.19, "learning_rate": 0.00027163363173418874, "loss": 0.0699, "step": 29300 }, { "epoch": 0.19, "learning_rate": 0.00027162395037983177, "loss": 0.0743, "step": 29310 }, { "epoch": 0.19, "learning_rate": 0.00027161426902547485, "loss": 0.0787, "step": 29320 }, { "epoch": 0.19, "learning_rate": 0.0002716045876711179, "loss": 0.0727, "step": 29330 }, { "epoch": 0.19, "learning_rate": 0.00027159490631676095, "loss": 0.0782, "step": 29340 }, { "epoch": 0.19, "learning_rate": 0.00027158522496240403, "loss": 0.0759, "step": 29350 }, { "epoch": 0.19, "learning_rate": 0.0002715755436080471, "loss": 0.0752, "step": 29360 }, { "epoch": 0.19, "learning_rate": 0.0002715658622536902, "loss": 0.078, "step": 29370 }, { "epoch": 0.19, "learning_rate": 0.0002715561808993333, "loss": 0.0759, "step": 29380 }, { "epoch": 0.19, "learning_rate": 0.00027154649954497635, "loss": 0.0761, "step": 29390 }, { "epoch": 0.19, "learning_rate": 0.0002715368181906194, "loss": 0.075, "step": 29400 }, { "epoch": 0.19, "learning_rate": 0.00027152713683626246, "loss": 0.0936, "step": 29410 }, { "epoch": 0.19, "learning_rate": 0.00027151745548190554, "loss": 0.0746, "step": 29420 }, { "epoch": 0.19, "learning_rate": 0.0002715077741275486, "loss": 0.0789, "step": 29430 }, { "epoch": 0.19, "learning_rate": 0.00027149809277319164, "loss": 0.08, "step": 29440 }, { "epoch": 0.19, "learning_rate": 0.0002714884114188347, "loss": 0.0837, "step": 29450 }, { "epoch": 0.19, "learning_rate": 0.0002714787300644778, "loss": 0.0749, "step": 29460 }, { "epoch": 0.19, "learning_rate": 0.00027146904871012083, "loss": 0.0818, "step": 29470 }, { "epoch": 0.19, "learning_rate": 0.0002714593673557639, "loss": 0.0722, "step": 29480 }, { "epoch": 0.19, "learning_rate": 0.000271449686001407, "loss": 0.0967, "step": 29490 }, { "epoch": 0.19, "learning_rate": 0.00027144000464705007, "loss": 0.0828, "step": 29500 }, { "epoch": 0.19, "learning_rate": 0.00027143032329269315, "loss": 0.0768, "step": 29510 }, { "epoch": 0.19, "learning_rate": 0.00027142064193833623, "loss": 0.0781, "step": 29520 }, { "epoch": 0.19, "learning_rate": 0.0002714109605839793, "loss": 0.0662, "step": 29530 }, { "epoch": 0.19, "learning_rate": 0.00027140127922962233, "loss": 0.069, "step": 29540 }, { "epoch": 0.19, "learning_rate": 0.0002713915978752654, "loss": 0.0932, "step": 29550 }, { "epoch": 0.19, "learning_rate": 0.0002713819165209085, "loss": 0.0911, "step": 29560 }, { "epoch": 0.19, "learning_rate": 0.0002713722351665515, "loss": 0.0965, "step": 29570 }, { "epoch": 0.19, "learning_rate": 0.0002713625538121946, "loss": 0.0692, "step": 29580 }, { "epoch": 0.19, "learning_rate": 0.0002713528724578377, "loss": 0.0808, "step": 29590 }, { "epoch": 0.19, "learning_rate": 0.00027134319110348076, "loss": 0.0854, "step": 29600 }, { "epoch": 0.19, "learning_rate": 0.0002713335097491238, "loss": 0.0773, "step": 29610 }, { "epoch": 0.19, "learning_rate": 0.00027132382839476686, "loss": 0.0854, "step": 29620 }, { "epoch": 0.19, "learning_rate": 0.00027131414704040994, "loss": 0.0898, "step": 29630 }, { "epoch": 0.19, "learning_rate": 0.000271304465686053, "loss": 0.0866, "step": 29640 }, { "epoch": 0.19, "learning_rate": 0.0002712947843316961, "loss": 0.0827, "step": 29650 }, { "epoch": 0.19, "learning_rate": 0.0002712851029773392, "loss": 0.0718, "step": 29660 }, { "epoch": 0.19, "learning_rate": 0.00027127542162298226, "loss": 0.0798, "step": 29670 }, { "epoch": 0.19, "learning_rate": 0.0002712657402686253, "loss": 0.0828, "step": 29680 }, { "epoch": 0.19, "learning_rate": 0.00027125605891426837, "loss": 0.0723, "step": 29690 }, { "epoch": 0.19, "learning_rate": 0.00027124637755991145, "loss": 0.0764, "step": 29700 }, { "epoch": 0.19, "learning_rate": 0.0002712366962055545, "loss": 0.0803, "step": 29710 }, { "epoch": 0.19, "learning_rate": 0.00027122701485119755, "loss": 0.0694, "step": 29720 }, { "epoch": 0.19, "learning_rate": 0.00027121733349684063, "loss": 0.0819, "step": 29730 }, { "epoch": 0.19, "learning_rate": 0.0002712076521424837, "loss": 0.0692, "step": 29740 }, { "epoch": 0.19, "learning_rate": 0.00027119797078812674, "loss": 0.0838, "step": 29750 }, { "epoch": 0.19, "learning_rate": 0.0002711882894337698, "loss": 0.078, "step": 29760 }, { "epoch": 0.19, "learning_rate": 0.0002711786080794129, "loss": 0.0891, "step": 29770 }, { "epoch": 0.19, "learning_rate": 0.000271168926725056, "loss": 0.0801, "step": 29780 }, { "epoch": 0.19, "learning_rate": 0.00027115924537069906, "loss": 0.0661, "step": 29790 }, { "epoch": 0.19, "learning_rate": 0.00027114956401634214, "loss": 0.0785, "step": 29800 }, { "epoch": 0.19, "learning_rate": 0.00027113988266198516, "loss": 0.078, "step": 29810 }, { "epoch": 0.19, "learning_rate": 0.00027113020130762824, "loss": 0.0828, "step": 29820 }, { "epoch": 0.19, "learning_rate": 0.0002711205199532713, "loss": 0.0862, "step": 29830 }, { "epoch": 0.19, "learning_rate": 0.00027111083859891435, "loss": 0.0788, "step": 29840 }, { "epoch": 0.19, "learning_rate": 0.00027110115724455743, "loss": 0.0786, "step": 29850 }, { "epoch": 0.19, "learning_rate": 0.0002710914758902005, "loss": 0.0845, "step": 29860 }, { "epoch": 0.19, "learning_rate": 0.0002710817945358436, "loss": 0.08, "step": 29870 }, { "epoch": 0.19, "learning_rate": 0.00027107211318148667, "loss": 0.0781, "step": 29880 }, { "epoch": 0.19, "learning_rate": 0.0002710624318271297, "loss": 0.0749, "step": 29890 }, { "epoch": 0.19, "learning_rate": 0.00027105275047277277, "loss": 0.0724, "step": 29900 }, { "epoch": 0.19, "learning_rate": 0.00027104306911841585, "loss": 0.0787, "step": 29910 }, { "epoch": 0.19, "learning_rate": 0.00027103338776405893, "loss": 0.0781, "step": 29920 }, { "epoch": 0.19, "learning_rate": 0.000271023706409702, "loss": 0.0641, "step": 29930 }, { "epoch": 0.19, "learning_rate": 0.00027101402505534504, "loss": 0.078, "step": 29940 }, { "epoch": 0.19, "learning_rate": 0.0002710043437009881, "loss": 0.0766, "step": 29950 }, { "epoch": 0.19, "learning_rate": 0.0002709946623466312, "loss": 0.0772, "step": 29960 }, { "epoch": 0.19, "learning_rate": 0.0002709849809922742, "loss": 0.0844, "step": 29970 }, { "epoch": 0.19, "learning_rate": 0.0002709752996379173, "loss": 0.0789, "step": 29980 }, { "epoch": 0.19, "learning_rate": 0.0002709656182835604, "loss": 0.0768, "step": 29990 }, { "epoch": 0.19, "learning_rate": 0.00027095593692920346, "loss": 0.0812, "step": 30000 }, { "epoch": 0.19, "eval_cer": 0.9201635973336346, "eval_loss": 0.05120238661766052, "eval_runtime": 120.611, "eval_samples_per_second": 16.582, "eval_steps_per_second": 4.146, "step": 30000 }, { "epoch": 0.19, "learning_rate": 0.00027094625557484654, "loss": 0.0775, "step": 30010 }, { "epoch": 0.19, "learning_rate": 0.0002709365742204896, "loss": 0.0779, "step": 30020 }, { "epoch": 0.19, "learning_rate": 0.00027092689286613265, "loss": 0.0775, "step": 30030 }, { "epoch": 0.19, "learning_rate": 0.0002709172115117757, "loss": 0.0758, "step": 30040 }, { "epoch": 0.19, "learning_rate": 0.0002709075301574188, "loss": 0.0762, "step": 30050 }, { "epoch": 0.19, "learning_rate": 0.0002708978488030619, "loss": 0.0794, "step": 30060 }, { "epoch": 0.19, "learning_rate": 0.00027088816744870497, "loss": 0.0754, "step": 30070 }, { "epoch": 0.19, "learning_rate": 0.000270878486094348, "loss": 0.0857, "step": 30080 }, { "epoch": 0.19, "learning_rate": 0.00027086880473999107, "loss": 0.0786, "step": 30090 }, { "epoch": 0.19, "learning_rate": 0.00027085912338563415, "loss": 0.0852, "step": 30100 }, { "epoch": 0.19, "learning_rate": 0.0002708494420312772, "loss": 0.0752, "step": 30110 }, { "epoch": 0.19, "learning_rate": 0.00027083976067692026, "loss": 0.0765, "step": 30120 }, { "epoch": 0.19, "learning_rate": 0.00027083007932256334, "loss": 0.0788, "step": 30130 }, { "epoch": 0.19, "learning_rate": 0.0002708203979682064, "loss": 0.0797, "step": 30140 }, { "epoch": 0.19, "learning_rate": 0.0002708107166138495, "loss": 0.0805, "step": 30150 }, { "epoch": 0.19, "learning_rate": 0.0002708010352594926, "loss": 0.0762, "step": 30160 }, { "epoch": 0.19, "learning_rate": 0.0002707913539051356, "loss": 0.0949, "step": 30170 }, { "epoch": 0.19, "learning_rate": 0.0002707816725507787, "loss": 0.072, "step": 30180 }, { "epoch": 0.19, "learning_rate": 0.00027077199119642176, "loss": 0.0832, "step": 30190 }, { "epoch": 0.19, "learning_rate": 0.00027076230984206484, "loss": 0.0739, "step": 30200 }, { "epoch": 0.19, "learning_rate": 0.00027075262848770787, "loss": 0.0813, "step": 30210 }, { "epoch": 0.2, "learning_rate": 0.00027074294713335095, "loss": 0.073, "step": 30220 }, { "epoch": 0.2, "learning_rate": 0.000270733265778994, "loss": 0.0803, "step": 30230 }, { "epoch": 0.2, "learning_rate": 0.00027072358442463705, "loss": 0.0842, "step": 30240 }, { "epoch": 0.2, "learning_rate": 0.00027071390307028013, "loss": 0.0733, "step": 30250 }, { "epoch": 0.2, "learning_rate": 0.0002707042217159232, "loss": 0.0725, "step": 30260 }, { "epoch": 0.2, "learning_rate": 0.0002706945403615663, "loss": 0.0818, "step": 30270 }, { "epoch": 0.2, "learning_rate": 0.00027068485900720937, "loss": 0.0822, "step": 30280 }, { "epoch": 0.2, "learning_rate": 0.00027067517765285245, "loss": 0.0755, "step": 30290 }, { "epoch": 0.2, "learning_rate": 0.00027066549629849553, "loss": 0.0827, "step": 30300 }, { "epoch": 0.2, "learning_rate": 0.00027065581494413856, "loss": 0.0838, "step": 30310 }, { "epoch": 0.2, "learning_rate": 0.00027064613358978164, "loss": 0.0719, "step": 30320 }, { "epoch": 0.2, "learning_rate": 0.0002706364522354247, "loss": 0.0728, "step": 30330 }, { "epoch": 0.2, "learning_rate": 0.00027062677088106774, "loss": 0.0828, "step": 30340 }, { "epoch": 0.2, "learning_rate": 0.0002706170895267108, "loss": 0.0753, "step": 30350 }, { "epoch": 0.2, "learning_rate": 0.0002706074081723539, "loss": 0.0753, "step": 30360 }, { "epoch": 0.2, "learning_rate": 0.000270597726817997, "loss": 0.0805, "step": 30370 }, { "epoch": 0.2, "learning_rate": 0.00027058804546364, "loss": 0.073, "step": 30380 }, { "epoch": 0.2, "learning_rate": 0.0002705783641092831, "loss": 0.0786, "step": 30390 }, { "epoch": 0.2, "learning_rate": 0.00027056868275492617, "loss": 0.0745, "step": 30400 }, { "epoch": 0.2, "learning_rate": 0.00027055900140056925, "loss": 0.0754, "step": 30410 }, { "epoch": 0.2, "learning_rate": 0.0002705493200462123, "loss": 0.0796, "step": 30420 }, { "epoch": 0.2, "learning_rate": 0.0002705396386918554, "loss": 0.0663, "step": 30430 }, { "epoch": 0.2, "learning_rate": 0.0002705299573374985, "loss": 0.0719, "step": 30440 }, { "epoch": 0.2, "learning_rate": 0.0002705202759831415, "loss": 0.0815, "step": 30450 }, { "epoch": 0.2, "learning_rate": 0.0002705105946287846, "loss": 0.0752, "step": 30460 }, { "epoch": 0.2, "learning_rate": 0.00027050091327442767, "loss": 0.0749, "step": 30470 }, { "epoch": 0.2, "learning_rate": 0.0002704912319200707, "loss": 0.0841, "step": 30480 }, { "epoch": 0.2, "learning_rate": 0.0002704815505657138, "loss": 0.0752, "step": 30490 }, { "epoch": 0.2, "learning_rate": 0.00027047186921135685, "loss": 0.0717, "step": 30500 }, { "epoch": 0.2, "learning_rate": 0.00027046218785699993, "loss": 0.0782, "step": 30510 }, { "epoch": 0.2, "learning_rate": 0.00027045250650264296, "loss": 0.0807, "step": 30520 }, { "epoch": 0.2, "learning_rate": 0.00027044282514828604, "loss": 0.0801, "step": 30530 }, { "epoch": 0.2, "learning_rate": 0.0002704331437939291, "loss": 0.073, "step": 30540 }, { "epoch": 0.2, "learning_rate": 0.0002704234624395722, "loss": 0.0749, "step": 30550 }, { "epoch": 0.2, "learning_rate": 0.0002704137810852153, "loss": 0.0749, "step": 30560 }, { "epoch": 0.2, "learning_rate": 0.00027040409973085836, "loss": 0.0975, "step": 30570 }, { "epoch": 0.2, "learning_rate": 0.0002703944183765014, "loss": 0.0806, "step": 30580 }, { "epoch": 0.2, "learning_rate": 0.00027038473702214446, "loss": 0.0846, "step": 30590 }, { "epoch": 0.2, "learning_rate": 0.00027037505566778754, "loss": 0.0839, "step": 30600 }, { "epoch": 0.2, "learning_rate": 0.00027036537431343057, "loss": 0.0798, "step": 30610 }, { "epoch": 0.2, "learning_rate": 0.00027035569295907365, "loss": 0.0803, "step": 30620 }, { "epoch": 0.2, "learning_rate": 0.00027034601160471673, "loss": 0.0735, "step": 30630 }, { "epoch": 0.2, "learning_rate": 0.0002703363302503598, "loss": 0.0717, "step": 30640 }, { "epoch": 0.2, "learning_rate": 0.0002703266488960029, "loss": 0.0808, "step": 30650 }, { "epoch": 0.2, "learning_rate": 0.0002703169675416459, "loss": 0.0811, "step": 30660 }, { "epoch": 0.2, "learning_rate": 0.000270307286187289, "loss": 0.0691, "step": 30670 }, { "epoch": 0.2, "learning_rate": 0.0002702976048329321, "loss": 0.0806, "step": 30680 }, { "epoch": 0.2, "learning_rate": 0.00027028792347857515, "loss": 0.0679, "step": 30690 }, { "epoch": 0.2, "learning_rate": 0.00027027824212421823, "loss": 0.0915, "step": 30700 }, { "epoch": 0.2, "learning_rate": 0.00027026856076986126, "loss": 0.078, "step": 30710 }, { "epoch": 0.2, "learning_rate": 0.00027025887941550434, "loss": 0.0737, "step": 30720 }, { "epoch": 0.2, "learning_rate": 0.0002702491980611474, "loss": 0.0758, "step": 30730 }, { "epoch": 0.2, "learning_rate": 0.00027023951670679044, "loss": 0.0794, "step": 30740 }, { "epoch": 0.2, "learning_rate": 0.0002702298353524335, "loss": 0.0793, "step": 30750 }, { "epoch": 0.2, "learning_rate": 0.0002702201539980766, "loss": 0.0714, "step": 30760 }, { "epoch": 0.2, "learning_rate": 0.0002702104726437197, "loss": 0.0713, "step": 30770 }, { "epoch": 0.2, "learning_rate": 0.00027020079128936276, "loss": 0.0775, "step": 30780 }, { "epoch": 0.2, "learning_rate": 0.00027019110993500584, "loss": 0.08, "step": 30790 }, { "epoch": 0.2, "learning_rate": 0.00027018142858064887, "loss": 0.0834, "step": 30800 }, { "epoch": 0.2, "learning_rate": 0.00027017174722629195, "loss": 0.0773, "step": 30810 }, { "epoch": 0.2, "learning_rate": 0.00027016206587193503, "loss": 0.0796, "step": 30820 }, { "epoch": 0.2, "learning_rate": 0.0002701523845175781, "loss": 0.0908, "step": 30830 }, { "epoch": 0.2, "learning_rate": 0.0002701427031632212, "loss": 0.0775, "step": 30840 }, { "epoch": 0.2, "learning_rate": 0.0002701330218088642, "loss": 0.0743, "step": 30850 }, { "epoch": 0.2, "learning_rate": 0.0002701233404545073, "loss": 0.0795, "step": 30860 }, { "epoch": 0.2, "learning_rate": 0.0002701136591001504, "loss": 0.0799, "step": 30870 }, { "epoch": 0.2, "learning_rate": 0.0002701039777457934, "loss": 0.0793, "step": 30880 }, { "epoch": 0.2, "learning_rate": 0.0002700942963914365, "loss": 0.0777, "step": 30890 }, { "epoch": 0.2, "learning_rate": 0.00027008461503707956, "loss": 0.0707, "step": 30900 }, { "epoch": 0.2, "learning_rate": 0.00027007493368272264, "loss": 0.0761, "step": 30910 }, { "epoch": 0.2, "learning_rate": 0.0002700652523283657, "loss": 0.0801, "step": 30920 }, { "epoch": 0.2, "learning_rate": 0.0002700555709740088, "loss": 0.0653, "step": 30930 }, { "epoch": 0.2, "learning_rate": 0.0002700458896196518, "loss": 0.0706, "step": 30940 }, { "epoch": 0.2, "learning_rate": 0.0002700362082652949, "loss": 0.0777, "step": 30950 }, { "epoch": 0.2, "learning_rate": 0.000270026526910938, "loss": 0.0797, "step": 30960 }, { "epoch": 0.2, "learning_rate": 0.00027001684555658106, "loss": 0.0737, "step": 30970 }, { "epoch": 0.2, "learning_rate": 0.0002700071642022241, "loss": 0.0671, "step": 30980 }, { "epoch": 0.2, "learning_rate": 0.00026999748284786717, "loss": 0.0789, "step": 30990 }, { "epoch": 0.2, "learning_rate": 0.00026998780149351025, "loss": 0.0741, "step": 31000 }, { "epoch": 0.2, "eval_cer": 0.9201446164275223, "eval_loss": 0.05069497600197792, "eval_runtime": 120.4325, "eval_samples_per_second": 16.607, "eval_steps_per_second": 4.152, "step": 31000 }, { "epoch": 0.2, "learning_rate": 0.0002699781201391533, "loss": 0.0733, "step": 31010 }, { "epoch": 0.2, "learning_rate": 0.00026996843878479635, "loss": 0.07, "step": 31020 }, { "epoch": 0.2, "learning_rate": 0.00026995875743043943, "loss": 0.0665, "step": 31030 }, { "epoch": 0.2, "learning_rate": 0.0002699490760760825, "loss": 0.0767, "step": 31040 }, { "epoch": 0.2, "learning_rate": 0.0002699393947217256, "loss": 0.0745, "step": 31050 }, { "epoch": 0.2, "learning_rate": 0.00026992971336736867, "loss": 0.0752, "step": 31060 }, { "epoch": 0.2, "learning_rate": 0.0002699200320130117, "loss": 0.0675, "step": 31070 }, { "epoch": 0.2, "learning_rate": 0.0002699103506586548, "loss": 0.0761, "step": 31080 }, { "epoch": 0.2, "learning_rate": 0.00026990066930429786, "loss": 0.0768, "step": 31090 }, { "epoch": 0.2, "learning_rate": 0.00026989098794994094, "loss": 0.0741, "step": 31100 }, { "epoch": 0.2, "learning_rate": 0.00026988130659558396, "loss": 0.0683, "step": 31110 }, { "epoch": 0.2, "learning_rate": 0.00026987162524122704, "loss": 0.0705, "step": 31120 }, { "epoch": 0.2, "learning_rate": 0.0002698619438868701, "loss": 0.08, "step": 31130 }, { "epoch": 0.2, "learning_rate": 0.00026985226253251315, "loss": 0.0717, "step": 31140 }, { "epoch": 0.2, "learning_rate": 0.00026984258117815623, "loss": 0.0788, "step": 31150 }, { "epoch": 0.2, "learning_rate": 0.0002698328998237993, "loss": 0.0708, "step": 31160 }, { "epoch": 0.2, "learning_rate": 0.0002698232184694424, "loss": 0.0685, "step": 31170 }, { "epoch": 0.2, "learning_rate": 0.00026981353711508547, "loss": 0.075, "step": 31180 }, { "epoch": 0.2, "learning_rate": 0.00026980385576072855, "loss": 0.0695, "step": 31190 }, { "epoch": 0.2, "learning_rate": 0.00026979417440637163, "loss": 0.0659, "step": 31200 }, { "epoch": 0.2, "learning_rate": 0.00026978449305201465, "loss": 0.0763, "step": 31210 }, { "epoch": 0.2, "learning_rate": 0.00026977481169765773, "loss": 0.0822, "step": 31220 }, { "epoch": 0.2, "learning_rate": 0.0002697651303433008, "loss": 0.0754, "step": 31230 }, { "epoch": 0.2, "learning_rate": 0.0002697554489889439, "loss": 0.0788, "step": 31240 }, { "epoch": 0.2, "learning_rate": 0.0002697457676345869, "loss": 0.0839, "step": 31250 }, { "epoch": 0.2, "learning_rate": 0.00026973608628023, "loss": 0.085, "step": 31260 }, { "epoch": 0.2, "learning_rate": 0.0002697264049258731, "loss": 0.0769, "step": 31270 }, { "epoch": 0.2, "learning_rate": 0.0002697167235715161, "loss": 0.0691, "step": 31280 }, { "epoch": 0.2, "learning_rate": 0.0002697070422171592, "loss": 0.0798, "step": 31290 }, { "epoch": 0.2, "learning_rate": 0.00026969736086280226, "loss": 0.0861, "step": 31300 }, { "epoch": 0.2, "learning_rate": 0.00026968767950844534, "loss": 0.0684, "step": 31310 }, { "epoch": 0.2, "learning_rate": 0.0002696779981540884, "loss": 0.0747, "step": 31320 }, { "epoch": 0.2, "learning_rate": 0.0002696683167997315, "loss": 0.0752, "step": 31330 }, { "epoch": 0.2, "learning_rate": 0.0002696586354453746, "loss": 0.0856, "step": 31340 }, { "epoch": 0.2, "learning_rate": 0.0002696489540910176, "loss": 0.0886, "step": 31350 }, { "epoch": 0.2, "learning_rate": 0.0002696392727366607, "loss": 0.0745, "step": 31360 }, { "epoch": 0.2, "learning_rate": 0.00026962959138230377, "loss": 0.0814, "step": 31370 }, { "epoch": 0.2, "learning_rate": 0.0002696199100279468, "loss": 0.0708, "step": 31380 }, { "epoch": 0.2, "learning_rate": 0.00026961022867358987, "loss": 0.0724, "step": 31390 }, { "epoch": 0.2, "learning_rate": 0.00026960054731923295, "loss": 0.0766, "step": 31400 }, { "epoch": 0.2, "learning_rate": 0.00026959086596487603, "loss": 0.0956, "step": 31410 }, { "epoch": 0.2, "learning_rate": 0.00026958118461051906, "loss": 0.0776, "step": 31420 }, { "epoch": 0.2, "learning_rate": 0.00026957150325616214, "loss": 0.0793, "step": 31430 }, { "epoch": 0.2, "learning_rate": 0.0002695618219018052, "loss": 0.0763, "step": 31440 }, { "epoch": 0.2, "learning_rate": 0.0002695521405474483, "loss": 0.0859, "step": 31450 }, { "epoch": 0.2, "learning_rate": 0.0002695424591930914, "loss": 0.0697, "step": 31460 }, { "epoch": 0.2, "learning_rate": 0.00026953277783873446, "loss": 0.0674, "step": 31470 }, { "epoch": 0.2, "learning_rate": 0.00026952309648437754, "loss": 0.0733, "step": 31480 }, { "epoch": 0.2, "learning_rate": 0.00026951341513002056, "loss": 0.0675, "step": 31490 }, { "epoch": 0.2, "learning_rate": 0.00026950373377566364, "loss": 0.0746, "step": 31500 }, { "epoch": 0.2, "learning_rate": 0.0002694940524213067, "loss": 0.0797, "step": 31510 }, { "epoch": 0.2, "learning_rate": 0.00026948437106694975, "loss": 0.0744, "step": 31520 }, { "epoch": 0.2, "learning_rate": 0.0002694746897125928, "loss": 0.0713, "step": 31530 }, { "epoch": 0.2, "learning_rate": 0.0002694650083582359, "loss": 0.0861, "step": 31540 }, { "epoch": 0.2, "learning_rate": 0.000269455327003879, "loss": 0.0789, "step": 31550 }, { "epoch": 0.2, "learning_rate": 0.000269445645649522, "loss": 0.0719, "step": 31560 }, { "epoch": 0.2, "learning_rate": 0.0002694359642951651, "loss": 0.0753, "step": 31570 }, { "epoch": 0.2, "learning_rate": 0.00026942628294080817, "loss": 0.0907, "step": 31580 }, { "epoch": 0.2, "learning_rate": 0.00026941660158645125, "loss": 0.0691, "step": 31590 }, { "epoch": 0.2, "learning_rate": 0.00026940692023209433, "loss": 0.0698, "step": 31600 }, { "epoch": 0.2, "learning_rate": 0.0002693972388777374, "loss": 0.0776, "step": 31610 }, { "epoch": 0.2, "learning_rate": 0.00026938755752338044, "loss": 0.0746, "step": 31620 }, { "epoch": 0.2, "learning_rate": 0.0002693778761690235, "loss": 0.0763, "step": 31630 }, { "epoch": 0.2, "learning_rate": 0.0002693681948146666, "loss": 0.0763, "step": 31640 }, { "epoch": 0.2, "learning_rate": 0.0002693585134603096, "loss": 0.0739, "step": 31650 }, { "epoch": 0.2, "learning_rate": 0.0002693488321059527, "loss": 0.0714, "step": 31660 }, { "epoch": 0.2, "learning_rate": 0.0002693391507515958, "loss": 0.0714, "step": 31670 }, { "epoch": 0.2, "learning_rate": 0.00026932946939723886, "loss": 0.0779, "step": 31680 }, { "epoch": 0.2, "learning_rate": 0.00026931978804288194, "loss": 0.0704, "step": 31690 }, { "epoch": 0.2, "learning_rate": 0.00026931010668852497, "loss": 0.0718, "step": 31700 }, { "epoch": 0.2, "learning_rate": 0.00026930042533416805, "loss": 0.0812, "step": 31710 }, { "epoch": 0.2, "learning_rate": 0.0002692907439798111, "loss": 0.0689, "step": 31720 }, { "epoch": 0.2, "learning_rate": 0.0002692810626254542, "loss": 0.0772, "step": 31730 }, { "epoch": 0.2, "learning_rate": 0.0002692713812710973, "loss": 0.0735, "step": 31740 }, { "epoch": 0.2, "learning_rate": 0.0002692616999167403, "loss": 0.078, "step": 31750 }, { "epoch": 0.2, "learning_rate": 0.0002692520185623834, "loss": 0.0779, "step": 31760 }, { "epoch": 0.21, "learning_rate": 0.00026924233720802647, "loss": 0.0795, "step": 31770 }, { "epoch": 0.21, "learning_rate": 0.0002692326558536695, "loss": 0.0859, "step": 31780 }, { "epoch": 0.21, "learning_rate": 0.0002692229744993126, "loss": 0.0771, "step": 31790 }, { "epoch": 0.21, "learning_rate": 0.00026921329314495566, "loss": 0.0815, "step": 31800 }, { "epoch": 0.21, "learning_rate": 0.00026920361179059874, "loss": 0.0811, "step": 31810 }, { "epoch": 0.21, "learning_rate": 0.0002691939304362418, "loss": 0.0766, "step": 31820 }, { "epoch": 0.21, "learning_rate": 0.0002691842490818849, "loss": 0.0776, "step": 31830 }, { "epoch": 0.21, "learning_rate": 0.0002691745677275279, "loss": 0.0717, "step": 31840 }, { "epoch": 0.21, "learning_rate": 0.000269164886373171, "loss": 0.0741, "step": 31850 }, { "epoch": 0.21, "learning_rate": 0.0002691552050188141, "loss": 0.079, "step": 31860 }, { "epoch": 0.21, "learning_rate": 0.00026914552366445716, "loss": 0.0749, "step": 31870 }, { "epoch": 0.21, "learning_rate": 0.00026913584231010024, "loss": 0.0799, "step": 31880 }, { "epoch": 0.21, "learning_rate": 0.00026912616095574327, "loss": 0.0693, "step": 31890 }, { "epoch": 0.21, "learning_rate": 0.00026911647960138635, "loss": 0.0784, "step": 31900 }, { "epoch": 0.21, "learning_rate": 0.0002691067982470294, "loss": 0.0743, "step": 31910 }, { "epoch": 0.21, "learning_rate": 0.00026909711689267245, "loss": 0.0672, "step": 31920 }, { "epoch": 0.21, "learning_rate": 0.00026908743553831553, "loss": 0.0776, "step": 31930 }, { "epoch": 0.21, "learning_rate": 0.0002690777541839586, "loss": 0.0736, "step": 31940 }, { "epoch": 0.21, "learning_rate": 0.0002690680728296017, "loss": 0.0712, "step": 31950 }, { "epoch": 0.21, "learning_rate": 0.00026905839147524477, "loss": 0.0761, "step": 31960 }, { "epoch": 0.21, "learning_rate": 0.00026904871012088785, "loss": 0.0782, "step": 31970 }, { "epoch": 0.21, "learning_rate": 0.0002690390287665309, "loss": 0.0872, "step": 31980 }, { "epoch": 0.21, "learning_rate": 0.00026902934741217395, "loss": 0.0729, "step": 31990 }, { "epoch": 0.21, "learning_rate": 0.00026901966605781703, "loss": 0.0764, "step": 32000 }, { "epoch": 0.21, "eval_cer": 0.9201102700259858, "eval_loss": 0.05101795867085457, "eval_runtime": 120.5294, "eval_samples_per_second": 16.593, "eval_steps_per_second": 4.148, "step": 32000 }, { "epoch": 0.21, "learning_rate": 0.0002690099847034601, "loss": 0.0842, "step": 32010 }, { "epoch": 0.21, "learning_rate": 0.00026900030334910314, "loss": 0.0764, "step": 32020 }, { "epoch": 0.21, "learning_rate": 0.0002689906219947462, "loss": 0.0696, "step": 32030 }, { "epoch": 0.21, "learning_rate": 0.0002689809406403893, "loss": 0.0819, "step": 32040 }, { "epoch": 0.21, "learning_rate": 0.0002689712592860323, "loss": 0.0687, "step": 32050 }, { "epoch": 0.21, "learning_rate": 0.0002689615779316754, "loss": 0.0786, "step": 32060 }, { "epoch": 0.21, "learning_rate": 0.0002689518965773185, "loss": 0.0714, "step": 32070 }, { "epoch": 0.21, "learning_rate": 0.00026894221522296156, "loss": 0.074, "step": 32080 }, { "epoch": 0.21, "learning_rate": 0.00026893253386860464, "loss": 0.0682, "step": 32090 }, { "epoch": 0.21, "learning_rate": 0.0002689228525142477, "loss": 0.0767, "step": 32100 }, { "epoch": 0.21, "learning_rate": 0.0002689131711598908, "loss": 0.0696, "step": 32110 }, { "epoch": 0.21, "learning_rate": 0.00026890348980553383, "loss": 0.0678, "step": 32120 }, { "epoch": 0.21, "learning_rate": 0.0002688938084511769, "loss": 0.0701, "step": 32130 }, { "epoch": 0.21, "learning_rate": 0.00026888412709682, "loss": 0.0752, "step": 32140 }, { "epoch": 0.21, "learning_rate": 0.000268874445742463, "loss": 0.0761, "step": 32150 }, { "epoch": 0.21, "learning_rate": 0.0002688647643881061, "loss": 0.0637, "step": 32160 }, { "epoch": 0.21, "learning_rate": 0.0002688550830337492, "loss": 0.0762, "step": 32170 }, { "epoch": 0.21, "learning_rate": 0.00026884540167939225, "loss": 0.0688, "step": 32180 }, { "epoch": 0.21, "learning_rate": 0.0002688357203250353, "loss": 0.0734, "step": 32190 }, { "epoch": 0.21, "learning_rate": 0.00026882603897067836, "loss": 0.074, "step": 32200 }, { "epoch": 0.21, "learning_rate": 0.00026881635761632144, "loss": 0.0748, "step": 32210 }, { "epoch": 0.21, "learning_rate": 0.0002688066762619645, "loss": 0.0675, "step": 32220 }, { "epoch": 0.21, "learning_rate": 0.0002687969949076076, "loss": 0.0773, "step": 32230 }, { "epoch": 0.21, "learning_rate": 0.0002687873135532507, "loss": 0.0738, "step": 32240 }, { "epoch": 0.21, "learning_rate": 0.00026877763219889376, "loss": 0.0847, "step": 32250 }, { "epoch": 0.21, "learning_rate": 0.0002687679508445368, "loss": 0.0657, "step": 32260 }, { "epoch": 0.21, "learning_rate": 0.00026875826949017986, "loss": 0.0888, "step": 32270 }, { "epoch": 0.21, "learning_rate": 0.00026874858813582294, "loss": 0.0816, "step": 32280 }, { "epoch": 0.21, "learning_rate": 0.00026873890678146597, "loss": 0.0677, "step": 32290 }, { "epoch": 0.21, "learning_rate": 0.00026872922542710905, "loss": 0.0812, "step": 32300 }, { "epoch": 0.21, "learning_rate": 0.00026871954407275213, "loss": 0.082, "step": 32310 }, { "epoch": 0.21, "learning_rate": 0.0002687098627183952, "loss": 0.0716, "step": 32320 }, { "epoch": 0.21, "learning_rate": 0.00026870018136403823, "loss": 0.0752, "step": 32330 }, { "epoch": 0.21, "learning_rate": 0.0002686905000096813, "loss": 0.0759, "step": 32340 }, { "epoch": 0.21, "learning_rate": 0.0002686808186553244, "loss": 0.0817, "step": 32350 }, { "epoch": 0.21, "learning_rate": 0.0002686711373009675, "loss": 0.0771, "step": 32360 }, { "epoch": 0.21, "learning_rate": 0.00026866145594661055, "loss": 0.0748, "step": 32370 }, { "epoch": 0.21, "learning_rate": 0.00026865177459225363, "loss": 0.0852, "step": 32380 }, { "epoch": 0.21, "learning_rate": 0.00026864209323789666, "loss": 0.074, "step": 32390 }, { "epoch": 0.21, "learning_rate": 0.00026863241188353974, "loss": 0.0686, "step": 32400 }, { "epoch": 0.21, "learning_rate": 0.0002686227305291828, "loss": 0.0771, "step": 32410 }, { "epoch": 0.21, "learning_rate": 0.00026861304917482584, "loss": 0.071, "step": 32420 }, { "epoch": 0.21, "learning_rate": 0.0002686033678204689, "loss": 0.0674, "step": 32430 }, { "epoch": 0.21, "learning_rate": 0.000268593686466112, "loss": 0.0728, "step": 32440 }, { "epoch": 0.21, "learning_rate": 0.0002685840051117551, "loss": 0.0703, "step": 32450 }, { "epoch": 0.21, "learning_rate": 0.00026857432375739816, "loss": 0.0761, "step": 32460 }, { "epoch": 0.21, "learning_rate": 0.0002685646424030412, "loss": 0.0734, "step": 32470 }, { "epoch": 0.21, "learning_rate": 0.00026855496104868427, "loss": 0.0733, "step": 32480 }, { "epoch": 0.21, "learning_rate": 0.00026854527969432735, "loss": 0.0773, "step": 32490 }, { "epoch": 0.21, "learning_rate": 0.00026853559833997043, "loss": 0.0741, "step": 32500 }, { "epoch": 0.21, "learning_rate": 0.0002685259169856135, "loss": 0.0712, "step": 32510 }, { "epoch": 0.21, "learning_rate": 0.00026851623563125653, "loss": 0.0743, "step": 32520 }, { "epoch": 0.21, "learning_rate": 0.0002685065542768996, "loss": 0.0747, "step": 32530 }, { "epoch": 0.21, "learning_rate": 0.0002684968729225427, "loss": 0.0778, "step": 32540 }, { "epoch": 0.21, "learning_rate": 0.0002684871915681857, "loss": 0.0709, "step": 32550 }, { "epoch": 0.21, "learning_rate": 0.0002684775102138288, "loss": 0.0802, "step": 32560 }, { "epoch": 0.21, "learning_rate": 0.0002684678288594719, "loss": 0.0811, "step": 32570 }, { "epoch": 0.21, "learning_rate": 0.00026845814750511496, "loss": 0.0812, "step": 32580 }, { "epoch": 0.21, "learning_rate": 0.00026844846615075804, "loss": 0.0709, "step": 32590 }, { "epoch": 0.21, "learning_rate": 0.0002684387847964011, "loss": 0.0788, "step": 32600 }, { "epoch": 0.21, "learning_rate": 0.00026842910344204414, "loss": 0.0733, "step": 32610 }, { "epoch": 0.21, "learning_rate": 0.0002684194220876872, "loss": 0.0817, "step": 32620 }, { "epoch": 0.21, "learning_rate": 0.0002684097407333303, "loss": 0.0931, "step": 32630 }, { "epoch": 0.21, "learning_rate": 0.0002684000593789734, "loss": 0.0763, "step": 32640 }, { "epoch": 0.21, "learning_rate": 0.00026839037802461646, "loss": 0.078, "step": 32650 }, { "epoch": 0.21, "learning_rate": 0.0002683806966702595, "loss": 0.066, "step": 32660 }, { "epoch": 0.21, "learning_rate": 0.00026837101531590257, "loss": 0.0834, "step": 32670 }, { "epoch": 0.21, "learning_rate": 0.00026836133396154565, "loss": 0.0702, "step": 32680 }, { "epoch": 0.21, "learning_rate": 0.0002683516526071887, "loss": 0.0711, "step": 32690 }, { "epoch": 0.21, "learning_rate": 0.00026834197125283175, "loss": 0.0741, "step": 32700 }, { "epoch": 0.21, "learning_rate": 0.00026833228989847483, "loss": 0.0725, "step": 32710 }, { "epoch": 0.21, "learning_rate": 0.0002683226085441179, "loss": 0.0812, "step": 32720 }, { "epoch": 0.21, "learning_rate": 0.000268312927189761, "loss": 0.0792, "step": 32730 }, { "epoch": 0.21, "learning_rate": 0.00026830324583540407, "loss": 0.0679, "step": 32740 }, { "epoch": 0.21, "learning_rate": 0.0002682935644810471, "loss": 0.0803, "step": 32750 }, { "epoch": 0.21, "learning_rate": 0.0002682838831266902, "loss": 0.0836, "step": 32760 }, { "epoch": 0.21, "learning_rate": 0.00026827420177233326, "loss": 0.0763, "step": 32770 }, { "epoch": 0.21, "learning_rate": 0.00026826452041797634, "loss": 0.0756, "step": 32780 }, { "epoch": 0.21, "learning_rate": 0.00026825483906361936, "loss": 0.0774, "step": 32790 }, { "epoch": 0.21, "learning_rate": 0.00026824515770926244, "loss": 0.0734, "step": 32800 }, { "epoch": 0.21, "learning_rate": 0.0002682354763549055, "loss": 0.0778, "step": 32810 }, { "epoch": 0.21, "learning_rate": 0.00026822579500054855, "loss": 0.069, "step": 32820 }, { "epoch": 0.21, "learning_rate": 0.00026821611364619163, "loss": 0.084, "step": 32830 }, { "epoch": 0.21, "learning_rate": 0.0002682064322918347, "loss": 0.0795, "step": 32840 }, { "epoch": 0.21, "learning_rate": 0.0002681967509374778, "loss": 0.0684, "step": 32850 }, { "epoch": 0.21, "learning_rate": 0.00026818706958312087, "loss": 0.0713, "step": 32860 }, { "epoch": 0.21, "learning_rate": 0.00026817738822876395, "loss": 0.0737, "step": 32870 }, { "epoch": 0.21, "learning_rate": 0.000268167706874407, "loss": 0.077, "step": 32880 }, { "epoch": 0.21, "learning_rate": 0.00026815802552005005, "loss": 0.079, "step": 32890 }, { "epoch": 0.21, "learning_rate": 0.00026814834416569313, "loss": 0.0692, "step": 32900 }, { "epoch": 0.21, "learning_rate": 0.0002681386628113362, "loss": 0.0676, "step": 32910 }, { "epoch": 0.21, "learning_rate": 0.00026812898145697924, "loss": 0.085, "step": 32920 }, { "epoch": 0.21, "learning_rate": 0.0002681193001026223, "loss": 0.0699, "step": 32930 }, { "epoch": 0.21, "learning_rate": 0.0002681096187482654, "loss": 0.0738, "step": 32940 }, { "epoch": 0.21, "learning_rate": 0.0002680999373939085, "loss": 0.0745, "step": 32950 }, { "epoch": 0.21, "learning_rate": 0.0002680902560395515, "loss": 0.089, "step": 32960 }, { "epoch": 0.21, "learning_rate": 0.0002680805746851946, "loss": 0.0745, "step": 32970 }, { "epoch": 0.21, "learning_rate": 0.00026807089333083766, "loss": 0.0806, "step": 32980 }, { "epoch": 0.21, "learning_rate": 0.00026806121197648074, "loss": 0.0702, "step": 32990 }, { "epoch": 0.21, "learning_rate": 0.0002680515306221238, "loss": 0.0741, "step": 33000 }, { "epoch": 0.21, "eval_cer": 0.9201437125748503, "eval_loss": 0.049433525651693344, "eval_runtime": 120.4106, "eval_samples_per_second": 16.61, "eval_steps_per_second": 4.152, "step": 33000 }, { "epoch": 0.21, "learning_rate": 0.0002680418492677669, "loss": 0.0794, "step": 33010 }, { "epoch": 0.21, "learning_rate": 0.00026803216791341, "loss": 0.0753, "step": 33020 }, { "epoch": 0.21, "learning_rate": 0.000268022486559053, "loss": 0.0753, "step": 33030 }, { "epoch": 0.21, "learning_rate": 0.0002680128052046961, "loss": 0.074, "step": 33040 }, { "epoch": 0.21, "learning_rate": 0.00026800312385033917, "loss": 0.066, "step": 33050 }, { "epoch": 0.21, "learning_rate": 0.0002679934424959822, "loss": 0.0765, "step": 33060 }, { "epoch": 0.21, "learning_rate": 0.00026798376114162527, "loss": 0.0811, "step": 33070 }, { "epoch": 0.21, "learning_rate": 0.00026797407978726835, "loss": 0.0691, "step": 33080 }, { "epoch": 0.21, "learning_rate": 0.00026796439843291143, "loss": 0.0801, "step": 33090 }, { "epoch": 0.21, "learning_rate": 0.00026795471707855446, "loss": 0.0712, "step": 33100 }, { "epoch": 0.21, "learning_rate": 0.00026794503572419754, "loss": 0.079, "step": 33110 }, { "epoch": 0.21, "learning_rate": 0.0002679353543698406, "loss": 0.0702, "step": 33120 }, { "epoch": 0.21, "learning_rate": 0.0002679256730154837, "loss": 0.0701, "step": 33130 }, { "epoch": 0.21, "learning_rate": 0.0002679159916611268, "loss": 0.072, "step": 33140 }, { "epoch": 0.21, "learning_rate": 0.00026790631030676986, "loss": 0.0775, "step": 33150 }, { "epoch": 0.21, "learning_rate": 0.0002678966289524129, "loss": 0.0811, "step": 33160 }, { "epoch": 0.21, "learning_rate": 0.00026788694759805596, "loss": 0.0714, "step": 33170 }, { "epoch": 0.21, "learning_rate": 0.00026787726624369904, "loss": 0.0799, "step": 33180 }, { "epoch": 0.21, "learning_rate": 0.00026786758488934207, "loss": 0.0737, "step": 33190 }, { "epoch": 0.21, "learning_rate": 0.00026785790353498515, "loss": 0.0693, "step": 33200 }, { "epoch": 0.21, "learning_rate": 0.0002678482221806282, "loss": 0.0783, "step": 33210 }, { "epoch": 0.21, "learning_rate": 0.0002678385408262713, "loss": 0.077, "step": 33220 }, { "epoch": 0.21, "learning_rate": 0.0002678288594719144, "loss": 0.071, "step": 33230 }, { "epoch": 0.21, "learning_rate": 0.0002678191781175574, "loss": 0.078, "step": 33240 }, { "epoch": 0.21, "learning_rate": 0.0002678094967632005, "loss": 0.0681, "step": 33250 }, { "epoch": 0.21, "learning_rate": 0.00026779981540884357, "loss": 0.0762, "step": 33260 }, { "epoch": 0.21, "learning_rate": 0.00026779013405448665, "loss": 0.0736, "step": 33270 }, { "epoch": 0.21, "learning_rate": 0.00026778045270012973, "loss": 0.0774, "step": 33280 }, { "epoch": 0.21, "learning_rate": 0.0002677707713457728, "loss": 0.0747, "step": 33290 }, { "epoch": 0.21, "learning_rate": 0.00026776108999141584, "loss": 0.0739, "step": 33300 }, { "epoch": 0.21, "learning_rate": 0.0002677514086370589, "loss": 0.0762, "step": 33310 }, { "epoch": 0.22, "learning_rate": 0.00026774172728270194, "loss": 0.0764, "step": 33320 }, { "epoch": 0.22, "learning_rate": 0.000267732045928345, "loss": 0.0755, "step": 33330 }, { "epoch": 0.22, "learning_rate": 0.0002677223645739881, "loss": 0.0848, "step": 33340 }, { "epoch": 0.22, "learning_rate": 0.0002677126832196312, "loss": 0.0733, "step": 33350 }, { "epoch": 0.22, "learning_rate": 0.00026770300186527426, "loss": 0.0696, "step": 33360 }, { "epoch": 0.22, "learning_rate": 0.00026769332051091734, "loss": 0.0724, "step": 33370 }, { "epoch": 0.22, "learning_rate": 0.00026768363915656037, "loss": 0.0797, "step": 33380 }, { "epoch": 0.22, "learning_rate": 0.00026767395780220345, "loss": 0.0715, "step": 33390 }, { "epoch": 0.22, "learning_rate": 0.0002676642764478465, "loss": 0.072, "step": 33400 }, { "epoch": 0.22, "learning_rate": 0.0002676545950934896, "loss": 0.071, "step": 33410 }, { "epoch": 0.22, "learning_rate": 0.0002676449137391327, "loss": 0.0735, "step": 33420 }, { "epoch": 0.22, "learning_rate": 0.0002676352323847757, "loss": 0.0662, "step": 33430 }, { "epoch": 0.22, "learning_rate": 0.0002676255510304188, "loss": 0.074, "step": 33440 }, { "epoch": 0.22, "learning_rate": 0.00026761586967606187, "loss": 0.0805, "step": 33450 }, { "epoch": 0.22, "learning_rate": 0.0002676061883217049, "loss": 0.0646, "step": 33460 }, { "epoch": 0.22, "learning_rate": 0.000267596506967348, "loss": 0.0728, "step": 33470 }, { "epoch": 0.22, "learning_rate": 0.00026758682561299105, "loss": 0.0695, "step": 33480 }, { "epoch": 0.22, "learning_rate": 0.00026757714425863413, "loss": 0.0683, "step": 33490 }, { "epoch": 0.22, "learning_rate": 0.0002675674629042772, "loss": 0.0756, "step": 33500 }, { "epoch": 0.22, "learning_rate": 0.0002675577815499203, "loss": 0.0767, "step": 33510 }, { "epoch": 0.22, "learning_rate": 0.0002675481001955633, "loss": 0.0792, "step": 33520 }, { "epoch": 0.22, "learning_rate": 0.0002675384188412064, "loss": 0.0812, "step": 33530 }, { "epoch": 0.22, "learning_rate": 0.0002675287374868495, "loss": 0.0847, "step": 33540 }, { "epoch": 0.22, "learning_rate": 0.00026751905613249256, "loss": 0.0686, "step": 33550 }, { "epoch": 0.22, "learning_rate": 0.0002675093747781356, "loss": 0.0638, "step": 33560 }, { "epoch": 0.22, "learning_rate": 0.00026749969342377866, "loss": 0.0756, "step": 33570 }, { "epoch": 0.22, "learning_rate": 0.00026749001206942174, "loss": 0.082, "step": 33580 }, { "epoch": 0.22, "learning_rate": 0.00026748033071506477, "loss": 0.0714, "step": 33590 }, { "epoch": 0.22, "learning_rate": 0.00026747064936070785, "loss": 0.081, "step": 33600 }, { "epoch": 0.22, "learning_rate": 0.00026746096800635093, "loss": 0.0659, "step": 33610 }, { "epoch": 0.22, "learning_rate": 0.000267451286651994, "loss": 0.0759, "step": 33620 }, { "epoch": 0.22, "learning_rate": 0.0002674416052976371, "loss": 0.0772, "step": 33630 }, { "epoch": 0.22, "learning_rate": 0.00026743192394328017, "loss": 0.0682, "step": 33640 }, { "epoch": 0.22, "learning_rate": 0.00026742224258892325, "loss": 0.0806, "step": 33650 }, { "epoch": 0.22, "learning_rate": 0.0002674125612345663, "loss": 0.0887, "step": 33660 }, { "epoch": 0.22, "learning_rate": 0.00026740287988020935, "loss": 0.0794, "step": 33670 }, { "epoch": 0.22, "learning_rate": 0.00026739319852585243, "loss": 0.0794, "step": 33680 }, { "epoch": 0.22, "learning_rate": 0.0002673835171714955, "loss": 0.0737, "step": 33690 }, { "epoch": 0.22, "learning_rate": 0.00026737383581713854, "loss": 0.0743, "step": 33700 }, { "epoch": 0.22, "learning_rate": 0.0002673641544627816, "loss": 0.0764, "step": 33710 }, { "epoch": 0.22, "learning_rate": 0.0002673544731084247, "loss": 0.074, "step": 33720 }, { "epoch": 0.22, "learning_rate": 0.0002673447917540677, "loss": 0.0801, "step": 33730 }, { "epoch": 0.22, "learning_rate": 0.0002673351103997108, "loss": 0.0737, "step": 33740 }, { "epoch": 0.22, "learning_rate": 0.0002673254290453539, "loss": 0.0766, "step": 33750 }, { "epoch": 0.22, "learning_rate": 0.00026731574769099696, "loss": 0.0751, "step": 33760 }, { "epoch": 0.22, "learning_rate": 0.00026730606633664004, "loss": 0.0693, "step": 33770 }, { "epoch": 0.22, "learning_rate": 0.0002672963849822831, "loss": 0.0652, "step": 33780 }, { "epoch": 0.22, "learning_rate": 0.0002672867036279262, "loss": 0.0703, "step": 33790 }, { "epoch": 0.22, "learning_rate": 0.00026727702227356923, "loss": 0.0737, "step": 33800 }, { "epoch": 0.22, "learning_rate": 0.0002672673409192123, "loss": 0.0713, "step": 33810 }, { "epoch": 0.22, "learning_rate": 0.0002672576595648554, "loss": 0.0787, "step": 33820 }, { "epoch": 0.22, "learning_rate": 0.0002672479782104984, "loss": 0.0691, "step": 33830 }, { "epoch": 0.22, "learning_rate": 0.0002672382968561415, "loss": 0.0651, "step": 33840 }, { "epoch": 0.22, "learning_rate": 0.0002672286155017846, "loss": 0.0774, "step": 33850 }, { "epoch": 0.22, "learning_rate": 0.00026721893414742765, "loss": 0.0784, "step": 33860 }, { "epoch": 0.22, "learning_rate": 0.0002672092527930707, "loss": 0.076, "step": 33870 }, { "epoch": 0.22, "learning_rate": 0.00026719957143871376, "loss": 0.0713, "step": 33880 }, { "epoch": 0.22, "learning_rate": 0.00026718989008435684, "loss": 0.0715, "step": 33890 }, { "epoch": 0.22, "learning_rate": 0.0002671802087299999, "loss": 0.0727, "step": 33900 }, { "epoch": 0.22, "learning_rate": 0.000267170527375643, "loss": 0.0715, "step": 33910 }, { "epoch": 0.22, "learning_rate": 0.0002671608460212861, "loss": 0.0766, "step": 33920 }, { "epoch": 0.22, "learning_rate": 0.0002671511646669291, "loss": 0.0688, "step": 33930 }, { "epoch": 0.22, "learning_rate": 0.0002671414833125722, "loss": 0.0703, "step": 33940 }, { "epoch": 0.22, "learning_rate": 0.00026713180195821526, "loss": 0.0698, "step": 33950 }, { "epoch": 0.22, "learning_rate": 0.0002671221206038583, "loss": 0.0809, "step": 33960 }, { "epoch": 0.22, "learning_rate": 0.00026711243924950137, "loss": 0.071, "step": 33970 }, { "epoch": 0.22, "learning_rate": 0.00026710275789514445, "loss": 0.0678, "step": 33980 }, { "epoch": 0.22, "learning_rate": 0.00026709307654078753, "loss": 0.0734, "step": 33990 }, { "epoch": 0.22, "learning_rate": 0.0002670833951864306, "loss": 0.0736, "step": 34000 }, { "epoch": 0.22, "eval_cer": 0.9201382894588183, "eval_loss": 0.049920111894607544, "eval_runtime": 120.2767, "eval_samples_per_second": 16.628, "eval_steps_per_second": 4.157, "step": 34000 }, { "epoch": 0.22, "learning_rate": 0.00026707371383207363, "loss": 0.0733, "step": 34010 }, { "epoch": 0.22, "learning_rate": 0.0002670640324777167, "loss": 0.0795, "step": 34020 }, { "epoch": 0.22, "learning_rate": 0.0002670543511233598, "loss": 0.0762, "step": 34030 }, { "epoch": 0.22, "learning_rate": 0.00026704466976900287, "loss": 0.0708, "step": 34040 }, { "epoch": 0.22, "learning_rate": 0.00026703498841464595, "loss": 0.0761, "step": 34050 }, { "epoch": 0.22, "learning_rate": 0.00026702530706028903, "loss": 0.0775, "step": 34060 }, { "epoch": 0.22, "learning_rate": 0.00026701562570593206, "loss": 0.0704, "step": 34070 }, { "epoch": 0.22, "learning_rate": 0.00026700594435157514, "loss": 0.0771, "step": 34080 }, { "epoch": 0.22, "learning_rate": 0.0002669962629972182, "loss": 0.0743, "step": 34090 }, { "epoch": 0.22, "learning_rate": 0.00026698658164286124, "loss": 0.0754, "step": 34100 }, { "epoch": 0.22, "learning_rate": 0.0002669769002885043, "loss": 0.0862, "step": 34110 }, { "epoch": 0.22, "learning_rate": 0.0002669672189341474, "loss": 0.0676, "step": 34120 }, { "epoch": 0.22, "learning_rate": 0.0002669575375797905, "loss": 0.0739, "step": 34130 }, { "epoch": 0.22, "learning_rate": 0.00026694785622543356, "loss": 0.0779, "step": 34140 }, { "epoch": 0.22, "learning_rate": 0.0002669381748710766, "loss": 0.0734, "step": 34150 }, { "epoch": 0.22, "learning_rate": 0.00026692849351671967, "loss": 0.0719, "step": 34160 }, { "epoch": 0.22, "learning_rate": 0.00026691881216236275, "loss": 0.0887, "step": 34170 }, { "epoch": 0.22, "learning_rate": 0.00026690913080800583, "loss": 0.0752, "step": 34180 }, { "epoch": 0.22, "learning_rate": 0.0002668994494536489, "loss": 0.0754, "step": 34190 }, { "epoch": 0.22, "learning_rate": 0.00026688976809929193, "loss": 0.0772, "step": 34200 }, { "epoch": 0.22, "learning_rate": 0.000266880086744935, "loss": 0.0701, "step": 34210 }, { "epoch": 0.22, "learning_rate": 0.0002668704053905781, "loss": 0.0809, "step": 34220 }, { "epoch": 0.22, "learning_rate": 0.0002668607240362211, "loss": 0.0906, "step": 34230 }, { "epoch": 0.22, "learning_rate": 0.0002668510426818642, "loss": 0.0798, "step": 34240 }, { "epoch": 0.22, "learning_rate": 0.0002668413613275073, "loss": 0.0763, "step": 34250 }, { "epoch": 0.22, "learning_rate": 0.00026683167997315036, "loss": 0.0814, "step": 34260 }, { "epoch": 0.22, "learning_rate": 0.00026682199861879344, "loss": 0.066, "step": 34270 }, { "epoch": 0.22, "learning_rate": 0.0002668123172644365, "loss": 0.0757, "step": 34280 }, { "epoch": 0.22, "learning_rate": 0.00026680263591007954, "loss": 0.0761, "step": 34290 }, { "epoch": 0.22, "learning_rate": 0.0002667929545557226, "loss": 0.0819, "step": 34300 }, { "epoch": 0.22, "learning_rate": 0.0002667832732013657, "loss": 0.0751, "step": 34310 }, { "epoch": 0.22, "learning_rate": 0.0002667735918470088, "loss": 0.0729, "step": 34320 }, { "epoch": 0.22, "learning_rate": 0.0002667639104926518, "loss": 0.0693, "step": 34330 }, { "epoch": 0.22, "learning_rate": 0.0002667542291382949, "loss": 0.0788, "step": 34340 }, { "epoch": 0.22, "learning_rate": 0.00026674454778393797, "loss": 0.0725, "step": 34350 }, { "epoch": 0.22, "learning_rate": 0.000266734866429581, "loss": 0.0847, "step": 34360 }, { "epoch": 0.22, "learning_rate": 0.00026672518507522407, "loss": 0.0759, "step": 34370 }, { "epoch": 0.22, "learning_rate": 0.00026671550372086715, "loss": 0.0756, "step": 34380 }, { "epoch": 0.22, "learning_rate": 0.00026670582236651023, "loss": 0.065, "step": 34390 }, { "epoch": 0.22, "learning_rate": 0.0002666961410121533, "loss": 0.0778, "step": 34400 }, { "epoch": 0.22, "learning_rate": 0.0002666864596577964, "loss": 0.0841, "step": 34410 }, { "epoch": 0.22, "learning_rate": 0.00026667677830343947, "loss": 0.0817, "step": 34420 }, { "epoch": 0.22, "learning_rate": 0.0002666670969490825, "loss": 0.0737, "step": 34430 }, { "epoch": 0.22, "learning_rate": 0.0002666574155947256, "loss": 0.0773, "step": 34440 }, { "epoch": 0.22, "learning_rate": 0.00026664773424036866, "loss": 0.0687, "step": 34450 }, { "epoch": 0.22, "learning_rate": 0.00026663805288601174, "loss": 0.0756, "step": 34460 }, { "epoch": 0.22, "learning_rate": 0.00026662837153165476, "loss": 0.073, "step": 34470 }, { "epoch": 0.22, "learning_rate": 0.00026661869017729784, "loss": 0.0703, "step": 34480 }, { "epoch": 0.22, "learning_rate": 0.0002666090088229409, "loss": 0.0788, "step": 34490 }, { "epoch": 0.22, "learning_rate": 0.00026659932746858395, "loss": 0.0712, "step": 34500 }, { "epoch": 0.22, "learning_rate": 0.000266589646114227, "loss": 0.082, "step": 34510 }, { "epoch": 0.22, "learning_rate": 0.0002665799647598701, "loss": 0.0721, "step": 34520 }, { "epoch": 0.22, "learning_rate": 0.0002665702834055132, "loss": 0.0697, "step": 34530 }, { "epoch": 0.22, "learning_rate": 0.00026656060205115627, "loss": 0.0771, "step": 34540 }, { "epoch": 0.22, "learning_rate": 0.00026655092069679935, "loss": 0.0701, "step": 34550 }, { "epoch": 0.22, "learning_rate": 0.0002665412393424424, "loss": 0.0716, "step": 34560 }, { "epoch": 0.22, "learning_rate": 0.00026653155798808545, "loss": 0.0913, "step": 34570 }, { "epoch": 0.22, "learning_rate": 0.00026652187663372853, "loss": 0.0734, "step": 34580 }, { "epoch": 0.22, "learning_rate": 0.0002665121952793716, "loss": 0.074, "step": 34590 }, { "epoch": 0.22, "learning_rate": 0.00026650251392501464, "loss": 0.0719, "step": 34600 }, { "epoch": 0.22, "learning_rate": 0.0002664928325706577, "loss": 0.0657, "step": 34610 }, { "epoch": 0.22, "learning_rate": 0.0002664831512163008, "loss": 0.0732, "step": 34620 }, { "epoch": 0.22, "learning_rate": 0.0002664734698619439, "loss": 0.0697, "step": 34630 }, { "epoch": 0.22, "learning_rate": 0.0002664637885075869, "loss": 0.0763, "step": 34640 }, { "epoch": 0.22, "learning_rate": 0.00026645410715323, "loss": 0.0827, "step": 34650 }, { "epoch": 0.22, "learning_rate": 0.00026644442579887306, "loss": 0.086, "step": 34660 }, { "epoch": 0.22, "learning_rate": 0.00026643474444451614, "loss": 0.068, "step": 34670 }, { "epoch": 0.22, "learning_rate": 0.0002664250630901592, "loss": 0.0697, "step": 34680 }, { "epoch": 0.22, "learning_rate": 0.0002664153817358023, "loss": 0.0709, "step": 34690 }, { "epoch": 0.22, "learning_rate": 0.0002664057003814453, "loss": 0.0687, "step": 34700 }, { "epoch": 0.22, "learning_rate": 0.0002663960190270884, "loss": 0.0765, "step": 34710 }, { "epoch": 0.22, "learning_rate": 0.0002663863376727315, "loss": 0.0748, "step": 34720 }, { "epoch": 0.22, "learning_rate": 0.0002663766563183745, "loss": 0.0806, "step": 34730 }, { "epoch": 0.22, "learning_rate": 0.0002663669749640176, "loss": 0.0688, "step": 34740 }, { "epoch": 0.22, "learning_rate": 0.00026635729360966067, "loss": 0.0686, "step": 34750 }, { "epoch": 0.22, "learning_rate": 0.00026634761225530375, "loss": 0.07, "step": 34760 }, { "epoch": 0.22, "learning_rate": 0.00026633793090094683, "loss": 0.0713, "step": 34770 }, { "epoch": 0.22, "learning_rate": 0.00026632824954658986, "loss": 0.0693, "step": 34780 }, { "epoch": 0.22, "learning_rate": 0.00026631856819223294, "loss": 0.0708, "step": 34790 }, { "epoch": 0.22, "learning_rate": 0.000266308886837876, "loss": 0.0743, "step": 34800 }, { "epoch": 0.22, "learning_rate": 0.0002662992054835191, "loss": 0.0867, "step": 34810 }, { "epoch": 0.22, "learning_rate": 0.0002662895241291622, "loss": 0.0699, "step": 34820 }, { "epoch": 0.22, "learning_rate": 0.00026627984277480525, "loss": 0.0704, "step": 34830 }, { "epoch": 0.22, "learning_rate": 0.0002662701614204483, "loss": 0.0749, "step": 34840 }, { "epoch": 0.22, "learning_rate": 0.00026626048006609136, "loss": 0.0711, "step": 34850 }, { "epoch": 0.22, "learning_rate": 0.00026625079871173444, "loss": 0.0671, "step": 34860 }, { "epoch": 0.23, "learning_rate": 0.00026624111735737747, "loss": 0.0697, "step": 34870 }, { "epoch": 0.23, "learning_rate": 0.00026623143600302055, "loss": 0.0752, "step": 34880 }, { "epoch": 0.23, "learning_rate": 0.0002662217546486636, "loss": 0.0711, "step": 34890 }, { "epoch": 0.23, "learning_rate": 0.0002662120732943067, "loss": 0.0741, "step": 34900 }, { "epoch": 0.23, "learning_rate": 0.0002662023919399498, "loss": 0.0719, "step": 34910 }, { "epoch": 0.23, "learning_rate": 0.0002661927105855928, "loss": 0.0836, "step": 34920 }, { "epoch": 0.23, "learning_rate": 0.0002661830292312359, "loss": 0.065, "step": 34930 }, { "epoch": 0.23, "learning_rate": 0.00026617334787687897, "loss": 0.0741, "step": 34940 }, { "epoch": 0.23, "learning_rate": 0.00026616366652252205, "loss": 0.0703, "step": 34950 }, { "epoch": 0.23, "learning_rate": 0.00026615398516816513, "loss": 0.0747, "step": 34960 }, { "epoch": 0.23, "learning_rate": 0.00026614430381380816, "loss": 0.0693, "step": 34970 }, { "epoch": 0.23, "learning_rate": 0.00026613462245945123, "loss": 0.0704, "step": 34980 }, { "epoch": 0.23, "learning_rate": 0.0002661249411050943, "loss": 0.0738, "step": 34990 }, { "epoch": 0.23, "learning_rate": 0.00026611525975073734, "loss": 0.0674, "step": 35000 }, { "epoch": 0.23, "eval_cer": 0.9201554626595865, "eval_loss": 0.04858190566301346, "eval_runtime": 120.2631, "eval_samples_per_second": 16.63, "eval_steps_per_second": 4.158, "step": 35000 }, { "epoch": 0.23, "learning_rate": 0.0002661055783963804, "loss": 0.0744, "step": 35010 }, { "epoch": 0.23, "learning_rate": 0.0002660958970420235, "loss": 0.0735, "step": 35020 }, { "epoch": 0.23, "learning_rate": 0.0002660862156876666, "loss": 0.0713, "step": 35030 }, { "epoch": 0.23, "learning_rate": 0.00026607653433330966, "loss": 0.0802, "step": 35040 }, { "epoch": 0.23, "learning_rate": 0.00026606685297895274, "loss": 0.0754, "step": 35050 }, { "epoch": 0.23, "learning_rate": 0.00026605717162459576, "loss": 0.0727, "step": 35060 }, { "epoch": 0.23, "learning_rate": 0.00026604749027023884, "loss": 0.0707, "step": 35070 }, { "epoch": 0.23, "learning_rate": 0.0002660378089158819, "loss": 0.0736, "step": 35080 }, { "epoch": 0.23, "learning_rate": 0.000266028127561525, "loss": 0.065, "step": 35090 }, { "epoch": 0.23, "learning_rate": 0.00026601844620716803, "loss": 0.076, "step": 35100 }, { "epoch": 0.23, "learning_rate": 0.0002660087648528111, "loss": 0.0818, "step": 35110 }, { "epoch": 0.23, "learning_rate": 0.0002659990834984542, "loss": 0.0695, "step": 35120 }, { "epoch": 0.23, "learning_rate": 0.0002659894021440972, "loss": 0.0681, "step": 35130 }, { "epoch": 0.23, "learning_rate": 0.0002659797207897403, "loss": 0.0723, "step": 35140 }, { "epoch": 0.23, "learning_rate": 0.0002659700394353834, "loss": 0.0721, "step": 35150 }, { "epoch": 0.23, "learning_rate": 0.00026596035808102645, "loss": 0.0693, "step": 35160 }, { "epoch": 0.23, "learning_rate": 0.00026595067672666953, "loss": 0.0611, "step": 35170 }, { "epoch": 0.23, "learning_rate": 0.0002659409953723126, "loss": 0.0787, "step": 35180 }, { "epoch": 0.23, "learning_rate": 0.0002659313140179557, "loss": 0.0707, "step": 35190 }, { "epoch": 0.23, "learning_rate": 0.0002659216326635987, "loss": 0.0691, "step": 35200 }, { "epoch": 0.23, "learning_rate": 0.0002659119513092418, "loss": 0.0664, "step": 35210 }, { "epoch": 0.23, "learning_rate": 0.0002659022699548849, "loss": 0.0725, "step": 35220 }, { "epoch": 0.23, "learning_rate": 0.00026589258860052796, "loss": 0.078, "step": 35230 }, { "epoch": 0.23, "learning_rate": 0.000265882907246171, "loss": 0.0719, "step": 35240 }, { "epoch": 0.23, "learning_rate": 0.00026587322589181406, "loss": 0.0713, "step": 35250 }, { "epoch": 0.23, "learning_rate": 0.00026586354453745714, "loss": 0.0673, "step": 35260 }, { "epoch": 0.23, "learning_rate": 0.00026585386318310017, "loss": 0.0707, "step": 35270 }, { "epoch": 0.23, "learning_rate": 0.00026584418182874325, "loss": 0.0721, "step": 35280 }, { "epoch": 0.23, "learning_rate": 0.00026583450047438633, "loss": 0.0758, "step": 35290 }, { "epoch": 0.23, "learning_rate": 0.0002658248191200294, "loss": 0.0803, "step": 35300 }, { "epoch": 0.23, "learning_rate": 0.0002658151377656725, "loss": 0.0762, "step": 35310 }, { "epoch": 0.23, "learning_rate": 0.00026580545641131557, "loss": 0.0802, "step": 35320 }, { "epoch": 0.23, "learning_rate": 0.00026579577505695865, "loss": 0.0718, "step": 35330 }, { "epoch": 0.23, "learning_rate": 0.0002657860937026017, "loss": 0.0706, "step": 35340 }, { "epoch": 0.23, "learning_rate": 0.00026577641234824475, "loss": 0.0696, "step": 35350 }, { "epoch": 0.23, "learning_rate": 0.00026576673099388783, "loss": 0.0743, "step": 35360 }, { "epoch": 0.23, "learning_rate": 0.00026575704963953086, "loss": 0.069, "step": 35370 }, { "epoch": 0.23, "learning_rate": 0.00026574736828517394, "loss": 0.0678, "step": 35380 }, { "epoch": 0.23, "learning_rate": 0.000265737686930817, "loss": 0.0687, "step": 35390 }, { "epoch": 0.23, "learning_rate": 0.0002657280055764601, "loss": 0.0753, "step": 35400 }, { "epoch": 0.23, "learning_rate": 0.0002657183242221031, "loss": 0.0664, "step": 35410 }, { "epoch": 0.23, "learning_rate": 0.0002657086428677462, "loss": 0.0692, "step": 35420 }, { "epoch": 0.23, "learning_rate": 0.0002656989615133893, "loss": 0.0692, "step": 35430 }, { "epoch": 0.23, "learning_rate": 0.00026568928015903236, "loss": 0.0674, "step": 35440 }, { "epoch": 0.23, "learning_rate": 0.00026567959880467544, "loss": 0.0687, "step": 35450 }, { "epoch": 0.23, "learning_rate": 0.0002656699174503185, "loss": 0.0638, "step": 35460 }, { "epoch": 0.23, "learning_rate": 0.0002656602360959616, "loss": 0.0661, "step": 35470 }, { "epoch": 0.23, "learning_rate": 0.00026565055474160463, "loss": 0.0815, "step": 35480 }, { "epoch": 0.23, "learning_rate": 0.0002656408733872477, "loss": 0.0685, "step": 35490 }, { "epoch": 0.23, "learning_rate": 0.0002656311920328908, "loss": 0.0733, "step": 35500 }, { "epoch": 0.23, "learning_rate": 0.0002656215106785338, "loss": 0.0767, "step": 35510 }, { "epoch": 0.23, "learning_rate": 0.0002656118293241769, "loss": 0.0743, "step": 35520 }, { "epoch": 0.23, "learning_rate": 0.00026560214796981997, "loss": 0.0693, "step": 35530 }, { "epoch": 0.23, "learning_rate": 0.00026559246661546305, "loss": 0.0794, "step": 35540 }, { "epoch": 0.23, "learning_rate": 0.0002655827852611061, "loss": 0.0741, "step": 35550 }, { "epoch": 0.23, "learning_rate": 0.00026557310390674916, "loss": 0.0789, "step": 35560 }, { "epoch": 0.23, "learning_rate": 0.00026556342255239224, "loss": 0.0699, "step": 35570 }, { "epoch": 0.23, "learning_rate": 0.0002655537411980353, "loss": 0.0716, "step": 35580 }, { "epoch": 0.23, "learning_rate": 0.0002655440598436784, "loss": 0.0715, "step": 35590 }, { "epoch": 0.23, "learning_rate": 0.0002655343784893215, "loss": 0.0766, "step": 35600 }, { "epoch": 0.23, "learning_rate": 0.0002655246971349645, "loss": 0.0732, "step": 35610 }, { "epoch": 0.23, "learning_rate": 0.0002655150157806076, "loss": 0.0639, "step": 35620 }, { "epoch": 0.23, "learning_rate": 0.00026550533442625066, "loss": 0.0953, "step": 35630 }, { "epoch": 0.23, "learning_rate": 0.0002654956530718937, "loss": 0.0673, "step": 35640 }, { "epoch": 0.23, "learning_rate": 0.00026548597171753677, "loss": 0.0686, "step": 35650 }, { "epoch": 0.23, "learning_rate": 0.00026547629036317985, "loss": 0.0749, "step": 35660 }, { "epoch": 0.23, "learning_rate": 0.00026546660900882293, "loss": 0.0723, "step": 35670 }, { "epoch": 0.23, "learning_rate": 0.000265456927654466, "loss": 0.071, "step": 35680 }, { "epoch": 0.23, "learning_rate": 0.00026544724630010903, "loss": 0.0812, "step": 35690 }, { "epoch": 0.23, "learning_rate": 0.0002654375649457521, "loss": 0.0726, "step": 35700 }, { "epoch": 0.23, "learning_rate": 0.0002654278835913952, "loss": 0.081, "step": 35710 }, { "epoch": 0.23, "learning_rate": 0.00026541820223703827, "loss": 0.068, "step": 35720 }, { "epoch": 0.23, "learning_rate": 0.00026540852088268135, "loss": 0.0722, "step": 35730 }, { "epoch": 0.23, "learning_rate": 0.0002653988395283244, "loss": 0.0686, "step": 35740 }, { "epoch": 0.23, "learning_rate": 0.00026538915817396746, "loss": 0.0772, "step": 35750 }, { "epoch": 0.23, "learning_rate": 0.00026537947681961054, "loss": 0.0747, "step": 35760 }, { "epoch": 0.23, "learning_rate": 0.00026536979546525356, "loss": 0.0794, "step": 35770 }, { "epoch": 0.23, "learning_rate": 0.00026536011411089664, "loss": 0.08, "step": 35780 }, { "epoch": 0.23, "learning_rate": 0.0002653504327565397, "loss": 0.0699, "step": 35790 }, { "epoch": 0.23, "learning_rate": 0.0002653407514021828, "loss": 0.0794, "step": 35800 }, { "epoch": 0.23, "learning_rate": 0.0002653310700478259, "loss": 0.0732, "step": 35810 }, { "epoch": 0.23, "learning_rate": 0.00026532138869346896, "loss": 0.067, "step": 35820 }, { "epoch": 0.23, "learning_rate": 0.000265311707339112, "loss": 0.0678, "step": 35830 }, { "epoch": 0.23, "learning_rate": 0.00026530202598475507, "loss": 0.0724, "step": 35840 }, { "epoch": 0.23, "learning_rate": 0.00026529234463039815, "loss": 0.0719, "step": 35850 }, { "epoch": 0.23, "learning_rate": 0.0002652826632760412, "loss": 0.0765, "step": 35860 }, { "epoch": 0.23, "learning_rate": 0.0002652729819216843, "loss": 0.0824, "step": 35870 }, { "epoch": 0.23, "learning_rate": 0.00026526330056732733, "loss": 0.0712, "step": 35880 }, { "epoch": 0.23, "learning_rate": 0.0002652536192129704, "loss": 0.0734, "step": 35890 }, { "epoch": 0.23, "learning_rate": 0.0002652439378586135, "loss": 0.0793, "step": 35900 }, { "epoch": 0.23, "learning_rate": 0.0002652342565042565, "loss": 0.0711, "step": 35910 }, { "epoch": 0.23, "learning_rate": 0.0002652245751498996, "loss": 0.0749, "step": 35920 }, { "epoch": 0.23, "learning_rate": 0.0002652148937955427, "loss": 0.066, "step": 35930 }, { "epoch": 0.23, "learning_rate": 0.00026520521244118576, "loss": 0.079, "step": 35940 }, { "epoch": 0.23, "learning_rate": 0.00026519553108682884, "loss": 0.0738, "step": 35950 }, { "epoch": 0.23, "learning_rate": 0.0002651858497324719, "loss": 0.0756, "step": 35960 }, { "epoch": 0.23, "learning_rate": 0.00026517616837811494, "loss": 0.065, "step": 35970 }, { "epoch": 0.23, "learning_rate": 0.000265166487023758, "loss": 0.073, "step": 35980 }, { "epoch": 0.23, "learning_rate": 0.0002651568056694011, "loss": 0.0868, "step": 35990 }, { "epoch": 0.23, "learning_rate": 0.0002651471243150442, "loss": 0.0775, "step": 36000 }, { "epoch": 0.23, "eval_cer": 0.9200876737091854, "eval_loss": 0.04887823387980461, "eval_runtime": 120.558, "eval_samples_per_second": 16.59, "eval_steps_per_second": 4.147, "step": 36000 }, { "epoch": 0.23, "learning_rate": 0.0002651374429606872, "loss": 0.0742, "step": 36010 }, { "epoch": 0.23, "learning_rate": 0.0002651277616063303, "loss": 0.0734, "step": 36020 }, { "epoch": 0.23, "learning_rate": 0.00026511808025197337, "loss": 0.0632, "step": 36030 }, { "epoch": 0.23, "learning_rate": 0.0002651083988976164, "loss": 0.0726, "step": 36040 }, { "epoch": 0.23, "learning_rate": 0.00026509871754325947, "loss": 0.0772, "step": 36050 }, { "epoch": 0.23, "learning_rate": 0.00026508903618890255, "loss": 0.068, "step": 36060 }, { "epoch": 0.23, "learning_rate": 0.00026507935483454563, "loss": 0.0679, "step": 36070 }, { "epoch": 0.23, "learning_rate": 0.0002650696734801887, "loss": 0.0741, "step": 36080 }, { "epoch": 0.23, "learning_rate": 0.0002650599921258318, "loss": 0.0772, "step": 36090 }, { "epoch": 0.23, "learning_rate": 0.00026505031077147487, "loss": 0.0759, "step": 36100 }, { "epoch": 0.23, "learning_rate": 0.0002650406294171179, "loss": 0.0621, "step": 36110 }, { "epoch": 0.23, "learning_rate": 0.000265030948062761, "loss": 0.0777, "step": 36120 }, { "epoch": 0.23, "learning_rate": 0.00026502126670840406, "loss": 0.0756, "step": 36130 }, { "epoch": 0.23, "learning_rate": 0.0002650115853540471, "loss": 0.0682, "step": 36140 }, { "epoch": 0.23, "learning_rate": 0.00026500190399969016, "loss": 0.0763, "step": 36150 }, { "epoch": 0.23, "learning_rate": 0.00026499222264533324, "loss": 0.0686, "step": 36160 }, { "epoch": 0.23, "learning_rate": 0.0002649825412909763, "loss": 0.0647, "step": 36170 }, { "epoch": 0.23, "learning_rate": 0.00026497285993661935, "loss": 0.0725, "step": 36180 }, { "epoch": 0.23, "learning_rate": 0.0002649631785822624, "loss": 0.0723, "step": 36190 }, { "epoch": 0.23, "learning_rate": 0.0002649534972279055, "loss": 0.0688, "step": 36200 }, { "epoch": 0.23, "learning_rate": 0.0002649438158735486, "loss": 0.0788, "step": 36210 }, { "epoch": 0.23, "learning_rate": 0.00026493413451919167, "loss": 0.0669, "step": 36220 }, { "epoch": 0.23, "learning_rate": 0.00026492445316483475, "loss": 0.0753, "step": 36230 }, { "epoch": 0.23, "learning_rate": 0.0002649147718104778, "loss": 0.0679, "step": 36240 }, { "epoch": 0.23, "learning_rate": 0.00026490509045612085, "loss": 0.0684, "step": 36250 }, { "epoch": 0.23, "learning_rate": 0.00026489540910176393, "loss": 0.0666, "step": 36260 }, { "epoch": 0.23, "learning_rate": 0.000264885727747407, "loss": 0.0681, "step": 36270 }, { "epoch": 0.23, "learning_rate": 0.00026487604639305004, "loss": 0.0743, "step": 36280 }, { "epoch": 0.23, "learning_rate": 0.0002648663650386931, "loss": 0.07, "step": 36290 }, { "epoch": 0.23, "learning_rate": 0.0002648566836843362, "loss": 0.0701, "step": 36300 }, { "epoch": 0.23, "learning_rate": 0.0002648470023299793, "loss": 0.0695, "step": 36310 }, { "epoch": 0.23, "learning_rate": 0.0002648373209756223, "loss": 0.0727, "step": 36320 }, { "epoch": 0.23, "learning_rate": 0.0002648276396212654, "loss": 0.0774, "step": 36330 }, { "epoch": 0.23, "learning_rate": 0.00026481795826690846, "loss": 0.077, "step": 36340 }, { "epoch": 0.23, "learning_rate": 0.00026480827691255154, "loss": 0.0737, "step": 36350 }, { "epoch": 0.23, "learning_rate": 0.0002647985955581946, "loss": 0.0778, "step": 36360 }, { "epoch": 0.23, "learning_rate": 0.0002647889142038377, "loss": 0.0825, "step": 36370 }, { "epoch": 0.23, "learning_rate": 0.0002647792328494807, "loss": 0.0653, "step": 36380 }, { "epoch": 0.23, "learning_rate": 0.0002647695514951238, "loss": 0.0736, "step": 36390 }, { "epoch": 0.23, "learning_rate": 0.0002647598701407669, "loss": 0.0723, "step": 36400 }, { "epoch": 0.23, "learning_rate": 0.0002647501887864099, "loss": 0.0693, "step": 36410 }, { "epoch": 0.24, "learning_rate": 0.000264740507432053, "loss": 0.0706, "step": 36420 }, { "epoch": 0.24, "learning_rate": 0.00026473082607769607, "loss": 0.0679, "step": 36430 }, { "epoch": 0.24, "learning_rate": 0.00026472114472333915, "loss": 0.0745, "step": 36440 }, { "epoch": 0.24, "learning_rate": 0.00026471146336898223, "loss": 0.0835, "step": 36450 }, { "epoch": 0.24, "learning_rate": 0.00026470178201462526, "loss": 0.0814, "step": 36460 }, { "epoch": 0.24, "learning_rate": 0.00026469210066026833, "loss": 0.0654, "step": 36470 }, { "epoch": 0.24, "learning_rate": 0.0002646824193059114, "loss": 0.0668, "step": 36480 }, { "epoch": 0.24, "learning_rate": 0.0002646727379515545, "loss": 0.0745, "step": 36490 }, { "epoch": 0.24, "learning_rate": 0.0002646630565971976, "loss": 0.0791, "step": 36500 }, { "epoch": 0.24, "learning_rate": 0.0002646533752428406, "loss": 0.0712, "step": 36510 }, { "epoch": 0.24, "learning_rate": 0.0002646436938884837, "loss": 0.0901, "step": 36520 }, { "epoch": 0.24, "learning_rate": 0.00026463401253412676, "loss": 0.0742, "step": 36530 }, { "epoch": 0.24, "learning_rate": 0.0002646243311797698, "loss": 0.068, "step": 36540 }, { "epoch": 0.24, "learning_rate": 0.00026461464982541286, "loss": 0.0651, "step": 36550 }, { "epoch": 0.24, "learning_rate": 0.00026460496847105594, "loss": 0.0673, "step": 36560 }, { "epoch": 0.24, "learning_rate": 0.000264595287116699, "loss": 0.0717, "step": 36570 }, { "epoch": 0.24, "learning_rate": 0.0002645856057623421, "loss": 0.0666, "step": 36580 }, { "epoch": 0.24, "learning_rate": 0.0002645759244079852, "loss": 0.0729, "step": 36590 }, { "epoch": 0.24, "learning_rate": 0.0002645662430536282, "loss": 0.0708, "step": 36600 }, { "epoch": 0.24, "learning_rate": 0.0002645565616992713, "loss": 0.0678, "step": 36610 }, { "epoch": 0.24, "learning_rate": 0.00026454688034491437, "loss": 0.0795, "step": 36620 }, { "epoch": 0.24, "learning_rate": 0.00026453719899055745, "loss": 0.0684, "step": 36630 }, { "epoch": 0.24, "learning_rate": 0.00026452751763620053, "loss": 0.0773, "step": 36640 }, { "epoch": 0.24, "learning_rate": 0.00026451783628184355, "loss": 0.0719, "step": 36650 }, { "epoch": 0.24, "learning_rate": 0.00026450815492748663, "loss": 0.082, "step": 36660 }, { "epoch": 0.24, "learning_rate": 0.0002644984735731297, "loss": 0.0634, "step": 36670 }, { "epoch": 0.24, "learning_rate": 0.00026448879221877274, "loss": 0.0754, "step": 36680 }, { "epoch": 0.24, "learning_rate": 0.0002644791108644158, "loss": 0.0702, "step": 36690 }, { "epoch": 0.24, "learning_rate": 0.0002644694295100589, "loss": 0.0684, "step": 36700 }, { "epoch": 0.24, "learning_rate": 0.000264459748155702, "loss": 0.0747, "step": 36710 }, { "epoch": 0.24, "learning_rate": 0.00026445006680134506, "loss": 0.0688, "step": 36720 }, { "epoch": 0.24, "learning_rate": 0.00026444038544698814, "loss": 0.0722, "step": 36730 }, { "epoch": 0.24, "learning_rate": 0.00026443070409263116, "loss": 0.0848, "step": 36740 }, { "epoch": 0.24, "learning_rate": 0.00026442102273827424, "loss": 0.0661, "step": 36750 }, { "epoch": 0.24, "learning_rate": 0.0002644113413839173, "loss": 0.0774, "step": 36760 }, { "epoch": 0.24, "learning_rate": 0.0002644016600295604, "loss": 0.0703, "step": 36770 }, { "epoch": 0.24, "learning_rate": 0.00026439197867520343, "loss": 0.0707, "step": 36780 }, { "epoch": 0.24, "learning_rate": 0.0002643822973208465, "loss": 0.07, "step": 36790 }, { "epoch": 0.24, "learning_rate": 0.0002643726159664896, "loss": 0.0724, "step": 36800 }, { "epoch": 0.24, "learning_rate": 0.0002643629346121326, "loss": 0.0811, "step": 36810 }, { "epoch": 0.24, "learning_rate": 0.0002643532532577757, "loss": 0.0744, "step": 36820 }, { "epoch": 0.24, "learning_rate": 0.0002643435719034188, "loss": 0.0711, "step": 36830 }, { "epoch": 0.24, "learning_rate": 0.00026433389054906185, "loss": 0.0675, "step": 36840 }, { "epoch": 0.24, "learning_rate": 0.00026432420919470493, "loss": 0.0692, "step": 36850 }, { "epoch": 0.24, "learning_rate": 0.000264314527840348, "loss": 0.0755, "step": 36860 }, { "epoch": 0.24, "learning_rate": 0.0002643048464859911, "loss": 0.0667, "step": 36870 }, { "epoch": 0.24, "learning_rate": 0.0002642951651316341, "loss": 0.0677, "step": 36880 }, { "epoch": 0.24, "learning_rate": 0.0002642854837772772, "loss": 0.0728, "step": 36890 }, { "epoch": 0.24, "learning_rate": 0.0002642758024229203, "loss": 0.0687, "step": 36900 }, { "epoch": 0.24, "learning_rate": 0.0002642661210685633, "loss": 0.0644, "step": 36910 }, { "epoch": 0.24, "learning_rate": 0.0002642564397142064, "loss": 0.0709, "step": 36920 }, { "epoch": 0.24, "learning_rate": 0.00026424675835984946, "loss": 0.0785, "step": 36930 }, { "epoch": 0.24, "learning_rate": 0.00026423707700549254, "loss": 0.0673, "step": 36940 }, { "epoch": 0.24, "learning_rate": 0.00026422739565113557, "loss": 0.0752, "step": 36950 }, { "epoch": 0.24, "learning_rate": 0.00026421771429677865, "loss": 0.0741, "step": 36960 }, { "epoch": 0.24, "learning_rate": 0.00026420803294242173, "loss": 0.0701, "step": 36970 }, { "epoch": 0.24, "learning_rate": 0.0002641983515880648, "loss": 0.079, "step": 36980 }, { "epoch": 0.24, "learning_rate": 0.0002641886702337079, "loss": 0.066, "step": 36990 }, { "epoch": 0.24, "learning_rate": 0.00026417898887935097, "loss": 0.0772, "step": 37000 }, { "epoch": 0.24, "eval_cer": 0.9201798666817309, "eval_loss": 0.048399925231933594, "eval_runtime": 120.3324, "eval_samples_per_second": 16.621, "eval_steps_per_second": 4.155, "step": 37000 }, { "epoch": 0.24, "learning_rate": 0.00026416930752499405, "loss": 0.0766, "step": 37010 }, { "epoch": 0.24, "learning_rate": 0.00026415962617063707, "loss": 0.0687, "step": 37020 }, { "epoch": 0.24, "learning_rate": 0.00026414994481628015, "loss": 0.0706, "step": 37030 }, { "epoch": 0.24, "learning_rate": 0.00026414026346192323, "loss": 0.0752, "step": 37040 }, { "epoch": 0.24, "learning_rate": 0.00026413058210756626, "loss": 0.0734, "step": 37050 }, { "epoch": 0.24, "learning_rate": 0.00026412090075320934, "loss": 0.0706, "step": 37060 }, { "epoch": 0.24, "learning_rate": 0.0002641112193988524, "loss": 0.0699, "step": 37070 }, { "epoch": 0.24, "learning_rate": 0.0002641015380444955, "loss": 0.0717, "step": 37080 }, { "epoch": 0.24, "learning_rate": 0.0002640918566901385, "loss": 0.0647, "step": 37090 }, { "epoch": 0.24, "learning_rate": 0.0002640821753357816, "loss": 0.0688, "step": 37100 }, { "epoch": 0.24, "learning_rate": 0.0002640724939814247, "loss": 0.0697, "step": 37110 }, { "epoch": 0.24, "learning_rate": 0.00026406281262706776, "loss": 0.0694, "step": 37120 }, { "epoch": 0.24, "learning_rate": 0.00026405313127271084, "loss": 0.0697, "step": 37130 }, { "epoch": 0.24, "learning_rate": 0.0002640434499183539, "loss": 0.0662, "step": 37140 }, { "epoch": 0.24, "learning_rate": 0.00026403376856399695, "loss": 0.0706, "step": 37150 }, { "epoch": 0.24, "learning_rate": 0.00026402408720964003, "loss": 0.0747, "step": 37160 }, { "epoch": 0.24, "learning_rate": 0.0002640144058552831, "loss": 0.0671, "step": 37170 }, { "epoch": 0.24, "learning_rate": 0.00026400472450092613, "loss": 0.0713, "step": 37180 }, { "epoch": 0.24, "learning_rate": 0.0002639950431465692, "loss": 0.0694, "step": 37190 }, { "epoch": 0.24, "learning_rate": 0.0002639853617922123, "loss": 0.0686, "step": 37200 }, { "epoch": 0.24, "learning_rate": 0.00026397568043785537, "loss": 0.0707, "step": 37210 }, { "epoch": 0.24, "learning_rate": 0.00026396599908349845, "loss": 0.0758, "step": 37220 }, { "epoch": 0.24, "learning_rate": 0.0002639563177291415, "loss": 0.073, "step": 37230 }, { "epoch": 0.24, "learning_rate": 0.00026394663637478456, "loss": 0.0752, "step": 37240 }, { "epoch": 0.24, "learning_rate": 0.00026393695502042764, "loss": 0.0666, "step": 37250 }, { "epoch": 0.24, "learning_rate": 0.0002639272736660707, "loss": 0.0708, "step": 37260 }, { "epoch": 0.24, "learning_rate": 0.0002639175923117138, "loss": 0.0731, "step": 37270 }, { "epoch": 0.24, "learning_rate": 0.0002639079109573569, "loss": 0.0709, "step": 37280 }, { "epoch": 0.24, "learning_rate": 0.0002638982296029999, "loss": 0.0761, "step": 37290 }, { "epoch": 0.24, "learning_rate": 0.000263888548248643, "loss": 0.0681, "step": 37300 }, { "epoch": 0.24, "learning_rate": 0.000263878866894286, "loss": 0.0821, "step": 37310 }, { "epoch": 0.24, "learning_rate": 0.0002638691855399291, "loss": 0.0698, "step": 37320 }, { "epoch": 0.24, "learning_rate": 0.00026385950418557217, "loss": 0.0639, "step": 37330 }, { "epoch": 0.24, "learning_rate": 0.00026384982283121525, "loss": 0.0718, "step": 37340 }, { "epoch": 0.24, "learning_rate": 0.0002638401414768583, "loss": 0.0776, "step": 37350 }, { "epoch": 0.24, "learning_rate": 0.0002638304601225014, "loss": 0.0827, "step": 37360 }, { "epoch": 0.24, "learning_rate": 0.00026382077876814443, "loss": 0.0733, "step": 37370 }, { "epoch": 0.24, "learning_rate": 0.0002638110974137875, "loss": 0.0692, "step": 37380 }, { "epoch": 0.24, "learning_rate": 0.0002638014160594306, "loss": 0.0715, "step": 37390 }, { "epoch": 0.24, "learning_rate": 0.00026379173470507367, "loss": 0.0754, "step": 37400 }, { "epoch": 0.24, "learning_rate": 0.00026378205335071675, "loss": 0.0769, "step": 37410 }, { "epoch": 0.24, "learning_rate": 0.0002637723719963598, "loss": 0.0676, "step": 37420 }, { "epoch": 0.24, "learning_rate": 0.00026376269064200286, "loss": 0.0683, "step": 37430 }, { "epoch": 0.24, "learning_rate": 0.00026375300928764594, "loss": 0.0628, "step": 37440 }, { "epoch": 0.24, "learning_rate": 0.00026374332793328896, "loss": 0.0672, "step": 37450 }, { "epoch": 0.24, "learning_rate": 0.00026373364657893204, "loss": 0.0678, "step": 37460 }, { "epoch": 0.24, "learning_rate": 0.0002637239652245751, "loss": 0.0676, "step": 37470 }, { "epoch": 0.24, "learning_rate": 0.0002637142838702182, "loss": 0.0809, "step": 37480 }, { "epoch": 0.24, "learning_rate": 0.0002637046025158613, "loss": 0.0708, "step": 37490 }, { "epoch": 0.24, "learning_rate": 0.00026369492116150436, "loss": 0.0773, "step": 37500 }, { "epoch": 0.24, "learning_rate": 0.0002636852398071474, "loss": 0.0691, "step": 37510 }, { "epoch": 0.24, "learning_rate": 0.00026367555845279047, "loss": 0.0788, "step": 37520 }, { "epoch": 0.24, "learning_rate": 0.00026366587709843355, "loss": 0.0674, "step": 37530 }, { "epoch": 0.24, "learning_rate": 0.0002636561957440766, "loss": 0.0729, "step": 37540 }, { "epoch": 0.24, "learning_rate": 0.00026364651438971965, "loss": 0.0685, "step": 37550 }, { "epoch": 0.24, "learning_rate": 0.00026363683303536273, "loss": 0.0739, "step": 37560 }, { "epoch": 0.24, "learning_rate": 0.0002636271516810058, "loss": 0.0667, "step": 37570 }, { "epoch": 0.24, "learning_rate": 0.00026361747032664884, "loss": 0.0703, "step": 37580 }, { "epoch": 0.24, "learning_rate": 0.0002636077889722919, "loss": 0.0676, "step": 37590 }, { "epoch": 0.24, "learning_rate": 0.000263598107617935, "loss": 0.0718, "step": 37600 }, { "epoch": 0.24, "learning_rate": 0.0002635884262635781, "loss": 0.0699, "step": 37610 }, { "epoch": 0.24, "learning_rate": 0.00026357874490922116, "loss": 0.0724, "step": 37620 }, { "epoch": 0.24, "learning_rate": 0.00026356906355486424, "loss": 0.0615, "step": 37630 }, { "epoch": 0.24, "learning_rate": 0.0002635593822005073, "loss": 0.0718, "step": 37640 }, { "epoch": 0.24, "learning_rate": 0.00026354970084615034, "loss": 0.0736, "step": 37650 }, { "epoch": 0.24, "learning_rate": 0.0002635400194917934, "loss": 0.0695, "step": 37660 }, { "epoch": 0.24, "learning_rate": 0.0002635303381374365, "loss": 0.0691, "step": 37670 }, { "epoch": 0.24, "learning_rate": 0.0002635206567830796, "loss": 0.0686, "step": 37680 }, { "epoch": 0.24, "learning_rate": 0.0002635109754287226, "loss": 0.0676, "step": 37690 }, { "epoch": 0.24, "learning_rate": 0.0002635012940743657, "loss": 0.068, "step": 37700 }, { "epoch": 0.24, "learning_rate": 0.00026349161272000877, "loss": 0.0707, "step": 37710 }, { "epoch": 0.24, "learning_rate": 0.0002634819313656518, "loss": 0.0675, "step": 37720 }, { "epoch": 0.24, "learning_rate": 0.00026347225001129487, "loss": 0.0699, "step": 37730 }, { "epoch": 0.24, "learning_rate": 0.00026346256865693795, "loss": 0.078, "step": 37740 }, { "epoch": 0.24, "learning_rate": 0.00026345288730258103, "loss": 0.0687, "step": 37750 }, { "epoch": 0.24, "learning_rate": 0.0002634432059482241, "loss": 0.072, "step": 37760 }, { "epoch": 0.24, "learning_rate": 0.0002634335245938672, "loss": 0.076, "step": 37770 }, { "epoch": 0.24, "learning_rate": 0.00026342384323951027, "loss": 0.084, "step": 37780 }, { "epoch": 0.24, "learning_rate": 0.0002634141618851533, "loss": 0.0754, "step": 37790 }, { "epoch": 0.24, "learning_rate": 0.0002634044805307964, "loss": 0.0702, "step": 37800 }, { "epoch": 0.24, "learning_rate": 0.00026339479917643945, "loss": 0.0712, "step": 37810 }, { "epoch": 0.24, "learning_rate": 0.0002633851178220825, "loss": 0.0796, "step": 37820 }, { "epoch": 0.24, "learning_rate": 0.00026337543646772556, "loss": 0.0722, "step": 37830 }, { "epoch": 0.24, "learning_rate": 0.00026336575511336864, "loss": 0.0721, "step": 37840 }, { "epoch": 0.24, "learning_rate": 0.0002633560737590117, "loss": 0.0752, "step": 37850 }, { "epoch": 0.24, "learning_rate": 0.00026334639240465475, "loss": 0.0761, "step": 37860 }, { "epoch": 0.24, "learning_rate": 0.0002633367110502978, "loss": 0.0692, "step": 37870 }, { "epoch": 0.24, "learning_rate": 0.0002633270296959409, "loss": 0.076, "step": 37880 }, { "epoch": 0.24, "learning_rate": 0.000263317348341584, "loss": 0.0737, "step": 37890 }, { "epoch": 0.24, "learning_rate": 0.00026330766698722706, "loss": 0.0772, "step": 37900 }, { "epoch": 0.24, "learning_rate": 0.00026329798563287014, "loss": 0.0726, "step": 37910 }, { "epoch": 0.24, "learning_rate": 0.00026328830427851317, "loss": 0.0741, "step": 37920 }, { "epoch": 0.24, "learning_rate": 0.00026327862292415625, "loss": 0.0724, "step": 37930 }, { "epoch": 0.24, "learning_rate": 0.00026326894156979933, "loss": 0.0675, "step": 37940 }, { "epoch": 0.24, "learning_rate": 0.00026325926021544236, "loss": 0.0645, "step": 37950 }, { "epoch": 0.25, "learning_rate": 0.00026324957886108543, "loss": 0.0759, "step": 37960 }, { "epoch": 0.25, "learning_rate": 0.0002632398975067285, "loss": 0.0757, "step": 37970 }, { "epoch": 0.25, "learning_rate": 0.0002632302161523716, "loss": 0.0709, "step": 37980 }, { "epoch": 0.25, "learning_rate": 0.0002632205347980146, "loss": 0.0755, "step": 37990 }, { "epoch": 0.25, "learning_rate": 0.0002632108534436577, "loss": 0.073, "step": 38000 }, { "epoch": 0.25, "eval_cer": 0.9201852897977629, "eval_loss": 0.04867184907197952, "eval_runtime": 120.3167, "eval_samples_per_second": 16.623, "eval_steps_per_second": 4.156, "step": 38000 }, { "epoch": 0.25, "learning_rate": 0.0002632011720893008, "loss": 0.0725, "step": 38010 }, { "epoch": 0.25, "learning_rate": 0.00026319149073494386, "loss": 0.0761, "step": 38020 }, { "epoch": 0.25, "learning_rate": 0.00026318180938058694, "loss": 0.0714, "step": 38030 }, { "epoch": 0.25, "learning_rate": 0.00026317212802623, "loss": 0.067, "step": 38040 }, { "epoch": 0.25, "learning_rate": 0.0002631624466718731, "loss": 0.072, "step": 38050 }, { "epoch": 0.25, "learning_rate": 0.0002631527653175161, "loss": 0.0667, "step": 38060 }, { "epoch": 0.25, "learning_rate": 0.0002631430839631592, "loss": 0.0668, "step": 38070 }, { "epoch": 0.25, "learning_rate": 0.0002631334026088023, "loss": 0.0633, "step": 38080 }, { "epoch": 0.25, "learning_rate": 0.0002631237212544453, "loss": 0.0704, "step": 38090 }, { "epoch": 0.25, "learning_rate": 0.0002631140399000884, "loss": 0.0718, "step": 38100 }, { "epoch": 0.25, "learning_rate": 0.00026310435854573147, "loss": 0.0672, "step": 38110 }, { "epoch": 0.25, "learning_rate": 0.00026309467719137455, "loss": 0.0715, "step": 38120 }, { "epoch": 0.25, "learning_rate": 0.0002630849958370176, "loss": 0.0651, "step": 38130 }, { "epoch": 0.25, "learning_rate": 0.00026307531448266065, "loss": 0.0653, "step": 38140 }, { "epoch": 0.25, "learning_rate": 0.00026306563312830373, "loss": 0.0691, "step": 38150 }, { "epoch": 0.25, "learning_rate": 0.0002630559517739468, "loss": 0.0655, "step": 38160 }, { "epoch": 0.25, "learning_rate": 0.0002630462704195899, "loss": 0.0773, "step": 38170 }, { "epoch": 0.25, "learning_rate": 0.000263036589065233, "loss": 0.0783, "step": 38180 }, { "epoch": 0.25, "learning_rate": 0.000263026907710876, "loss": 0.0717, "step": 38190 }, { "epoch": 0.25, "learning_rate": 0.0002630172263565191, "loss": 0.0715, "step": 38200 }, { "epoch": 0.25, "learning_rate": 0.00026300754500216216, "loss": 0.0805, "step": 38210 }, { "epoch": 0.25, "learning_rate": 0.0002629978636478052, "loss": 0.0672, "step": 38220 }, { "epoch": 0.25, "learning_rate": 0.00026298818229344826, "loss": 0.0806, "step": 38230 }, { "epoch": 0.25, "learning_rate": 0.00026297850093909134, "loss": 0.0668, "step": 38240 }, { "epoch": 0.25, "learning_rate": 0.0002629688195847344, "loss": 0.0742, "step": 38250 }, { "epoch": 0.25, "learning_rate": 0.0002629591382303775, "loss": 0.0722, "step": 38260 }, { "epoch": 0.25, "learning_rate": 0.00026294945687602053, "loss": 0.0859, "step": 38270 }, { "epoch": 0.25, "learning_rate": 0.0002629397755216636, "loss": 0.0744, "step": 38280 }, { "epoch": 0.25, "learning_rate": 0.0002629300941673067, "loss": 0.0758, "step": 38290 }, { "epoch": 0.25, "learning_rate": 0.00026292041281294977, "loss": 0.0772, "step": 38300 }, { "epoch": 0.25, "learning_rate": 0.00026291073145859285, "loss": 0.068, "step": 38310 }, { "epoch": 0.25, "learning_rate": 0.0002629010501042359, "loss": 0.0693, "step": 38320 }, { "epoch": 0.25, "learning_rate": 0.00026289136874987895, "loss": 0.0714, "step": 38330 }, { "epoch": 0.25, "learning_rate": 0.00026288168739552203, "loss": 0.0769, "step": 38340 }, { "epoch": 0.25, "learning_rate": 0.00026287200604116506, "loss": 0.0692, "step": 38350 }, { "epoch": 0.25, "learning_rate": 0.00026286232468680814, "loss": 0.0671, "step": 38360 }, { "epoch": 0.25, "learning_rate": 0.0002628526433324512, "loss": 0.0676, "step": 38370 }, { "epoch": 0.25, "learning_rate": 0.0002628429619780943, "loss": 0.0744, "step": 38380 }, { "epoch": 0.25, "learning_rate": 0.0002628332806237374, "loss": 0.0661, "step": 38390 }, { "epoch": 0.25, "learning_rate": 0.00026282359926938046, "loss": 0.0743, "step": 38400 }, { "epoch": 0.25, "learning_rate": 0.0002628139179150235, "loss": 0.0728, "step": 38410 }, { "epoch": 0.25, "learning_rate": 0.00026280423656066656, "loss": 0.0728, "step": 38420 }, { "epoch": 0.25, "learning_rate": 0.00026279455520630964, "loss": 0.0676, "step": 38430 }, { "epoch": 0.25, "learning_rate": 0.0002627848738519527, "loss": 0.0721, "step": 38440 }, { "epoch": 0.25, "learning_rate": 0.0002627751924975958, "loss": 0.0768, "step": 38450 }, { "epoch": 0.25, "learning_rate": 0.00026276551114323883, "loss": 0.0751, "step": 38460 }, { "epoch": 0.25, "learning_rate": 0.0002627558297888819, "loss": 0.0768, "step": 38470 }, { "epoch": 0.25, "learning_rate": 0.000262746148434525, "loss": 0.0729, "step": 38480 }, { "epoch": 0.25, "learning_rate": 0.000262736467080168, "loss": 0.0702, "step": 38490 }, { "epoch": 0.25, "learning_rate": 0.0002627267857258111, "loss": 0.0682, "step": 38500 }, { "epoch": 0.25, "learning_rate": 0.00026271710437145417, "loss": 0.0674, "step": 38510 }, { "epoch": 0.25, "learning_rate": 0.00026270742301709725, "loss": 0.0731, "step": 38520 }, { "epoch": 0.25, "learning_rate": 0.00026269774166274033, "loss": 0.0696, "step": 38530 }, { "epoch": 0.25, "learning_rate": 0.0002626880603083834, "loss": 0.0621, "step": 38540 }, { "epoch": 0.25, "learning_rate": 0.00026267837895402644, "loss": 0.0762, "step": 38550 }, { "epoch": 0.25, "learning_rate": 0.0002626686975996695, "loss": 0.0672, "step": 38560 }, { "epoch": 0.25, "learning_rate": 0.0002626590162453126, "loss": 0.0696, "step": 38570 }, { "epoch": 0.25, "learning_rate": 0.0002626493348909557, "loss": 0.0792, "step": 38580 }, { "epoch": 0.25, "learning_rate": 0.0002626396535365987, "loss": 0.0636, "step": 38590 }, { "epoch": 0.25, "learning_rate": 0.0002626299721822418, "loss": 0.0707, "step": 38600 }, { "epoch": 0.25, "learning_rate": 0.00026262029082788486, "loss": 0.0725, "step": 38610 }, { "epoch": 0.25, "learning_rate": 0.0002626106094735279, "loss": 0.0743, "step": 38620 }, { "epoch": 0.25, "learning_rate": 0.00026260092811917097, "loss": 0.0726, "step": 38630 }, { "epoch": 0.25, "learning_rate": 0.00026259124676481405, "loss": 0.0691, "step": 38640 }, { "epoch": 0.25, "learning_rate": 0.00026258156541045713, "loss": 0.0754, "step": 38650 }, { "epoch": 0.25, "learning_rate": 0.0002625718840561002, "loss": 0.0714, "step": 38660 }, { "epoch": 0.25, "learning_rate": 0.0002625622027017433, "loss": 0.0675, "step": 38670 }, { "epoch": 0.25, "learning_rate": 0.00026255252134738637, "loss": 0.0712, "step": 38680 }, { "epoch": 0.25, "learning_rate": 0.0002625428399930294, "loss": 0.0644, "step": 38690 }, { "epoch": 0.25, "learning_rate": 0.00026253315863867247, "loss": 0.0717, "step": 38700 }, { "epoch": 0.25, "learning_rate": 0.00026252347728431555, "loss": 0.0642, "step": 38710 }, { "epoch": 0.25, "learning_rate": 0.0002625137959299586, "loss": 0.0692, "step": 38720 }, { "epoch": 0.25, "learning_rate": 0.00026250411457560166, "loss": 0.0716, "step": 38730 }, { "epoch": 0.25, "learning_rate": 0.00026249443322124474, "loss": 0.077, "step": 38740 }, { "epoch": 0.25, "learning_rate": 0.0002624847518668878, "loss": 0.0746, "step": 38750 }, { "epoch": 0.25, "learning_rate": 0.00026247507051253084, "loss": 0.0706, "step": 38760 }, { "epoch": 0.25, "learning_rate": 0.0002624653891581739, "loss": 0.0779, "step": 38770 }, { "epoch": 0.25, "learning_rate": 0.000262455707803817, "loss": 0.0841, "step": 38780 }, { "epoch": 0.25, "learning_rate": 0.0002624460264494601, "loss": 0.0688, "step": 38790 }, { "epoch": 0.25, "learning_rate": 0.00026243634509510316, "loss": 0.0638, "step": 38800 }, { "epoch": 0.25, "learning_rate": 0.00026242666374074624, "loss": 0.0716, "step": 38810 }, { "epoch": 0.25, "learning_rate": 0.0002624169823863893, "loss": 0.0717, "step": 38820 }, { "epoch": 0.25, "learning_rate": 0.00026240730103203235, "loss": 0.08, "step": 38830 }, { "epoch": 0.25, "learning_rate": 0.0002623976196776754, "loss": 0.0915, "step": 38840 }, { "epoch": 0.25, "learning_rate": 0.0002623879383233185, "loss": 0.0671, "step": 38850 }, { "epoch": 0.25, "learning_rate": 0.00026237825696896153, "loss": 0.0744, "step": 38860 }, { "epoch": 0.25, "learning_rate": 0.0002623685756146046, "loss": 0.0759, "step": 38870 }, { "epoch": 0.25, "learning_rate": 0.0002623588942602477, "loss": 0.0671, "step": 38880 }, { "epoch": 0.25, "learning_rate": 0.00026234921290589077, "loss": 0.0693, "step": 38890 }, { "epoch": 0.25, "learning_rate": 0.0002623395315515338, "loss": 0.0708, "step": 38900 }, { "epoch": 0.25, "learning_rate": 0.0002623298501971769, "loss": 0.0661, "step": 38910 }, { "epoch": 0.25, "learning_rate": 0.00026232016884281996, "loss": 0.0711, "step": 38920 }, { "epoch": 0.25, "learning_rate": 0.00026231048748846304, "loss": 0.0744, "step": 38930 }, { "epoch": 0.25, "learning_rate": 0.0002623008061341061, "loss": 0.0736, "step": 38940 }, { "epoch": 0.25, "learning_rate": 0.0002622911247797492, "loss": 0.0663, "step": 38950 }, { "epoch": 0.25, "learning_rate": 0.0002622814434253922, "loss": 0.0689, "step": 38960 }, { "epoch": 0.25, "learning_rate": 0.0002622717620710353, "loss": 0.0679, "step": 38970 }, { "epoch": 0.25, "learning_rate": 0.0002622620807166784, "loss": 0.0678, "step": 38980 }, { "epoch": 0.25, "learning_rate": 0.0002622523993623214, "loss": 0.0731, "step": 38990 }, { "epoch": 0.25, "learning_rate": 0.0002622427180079645, "loss": 0.0675, "step": 39000 }, { "epoch": 0.25, "eval_cer": 0.919996384589312, "eval_loss": 0.047410257160663605, "eval_runtime": 120.2237, "eval_samples_per_second": 16.636, "eval_steps_per_second": 4.159, "step": 39000 }, { "epoch": 0.25, "learning_rate": 0.00026223303665360757, "loss": 0.0729, "step": 39010 }, { "epoch": 0.25, "learning_rate": 0.00026222335529925065, "loss": 0.0711, "step": 39020 }, { "epoch": 0.25, "learning_rate": 0.0002622136739448937, "loss": 0.0652, "step": 39030 }, { "epoch": 0.25, "learning_rate": 0.00026220399259053675, "loss": 0.0658, "step": 39040 }, { "epoch": 0.25, "learning_rate": 0.00026219431123617983, "loss": 0.0686, "step": 39050 }, { "epoch": 0.25, "learning_rate": 0.0002621846298818229, "loss": 0.0653, "step": 39060 }, { "epoch": 0.25, "learning_rate": 0.000262174948527466, "loss": 0.068, "step": 39070 }, { "epoch": 0.25, "learning_rate": 0.00026216526717310907, "loss": 0.0674, "step": 39080 }, { "epoch": 0.25, "learning_rate": 0.0002621555858187521, "loss": 0.0613, "step": 39090 }, { "epoch": 0.25, "learning_rate": 0.0002621459044643952, "loss": 0.0705, "step": 39100 }, { "epoch": 0.25, "learning_rate": 0.00026213622311003826, "loss": 0.0632, "step": 39110 }, { "epoch": 0.25, "learning_rate": 0.0002621265417556813, "loss": 0.0621, "step": 39120 }, { "epoch": 0.25, "learning_rate": 0.00026211686040132436, "loss": 0.0717, "step": 39130 }, { "epoch": 0.25, "learning_rate": 0.00026210717904696744, "loss": 0.0715, "step": 39140 }, { "epoch": 0.25, "learning_rate": 0.0002620974976926105, "loss": 0.0672, "step": 39150 }, { "epoch": 0.25, "learning_rate": 0.0002620878163382536, "loss": 0.0664, "step": 39160 }, { "epoch": 0.25, "learning_rate": 0.0002620781349838967, "loss": 0.0683, "step": 39170 }, { "epoch": 0.25, "learning_rate": 0.0002620684536295397, "loss": 0.068, "step": 39180 }, { "epoch": 0.25, "learning_rate": 0.0002620587722751828, "loss": 0.0634, "step": 39190 }, { "epoch": 0.25, "learning_rate": 0.00026204909092082587, "loss": 0.068, "step": 39200 }, { "epoch": 0.25, "learning_rate": 0.00026203940956646895, "loss": 0.0736, "step": 39210 }, { "epoch": 0.25, "learning_rate": 0.000262029728212112, "loss": 0.0626, "step": 39220 }, { "epoch": 0.25, "learning_rate": 0.00026202004685775505, "loss": 0.0634, "step": 39230 }, { "epoch": 0.25, "learning_rate": 0.00026201036550339813, "loss": 0.0632, "step": 39240 }, { "epoch": 0.25, "learning_rate": 0.0002620006841490412, "loss": 0.064, "step": 39250 }, { "epoch": 0.25, "learning_rate": 0.00026199100279468424, "loss": 0.063, "step": 39260 }, { "epoch": 0.25, "learning_rate": 0.0002619813214403273, "loss": 0.0707, "step": 39270 }, { "epoch": 0.25, "learning_rate": 0.0002619716400859704, "loss": 0.0661, "step": 39280 }, { "epoch": 0.25, "learning_rate": 0.0002619619587316135, "loss": 0.0609, "step": 39290 }, { "epoch": 0.25, "learning_rate": 0.00026195227737725655, "loss": 0.0663, "step": 39300 }, { "epoch": 0.25, "learning_rate": 0.00026194259602289963, "loss": 0.064, "step": 39310 }, { "epoch": 0.25, "learning_rate": 0.00026193291466854266, "loss": 0.0713, "step": 39320 }, { "epoch": 0.25, "learning_rate": 0.00026192323331418574, "loss": 0.0702, "step": 39330 }, { "epoch": 0.25, "learning_rate": 0.0002619135519598288, "loss": 0.0598, "step": 39340 }, { "epoch": 0.25, "learning_rate": 0.0002619038706054719, "loss": 0.074, "step": 39350 }, { "epoch": 0.25, "learning_rate": 0.0002618941892511149, "loss": 0.0678, "step": 39360 }, { "epoch": 0.25, "learning_rate": 0.000261884507896758, "loss": 0.0672, "step": 39370 }, { "epoch": 0.25, "learning_rate": 0.0002618748265424011, "loss": 0.0752, "step": 39380 }, { "epoch": 0.25, "learning_rate": 0.0002618651451880441, "loss": 0.0799, "step": 39390 }, { "epoch": 0.25, "learning_rate": 0.0002618554638336872, "loss": 0.082, "step": 39400 }, { "epoch": 0.25, "learning_rate": 0.00026184578247933027, "loss": 0.0672, "step": 39410 }, { "epoch": 0.25, "learning_rate": 0.00026183610112497335, "loss": 0.0697, "step": 39420 }, { "epoch": 0.25, "learning_rate": 0.00026182641977061643, "loss": 0.0677, "step": 39430 }, { "epoch": 0.25, "learning_rate": 0.0002618167384162595, "loss": 0.0627, "step": 39440 }, { "epoch": 0.25, "learning_rate": 0.0002618070570619026, "loss": 0.0687, "step": 39450 }, { "epoch": 0.25, "learning_rate": 0.0002617973757075456, "loss": 0.0743, "step": 39460 }, { "epoch": 0.25, "learning_rate": 0.0002617876943531887, "loss": 0.0949, "step": 39470 }, { "epoch": 0.25, "learning_rate": 0.0002617780129988318, "loss": 0.0829, "step": 39480 }, { "epoch": 0.25, "learning_rate": 0.0002617683316444748, "loss": 0.0723, "step": 39490 }, { "epoch": 0.25, "learning_rate": 0.0002617586502901179, "loss": 0.083, "step": 39500 }, { "epoch": 0.26, "learning_rate": 0.00026174896893576096, "loss": 0.0666, "step": 39510 }, { "epoch": 0.26, "learning_rate": 0.00026173928758140404, "loss": 0.0693, "step": 39520 }, { "epoch": 0.26, "learning_rate": 0.00026172960622704706, "loss": 0.0681, "step": 39530 }, { "epoch": 0.26, "learning_rate": 0.00026171992487269014, "loss": 0.0859, "step": 39540 }, { "epoch": 0.26, "learning_rate": 0.0002617102435183332, "loss": 0.0696, "step": 39550 }, { "epoch": 0.26, "learning_rate": 0.0002617005621639763, "loss": 0.0667, "step": 39560 }, { "epoch": 0.26, "learning_rate": 0.0002616908808096194, "loss": 0.0708, "step": 39570 }, { "epoch": 0.26, "learning_rate": 0.00026168119945526246, "loss": 0.0687, "step": 39580 }, { "epoch": 0.26, "learning_rate": 0.00026167151810090554, "loss": 0.0783, "step": 39590 }, { "epoch": 0.26, "learning_rate": 0.00026166183674654857, "loss": 0.0698, "step": 39600 }, { "epoch": 0.26, "learning_rate": 0.00026165215539219165, "loss": 0.0739, "step": 39610 }, { "epoch": 0.26, "learning_rate": 0.00026164247403783473, "loss": 0.0664, "step": 39620 }, { "epoch": 0.26, "learning_rate": 0.00026163279268347775, "loss": 0.0647, "step": 39630 }, { "epoch": 0.26, "learning_rate": 0.00026162311132912083, "loss": 0.0648, "step": 39640 }, { "epoch": 0.26, "learning_rate": 0.0002616134299747639, "loss": 0.0659, "step": 39650 }, { "epoch": 0.26, "learning_rate": 0.000261603748620407, "loss": 0.0722, "step": 39660 }, { "epoch": 0.26, "learning_rate": 0.00026159406726605, "loss": 0.0678, "step": 39670 }, { "epoch": 0.26, "learning_rate": 0.0002615843859116931, "loss": 0.0683, "step": 39680 }, { "epoch": 0.26, "learning_rate": 0.0002615747045573362, "loss": 0.0668, "step": 39690 }, { "epoch": 0.26, "learning_rate": 0.00026156502320297926, "loss": 0.0703, "step": 39700 }, { "epoch": 0.26, "learning_rate": 0.00026155534184862234, "loss": 0.0656, "step": 39710 }, { "epoch": 0.26, "learning_rate": 0.0002615456604942654, "loss": 0.0656, "step": 39720 }, { "epoch": 0.26, "learning_rate": 0.00026153597913990844, "loss": 0.0736, "step": 39730 }, { "epoch": 0.26, "learning_rate": 0.0002615262977855515, "loss": 0.0635, "step": 39740 }, { "epoch": 0.26, "learning_rate": 0.0002615166164311946, "loss": 0.0666, "step": 39750 }, { "epoch": 0.26, "learning_rate": 0.00026150693507683763, "loss": 0.0656, "step": 39760 }, { "epoch": 0.26, "learning_rate": 0.0002614972537224807, "loss": 0.0713, "step": 39770 }, { "epoch": 0.26, "learning_rate": 0.0002614875723681238, "loss": 0.0647, "step": 39780 }, { "epoch": 0.26, "learning_rate": 0.00026147789101376687, "loss": 0.0696, "step": 39790 }, { "epoch": 0.26, "learning_rate": 0.00026146820965940995, "loss": 0.0705, "step": 39800 }, { "epoch": 0.26, "learning_rate": 0.000261458528305053, "loss": 0.0796, "step": 39810 }, { "epoch": 0.26, "learning_rate": 0.00026144884695069605, "loss": 0.0673, "step": 39820 }, { "epoch": 0.26, "learning_rate": 0.00026143916559633913, "loss": 0.0744, "step": 39830 }, { "epoch": 0.26, "learning_rate": 0.0002614294842419822, "loss": 0.07, "step": 39840 }, { "epoch": 0.26, "learning_rate": 0.0002614198028876253, "loss": 0.0611, "step": 39850 }, { "epoch": 0.26, "learning_rate": 0.00026141012153326837, "loss": 0.0649, "step": 39860 }, { "epoch": 0.26, "learning_rate": 0.0002614004401789114, "loss": 0.0739, "step": 39870 }, { "epoch": 0.26, "learning_rate": 0.0002613907588245545, "loss": 0.0715, "step": 39880 }, { "epoch": 0.26, "learning_rate": 0.00026138107747019756, "loss": 0.069, "step": 39890 }, { "epoch": 0.26, "learning_rate": 0.0002613713961158406, "loss": 0.067, "step": 39900 }, { "epoch": 0.26, "learning_rate": 0.00026136171476148366, "loss": 0.0665, "step": 39910 }, { "epoch": 0.26, "learning_rate": 0.00026135203340712674, "loss": 0.0727, "step": 39920 }, { "epoch": 0.26, "learning_rate": 0.0002613423520527698, "loss": 0.0735, "step": 39930 }, { "epoch": 0.26, "learning_rate": 0.0002613326706984129, "loss": 0.071, "step": 39940 }, { "epoch": 0.26, "learning_rate": 0.00026132298934405593, "loss": 0.0679, "step": 39950 }, { "epoch": 0.26, "learning_rate": 0.000261313307989699, "loss": 0.0736, "step": 39960 }, { "epoch": 0.26, "learning_rate": 0.0002613036266353421, "loss": 0.0731, "step": 39970 }, { "epoch": 0.26, "learning_rate": 0.00026129394528098517, "loss": 0.0618, "step": 39980 }, { "epoch": 0.26, "learning_rate": 0.00026128426392662825, "loss": 0.0672, "step": 39990 }, { "epoch": 0.26, "learning_rate": 0.0002612745825722713, "loss": 0.0739, "step": 40000 }, { "epoch": 0.26, "eval_cer": 0.9201039430572817, "eval_loss": 0.04600047320127487, "eval_runtime": 120.2571, "eval_samples_per_second": 16.631, "eval_steps_per_second": 4.158, "step": 40000 }, { "epoch": 0.26, "learning_rate": 0.00026126490121791435, "loss": 0.0708, "step": 40010 }, { "epoch": 0.26, "learning_rate": 0.00026125521986355743, "loss": 0.068, "step": 40020 }, { "epoch": 0.26, "learning_rate": 0.00026124553850920046, "loss": 0.072, "step": 40030 }, { "epoch": 0.26, "learning_rate": 0.00026123585715484354, "loss": 0.0924, "step": 40040 }, { "epoch": 0.26, "learning_rate": 0.0002612261758004866, "loss": 0.0713, "step": 40050 }, { "epoch": 0.26, "learning_rate": 0.0002612164944461297, "loss": 0.079, "step": 40060 }, { "epoch": 0.26, "learning_rate": 0.0002612068130917728, "loss": 0.0671, "step": 40070 }, { "epoch": 0.26, "learning_rate": 0.00026119713173741586, "loss": 0.0696, "step": 40080 }, { "epoch": 0.26, "learning_rate": 0.0002611874503830589, "loss": 0.0801, "step": 40090 }, { "epoch": 0.26, "learning_rate": 0.00026117776902870196, "loss": 0.0718, "step": 40100 }, { "epoch": 0.26, "learning_rate": 0.00026116808767434504, "loss": 0.0659, "step": 40110 }, { "epoch": 0.26, "learning_rate": 0.0002611584063199881, "loss": 0.0664, "step": 40120 }, { "epoch": 0.26, "learning_rate": 0.00026114872496563115, "loss": 0.068, "step": 40130 }, { "epoch": 0.26, "learning_rate": 0.00026113904361127423, "loss": 0.0695, "step": 40140 }, { "epoch": 0.26, "learning_rate": 0.0002611293622569173, "loss": 0.073, "step": 40150 }, { "epoch": 0.26, "learning_rate": 0.00026111968090256033, "loss": 0.0678, "step": 40160 }, { "epoch": 0.26, "learning_rate": 0.0002611099995482034, "loss": 0.0737, "step": 40170 }, { "epoch": 0.26, "learning_rate": 0.0002611003181938465, "loss": 0.0772, "step": 40180 }, { "epoch": 0.26, "learning_rate": 0.00026109063683948957, "loss": 0.0747, "step": 40190 }, { "epoch": 0.26, "learning_rate": 0.00026108095548513265, "loss": 0.0703, "step": 40200 }, { "epoch": 0.26, "learning_rate": 0.00026107127413077573, "loss": 0.0665, "step": 40210 }, { "epoch": 0.26, "learning_rate": 0.0002610615927764188, "loss": 0.0668, "step": 40220 }, { "epoch": 0.26, "learning_rate": 0.00026105191142206184, "loss": 0.0707, "step": 40230 }, { "epoch": 0.26, "learning_rate": 0.0002610422300677049, "loss": 0.0698, "step": 40240 }, { "epoch": 0.26, "learning_rate": 0.000261032548713348, "loss": 0.0701, "step": 40250 }, { "epoch": 0.26, "learning_rate": 0.0002610228673589911, "loss": 0.0639, "step": 40260 }, { "epoch": 0.26, "learning_rate": 0.0002610131860046341, "loss": 0.066, "step": 40270 }, { "epoch": 0.26, "learning_rate": 0.0002610035046502772, "loss": 0.0742, "step": 40280 }, { "epoch": 0.26, "learning_rate": 0.00026099382329592026, "loss": 0.0639, "step": 40290 }, { "epoch": 0.26, "learning_rate": 0.0002609841419415633, "loss": 0.0643, "step": 40300 }, { "epoch": 0.26, "learning_rate": 0.00026097446058720637, "loss": 0.0625, "step": 40310 }, { "epoch": 0.26, "learning_rate": 0.00026096477923284945, "loss": 0.0689, "step": 40320 }, { "epoch": 0.26, "learning_rate": 0.0002609550978784925, "loss": 0.0733, "step": 40330 }, { "epoch": 0.26, "learning_rate": 0.0002609454165241356, "loss": 0.0706, "step": 40340 }, { "epoch": 0.26, "learning_rate": 0.0002609357351697787, "loss": 0.0666, "step": 40350 }, { "epoch": 0.26, "learning_rate": 0.00026092605381542177, "loss": 0.0666, "step": 40360 }, { "epoch": 0.26, "learning_rate": 0.0002609163724610648, "loss": 0.0712, "step": 40370 }, { "epoch": 0.26, "learning_rate": 0.00026090669110670787, "loss": 0.0644, "step": 40380 }, { "epoch": 0.26, "learning_rate": 0.00026089700975235095, "loss": 0.0697, "step": 40390 }, { "epoch": 0.26, "learning_rate": 0.000260887328397994, "loss": 0.0684, "step": 40400 }, { "epoch": 0.26, "learning_rate": 0.00026087764704363706, "loss": 0.0702, "step": 40410 }, { "epoch": 0.26, "learning_rate": 0.00026086796568928014, "loss": 0.0698, "step": 40420 }, { "epoch": 0.26, "learning_rate": 0.0002608582843349232, "loss": 0.0655, "step": 40430 }, { "epoch": 0.26, "learning_rate": 0.00026084860298056624, "loss": 0.0614, "step": 40440 }, { "epoch": 0.26, "learning_rate": 0.0002608389216262093, "loss": 0.0706, "step": 40450 }, { "epoch": 0.26, "learning_rate": 0.0002608292402718524, "loss": 0.0693, "step": 40460 }, { "epoch": 0.26, "learning_rate": 0.0002608195589174955, "loss": 0.072, "step": 40470 }, { "epoch": 0.26, "learning_rate": 0.00026080987756313856, "loss": 0.0682, "step": 40480 }, { "epoch": 0.26, "learning_rate": 0.00026080019620878164, "loss": 0.0607, "step": 40490 }, { "epoch": 0.26, "learning_rate": 0.00026079051485442467, "loss": 0.0703, "step": 40500 }, { "epoch": 0.26, "learning_rate": 0.00026078083350006775, "loss": 0.0703, "step": 40510 }, { "epoch": 0.26, "learning_rate": 0.0002607711521457108, "loss": 0.0669, "step": 40520 }, { "epoch": 0.26, "learning_rate": 0.00026076147079135385, "loss": 0.0707, "step": 40530 }, { "epoch": 0.26, "learning_rate": 0.00026075178943699693, "loss": 0.0648, "step": 40540 }, { "epoch": 0.26, "learning_rate": 0.00026074210808264, "loss": 0.0741, "step": 40550 }, { "epoch": 0.26, "learning_rate": 0.0002607324267282831, "loss": 0.0701, "step": 40560 }, { "epoch": 0.26, "learning_rate": 0.00026072274537392617, "loss": 0.0689, "step": 40570 }, { "epoch": 0.26, "learning_rate": 0.0002607130640195692, "loss": 0.072, "step": 40580 }, { "epoch": 0.26, "learning_rate": 0.0002607033826652123, "loss": 0.0678, "step": 40590 }, { "epoch": 0.26, "learning_rate": 0.00026069370131085536, "loss": 0.0699, "step": 40600 }, { "epoch": 0.26, "learning_rate": 0.00026068401995649844, "loss": 0.072, "step": 40610 }, { "epoch": 0.26, "learning_rate": 0.0002606743386021415, "loss": 0.0732, "step": 40620 }, { "epoch": 0.26, "learning_rate": 0.0002606646572477846, "loss": 0.0663, "step": 40630 }, { "epoch": 0.26, "learning_rate": 0.0002606549758934276, "loss": 0.0701, "step": 40640 }, { "epoch": 0.26, "learning_rate": 0.0002606452945390707, "loss": 0.0681, "step": 40650 }, { "epoch": 0.26, "learning_rate": 0.0002606356131847138, "loss": 0.0659, "step": 40660 }, { "epoch": 0.26, "learning_rate": 0.0002606259318303568, "loss": 0.0775, "step": 40670 }, { "epoch": 0.26, "learning_rate": 0.0002606162504759999, "loss": 0.066, "step": 40680 }, { "epoch": 0.26, "learning_rate": 0.00026060656912164297, "loss": 0.0661, "step": 40690 }, { "epoch": 0.26, "learning_rate": 0.00026059688776728605, "loss": 0.0654, "step": 40700 }, { "epoch": 0.26, "learning_rate": 0.0002605872064129291, "loss": 0.069, "step": 40710 }, { "epoch": 0.26, "learning_rate": 0.00026057752505857215, "loss": 0.072, "step": 40720 }, { "epoch": 0.26, "learning_rate": 0.00026056784370421523, "loss": 0.0713, "step": 40730 }, { "epoch": 0.26, "learning_rate": 0.0002605581623498583, "loss": 0.076, "step": 40740 }, { "epoch": 0.26, "learning_rate": 0.0002605484809955014, "loss": 0.0733, "step": 40750 }, { "epoch": 0.26, "learning_rate": 0.00026053879964114447, "loss": 0.0712, "step": 40760 }, { "epoch": 0.26, "learning_rate": 0.0002605291182867875, "loss": 0.0769, "step": 40770 }, { "epoch": 0.26, "learning_rate": 0.0002605194369324306, "loss": 0.0643, "step": 40780 }, { "epoch": 0.26, "learning_rate": 0.00026050975557807365, "loss": 0.0642, "step": 40790 }, { "epoch": 0.26, "learning_rate": 0.0002605000742237167, "loss": 0.076, "step": 40800 }, { "epoch": 0.26, "learning_rate": 0.00026049039286935976, "loss": 0.0703, "step": 40810 }, { "epoch": 0.26, "learning_rate": 0.00026048071151500284, "loss": 0.0705, "step": 40820 }, { "epoch": 0.26, "learning_rate": 0.0002604710301606459, "loss": 0.0626, "step": 40830 }, { "epoch": 0.26, "learning_rate": 0.000260461348806289, "loss": 0.0722, "step": 40840 }, { "epoch": 0.26, "learning_rate": 0.0002604516674519321, "loss": 0.0662, "step": 40850 }, { "epoch": 0.26, "learning_rate": 0.0002604419860975751, "loss": 0.0634, "step": 40860 }, { "epoch": 0.26, "learning_rate": 0.0002604323047432182, "loss": 0.0699, "step": 40870 }, { "epoch": 0.26, "learning_rate": 0.00026042262338886126, "loss": 0.0636, "step": 40880 }, { "epoch": 0.26, "learning_rate": 0.00026041294203450434, "loss": 0.0742, "step": 40890 }, { "epoch": 0.26, "learning_rate": 0.00026040326068014737, "loss": 0.0734, "step": 40900 }, { "epoch": 0.26, "learning_rate": 0.00026039357932579045, "loss": 0.064, "step": 40910 }, { "epoch": 0.26, "learning_rate": 0.00026038389797143353, "loss": 0.0635, "step": 40920 }, { "epoch": 0.26, "learning_rate": 0.00026037421661707656, "loss": 0.0739, "step": 40930 }, { "epoch": 0.26, "learning_rate": 0.00026036453526271963, "loss": 0.0747, "step": 40940 }, { "epoch": 0.26, "learning_rate": 0.0002603548539083627, "loss": 0.075, "step": 40950 }, { "epoch": 0.26, "learning_rate": 0.0002603451725540058, "loss": 0.067, "step": 40960 }, { "epoch": 0.26, "learning_rate": 0.0002603354911996489, "loss": 0.0635, "step": 40970 }, { "epoch": 0.26, "learning_rate": 0.00026032580984529195, "loss": 0.0585, "step": 40980 }, { "epoch": 0.26, "learning_rate": 0.00026031612849093503, "loss": 0.0698, "step": 40990 }, { "epoch": 0.26, "learning_rate": 0.00026030644713657806, "loss": 0.0694, "step": 41000 }, { "epoch": 0.26, "eval_cer": 0.9200316348435205, "eval_loss": 0.04777882248163223, "eval_runtime": 120.3453, "eval_samples_per_second": 16.619, "eval_steps_per_second": 4.155, "step": 41000 }, { "epoch": 0.26, "learning_rate": 0.00026029676578222114, "loss": 0.0727, "step": 41010 }, { "epoch": 0.26, "learning_rate": 0.0002602870844278642, "loss": 0.0695, "step": 41020 }, { "epoch": 0.26, "learning_rate": 0.0002602774030735073, "loss": 0.0671, "step": 41030 }, { "epoch": 0.26, "learning_rate": 0.0002602677217191503, "loss": 0.0644, "step": 41040 }, { "epoch": 0.26, "learning_rate": 0.0002602580403647934, "loss": 0.0736, "step": 41050 }, { "epoch": 0.27, "learning_rate": 0.0002602483590104365, "loss": 0.0704, "step": 41060 }, { "epoch": 0.27, "learning_rate": 0.0002602386776560795, "loss": 0.0682, "step": 41070 }, { "epoch": 0.27, "learning_rate": 0.0002602289963017226, "loss": 0.0652, "step": 41080 }, { "epoch": 0.27, "learning_rate": 0.00026021931494736567, "loss": 0.0676, "step": 41090 }, { "epoch": 0.27, "learning_rate": 0.00026020963359300875, "loss": 0.0614, "step": 41100 }, { "epoch": 0.27, "learning_rate": 0.00026019995223865183, "loss": 0.0629, "step": 41110 }, { "epoch": 0.27, "learning_rate": 0.0002601902708842949, "loss": 0.0637, "step": 41120 }, { "epoch": 0.27, "learning_rate": 0.000260180589529938, "loss": 0.063, "step": 41130 }, { "epoch": 0.27, "learning_rate": 0.000260170908175581, "loss": 0.0634, "step": 41140 }, { "epoch": 0.27, "learning_rate": 0.0002601612268212241, "loss": 0.0704, "step": 41150 }, { "epoch": 0.27, "learning_rate": 0.0002601515454668672, "loss": 0.0703, "step": 41160 }, { "epoch": 0.27, "learning_rate": 0.0002601418641125102, "loss": 0.0652, "step": 41170 }, { "epoch": 0.27, "learning_rate": 0.0002601321827581533, "loss": 0.0629, "step": 41180 }, { "epoch": 0.27, "learning_rate": 0.00026012250140379636, "loss": 0.0707, "step": 41190 }, { "epoch": 0.27, "learning_rate": 0.00026011282004943944, "loss": 0.0652, "step": 41200 }, { "epoch": 0.27, "learning_rate": 0.00026010313869508246, "loss": 0.0702, "step": 41210 }, { "epoch": 0.27, "learning_rate": 0.00026009345734072554, "loss": 0.0678, "step": 41220 }, { "epoch": 0.27, "learning_rate": 0.0002600837759863686, "loss": 0.0806, "step": 41230 }, { "epoch": 0.27, "learning_rate": 0.0002600740946320117, "loss": 0.0615, "step": 41240 }, { "epoch": 0.27, "learning_rate": 0.0002600644132776548, "loss": 0.0608, "step": 41250 }, { "epoch": 0.27, "learning_rate": 0.00026005473192329786, "loss": 0.0678, "step": 41260 }, { "epoch": 0.27, "learning_rate": 0.00026004505056894094, "loss": 0.0691, "step": 41270 }, { "epoch": 0.27, "learning_rate": 0.00026003536921458397, "loss": 0.0641, "step": 41280 }, { "epoch": 0.27, "learning_rate": 0.00026002568786022705, "loss": 0.0669, "step": 41290 }, { "epoch": 0.27, "learning_rate": 0.0002600160065058701, "loss": 0.0662, "step": 41300 }, { "epoch": 0.27, "learning_rate": 0.00026000632515151315, "loss": 0.071, "step": 41310 }, { "epoch": 0.27, "learning_rate": 0.00025999664379715623, "loss": 0.0678, "step": 41320 }, { "epoch": 0.27, "learning_rate": 0.0002599869624427993, "loss": 0.0719, "step": 41330 }, { "epoch": 0.27, "learning_rate": 0.0002599772810884424, "loss": 0.0659, "step": 41340 }, { "epoch": 0.27, "learning_rate": 0.0002599675997340854, "loss": 0.0666, "step": 41350 }, { "epoch": 0.27, "learning_rate": 0.0002599579183797285, "loss": 0.0652, "step": 41360 }, { "epoch": 0.27, "learning_rate": 0.0002599482370253716, "loss": 0.0707, "step": 41370 }, { "epoch": 0.27, "learning_rate": 0.00025993855567101466, "loss": 0.0659, "step": 41380 }, { "epoch": 0.27, "learning_rate": 0.00025992887431665774, "loss": 0.0626, "step": 41390 }, { "epoch": 0.27, "learning_rate": 0.0002599191929623008, "loss": 0.0663, "step": 41400 }, { "epoch": 0.27, "learning_rate": 0.00025990951160794384, "loss": 0.0727, "step": 41410 }, { "epoch": 0.27, "learning_rate": 0.0002598998302535869, "loss": 0.0697, "step": 41420 }, { "epoch": 0.27, "learning_rate": 0.00025989014889923, "loss": 0.0757, "step": 41430 }, { "epoch": 0.27, "learning_rate": 0.00025988046754487303, "loss": 0.0724, "step": 41440 }, { "epoch": 0.27, "learning_rate": 0.0002598707861905161, "loss": 0.0649, "step": 41450 }, { "epoch": 0.27, "learning_rate": 0.0002598611048361592, "loss": 0.0701, "step": 41460 }, { "epoch": 0.27, "learning_rate": 0.00025985142348180227, "loss": 0.0696, "step": 41470 }, { "epoch": 0.27, "learning_rate": 0.00025984174212744535, "loss": 0.0697, "step": 41480 }, { "epoch": 0.27, "learning_rate": 0.0002598320607730884, "loss": 0.0703, "step": 41490 }, { "epoch": 0.27, "learning_rate": 0.00025982237941873145, "loss": 0.0719, "step": 41500 }, { "epoch": 0.27, "learning_rate": 0.00025981269806437453, "loss": 0.0765, "step": 41510 }, { "epoch": 0.27, "learning_rate": 0.0002598030167100176, "loss": 0.0692, "step": 41520 }, { "epoch": 0.27, "learning_rate": 0.0002597933353556607, "loss": 0.0705, "step": 41530 }, { "epoch": 0.27, "learning_rate": 0.0002597836540013037, "loss": 0.0671, "step": 41540 }, { "epoch": 0.27, "learning_rate": 0.0002597739726469468, "loss": 0.0706, "step": 41550 }, { "epoch": 0.27, "learning_rate": 0.0002597642912925899, "loss": 0.0675, "step": 41560 }, { "epoch": 0.27, "learning_rate": 0.0002597546099382329, "loss": 0.065, "step": 41570 }, { "epoch": 0.27, "learning_rate": 0.000259744928583876, "loss": 0.0643, "step": 41580 }, { "epoch": 0.27, "learning_rate": 0.00025973524722951906, "loss": 0.0676, "step": 41590 }, { "epoch": 0.27, "learning_rate": 0.00025972556587516214, "loss": 0.069, "step": 41600 }, { "epoch": 0.27, "learning_rate": 0.0002597158845208052, "loss": 0.0713, "step": 41610 }, { "epoch": 0.27, "learning_rate": 0.0002597062031664483, "loss": 0.0787, "step": 41620 }, { "epoch": 0.27, "learning_rate": 0.00025969652181209133, "loss": 0.0734, "step": 41630 }, { "epoch": 0.27, "learning_rate": 0.0002596868404577344, "loss": 0.0762, "step": 41640 }, { "epoch": 0.27, "learning_rate": 0.0002596771591033775, "loss": 0.0708, "step": 41650 }, { "epoch": 0.27, "learning_rate": 0.00025966747774902057, "loss": 0.064, "step": 41660 }, { "epoch": 0.27, "learning_rate": 0.00025965779639466365, "loss": 0.0753, "step": 41670 }, { "epoch": 0.27, "learning_rate": 0.00025964811504030667, "loss": 0.0688, "step": 41680 }, { "epoch": 0.27, "learning_rate": 0.00025963843368594975, "loss": 0.0639, "step": 41690 }, { "epoch": 0.27, "learning_rate": 0.0002596287523315928, "loss": 0.0722, "step": 41700 }, { "epoch": 0.27, "learning_rate": 0.00025961907097723586, "loss": 0.0602, "step": 41710 }, { "epoch": 0.27, "learning_rate": 0.00025960938962287894, "loss": 0.0681, "step": 41720 }, { "epoch": 0.27, "learning_rate": 0.000259599708268522, "loss": 0.0714, "step": 41730 }, { "epoch": 0.27, "learning_rate": 0.0002595900269141651, "loss": 0.0704, "step": 41740 }, { "epoch": 0.27, "learning_rate": 0.0002595803455598082, "loss": 0.0648, "step": 41750 }, { "epoch": 0.27, "learning_rate": 0.00025957066420545126, "loss": 0.0592, "step": 41760 }, { "epoch": 0.27, "learning_rate": 0.0002595609828510943, "loss": 0.075, "step": 41770 }, { "epoch": 0.27, "learning_rate": 0.00025955130149673736, "loss": 0.0709, "step": 41780 }, { "epoch": 0.27, "learning_rate": 0.00025954162014238044, "loss": 0.0655, "step": 41790 }, { "epoch": 0.27, "learning_rate": 0.0002595319387880235, "loss": 0.0703, "step": 41800 }, { "epoch": 0.27, "learning_rate": 0.00025952225743366655, "loss": 0.0705, "step": 41810 }, { "epoch": 0.27, "learning_rate": 0.0002595125760793096, "loss": 0.0724, "step": 41820 }, { "epoch": 0.27, "learning_rate": 0.0002595028947249527, "loss": 0.07, "step": 41830 }, { "epoch": 0.27, "learning_rate": 0.00025949321337059573, "loss": 0.0673, "step": 41840 }, { "epoch": 0.27, "learning_rate": 0.0002594835320162388, "loss": 0.0741, "step": 41850 }, { "epoch": 0.27, "learning_rate": 0.0002594738506618819, "loss": 0.0746, "step": 41860 }, { "epoch": 0.27, "learning_rate": 0.00025946416930752497, "loss": 0.064, "step": 41870 }, { "epoch": 0.27, "learning_rate": 0.00025945448795316805, "loss": 0.0682, "step": 41880 }, { "epoch": 0.27, "learning_rate": 0.00025944480659881113, "loss": 0.0655, "step": 41890 }, { "epoch": 0.27, "learning_rate": 0.0002594351252444542, "loss": 0.0707, "step": 41900 }, { "epoch": 0.27, "learning_rate": 0.00025942544389009724, "loss": 0.0627, "step": 41910 }, { "epoch": 0.27, "learning_rate": 0.0002594157625357403, "loss": 0.06, "step": 41920 }, { "epoch": 0.27, "learning_rate": 0.0002594060811813834, "loss": 0.0646, "step": 41930 }, { "epoch": 0.27, "learning_rate": 0.0002593963998270264, "loss": 0.0585, "step": 41940 }, { "epoch": 0.27, "learning_rate": 0.0002593867184726695, "loss": 0.0668, "step": 41950 }, { "epoch": 0.27, "learning_rate": 0.0002593770371183126, "loss": 0.0739, "step": 41960 }, { "epoch": 0.27, "learning_rate": 0.00025936735576395566, "loss": 0.0672, "step": 41970 }, { "epoch": 0.27, "learning_rate": 0.0002593576744095987, "loss": 0.0675, "step": 41980 }, { "epoch": 0.27, "learning_rate": 0.00025934799305524177, "loss": 0.0674, "step": 41990 }, { "epoch": 0.27, "learning_rate": 0.00025933831170088485, "loss": 0.0659, "step": 42000 }, { "epoch": 0.27, "eval_cer": 0.9200949045305615, "eval_loss": 0.04507534205913544, "eval_runtime": 120.3293, "eval_samples_per_second": 16.621, "eval_steps_per_second": 4.155, "step": 42000 }, { "epoch": 0.27, "learning_rate": 0.0002593286303465279, "loss": 0.0675, "step": 42010 }, { "epoch": 0.27, "learning_rate": 0.000259318948992171, "loss": 0.06, "step": 42020 }, { "epoch": 0.27, "learning_rate": 0.0002593092676378141, "loss": 0.0757, "step": 42030 }, { "epoch": 0.27, "learning_rate": 0.00025929958628345717, "loss": 0.066, "step": 42040 }, { "epoch": 0.27, "learning_rate": 0.0002592899049291002, "loss": 0.0664, "step": 42050 }, { "epoch": 0.27, "learning_rate": 0.00025928022357474327, "loss": 0.0697, "step": 42060 }, { "epoch": 0.27, "learning_rate": 0.00025927054222038635, "loss": 0.0626, "step": 42070 }, { "epoch": 0.27, "learning_rate": 0.0002592608608660294, "loss": 0.0736, "step": 42080 }, { "epoch": 0.27, "learning_rate": 0.00025925117951167246, "loss": 0.0651, "step": 42090 }, { "epoch": 0.27, "learning_rate": 0.00025924149815731554, "loss": 0.0649, "step": 42100 }, { "epoch": 0.27, "learning_rate": 0.0002592318168029586, "loss": 0.07, "step": 42110 }, { "epoch": 0.27, "learning_rate": 0.00025922213544860164, "loss": 0.0719, "step": 42120 }, { "epoch": 0.27, "learning_rate": 0.0002592124540942447, "loss": 0.0697, "step": 42130 }, { "epoch": 0.27, "learning_rate": 0.0002592027727398878, "loss": 0.0721, "step": 42140 }, { "epoch": 0.27, "learning_rate": 0.0002591930913855309, "loss": 0.0765, "step": 42150 }, { "epoch": 0.27, "learning_rate": 0.00025918341003117396, "loss": 0.0751, "step": 42160 }, { "epoch": 0.27, "learning_rate": 0.00025917372867681704, "loss": 0.0818, "step": 42170 }, { "epoch": 0.27, "learning_rate": 0.00025916404732246007, "loss": 0.0707, "step": 42180 }, { "epoch": 0.27, "learning_rate": 0.00025915436596810315, "loss": 0.0762, "step": 42190 }, { "epoch": 0.27, "learning_rate": 0.0002591446846137462, "loss": 0.0746, "step": 42200 }, { "epoch": 0.27, "learning_rate": 0.00025913500325938925, "loss": 0.0734, "step": 42210 }, { "epoch": 0.27, "learning_rate": 0.00025912532190503233, "loss": 0.0676, "step": 42220 }, { "epoch": 0.27, "learning_rate": 0.0002591156405506754, "loss": 0.0732, "step": 42230 }, { "epoch": 0.27, "learning_rate": 0.0002591059591963185, "loss": 0.0631, "step": 42240 }, { "epoch": 0.27, "learning_rate": 0.00025909627784196157, "loss": 0.0593, "step": 42250 }, { "epoch": 0.27, "learning_rate": 0.0002590865964876046, "loss": 0.0717, "step": 42260 }, { "epoch": 0.27, "learning_rate": 0.0002590769151332477, "loss": 0.0669, "step": 42270 }, { "epoch": 0.27, "learning_rate": 0.00025906723377889075, "loss": 0.0642, "step": 42280 }, { "epoch": 0.27, "learning_rate": 0.00025905755242453383, "loss": 0.0729, "step": 42290 }, { "epoch": 0.27, "learning_rate": 0.0002590478710701769, "loss": 0.0736, "step": 42300 }, { "epoch": 0.27, "learning_rate": 0.00025903818971581994, "loss": 0.0789, "step": 42310 }, { "epoch": 0.27, "learning_rate": 0.000259028508361463, "loss": 0.0678, "step": 42320 }, { "epoch": 0.27, "learning_rate": 0.0002590188270071061, "loss": 0.0668, "step": 42330 }, { "epoch": 0.27, "learning_rate": 0.0002590091456527491, "loss": 0.0699, "step": 42340 }, { "epoch": 0.27, "learning_rate": 0.0002589994642983922, "loss": 0.0709, "step": 42350 }, { "epoch": 0.27, "learning_rate": 0.0002589897829440353, "loss": 0.0726, "step": 42360 }, { "epoch": 0.27, "learning_rate": 0.00025898010158967836, "loss": 0.0795, "step": 42370 }, { "epoch": 0.27, "learning_rate": 0.00025897042023532144, "loss": 0.0655, "step": 42380 }, { "epoch": 0.27, "learning_rate": 0.0002589607388809645, "loss": 0.0638, "step": 42390 }, { "epoch": 0.27, "learning_rate": 0.00025895105752660755, "loss": 0.0659, "step": 42400 }, { "epoch": 0.27, "learning_rate": 0.00025894137617225063, "loss": 0.0693, "step": 42410 }, { "epoch": 0.27, "learning_rate": 0.0002589316948178937, "loss": 0.0733, "step": 42420 }, { "epoch": 0.27, "learning_rate": 0.0002589220134635368, "loss": 0.0679, "step": 42430 }, { "epoch": 0.27, "learning_rate": 0.00025891233210917987, "loss": 0.0657, "step": 42440 }, { "epoch": 0.27, "learning_rate": 0.0002589026507548229, "loss": 0.0719, "step": 42450 }, { "epoch": 0.27, "learning_rate": 0.000258892969400466, "loss": 0.0639, "step": 42460 }, { "epoch": 0.27, "learning_rate": 0.00025888328804610905, "loss": 0.066, "step": 42470 }, { "epoch": 0.27, "learning_rate": 0.0002588736066917521, "loss": 0.0748, "step": 42480 }, { "epoch": 0.27, "learning_rate": 0.00025886392533739516, "loss": 0.0773, "step": 42490 }, { "epoch": 0.27, "learning_rate": 0.00025885424398303824, "loss": 0.0687, "step": 42500 }, { "epoch": 0.27, "learning_rate": 0.0002588445626286813, "loss": 0.0773, "step": 42510 }, { "epoch": 0.27, "learning_rate": 0.0002588348812743244, "loss": 0.0619, "step": 42520 }, { "epoch": 0.27, "learning_rate": 0.0002588251999199675, "loss": 0.0642, "step": 42530 }, { "epoch": 0.27, "learning_rate": 0.0002588155185656105, "loss": 0.0667, "step": 42540 }, { "epoch": 0.27, "learning_rate": 0.0002588058372112536, "loss": 0.0689, "step": 42550 }, { "epoch": 0.27, "learning_rate": 0.00025879615585689666, "loss": 0.0734, "step": 42560 }, { "epoch": 0.27, "learning_rate": 0.00025878647450253974, "loss": 0.072, "step": 42570 }, { "epoch": 0.27, "learning_rate": 0.00025877679314818277, "loss": 0.0655, "step": 42580 }, { "epoch": 0.27, "learning_rate": 0.00025876711179382585, "loss": 0.0717, "step": 42590 }, { "epoch": 0.27, "learning_rate": 0.00025875743043946893, "loss": 0.0726, "step": 42600 }, { "epoch": 0.28, "learning_rate": 0.00025874774908511195, "loss": 0.0665, "step": 42610 }, { "epoch": 0.28, "learning_rate": 0.00025873806773075503, "loss": 0.066, "step": 42620 }, { "epoch": 0.28, "learning_rate": 0.0002587283863763981, "loss": 0.0731, "step": 42630 }, { "epoch": 0.28, "learning_rate": 0.0002587187050220412, "loss": 0.0638, "step": 42640 }, { "epoch": 0.28, "learning_rate": 0.0002587090236676843, "loss": 0.0721, "step": 42650 }, { "epoch": 0.28, "learning_rate": 0.00025869934231332735, "loss": 0.0736, "step": 42660 }, { "epoch": 0.28, "learning_rate": 0.00025868966095897043, "loss": 0.0679, "step": 42670 }, { "epoch": 0.28, "learning_rate": 0.00025867997960461346, "loss": 0.0663, "step": 42680 }, { "epoch": 0.28, "learning_rate": 0.00025867029825025654, "loss": 0.0599, "step": 42690 }, { "epoch": 0.28, "learning_rate": 0.0002586606168958996, "loss": 0.0693, "step": 42700 }, { "epoch": 0.28, "learning_rate": 0.00025865093554154264, "loss": 0.0707, "step": 42710 }, { "epoch": 0.28, "learning_rate": 0.0002586412541871857, "loss": 0.0665, "step": 42720 }, { "epoch": 0.28, "learning_rate": 0.0002586315728328288, "loss": 0.062, "step": 42730 }, { "epoch": 0.28, "learning_rate": 0.0002586218914784719, "loss": 0.058, "step": 42740 }, { "epoch": 0.28, "learning_rate": 0.0002586122101241149, "loss": 0.0599, "step": 42750 }, { "epoch": 0.28, "learning_rate": 0.000258602528769758, "loss": 0.0637, "step": 42760 }, { "epoch": 0.28, "learning_rate": 0.00025859284741540107, "loss": 0.0599, "step": 42770 }, { "epoch": 0.28, "learning_rate": 0.00025858316606104415, "loss": 0.0632, "step": 42780 }, { "epoch": 0.28, "learning_rate": 0.00025857348470668723, "loss": 0.0711, "step": 42790 }, { "epoch": 0.28, "learning_rate": 0.0002585638033523303, "loss": 0.0706, "step": 42800 }, { "epoch": 0.28, "learning_rate": 0.0002585541219979734, "loss": 0.0663, "step": 42810 }, { "epoch": 0.28, "learning_rate": 0.0002585444406436164, "loss": 0.0638, "step": 42820 }, { "epoch": 0.28, "learning_rate": 0.0002585347592892595, "loss": 0.07, "step": 42830 }, { "epoch": 0.28, "learning_rate": 0.00025852507793490257, "loss": 0.0627, "step": 42840 }, { "epoch": 0.28, "learning_rate": 0.0002585153965805456, "loss": 0.064, "step": 42850 }, { "epoch": 0.28, "learning_rate": 0.0002585057152261887, "loss": 0.0694, "step": 42860 }, { "epoch": 0.28, "learning_rate": 0.00025849603387183176, "loss": 0.0722, "step": 42870 }, { "epoch": 0.28, "learning_rate": 0.00025848635251747484, "loss": 0.0643, "step": 42880 }, { "epoch": 0.28, "learning_rate": 0.00025847667116311786, "loss": 0.0678, "step": 42890 }, { "epoch": 0.28, "learning_rate": 0.00025846698980876094, "loss": 0.0666, "step": 42900 }, { "epoch": 0.28, "learning_rate": 0.000258457308454404, "loss": 0.0571, "step": 42910 }, { "epoch": 0.28, "learning_rate": 0.0002584476271000471, "loss": 0.0643, "step": 42920 }, { "epoch": 0.28, "learning_rate": 0.0002584379457456902, "loss": 0.0705, "step": 42930 }, { "epoch": 0.28, "learning_rate": 0.00025842826439133326, "loss": 0.0606, "step": 42940 }, { "epoch": 0.28, "learning_rate": 0.0002584185830369763, "loss": 0.0617, "step": 42950 }, { "epoch": 0.28, "learning_rate": 0.00025840890168261937, "loss": 0.0721, "step": 42960 }, { "epoch": 0.28, "learning_rate": 0.00025839922032826245, "loss": 0.0698, "step": 42970 }, { "epoch": 0.28, "learning_rate": 0.0002583895389739055, "loss": 0.0674, "step": 42980 }, { "epoch": 0.28, "learning_rate": 0.00025837985761954855, "loss": 0.064, "step": 42990 }, { "epoch": 0.28, "learning_rate": 0.00025837017626519163, "loss": 0.0638, "step": 43000 }, { "epoch": 0.28, "eval_cer": 0.9200361541068806, "eval_loss": 0.044854536652565, "eval_runtime": 120.1061, "eval_samples_per_second": 16.652, "eval_steps_per_second": 4.163, "step": 43000 }, { "epoch": 0.28, "learning_rate": 0.0002583604949108347, "loss": 0.0634, "step": 43010 }, { "epoch": 0.28, "learning_rate": 0.0002583508135564778, "loss": 0.0679, "step": 43020 }, { "epoch": 0.28, "learning_rate": 0.0002583411322021208, "loss": 0.061, "step": 43030 }, { "epoch": 0.28, "learning_rate": 0.0002583314508477639, "loss": 0.0665, "step": 43040 }, { "epoch": 0.28, "learning_rate": 0.000258321769493407, "loss": 0.0691, "step": 43050 }, { "epoch": 0.28, "learning_rate": 0.00025831208813905006, "loss": 0.0679, "step": 43060 }, { "epoch": 0.28, "learning_rate": 0.00025830240678469314, "loss": 0.0695, "step": 43070 }, { "epoch": 0.28, "learning_rate": 0.00025829272543033616, "loss": 0.0698, "step": 43080 }, { "epoch": 0.28, "learning_rate": 0.00025828304407597924, "loss": 0.0669, "step": 43090 }, { "epoch": 0.28, "learning_rate": 0.0002582733627216223, "loss": 0.0676, "step": 43100 }, { "epoch": 0.28, "learning_rate": 0.00025826368136726535, "loss": 0.0623, "step": 43110 }, { "epoch": 0.28, "learning_rate": 0.00025825400001290843, "loss": 0.0647, "step": 43120 }, { "epoch": 0.28, "learning_rate": 0.0002582443186585515, "loss": 0.0647, "step": 43130 }, { "epoch": 0.28, "learning_rate": 0.0002582346373041946, "loss": 0.0593, "step": 43140 }, { "epoch": 0.28, "learning_rate": 0.00025822495594983767, "loss": 0.0584, "step": 43150 }, { "epoch": 0.28, "learning_rate": 0.00025821527459548075, "loss": 0.064, "step": 43160 }, { "epoch": 0.28, "learning_rate": 0.00025820559324112377, "loss": 0.0621, "step": 43170 }, { "epoch": 0.28, "learning_rate": 0.00025819591188676685, "loss": 0.0697, "step": 43180 }, { "epoch": 0.28, "learning_rate": 0.00025818623053240993, "loss": 0.0664, "step": 43190 }, { "epoch": 0.28, "learning_rate": 0.000258176549178053, "loss": 0.0676, "step": 43200 }, { "epoch": 0.28, "learning_rate": 0.0002581668678236961, "loss": 0.0649, "step": 43210 }, { "epoch": 0.28, "learning_rate": 0.0002581571864693391, "loss": 0.0621, "step": 43220 }, { "epoch": 0.28, "learning_rate": 0.0002581475051149822, "loss": 0.068, "step": 43230 }, { "epoch": 0.28, "learning_rate": 0.0002581378237606253, "loss": 0.069, "step": 43240 }, { "epoch": 0.28, "learning_rate": 0.0002581281424062683, "loss": 0.0682, "step": 43250 }, { "epoch": 0.28, "learning_rate": 0.0002581184610519114, "loss": 0.0636, "step": 43260 }, { "epoch": 0.28, "learning_rate": 0.00025810877969755446, "loss": 0.0679, "step": 43270 }, { "epoch": 0.28, "learning_rate": 0.00025809909834319754, "loss": 0.0626, "step": 43280 }, { "epoch": 0.28, "learning_rate": 0.0002580894169888406, "loss": 0.0705, "step": 43290 }, { "epoch": 0.28, "learning_rate": 0.0002580797356344837, "loss": 0.0707, "step": 43300 }, { "epoch": 0.28, "learning_rate": 0.0002580700542801267, "loss": 0.0657, "step": 43310 }, { "epoch": 0.28, "learning_rate": 0.0002580603729257698, "loss": 0.0676, "step": 43320 }, { "epoch": 0.28, "learning_rate": 0.0002580506915714129, "loss": 0.0658, "step": 43330 }, { "epoch": 0.28, "learning_rate": 0.00025804101021705597, "loss": 0.0627, "step": 43340 }, { "epoch": 0.28, "learning_rate": 0.000258031328862699, "loss": 0.066, "step": 43350 }, { "epoch": 0.28, "learning_rate": 0.00025802164750834207, "loss": 0.0736, "step": 43360 }, { "epoch": 0.28, "learning_rate": 0.00025801196615398515, "loss": 0.0653, "step": 43370 }, { "epoch": 0.28, "learning_rate": 0.0002580022847996282, "loss": 0.0691, "step": 43380 }, { "epoch": 0.28, "learning_rate": 0.00025799260344527126, "loss": 0.0647, "step": 43390 }, { "epoch": 0.28, "learning_rate": 0.00025798292209091434, "loss": 0.0686, "step": 43400 }, { "epoch": 0.28, "learning_rate": 0.0002579732407365574, "loss": 0.0666, "step": 43410 }, { "epoch": 0.28, "learning_rate": 0.0002579635593822005, "loss": 0.067, "step": 43420 }, { "epoch": 0.28, "learning_rate": 0.0002579538780278436, "loss": 0.0644, "step": 43430 }, { "epoch": 0.28, "learning_rate": 0.00025794419667348666, "loss": 0.0601, "step": 43440 }, { "epoch": 0.28, "learning_rate": 0.0002579345153191297, "loss": 0.0704, "step": 43450 }, { "epoch": 0.28, "learning_rate": 0.00025792483396477276, "loss": 0.0679, "step": 43460 }, { "epoch": 0.28, "learning_rate": 0.00025791515261041584, "loss": 0.065, "step": 43470 }, { "epoch": 0.28, "learning_rate": 0.00025790547125605887, "loss": 0.0641, "step": 43480 }, { "epoch": 0.28, "learning_rate": 0.00025789578990170195, "loss": 0.0638, "step": 43490 }, { "epoch": 0.28, "learning_rate": 0.000257886108547345, "loss": 0.0617, "step": 43500 }, { "epoch": 0.28, "learning_rate": 0.0002578764271929881, "loss": 0.0637, "step": 43510 }, { "epoch": 0.28, "learning_rate": 0.00025786674583863113, "loss": 0.069, "step": 43520 }, { "epoch": 0.28, "learning_rate": 0.0002578570644842742, "loss": 0.0656, "step": 43530 }, { "epoch": 0.28, "learning_rate": 0.0002578473831299173, "loss": 0.0619, "step": 43540 }, { "epoch": 0.28, "learning_rate": 0.00025783770177556037, "loss": 0.0649, "step": 43550 }, { "epoch": 0.28, "learning_rate": 0.00025782802042120345, "loss": 0.0707, "step": 43560 }, { "epoch": 0.28, "learning_rate": 0.00025781833906684653, "loss": 0.0626, "step": 43570 }, { "epoch": 0.28, "learning_rate": 0.0002578086577124896, "loss": 0.0678, "step": 43580 }, { "epoch": 0.28, "learning_rate": 0.00025779897635813264, "loss": 0.072, "step": 43590 }, { "epoch": 0.28, "learning_rate": 0.0002577892950037757, "loss": 0.0651, "step": 43600 }, { "epoch": 0.28, "learning_rate": 0.0002577796136494188, "loss": 0.0721, "step": 43610 }, { "epoch": 0.28, "learning_rate": 0.0002577699322950618, "loss": 0.067, "step": 43620 }, { "epoch": 0.28, "learning_rate": 0.0002577602509407049, "loss": 0.0599, "step": 43630 }, { "epoch": 0.28, "learning_rate": 0.000257750569586348, "loss": 0.0743, "step": 43640 }, { "epoch": 0.28, "learning_rate": 0.00025774088823199106, "loss": 0.069, "step": 43650 }, { "epoch": 0.28, "learning_rate": 0.0002577312068776341, "loss": 0.0663, "step": 43660 }, { "epoch": 0.28, "learning_rate": 0.00025772152552327717, "loss": 0.0718, "step": 43670 }, { "epoch": 0.28, "learning_rate": 0.00025771184416892025, "loss": 0.0682, "step": 43680 }, { "epoch": 0.28, "learning_rate": 0.0002577021628145633, "loss": 0.0674, "step": 43690 }, { "epoch": 0.28, "learning_rate": 0.0002576924814602064, "loss": 0.0757, "step": 43700 }, { "epoch": 0.28, "learning_rate": 0.0002576828001058495, "loss": 0.0659, "step": 43710 }, { "epoch": 0.28, "learning_rate": 0.0002576731187514925, "loss": 0.0625, "step": 43720 }, { "epoch": 0.28, "learning_rate": 0.0002576634373971356, "loss": 0.069, "step": 43730 }, { "epoch": 0.28, "learning_rate": 0.00025765375604277867, "loss": 0.0681, "step": 43740 }, { "epoch": 0.28, "learning_rate": 0.0002576440746884217, "loss": 0.079, "step": 43750 }, { "epoch": 0.28, "learning_rate": 0.0002576343933340648, "loss": 0.0718, "step": 43760 }, { "epoch": 0.28, "learning_rate": 0.00025762471197970785, "loss": 0.0668, "step": 43770 }, { "epoch": 0.28, "learning_rate": 0.00025761503062535093, "loss": 0.0715, "step": 43780 }, { "epoch": 0.28, "learning_rate": 0.000257605349270994, "loss": 0.0653, "step": 43790 }, { "epoch": 0.28, "learning_rate": 0.00025759566791663704, "loss": 0.0731, "step": 43800 }, { "epoch": 0.28, "learning_rate": 0.0002575859865622801, "loss": 0.0694, "step": 43810 }, { "epoch": 0.28, "learning_rate": 0.0002575763052079232, "loss": 0.0651, "step": 43820 }, { "epoch": 0.28, "learning_rate": 0.0002575666238535663, "loss": 0.0669, "step": 43830 }, { "epoch": 0.28, "learning_rate": 0.00025755694249920936, "loss": 0.0777, "step": 43840 }, { "epoch": 0.28, "learning_rate": 0.00025754726114485244, "loss": 0.0674, "step": 43850 }, { "epoch": 0.28, "learning_rate": 0.00025753757979049546, "loss": 0.0695, "step": 43860 }, { "epoch": 0.28, "learning_rate": 0.00025752789843613854, "loss": 0.0701, "step": 43870 }, { "epoch": 0.28, "learning_rate": 0.00025751821708178157, "loss": 0.0765, "step": 43880 }, { "epoch": 0.28, "learning_rate": 0.00025750853572742465, "loss": 0.0755, "step": 43890 }, { "epoch": 0.28, "learning_rate": 0.00025749885437306773, "loss": 0.0706, "step": 43900 }, { "epoch": 0.28, "learning_rate": 0.0002574891730187108, "loss": 0.0673, "step": 43910 }, { "epoch": 0.28, "learning_rate": 0.0002574794916643539, "loss": 0.0667, "step": 43920 }, { "epoch": 0.28, "learning_rate": 0.00025746981030999697, "loss": 0.065, "step": 43930 }, { "epoch": 0.28, "learning_rate": 0.00025746012895564, "loss": 0.0613, "step": 43940 }, { "epoch": 0.28, "learning_rate": 0.0002574504476012831, "loss": 0.0638, "step": 43950 }, { "epoch": 0.28, "learning_rate": 0.00025744076624692615, "loss": 0.0672, "step": 43960 }, { "epoch": 0.28, "learning_rate": 0.00025743108489256923, "loss": 0.0698, "step": 43970 }, { "epoch": 0.28, "learning_rate": 0.0002574214035382123, "loss": 0.0609, "step": 43980 }, { "epoch": 0.28, "learning_rate": 0.00025741172218385534, "loss": 0.0668, "step": 43990 }, { "epoch": 0.28, "learning_rate": 0.0002574020408294984, "loss": 0.0704, "step": 44000 }, { "epoch": 0.28, "eval_cer": 0.920119308552706, "eval_loss": 0.044700879603624344, "eval_runtime": 120.2434, "eval_samples_per_second": 16.633, "eval_steps_per_second": 4.158, "step": 44000 }, { "epoch": 0.28, "learning_rate": 0.0002573923594751415, "loss": 0.0653, "step": 44010 }, { "epoch": 0.28, "learning_rate": 0.0002573826781207845, "loss": 0.0601, "step": 44020 }, { "epoch": 0.28, "learning_rate": 0.0002573729967664276, "loss": 0.0725, "step": 44030 }, { "epoch": 0.28, "learning_rate": 0.0002573633154120707, "loss": 0.0705, "step": 44040 }, { "epoch": 0.28, "learning_rate": 0.00025735363405771376, "loss": 0.0642, "step": 44050 }, { "epoch": 0.28, "learning_rate": 0.00025734395270335684, "loss": 0.0669, "step": 44060 }, { "epoch": 0.28, "learning_rate": 0.0002573342713489999, "loss": 0.069, "step": 44070 }, { "epoch": 0.28, "learning_rate": 0.00025732458999464295, "loss": 0.0664, "step": 44080 }, { "epoch": 0.28, "learning_rate": 0.00025731490864028603, "loss": 0.0616, "step": 44090 }, { "epoch": 0.28, "learning_rate": 0.0002573052272859291, "loss": 0.0682, "step": 44100 }, { "epoch": 0.28, "learning_rate": 0.0002572955459315722, "loss": 0.0655, "step": 44110 }, { "epoch": 0.28, "learning_rate": 0.0002572858645772152, "loss": 0.0676, "step": 44120 }, { "epoch": 0.28, "learning_rate": 0.0002572761832228583, "loss": 0.0642, "step": 44130 }, { "epoch": 0.28, "learning_rate": 0.0002572665018685014, "loss": 0.063, "step": 44140 }, { "epoch": 0.28, "learning_rate": 0.0002572568205141444, "loss": 0.0589, "step": 44150 }, { "epoch": 0.29, "learning_rate": 0.0002572471391597875, "loss": 0.0619, "step": 44160 }, { "epoch": 0.29, "learning_rate": 0.00025723745780543056, "loss": 0.0692, "step": 44170 }, { "epoch": 0.29, "learning_rate": 0.00025722777645107364, "loss": 0.0621, "step": 44180 }, { "epoch": 0.29, "learning_rate": 0.0002572180950967167, "loss": 0.0697, "step": 44190 }, { "epoch": 0.29, "learning_rate": 0.0002572084137423598, "loss": 0.0644, "step": 44200 }, { "epoch": 0.29, "learning_rate": 0.0002571987323880029, "loss": 0.0616, "step": 44210 }, { "epoch": 0.29, "learning_rate": 0.0002571890510336459, "loss": 0.0723, "step": 44220 }, { "epoch": 0.29, "learning_rate": 0.000257179369679289, "loss": 0.0644, "step": 44230 }, { "epoch": 0.29, "learning_rate": 0.00025716968832493206, "loss": 0.0705, "step": 44240 }, { "epoch": 0.29, "learning_rate": 0.00025716000697057514, "loss": 0.0706, "step": 44250 }, { "epoch": 0.29, "learning_rate": 0.00025715032561621817, "loss": 0.0756, "step": 44260 }, { "epoch": 0.29, "learning_rate": 0.00025714064426186125, "loss": 0.0716, "step": 44270 }, { "epoch": 0.29, "learning_rate": 0.00025713096290750433, "loss": 0.0763, "step": 44280 }, { "epoch": 0.29, "learning_rate": 0.00025712128155314735, "loss": 0.0647, "step": 44290 }, { "epoch": 0.29, "learning_rate": 0.00025711160019879043, "loss": 0.0632, "step": 44300 }, { "epoch": 0.29, "learning_rate": 0.0002571019188444335, "loss": 0.0652, "step": 44310 }, { "epoch": 0.29, "learning_rate": 0.0002570922374900766, "loss": 0.0643, "step": 44320 }, { "epoch": 0.29, "learning_rate": 0.00025708255613571967, "loss": 0.0671, "step": 44330 }, { "epoch": 0.29, "learning_rate": 0.00025707287478136275, "loss": 0.0691, "step": 44340 }, { "epoch": 0.29, "learning_rate": 0.00025706319342700583, "loss": 0.0661, "step": 44350 }, { "epoch": 0.29, "learning_rate": 0.00025705351207264886, "loss": 0.0646, "step": 44360 }, { "epoch": 0.29, "learning_rate": 0.00025704383071829194, "loss": 0.0625, "step": 44370 }, { "epoch": 0.29, "learning_rate": 0.000257034149363935, "loss": 0.0648, "step": 44380 }, { "epoch": 0.29, "learning_rate": 0.00025702446800957804, "loss": 0.0709, "step": 44390 }, { "epoch": 0.29, "learning_rate": 0.0002570147866552211, "loss": 0.0663, "step": 44400 }, { "epoch": 0.29, "learning_rate": 0.0002570051053008642, "loss": 0.0609, "step": 44410 }, { "epoch": 0.29, "learning_rate": 0.0002569954239465073, "loss": 0.0613, "step": 44420 }, { "epoch": 0.29, "learning_rate": 0.0002569857425921503, "loss": 0.0673, "step": 44430 }, { "epoch": 0.29, "learning_rate": 0.0002569760612377934, "loss": 0.0679, "step": 44440 }, { "epoch": 0.29, "learning_rate": 0.00025696637988343647, "loss": 0.065, "step": 44450 }, { "epoch": 0.29, "learning_rate": 0.00025695669852907955, "loss": 0.0717, "step": 44460 }, { "epoch": 0.29, "learning_rate": 0.00025694701717472263, "loss": 0.0729, "step": 44470 }, { "epoch": 0.29, "learning_rate": 0.0002569373358203657, "loss": 0.0653, "step": 44480 }, { "epoch": 0.29, "learning_rate": 0.00025692765446600873, "loss": 0.0746, "step": 44490 }, { "epoch": 0.29, "learning_rate": 0.0002569179731116518, "loss": 0.0721, "step": 44500 }, { "epoch": 0.29, "learning_rate": 0.0002569082917572949, "loss": 0.0773, "step": 44510 }, { "epoch": 0.29, "learning_rate": 0.0002568986104029379, "loss": 0.0734, "step": 44520 }, { "epoch": 0.29, "learning_rate": 0.000256888929048581, "loss": 0.0738, "step": 44530 }, { "epoch": 0.29, "learning_rate": 0.0002568792476942241, "loss": 0.0617, "step": 44540 }, { "epoch": 0.29, "learning_rate": 0.00025686956633986716, "loss": 0.0606, "step": 44550 }, { "epoch": 0.29, "learning_rate": 0.00025685988498551024, "loss": 0.0709, "step": 44560 }, { "epoch": 0.29, "learning_rate": 0.00025685020363115326, "loss": 0.0705, "step": 44570 }, { "epoch": 0.29, "learning_rate": 0.00025684052227679634, "loss": 0.0686, "step": 44580 }, { "epoch": 0.29, "learning_rate": 0.0002568308409224394, "loss": 0.0762, "step": 44590 }, { "epoch": 0.29, "learning_rate": 0.0002568211595680825, "loss": 0.0704, "step": 44600 }, { "epoch": 0.29, "learning_rate": 0.0002568114782137256, "loss": 0.0646, "step": 44610 }, { "epoch": 0.29, "learning_rate": 0.00025680179685936866, "loss": 0.0696, "step": 44620 }, { "epoch": 0.29, "learning_rate": 0.0002567921155050117, "loss": 0.0622, "step": 44630 }, { "epoch": 0.29, "learning_rate": 0.00025678243415065477, "loss": 0.0643, "step": 44640 }, { "epoch": 0.29, "learning_rate": 0.00025677275279629785, "loss": 0.0595, "step": 44650 }, { "epoch": 0.29, "learning_rate": 0.00025676307144194087, "loss": 0.0645, "step": 44660 }, { "epoch": 0.29, "learning_rate": 0.00025675339008758395, "loss": 0.0689, "step": 44670 }, { "epoch": 0.29, "learning_rate": 0.00025674370873322703, "loss": 0.0639, "step": 44680 }, { "epoch": 0.29, "learning_rate": 0.0002567340273788701, "loss": 0.0678, "step": 44690 }, { "epoch": 0.29, "learning_rate": 0.0002567243460245132, "loss": 0.0649, "step": 44700 }, { "epoch": 0.29, "learning_rate": 0.0002567146646701562, "loss": 0.0597, "step": 44710 }, { "epoch": 0.29, "learning_rate": 0.0002567049833157993, "loss": 0.0617, "step": 44720 }, { "epoch": 0.29, "learning_rate": 0.0002566953019614424, "loss": 0.0679, "step": 44730 }, { "epoch": 0.29, "learning_rate": 0.00025668562060708546, "loss": 0.0602, "step": 44740 }, { "epoch": 0.29, "learning_rate": 0.00025667593925272854, "loss": 0.0671, "step": 44750 }, { "epoch": 0.29, "learning_rate": 0.00025666625789837156, "loss": 0.0603, "step": 44760 }, { "epoch": 0.29, "learning_rate": 0.00025665657654401464, "loss": 0.0555, "step": 44770 }, { "epoch": 0.29, "learning_rate": 0.0002566468951896577, "loss": 0.0689, "step": 44780 }, { "epoch": 0.29, "learning_rate": 0.00025663721383530075, "loss": 0.0605, "step": 44790 }, { "epoch": 0.29, "learning_rate": 0.0002566275324809438, "loss": 0.0686, "step": 44800 }, { "epoch": 0.29, "learning_rate": 0.0002566178511265869, "loss": 0.0647, "step": 44810 }, { "epoch": 0.29, "learning_rate": 0.00025660816977223, "loss": 0.0639, "step": 44820 }, { "epoch": 0.29, "learning_rate": 0.00025659848841787307, "loss": 0.0689, "step": 44830 }, { "epoch": 0.29, "learning_rate": 0.0002565888070635161, "loss": 0.0701, "step": 44840 }, { "epoch": 0.29, "learning_rate": 0.00025657912570915917, "loss": 0.0795, "step": 44850 }, { "epoch": 0.29, "learning_rate": 0.00025656944435480225, "loss": 0.0622, "step": 44860 }, { "epoch": 0.29, "learning_rate": 0.00025655976300044533, "loss": 0.0654, "step": 44870 }, { "epoch": 0.29, "learning_rate": 0.0002565500816460884, "loss": 0.0756, "step": 44880 }, { "epoch": 0.29, "learning_rate": 0.00025654040029173144, "loss": 0.0748, "step": 44890 }, { "epoch": 0.29, "learning_rate": 0.0002565307189373745, "loss": 0.0676, "step": 44900 }, { "epoch": 0.29, "learning_rate": 0.0002565210375830176, "loss": 0.0689, "step": 44910 }, { "epoch": 0.29, "learning_rate": 0.0002565113562286606, "loss": 0.0657, "step": 44920 }, { "epoch": 0.29, "learning_rate": 0.0002565016748743037, "loss": 0.0706, "step": 44930 }, { "epoch": 0.29, "learning_rate": 0.0002564919935199468, "loss": 0.0619, "step": 44940 }, { "epoch": 0.29, "learning_rate": 0.00025648231216558986, "loss": 0.0735, "step": 44950 }, { "epoch": 0.29, "learning_rate": 0.00025647263081123294, "loss": 0.0783, "step": 44960 }, { "epoch": 0.29, "learning_rate": 0.000256462949456876, "loss": 0.0677, "step": 44970 }, { "epoch": 0.29, "learning_rate": 0.00025645326810251905, "loss": 0.0649, "step": 44980 }, { "epoch": 0.29, "learning_rate": 0.0002564435867481621, "loss": 0.0676, "step": 44990 }, { "epoch": 0.29, "learning_rate": 0.0002564339053938052, "loss": 0.0657, "step": 45000 }, { "epoch": 0.29, "eval_cer": 0.920057846571009, "eval_loss": 0.0462675541639328, "eval_runtime": 120.4879, "eval_samples_per_second": 16.599, "eval_steps_per_second": 4.15, "step": 45000 }, { "epoch": 0.29, "learning_rate": 0.0002564242240394483, "loss": 0.0645, "step": 45010 }, { "epoch": 0.29, "learning_rate": 0.00025641454268509137, "loss": 0.0675, "step": 45020 }, { "epoch": 0.29, "learning_rate": 0.0002564048613307344, "loss": 0.0607, "step": 45030 }, { "epoch": 0.29, "learning_rate": 0.00025639517997637747, "loss": 0.0618, "step": 45040 }, { "epoch": 0.29, "learning_rate": 0.00025638549862202055, "loss": 0.078, "step": 45050 }, { "epoch": 0.29, "learning_rate": 0.0002563758172676636, "loss": 0.0671, "step": 45060 }, { "epoch": 0.29, "learning_rate": 0.00025636613591330666, "loss": 0.0702, "step": 45070 }, { "epoch": 0.29, "learning_rate": 0.00025635645455894974, "loss": 0.066, "step": 45080 }, { "epoch": 0.29, "learning_rate": 0.0002563467732045928, "loss": 0.0788, "step": 45090 }, { "epoch": 0.29, "learning_rate": 0.0002563370918502359, "loss": 0.0636, "step": 45100 }, { "epoch": 0.29, "learning_rate": 0.000256327410495879, "loss": 0.0667, "step": 45110 }, { "epoch": 0.29, "learning_rate": 0.000256317729141522, "loss": 0.0676, "step": 45120 }, { "epoch": 0.29, "learning_rate": 0.0002563080477871651, "loss": 0.0787, "step": 45130 }, { "epoch": 0.29, "learning_rate": 0.00025629836643280816, "loss": 0.0548, "step": 45140 }, { "epoch": 0.29, "learning_rate": 0.00025628868507845124, "loss": 0.0644, "step": 45150 }, { "epoch": 0.29, "learning_rate": 0.00025627900372409427, "loss": 0.0636, "step": 45160 }, { "epoch": 0.29, "learning_rate": 0.00025626932236973735, "loss": 0.0734, "step": 45170 }, { "epoch": 0.29, "learning_rate": 0.0002562596410153804, "loss": 0.075, "step": 45180 }, { "epoch": 0.29, "learning_rate": 0.00025624995966102345, "loss": 0.0622, "step": 45190 }, { "epoch": 0.29, "learning_rate": 0.00025624027830666653, "loss": 0.0602, "step": 45200 }, { "epoch": 0.29, "learning_rate": 0.0002562305969523096, "loss": 0.0619, "step": 45210 }, { "epoch": 0.29, "learning_rate": 0.0002562209155979527, "loss": 0.0645, "step": 45220 }, { "epoch": 0.29, "learning_rate": 0.00025621123424359577, "loss": 0.0652, "step": 45230 }, { "epoch": 0.29, "learning_rate": 0.00025620155288923885, "loss": 0.06, "step": 45240 }, { "epoch": 0.29, "learning_rate": 0.00025619187153488193, "loss": 0.0673, "step": 45250 }, { "epoch": 0.29, "learning_rate": 0.00025618219018052495, "loss": 0.0605, "step": 45260 }, { "epoch": 0.29, "learning_rate": 0.00025617250882616803, "loss": 0.0762, "step": 45270 }, { "epoch": 0.29, "learning_rate": 0.0002561628274718111, "loss": 0.0688, "step": 45280 }, { "epoch": 0.29, "learning_rate": 0.00025615314611745414, "loss": 0.0673, "step": 45290 }, { "epoch": 0.29, "learning_rate": 0.0002561434647630972, "loss": 0.0794, "step": 45300 }, { "epoch": 0.29, "learning_rate": 0.0002561337834087403, "loss": 0.0654, "step": 45310 }, { "epoch": 0.29, "learning_rate": 0.0002561241020543834, "loss": 0.0693, "step": 45320 }, { "epoch": 0.29, "learning_rate": 0.0002561144207000264, "loss": 0.0638, "step": 45330 }, { "epoch": 0.29, "learning_rate": 0.0002561047393456695, "loss": 0.06, "step": 45340 }, { "epoch": 0.29, "learning_rate": 0.00025609505799131256, "loss": 0.0642, "step": 45350 }, { "epoch": 0.29, "learning_rate": 0.00025608537663695564, "loss": 0.0681, "step": 45360 }, { "epoch": 0.29, "learning_rate": 0.0002560756952825987, "loss": 0.0674, "step": 45370 }, { "epoch": 0.29, "learning_rate": 0.0002560660139282418, "loss": 0.0648, "step": 45380 }, { "epoch": 0.29, "learning_rate": 0.0002560563325738849, "loss": 0.0665, "step": 45390 }, { "epoch": 0.29, "learning_rate": 0.0002560466512195279, "loss": 0.0688, "step": 45400 }, { "epoch": 0.29, "learning_rate": 0.000256036969865171, "loss": 0.0669, "step": 45410 }, { "epoch": 0.29, "learning_rate": 0.00025602728851081407, "loss": 0.0691, "step": 45420 }, { "epoch": 0.29, "learning_rate": 0.0002560176071564571, "loss": 0.0633, "step": 45430 }, { "epoch": 0.29, "learning_rate": 0.0002560079258021002, "loss": 0.0652, "step": 45440 }, { "epoch": 0.29, "learning_rate": 0.00025599824444774325, "loss": 0.0664, "step": 45450 }, { "epoch": 0.29, "learning_rate": 0.00025598856309338633, "loss": 0.0576, "step": 45460 }, { "epoch": 0.29, "learning_rate": 0.00025597888173902936, "loss": 0.0624, "step": 45470 }, { "epoch": 0.29, "learning_rate": 0.00025596920038467244, "loss": 0.0687, "step": 45480 }, { "epoch": 0.29, "learning_rate": 0.0002559595190303155, "loss": 0.0691, "step": 45490 }, { "epoch": 0.29, "learning_rate": 0.0002559498376759586, "loss": 0.0665, "step": 45500 }, { "epoch": 0.29, "learning_rate": 0.0002559401563216017, "loss": 0.0639, "step": 45510 }, { "epoch": 0.29, "learning_rate": 0.00025593047496724476, "loss": 0.0681, "step": 45520 }, { "epoch": 0.29, "learning_rate": 0.0002559207936128878, "loss": 0.0714, "step": 45530 }, { "epoch": 0.29, "learning_rate": 0.00025591111225853086, "loss": 0.0622, "step": 45540 }, { "epoch": 0.29, "learning_rate": 0.00025590143090417394, "loss": 0.068, "step": 45550 }, { "epoch": 0.29, "learning_rate": 0.00025589174954981697, "loss": 0.0679, "step": 45560 }, { "epoch": 0.29, "learning_rate": 0.00025588206819546005, "loss": 0.0748, "step": 45570 }, { "epoch": 0.29, "learning_rate": 0.00025587238684110313, "loss": 0.0667, "step": 45580 }, { "epoch": 0.29, "learning_rate": 0.0002558627054867462, "loss": 0.0679, "step": 45590 }, { "epoch": 0.29, "learning_rate": 0.0002558530241323893, "loss": 0.07, "step": 45600 }, { "epoch": 0.29, "learning_rate": 0.0002558433427780323, "loss": 0.0647, "step": 45610 }, { "epoch": 0.29, "learning_rate": 0.0002558336614236754, "loss": 0.07, "step": 45620 }, { "epoch": 0.29, "learning_rate": 0.0002558239800693185, "loss": 0.0591, "step": 45630 }, { "epoch": 0.29, "learning_rate": 0.00025581429871496155, "loss": 0.0748, "step": 45640 }, { "epoch": 0.29, "learning_rate": 0.00025580461736060463, "loss": 0.0684, "step": 45650 }, { "epoch": 0.29, "learning_rate": 0.0002557949360062477, "loss": 0.0585, "step": 45660 }, { "epoch": 0.29, "learning_rate": 0.00025578525465189074, "loss": 0.068, "step": 45670 }, { "epoch": 0.29, "learning_rate": 0.0002557755732975338, "loss": 0.067, "step": 45680 }, { "epoch": 0.29, "learning_rate": 0.00025576589194317684, "loss": 0.0695, "step": 45690 }, { "epoch": 0.29, "learning_rate": 0.0002557562105888199, "loss": 0.0614, "step": 45700 }, { "epoch": 0.3, "learning_rate": 0.000255746529234463, "loss": 0.0618, "step": 45710 }, { "epoch": 0.3, "learning_rate": 0.0002557368478801061, "loss": 0.065, "step": 45720 }, { "epoch": 0.3, "learning_rate": 0.00025572716652574916, "loss": 0.0662, "step": 45730 }, { "epoch": 0.3, "learning_rate": 0.00025571748517139224, "loss": 0.0653, "step": 45740 }, { "epoch": 0.3, "learning_rate": 0.00025570780381703527, "loss": 0.0651, "step": 45750 }, { "epoch": 0.3, "learning_rate": 0.00025569812246267835, "loss": 0.0618, "step": 45760 }, { "epoch": 0.3, "learning_rate": 0.00025568844110832143, "loss": 0.0706, "step": 45770 }, { "epoch": 0.3, "learning_rate": 0.0002556787597539645, "loss": 0.0779, "step": 45780 }, { "epoch": 0.3, "learning_rate": 0.0002556690783996076, "loss": 0.0739, "step": 45790 }, { "epoch": 0.3, "learning_rate": 0.0002556593970452506, "loss": 0.0755, "step": 45800 }, { "epoch": 0.3, "learning_rate": 0.0002556497156908937, "loss": 0.0684, "step": 45810 }, { "epoch": 0.3, "learning_rate": 0.00025564003433653677, "loss": 0.0649, "step": 45820 }, { "epoch": 0.3, "learning_rate": 0.0002556303529821798, "loss": 0.0682, "step": 45830 }, { "epoch": 0.3, "learning_rate": 0.0002556206716278229, "loss": 0.0622, "step": 45840 }, { "epoch": 0.3, "learning_rate": 0.00025561099027346596, "loss": 0.0626, "step": 45850 }, { "epoch": 0.3, "learning_rate": 0.00025560130891910904, "loss": 0.0741, "step": 45860 }, { "epoch": 0.3, "learning_rate": 0.0002555916275647521, "loss": 0.0659, "step": 45870 }, { "epoch": 0.3, "learning_rate": 0.0002555819462103952, "loss": 0.0723, "step": 45880 }, { "epoch": 0.3, "learning_rate": 0.0002555722648560382, "loss": 0.0642, "step": 45890 }, { "epoch": 0.3, "learning_rate": 0.0002555625835016813, "loss": 0.071, "step": 45900 }, { "epoch": 0.3, "learning_rate": 0.0002555529021473244, "loss": 0.064, "step": 45910 }, { "epoch": 0.3, "learning_rate": 0.00025554322079296746, "loss": 0.0663, "step": 45920 }, { "epoch": 0.3, "learning_rate": 0.0002555335394386105, "loss": 0.0715, "step": 45930 }, { "epoch": 0.3, "learning_rate": 0.00025552385808425357, "loss": 0.0687, "step": 45940 }, { "epoch": 0.3, "learning_rate": 0.00025551417672989665, "loss": 0.0753, "step": 45950 }, { "epoch": 0.3, "learning_rate": 0.0002555044953755397, "loss": 0.068, "step": 45960 }, { "epoch": 0.3, "learning_rate": 0.00025549481402118275, "loss": 0.0648, "step": 45970 }, { "epoch": 0.3, "learning_rate": 0.00025548513266682583, "loss": 0.0669, "step": 45980 }, { "epoch": 0.3, "learning_rate": 0.0002554754513124689, "loss": 0.0662, "step": 45990 }, { "epoch": 0.3, "learning_rate": 0.000255465769958112, "loss": 0.0649, "step": 46000 }, { "epoch": 0.3, "eval_cer": 0.9200388656648967, "eval_loss": 0.04449348524212837, "eval_runtime": 120.161, "eval_samples_per_second": 16.644, "eval_steps_per_second": 4.161, "step": 46000 }, { "epoch": 0.3, "learning_rate": 0.00025545608860375507, "loss": 0.0767, "step": 46010 }, { "epoch": 0.3, "learning_rate": 0.00025544640724939815, "loss": 0.0647, "step": 46020 }, { "epoch": 0.3, "learning_rate": 0.0002554367258950412, "loss": 0.0625, "step": 46030 }, { "epoch": 0.3, "learning_rate": 0.00025542704454068426, "loss": 0.0721, "step": 46040 }, { "epoch": 0.3, "learning_rate": 0.00025541736318632734, "loss": 0.0633, "step": 46050 }, { "epoch": 0.3, "learning_rate": 0.0002554076818319704, "loss": 0.0611, "step": 46060 }, { "epoch": 0.3, "learning_rate": 0.00025539800047761344, "loss": 0.0655, "step": 46070 }, { "epoch": 0.3, "learning_rate": 0.0002553883191232565, "loss": 0.0611, "step": 46080 }, { "epoch": 0.3, "learning_rate": 0.0002553786377688996, "loss": 0.0644, "step": 46090 }, { "epoch": 0.3, "learning_rate": 0.00025536895641454263, "loss": 0.0626, "step": 46100 }, { "epoch": 0.3, "learning_rate": 0.0002553592750601857, "loss": 0.0716, "step": 46110 }, { "epoch": 0.3, "learning_rate": 0.0002553495937058288, "loss": 0.0608, "step": 46120 }, { "epoch": 0.3, "learning_rate": 0.00025533991235147187, "loss": 0.0611, "step": 46130 }, { "epoch": 0.3, "learning_rate": 0.00025533023099711495, "loss": 0.0703, "step": 46140 }, { "epoch": 0.3, "learning_rate": 0.000255320549642758, "loss": 0.0652, "step": 46150 }, { "epoch": 0.3, "learning_rate": 0.0002553108682884011, "loss": 0.0652, "step": 46160 }, { "epoch": 0.3, "learning_rate": 0.00025530118693404413, "loss": 0.0731, "step": 46170 }, { "epoch": 0.3, "learning_rate": 0.0002552915055796872, "loss": 0.0669, "step": 46180 }, { "epoch": 0.3, "learning_rate": 0.0002552818242253303, "loss": 0.0674, "step": 46190 }, { "epoch": 0.3, "learning_rate": 0.0002552721428709733, "loss": 0.0676, "step": 46200 }, { "epoch": 0.3, "learning_rate": 0.0002552624615166164, "loss": 0.0677, "step": 46210 }, { "epoch": 0.3, "learning_rate": 0.0002552527801622595, "loss": 0.0591, "step": 46220 }, { "epoch": 0.3, "learning_rate": 0.00025524309880790256, "loss": 0.0644, "step": 46230 }, { "epoch": 0.3, "learning_rate": 0.0002552334174535456, "loss": 0.0715, "step": 46240 }, { "epoch": 0.3, "learning_rate": 0.00025522373609918866, "loss": 0.0703, "step": 46250 }, { "epoch": 0.3, "learning_rate": 0.00025521405474483174, "loss": 0.0733, "step": 46260 }, { "epoch": 0.3, "learning_rate": 0.0002552043733904748, "loss": 0.0597, "step": 46270 }, { "epoch": 0.3, "learning_rate": 0.0002551946920361179, "loss": 0.0608, "step": 46280 }, { "epoch": 0.3, "learning_rate": 0.000255185010681761, "loss": 0.0695, "step": 46290 }, { "epoch": 0.3, "learning_rate": 0.000255175329327404, "loss": 0.0592, "step": 46300 }, { "epoch": 0.3, "learning_rate": 0.0002551656479730471, "loss": 0.0541, "step": 46310 }, { "epoch": 0.3, "learning_rate": 0.00025515596661869017, "loss": 0.0623, "step": 46320 }, { "epoch": 0.3, "learning_rate": 0.0002551462852643332, "loss": 0.0727, "step": 46330 }, { "epoch": 0.3, "learning_rate": 0.00025513660390997627, "loss": 0.0663, "step": 46340 }, { "epoch": 0.3, "learning_rate": 0.00025512692255561935, "loss": 0.0573, "step": 46350 }, { "epoch": 0.3, "learning_rate": 0.00025511724120126243, "loss": 0.0562, "step": 46360 }, { "epoch": 0.3, "learning_rate": 0.0002551075598469055, "loss": 0.062, "step": 46370 }, { "epoch": 0.3, "learning_rate": 0.00025509787849254854, "loss": 0.0649, "step": 46380 }, { "epoch": 0.3, "learning_rate": 0.0002550881971381916, "loss": 0.0702, "step": 46390 }, { "epoch": 0.3, "learning_rate": 0.0002550785157838347, "loss": 0.0658, "step": 46400 }, { "epoch": 0.3, "learning_rate": 0.0002550688344294778, "loss": 0.0727, "step": 46410 }, { "epoch": 0.3, "learning_rate": 0.00025505915307512086, "loss": 0.074, "step": 46420 }, { "epoch": 0.3, "learning_rate": 0.00025504947172076394, "loss": 0.0668, "step": 46430 }, { "epoch": 0.3, "learning_rate": 0.00025503979036640696, "loss": 0.0767, "step": 46440 }, { "epoch": 0.3, "learning_rate": 0.00025503010901205004, "loss": 0.067, "step": 46450 }, { "epoch": 0.3, "learning_rate": 0.0002550204276576931, "loss": 0.0807, "step": 46460 }, { "epoch": 0.3, "learning_rate": 0.00025501074630333615, "loss": 0.0659, "step": 46470 }, { "epoch": 0.3, "learning_rate": 0.0002550010649489792, "loss": 0.0657, "step": 46480 }, { "epoch": 0.3, "learning_rate": 0.0002549913835946223, "loss": 0.0723, "step": 46490 }, { "epoch": 0.3, "learning_rate": 0.0002549817022402654, "loss": 0.0594, "step": 46500 }, { "epoch": 0.3, "learning_rate": 0.00025497202088590847, "loss": 0.0629, "step": 46510 }, { "epoch": 0.3, "learning_rate": 0.0002549623395315515, "loss": 0.0661, "step": 46520 }, { "epoch": 0.3, "learning_rate": 0.00025495265817719457, "loss": 0.066, "step": 46530 }, { "epoch": 0.3, "learning_rate": 0.00025494297682283765, "loss": 0.0602, "step": 46540 }, { "epoch": 0.3, "learning_rate": 0.00025493329546848073, "loss": 0.0605, "step": 46550 }, { "epoch": 0.3, "learning_rate": 0.0002549236141141238, "loss": 0.0713, "step": 46560 }, { "epoch": 0.3, "learning_rate": 0.00025491393275976684, "loss": 0.0715, "step": 46570 }, { "epoch": 0.3, "learning_rate": 0.0002549042514054099, "loss": 0.0682, "step": 46580 }, { "epoch": 0.3, "learning_rate": 0.000254894570051053, "loss": 0.0737, "step": 46590 }, { "epoch": 0.3, "learning_rate": 0.000254884888696696, "loss": 0.0627, "step": 46600 }, { "epoch": 0.3, "learning_rate": 0.0002548752073423391, "loss": 0.0646, "step": 46610 }, { "epoch": 0.3, "learning_rate": 0.0002548655259879822, "loss": 0.0604, "step": 46620 }, { "epoch": 0.3, "learning_rate": 0.00025485584463362526, "loss": 0.0631, "step": 46630 }, { "epoch": 0.3, "learning_rate": 0.00025484616327926834, "loss": 0.066, "step": 46640 }, { "epoch": 0.3, "learning_rate": 0.0002548364819249114, "loss": 0.0631, "step": 46650 }, { "epoch": 0.3, "learning_rate": 0.00025482680057055445, "loss": 0.0655, "step": 46660 }, { "epoch": 0.3, "learning_rate": 0.0002548171192161975, "loss": 0.063, "step": 46670 }, { "epoch": 0.3, "learning_rate": 0.0002548074378618406, "loss": 0.0702, "step": 46680 }, { "epoch": 0.3, "learning_rate": 0.0002547977565074837, "loss": 0.0603, "step": 46690 }, { "epoch": 0.3, "learning_rate": 0.0002547880751531267, "loss": 0.0612, "step": 46700 }, { "epoch": 0.3, "learning_rate": 0.0002547783937987698, "loss": 0.0783, "step": 46710 }, { "epoch": 0.3, "learning_rate": 0.00025476871244441287, "loss": 0.0734, "step": 46720 }, { "epoch": 0.3, "learning_rate": 0.0002547590310900559, "loss": 0.0591, "step": 46730 }, { "epoch": 0.3, "learning_rate": 0.000254749349735699, "loss": 0.0668, "step": 46740 }, { "epoch": 0.3, "learning_rate": 0.00025473966838134205, "loss": 0.0613, "step": 46750 }, { "epoch": 0.3, "learning_rate": 0.00025472998702698513, "loss": 0.0617, "step": 46760 }, { "epoch": 0.3, "learning_rate": 0.0002547203056726282, "loss": 0.0716, "step": 46770 }, { "epoch": 0.3, "learning_rate": 0.0002547106243182713, "loss": 0.0663, "step": 46780 }, { "epoch": 0.3, "learning_rate": 0.0002547009429639144, "loss": 0.075, "step": 46790 }, { "epoch": 0.3, "learning_rate": 0.0002546912616095574, "loss": 0.0644, "step": 46800 }, { "epoch": 0.3, "learning_rate": 0.0002546815802552005, "loss": 0.0695, "step": 46810 }, { "epoch": 0.3, "learning_rate": 0.00025467189890084356, "loss": 0.0636, "step": 46820 }, { "epoch": 0.3, "learning_rate": 0.00025466221754648664, "loss": 0.0619, "step": 46830 }, { "epoch": 0.3, "learning_rate": 0.00025465253619212966, "loss": 0.0599, "step": 46840 }, { "epoch": 0.3, "learning_rate": 0.00025464285483777274, "loss": 0.0679, "step": 46850 }, { "epoch": 0.3, "learning_rate": 0.0002546331734834158, "loss": 0.0606, "step": 46860 }, { "epoch": 0.3, "learning_rate": 0.00025462349212905885, "loss": 0.0703, "step": 46870 }, { "epoch": 0.3, "learning_rate": 0.00025461381077470193, "loss": 0.0722, "step": 46880 }, { "epoch": 0.3, "learning_rate": 0.000254604129420345, "loss": 0.0653, "step": 46890 }, { "epoch": 0.3, "learning_rate": 0.0002545944480659881, "loss": 0.0623, "step": 46900 }, { "epoch": 0.3, "learning_rate": 0.00025458476671163117, "loss": 0.0648, "step": 46910 }, { "epoch": 0.3, "learning_rate": 0.00025457508535727425, "loss": 0.0675, "step": 46920 }, { "epoch": 0.3, "learning_rate": 0.00025456540400291733, "loss": 0.0837, "step": 46930 }, { "epoch": 0.3, "learning_rate": 0.00025455572264856035, "loss": 0.0673, "step": 46940 }, { "epoch": 0.3, "learning_rate": 0.00025454604129420343, "loss": 0.0734, "step": 46950 }, { "epoch": 0.3, "learning_rate": 0.0002545363599398465, "loss": 0.0666, "step": 46960 }, { "epoch": 0.3, "learning_rate": 0.00025452667858548954, "loss": 0.0684, "step": 46970 }, { "epoch": 0.3, "learning_rate": 0.0002545169972311326, "loss": 0.0692, "step": 46980 }, { "epoch": 0.3, "learning_rate": 0.0002545073158767757, "loss": 0.0638, "step": 46990 }, { "epoch": 0.3, "learning_rate": 0.0002544976345224188, "loss": 0.069, "step": 47000 }, { "epoch": 0.3, "eval_cer": 0.9200750197717772, "eval_loss": 0.04444407671689987, "eval_runtime": 120.1079, "eval_samples_per_second": 16.652, "eval_steps_per_second": 4.163, "step": 47000 }, { "epoch": 0.3, "learning_rate": 0.0002544879531680618, "loss": 0.0689, "step": 47010 }, { "epoch": 0.3, "learning_rate": 0.0002544782718137049, "loss": 0.0668, "step": 47020 }, { "epoch": 0.3, "learning_rate": 0.00025446859045934796, "loss": 0.0648, "step": 47030 }, { "epoch": 0.3, "learning_rate": 0.00025445890910499104, "loss": 0.0723, "step": 47040 }, { "epoch": 0.3, "learning_rate": 0.0002544492277506341, "loss": 0.0617, "step": 47050 }, { "epoch": 0.3, "learning_rate": 0.0002544395463962772, "loss": 0.0603, "step": 47060 }, { "epoch": 0.3, "learning_rate": 0.00025442986504192023, "loss": 0.063, "step": 47070 }, { "epoch": 0.3, "learning_rate": 0.0002544201836875633, "loss": 0.0666, "step": 47080 }, { "epoch": 0.3, "learning_rate": 0.0002544105023332064, "loss": 0.0681, "step": 47090 }, { "epoch": 0.3, "learning_rate": 0.0002544008209788494, "loss": 0.0644, "step": 47100 }, { "epoch": 0.3, "learning_rate": 0.0002543911396244925, "loss": 0.0732, "step": 47110 }, { "epoch": 0.3, "learning_rate": 0.0002543814582701356, "loss": 0.0647, "step": 47120 }, { "epoch": 0.3, "learning_rate": 0.00025437177691577865, "loss": 0.062, "step": 47130 }, { "epoch": 0.3, "learning_rate": 0.00025436209556142173, "loss": 0.0628, "step": 47140 }, { "epoch": 0.3, "learning_rate": 0.00025435241420706476, "loss": 0.0571, "step": 47150 }, { "epoch": 0.3, "learning_rate": 0.00025434273285270784, "loss": 0.0671, "step": 47160 }, { "epoch": 0.3, "learning_rate": 0.0002543330514983509, "loss": 0.0713, "step": 47170 }, { "epoch": 0.3, "learning_rate": 0.000254323370143994, "loss": 0.0651, "step": 47180 }, { "epoch": 0.3, "learning_rate": 0.0002543136887896371, "loss": 0.0639, "step": 47190 }, { "epoch": 0.3, "learning_rate": 0.00025430400743528016, "loss": 0.0611, "step": 47200 }, { "epoch": 0.3, "learning_rate": 0.0002542943260809232, "loss": 0.0634, "step": 47210 }, { "epoch": 0.3, "learning_rate": 0.00025428464472656626, "loss": 0.0589, "step": 47220 }, { "epoch": 0.3, "learning_rate": 0.00025427496337220934, "loss": 0.0645, "step": 47230 }, { "epoch": 0.3, "learning_rate": 0.00025426528201785237, "loss": 0.0743, "step": 47240 }, { "epoch": 0.3, "learning_rate": 0.00025425560066349545, "loss": 0.072, "step": 47250 }, { "epoch": 0.31, "learning_rate": 0.00025424591930913853, "loss": 0.066, "step": 47260 }, { "epoch": 0.31, "learning_rate": 0.0002542362379547816, "loss": 0.062, "step": 47270 }, { "epoch": 0.31, "learning_rate": 0.0002542265566004247, "loss": 0.0658, "step": 47280 }, { "epoch": 0.31, "learning_rate": 0.0002542168752460677, "loss": 0.0617, "step": 47290 }, { "epoch": 0.31, "learning_rate": 0.0002542071938917108, "loss": 0.0633, "step": 47300 }, { "epoch": 0.31, "learning_rate": 0.00025419751253735387, "loss": 0.0649, "step": 47310 }, { "epoch": 0.31, "learning_rate": 0.00025418783118299695, "loss": 0.0664, "step": 47320 }, { "epoch": 0.31, "learning_rate": 0.00025417814982864003, "loss": 0.0677, "step": 47330 }, { "epoch": 0.31, "learning_rate": 0.00025416846847428306, "loss": 0.0754, "step": 47340 }, { "epoch": 0.31, "learning_rate": 0.00025415878711992614, "loss": 0.0712, "step": 47350 }, { "epoch": 0.31, "learning_rate": 0.0002541491057655692, "loss": 0.0717, "step": 47360 }, { "epoch": 0.31, "learning_rate": 0.00025413942441121224, "loss": 0.0749, "step": 47370 }, { "epoch": 0.31, "learning_rate": 0.0002541297430568553, "loss": 0.0669, "step": 47380 }, { "epoch": 0.31, "learning_rate": 0.0002541200617024984, "loss": 0.078, "step": 47390 }, { "epoch": 0.31, "learning_rate": 0.0002541103803481415, "loss": 0.0703, "step": 47400 }, { "epoch": 0.31, "learning_rate": 0.00025410069899378456, "loss": 0.065, "step": 47410 }, { "epoch": 0.31, "learning_rate": 0.00025409101763942764, "loss": 0.0667, "step": 47420 }, { "epoch": 0.31, "learning_rate": 0.00025408133628507067, "loss": 0.0589, "step": 47430 }, { "epoch": 0.31, "learning_rate": 0.00025407165493071375, "loss": 0.0701, "step": 47440 }, { "epoch": 0.31, "learning_rate": 0.00025406197357635683, "loss": 0.066, "step": 47450 }, { "epoch": 0.31, "learning_rate": 0.0002540522922219999, "loss": 0.0632, "step": 47460 }, { "epoch": 0.31, "learning_rate": 0.00025404261086764293, "loss": 0.0676, "step": 47470 }, { "epoch": 0.31, "learning_rate": 0.000254032929513286, "loss": 0.0624, "step": 47480 }, { "epoch": 0.31, "learning_rate": 0.0002540232481589291, "loss": 0.0627, "step": 47490 }, { "epoch": 0.31, "learning_rate": 0.0002540135668045721, "loss": 0.061, "step": 47500 }, { "epoch": 0.31, "learning_rate": 0.0002540038854502152, "loss": 0.07, "step": 47510 }, { "epoch": 0.31, "learning_rate": 0.0002539942040958583, "loss": 0.0615, "step": 47520 }, { "epoch": 0.31, "learning_rate": 0.00025398452274150136, "loss": 0.0609, "step": 47530 }, { "epoch": 0.31, "learning_rate": 0.00025397484138714444, "loss": 0.0671, "step": 47540 }, { "epoch": 0.31, "learning_rate": 0.0002539651600327875, "loss": 0.0684, "step": 47550 }, { "epoch": 0.31, "learning_rate": 0.0002539554786784306, "loss": 0.0678, "step": 47560 }, { "epoch": 0.31, "learning_rate": 0.0002539457973240736, "loss": 0.0583, "step": 47570 }, { "epoch": 0.31, "learning_rate": 0.0002539361159697167, "loss": 0.0624, "step": 47580 }, { "epoch": 0.31, "learning_rate": 0.0002539264346153598, "loss": 0.0639, "step": 47590 }, { "epoch": 0.31, "learning_rate": 0.00025391675326100286, "loss": 0.063, "step": 47600 }, { "epoch": 0.31, "learning_rate": 0.0002539070719066459, "loss": 0.0684, "step": 47610 }, { "epoch": 0.31, "learning_rate": 0.00025389739055228897, "loss": 0.0678, "step": 47620 }, { "epoch": 0.31, "learning_rate": 0.00025388770919793205, "loss": 0.0648, "step": 47630 }, { "epoch": 0.31, "learning_rate": 0.00025387802784357507, "loss": 0.0697, "step": 47640 }, { "epoch": 0.31, "learning_rate": 0.00025386834648921815, "loss": 0.0725, "step": 47650 }, { "epoch": 0.31, "learning_rate": 0.00025385866513486123, "loss": 0.0628, "step": 47660 }, { "epoch": 0.31, "learning_rate": 0.0002538489837805043, "loss": 0.0628, "step": 47670 }, { "epoch": 0.31, "learning_rate": 0.0002538393024261474, "loss": 0.0591, "step": 47680 }, { "epoch": 0.31, "learning_rate": 0.00025382962107179047, "loss": 0.0637, "step": 47690 }, { "epoch": 0.31, "learning_rate": 0.00025381993971743355, "loss": 0.0723, "step": 47700 }, { "epoch": 0.31, "learning_rate": 0.0002538102583630766, "loss": 0.0576, "step": 47710 }, { "epoch": 0.31, "learning_rate": 0.00025380057700871966, "loss": 0.0602, "step": 47720 }, { "epoch": 0.31, "learning_rate": 0.00025379089565436274, "loss": 0.0605, "step": 47730 }, { "epoch": 0.31, "learning_rate": 0.00025378121430000576, "loss": 0.0669, "step": 47740 }, { "epoch": 0.31, "learning_rate": 0.00025377153294564884, "loss": 0.0639, "step": 47750 }, { "epoch": 0.31, "learning_rate": 0.0002537618515912919, "loss": 0.0623, "step": 47760 }, { "epoch": 0.31, "learning_rate": 0.000253752170236935, "loss": 0.0622, "step": 47770 }, { "epoch": 0.31, "learning_rate": 0.000253742488882578, "loss": 0.0635, "step": 47780 }, { "epoch": 0.31, "learning_rate": 0.0002537328075282211, "loss": 0.0647, "step": 47790 }, { "epoch": 0.31, "learning_rate": 0.0002537231261738642, "loss": 0.0568, "step": 47800 }, { "epoch": 0.31, "learning_rate": 0.00025371344481950727, "loss": 0.061, "step": 47810 }, { "epoch": 0.31, "learning_rate": 0.00025370376346515035, "loss": 0.0626, "step": 47820 }, { "epoch": 0.31, "learning_rate": 0.0002536940821107934, "loss": 0.0632, "step": 47830 }, { "epoch": 0.31, "learning_rate": 0.0002536844007564365, "loss": 0.0648, "step": 47840 }, { "epoch": 0.31, "learning_rate": 0.00025367471940207953, "loss": 0.0839, "step": 47850 }, { "epoch": 0.31, "learning_rate": 0.0002536650380477226, "loss": 0.0665, "step": 47860 }, { "epoch": 0.31, "learning_rate": 0.00025365535669336564, "loss": 0.0616, "step": 47870 }, { "epoch": 0.31, "learning_rate": 0.0002536456753390087, "loss": 0.0705, "step": 47880 }, { "epoch": 0.31, "learning_rate": 0.0002536359939846518, "loss": 0.0654, "step": 47890 }, { "epoch": 0.31, "learning_rate": 0.0002536263126302949, "loss": 0.0675, "step": 47900 }, { "epoch": 0.31, "learning_rate": 0.00025361663127593796, "loss": 0.0669, "step": 47910 }, { "epoch": 0.31, "learning_rate": 0.000253606949921581, "loss": 0.0687, "step": 47920 }, { "epoch": 0.31, "learning_rate": 0.00025359726856722406, "loss": 0.0632, "step": 47930 }, { "epoch": 0.31, "learning_rate": 0.00025358758721286714, "loss": 0.0637, "step": 47940 }, { "epoch": 0.31, "learning_rate": 0.0002535779058585102, "loss": 0.0687, "step": 47950 }, { "epoch": 0.31, "learning_rate": 0.0002535682245041533, "loss": 0.0601, "step": 47960 }, { "epoch": 0.31, "learning_rate": 0.0002535585431497964, "loss": 0.0672, "step": 47970 }, { "epoch": 0.31, "learning_rate": 0.0002535488617954394, "loss": 0.056, "step": 47980 }, { "epoch": 0.31, "learning_rate": 0.0002535391804410825, "loss": 0.0616, "step": 47990 }, { "epoch": 0.31, "learning_rate": 0.00025352949908672557, "loss": 0.0655, "step": 48000 }, { "epoch": 0.31, "eval_cer": 0.9200316348435205, "eval_loss": 0.043291497975587845, "eval_runtime": 120.1252, "eval_samples_per_second": 16.649, "eval_steps_per_second": 4.162, "step": 48000 }, { "epoch": 0.31, "learning_rate": 0.0002535198177323686, "loss": 0.059, "step": 48010 }, { "epoch": 0.31, "learning_rate": 0.00025351013637801167, "loss": 0.0606, "step": 48020 }, { "epoch": 0.31, "learning_rate": 0.00025350045502365475, "loss": 0.0655, "step": 48030 }, { "epoch": 0.31, "learning_rate": 0.00025349077366929783, "loss": 0.0566, "step": 48040 }, { "epoch": 0.31, "learning_rate": 0.0002534810923149409, "loss": 0.0613, "step": 48050 }, { "epoch": 0.31, "learning_rate": 0.00025347141096058394, "loss": 0.0607, "step": 48060 }, { "epoch": 0.31, "learning_rate": 0.000253461729606227, "loss": 0.0685, "step": 48070 }, { "epoch": 0.31, "learning_rate": 0.0002534520482518701, "loss": 0.0636, "step": 48080 }, { "epoch": 0.31, "learning_rate": 0.0002534423668975132, "loss": 0.0621, "step": 48090 }, { "epoch": 0.31, "learning_rate": 0.00025343268554315625, "loss": 0.0653, "step": 48100 }, { "epoch": 0.31, "learning_rate": 0.0002534230041887993, "loss": 0.0652, "step": 48110 }, { "epoch": 0.31, "learning_rate": 0.00025341332283444236, "loss": 0.0637, "step": 48120 }, { "epoch": 0.31, "learning_rate": 0.00025340364148008544, "loss": 0.074, "step": 48130 }, { "epoch": 0.31, "learning_rate": 0.00025339396012572847, "loss": 0.0688, "step": 48140 }, { "epoch": 0.31, "learning_rate": 0.00025338427877137155, "loss": 0.0654, "step": 48150 }, { "epoch": 0.31, "learning_rate": 0.0002533745974170146, "loss": 0.0652, "step": 48160 }, { "epoch": 0.31, "learning_rate": 0.0002533649160626577, "loss": 0.0709, "step": 48170 }, { "epoch": 0.31, "learning_rate": 0.0002533552347083008, "loss": 0.057, "step": 48180 }, { "epoch": 0.31, "learning_rate": 0.00025334555335394386, "loss": 0.0617, "step": 48190 }, { "epoch": 0.31, "learning_rate": 0.0002533358719995869, "loss": 0.0739, "step": 48200 }, { "epoch": 0.31, "learning_rate": 0.00025332619064522997, "loss": 0.0703, "step": 48210 }, { "epoch": 0.31, "learning_rate": 0.00025331650929087305, "loss": 0.0711, "step": 48220 }, { "epoch": 0.31, "learning_rate": 0.00025330682793651613, "loss": 0.0656, "step": 48230 }, { "epoch": 0.31, "learning_rate": 0.0002532971465821592, "loss": 0.0709, "step": 48240 }, { "epoch": 0.31, "learning_rate": 0.00025328746522780223, "loss": 0.0664, "step": 48250 }, { "epoch": 0.31, "learning_rate": 0.0002532777838734453, "loss": 0.0576, "step": 48260 }, { "epoch": 0.31, "learning_rate": 0.00025326810251908834, "loss": 0.0598, "step": 48270 }, { "epoch": 0.31, "learning_rate": 0.0002532584211647314, "loss": 0.0579, "step": 48280 }, { "epoch": 0.31, "learning_rate": 0.0002532487398103745, "loss": 0.0584, "step": 48290 }, { "epoch": 0.31, "learning_rate": 0.0002532390584560176, "loss": 0.0717, "step": 48300 }, { "epoch": 0.31, "learning_rate": 0.00025322937710166066, "loss": 0.0635, "step": 48310 }, { "epoch": 0.31, "learning_rate": 0.00025321969574730374, "loss": 0.0675, "step": 48320 }, { "epoch": 0.31, "learning_rate": 0.0002532100143929468, "loss": 0.0682, "step": 48330 }, { "epoch": 0.31, "learning_rate": 0.00025320033303858984, "loss": 0.0581, "step": 48340 }, { "epoch": 0.31, "learning_rate": 0.0002531906516842329, "loss": 0.0626, "step": 48350 }, { "epoch": 0.31, "learning_rate": 0.000253180970329876, "loss": 0.0534, "step": 48360 }, { "epoch": 0.31, "learning_rate": 0.0002531712889755191, "loss": 0.063, "step": 48370 }, { "epoch": 0.31, "learning_rate": 0.0002531616076211621, "loss": 0.062, "step": 48380 }, { "epoch": 0.31, "learning_rate": 0.0002531519262668052, "loss": 0.0688, "step": 48390 }, { "epoch": 0.31, "learning_rate": 0.00025314224491244827, "loss": 0.069, "step": 48400 }, { "epoch": 0.31, "learning_rate": 0.0002531325635580913, "loss": 0.0714, "step": 48410 }, { "epoch": 0.31, "learning_rate": 0.0002531228822037344, "loss": 0.0657, "step": 48420 }, { "epoch": 0.31, "learning_rate": 0.00025311320084937745, "loss": 0.0691, "step": 48430 }, { "epoch": 0.31, "learning_rate": 0.00025310351949502053, "loss": 0.0593, "step": 48440 }, { "epoch": 0.31, "learning_rate": 0.0002530938381406636, "loss": 0.061, "step": 48450 }, { "epoch": 0.31, "learning_rate": 0.0002530841567863067, "loss": 0.073, "step": 48460 }, { "epoch": 0.31, "learning_rate": 0.0002530744754319498, "loss": 0.0719, "step": 48470 }, { "epoch": 0.31, "learning_rate": 0.0002530647940775928, "loss": 0.0629, "step": 48480 }, { "epoch": 0.31, "learning_rate": 0.0002530551127232359, "loss": 0.069, "step": 48490 }, { "epoch": 0.31, "learning_rate": 0.00025304543136887896, "loss": 0.067, "step": 48500 }, { "epoch": 0.31, "learning_rate": 0.000253035750014522, "loss": 0.0707, "step": 48510 }, { "epoch": 0.31, "learning_rate": 0.00025302606866016506, "loss": 0.0651, "step": 48520 }, { "epoch": 0.31, "learning_rate": 0.00025301638730580814, "loss": 0.0644, "step": 48530 }, { "epoch": 0.31, "learning_rate": 0.0002530067059514512, "loss": 0.0626, "step": 48540 }, { "epoch": 0.31, "learning_rate": 0.00025299702459709425, "loss": 0.0572, "step": 48550 }, { "epoch": 0.31, "learning_rate": 0.00025298734324273733, "loss": 0.0598, "step": 48560 }, { "epoch": 0.31, "learning_rate": 0.0002529776618883804, "loss": 0.0613, "step": 48570 }, { "epoch": 0.31, "learning_rate": 0.0002529679805340235, "loss": 0.0669, "step": 48580 }, { "epoch": 0.31, "learning_rate": 0.00025295829917966657, "loss": 0.0673, "step": 48590 }, { "epoch": 0.31, "learning_rate": 0.00025294861782530965, "loss": 0.0653, "step": 48600 }, { "epoch": 0.31, "learning_rate": 0.00025293893647095273, "loss": 0.0609, "step": 48610 }, { "epoch": 0.31, "learning_rate": 0.00025292925511659575, "loss": 0.0621, "step": 48620 }, { "epoch": 0.31, "learning_rate": 0.00025291957376223883, "loss": 0.0724, "step": 48630 }, { "epoch": 0.31, "learning_rate": 0.0002529098924078819, "loss": 0.0593, "step": 48640 }, { "epoch": 0.31, "learning_rate": 0.00025290021105352494, "loss": 0.0646, "step": 48650 }, { "epoch": 0.31, "learning_rate": 0.000252890529699168, "loss": 0.0641, "step": 48660 }, { "epoch": 0.31, "learning_rate": 0.0002528808483448111, "loss": 0.0627, "step": 48670 }, { "epoch": 0.31, "learning_rate": 0.0002528711669904542, "loss": 0.0634, "step": 48680 }, { "epoch": 0.31, "learning_rate": 0.0002528614856360972, "loss": 0.0627, "step": 48690 }, { "epoch": 0.31, "learning_rate": 0.0002528518042817403, "loss": 0.0674, "step": 48700 }, { "epoch": 0.31, "learning_rate": 0.00025284212292738336, "loss": 0.0664, "step": 48710 }, { "epoch": 0.31, "learning_rate": 0.00025283244157302644, "loss": 0.0734, "step": 48720 }, { "epoch": 0.31, "learning_rate": 0.0002528227602186695, "loss": 0.0677, "step": 48730 }, { "epoch": 0.31, "learning_rate": 0.0002528130788643126, "loss": 0.0643, "step": 48740 }, { "epoch": 0.31, "learning_rate": 0.00025280339750995563, "loss": 0.0596, "step": 48750 }, { "epoch": 0.31, "learning_rate": 0.0002527937161555987, "loss": 0.0657, "step": 48760 }, { "epoch": 0.31, "learning_rate": 0.0002527840348012418, "loss": 0.0642, "step": 48770 }, { "epoch": 0.31, "learning_rate": 0.0002527743534468848, "loss": 0.0554, "step": 48780 }, { "epoch": 0.31, "learning_rate": 0.0002527646720925279, "loss": 0.0611, "step": 48790 }, { "epoch": 0.31, "learning_rate": 0.00025275499073817097, "loss": 0.0719, "step": 48800 }, { "epoch": 0.32, "learning_rate": 0.00025274530938381405, "loss": 0.0605, "step": 48810 }, { "epoch": 0.32, "learning_rate": 0.00025273562802945713, "loss": 0.0646, "step": 48820 }, { "epoch": 0.32, "learning_rate": 0.00025272594667510016, "loss": 0.0666, "step": 48830 }, { "epoch": 0.32, "learning_rate": 0.00025271626532074324, "loss": 0.0676, "step": 48840 }, { "epoch": 0.32, "learning_rate": 0.0002527065839663863, "loss": 0.0585, "step": 48850 }, { "epoch": 0.32, "learning_rate": 0.0002526969026120294, "loss": 0.0649, "step": 48860 }, { "epoch": 0.32, "learning_rate": 0.0002526872212576725, "loss": 0.0564, "step": 48870 }, { "epoch": 0.32, "learning_rate": 0.0002526775399033155, "loss": 0.0644, "step": 48880 }, { "epoch": 0.32, "learning_rate": 0.0002526678585489586, "loss": 0.0618, "step": 48890 }, { "epoch": 0.32, "learning_rate": 0.00025265817719460166, "loss": 0.0748, "step": 48900 }, { "epoch": 0.32, "learning_rate": 0.0002526484958402447, "loss": 0.0634, "step": 48910 }, { "epoch": 0.32, "learning_rate": 0.00025263881448588777, "loss": 0.0665, "step": 48920 }, { "epoch": 0.32, "learning_rate": 0.00025262913313153085, "loss": 0.0609, "step": 48930 }, { "epoch": 0.32, "learning_rate": 0.00025261945177717393, "loss": 0.0608, "step": 48940 }, { "epoch": 0.32, "learning_rate": 0.000252609770422817, "loss": 0.0623, "step": 48950 }, { "epoch": 0.32, "learning_rate": 0.0002526000890684601, "loss": 0.0561, "step": 48960 }, { "epoch": 0.32, "learning_rate": 0.0002525904077141031, "loss": 0.0576, "step": 48970 }, { "epoch": 0.32, "learning_rate": 0.0002525807263597462, "loss": 0.0609, "step": 48980 }, { "epoch": 0.32, "learning_rate": 0.00025257104500538927, "loss": 0.0618, "step": 48990 }, { "epoch": 0.32, "learning_rate": 0.00025256136365103235, "loss": 0.0592, "step": 49000 }, { "epoch": 0.32, "eval_cer": 0.9200677889504011, "eval_loss": 0.043937765061855316, "eval_runtime": 120.4874, "eval_samples_per_second": 16.599, "eval_steps_per_second": 4.15, "step": 49000 }, { "epoch": 0.32, "learning_rate": 0.00025255168229667543, "loss": 0.054, "step": 49010 }, { "epoch": 0.32, "learning_rate": 0.00025254200094231846, "loss": 0.0639, "step": 49020 }, { "epoch": 0.32, "learning_rate": 0.00025253231958796154, "loss": 0.0631, "step": 49030 }, { "epoch": 0.32, "learning_rate": 0.0002525226382336046, "loss": 0.0657, "step": 49040 }, { "epoch": 0.32, "learning_rate": 0.00025251295687924764, "loss": 0.0623, "step": 49050 }, { "epoch": 0.32, "learning_rate": 0.0002525032755248907, "loss": 0.0639, "step": 49060 }, { "epoch": 0.32, "learning_rate": 0.0002524935941705338, "loss": 0.0629, "step": 49070 }, { "epoch": 0.32, "learning_rate": 0.0002524839128161769, "loss": 0.0662, "step": 49080 }, { "epoch": 0.32, "learning_rate": 0.00025247423146181996, "loss": 0.0804, "step": 49090 }, { "epoch": 0.32, "learning_rate": 0.00025246455010746304, "loss": 0.0634, "step": 49100 }, { "epoch": 0.32, "learning_rate": 0.00025245486875310607, "loss": 0.0745, "step": 49110 }, { "epoch": 0.32, "learning_rate": 0.00025244518739874915, "loss": 0.066, "step": 49120 }, { "epoch": 0.32, "learning_rate": 0.0002524355060443922, "loss": 0.0619, "step": 49130 }, { "epoch": 0.32, "learning_rate": 0.0002524258246900353, "loss": 0.0704, "step": 49140 }, { "epoch": 0.32, "learning_rate": 0.00025241614333567833, "loss": 0.0674, "step": 49150 }, { "epoch": 0.32, "learning_rate": 0.0002524064619813214, "loss": 0.0701, "step": 49160 }, { "epoch": 0.32, "learning_rate": 0.0002523967806269645, "loss": 0.0715, "step": 49170 }, { "epoch": 0.32, "learning_rate": 0.0002523870992726075, "loss": 0.0618, "step": 49180 }, { "epoch": 0.32, "learning_rate": 0.0002523774179182506, "loss": 0.0729, "step": 49190 }, { "epoch": 0.32, "learning_rate": 0.0002523677365638937, "loss": 0.0673, "step": 49200 }, { "epoch": 0.32, "learning_rate": 0.00025235805520953676, "loss": 0.068, "step": 49210 }, { "epoch": 0.32, "learning_rate": 0.00025234837385517984, "loss": 0.0676, "step": 49220 }, { "epoch": 0.32, "learning_rate": 0.0002523386925008229, "loss": 0.0772, "step": 49230 }, { "epoch": 0.32, "learning_rate": 0.000252329011146466, "loss": 0.0683, "step": 49240 }, { "epoch": 0.32, "learning_rate": 0.000252319329792109, "loss": 0.0655, "step": 49250 }, { "epoch": 0.32, "learning_rate": 0.0002523096484377521, "loss": 0.0726, "step": 49260 }, { "epoch": 0.32, "learning_rate": 0.0002522999670833952, "loss": 0.0646, "step": 49270 }, { "epoch": 0.32, "learning_rate": 0.0002522902857290382, "loss": 0.0651, "step": 49280 }, { "epoch": 0.32, "learning_rate": 0.0002522806043746813, "loss": 0.065, "step": 49290 }, { "epoch": 0.32, "learning_rate": 0.00025227092302032437, "loss": 0.062, "step": 49300 }, { "epoch": 0.32, "learning_rate": 0.00025226124166596745, "loss": 0.0701, "step": 49310 }, { "epoch": 0.32, "learning_rate": 0.00025225156031161047, "loss": 0.0597, "step": 49320 }, { "epoch": 0.32, "learning_rate": 0.00025224187895725355, "loss": 0.0638, "step": 49330 }, { "epoch": 0.32, "learning_rate": 0.00025223219760289663, "loss": 0.0632, "step": 49340 }, { "epoch": 0.32, "learning_rate": 0.0002522225162485397, "loss": 0.0652, "step": 49350 }, { "epoch": 0.32, "learning_rate": 0.0002522128348941828, "loss": 0.0734, "step": 49360 }, { "epoch": 0.32, "learning_rate": 0.00025220315353982587, "loss": 0.0601, "step": 49370 }, { "epoch": 0.32, "learning_rate": 0.00025219347218546895, "loss": 0.0684, "step": 49380 }, { "epoch": 0.32, "learning_rate": 0.000252183790831112, "loss": 0.0769, "step": 49390 }, { "epoch": 0.32, "learning_rate": 0.00025217410947675506, "loss": 0.062, "step": 49400 }, { "epoch": 0.32, "learning_rate": 0.00025216442812239814, "loss": 0.0587, "step": 49410 }, { "epoch": 0.32, "learning_rate": 0.00025215474676804116, "loss": 0.0608, "step": 49420 }, { "epoch": 0.32, "learning_rate": 0.00025214506541368424, "loss": 0.0688, "step": 49430 }, { "epoch": 0.32, "learning_rate": 0.0002521353840593273, "loss": 0.0632, "step": 49440 }, { "epoch": 0.32, "learning_rate": 0.0002521257027049704, "loss": 0.064, "step": 49450 }, { "epoch": 0.32, "learning_rate": 0.0002521160213506134, "loss": 0.0635, "step": 49460 }, { "epoch": 0.32, "learning_rate": 0.0002521063399962565, "loss": 0.0687, "step": 49470 }, { "epoch": 0.32, "learning_rate": 0.0002520966586418996, "loss": 0.0636, "step": 49480 }, { "epoch": 0.32, "learning_rate": 0.00025208697728754267, "loss": 0.0727, "step": 49490 }, { "epoch": 0.32, "learning_rate": 0.00025207729593318575, "loss": 0.0598, "step": 49500 }, { "epoch": 0.32, "learning_rate": 0.0002520676145788288, "loss": 0.066, "step": 49510 }, { "epoch": 0.32, "learning_rate": 0.00025205793322447185, "loss": 0.0593, "step": 49520 }, { "epoch": 0.32, "learning_rate": 0.00025204825187011493, "loss": 0.0714, "step": 49530 }, { "epoch": 0.32, "learning_rate": 0.000252038570515758, "loss": 0.0651, "step": 49540 }, { "epoch": 0.32, "learning_rate": 0.00025202888916140104, "loss": 0.0601, "step": 49550 }, { "epoch": 0.32, "learning_rate": 0.0002520192078070441, "loss": 0.0562, "step": 49560 }, { "epoch": 0.32, "learning_rate": 0.0002520095264526872, "loss": 0.0702, "step": 49570 }, { "epoch": 0.32, "learning_rate": 0.0002519998450983303, "loss": 0.065, "step": 49580 }, { "epoch": 0.32, "learning_rate": 0.00025199016374397335, "loss": 0.0666, "step": 49590 }, { "epoch": 0.32, "learning_rate": 0.0002519804823896164, "loss": 0.0646, "step": 49600 }, { "epoch": 0.32, "learning_rate": 0.00025197080103525946, "loss": 0.0604, "step": 49610 }, { "epoch": 0.32, "learning_rate": 0.00025196111968090254, "loss": 0.0618, "step": 49620 }, { "epoch": 0.32, "learning_rate": 0.0002519514383265456, "loss": 0.0662, "step": 49630 }, { "epoch": 0.32, "learning_rate": 0.0002519417569721887, "loss": 0.0632, "step": 49640 }, { "epoch": 0.32, "learning_rate": 0.0002519320756178318, "loss": 0.0699, "step": 49650 }, { "epoch": 0.32, "learning_rate": 0.0002519223942634748, "loss": 0.0527, "step": 49660 }, { "epoch": 0.32, "learning_rate": 0.0002519127129091179, "loss": 0.0599, "step": 49670 }, { "epoch": 0.32, "learning_rate": 0.0002519030315547609, "loss": 0.0631, "step": 49680 }, { "epoch": 0.32, "learning_rate": 0.000251893350200404, "loss": 0.0606, "step": 49690 }, { "epoch": 0.32, "learning_rate": 0.00025188366884604707, "loss": 0.0614, "step": 49700 }, { "epoch": 0.32, "learning_rate": 0.00025187398749169015, "loss": 0.0608, "step": 49710 }, { "epoch": 0.32, "learning_rate": 0.00025186430613733323, "loss": 0.0557, "step": 49720 }, { "epoch": 0.32, "learning_rate": 0.0002518546247829763, "loss": 0.0692, "step": 49730 }, { "epoch": 0.32, "learning_rate": 0.00025184494342861933, "loss": 0.0602, "step": 49740 }, { "epoch": 0.32, "learning_rate": 0.0002518352620742624, "loss": 0.0648, "step": 49750 }, { "epoch": 0.32, "learning_rate": 0.0002518255807199055, "loss": 0.0581, "step": 49760 }, { "epoch": 0.32, "learning_rate": 0.0002518158993655486, "loss": 0.0623, "step": 49770 }, { "epoch": 0.32, "learning_rate": 0.00025180621801119165, "loss": 0.0551, "step": 49780 }, { "epoch": 0.32, "learning_rate": 0.0002517965366568347, "loss": 0.0624, "step": 49790 }, { "epoch": 0.32, "learning_rate": 0.00025178685530247776, "loss": 0.0643, "step": 49800 }, { "epoch": 0.32, "learning_rate": 0.00025177717394812084, "loss": 0.0681, "step": 49810 }, { "epoch": 0.32, "learning_rate": 0.00025176749259376386, "loss": 0.0652, "step": 49820 }, { "epoch": 0.32, "learning_rate": 0.00025175781123940694, "loss": 0.0594, "step": 49830 }, { "epoch": 0.32, "learning_rate": 0.00025174812988505, "loss": 0.0647, "step": 49840 }, { "epoch": 0.32, "learning_rate": 0.0002517384485306931, "loss": 0.0604, "step": 49850 }, { "epoch": 0.32, "learning_rate": 0.0002517287671763362, "loss": 0.0611, "step": 49860 }, { "epoch": 0.32, "learning_rate": 0.00025171908582197926, "loss": 0.0628, "step": 49870 }, { "epoch": 0.32, "learning_rate": 0.0002517094044676223, "loss": 0.059, "step": 49880 }, { "epoch": 0.32, "learning_rate": 0.00025169972311326537, "loss": 0.0569, "step": 49890 }, { "epoch": 0.32, "learning_rate": 0.00025169004175890845, "loss": 0.0595, "step": 49900 }, { "epoch": 0.32, "learning_rate": 0.00025168036040455153, "loss": 0.0629, "step": 49910 }, { "epoch": 0.32, "learning_rate": 0.00025167067905019455, "loss": 0.0659, "step": 49920 }, { "epoch": 0.32, "learning_rate": 0.00025166099769583763, "loss": 0.0661, "step": 49930 }, { "epoch": 0.32, "learning_rate": 0.0002516513163414807, "loss": 0.0669, "step": 49940 }, { "epoch": 0.32, "learning_rate": 0.00025164163498712374, "loss": 0.0602, "step": 49950 }, { "epoch": 0.32, "learning_rate": 0.0002516319536327668, "loss": 0.0668, "step": 49960 }, { "epoch": 0.32, "learning_rate": 0.0002516222722784099, "loss": 0.0655, "step": 49970 }, { "epoch": 0.32, "learning_rate": 0.000251612590924053, "loss": 0.0634, "step": 49980 }, { "epoch": 0.32, "learning_rate": 0.00025160290956969606, "loss": 0.0629, "step": 49990 }, { "epoch": 0.32, "learning_rate": 0.00025159322821533914, "loss": 0.0623, "step": 50000 }, { "epoch": 0.32, "eval_cer": 0.9200958083832336, "eval_loss": 0.043299414217472076, "eval_runtime": 120.2242, "eval_samples_per_second": 16.636, "eval_steps_per_second": 4.159, "step": 50000 }, { "epoch": 0.32, "learning_rate": 0.0002515835468609822, "loss": 0.0586, "step": 50010 }, { "epoch": 0.32, "learning_rate": 0.00025157386550662524, "loss": 0.066, "step": 50020 }, { "epoch": 0.32, "learning_rate": 0.0002515641841522683, "loss": 0.0684, "step": 50030 }, { "epoch": 0.32, "learning_rate": 0.0002515545027979114, "loss": 0.0709, "step": 50040 }, { "epoch": 0.32, "learning_rate": 0.0002515448214435545, "loss": 0.0642, "step": 50050 }, { "epoch": 0.32, "learning_rate": 0.0002515351400891975, "loss": 0.0642, "step": 50060 }, { "epoch": 0.32, "learning_rate": 0.0002515254587348406, "loss": 0.0642, "step": 50070 }, { "epoch": 0.32, "learning_rate": 0.00025151577738048367, "loss": 0.0681, "step": 50080 }, { "epoch": 0.32, "learning_rate": 0.0002515060960261267, "loss": 0.0626, "step": 50090 }, { "epoch": 0.32, "learning_rate": 0.0002514964146717698, "loss": 0.0633, "step": 50100 }, { "epoch": 0.32, "learning_rate": 0.00025148673331741285, "loss": 0.0702, "step": 50110 }, { "epoch": 0.32, "learning_rate": 0.00025147705196305593, "loss": 0.0651, "step": 50120 }, { "epoch": 0.32, "learning_rate": 0.000251467370608699, "loss": 0.063, "step": 50130 }, { "epoch": 0.32, "learning_rate": 0.0002514576892543421, "loss": 0.0668, "step": 50140 }, { "epoch": 0.32, "learning_rate": 0.00025144800789998517, "loss": 0.0661, "step": 50150 }, { "epoch": 0.32, "learning_rate": 0.0002514383265456282, "loss": 0.0735, "step": 50160 }, { "epoch": 0.32, "learning_rate": 0.0002514286451912713, "loss": 0.058, "step": 50170 }, { "epoch": 0.32, "learning_rate": 0.00025141896383691436, "loss": 0.0576, "step": 50180 }, { "epoch": 0.32, "learning_rate": 0.0002514092824825574, "loss": 0.0683, "step": 50190 }, { "epoch": 0.32, "learning_rate": 0.00025139960112820046, "loss": 0.056, "step": 50200 }, { "epoch": 0.32, "learning_rate": 0.00025138991977384354, "loss": 0.0637, "step": 50210 }, { "epoch": 0.32, "learning_rate": 0.0002513802384194866, "loss": 0.0689, "step": 50220 }, { "epoch": 0.32, "learning_rate": 0.00025137055706512965, "loss": 0.0652, "step": 50230 }, { "epoch": 0.32, "learning_rate": 0.00025136087571077273, "loss": 0.0631, "step": 50240 }, { "epoch": 0.32, "learning_rate": 0.0002513511943564158, "loss": 0.059, "step": 50250 }, { "epoch": 0.32, "learning_rate": 0.0002513415130020589, "loss": 0.0645, "step": 50260 }, { "epoch": 0.32, "learning_rate": 0.00025133183164770197, "loss": 0.0637, "step": 50270 }, { "epoch": 0.32, "learning_rate": 0.00025132215029334505, "loss": 0.0662, "step": 50280 }, { "epoch": 0.32, "learning_rate": 0.00025131246893898807, "loss": 0.0668, "step": 50290 }, { "epoch": 0.32, "learning_rate": 0.00025130278758463115, "loss": 0.0601, "step": 50300 }, { "epoch": 0.32, "learning_rate": 0.00025129310623027423, "loss": 0.0634, "step": 50310 }, { "epoch": 0.32, "learning_rate": 0.00025128342487591726, "loss": 0.0582, "step": 50320 }, { "epoch": 0.32, "learning_rate": 0.00025127374352156034, "loss": 0.0703, "step": 50330 }, { "epoch": 0.32, "learning_rate": 0.0002512640621672034, "loss": 0.061, "step": 50340 }, { "epoch": 0.32, "learning_rate": 0.0002512543808128465, "loss": 0.0616, "step": 50350 }, { "epoch": 0.33, "learning_rate": 0.0002512446994584896, "loss": 0.0611, "step": 50360 }, { "epoch": 0.33, "learning_rate": 0.0002512350181041326, "loss": 0.0572, "step": 50370 }, { "epoch": 0.33, "learning_rate": 0.0002512253367497757, "loss": 0.0607, "step": 50380 }, { "epoch": 0.33, "learning_rate": 0.00025121565539541876, "loss": 0.0632, "step": 50390 }, { "epoch": 0.33, "learning_rate": 0.00025120597404106184, "loss": 0.0669, "step": 50400 }, { "epoch": 0.33, "learning_rate": 0.0002511962926867049, "loss": 0.0575, "step": 50410 }, { "epoch": 0.33, "learning_rate": 0.000251186611332348, "loss": 0.0697, "step": 50420 }, { "epoch": 0.33, "learning_rate": 0.00025117692997799103, "loss": 0.0564, "step": 50430 }, { "epoch": 0.33, "learning_rate": 0.0002511672486236341, "loss": 0.0661, "step": 50440 }, { "epoch": 0.33, "learning_rate": 0.0002511575672692772, "loss": 0.0575, "step": 50450 }, { "epoch": 0.33, "learning_rate": 0.0002511478859149202, "loss": 0.0548, "step": 50460 }, { "epoch": 0.33, "learning_rate": 0.0002511382045605633, "loss": 0.0705, "step": 50470 }, { "epoch": 0.33, "learning_rate": 0.00025112852320620637, "loss": 0.0636, "step": 50480 }, { "epoch": 0.33, "learning_rate": 0.00025111884185184945, "loss": 0.065, "step": 50490 }, { "epoch": 0.33, "learning_rate": 0.00025110916049749253, "loss": 0.0564, "step": 50500 }, { "epoch": 0.33, "learning_rate": 0.00025109947914313556, "loss": 0.068, "step": 50510 }, { "epoch": 0.33, "learning_rate": 0.00025108979778877864, "loss": 0.0638, "step": 50520 }, { "epoch": 0.33, "learning_rate": 0.0002510801164344217, "loss": 0.0649, "step": 50530 }, { "epoch": 0.33, "learning_rate": 0.0002510704350800648, "loss": 0.059, "step": 50540 }, { "epoch": 0.33, "learning_rate": 0.0002510607537257079, "loss": 0.0582, "step": 50550 }, { "epoch": 0.33, "learning_rate": 0.0002510510723713509, "loss": 0.0571, "step": 50560 }, { "epoch": 0.33, "learning_rate": 0.000251041391016994, "loss": 0.0545, "step": 50570 }, { "epoch": 0.33, "learning_rate": 0.00025103170966263706, "loss": 0.0661, "step": 50580 }, { "epoch": 0.33, "learning_rate": 0.0002510220283082801, "loss": 0.0638, "step": 50590 }, { "epoch": 0.33, "learning_rate": 0.00025101234695392317, "loss": 0.056, "step": 50600 }, { "epoch": 0.33, "learning_rate": 0.00025100266559956625, "loss": 0.0667, "step": 50610 }, { "epoch": 0.33, "learning_rate": 0.0002509929842452093, "loss": 0.0644, "step": 50620 }, { "epoch": 0.33, "learning_rate": 0.0002509833028908524, "loss": 0.0611, "step": 50630 }, { "epoch": 0.33, "learning_rate": 0.0002509736215364955, "loss": 0.061, "step": 50640 }, { "epoch": 0.33, "learning_rate": 0.0002509639401821385, "loss": 0.0659, "step": 50650 }, { "epoch": 0.33, "learning_rate": 0.0002509542588277816, "loss": 0.0656, "step": 50660 }, { "epoch": 0.33, "learning_rate": 0.00025094457747342467, "loss": 0.0627, "step": 50670 }, { "epoch": 0.33, "learning_rate": 0.00025093489611906775, "loss": 0.062, "step": 50680 }, { "epoch": 0.33, "learning_rate": 0.0002509252147647108, "loss": 0.0613, "step": 50690 }, { "epoch": 0.33, "learning_rate": 0.00025091553341035386, "loss": 0.065, "step": 50700 }, { "epoch": 0.33, "learning_rate": 0.00025090585205599694, "loss": 0.0651, "step": 50710 }, { "epoch": 0.33, "learning_rate": 0.00025089617070163996, "loss": 0.0655, "step": 50720 }, { "epoch": 0.33, "learning_rate": 0.00025088648934728304, "loss": 0.0596, "step": 50730 }, { "epoch": 0.33, "learning_rate": 0.0002508768079929261, "loss": 0.0735, "step": 50740 }, { "epoch": 0.33, "learning_rate": 0.0002508671266385692, "loss": 0.0616, "step": 50750 }, { "epoch": 0.33, "learning_rate": 0.0002508574452842123, "loss": 0.0613, "step": 50760 }, { "epoch": 0.33, "learning_rate": 0.00025084776392985536, "loss": 0.0579, "step": 50770 }, { "epoch": 0.33, "learning_rate": 0.00025083808257549844, "loss": 0.0551, "step": 50780 }, { "epoch": 0.33, "learning_rate": 0.00025082840122114147, "loss": 0.0683, "step": 50790 }, { "epoch": 0.33, "learning_rate": 0.00025081871986678455, "loss": 0.0612, "step": 50800 }, { "epoch": 0.33, "learning_rate": 0.0002508090385124276, "loss": 0.0648, "step": 50810 }, { "epoch": 0.33, "learning_rate": 0.0002507993571580707, "loss": 0.0672, "step": 50820 }, { "epoch": 0.33, "learning_rate": 0.00025078967580371373, "loss": 0.0621, "step": 50830 }, { "epoch": 0.33, "learning_rate": 0.0002507799944493568, "loss": 0.0627, "step": 50840 }, { "epoch": 0.33, "learning_rate": 0.0002507703130949999, "loss": 0.0631, "step": 50850 }, { "epoch": 0.33, "learning_rate": 0.0002507606317406429, "loss": 0.0646, "step": 50860 }, { "epoch": 0.33, "learning_rate": 0.000250750950386286, "loss": 0.057, "step": 50870 }, { "epoch": 0.33, "learning_rate": 0.0002507412690319291, "loss": 0.0646, "step": 50880 }, { "epoch": 0.33, "learning_rate": 0.00025073158767757216, "loss": 0.0665, "step": 50890 }, { "epoch": 0.33, "learning_rate": 0.00025072190632321524, "loss": 0.0632, "step": 50900 }, { "epoch": 0.33, "learning_rate": 0.0002507122249688583, "loss": 0.0647, "step": 50910 }, { "epoch": 0.33, "learning_rate": 0.0002507025436145014, "loss": 0.0592, "step": 50920 }, { "epoch": 0.33, "learning_rate": 0.0002506928622601444, "loss": 0.0751, "step": 50930 }, { "epoch": 0.33, "learning_rate": 0.0002506831809057875, "loss": 0.0639, "step": 50940 }, { "epoch": 0.33, "learning_rate": 0.0002506734995514306, "loss": 0.0594, "step": 50950 }, { "epoch": 0.33, "learning_rate": 0.0002506638181970736, "loss": 0.0649, "step": 50960 }, { "epoch": 0.33, "learning_rate": 0.0002506541368427167, "loss": 0.0653, "step": 50970 }, { "epoch": 0.33, "learning_rate": 0.00025064445548835977, "loss": 0.0619, "step": 50980 }, { "epoch": 0.33, "learning_rate": 0.00025063477413400285, "loss": 0.0611, "step": 50990 }, { "epoch": 0.33, "learning_rate": 0.00025062509277964587, "loss": 0.074, "step": 51000 }, { "epoch": 0.33, "eval_cer": 0.9201572703649306, "eval_loss": 0.04186994954943657, "eval_runtime": 120.029, "eval_samples_per_second": 16.663, "eval_steps_per_second": 4.166, "step": 51000 }, { "epoch": 0.33, "learning_rate": 0.00025061541142528895, "loss": 0.0675, "step": 51010 }, { "epoch": 0.33, "learning_rate": 0.00025060573007093203, "loss": 0.0638, "step": 51020 }, { "epoch": 0.33, "learning_rate": 0.0002505960487165751, "loss": 0.0624, "step": 51030 }, { "epoch": 0.33, "learning_rate": 0.0002505863673622182, "loss": 0.065, "step": 51040 }, { "epoch": 0.33, "learning_rate": 0.00025057668600786127, "loss": 0.0603, "step": 51050 }, { "epoch": 0.33, "learning_rate": 0.0002505670046535043, "loss": 0.059, "step": 51060 }, { "epoch": 0.33, "learning_rate": 0.0002505573232991474, "loss": 0.0636, "step": 51070 }, { "epoch": 0.33, "learning_rate": 0.00025054764194479045, "loss": 0.06, "step": 51080 }, { "epoch": 0.33, "learning_rate": 0.0002505379605904335, "loss": 0.0596, "step": 51090 }, { "epoch": 0.33, "learning_rate": 0.00025052827923607656, "loss": 0.0594, "step": 51100 }, { "epoch": 0.33, "learning_rate": 0.00025051859788171964, "loss": 0.0575, "step": 51110 }, { "epoch": 0.33, "learning_rate": 0.0002505089165273627, "loss": 0.0663, "step": 51120 }, { "epoch": 0.33, "learning_rate": 0.0002504992351730058, "loss": 0.0614, "step": 51130 }, { "epoch": 0.33, "learning_rate": 0.0002504895538186488, "loss": 0.0693, "step": 51140 }, { "epoch": 0.33, "learning_rate": 0.0002504798724642919, "loss": 0.0624, "step": 51150 }, { "epoch": 0.33, "learning_rate": 0.000250470191109935, "loss": 0.0651, "step": 51160 }, { "epoch": 0.33, "learning_rate": 0.00025046050975557806, "loss": 0.0582, "step": 51170 }, { "epoch": 0.33, "learning_rate": 0.00025045082840122114, "loss": 0.0652, "step": 51180 }, { "epoch": 0.33, "learning_rate": 0.0002504411470468642, "loss": 0.0625, "step": 51190 }, { "epoch": 0.33, "learning_rate": 0.00025043146569250725, "loss": 0.0611, "step": 51200 }, { "epoch": 0.33, "learning_rate": 0.00025042178433815033, "loss": 0.0564, "step": 51210 }, { "epoch": 0.33, "learning_rate": 0.0002504121029837934, "loss": 0.0596, "step": 51220 }, { "epoch": 0.33, "learning_rate": 0.00025040242162943643, "loss": 0.0715, "step": 51230 }, { "epoch": 0.33, "learning_rate": 0.0002503927402750795, "loss": 0.0616, "step": 51240 }, { "epoch": 0.33, "learning_rate": 0.0002503830589207226, "loss": 0.0692, "step": 51250 }, { "epoch": 0.33, "learning_rate": 0.0002503733775663657, "loss": 0.0689, "step": 51260 }, { "epoch": 0.33, "learning_rate": 0.00025036369621200875, "loss": 0.0568, "step": 51270 }, { "epoch": 0.33, "learning_rate": 0.0002503540148576518, "loss": 0.0659, "step": 51280 }, { "epoch": 0.33, "learning_rate": 0.00025034433350329486, "loss": 0.0706, "step": 51290 }, { "epoch": 0.33, "learning_rate": 0.00025033465214893794, "loss": 0.0621, "step": 51300 }, { "epoch": 0.33, "learning_rate": 0.000250324970794581, "loss": 0.0577, "step": 51310 }, { "epoch": 0.33, "learning_rate": 0.0002503152894402241, "loss": 0.0581, "step": 51320 }, { "epoch": 0.33, "learning_rate": 0.0002503056080858671, "loss": 0.0585, "step": 51330 }, { "epoch": 0.33, "learning_rate": 0.0002502959267315102, "loss": 0.0574, "step": 51340 }, { "epoch": 0.33, "learning_rate": 0.0002502862453771533, "loss": 0.0698, "step": 51350 }, { "epoch": 0.33, "learning_rate": 0.0002502765640227963, "loss": 0.0624, "step": 51360 }, { "epoch": 0.33, "learning_rate": 0.0002502668826684394, "loss": 0.0607, "step": 51370 }, { "epoch": 0.33, "learning_rate": 0.00025025720131408247, "loss": 0.0629, "step": 51380 }, { "epoch": 0.33, "learning_rate": 0.00025024751995972555, "loss": 0.0582, "step": 51390 }, { "epoch": 0.33, "learning_rate": 0.00025023783860536863, "loss": 0.0712, "step": 51400 }, { "epoch": 0.33, "learning_rate": 0.0002502281572510117, "loss": 0.0763, "step": 51410 }, { "epoch": 0.33, "learning_rate": 0.00025021847589665473, "loss": 0.063, "step": 51420 }, { "epoch": 0.33, "learning_rate": 0.0002502087945422978, "loss": 0.0688, "step": 51430 }, { "epoch": 0.33, "learning_rate": 0.0002501991131879409, "loss": 0.062, "step": 51440 }, { "epoch": 0.33, "learning_rate": 0.000250189431833584, "loss": 0.0583, "step": 51450 }, { "epoch": 0.33, "learning_rate": 0.000250179750479227, "loss": 0.0603, "step": 51460 }, { "epoch": 0.33, "learning_rate": 0.0002501700691248701, "loss": 0.0642, "step": 51470 }, { "epoch": 0.33, "learning_rate": 0.00025016038777051316, "loss": 0.0559, "step": 51480 }, { "epoch": 0.33, "learning_rate": 0.0002501507064161562, "loss": 0.0589, "step": 51490 }, { "epoch": 0.33, "learning_rate": 0.00025014102506179926, "loss": 0.0579, "step": 51500 }, { "epoch": 0.33, "learning_rate": 0.00025013134370744234, "loss": 0.07, "step": 51510 }, { "epoch": 0.33, "learning_rate": 0.0002501216623530854, "loss": 0.0624, "step": 51520 }, { "epoch": 0.33, "learning_rate": 0.0002501119809987285, "loss": 0.0623, "step": 51530 }, { "epoch": 0.33, "learning_rate": 0.0002501022996443716, "loss": 0.0615, "step": 51540 }, { "epoch": 0.33, "learning_rate": 0.00025009261829001466, "loss": 0.0666, "step": 51550 }, { "epoch": 0.33, "learning_rate": 0.0002500829369356577, "loss": 0.0566, "step": 51560 }, { "epoch": 0.33, "learning_rate": 0.00025007325558130077, "loss": 0.0629, "step": 51570 }, { "epoch": 0.33, "learning_rate": 0.00025006357422694385, "loss": 0.0574, "step": 51580 }, { "epoch": 0.33, "learning_rate": 0.00025005389287258693, "loss": 0.0648, "step": 51590 }, { "epoch": 0.33, "learning_rate": 0.00025004421151822995, "loss": 0.0571, "step": 51600 }, { "epoch": 0.33, "learning_rate": 0.00025003453016387303, "loss": 0.0684, "step": 51610 }, { "epoch": 0.33, "learning_rate": 0.0002500248488095161, "loss": 0.0597, "step": 51620 }, { "epoch": 0.33, "learning_rate": 0.00025001516745515914, "loss": 0.058, "step": 51630 }, { "epoch": 0.33, "learning_rate": 0.0002500054861008022, "loss": 0.0705, "step": 51640 }, { "epoch": 0.33, "learning_rate": 0.0002499958047464453, "loss": 0.0575, "step": 51650 }, { "epoch": 0.33, "learning_rate": 0.0002499861233920884, "loss": 0.0678, "step": 51660 }, { "epoch": 0.33, "learning_rate": 0.00024997644203773146, "loss": 0.0749, "step": 51670 }, { "epoch": 0.33, "learning_rate": 0.00024996676068337454, "loss": 0.0607, "step": 51680 }, { "epoch": 0.33, "learning_rate": 0.00024995707932901756, "loss": 0.0674, "step": 51690 }, { "epoch": 0.33, "learning_rate": 0.00024994739797466064, "loss": 0.0631, "step": 51700 }, { "epoch": 0.33, "learning_rate": 0.0002499377166203037, "loss": 0.0595, "step": 51710 }, { "epoch": 0.33, "learning_rate": 0.0002499280352659468, "loss": 0.0622, "step": 51720 }, { "epoch": 0.33, "learning_rate": 0.00024991835391158983, "loss": 0.0632, "step": 51730 }, { "epoch": 0.33, "learning_rate": 0.0002499086725572329, "loss": 0.0603, "step": 51740 }, { "epoch": 0.33, "learning_rate": 0.000249898991202876, "loss": 0.065, "step": 51750 }, { "epoch": 0.33, "learning_rate": 0.000249889309848519, "loss": 0.0608, "step": 51760 }, { "epoch": 0.33, "learning_rate": 0.0002498796284941621, "loss": 0.0613, "step": 51770 }, { "epoch": 0.33, "learning_rate": 0.00024986994713980517, "loss": 0.0627, "step": 51780 }, { "epoch": 0.33, "learning_rate": 0.00024986026578544825, "loss": 0.0622, "step": 51790 }, { "epoch": 0.33, "learning_rate": 0.00024985058443109133, "loss": 0.07, "step": 51800 }, { "epoch": 0.33, "learning_rate": 0.0002498409030767344, "loss": 0.0534, "step": 51810 }, { "epoch": 0.33, "learning_rate": 0.0002498312217223775, "loss": 0.0588, "step": 51820 }, { "epoch": 0.33, "learning_rate": 0.0002498215403680205, "loss": 0.0647, "step": 51830 }, { "epoch": 0.33, "learning_rate": 0.0002498118590136636, "loss": 0.0699, "step": 51840 }, { "epoch": 0.33, "learning_rate": 0.0002498021776593067, "loss": 0.0678, "step": 51850 }, { "epoch": 0.33, "learning_rate": 0.0002497924963049497, "loss": 0.0578, "step": 51860 }, { "epoch": 0.33, "learning_rate": 0.0002497828149505928, "loss": 0.0592, "step": 51870 }, { "epoch": 0.33, "learning_rate": 0.00024977313359623586, "loss": 0.0738, "step": 51880 }, { "epoch": 0.33, "learning_rate": 0.00024976345224187894, "loss": 0.0621, "step": 51890 }, { "epoch": 0.33, "learning_rate": 0.00024975377088752197, "loss": 0.0603, "step": 51900 }, { "epoch": 0.34, "learning_rate": 0.00024974408953316505, "loss": 0.0614, "step": 51910 }, { "epoch": 0.34, "learning_rate": 0.00024973440817880813, "loss": 0.0588, "step": 51920 }, { "epoch": 0.34, "learning_rate": 0.0002497247268244512, "loss": 0.0674, "step": 51930 }, { "epoch": 0.34, "learning_rate": 0.0002497150454700943, "loss": 0.0591, "step": 51940 }, { "epoch": 0.34, "learning_rate": 0.00024970536411573737, "loss": 0.0638, "step": 51950 }, { "epoch": 0.34, "learning_rate": 0.00024969568276138045, "loss": 0.0645, "step": 51960 }, { "epoch": 0.34, "learning_rate": 0.00024968600140702347, "loss": 0.0638, "step": 51970 }, { "epoch": 0.34, "learning_rate": 0.00024967632005266655, "loss": 0.0657, "step": 51980 }, { "epoch": 0.34, "learning_rate": 0.00024966663869830963, "loss": 0.0654, "step": 51990 }, { "epoch": 0.34, "learning_rate": 0.00024965695734395266, "loss": 0.0602, "step": 52000 }, { "epoch": 0.34, "eval_cer": 0.9201572703649306, "eval_loss": 0.040952201932668686, "eval_runtime": 120.0447, "eval_samples_per_second": 16.66, "eval_steps_per_second": 4.165, "step": 52000 }, { "epoch": 0.34, "learning_rate": 0.00024964727598959574, "loss": 0.0582, "step": 52010 }, { "epoch": 0.34, "learning_rate": 0.0002496375946352388, "loss": 0.0636, "step": 52020 }, { "epoch": 0.34, "learning_rate": 0.0002496279132808819, "loss": 0.0618, "step": 52030 }, { "epoch": 0.34, "learning_rate": 0.0002496182319265249, "loss": 0.0594, "step": 52040 }, { "epoch": 0.34, "learning_rate": 0.000249608550572168, "loss": 0.0545, "step": 52050 }, { "epoch": 0.34, "learning_rate": 0.0002495988692178111, "loss": 0.0647, "step": 52060 }, { "epoch": 0.34, "learning_rate": 0.00024958918786345416, "loss": 0.0549, "step": 52070 }, { "epoch": 0.34, "learning_rate": 0.00024957950650909724, "loss": 0.0639, "step": 52080 }, { "epoch": 0.34, "learning_rate": 0.0002495698251547403, "loss": 0.0636, "step": 52090 }, { "epoch": 0.34, "learning_rate": 0.00024956014380038335, "loss": 0.0581, "step": 52100 }, { "epoch": 0.34, "learning_rate": 0.0002495504624460264, "loss": 0.0681, "step": 52110 }, { "epoch": 0.34, "learning_rate": 0.0002495407810916695, "loss": 0.059, "step": 52120 }, { "epoch": 0.34, "learning_rate": 0.00024953109973731253, "loss": 0.0626, "step": 52130 }, { "epoch": 0.34, "learning_rate": 0.0002495214183829556, "loss": 0.0619, "step": 52140 }, { "epoch": 0.34, "learning_rate": 0.0002495117370285987, "loss": 0.0641, "step": 52150 }, { "epoch": 0.34, "learning_rate": 0.00024950205567424177, "loss": 0.0691, "step": 52160 }, { "epoch": 0.34, "learning_rate": 0.00024949237431988485, "loss": 0.0593, "step": 52170 }, { "epoch": 0.34, "learning_rate": 0.0002494826929655279, "loss": 0.0672, "step": 52180 }, { "epoch": 0.34, "learning_rate": 0.00024947301161117096, "loss": 0.0692, "step": 52190 }, { "epoch": 0.34, "learning_rate": 0.00024946333025681404, "loss": 0.0603, "step": 52200 }, { "epoch": 0.34, "learning_rate": 0.0002494536489024571, "loss": 0.0603, "step": 52210 }, { "epoch": 0.34, "learning_rate": 0.0002494439675481002, "loss": 0.067, "step": 52220 }, { "epoch": 0.34, "learning_rate": 0.0002494342861937433, "loss": 0.0678, "step": 52230 }, { "epoch": 0.34, "learning_rate": 0.0002494246048393863, "loss": 0.0654, "step": 52240 }, { "epoch": 0.34, "learning_rate": 0.0002494149234850294, "loss": 0.0684, "step": 52250 }, { "epoch": 0.34, "learning_rate": 0.0002494052421306724, "loss": 0.0568, "step": 52260 }, { "epoch": 0.34, "learning_rate": 0.0002493955607763155, "loss": 0.0671, "step": 52270 }, { "epoch": 0.34, "learning_rate": 0.00024938587942195857, "loss": 0.0662, "step": 52280 }, { "epoch": 0.34, "learning_rate": 0.00024937619806760165, "loss": 0.0617, "step": 52290 }, { "epoch": 0.34, "learning_rate": 0.0002493665167132447, "loss": 0.0585, "step": 52300 }, { "epoch": 0.34, "learning_rate": 0.0002493568353588878, "loss": 0.068, "step": 52310 }, { "epoch": 0.34, "learning_rate": 0.00024934715400453083, "loss": 0.0613, "step": 52320 }, { "epoch": 0.34, "learning_rate": 0.0002493374726501739, "loss": 0.0667, "step": 52330 }, { "epoch": 0.34, "learning_rate": 0.000249327791295817, "loss": 0.0623, "step": 52340 }, { "epoch": 0.34, "learning_rate": 0.00024931810994146007, "loss": 0.0634, "step": 52350 }, { "epoch": 0.34, "learning_rate": 0.00024930842858710315, "loss": 0.0579, "step": 52360 }, { "epoch": 0.34, "learning_rate": 0.0002492987472327462, "loss": 0.0732, "step": 52370 }, { "epoch": 0.34, "learning_rate": 0.00024928906587838926, "loss": 0.0671, "step": 52380 }, { "epoch": 0.34, "learning_rate": 0.00024927938452403234, "loss": 0.0605, "step": 52390 }, { "epoch": 0.34, "learning_rate": 0.00024926970316967536, "loss": 0.075, "step": 52400 }, { "epoch": 0.34, "learning_rate": 0.00024926002181531844, "loss": 0.0734, "step": 52410 }, { "epoch": 0.34, "learning_rate": 0.0002492503404609615, "loss": 0.0573, "step": 52420 }, { "epoch": 0.34, "learning_rate": 0.0002492406591066046, "loss": 0.0726, "step": 52430 }, { "epoch": 0.34, "learning_rate": 0.0002492309777522477, "loss": 0.0688, "step": 52440 }, { "epoch": 0.34, "learning_rate": 0.00024922129639789076, "loss": 0.0613, "step": 52450 }, { "epoch": 0.34, "learning_rate": 0.0002492116150435338, "loss": 0.0611, "step": 52460 }, { "epoch": 0.34, "learning_rate": 0.00024920193368917687, "loss": 0.0659, "step": 52470 }, { "epoch": 0.34, "learning_rate": 0.00024919225233481995, "loss": 0.0575, "step": 52480 }, { "epoch": 0.34, "learning_rate": 0.000249182570980463, "loss": 0.0661, "step": 52490 }, { "epoch": 0.34, "learning_rate": 0.00024917288962610605, "loss": 0.0612, "step": 52500 }, { "epoch": 0.34, "learning_rate": 0.00024916320827174913, "loss": 0.0628, "step": 52510 }, { "epoch": 0.34, "learning_rate": 0.0002491535269173922, "loss": 0.0585, "step": 52520 }, { "epoch": 0.34, "learning_rate": 0.00024914384556303524, "loss": 0.057, "step": 52530 }, { "epoch": 0.34, "learning_rate": 0.0002491341642086783, "loss": 0.06, "step": 52540 }, { "epoch": 0.34, "learning_rate": 0.0002491244828543214, "loss": 0.0564, "step": 52550 }, { "epoch": 0.34, "learning_rate": 0.0002491148014999645, "loss": 0.0609, "step": 52560 }, { "epoch": 0.34, "learning_rate": 0.00024910512014560755, "loss": 0.0643, "step": 52570 }, { "epoch": 0.34, "learning_rate": 0.00024909543879125063, "loss": 0.0581, "step": 52580 }, { "epoch": 0.34, "learning_rate": 0.0002490857574368937, "loss": 0.0524, "step": 52590 }, { "epoch": 0.34, "learning_rate": 0.00024907607608253674, "loss": 0.0565, "step": 52600 }, { "epoch": 0.34, "learning_rate": 0.0002490663947281798, "loss": 0.0687, "step": 52610 }, { "epoch": 0.34, "learning_rate": 0.0002490567133738229, "loss": 0.0582, "step": 52620 }, { "epoch": 0.34, "learning_rate": 0.000249047032019466, "loss": 0.0578, "step": 52630 }, { "epoch": 0.34, "learning_rate": 0.000249037350665109, "loss": 0.0788, "step": 52640 }, { "epoch": 0.34, "learning_rate": 0.0002490276693107521, "loss": 0.063, "step": 52650 }, { "epoch": 0.34, "learning_rate": 0.00024901798795639516, "loss": 0.068, "step": 52660 }, { "epoch": 0.34, "learning_rate": 0.0002490083066020382, "loss": 0.0653, "step": 52670 }, { "epoch": 0.34, "learning_rate": 0.00024899862524768127, "loss": 0.0631, "step": 52680 }, { "epoch": 0.34, "learning_rate": 0.00024898894389332435, "loss": 0.0571, "step": 52690 }, { "epoch": 0.34, "learning_rate": 0.00024897926253896743, "loss": 0.0595, "step": 52700 }, { "epoch": 0.34, "learning_rate": 0.0002489695811846105, "loss": 0.0592, "step": 52710 }, { "epoch": 0.34, "learning_rate": 0.0002489598998302536, "loss": 0.06, "step": 52720 }, { "epoch": 0.34, "learning_rate": 0.00024895021847589667, "loss": 0.0586, "step": 52730 }, { "epoch": 0.34, "learning_rate": 0.0002489405371215397, "loss": 0.0651, "step": 52740 }, { "epoch": 0.34, "learning_rate": 0.0002489308557671828, "loss": 0.0694, "step": 52750 }, { "epoch": 0.34, "learning_rate": 0.00024892117441282585, "loss": 0.0581, "step": 52760 }, { "epoch": 0.34, "learning_rate": 0.0002489114930584689, "loss": 0.0562, "step": 52770 }, { "epoch": 0.34, "learning_rate": 0.00024890181170411196, "loss": 0.0589, "step": 52780 }, { "epoch": 0.34, "learning_rate": 0.00024889213034975504, "loss": 0.0569, "step": 52790 }, { "epoch": 0.34, "learning_rate": 0.0002488824489953981, "loss": 0.0637, "step": 52800 }, { "epoch": 0.34, "learning_rate": 0.00024887276764104114, "loss": 0.0654, "step": 52810 }, { "epoch": 0.34, "learning_rate": 0.0002488630862866842, "loss": 0.065, "step": 52820 }, { "epoch": 0.34, "learning_rate": 0.0002488534049323273, "loss": 0.0582, "step": 52830 }, { "epoch": 0.34, "learning_rate": 0.0002488437235779704, "loss": 0.0569, "step": 52840 }, { "epoch": 0.34, "learning_rate": 0.00024883404222361346, "loss": 0.0593, "step": 52850 }, { "epoch": 0.34, "learning_rate": 0.00024882436086925654, "loss": 0.0559, "step": 52860 }, { "epoch": 0.34, "learning_rate": 0.00024881467951489957, "loss": 0.0614, "step": 52870 }, { "epoch": 0.34, "learning_rate": 0.00024880499816054265, "loss": 0.0683, "step": 52880 }, { "epoch": 0.34, "learning_rate": 0.00024879531680618573, "loss": 0.0662, "step": 52890 }, { "epoch": 0.34, "learning_rate": 0.00024878563545182875, "loss": 0.0639, "step": 52900 }, { "epoch": 0.34, "learning_rate": 0.00024877595409747183, "loss": 0.0541, "step": 52910 }, { "epoch": 0.34, "learning_rate": 0.0002487662727431149, "loss": 0.0611, "step": 52920 }, { "epoch": 0.34, "learning_rate": 0.000248756591388758, "loss": 0.059, "step": 52930 }, { "epoch": 0.34, "learning_rate": 0.0002487469100344011, "loss": 0.0683, "step": 52940 }, { "epoch": 0.34, "learning_rate": 0.0002487372286800441, "loss": 0.053, "step": 52950 }, { "epoch": 0.34, "learning_rate": 0.0002487275473256872, "loss": 0.0587, "step": 52960 }, { "epoch": 0.34, "learning_rate": 0.00024871786597133026, "loss": 0.0614, "step": 52970 }, { "epoch": 0.34, "learning_rate": 0.00024870818461697334, "loss": 0.0611, "step": 52980 }, { "epoch": 0.34, "learning_rate": 0.0002486985032626164, "loss": 0.0595, "step": 52990 }, { "epoch": 0.34, "learning_rate": 0.0002486888219082595, "loss": 0.0672, "step": 53000 }, { "epoch": 0.34, "eval_cer": 0.9201590780702745, "eval_loss": 0.041813936084508896, "eval_runtime": 120.1824, "eval_samples_per_second": 16.641, "eval_steps_per_second": 4.16, "step": 53000 }, { "epoch": 0.34, "learning_rate": 0.0002486791405539025, "loss": 0.0609, "step": 53010 }, { "epoch": 0.34, "learning_rate": 0.0002486694591995456, "loss": 0.0576, "step": 53020 }, { "epoch": 0.34, "learning_rate": 0.0002486597778451887, "loss": 0.0647, "step": 53030 }, { "epoch": 0.34, "learning_rate": 0.0002486500964908317, "loss": 0.0553, "step": 53040 }, { "epoch": 0.34, "learning_rate": 0.0002486404151364748, "loss": 0.0677, "step": 53050 }, { "epoch": 0.34, "learning_rate": 0.00024863073378211787, "loss": 0.0665, "step": 53060 }, { "epoch": 0.34, "learning_rate": 0.00024862105242776095, "loss": 0.0554, "step": 53070 }, { "epoch": 0.34, "learning_rate": 0.00024861137107340403, "loss": 0.0621, "step": 53080 }, { "epoch": 0.34, "learning_rate": 0.00024860168971904705, "loss": 0.0654, "step": 53090 }, { "epoch": 0.34, "learning_rate": 0.00024859200836469013, "loss": 0.0627, "step": 53100 }, { "epoch": 0.34, "learning_rate": 0.0002485823270103332, "loss": 0.0671, "step": 53110 }, { "epoch": 0.34, "learning_rate": 0.0002485726456559763, "loss": 0.0691, "step": 53120 }, { "epoch": 0.34, "learning_rate": 0.00024856296430161937, "loss": 0.06, "step": 53130 }, { "epoch": 0.34, "learning_rate": 0.0002485532829472624, "loss": 0.0622, "step": 53140 }, { "epoch": 0.34, "learning_rate": 0.0002485436015929055, "loss": 0.0616, "step": 53150 }, { "epoch": 0.34, "learning_rate": 0.00024853392023854856, "loss": 0.0606, "step": 53160 }, { "epoch": 0.34, "learning_rate": 0.0002485242388841916, "loss": 0.0595, "step": 53170 }, { "epoch": 0.34, "learning_rate": 0.00024851455752983466, "loss": 0.0599, "step": 53180 }, { "epoch": 0.34, "learning_rate": 0.00024850487617547774, "loss": 0.0713, "step": 53190 }, { "epoch": 0.34, "learning_rate": 0.0002484951948211208, "loss": 0.0687, "step": 53200 }, { "epoch": 0.34, "learning_rate": 0.0002484855134667639, "loss": 0.0619, "step": 53210 }, { "epoch": 0.34, "learning_rate": 0.000248475832112407, "loss": 0.0604, "step": 53220 }, { "epoch": 0.34, "learning_rate": 0.00024846615075805, "loss": 0.0609, "step": 53230 }, { "epoch": 0.34, "learning_rate": 0.0002484564694036931, "loss": 0.0579, "step": 53240 }, { "epoch": 0.34, "learning_rate": 0.00024844678804933617, "loss": 0.0616, "step": 53250 }, { "epoch": 0.34, "learning_rate": 0.00024843710669497925, "loss": 0.063, "step": 53260 }, { "epoch": 0.34, "learning_rate": 0.0002484274253406223, "loss": 0.0532, "step": 53270 }, { "epoch": 0.34, "learning_rate": 0.00024841774398626535, "loss": 0.0561, "step": 53280 }, { "epoch": 0.34, "learning_rate": 0.00024840806263190843, "loss": 0.0582, "step": 53290 }, { "epoch": 0.34, "learning_rate": 0.00024839838127755146, "loss": 0.0715, "step": 53300 }, { "epoch": 0.34, "learning_rate": 0.00024838869992319454, "loss": 0.0604, "step": 53310 }, { "epoch": 0.34, "learning_rate": 0.0002483790185688376, "loss": 0.063, "step": 53320 }, { "epoch": 0.34, "learning_rate": 0.0002483693372144807, "loss": 0.0607, "step": 53330 }, { "epoch": 0.34, "learning_rate": 0.0002483596558601238, "loss": 0.0637, "step": 53340 }, { "epoch": 0.34, "learning_rate": 0.00024834997450576686, "loss": 0.0576, "step": 53350 }, { "epoch": 0.34, "learning_rate": 0.00024834029315140994, "loss": 0.0593, "step": 53360 }, { "epoch": 0.34, "learning_rate": 0.00024833061179705296, "loss": 0.057, "step": 53370 }, { "epoch": 0.34, "learning_rate": 0.00024832093044269604, "loss": 0.0639, "step": 53380 }, { "epoch": 0.34, "learning_rate": 0.0002483112490883391, "loss": 0.0597, "step": 53390 }, { "epoch": 0.34, "learning_rate": 0.0002483015677339822, "loss": 0.0599, "step": 53400 }, { "epoch": 0.34, "learning_rate": 0.00024829188637962523, "loss": 0.0676, "step": 53410 }, { "epoch": 0.34, "learning_rate": 0.0002482822050252683, "loss": 0.0592, "step": 53420 }, { "epoch": 0.34, "learning_rate": 0.0002482725236709114, "loss": 0.0688, "step": 53430 }, { "epoch": 0.34, "learning_rate": 0.0002482628423165544, "loss": 0.0701, "step": 53440 }, { "epoch": 0.34, "learning_rate": 0.0002482531609621975, "loss": 0.0662, "step": 53450 }, { "epoch": 0.35, "learning_rate": 0.00024824347960784057, "loss": 0.0562, "step": 53460 }, { "epoch": 0.35, "learning_rate": 0.00024823379825348365, "loss": 0.0546, "step": 53470 }, { "epoch": 0.35, "learning_rate": 0.00024822411689912673, "loss": 0.0614, "step": 53480 }, { "epoch": 0.35, "learning_rate": 0.0002482144355447698, "loss": 0.0595, "step": 53490 }, { "epoch": 0.35, "learning_rate": 0.0002482047541904129, "loss": 0.0692, "step": 53500 }, { "epoch": 0.35, "learning_rate": 0.0002481950728360559, "loss": 0.0597, "step": 53510 }, { "epoch": 0.35, "learning_rate": 0.000248185391481699, "loss": 0.0641, "step": 53520 }, { "epoch": 0.35, "learning_rate": 0.0002481757101273421, "loss": 0.0631, "step": 53530 }, { "epoch": 0.35, "learning_rate": 0.0002481660287729851, "loss": 0.0573, "step": 53540 }, { "epoch": 0.35, "learning_rate": 0.0002481563474186282, "loss": 0.0568, "step": 53550 }, { "epoch": 0.35, "learning_rate": 0.00024814666606427126, "loss": 0.0674, "step": 53560 }, { "epoch": 0.35, "learning_rate": 0.00024813698470991434, "loss": 0.065, "step": 53570 }, { "epoch": 0.35, "learning_rate": 0.00024812730335555737, "loss": 0.0566, "step": 53580 }, { "epoch": 0.35, "learning_rate": 0.00024811762200120045, "loss": 0.0597, "step": 53590 }, { "epoch": 0.35, "learning_rate": 0.0002481079406468435, "loss": 0.0627, "step": 53600 }, { "epoch": 0.35, "learning_rate": 0.0002480982592924866, "loss": 0.0641, "step": 53610 }, { "epoch": 0.35, "learning_rate": 0.0002480885779381297, "loss": 0.0587, "step": 53620 }, { "epoch": 0.35, "learning_rate": 0.00024807889658377277, "loss": 0.0661, "step": 53630 }, { "epoch": 0.35, "learning_rate": 0.0002480692152294158, "loss": 0.0667, "step": 53640 }, { "epoch": 0.35, "learning_rate": 0.00024805953387505887, "loss": 0.0653, "step": 53650 }, { "epoch": 0.35, "learning_rate": 0.00024804985252070195, "loss": 0.0643, "step": 53660 }, { "epoch": 0.35, "learning_rate": 0.000248040171166345, "loss": 0.0702, "step": 53670 }, { "epoch": 0.35, "learning_rate": 0.00024803048981198806, "loss": 0.0675, "step": 53680 }, { "epoch": 0.35, "learning_rate": 0.00024802080845763114, "loss": 0.0685, "step": 53690 }, { "epoch": 0.35, "learning_rate": 0.0002480111271032742, "loss": 0.0707, "step": 53700 }, { "epoch": 0.35, "learning_rate": 0.0002480014457489173, "loss": 0.0573, "step": 53710 }, { "epoch": 0.35, "learning_rate": 0.0002479917643945603, "loss": 0.0641, "step": 53720 }, { "epoch": 0.35, "learning_rate": 0.0002479820830402034, "loss": 0.0652, "step": 53730 }, { "epoch": 0.35, "learning_rate": 0.0002479724016858465, "loss": 0.0592, "step": 53740 }, { "epoch": 0.35, "learning_rate": 0.00024796272033148956, "loss": 0.0588, "step": 53750 }, { "epoch": 0.35, "learning_rate": 0.00024795303897713264, "loss": 0.0608, "step": 53760 }, { "epoch": 0.35, "learning_rate": 0.0002479433576227757, "loss": 0.0579, "step": 53770 }, { "epoch": 0.35, "learning_rate": 0.00024793367626841875, "loss": 0.0632, "step": 53780 }, { "epoch": 0.35, "learning_rate": 0.0002479239949140618, "loss": 0.0566, "step": 53790 }, { "epoch": 0.35, "learning_rate": 0.0002479143135597049, "loss": 0.0641, "step": 53800 }, { "epoch": 0.35, "learning_rate": 0.00024790463220534793, "loss": 0.0738, "step": 53810 }, { "epoch": 0.35, "learning_rate": 0.000247894950850991, "loss": 0.0672, "step": 53820 }, { "epoch": 0.35, "learning_rate": 0.0002478852694966341, "loss": 0.061, "step": 53830 }, { "epoch": 0.35, "learning_rate": 0.00024787558814227717, "loss": 0.0635, "step": 53840 }, { "epoch": 0.35, "learning_rate": 0.00024786590678792025, "loss": 0.0609, "step": 53850 }, { "epoch": 0.35, "learning_rate": 0.0002478562254335633, "loss": 0.0658, "step": 53860 }, { "epoch": 0.35, "learning_rate": 0.00024784654407920636, "loss": 0.0699, "step": 53870 }, { "epoch": 0.35, "learning_rate": 0.00024783686272484944, "loss": 0.0606, "step": 53880 }, { "epoch": 0.35, "learning_rate": 0.0002478271813704925, "loss": 0.0643, "step": 53890 }, { "epoch": 0.35, "learning_rate": 0.0002478175000161356, "loss": 0.0577, "step": 53900 }, { "epoch": 0.35, "learning_rate": 0.0002478078186617786, "loss": 0.0632, "step": 53910 }, { "epoch": 0.35, "learning_rate": 0.0002477981373074217, "loss": 0.0582, "step": 53920 }, { "epoch": 0.35, "learning_rate": 0.0002477884559530648, "loss": 0.0655, "step": 53930 }, { "epoch": 0.35, "learning_rate": 0.0002477787745987078, "loss": 0.0689, "step": 53940 }, { "epoch": 0.35, "learning_rate": 0.0002477690932443509, "loss": 0.0773, "step": 53950 }, { "epoch": 0.35, "learning_rate": 0.00024775941188999397, "loss": 0.0687, "step": 53960 }, { "epoch": 0.35, "learning_rate": 0.00024774973053563705, "loss": 0.0621, "step": 53970 }, { "epoch": 0.35, "learning_rate": 0.0002477400491812801, "loss": 0.0618, "step": 53980 }, { "epoch": 0.35, "learning_rate": 0.0002477303678269232, "loss": 0.065, "step": 53990 }, { "epoch": 0.35, "learning_rate": 0.00024772068647256623, "loss": 0.063, "step": 54000 }, { "epoch": 0.35, "eval_cer": 0.9200108462320642, "eval_loss": 0.04245748743414879, "eval_runtime": 120.2121, "eval_samples_per_second": 16.637, "eval_steps_per_second": 4.159, "step": 54000 }, { "epoch": 0.35, "learning_rate": 0.0002477110051182093, "loss": 0.0614, "step": 54010 }, { "epoch": 0.35, "learning_rate": 0.0002477013237638524, "loss": 0.0582, "step": 54020 }, { "epoch": 0.35, "learning_rate": 0.00024769164240949547, "loss": 0.0706, "step": 54030 }, { "epoch": 0.35, "learning_rate": 0.00024768196105513855, "loss": 0.0636, "step": 54040 }, { "epoch": 0.35, "learning_rate": 0.0002476722797007816, "loss": 0.0647, "step": 54050 }, { "epoch": 0.35, "learning_rate": 0.00024766259834642465, "loss": 0.0565, "step": 54060 }, { "epoch": 0.35, "learning_rate": 0.0002476529169920677, "loss": 0.0747, "step": 54070 }, { "epoch": 0.35, "learning_rate": 0.00024764323563771076, "loss": 0.0598, "step": 54080 }, { "epoch": 0.35, "learning_rate": 0.00024763355428335384, "loss": 0.0644, "step": 54090 }, { "epoch": 0.35, "learning_rate": 0.0002476238729289969, "loss": 0.0645, "step": 54100 }, { "epoch": 0.35, "learning_rate": 0.00024761419157464, "loss": 0.0626, "step": 54110 }, { "epoch": 0.35, "learning_rate": 0.0002476045102202831, "loss": 0.0685, "step": 54120 }, { "epoch": 0.35, "learning_rate": 0.00024759482886592616, "loss": 0.0626, "step": 54130 }, { "epoch": 0.35, "learning_rate": 0.0002475851475115692, "loss": 0.0631, "step": 54140 }, { "epoch": 0.35, "learning_rate": 0.00024757546615721226, "loss": 0.0558, "step": 54150 }, { "epoch": 0.35, "learning_rate": 0.00024756578480285534, "loss": 0.0654, "step": 54160 }, { "epoch": 0.35, "learning_rate": 0.0002475561034484984, "loss": 0.0623, "step": 54170 }, { "epoch": 0.35, "learning_rate": 0.00024754642209414145, "loss": 0.0648, "step": 54180 }, { "epoch": 0.35, "learning_rate": 0.00024753674073978453, "loss": 0.0601, "step": 54190 }, { "epoch": 0.35, "learning_rate": 0.0002475270593854276, "loss": 0.0704, "step": 54200 }, { "epoch": 0.35, "learning_rate": 0.00024751737803107063, "loss": 0.0617, "step": 54210 }, { "epoch": 0.35, "learning_rate": 0.0002475076966767137, "loss": 0.0598, "step": 54220 }, { "epoch": 0.35, "learning_rate": 0.0002474980153223568, "loss": 0.0737, "step": 54230 }, { "epoch": 0.35, "learning_rate": 0.0002474883339679999, "loss": 0.0679, "step": 54240 }, { "epoch": 0.35, "learning_rate": 0.00024747865261364295, "loss": 0.0599, "step": 54250 }, { "epoch": 0.35, "learning_rate": 0.00024746897125928603, "loss": 0.0668, "step": 54260 }, { "epoch": 0.35, "learning_rate": 0.0002474592899049291, "loss": 0.0756, "step": 54270 }, { "epoch": 0.35, "learning_rate": 0.00024744960855057214, "loss": 0.0591, "step": 54280 }, { "epoch": 0.35, "learning_rate": 0.0002474399271962152, "loss": 0.0665, "step": 54290 }, { "epoch": 0.35, "learning_rate": 0.0002474302458418583, "loss": 0.0601, "step": 54300 }, { "epoch": 0.35, "learning_rate": 0.0002474205644875013, "loss": 0.0611, "step": 54310 }, { "epoch": 0.35, "learning_rate": 0.0002474108831331444, "loss": 0.0614, "step": 54320 }, { "epoch": 0.35, "learning_rate": 0.0002474012017787875, "loss": 0.0575, "step": 54330 }, { "epoch": 0.35, "learning_rate": 0.00024739152042443056, "loss": 0.0589, "step": 54340 }, { "epoch": 0.35, "learning_rate": 0.0002473818390700736, "loss": 0.0555, "step": 54350 }, { "epoch": 0.35, "learning_rate": 0.00024737215771571667, "loss": 0.0617, "step": 54360 }, { "epoch": 0.35, "learning_rate": 0.00024736247636135975, "loss": 0.059, "step": 54370 }, { "epoch": 0.35, "learning_rate": 0.00024735279500700283, "loss": 0.0524, "step": 54380 }, { "epoch": 0.35, "learning_rate": 0.0002473431136526459, "loss": 0.0599, "step": 54390 }, { "epoch": 0.35, "learning_rate": 0.000247333432298289, "loss": 0.0573, "step": 54400 }, { "epoch": 0.35, "learning_rate": 0.00024732375094393207, "loss": 0.065, "step": 54410 }, { "epoch": 0.35, "learning_rate": 0.0002473140695895751, "loss": 0.0596, "step": 54420 }, { "epoch": 0.35, "learning_rate": 0.0002473043882352182, "loss": 0.0616, "step": 54430 }, { "epoch": 0.35, "learning_rate": 0.00024729470688086125, "loss": 0.0634, "step": 54440 }, { "epoch": 0.35, "learning_rate": 0.0002472850255265043, "loss": 0.0579, "step": 54450 }, { "epoch": 0.35, "learning_rate": 0.00024727534417214736, "loss": 0.0522, "step": 54460 }, { "epoch": 0.35, "learning_rate": 0.00024726566281779044, "loss": 0.0575, "step": 54470 }, { "epoch": 0.35, "learning_rate": 0.0002472559814634335, "loss": 0.0719, "step": 54480 }, { "epoch": 0.35, "learning_rate": 0.00024724630010907654, "loss": 0.0574, "step": 54490 }, { "epoch": 0.35, "learning_rate": 0.0002472366187547196, "loss": 0.0618, "step": 54500 }, { "epoch": 0.35, "learning_rate": 0.0002472269374003627, "loss": 0.0615, "step": 54510 }, { "epoch": 0.35, "learning_rate": 0.0002472172560460058, "loss": 0.0593, "step": 54520 }, { "epoch": 0.35, "learning_rate": 0.00024720757469164886, "loss": 0.0568, "step": 54530 }, { "epoch": 0.35, "learning_rate": 0.00024719789333729194, "loss": 0.058, "step": 54540 }, { "epoch": 0.35, "learning_rate": 0.00024718821198293497, "loss": 0.0584, "step": 54550 }, { "epoch": 0.35, "learning_rate": 0.00024717853062857805, "loss": 0.0571, "step": 54560 }, { "epoch": 0.35, "learning_rate": 0.00024716884927422113, "loss": 0.0675, "step": 54570 }, { "epoch": 0.35, "learning_rate": 0.00024715916791986415, "loss": 0.0639, "step": 54580 }, { "epoch": 0.35, "learning_rate": 0.00024714948656550723, "loss": 0.0569, "step": 54590 }, { "epoch": 0.35, "learning_rate": 0.0002471398052111503, "loss": 0.0589, "step": 54600 }, { "epoch": 0.35, "learning_rate": 0.0002471301238567934, "loss": 0.0643, "step": 54610 }, { "epoch": 0.35, "learning_rate": 0.00024712044250243647, "loss": 0.0577, "step": 54620 }, { "epoch": 0.35, "learning_rate": 0.0002471107611480795, "loss": 0.0568, "step": 54630 }, { "epoch": 0.35, "learning_rate": 0.0002471010797937226, "loss": 0.0642, "step": 54640 }, { "epoch": 0.35, "learning_rate": 0.00024709139843936566, "loss": 0.0691, "step": 54650 }, { "epoch": 0.35, "learning_rate": 0.00024708171708500874, "loss": 0.0626, "step": 54660 }, { "epoch": 0.35, "learning_rate": 0.0002470720357306518, "loss": 0.0605, "step": 54670 }, { "epoch": 0.35, "learning_rate": 0.00024706235437629484, "loss": 0.0518, "step": 54680 }, { "epoch": 0.35, "learning_rate": 0.0002470526730219379, "loss": 0.0657, "step": 54690 }, { "epoch": 0.35, "learning_rate": 0.000247042991667581, "loss": 0.0607, "step": 54700 }, { "epoch": 0.35, "learning_rate": 0.00024703331031322403, "loss": 0.0664, "step": 54710 }, { "epoch": 0.35, "learning_rate": 0.0002470236289588671, "loss": 0.0607, "step": 54720 }, { "epoch": 0.35, "learning_rate": 0.0002470139476045102, "loss": 0.0661, "step": 54730 }, { "epoch": 0.35, "learning_rate": 0.00024700426625015327, "loss": 0.0556, "step": 54740 }, { "epoch": 0.35, "learning_rate": 0.00024699458489579635, "loss": 0.0604, "step": 54750 }, { "epoch": 0.35, "learning_rate": 0.00024698490354143943, "loss": 0.0633, "step": 54760 }, { "epoch": 0.35, "learning_rate": 0.00024697522218708245, "loss": 0.0655, "step": 54770 }, { "epoch": 0.35, "learning_rate": 0.00024696554083272553, "loss": 0.0582, "step": 54780 }, { "epoch": 0.35, "learning_rate": 0.0002469558594783686, "loss": 0.058, "step": 54790 }, { "epoch": 0.35, "learning_rate": 0.0002469461781240117, "loss": 0.0594, "step": 54800 }, { "epoch": 0.35, "learning_rate": 0.00024693649676965477, "loss": 0.0613, "step": 54810 }, { "epoch": 0.35, "learning_rate": 0.0002469268154152978, "loss": 0.0592, "step": 54820 }, { "epoch": 0.35, "learning_rate": 0.0002469171340609409, "loss": 0.067, "step": 54830 }, { "epoch": 0.35, "learning_rate": 0.00024690745270658396, "loss": 0.0618, "step": 54840 }, { "epoch": 0.35, "learning_rate": 0.000246897771352227, "loss": 0.0542, "step": 54850 }, { "epoch": 0.35, "learning_rate": 0.00024688808999787006, "loss": 0.0672, "step": 54860 }, { "epoch": 0.35, "learning_rate": 0.00024687840864351314, "loss": 0.0657, "step": 54870 }, { "epoch": 0.35, "learning_rate": 0.0002468687272891562, "loss": 0.0579, "step": 54880 }, { "epoch": 0.35, "learning_rate": 0.0002468590459347993, "loss": 0.0589, "step": 54890 }, { "epoch": 0.35, "learning_rate": 0.0002468493645804424, "loss": 0.0579, "step": 54900 }, { "epoch": 0.35, "learning_rate": 0.0002468396832260854, "loss": 0.069, "step": 54910 }, { "epoch": 0.35, "learning_rate": 0.0002468300018717285, "loss": 0.059, "step": 54920 }, { "epoch": 0.35, "learning_rate": 0.00024682032051737157, "loss": 0.0694, "step": 54930 }, { "epoch": 0.35, "learning_rate": 0.00024681063916301465, "loss": 0.0635, "step": 54940 }, { "epoch": 0.35, "learning_rate": 0.00024680095780865767, "loss": 0.0582, "step": 54950 }, { "epoch": 0.35, "learning_rate": 0.00024679127645430075, "loss": 0.0607, "step": 54960 }, { "epoch": 0.35, "learning_rate": 0.00024678159509994383, "loss": 0.0653, "step": 54970 }, { "epoch": 0.35, "learning_rate": 0.00024677191374558686, "loss": 0.069, "step": 54980 }, { "epoch": 0.35, "learning_rate": 0.00024676223239122994, "loss": 0.067, "step": 54990 }, { "epoch": 0.35, "learning_rate": 0.000246752551036873, "loss": 0.0609, "step": 55000 }, { "epoch": 0.35, "eval_cer": 0.9199882499152638, "eval_loss": 0.040658190846443176, "eval_runtime": 120.0185, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 55000 }, { "epoch": 0.36, "learning_rate": 0.0002467428696825161, "loss": 0.0668, "step": 55010 }, { "epoch": 0.36, "learning_rate": 0.0002467331883281592, "loss": 0.0648, "step": 55020 }, { "epoch": 0.36, "learning_rate": 0.00024672350697380226, "loss": 0.0599, "step": 55030 }, { "epoch": 0.36, "learning_rate": 0.00024671382561944534, "loss": 0.06, "step": 55040 }, { "epoch": 0.36, "learning_rate": 0.00024670414426508836, "loss": 0.0602, "step": 55050 }, { "epoch": 0.36, "learning_rate": 0.00024669446291073144, "loss": 0.0638, "step": 55060 }, { "epoch": 0.36, "learning_rate": 0.0002466847815563745, "loss": 0.0576, "step": 55070 }, { "epoch": 0.36, "learning_rate": 0.00024667510020201755, "loss": 0.0564, "step": 55080 }, { "epoch": 0.36, "learning_rate": 0.0002466654188476606, "loss": 0.0541, "step": 55090 }, { "epoch": 0.36, "learning_rate": 0.0002466557374933037, "loss": 0.0569, "step": 55100 }, { "epoch": 0.36, "learning_rate": 0.0002466460561389468, "loss": 0.0665, "step": 55110 }, { "epoch": 0.36, "learning_rate": 0.0002466363747845898, "loss": 0.0551, "step": 55120 }, { "epoch": 0.36, "learning_rate": 0.0002466266934302329, "loss": 0.0624, "step": 55130 }, { "epoch": 0.36, "learning_rate": 0.00024661701207587597, "loss": 0.056, "step": 55140 }, { "epoch": 0.36, "learning_rate": 0.00024660733072151905, "loss": 0.0649, "step": 55150 }, { "epoch": 0.36, "learning_rate": 0.00024659764936716213, "loss": 0.0611, "step": 55160 }, { "epoch": 0.36, "learning_rate": 0.0002465879680128052, "loss": 0.0609, "step": 55170 }, { "epoch": 0.36, "learning_rate": 0.0002465782866584483, "loss": 0.0618, "step": 55180 }, { "epoch": 0.36, "learning_rate": 0.0002465686053040913, "loss": 0.062, "step": 55190 }, { "epoch": 0.36, "learning_rate": 0.0002465589239497344, "loss": 0.0612, "step": 55200 }, { "epoch": 0.36, "learning_rate": 0.0002465492425953775, "loss": 0.0614, "step": 55210 }, { "epoch": 0.36, "learning_rate": 0.0002465395612410205, "loss": 0.0572, "step": 55220 }, { "epoch": 0.36, "learning_rate": 0.0002465298798866636, "loss": 0.061, "step": 55230 }, { "epoch": 0.36, "learning_rate": 0.00024652019853230666, "loss": 0.0557, "step": 55240 }, { "epoch": 0.36, "learning_rate": 0.00024651051717794974, "loss": 0.0617, "step": 55250 }, { "epoch": 0.36, "learning_rate": 0.00024650083582359277, "loss": 0.0535, "step": 55260 }, { "epoch": 0.36, "learning_rate": 0.00024649115446923585, "loss": 0.0566, "step": 55270 }, { "epoch": 0.36, "learning_rate": 0.0002464814731148789, "loss": 0.0578, "step": 55280 }, { "epoch": 0.36, "learning_rate": 0.000246471791760522, "loss": 0.0608, "step": 55290 }, { "epoch": 0.36, "learning_rate": 0.0002464621104061651, "loss": 0.0581, "step": 55300 }, { "epoch": 0.36, "learning_rate": 0.00024645242905180817, "loss": 0.0638, "step": 55310 }, { "epoch": 0.36, "learning_rate": 0.0002464427476974512, "loss": 0.063, "step": 55320 }, { "epoch": 0.36, "learning_rate": 0.00024643306634309427, "loss": 0.0617, "step": 55330 }, { "epoch": 0.36, "learning_rate": 0.00024642338498873735, "loss": 0.0558, "step": 55340 }, { "epoch": 0.36, "learning_rate": 0.0002464137036343804, "loss": 0.053, "step": 55350 }, { "epoch": 0.36, "learning_rate": 0.00024640402228002346, "loss": 0.0623, "step": 55360 }, { "epoch": 0.36, "learning_rate": 0.00024639434092566654, "loss": 0.0614, "step": 55370 }, { "epoch": 0.36, "learning_rate": 0.0002463846595713096, "loss": 0.0627, "step": 55380 }, { "epoch": 0.36, "learning_rate": 0.0002463749782169527, "loss": 0.0561, "step": 55390 }, { "epoch": 0.36, "learning_rate": 0.0002463652968625957, "loss": 0.0695, "step": 55400 }, { "epoch": 0.36, "learning_rate": 0.0002463556155082388, "loss": 0.0623, "step": 55410 }, { "epoch": 0.36, "learning_rate": 0.0002463459341538819, "loss": 0.0612, "step": 55420 }, { "epoch": 0.36, "learning_rate": 0.00024633625279952496, "loss": 0.0579, "step": 55430 }, { "epoch": 0.36, "learning_rate": 0.00024632657144516804, "loss": 0.062, "step": 55440 }, { "epoch": 0.36, "learning_rate": 0.00024631689009081107, "loss": 0.056, "step": 55450 }, { "epoch": 0.36, "learning_rate": 0.00024630720873645415, "loss": 0.061, "step": 55460 }, { "epoch": 0.36, "learning_rate": 0.0002462975273820972, "loss": 0.0611, "step": 55470 }, { "epoch": 0.36, "learning_rate": 0.00024628784602774025, "loss": 0.0583, "step": 55480 }, { "epoch": 0.36, "learning_rate": 0.00024627816467338333, "loss": 0.0562, "step": 55490 }, { "epoch": 0.36, "learning_rate": 0.0002462684833190264, "loss": 0.0654, "step": 55500 }, { "epoch": 0.36, "learning_rate": 0.0002462588019646695, "loss": 0.0609, "step": 55510 }, { "epoch": 0.36, "learning_rate": 0.00024624912061031257, "loss": 0.0607, "step": 55520 }, { "epoch": 0.36, "learning_rate": 0.00024623943925595565, "loss": 0.0626, "step": 55530 }, { "epoch": 0.36, "learning_rate": 0.0002462297579015987, "loss": 0.0572, "step": 55540 }, { "epoch": 0.36, "learning_rate": 0.00024622007654724175, "loss": 0.0611, "step": 55550 }, { "epoch": 0.36, "learning_rate": 0.00024621039519288483, "loss": 0.0651, "step": 55560 }, { "epoch": 0.36, "learning_rate": 0.0002462007138385279, "loss": 0.064, "step": 55570 }, { "epoch": 0.36, "learning_rate": 0.000246191032484171, "loss": 0.0685, "step": 55580 }, { "epoch": 0.36, "learning_rate": 0.000246181351129814, "loss": 0.0578, "step": 55590 }, { "epoch": 0.36, "learning_rate": 0.0002461716697754571, "loss": 0.0635, "step": 55600 }, { "epoch": 0.36, "learning_rate": 0.0002461619884211002, "loss": 0.0615, "step": 55610 }, { "epoch": 0.36, "learning_rate": 0.0002461523070667432, "loss": 0.0663, "step": 55620 }, { "epoch": 0.36, "learning_rate": 0.0002461426257123863, "loss": 0.0648, "step": 55630 }, { "epoch": 0.36, "learning_rate": 0.00024613294435802936, "loss": 0.0555, "step": 55640 }, { "epoch": 0.36, "learning_rate": 0.00024612326300367244, "loss": 0.0649, "step": 55650 }, { "epoch": 0.36, "learning_rate": 0.0002461135816493155, "loss": 0.0665, "step": 55660 }, { "epoch": 0.36, "learning_rate": 0.0002461039002949586, "loss": 0.0627, "step": 55670 }, { "epoch": 0.36, "learning_rate": 0.00024609421894060163, "loss": 0.0583, "step": 55680 }, { "epoch": 0.36, "learning_rate": 0.0002460845375862447, "loss": 0.0582, "step": 55690 }, { "epoch": 0.36, "learning_rate": 0.0002460748562318878, "loss": 0.0618, "step": 55700 }, { "epoch": 0.36, "learning_rate": 0.00024606517487753087, "loss": 0.0547, "step": 55710 }, { "epoch": 0.36, "learning_rate": 0.0002460554935231739, "loss": 0.0595, "step": 55720 }, { "epoch": 0.36, "learning_rate": 0.000246045812168817, "loss": 0.061, "step": 55730 }, { "epoch": 0.36, "learning_rate": 0.00024603613081446005, "loss": 0.0624, "step": 55740 }, { "epoch": 0.36, "learning_rate": 0.0002460264494601031, "loss": 0.0549, "step": 55750 }, { "epoch": 0.36, "learning_rate": 0.00024601676810574616, "loss": 0.0599, "step": 55760 }, { "epoch": 0.36, "learning_rate": 0.00024600708675138924, "loss": 0.0581, "step": 55770 }, { "epoch": 0.36, "learning_rate": 0.0002459974053970323, "loss": 0.0651, "step": 55780 }, { "epoch": 0.36, "learning_rate": 0.0002459877240426754, "loss": 0.0595, "step": 55790 }, { "epoch": 0.36, "learning_rate": 0.0002459780426883185, "loss": 0.067, "step": 55800 }, { "epoch": 0.36, "learning_rate": 0.00024596836133396156, "loss": 0.0689, "step": 55810 }, { "epoch": 0.36, "learning_rate": 0.0002459586799796046, "loss": 0.0625, "step": 55820 }, { "epoch": 0.36, "learning_rate": 0.00024594899862524766, "loss": 0.073, "step": 55830 }, { "epoch": 0.36, "learning_rate": 0.00024593931727089074, "loss": 0.0612, "step": 55840 }, { "epoch": 0.36, "learning_rate": 0.00024592963591653377, "loss": 0.0548, "step": 55850 }, { "epoch": 0.36, "learning_rate": 0.00024591995456217685, "loss": 0.0715, "step": 55860 }, { "epoch": 0.36, "learning_rate": 0.00024591027320781993, "loss": 0.0546, "step": 55870 }, { "epoch": 0.36, "learning_rate": 0.000245900591853463, "loss": 0.062, "step": 55880 }, { "epoch": 0.36, "learning_rate": 0.00024589091049910603, "loss": 0.0678, "step": 55890 }, { "epoch": 0.36, "learning_rate": 0.0002458812291447491, "loss": 0.0645, "step": 55900 }, { "epoch": 0.36, "learning_rate": 0.0002458715477903922, "loss": 0.0651, "step": 55910 }, { "epoch": 0.36, "learning_rate": 0.0002458618664360353, "loss": 0.0541, "step": 55920 }, { "epoch": 0.36, "learning_rate": 0.00024585218508167835, "loss": 0.0722, "step": 55930 }, { "epoch": 0.36, "learning_rate": 0.00024584250372732143, "loss": 0.0566, "step": 55940 }, { "epoch": 0.36, "learning_rate": 0.0002458328223729645, "loss": 0.0593, "step": 55950 }, { "epoch": 0.36, "learning_rate": 0.00024582314101860754, "loss": 0.0616, "step": 55960 }, { "epoch": 0.36, "learning_rate": 0.0002458134596642506, "loss": 0.0624, "step": 55970 }, { "epoch": 0.36, "learning_rate": 0.0002458037783098937, "loss": 0.0584, "step": 55980 }, { "epoch": 0.36, "learning_rate": 0.0002457940969555367, "loss": 0.0569, "step": 55990 }, { "epoch": 0.36, "learning_rate": 0.0002457844156011798, "loss": 0.0583, "step": 56000 }, { "epoch": 0.36, "eval_cer": 0.9199855383572477, "eval_loss": 0.03988322243094444, "eval_runtime": 119.9115, "eval_samples_per_second": 16.679, "eval_steps_per_second": 4.17, "step": 56000 }, { "epoch": 0.36, "learning_rate": 0.0002457747342468229, "loss": 0.0637, "step": 56010 }, { "epoch": 0.36, "learning_rate": 0.00024576505289246596, "loss": 0.0654, "step": 56020 }, { "epoch": 0.36, "learning_rate": 0.000245755371538109, "loss": 0.0611, "step": 56030 }, { "epoch": 0.36, "learning_rate": 0.00024574569018375207, "loss": 0.0631, "step": 56040 }, { "epoch": 0.36, "learning_rate": 0.00024573600882939515, "loss": 0.069, "step": 56050 }, { "epoch": 0.36, "learning_rate": 0.00024572632747503823, "loss": 0.0659, "step": 56060 }, { "epoch": 0.36, "learning_rate": 0.0002457166461206813, "loss": 0.0756, "step": 56070 }, { "epoch": 0.36, "learning_rate": 0.0002457069647663244, "loss": 0.0597, "step": 56080 }, { "epoch": 0.36, "learning_rate": 0.0002456972834119674, "loss": 0.057, "step": 56090 }, { "epoch": 0.36, "learning_rate": 0.0002456876020576105, "loss": 0.0696, "step": 56100 }, { "epoch": 0.36, "learning_rate": 0.00024567792070325357, "loss": 0.0725, "step": 56110 }, { "epoch": 0.36, "learning_rate": 0.0002456682393488966, "loss": 0.0612, "step": 56120 }, { "epoch": 0.36, "learning_rate": 0.0002456585579945397, "loss": 0.0608, "step": 56130 }, { "epoch": 0.36, "learning_rate": 0.00024564887664018276, "loss": 0.0599, "step": 56140 }, { "epoch": 0.36, "learning_rate": 0.00024563919528582584, "loss": 0.0589, "step": 56150 }, { "epoch": 0.36, "learning_rate": 0.0002456295139314689, "loss": 0.0668, "step": 56160 }, { "epoch": 0.36, "learning_rate": 0.00024561983257711194, "loss": 0.0629, "step": 56170 }, { "epoch": 0.36, "learning_rate": 0.000245610151222755, "loss": 0.0547, "step": 56180 }, { "epoch": 0.36, "learning_rate": 0.0002456004698683981, "loss": 0.0626, "step": 56190 }, { "epoch": 0.36, "learning_rate": 0.0002455907885140412, "loss": 0.0548, "step": 56200 }, { "epoch": 0.36, "learning_rate": 0.00024558110715968426, "loss": 0.0622, "step": 56210 }, { "epoch": 0.36, "learning_rate": 0.00024557142580532734, "loss": 0.0621, "step": 56220 }, { "epoch": 0.36, "learning_rate": 0.00024556174445097037, "loss": 0.0653, "step": 56230 }, { "epoch": 0.36, "learning_rate": 0.00024555206309661345, "loss": 0.0607, "step": 56240 }, { "epoch": 0.36, "learning_rate": 0.0002455423817422565, "loss": 0.0529, "step": 56250 }, { "epoch": 0.36, "learning_rate": 0.00024553270038789955, "loss": 0.0514, "step": 56260 }, { "epoch": 0.36, "learning_rate": 0.00024552301903354263, "loss": 0.0626, "step": 56270 }, { "epoch": 0.36, "learning_rate": 0.0002455133376791857, "loss": 0.0619, "step": 56280 }, { "epoch": 0.36, "learning_rate": 0.0002455036563248288, "loss": 0.0527, "step": 56290 }, { "epoch": 0.36, "learning_rate": 0.00024549397497047187, "loss": 0.06, "step": 56300 }, { "epoch": 0.36, "learning_rate": 0.0002454842936161149, "loss": 0.057, "step": 56310 }, { "epoch": 0.36, "learning_rate": 0.000245474612261758, "loss": 0.0621, "step": 56320 }, { "epoch": 0.36, "learning_rate": 0.00024546493090740106, "loss": 0.0558, "step": 56330 }, { "epoch": 0.36, "learning_rate": 0.00024545524955304414, "loss": 0.0588, "step": 56340 }, { "epoch": 0.36, "learning_rate": 0.0002454455681986872, "loss": 0.0569, "step": 56350 }, { "epoch": 0.36, "learning_rate": 0.00024543588684433024, "loss": 0.0529, "step": 56360 }, { "epoch": 0.36, "learning_rate": 0.0002454262054899733, "loss": 0.0615, "step": 56370 }, { "epoch": 0.36, "learning_rate": 0.0002454165241356164, "loss": 0.0686, "step": 56380 }, { "epoch": 0.36, "learning_rate": 0.00024540684278125943, "loss": 0.0568, "step": 56390 }, { "epoch": 0.36, "learning_rate": 0.0002453971614269025, "loss": 0.06, "step": 56400 }, { "epoch": 0.36, "learning_rate": 0.0002453874800725456, "loss": 0.0643, "step": 56410 }, { "epoch": 0.36, "learning_rate": 0.00024537779871818867, "loss": 0.0619, "step": 56420 }, { "epoch": 0.36, "learning_rate": 0.00024536811736383175, "loss": 0.0638, "step": 56430 }, { "epoch": 0.36, "learning_rate": 0.0002453584360094748, "loss": 0.0614, "step": 56440 }, { "epoch": 0.36, "learning_rate": 0.00024534875465511785, "loss": 0.0599, "step": 56450 }, { "epoch": 0.36, "learning_rate": 0.00024533907330076093, "loss": 0.0585, "step": 56460 }, { "epoch": 0.36, "learning_rate": 0.000245329391946404, "loss": 0.0612, "step": 56470 }, { "epoch": 0.36, "learning_rate": 0.0002453197105920471, "loss": 0.0631, "step": 56480 }, { "epoch": 0.36, "learning_rate": 0.0002453100292376901, "loss": 0.0605, "step": 56490 }, { "epoch": 0.36, "learning_rate": 0.0002453003478833332, "loss": 0.0557, "step": 56500 }, { "epoch": 0.36, "learning_rate": 0.0002452906665289763, "loss": 0.0622, "step": 56510 }, { "epoch": 0.36, "learning_rate": 0.0002452809851746193, "loss": 0.0671, "step": 56520 }, { "epoch": 0.36, "learning_rate": 0.0002452713038202624, "loss": 0.0633, "step": 56530 }, { "epoch": 0.36, "learning_rate": 0.00024526162246590546, "loss": 0.058, "step": 56540 }, { "epoch": 0.36, "learning_rate": 0.00024525194111154854, "loss": 0.0534, "step": 56550 }, { "epoch": 0.37, "learning_rate": 0.0002452422597571916, "loss": 0.0614, "step": 56560 }, { "epoch": 0.37, "learning_rate": 0.0002452325784028347, "loss": 0.0544, "step": 56570 }, { "epoch": 0.37, "learning_rate": 0.0002452228970484778, "loss": 0.0534, "step": 56580 }, { "epoch": 0.37, "learning_rate": 0.0002452132156941208, "loss": 0.0628, "step": 56590 }, { "epoch": 0.37, "learning_rate": 0.0002452035343397639, "loss": 0.0588, "step": 56600 }, { "epoch": 0.37, "learning_rate": 0.00024519385298540697, "loss": 0.0626, "step": 56610 }, { "epoch": 0.37, "learning_rate": 0.00024518417163105005, "loss": 0.0773, "step": 56620 }, { "epoch": 0.37, "learning_rate": 0.00024517449027669307, "loss": 0.059, "step": 56630 }, { "epoch": 0.37, "learning_rate": 0.00024516480892233615, "loss": 0.0577, "step": 56640 }, { "epoch": 0.37, "learning_rate": 0.00024515512756797923, "loss": 0.0667, "step": 56650 }, { "epoch": 0.37, "learning_rate": 0.00024514544621362226, "loss": 0.0684, "step": 56660 }, { "epoch": 0.37, "learning_rate": 0.00024513576485926534, "loss": 0.0576, "step": 56670 }, { "epoch": 0.37, "learning_rate": 0.0002451260835049084, "loss": 0.0606, "step": 56680 }, { "epoch": 0.37, "learning_rate": 0.0002451164021505515, "loss": 0.0621, "step": 56690 }, { "epoch": 0.37, "learning_rate": 0.0002451067207961946, "loss": 0.058, "step": 56700 }, { "epoch": 0.37, "learning_rate": 0.00024509703944183766, "loss": 0.0642, "step": 56710 }, { "epoch": 0.37, "learning_rate": 0.00024508735808748074, "loss": 0.0621, "step": 56720 }, { "epoch": 0.37, "learning_rate": 0.00024507767673312376, "loss": 0.0601, "step": 56730 }, { "epoch": 0.37, "learning_rate": 0.00024506799537876684, "loss": 0.0625, "step": 56740 }, { "epoch": 0.37, "learning_rate": 0.0002450583140244099, "loss": 0.0592, "step": 56750 }, { "epoch": 0.37, "learning_rate": 0.00024504863267005295, "loss": 0.0589, "step": 56760 }, { "epoch": 0.37, "learning_rate": 0.000245038951315696, "loss": 0.0514, "step": 56770 }, { "epoch": 0.37, "learning_rate": 0.0002450292699613391, "loss": 0.0626, "step": 56780 }, { "epoch": 0.37, "learning_rate": 0.0002450195886069822, "loss": 0.0577, "step": 56790 }, { "epoch": 0.37, "learning_rate": 0.0002450099072526252, "loss": 0.0614, "step": 56800 }, { "epoch": 0.37, "learning_rate": 0.0002450002258982683, "loss": 0.0604, "step": 56810 }, { "epoch": 0.37, "learning_rate": 0.00024499054454391137, "loss": 0.062, "step": 56820 }, { "epoch": 0.37, "learning_rate": 0.00024498086318955445, "loss": 0.0593, "step": 56830 }, { "epoch": 0.37, "learning_rate": 0.00024497118183519753, "loss": 0.063, "step": 56840 }, { "epoch": 0.37, "learning_rate": 0.0002449615004808406, "loss": 0.0589, "step": 56850 }, { "epoch": 0.37, "learning_rate": 0.00024495181912648364, "loss": 0.0617, "step": 56860 }, { "epoch": 0.37, "learning_rate": 0.0002449421377721267, "loss": 0.0608, "step": 56870 }, { "epoch": 0.37, "learning_rate": 0.0002449324564177698, "loss": 0.0583, "step": 56880 }, { "epoch": 0.37, "learning_rate": 0.0002449227750634128, "loss": 0.0567, "step": 56890 }, { "epoch": 0.37, "learning_rate": 0.0002449130937090559, "loss": 0.0626, "step": 56900 }, { "epoch": 0.37, "learning_rate": 0.000244903412354699, "loss": 0.056, "step": 56910 }, { "epoch": 0.37, "learning_rate": 0.00024489373100034206, "loss": 0.0546, "step": 56920 }, { "epoch": 0.37, "learning_rate": 0.00024488404964598514, "loss": 0.0562, "step": 56930 }, { "epoch": 0.37, "learning_rate": 0.00024487436829162817, "loss": 0.0504, "step": 56940 }, { "epoch": 0.37, "learning_rate": 0.00024486468693727125, "loss": 0.0507, "step": 56950 }, { "epoch": 0.37, "learning_rate": 0.0002448550055829143, "loss": 0.0567, "step": 56960 }, { "epoch": 0.37, "learning_rate": 0.0002448453242285574, "loss": 0.0596, "step": 56970 }, { "epoch": 0.37, "learning_rate": 0.0002448356428742005, "loss": 0.0588, "step": 56980 }, { "epoch": 0.37, "learning_rate": 0.00024482596151984356, "loss": 0.0612, "step": 56990 }, { "epoch": 0.37, "learning_rate": 0.0002448162801654866, "loss": 0.0602, "step": 57000 }, { "epoch": 0.37, "eval_cer": 0.9200777313297932, "eval_loss": 0.04003721475601196, "eval_runtime": 120.0958, "eval_samples_per_second": 16.653, "eval_steps_per_second": 4.163, "step": 57000 }, { "epoch": 0.37, "learning_rate": 0.00024480659881112967, "loss": 0.067, "step": 57010 }, { "epoch": 0.37, "learning_rate": 0.00024479691745677275, "loss": 0.0599, "step": 57020 }, { "epoch": 0.37, "learning_rate": 0.0002447872361024158, "loss": 0.0546, "step": 57030 }, { "epoch": 0.37, "learning_rate": 0.00024477755474805885, "loss": 0.0567, "step": 57040 }, { "epoch": 0.37, "learning_rate": 0.00024476787339370193, "loss": 0.0594, "step": 57050 }, { "epoch": 0.37, "learning_rate": 0.000244758192039345, "loss": 0.0585, "step": 57060 }, { "epoch": 0.37, "learning_rate": 0.0002447485106849881, "loss": 0.0665, "step": 57070 }, { "epoch": 0.37, "learning_rate": 0.0002447388293306311, "loss": 0.0604, "step": 57080 }, { "epoch": 0.37, "learning_rate": 0.0002447291479762742, "loss": 0.0536, "step": 57090 }, { "epoch": 0.37, "learning_rate": 0.0002447194666219173, "loss": 0.0561, "step": 57100 }, { "epoch": 0.37, "learning_rate": 0.00024470978526756036, "loss": 0.0694, "step": 57110 }, { "epoch": 0.37, "learning_rate": 0.00024470010391320344, "loss": 0.0653, "step": 57120 }, { "epoch": 0.37, "learning_rate": 0.00024469042255884646, "loss": 0.0602, "step": 57130 }, { "epoch": 0.37, "learning_rate": 0.00024468074120448954, "loss": 0.0581, "step": 57140 }, { "epoch": 0.37, "learning_rate": 0.0002446710598501326, "loss": 0.0664, "step": 57150 }, { "epoch": 0.37, "learning_rate": 0.00024466137849577565, "loss": 0.0661, "step": 57160 }, { "epoch": 0.37, "learning_rate": 0.00024465169714141873, "loss": 0.0637, "step": 57170 }, { "epoch": 0.37, "learning_rate": 0.0002446420157870618, "loss": 0.0643, "step": 57180 }, { "epoch": 0.37, "learning_rate": 0.0002446323344327049, "loss": 0.0629, "step": 57190 }, { "epoch": 0.37, "learning_rate": 0.00024462265307834797, "loss": 0.0567, "step": 57200 }, { "epoch": 0.37, "learning_rate": 0.00024461297172399105, "loss": 0.0586, "step": 57210 }, { "epoch": 0.37, "learning_rate": 0.0002446032903696341, "loss": 0.0562, "step": 57220 }, { "epoch": 0.37, "learning_rate": 0.00024459360901527715, "loss": 0.0598, "step": 57230 }, { "epoch": 0.37, "learning_rate": 0.00024458392766092023, "loss": 0.0574, "step": 57240 }, { "epoch": 0.37, "learning_rate": 0.0002445742463065633, "loss": 0.0642, "step": 57250 }, { "epoch": 0.37, "learning_rate": 0.00024456456495220634, "loss": 0.0589, "step": 57260 }, { "epoch": 0.37, "learning_rate": 0.0002445548835978494, "loss": 0.0549, "step": 57270 }, { "epoch": 0.37, "learning_rate": 0.0002445452022434925, "loss": 0.0693, "step": 57280 }, { "epoch": 0.37, "learning_rate": 0.0002445355208891355, "loss": 0.0637, "step": 57290 }, { "epoch": 0.37, "learning_rate": 0.0002445258395347786, "loss": 0.0545, "step": 57300 }, { "epoch": 0.37, "learning_rate": 0.0002445161581804217, "loss": 0.0526, "step": 57310 }, { "epoch": 0.37, "learning_rate": 0.00024450647682606476, "loss": 0.0638, "step": 57320 }, { "epoch": 0.37, "learning_rate": 0.00024449679547170784, "loss": 0.0517, "step": 57330 }, { "epoch": 0.37, "learning_rate": 0.0002444871141173509, "loss": 0.0654, "step": 57340 }, { "epoch": 0.37, "learning_rate": 0.000244477432762994, "loss": 0.0577, "step": 57350 }, { "epoch": 0.37, "learning_rate": 0.00024446775140863703, "loss": 0.0579, "step": 57360 }, { "epoch": 0.37, "learning_rate": 0.0002444580700542801, "loss": 0.0748, "step": 57370 }, { "epoch": 0.37, "learning_rate": 0.0002444483886999232, "loss": 0.0589, "step": 57380 }, { "epoch": 0.37, "learning_rate": 0.00024443870734556627, "loss": 0.0572, "step": 57390 }, { "epoch": 0.37, "learning_rate": 0.0002444290259912093, "loss": 0.0628, "step": 57400 }, { "epoch": 0.37, "learning_rate": 0.0002444193446368524, "loss": 0.0634, "step": 57410 }, { "epoch": 0.37, "learning_rate": 0.00024440966328249545, "loss": 0.078, "step": 57420 }, { "epoch": 0.37, "learning_rate": 0.0002443999819281385, "loss": 0.0672, "step": 57430 }, { "epoch": 0.37, "learning_rate": 0.00024439030057378156, "loss": 0.0632, "step": 57440 }, { "epoch": 0.37, "learning_rate": 0.00024438061921942464, "loss": 0.0533, "step": 57450 }, { "epoch": 0.37, "learning_rate": 0.0002443709378650677, "loss": 0.0567, "step": 57460 }, { "epoch": 0.37, "learning_rate": 0.0002443612565107108, "loss": 0.0706, "step": 57470 }, { "epoch": 0.37, "learning_rate": 0.0002443515751563539, "loss": 0.0631, "step": 57480 }, { "epoch": 0.37, "learning_rate": 0.00024434189380199696, "loss": 0.0604, "step": 57490 }, { "epoch": 0.37, "learning_rate": 0.00024433221244764, "loss": 0.0618, "step": 57500 }, { "epoch": 0.37, "learning_rate": 0.00024432253109328306, "loss": 0.056, "step": 57510 }, { "epoch": 0.37, "learning_rate": 0.00024431284973892614, "loss": 0.0641, "step": 57520 }, { "epoch": 0.37, "learning_rate": 0.00024430316838456917, "loss": 0.0649, "step": 57530 }, { "epoch": 0.37, "learning_rate": 0.00024429348703021225, "loss": 0.0651, "step": 57540 }, { "epoch": 0.37, "learning_rate": 0.00024428380567585533, "loss": 0.0656, "step": 57550 }, { "epoch": 0.37, "learning_rate": 0.0002442741243214984, "loss": 0.0667, "step": 57560 }, { "epoch": 0.37, "learning_rate": 0.00024426444296714143, "loss": 0.0593, "step": 57570 }, { "epoch": 0.37, "learning_rate": 0.0002442547616127845, "loss": 0.0585, "step": 57580 }, { "epoch": 0.37, "learning_rate": 0.0002442450802584276, "loss": 0.0609, "step": 57590 }, { "epoch": 0.37, "learning_rate": 0.00024423539890407067, "loss": 0.0558, "step": 57600 }, { "epoch": 0.37, "learning_rate": 0.00024422571754971375, "loss": 0.0668, "step": 57610 }, { "epoch": 0.37, "learning_rate": 0.00024421603619535683, "loss": 0.0618, "step": 57620 }, { "epoch": 0.37, "learning_rate": 0.00024420635484099986, "loss": 0.0709, "step": 57630 }, { "epoch": 0.37, "learning_rate": 0.00024419667348664294, "loss": 0.0569, "step": 57640 }, { "epoch": 0.37, "learning_rate": 0.000244186992132286, "loss": 0.0627, "step": 57650 }, { "epoch": 0.37, "learning_rate": 0.00024417731077792904, "loss": 0.0575, "step": 57660 }, { "epoch": 0.37, "learning_rate": 0.0002441676294235721, "loss": 0.0518, "step": 57670 }, { "epoch": 0.37, "learning_rate": 0.0002441579480692152, "loss": 0.061, "step": 57680 }, { "epoch": 0.37, "learning_rate": 0.0002441482667148583, "loss": 0.0669, "step": 57690 }, { "epoch": 0.37, "learning_rate": 0.00024413858536050136, "loss": 0.0571, "step": 57700 }, { "epoch": 0.37, "learning_rate": 0.0002441289040061444, "loss": 0.062, "step": 57710 }, { "epoch": 0.37, "learning_rate": 0.00024411922265178747, "loss": 0.0673, "step": 57720 }, { "epoch": 0.37, "learning_rate": 0.00024410954129743055, "loss": 0.0594, "step": 57730 }, { "epoch": 0.37, "learning_rate": 0.00024409985994307363, "loss": 0.0543, "step": 57740 }, { "epoch": 0.37, "learning_rate": 0.00024409017858871668, "loss": 0.0597, "step": 57750 }, { "epoch": 0.37, "learning_rate": 0.00024408049723435976, "loss": 0.0634, "step": 57760 }, { "epoch": 0.37, "learning_rate": 0.00024407081588000284, "loss": 0.0595, "step": 57770 }, { "epoch": 0.37, "learning_rate": 0.00024406113452564587, "loss": 0.0607, "step": 57780 }, { "epoch": 0.37, "learning_rate": 0.00024405145317128894, "loss": 0.0588, "step": 57790 }, { "epoch": 0.37, "learning_rate": 0.00024404177181693202, "loss": 0.0649, "step": 57800 }, { "epoch": 0.37, "learning_rate": 0.0002440320904625751, "loss": 0.0719, "step": 57810 }, { "epoch": 0.37, "learning_rate": 0.00024402240910821816, "loss": 0.0612, "step": 57820 }, { "epoch": 0.37, "learning_rate": 0.00024401272775386124, "loss": 0.0499, "step": 57830 }, { "epoch": 0.37, "learning_rate": 0.00024400304639950432, "loss": 0.0552, "step": 57840 }, { "epoch": 0.37, "learning_rate": 0.00024399336504514734, "loss": 0.0534, "step": 57850 }, { "epoch": 0.37, "learning_rate": 0.00024398368369079042, "loss": 0.0544, "step": 57860 }, { "epoch": 0.37, "learning_rate": 0.0002439740023364335, "loss": 0.0556, "step": 57870 }, { "epoch": 0.37, "learning_rate": 0.00024396432098207655, "loss": 0.0612, "step": 57880 }, { "epoch": 0.37, "learning_rate": 0.00024395463962771963, "loss": 0.0611, "step": 57890 }, { "epoch": 0.37, "learning_rate": 0.00024394495827336271, "loss": 0.0531, "step": 57900 }, { "epoch": 0.37, "learning_rate": 0.0002439352769190058, "loss": 0.0552, "step": 57910 }, { "epoch": 0.37, "learning_rate": 0.00024392559556464882, "loss": 0.0553, "step": 57920 }, { "epoch": 0.37, "learning_rate": 0.0002439159142102919, "loss": 0.056, "step": 57930 }, { "epoch": 0.37, "learning_rate": 0.00024390623285593498, "loss": 0.0637, "step": 57940 }, { "epoch": 0.37, "learning_rate": 0.00024389655150157803, "loss": 0.0628, "step": 57950 }, { "epoch": 0.37, "learning_rate": 0.0002438868701472211, "loss": 0.0542, "step": 57960 }, { "epoch": 0.37, "learning_rate": 0.0002438771887928642, "loss": 0.0644, "step": 57970 }, { "epoch": 0.37, "learning_rate": 0.00024386750743850727, "loss": 0.073, "step": 57980 }, { "epoch": 0.37, "learning_rate": 0.0002438578260841503, "loss": 0.0717, "step": 57990 }, { "epoch": 0.37, "learning_rate": 0.00024384814472979338, "loss": 0.0707, "step": 58000 }, { "epoch": 0.37, "eval_cer": 0.9200162693480962, "eval_loss": 0.03994331881403923, "eval_runtime": 120.3621, "eval_samples_per_second": 16.617, "eval_steps_per_second": 4.154, "step": 58000 }, { "epoch": 0.37, "learning_rate": 0.00024383846337543646, "loss": 0.0753, "step": 58010 }, { "epoch": 0.37, "learning_rate": 0.0002438287820210795, "loss": 0.0633, "step": 58020 }, { "epoch": 0.37, "learning_rate": 0.0002438191006667226, "loss": 0.0555, "step": 58030 }, { "epoch": 0.37, "learning_rate": 0.00024380941931236567, "loss": 0.0604, "step": 58040 }, { "epoch": 0.37, "learning_rate": 0.00024379973795800872, "loss": 0.0606, "step": 58050 }, { "epoch": 0.37, "learning_rate": 0.00024379005660365177, "loss": 0.0616, "step": 58060 }, { "epoch": 0.37, "learning_rate": 0.00024378037524929485, "loss": 0.1009, "step": 58070 }, { "epoch": 0.37, "learning_rate": 0.0002437706938949379, "loss": 0.0569, "step": 58080 }, { "epoch": 0.37, "learning_rate": 0.00024376101254058099, "loss": 0.0587, "step": 58090 }, { "epoch": 0.37, "learning_rate": 0.00024375133118622407, "loss": 0.0677, "step": 58100 }, { "epoch": 0.38, "learning_rate": 0.00024374164983186715, "loss": 0.0568, "step": 58110 }, { "epoch": 0.38, "learning_rate": 0.0002437319684775102, "loss": 0.058, "step": 58120 }, { "epoch": 0.38, "learning_rate": 0.00024372228712315325, "loss": 0.0567, "step": 58130 }, { "epoch": 0.38, "learning_rate": 0.00024371260576879633, "loss": 0.0575, "step": 58140 }, { "epoch": 0.38, "learning_rate": 0.00024370292441443938, "loss": 0.0636, "step": 58150 }, { "epoch": 0.38, "learning_rate": 0.00024369324306008246, "loss": 0.061, "step": 58160 }, { "epoch": 0.38, "learning_rate": 0.00024368356170572554, "loss": 0.0598, "step": 58170 }, { "epoch": 0.38, "learning_rate": 0.00024367388035136862, "loss": 0.0589, "step": 58180 }, { "epoch": 0.38, "learning_rate": 0.00024366419899701168, "loss": 0.0613, "step": 58190 }, { "epoch": 0.38, "learning_rate": 0.00024365451764265473, "loss": 0.0575, "step": 58200 }, { "epoch": 0.38, "learning_rate": 0.0002436448362882978, "loss": 0.0642, "step": 58210 }, { "epoch": 0.38, "learning_rate": 0.00024363515493394086, "loss": 0.0595, "step": 58220 }, { "epoch": 0.38, "learning_rate": 0.00024362547357958394, "loss": 0.0671, "step": 58230 }, { "epoch": 0.38, "learning_rate": 0.00024361579222522702, "loss": 0.0629, "step": 58240 }, { "epoch": 0.38, "learning_rate": 0.00024360611087087007, "loss": 0.0625, "step": 58250 }, { "epoch": 0.38, "learning_rate": 0.00024359642951651315, "loss": 0.0604, "step": 58260 }, { "epoch": 0.38, "learning_rate": 0.0002435867481621562, "loss": 0.0595, "step": 58270 }, { "epoch": 0.38, "learning_rate": 0.00024357706680779926, "loss": 0.0586, "step": 58280 }, { "epoch": 0.38, "learning_rate": 0.00024356738545344234, "loss": 0.0593, "step": 58290 }, { "epoch": 0.38, "learning_rate": 0.00024355770409908542, "loss": 0.0594, "step": 58300 }, { "epoch": 0.38, "learning_rate": 0.0002435480227447285, "loss": 0.0622, "step": 58310 }, { "epoch": 0.38, "learning_rate": 0.00024353834139037155, "loss": 0.0658, "step": 58320 }, { "epoch": 0.38, "learning_rate": 0.00024352866003601463, "loss": 0.0674, "step": 58330 }, { "epoch": 0.38, "learning_rate": 0.00024351897868165768, "loss": 0.0639, "step": 58340 }, { "epoch": 0.38, "learning_rate": 0.00024350929732730074, "loss": 0.0715, "step": 58350 }, { "epoch": 0.38, "learning_rate": 0.00024349961597294382, "loss": 0.0642, "step": 58360 }, { "epoch": 0.38, "learning_rate": 0.0002434899346185869, "loss": 0.0567, "step": 58370 }, { "epoch": 0.38, "learning_rate": 0.00024348025326422997, "loss": 0.0582, "step": 58380 }, { "epoch": 0.38, "learning_rate": 0.00024347057190987303, "loss": 0.0615, "step": 58390 }, { "epoch": 0.38, "learning_rate": 0.0002434608905555161, "loss": 0.0578, "step": 58400 }, { "epoch": 0.38, "learning_rate": 0.00024345120920115916, "loss": 0.0655, "step": 58410 }, { "epoch": 0.38, "learning_rate": 0.0002434415278468022, "loss": 0.0636, "step": 58420 }, { "epoch": 0.38, "learning_rate": 0.0002434318464924453, "loss": 0.0593, "step": 58430 }, { "epoch": 0.38, "learning_rate": 0.00024342216513808837, "loss": 0.0599, "step": 58440 }, { "epoch": 0.38, "learning_rate": 0.00024341248378373143, "loss": 0.0664, "step": 58450 }, { "epoch": 0.38, "learning_rate": 0.0002434028024293745, "loss": 0.061, "step": 58460 }, { "epoch": 0.38, "learning_rate": 0.00024339312107501758, "loss": 0.0655, "step": 58470 }, { "epoch": 0.38, "learning_rate": 0.0002433834397206606, "loss": 0.0548, "step": 58480 }, { "epoch": 0.38, "learning_rate": 0.0002433737583663037, "loss": 0.0562, "step": 58490 }, { "epoch": 0.38, "learning_rate": 0.00024336407701194677, "loss": 0.0614, "step": 58500 }, { "epoch": 0.38, "learning_rate": 0.00024335439565758985, "loss": 0.0532, "step": 58510 }, { "epoch": 0.38, "learning_rate": 0.0002433447143032329, "loss": 0.0575, "step": 58520 }, { "epoch": 0.38, "learning_rate": 0.00024333503294887598, "loss": 0.0609, "step": 58530 }, { "epoch": 0.38, "learning_rate": 0.00024332535159451903, "loss": 0.0589, "step": 58540 }, { "epoch": 0.38, "learning_rate": 0.0002433156702401621, "loss": 0.0548, "step": 58550 }, { "epoch": 0.38, "learning_rate": 0.00024330598888580517, "loss": 0.0595, "step": 58560 }, { "epoch": 0.38, "learning_rate": 0.00024329630753144825, "loss": 0.0558, "step": 58570 }, { "epoch": 0.38, "learning_rate": 0.00024328662617709133, "loss": 0.0575, "step": 58580 }, { "epoch": 0.38, "learning_rate": 0.00024327694482273438, "loss": 0.0591, "step": 58590 }, { "epoch": 0.38, "learning_rate": 0.00024326726346837746, "loss": 0.0615, "step": 58600 }, { "epoch": 0.38, "learning_rate": 0.0002432575821140205, "loss": 0.0579, "step": 58610 }, { "epoch": 0.38, "learning_rate": 0.00024324790075966356, "loss": 0.0632, "step": 58620 }, { "epoch": 0.38, "learning_rate": 0.00024323821940530664, "loss": 0.0678, "step": 58630 }, { "epoch": 0.38, "learning_rate": 0.00024322853805094972, "loss": 0.0508, "step": 58640 }, { "epoch": 0.38, "learning_rate": 0.00024321885669659278, "loss": 0.0626, "step": 58650 }, { "epoch": 0.38, "learning_rate": 0.00024320917534223586, "loss": 0.0605, "step": 58660 }, { "epoch": 0.38, "learning_rate": 0.00024319949398787894, "loss": 0.0625, "step": 58670 }, { "epoch": 0.38, "learning_rate": 0.00024318981263352196, "loss": 0.0578, "step": 58680 }, { "epoch": 0.38, "learning_rate": 0.00024318013127916504, "loss": 0.0596, "step": 58690 }, { "epoch": 0.38, "learning_rate": 0.00024317044992480812, "loss": 0.0596, "step": 58700 }, { "epoch": 0.38, "learning_rate": 0.0002431607685704512, "loss": 0.062, "step": 58710 }, { "epoch": 0.38, "learning_rate": 0.00024315108721609425, "loss": 0.0626, "step": 58720 }, { "epoch": 0.38, "learning_rate": 0.00024314140586173733, "loss": 0.0563, "step": 58730 }, { "epoch": 0.38, "learning_rate": 0.00024313172450738041, "loss": 0.0637, "step": 58740 }, { "epoch": 0.38, "learning_rate": 0.00024312204315302344, "loss": 0.0693, "step": 58750 }, { "epoch": 0.38, "learning_rate": 0.00024311236179866652, "loss": 0.0618, "step": 58760 }, { "epoch": 0.38, "learning_rate": 0.0002431026804443096, "loss": 0.0599, "step": 58770 }, { "epoch": 0.38, "learning_rate": 0.00024309299908995268, "loss": 0.0575, "step": 58780 }, { "epoch": 0.38, "learning_rate": 0.00024308331773559573, "loss": 0.0516, "step": 58790 }, { "epoch": 0.38, "learning_rate": 0.0002430736363812388, "loss": 0.0634, "step": 58800 }, { "epoch": 0.38, "learning_rate": 0.0002430639550268819, "loss": 0.0554, "step": 58810 }, { "epoch": 0.38, "learning_rate": 0.00024305427367252492, "loss": 0.0603, "step": 58820 }, { "epoch": 0.38, "learning_rate": 0.000243044592318168, "loss": 0.0613, "step": 58830 }, { "epoch": 0.38, "learning_rate": 0.00024303491096381108, "loss": 0.062, "step": 58840 }, { "epoch": 0.38, "learning_rate": 0.00024302522960945413, "loss": 0.0578, "step": 58850 }, { "epoch": 0.38, "learning_rate": 0.0002430155482550972, "loss": 0.0655, "step": 58860 }, { "epoch": 0.38, "learning_rate": 0.0002430058669007403, "loss": 0.0651, "step": 58870 }, { "epoch": 0.38, "learning_rate": 0.00024299618554638337, "loss": 0.064, "step": 58880 }, { "epoch": 0.38, "learning_rate": 0.0002429865041920264, "loss": 0.0584, "step": 58890 }, { "epoch": 0.38, "learning_rate": 0.00024297682283766947, "loss": 0.0593, "step": 58900 }, { "epoch": 0.38, "learning_rate": 0.00024296714148331255, "loss": 0.0522, "step": 58910 }, { "epoch": 0.38, "learning_rate": 0.0002429574601289556, "loss": 0.0588, "step": 58920 }, { "epoch": 0.38, "learning_rate": 0.00024294777877459869, "loss": 0.0638, "step": 58930 }, { "epoch": 0.38, "learning_rate": 0.00024293809742024177, "loss": 0.0602, "step": 58940 }, { "epoch": 0.38, "learning_rate": 0.00024292841606588485, "loss": 0.0558, "step": 58950 }, { "epoch": 0.38, "learning_rate": 0.00024291873471152787, "loss": 0.0597, "step": 58960 }, { "epoch": 0.38, "learning_rate": 0.00024290905335717095, "loss": 0.0538, "step": 58970 }, { "epoch": 0.38, "learning_rate": 0.00024289937200281403, "loss": 0.0572, "step": 58980 }, { "epoch": 0.38, "learning_rate": 0.00024288969064845708, "loss": 0.0677, "step": 58990 }, { "epoch": 0.38, "learning_rate": 0.00024288000929410016, "loss": 0.0628, "step": 59000 }, { "epoch": 0.38, "eval_cer": 0.9200515196023048, "eval_loss": 0.04011645168066025, "eval_runtime": 120.0848, "eval_samples_per_second": 16.655, "eval_steps_per_second": 4.164, "step": 59000 }, { "epoch": 0.38, "learning_rate": 0.00024287032793974324, "loss": 0.0547, "step": 59010 }, { "epoch": 0.38, "learning_rate": 0.00024286064658538632, "loss": 0.0595, "step": 59020 }, { "epoch": 0.38, "learning_rate": 0.00024285096523102935, "loss": 0.0618, "step": 59030 }, { "epoch": 0.38, "learning_rate": 0.00024284128387667243, "loss": 0.0574, "step": 59040 }, { "epoch": 0.38, "learning_rate": 0.00024283160252231548, "loss": 0.0639, "step": 59050 }, { "epoch": 0.38, "learning_rate": 0.00024282192116795856, "loss": 0.0611, "step": 59060 }, { "epoch": 0.38, "learning_rate": 0.00024281223981360164, "loss": 0.056, "step": 59070 }, { "epoch": 0.38, "learning_rate": 0.00024280255845924472, "loss": 0.0568, "step": 59080 }, { "epoch": 0.38, "learning_rate": 0.00024279287710488777, "loss": 0.0539, "step": 59090 }, { "epoch": 0.38, "learning_rate": 0.00024278319575053083, "loss": 0.0547, "step": 59100 }, { "epoch": 0.38, "learning_rate": 0.0002427735143961739, "loss": 0.0584, "step": 59110 }, { "epoch": 0.38, "learning_rate": 0.00024276383304181696, "loss": 0.0609, "step": 59120 }, { "epoch": 0.38, "learning_rate": 0.00024275415168746004, "loss": 0.0546, "step": 59130 }, { "epoch": 0.38, "learning_rate": 0.00024274447033310312, "loss": 0.0596, "step": 59140 }, { "epoch": 0.38, "learning_rate": 0.0002427347889787462, "loss": 0.0644, "step": 59150 }, { "epoch": 0.38, "learning_rate": 0.00024272510762438925, "loss": 0.0606, "step": 59160 }, { "epoch": 0.38, "learning_rate": 0.0002427154262700323, "loss": 0.0571, "step": 59170 }, { "epoch": 0.38, "learning_rate": 0.00024270574491567538, "loss": 0.0617, "step": 59180 }, { "epoch": 0.38, "learning_rate": 0.00024269606356131844, "loss": 0.0602, "step": 59190 }, { "epoch": 0.38, "learning_rate": 0.00024268638220696151, "loss": 0.0628, "step": 59200 }, { "epoch": 0.38, "learning_rate": 0.0002426767008526046, "loss": 0.0521, "step": 59210 }, { "epoch": 0.38, "learning_rate": 0.00024266701949824767, "loss": 0.0593, "step": 59220 }, { "epoch": 0.38, "learning_rate": 0.00024265733814389073, "loss": 0.0647, "step": 59230 }, { "epoch": 0.38, "learning_rate": 0.00024264765678953378, "loss": 0.0756, "step": 59240 }, { "epoch": 0.38, "learning_rate": 0.00024263797543517683, "loss": 0.0608, "step": 59250 }, { "epoch": 0.38, "learning_rate": 0.0002426282940808199, "loss": 0.0545, "step": 59260 }, { "epoch": 0.38, "learning_rate": 0.000242618612726463, "loss": 0.0574, "step": 59270 }, { "epoch": 0.38, "learning_rate": 0.00024260893137210607, "loss": 0.0571, "step": 59280 }, { "epoch": 0.38, "learning_rate": 0.00024259925001774912, "loss": 0.0587, "step": 59290 }, { "epoch": 0.38, "learning_rate": 0.0002425895686633922, "loss": 0.0512, "step": 59300 }, { "epoch": 0.38, "learning_rate": 0.00024257988730903526, "loss": 0.0593, "step": 59310 }, { "epoch": 0.38, "learning_rate": 0.0002425702059546783, "loss": 0.0621, "step": 59320 }, { "epoch": 0.38, "learning_rate": 0.0002425605246003214, "loss": 0.0572, "step": 59330 }, { "epoch": 0.38, "learning_rate": 0.00024255084324596447, "loss": 0.0654, "step": 59340 }, { "epoch": 0.38, "learning_rate": 0.00024254116189160755, "loss": 0.0541, "step": 59350 }, { "epoch": 0.38, "learning_rate": 0.0002425314805372506, "loss": 0.0627, "step": 59360 }, { "epoch": 0.38, "learning_rate": 0.00024252179918289368, "loss": 0.0572, "step": 59370 }, { "epoch": 0.38, "learning_rate": 0.00024251211782853673, "loss": 0.0545, "step": 59380 }, { "epoch": 0.38, "learning_rate": 0.0002425024364741798, "loss": 0.0626, "step": 59390 }, { "epoch": 0.38, "learning_rate": 0.00024249275511982287, "loss": 0.0613, "step": 59400 }, { "epoch": 0.38, "learning_rate": 0.00024248307376546595, "loss": 0.054, "step": 59410 }, { "epoch": 0.38, "learning_rate": 0.00024247339241110903, "loss": 0.0632, "step": 59420 }, { "epoch": 0.38, "learning_rate": 0.00024246371105675208, "loss": 0.0639, "step": 59430 }, { "epoch": 0.38, "learning_rate": 0.00024245402970239516, "loss": 0.0654, "step": 59440 }, { "epoch": 0.38, "learning_rate": 0.00024244434834803818, "loss": 0.0637, "step": 59450 }, { "epoch": 0.38, "learning_rate": 0.00024243466699368126, "loss": 0.0624, "step": 59460 }, { "epoch": 0.38, "learning_rate": 0.00024242498563932434, "loss": 0.0615, "step": 59470 }, { "epoch": 0.38, "learning_rate": 0.00024241530428496742, "loss": 0.0537, "step": 59480 }, { "epoch": 0.38, "learning_rate": 0.00024240562293061048, "loss": 0.0662, "step": 59490 }, { "epoch": 0.38, "learning_rate": 0.00024239594157625356, "loss": 0.0689, "step": 59500 }, { "epoch": 0.38, "learning_rate": 0.00024238626022189664, "loss": 0.0605, "step": 59510 }, { "epoch": 0.38, "learning_rate": 0.00024237657886753966, "loss": 0.0552, "step": 59520 }, { "epoch": 0.38, "learning_rate": 0.00024236689751318274, "loss": 0.0607, "step": 59530 }, { "epoch": 0.38, "learning_rate": 0.00024235721615882582, "loss": 0.0588, "step": 59540 }, { "epoch": 0.38, "learning_rate": 0.0002423475348044689, "loss": 0.0583, "step": 59550 }, { "epoch": 0.38, "learning_rate": 0.00024233785345011195, "loss": 0.0572, "step": 59560 }, { "epoch": 0.38, "learning_rate": 0.00024232817209575503, "loss": 0.0547, "step": 59570 }, { "epoch": 0.38, "learning_rate": 0.0002423184907413981, "loss": 0.06, "step": 59580 }, { "epoch": 0.38, "learning_rate": 0.00024230880938704114, "loss": 0.0599, "step": 59590 }, { "epoch": 0.38, "learning_rate": 0.00024229912803268422, "loss": 0.0667, "step": 59600 }, { "epoch": 0.38, "learning_rate": 0.0002422894466783273, "loss": 0.0615, "step": 59610 }, { "epoch": 0.38, "learning_rate": 0.00024227976532397038, "loss": 0.0682, "step": 59620 }, { "epoch": 0.38, "learning_rate": 0.00024227008396961343, "loss": 0.059, "step": 59630 }, { "epoch": 0.38, "learning_rate": 0.0002422604026152565, "loss": 0.0648, "step": 59640 }, { "epoch": 0.38, "learning_rate": 0.0002422507212608996, "loss": 0.0607, "step": 59650 }, { "epoch": 0.39, "learning_rate": 0.00024224103990654262, "loss": 0.0555, "step": 59660 }, { "epoch": 0.39, "learning_rate": 0.0002422313585521857, "loss": 0.0624, "step": 59670 }, { "epoch": 0.39, "learning_rate": 0.00024222167719782878, "loss": 0.0641, "step": 59680 }, { "epoch": 0.39, "learning_rate": 0.00024221199584347183, "loss": 0.06, "step": 59690 }, { "epoch": 0.39, "learning_rate": 0.0002422023144891149, "loss": 0.0601, "step": 59700 }, { "epoch": 0.39, "learning_rate": 0.000242192633134758, "loss": 0.0696, "step": 59710 }, { "epoch": 0.39, "learning_rate": 0.00024218295178040107, "loss": 0.0556, "step": 59720 }, { "epoch": 0.39, "learning_rate": 0.0002421732704260441, "loss": 0.0567, "step": 59730 }, { "epoch": 0.39, "learning_rate": 0.00024216358907168717, "loss": 0.0634, "step": 59740 }, { "epoch": 0.39, "learning_rate": 0.00024215390771733025, "loss": 0.0606, "step": 59750 }, { "epoch": 0.39, "learning_rate": 0.0002421442263629733, "loss": 0.0603, "step": 59760 }, { "epoch": 0.39, "learning_rate": 0.00024213454500861639, "loss": 0.0604, "step": 59770 }, { "epoch": 0.39, "learning_rate": 0.00024212486365425947, "loss": 0.0545, "step": 59780 }, { "epoch": 0.39, "learning_rate": 0.00024211518229990255, "loss": 0.0556, "step": 59790 }, { "epoch": 0.39, "learning_rate": 0.00024210550094554557, "loss": 0.0618, "step": 59800 }, { "epoch": 0.39, "learning_rate": 0.00024209581959118865, "loss": 0.0553, "step": 59810 }, { "epoch": 0.39, "learning_rate": 0.00024208613823683173, "loss": 0.0602, "step": 59820 }, { "epoch": 0.39, "learning_rate": 0.00024207645688247478, "loss": 0.0591, "step": 59830 }, { "epoch": 0.39, "learning_rate": 0.00024206677552811786, "loss": 0.0573, "step": 59840 }, { "epoch": 0.39, "learning_rate": 0.00024205709417376094, "loss": 0.0502, "step": 59850 }, { "epoch": 0.39, "learning_rate": 0.000242047412819404, "loss": 0.061, "step": 59860 }, { "epoch": 0.39, "learning_rate": 0.00024203773146504705, "loss": 0.0576, "step": 59870 }, { "epoch": 0.39, "learning_rate": 0.00024202805011069013, "loss": 0.0584, "step": 59880 }, { "epoch": 0.39, "learning_rate": 0.00024201836875633318, "loss": 0.0589, "step": 59890 }, { "epoch": 0.39, "learning_rate": 0.00024200868740197626, "loss": 0.0568, "step": 59900 }, { "epoch": 0.39, "learning_rate": 0.00024199900604761934, "loss": 0.0539, "step": 59910 }, { "epoch": 0.39, "learning_rate": 0.00024198932469326242, "loss": 0.0652, "step": 59920 }, { "epoch": 0.39, "learning_rate": 0.00024197964333890547, "loss": 0.0606, "step": 59930 }, { "epoch": 0.39, "learning_rate": 0.00024196996198454853, "loss": 0.0568, "step": 59940 }, { "epoch": 0.39, "learning_rate": 0.0002419602806301916, "loss": 0.0626, "step": 59950 }, { "epoch": 0.39, "learning_rate": 0.00024195059927583466, "loss": 0.0606, "step": 59960 }, { "epoch": 0.39, "learning_rate": 0.00024194091792147774, "loss": 0.0511, "step": 59970 }, { "epoch": 0.39, "learning_rate": 0.00024193123656712082, "loss": 0.07, "step": 59980 }, { "epoch": 0.39, "learning_rate": 0.0002419215552127639, "loss": 0.0555, "step": 59990 }, { "epoch": 0.39, "learning_rate": 0.00024191187385840695, "loss": 0.0586, "step": 60000 }, { "epoch": 0.39, "eval_cer": 0.9201012314992656, "eval_loss": 0.03904225304722786, "eval_runtime": 119.7689, "eval_samples_per_second": 16.699, "eval_steps_per_second": 4.175, "step": 60000 }, { "epoch": 0.39, "learning_rate": 0.00024190219250405, "loss": 0.0602, "step": 60010 }, { "epoch": 0.39, "learning_rate": 0.00024189251114969308, "loss": 0.0578, "step": 60020 }, { "epoch": 0.39, "learning_rate": 0.00024188282979533613, "loss": 0.0669, "step": 60030 }, { "epoch": 0.39, "learning_rate": 0.00024187314844097921, "loss": 0.0637, "step": 60040 }, { "epoch": 0.39, "learning_rate": 0.0002418634670866223, "loss": 0.0608, "step": 60050 }, { "epoch": 0.39, "learning_rate": 0.00024185378573226535, "loss": 0.0574, "step": 60060 }, { "epoch": 0.39, "learning_rate": 0.00024184410437790843, "loss": 0.057, "step": 60070 }, { "epoch": 0.39, "learning_rate": 0.00024183442302355148, "loss": 0.055, "step": 60080 }, { "epoch": 0.39, "learning_rate": 0.00024182474166919453, "loss": 0.0623, "step": 60090 }, { "epoch": 0.39, "learning_rate": 0.0002418150603148376, "loss": 0.062, "step": 60100 }, { "epoch": 0.39, "learning_rate": 0.0002418053789604807, "loss": 0.0582, "step": 60110 }, { "epoch": 0.39, "learning_rate": 0.00024179569760612377, "loss": 0.0612, "step": 60120 }, { "epoch": 0.39, "learning_rate": 0.00024178601625176682, "loss": 0.06, "step": 60130 }, { "epoch": 0.39, "learning_rate": 0.0002417763348974099, "loss": 0.0606, "step": 60140 }, { "epoch": 0.39, "learning_rate": 0.00024176665354305296, "loss": 0.0652, "step": 60150 }, { "epoch": 0.39, "learning_rate": 0.000241756972188696, "loss": 0.0615, "step": 60160 }, { "epoch": 0.39, "learning_rate": 0.0002417472908343391, "loss": 0.0696, "step": 60170 }, { "epoch": 0.39, "learning_rate": 0.00024173760947998217, "loss": 0.0643, "step": 60180 }, { "epoch": 0.39, "learning_rate": 0.00024172792812562525, "loss": 0.0618, "step": 60190 }, { "epoch": 0.39, "learning_rate": 0.0002417182467712683, "loss": 0.058, "step": 60200 }, { "epoch": 0.39, "learning_rate": 0.00024170856541691138, "loss": 0.056, "step": 60210 }, { "epoch": 0.39, "learning_rate": 0.00024169888406255443, "loss": 0.0645, "step": 60220 }, { "epoch": 0.39, "learning_rate": 0.0002416892027081975, "loss": 0.057, "step": 60230 }, { "epoch": 0.39, "learning_rate": 0.00024167952135384057, "loss": 0.0576, "step": 60240 }, { "epoch": 0.39, "learning_rate": 0.00024166983999948365, "loss": 0.0641, "step": 60250 }, { "epoch": 0.39, "learning_rate": 0.0002416601586451267, "loss": 0.0621, "step": 60260 }, { "epoch": 0.39, "learning_rate": 0.00024165047729076978, "loss": 0.0567, "step": 60270 }, { "epoch": 0.39, "learning_rate": 0.00024164079593641286, "loss": 0.0608, "step": 60280 }, { "epoch": 0.39, "learning_rate": 0.00024163111458205588, "loss": 0.0528, "step": 60290 }, { "epoch": 0.39, "learning_rate": 0.00024162143322769896, "loss": 0.0605, "step": 60300 }, { "epoch": 0.39, "learning_rate": 0.00024161175187334204, "loss": 0.0495, "step": 60310 }, { "epoch": 0.39, "learning_rate": 0.00024160207051898512, "loss": 0.0671, "step": 60320 }, { "epoch": 0.39, "learning_rate": 0.00024159238916462818, "loss": 0.0568, "step": 60330 }, { "epoch": 0.39, "learning_rate": 0.00024158270781027126, "loss": 0.0628, "step": 60340 }, { "epoch": 0.39, "learning_rate": 0.00024157302645591434, "loss": 0.061, "step": 60350 }, { "epoch": 0.39, "learning_rate": 0.00024156334510155736, "loss": 0.0555, "step": 60360 }, { "epoch": 0.39, "learning_rate": 0.00024155366374720044, "loss": 0.0602, "step": 60370 }, { "epoch": 0.39, "learning_rate": 0.00024154398239284352, "loss": 0.0611, "step": 60380 }, { "epoch": 0.39, "learning_rate": 0.0002415343010384866, "loss": 0.0561, "step": 60390 }, { "epoch": 0.39, "learning_rate": 0.00024152461968412965, "loss": 0.0536, "step": 60400 }, { "epoch": 0.39, "learning_rate": 0.00024151493832977273, "loss": 0.0591, "step": 60410 }, { "epoch": 0.39, "learning_rate": 0.0002415052569754158, "loss": 0.0562, "step": 60420 }, { "epoch": 0.39, "learning_rate": 0.00024149557562105884, "loss": 0.0567, "step": 60430 }, { "epoch": 0.39, "learning_rate": 0.00024148589426670192, "loss": 0.0568, "step": 60440 }, { "epoch": 0.39, "learning_rate": 0.000241476212912345, "loss": 0.0622, "step": 60450 }, { "epoch": 0.39, "learning_rate": 0.00024146653155798805, "loss": 0.0552, "step": 60460 }, { "epoch": 0.39, "learning_rate": 0.00024145685020363113, "loss": 0.0593, "step": 60470 }, { "epoch": 0.39, "learning_rate": 0.0002414471688492742, "loss": 0.0582, "step": 60480 }, { "epoch": 0.39, "learning_rate": 0.0002414374874949173, "loss": 0.0759, "step": 60490 }, { "epoch": 0.39, "learning_rate": 0.00024142780614056032, "loss": 0.0568, "step": 60500 }, { "epoch": 0.39, "learning_rate": 0.0002414181247862034, "loss": 0.0502, "step": 60510 }, { "epoch": 0.39, "learning_rate": 0.00024140844343184648, "loss": 0.0672, "step": 60520 }, { "epoch": 0.39, "learning_rate": 0.00024139876207748953, "loss": 0.0583, "step": 60530 }, { "epoch": 0.39, "learning_rate": 0.0002413890807231326, "loss": 0.061, "step": 60540 }, { "epoch": 0.39, "learning_rate": 0.0002413793993687757, "loss": 0.0552, "step": 60550 }, { "epoch": 0.39, "learning_rate": 0.00024136971801441877, "loss": 0.0533, "step": 60560 }, { "epoch": 0.39, "learning_rate": 0.0002413600366600618, "loss": 0.0574, "step": 60570 }, { "epoch": 0.39, "learning_rate": 0.00024135035530570487, "loss": 0.0675, "step": 60580 }, { "epoch": 0.39, "learning_rate": 0.00024134067395134795, "loss": 0.0604, "step": 60590 }, { "epoch": 0.39, "learning_rate": 0.000241330992596991, "loss": 0.0695, "step": 60600 }, { "epoch": 0.39, "learning_rate": 0.00024132131124263409, "loss": 0.058, "step": 60610 }, { "epoch": 0.39, "learning_rate": 0.00024131162988827716, "loss": 0.0591, "step": 60620 }, { "epoch": 0.39, "learning_rate": 0.00024130194853392022, "loss": 0.0608, "step": 60630 }, { "epoch": 0.39, "learning_rate": 0.00024129226717956327, "loss": 0.0683, "step": 60640 }, { "epoch": 0.39, "learning_rate": 0.00024128258582520635, "loss": 0.0597, "step": 60650 }, { "epoch": 0.39, "learning_rate": 0.0002412729044708494, "loss": 0.0578, "step": 60660 }, { "epoch": 0.39, "learning_rate": 0.00024126322311649248, "loss": 0.0652, "step": 60670 }, { "epoch": 0.39, "learning_rate": 0.00024125354176213556, "loss": 0.0619, "step": 60680 }, { "epoch": 0.39, "learning_rate": 0.00024124386040777864, "loss": 0.0606, "step": 60690 }, { "epoch": 0.39, "learning_rate": 0.0002412341790534217, "loss": 0.0578, "step": 60700 }, { "epoch": 0.39, "learning_rate": 0.00024122449769906475, "loss": 0.0555, "step": 60710 }, { "epoch": 0.39, "learning_rate": 0.00024121481634470783, "loss": 0.0653, "step": 60720 }, { "epoch": 0.39, "learning_rate": 0.00024120513499035088, "loss": 0.0637, "step": 60730 }, { "epoch": 0.39, "learning_rate": 0.00024119545363599396, "loss": 0.0625, "step": 60740 }, { "epoch": 0.39, "learning_rate": 0.00024118577228163704, "loss": 0.0577, "step": 60750 }, { "epoch": 0.39, "learning_rate": 0.00024117609092728012, "loss": 0.0727, "step": 60760 }, { "epoch": 0.39, "learning_rate": 0.00024116640957292317, "loss": 0.0565, "step": 60770 }, { "epoch": 0.39, "learning_rate": 0.00024115672821856622, "loss": 0.0632, "step": 60780 }, { "epoch": 0.39, "learning_rate": 0.0002411470468642093, "loss": 0.0582, "step": 60790 }, { "epoch": 0.39, "learning_rate": 0.00024113736550985236, "loss": 0.0575, "step": 60800 }, { "epoch": 0.39, "learning_rate": 0.00024112768415549544, "loss": 0.0568, "step": 60810 }, { "epoch": 0.39, "learning_rate": 0.00024111800280113852, "loss": 0.0592, "step": 60820 }, { "epoch": 0.39, "learning_rate": 0.00024110832144678157, "loss": 0.0622, "step": 60830 }, { "epoch": 0.39, "learning_rate": 0.00024109864009242465, "loss": 0.063, "step": 60840 }, { "epoch": 0.39, "learning_rate": 0.0002410889587380677, "loss": 0.0631, "step": 60850 }, { "epoch": 0.39, "learning_rate": 0.00024107927738371075, "loss": 0.0696, "step": 60860 }, { "epoch": 0.39, "learning_rate": 0.00024106959602935383, "loss": 0.0633, "step": 60870 }, { "epoch": 0.39, "learning_rate": 0.00024105991467499691, "loss": 0.0572, "step": 60880 }, { "epoch": 0.39, "learning_rate": 0.00024105023332064, "loss": 0.055, "step": 60890 }, { "epoch": 0.39, "learning_rate": 0.00024104055196628305, "loss": 0.0616, "step": 60900 }, { "epoch": 0.39, "learning_rate": 0.00024103087061192613, "loss": 0.0654, "step": 60910 }, { "epoch": 0.39, "learning_rate": 0.00024102118925756918, "loss": 0.0536, "step": 60920 }, { "epoch": 0.39, "learning_rate": 0.00024101150790321223, "loss": 0.0623, "step": 60930 }, { "epoch": 0.39, "learning_rate": 0.0002410018265488553, "loss": 0.0638, "step": 60940 }, { "epoch": 0.39, "learning_rate": 0.0002409921451944984, "loss": 0.0702, "step": 60950 }, { "epoch": 0.39, "learning_rate": 0.00024098246384014147, "loss": 0.0557, "step": 60960 }, { "epoch": 0.39, "learning_rate": 0.00024097278248578452, "loss": 0.0611, "step": 60970 }, { "epoch": 0.39, "learning_rate": 0.0002409631011314276, "loss": 0.054, "step": 60980 }, { "epoch": 0.39, "learning_rate": 0.00024095341977707066, "loss": 0.0588, "step": 60990 }, { "epoch": 0.39, "learning_rate": 0.0002409437384227137, "loss": 0.061, "step": 61000 }, { "epoch": 0.39, "eval_cer": 0.9199050954694384, "eval_loss": 0.04031915217638016, "eval_runtime": 120.1875, "eval_samples_per_second": 16.641, "eval_steps_per_second": 4.16, "step": 61000 }, { "epoch": 0.39, "learning_rate": 0.0002409340570683568, "loss": 0.0605, "step": 61010 }, { "epoch": 0.39, "learning_rate": 0.00024092437571399987, "loss": 0.0618, "step": 61020 }, { "epoch": 0.39, "learning_rate": 0.00024091469435964292, "loss": 0.0597, "step": 61030 }, { "epoch": 0.39, "learning_rate": 0.000240905013005286, "loss": 0.0598, "step": 61040 }, { "epoch": 0.39, "learning_rate": 0.00024089533165092908, "loss": 0.0537, "step": 61050 }, { "epoch": 0.39, "learning_rate": 0.0002408856502965721, "loss": 0.0683, "step": 61060 }, { "epoch": 0.39, "learning_rate": 0.00024087596894221519, "loss": 0.0549, "step": 61070 }, { "epoch": 0.39, "learning_rate": 0.00024086628758785827, "loss": 0.0547, "step": 61080 }, { "epoch": 0.39, "learning_rate": 0.00024085660623350135, "loss": 0.0639, "step": 61090 }, { "epoch": 0.39, "learning_rate": 0.0002408469248791444, "loss": 0.0611, "step": 61100 }, { "epoch": 0.39, "learning_rate": 0.00024083724352478748, "loss": 0.0512, "step": 61110 }, { "epoch": 0.39, "learning_rate": 0.00024082756217043056, "loss": 0.0644, "step": 61120 }, { "epoch": 0.39, "learning_rate": 0.00024081788081607358, "loss": 0.0568, "step": 61130 }, { "epoch": 0.39, "learning_rate": 0.00024080819946171666, "loss": 0.0684, "step": 61140 }, { "epoch": 0.39, "learning_rate": 0.00024079851810735974, "loss": 0.0577, "step": 61150 }, { "epoch": 0.39, "learning_rate": 0.00024078883675300282, "loss": 0.056, "step": 61160 }, { "epoch": 0.39, "learning_rate": 0.00024077915539864588, "loss": 0.0706, "step": 61170 }, { "epoch": 0.39, "learning_rate": 0.00024076947404428896, "loss": 0.0624, "step": 61180 }, { "epoch": 0.39, "learning_rate": 0.00024075979268993204, "loss": 0.0563, "step": 61190 }, { "epoch": 0.39, "learning_rate": 0.00024075011133557506, "loss": 0.0518, "step": 61200 }, { "epoch": 0.4, "learning_rate": 0.00024074042998121814, "loss": 0.0594, "step": 61210 }, { "epoch": 0.4, "learning_rate": 0.00024073074862686122, "loss": 0.0552, "step": 61220 }, { "epoch": 0.4, "learning_rate": 0.00024072106727250427, "loss": 0.0621, "step": 61230 }, { "epoch": 0.4, "learning_rate": 0.00024071138591814735, "loss": 0.06, "step": 61240 }, { "epoch": 0.4, "learning_rate": 0.00024070170456379043, "loss": 0.0638, "step": 61250 }, { "epoch": 0.4, "learning_rate": 0.0002406920232094335, "loss": 0.0628, "step": 61260 }, { "epoch": 0.4, "learning_rate": 0.00024068234185507654, "loss": 0.0559, "step": 61270 }, { "epoch": 0.4, "learning_rate": 0.00024067266050071962, "loss": 0.0561, "step": 61280 }, { "epoch": 0.4, "learning_rate": 0.0002406629791463627, "loss": 0.056, "step": 61290 }, { "epoch": 0.4, "learning_rate": 0.00024065329779200575, "loss": 0.0626, "step": 61300 }, { "epoch": 0.4, "learning_rate": 0.00024064361643764883, "loss": 0.0543, "step": 61310 }, { "epoch": 0.4, "learning_rate": 0.0002406339350832919, "loss": 0.0605, "step": 61320 }, { "epoch": 0.4, "learning_rate": 0.000240624253728935, "loss": 0.0576, "step": 61330 }, { "epoch": 0.4, "learning_rate": 0.00024061457237457802, "loss": 0.0565, "step": 61340 }, { "epoch": 0.4, "learning_rate": 0.0002406048910202211, "loss": 0.0588, "step": 61350 }, { "epoch": 0.4, "learning_rate": 0.00024059520966586417, "loss": 0.0626, "step": 61360 }, { "epoch": 0.4, "learning_rate": 0.00024058552831150723, "loss": 0.0559, "step": 61370 }, { "epoch": 0.4, "learning_rate": 0.0002405758469571503, "loss": 0.0582, "step": 61380 }, { "epoch": 0.4, "learning_rate": 0.0002405661656027934, "loss": 0.0562, "step": 61390 }, { "epoch": 0.4, "learning_rate": 0.00024055648424843647, "loss": 0.0564, "step": 61400 }, { "epoch": 0.4, "learning_rate": 0.0002405468028940795, "loss": 0.0624, "step": 61410 }, { "epoch": 0.4, "learning_rate": 0.00024053712153972257, "loss": 0.0638, "step": 61420 }, { "epoch": 0.4, "learning_rate": 0.00024052744018536563, "loss": 0.0533, "step": 61430 }, { "epoch": 0.4, "learning_rate": 0.0002405177588310087, "loss": 0.0535, "step": 61440 }, { "epoch": 0.4, "learning_rate": 0.00024050807747665178, "loss": 0.0554, "step": 61450 }, { "epoch": 0.4, "learning_rate": 0.00024049839612229486, "loss": 0.0582, "step": 61460 }, { "epoch": 0.4, "learning_rate": 0.00024048871476793792, "loss": 0.0579, "step": 61470 }, { "epoch": 0.4, "learning_rate": 0.00024047903341358097, "loss": 0.0584, "step": 61480 }, { "epoch": 0.4, "learning_rate": 0.00024046935205922405, "loss": 0.0603, "step": 61490 }, { "epoch": 0.4, "learning_rate": 0.0002404596707048671, "loss": 0.0674, "step": 61500 }, { "epoch": 0.4, "learning_rate": 0.00024044998935051018, "loss": 0.0553, "step": 61510 }, { "epoch": 0.4, "learning_rate": 0.00024044030799615326, "loss": 0.0551, "step": 61520 }, { "epoch": 0.4, "learning_rate": 0.00024043062664179634, "loss": 0.0523, "step": 61530 }, { "epoch": 0.4, "learning_rate": 0.0002404209452874394, "loss": 0.0559, "step": 61540 }, { "epoch": 0.4, "learning_rate": 0.00024041126393308245, "loss": 0.0612, "step": 61550 }, { "epoch": 0.4, "learning_rate": 0.00024040158257872553, "loss": 0.0535, "step": 61560 }, { "epoch": 0.4, "learning_rate": 0.00024039190122436858, "loss": 0.0541, "step": 61570 }, { "epoch": 0.4, "learning_rate": 0.00024038221987001166, "loss": 0.0669, "step": 61580 }, { "epoch": 0.4, "learning_rate": 0.00024037253851565474, "loss": 0.0569, "step": 61590 }, { "epoch": 0.4, "learning_rate": 0.00024036285716129782, "loss": 0.0591, "step": 61600 }, { "epoch": 0.4, "learning_rate": 0.00024035317580694087, "loss": 0.0619, "step": 61610 }, { "epoch": 0.4, "learning_rate": 0.00024034349445258392, "loss": 0.0677, "step": 61620 }, { "epoch": 0.4, "learning_rate": 0.00024033381309822698, "loss": 0.078, "step": 61630 }, { "epoch": 0.4, "learning_rate": 0.00024032413174387006, "loss": 0.0625, "step": 61640 }, { "epoch": 0.4, "learning_rate": 0.00024031445038951314, "loss": 0.0574, "step": 61650 }, { "epoch": 0.4, "learning_rate": 0.00024030476903515622, "loss": 0.0625, "step": 61660 }, { "epoch": 0.4, "learning_rate": 0.00024029508768079927, "loss": 0.0654, "step": 61670 }, { "epoch": 0.4, "learning_rate": 0.00024028540632644235, "loss": 0.0532, "step": 61680 }, { "epoch": 0.4, "learning_rate": 0.0002402757249720854, "loss": 0.067, "step": 61690 }, { "epoch": 0.4, "learning_rate": 0.00024026604361772845, "loss": 0.0661, "step": 61700 }, { "epoch": 0.4, "learning_rate": 0.00024025636226337153, "loss": 0.0584, "step": 61710 }, { "epoch": 0.4, "learning_rate": 0.00024024668090901461, "loss": 0.0538, "step": 61720 }, { "epoch": 0.4, "learning_rate": 0.0002402369995546577, "loss": 0.06, "step": 61730 }, { "epoch": 0.4, "learning_rate": 0.00024022731820030075, "loss": 0.0648, "step": 61740 }, { "epoch": 0.4, "learning_rate": 0.00024021763684594383, "loss": 0.0566, "step": 61750 }, { "epoch": 0.4, "learning_rate": 0.00024020795549158688, "loss": 0.0593, "step": 61760 }, { "epoch": 0.4, "learning_rate": 0.00024019827413722993, "loss": 0.0583, "step": 61770 }, { "epoch": 0.4, "learning_rate": 0.000240188592782873, "loss": 0.0584, "step": 61780 }, { "epoch": 0.4, "learning_rate": 0.0002401789114285161, "loss": 0.0558, "step": 61790 }, { "epoch": 0.4, "learning_rate": 0.00024016923007415917, "loss": 0.059, "step": 61800 }, { "epoch": 0.4, "learning_rate": 0.00024015954871980222, "loss": 0.0654, "step": 61810 }, { "epoch": 0.4, "learning_rate": 0.0002401498673654453, "loss": 0.0615, "step": 61820 }, { "epoch": 0.4, "learning_rate": 0.00024014018601108836, "loss": 0.066, "step": 61830 }, { "epoch": 0.4, "learning_rate": 0.0002401305046567314, "loss": 0.0557, "step": 61840 }, { "epoch": 0.4, "learning_rate": 0.0002401208233023745, "loss": 0.0554, "step": 61850 }, { "epoch": 0.4, "learning_rate": 0.00024011114194801757, "loss": 0.0631, "step": 61860 }, { "epoch": 0.4, "learning_rate": 0.00024010146059366062, "loss": 0.0586, "step": 61870 }, { "epoch": 0.4, "learning_rate": 0.0002400917792393037, "loss": 0.0587, "step": 61880 }, { "epoch": 0.4, "learning_rate": 0.00024008209788494678, "loss": 0.0642, "step": 61890 }, { "epoch": 0.4, "learning_rate": 0.0002400724165305898, "loss": 0.0592, "step": 61900 }, { "epoch": 0.4, "learning_rate": 0.00024006273517623289, "loss": 0.0583, "step": 61910 }, { "epoch": 0.4, "learning_rate": 0.00024005305382187597, "loss": 0.0622, "step": 61920 }, { "epoch": 0.4, "learning_rate": 0.00024004337246751905, "loss": 0.0634, "step": 61930 }, { "epoch": 0.4, "learning_rate": 0.0002400336911131621, "loss": 0.0665, "step": 61940 }, { "epoch": 0.4, "learning_rate": 0.00024002400975880518, "loss": 0.053, "step": 61950 }, { "epoch": 0.4, "learning_rate": 0.00024001432840444826, "loss": 0.0561, "step": 61960 }, { "epoch": 0.4, "learning_rate": 0.00024000464705009128, "loss": 0.0647, "step": 61970 }, { "epoch": 0.4, "learning_rate": 0.00023999496569573436, "loss": 0.0626, "step": 61980 }, { "epoch": 0.4, "learning_rate": 0.00023998528434137744, "loss": 0.0602, "step": 61990 }, { "epoch": 0.4, "learning_rate": 0.00023997560298702052, "loss": 0.0611, "step": 62000 }, { "epoch": 0.4, "eval_cer": 0.9200768274771213, "eval_loss": 0.03882079944014549, "eval_runtime": 119.9884, "eval_samples_per_second": 16.668, "eval_steps_per_second": 4.167, "step": 62000 }, { "epoch": 0.4, "learning_rate": 0.00023996592163266358, "loss": 0.0549, "step": 62010 }, { "epoch": 0.4, "learning_rate": 0.00023995624027830666, "loss": 0.053, "step": 62020 }, { "epoch": 0.4, "learning_rate": 0.00023994655892394973, "loss": 0.0706, "step": 62030 }, { "epoch": 0.4, "learning_rate": 0.00023993687756959276, "loss": 0.0513, "step": 62040 }, { "epoch": 0.4, "learning_rate": 0.00023992719621523584, "loss": 0.0621, "step": 62050 }, { "epoch": 0.4, "learning_rate": 0.00023991751486087892, "loss": 0.0552, "step": 62060 }, { "epoch": 0.4, "learning_rate": 0.00023990783350652197, "loss": 0.0653, "step": 62070 }, { "epoch": 0.4, "learning_rate": 0.00023989815215216505, "loss": 0.0568, "step": 62080 }, { "epoch": 0.4, "learning_rate": 0.00023988847079780813, "loss": 0.0515, "step": 62090 }, { "epoch": 0.4, "learning_rate": 0.0002398787894434512, "loss": 0.0508, "step": 62100 }, { "epoch": 0.4, "learning_rate": 0.00023986910808909424, "loss": 0.0611, "step": 62110 }, { "epoch": 0.4, "learning_rate": 0.00023985942673473732, "loss": 0.0546, "step": 62120 }, { "epoch": 0.4, "learning_rate": 0.0002398497453803804, "loss": 0.0519, "step": 62130 }, { "epoch": 0.4, "learning_rate": 0.00023984006402602345, "loss": 0.0592, "step": 62140 }, { "epoch": 0.4, "learning_rate": 0.00023983038267166653, "loss": 0.0578, "step": 62150 }, { "epoch": 0.4, "learning_rate": 0.0002398207013173096, "loss": 0.0523, "step": 62160 }, { "epoch": 0.4, "learning_rate": 0.0002398110199629527, "loss": 0.0565, "step": 62170 }, { "epoch": 0.4, "learning_rate": 0.00023980133860859572, "loss": 0.056, "step": 62180 }, { "epoch": 0.4, "learning_rate": 0.0002397916572542388, "loss": 0.0623, "step": 62190 }, { "epoch": 0.4, "learning_rate": 0.00023978197589988187, "loss": 0.0543, "step": 62200 }, { "epoch": 0.4, "learning_rate": 0.00023977229454552493, "loss": 0.0569, "step": 62210 }, { "epoch": 0.4, "learning_rate": 0.000239762613191168, "loss": 0.0618, "step": 62220 }, { "epoch": 0.4, "learning_rate": 0.0002397529318368111, "loss": 0.0572, "step": 62230 }, { "epoch": 0.4, "learning_rate": 0.00023974325048245414, "loss": 0.0637, "step": 62240 }, { "epoch": 0.4, "learning_rate": 0.0002397335691280972, "loss": 0.0726, "step": 62250 }, { "epoch": 0.4, "learning_rate": 0.00023972388777374027, "loss": 0.0609, "step": 62260 }, { "epoch": 0.4, "learning_rate": 0.00023971420641938332, "loss": 0.0609, "step": 62270 }, { "epoch": 0.4, "learning_rate": 0.0002397045250650264, "loss": 0.0555, "step": 62280 }, { "epoch": 0.4, "learning_rate": 0.00023969484371066948, "loss": 0.0513, "step": 62290 }, { "epoch": 0.4, "learning_rate": 0.00023968516235631256, "loss": 0.0614, "step": 62300 }, { "epoch": 0.4, "learning_rate": 0.00023967548100195562, "loss": 0.056, "step": 62310 }, { "epoch": 0.4, "learning_rate": 0.00023966579964759867, "loss": 0.0602, "step": 62320 }, { "epoch": 0.4, "learning_rate": 0.00023965611829324175, "loss": 0.0681, "step": 62330 }, { "epoch": 0.4, "learning_rate": 0.0002396464369388848, "loss": 0.0616, "step": 62340 }, { "epoch": 0.4, "learning_rate": 0.00023963675558452788, "loss": 0.0622, "step": 62350 }, { "epoch": 0.4, "learning_rate": 0.00023962707423017096, "loss": 0.0529, "step": 62360 }, { "epoch": 0.4, "learning_rate": 0.00023961739287581404, "loss": 0.0525, "step": 62370 }, { "epoch": 0.4, "learning_rate": 0.0002396077115214571, "loss": 0.0556, "step": 62380 }, { "epoch": 0.4, "learning_rate": 0.00023959803016710015, "loss": 0.0629, "step": 62390 }, { "epoch": 0.4, "learning_rate": 0.00023958834881274323, "loss": 0.0511, "step": 62400 }, { "epoch": 0.4, "learning_rate": 0.00023957866745838628, "loss": 0.0553, "step": 62410 }, { "epoch": 0.4, "learning_rate": 0.00023956898610402936, "loss": 0.0521, "step": 62420 }, { "epoch": 0.4, "learning_rate": 0.00023955930474967244, "loss": 0.0621, "step": 62430 }, { "epoch": 0.4, "learning_rate": 0.0002395496233953155, "loss": 0.0609, "step": 62440 }, { "epoch": 0.4, "learning_rate": 0.00023953994204095857, "loss": 0.0586, "step": 62450 }, { "epoch": 0.4, "learning_rate": 0.00023953026068660162, "loss": 0.0539, "step": 62460 }, { "epoch": 0.4, "learning_rate": 0.00023952057933224468, "loss": 0.0602, "step": 62470 }, { "epoch": 0.4, "learning_rate": 0.00023951089797788776, "loss": 0.0545, "step": 62480 }, { "epoch": 0.4, "learning_rate": 0.00023950121662353084, "loss": 0.0581, "step": 62490 }, { "epoch": 0.4, "learning_rate": 0.00023949153526917392, "loss": 0.0683, "step": 62500 }, { "epoch": 0.4, "learning_rate": 0.00023948185391481697, "loss": 0.064, "step": 62510 }, { "epoch": 0.4, "learning_rate": 0.00023947217256046005, "loss": 0.0574, "step": 62520 }, { "epoch": 0.4, "learning_rate": 0.0002394624912061031, "loss": 0.0659, "step": 62530 }, { "epoch": 0.4, "learning_rate": 0.00023945280985174615, "loss": 0.062, "step": 62540 }, { "epoch": 0.4, "learning_rate": 0.00023944312849738923, "loss": 0.0597, "step": 62550 }, { "epoch": 0.4, "learning_rate": 0.0002394334471430323, "loss": 0.0551, "step": 62560 }, { "epoch": 0.4, "learning_rate": 0.0002394237657886754, "loss": 0.0569, "step": 62570 }, { "epoch": 0.4, "learning_rate": 0.00023941408443431845, "loss": 0.0639, "step": 62580 }, { "epoch": 0.4, "learning_rate": 0.00023940440307996153, "loss": 0.0545, "step": 62590 }, { "epoch": 0.4, "learning_rate": 0.00023939472172560458, "loss": 0.0561, "step": 62600 }, { "epoch": 0.4, "learning_rate": 0.00023938504037124763, "loss": 0.0544, "step": 62610 }, { "epoch": 0.4, "learning_rate": 0.0002393753590168907, "loss": 0.056, "step": 62620 }, { "epoch": 0.4, "learning_rate": 0.0002393656776625338, "loss": 0.0676, "step": 62630 }, { "epoch": 0.4, "learning_rate": 0.00023935599630817684, "loss": 0.0628, "step": 62640 }, { "epoch": 0.4, "learning_rate": 0.00023934631495381992, "loss": 0.0588, "step": 62650 }, { "epoch": 0.4, "learning_rate": 0.000239336633599463, "loss": 0.0562, "step": 62660 }, { "epoch": 0.4, "learning_rate": 0.00023932695224510603, "loss": 0.0593, "step": 62670 }, { "epoch": 0.4, "learning_rate": 0.0002393172708907491, "loss": 0.0594, "step": 62680 }, { "epoch": 0.4, "learning_rate": 0.0002393075895363922, "loss": 0.0605, "step": 62690 }, { "epoch": 0.4, "learning_rate": 0.00023929790818203527, "loss": 0.0566, "step": 62700 }, { "epoch": 0.4, "learning_rate": 0.00023928822682767832, "loss": 0.0534, "step": 62710 }, { "epoch": 0.4, "learning_rate": 0.0002392785454733214, "loss": 0.0567, "step": 62720 }, { "epoch": 0.4, "learning_rate": 0.00023926886411896448, "loss": 0.0666, "step": 62730 }, { "epoch": 0.4, "learning_rate": 0.0002392591827646075, "loss": 0.0555, "step": 62740 }, { "epoch": 0.41, "learning_rate": 0.00023924950141025059, "loss": 0.0567, "step": 62750 }, { "epoch": 0.41, "learning_rate": 0.00023923982005589367, "loss": 0.0542, "step": 62760 }, { "epoch": 0.41, "learning_rate": 0.00023923013870153675, "loss": 0.053, "step": 62770 }, { "epoch": 0.41, "learning_rate": 0.0002392204573471798, "loss": 0.0578, "step": 62780 }, { "epoch": 0.41, "learning_rate": 0.00023921077599282288, "loss": 0.0495, "step": 62790 }, { "epoch": 0.41, "learning_rate": 0.00023920109463846596, "loss": 0.0637, "step": 62800 }, { "epoch": 0.41, "learning_rate": 0.00023919141328410898, "loss": 0.0548, "step": 62810 }, { "epoch": 0.41, "learning_rate": 0.00023918173192975206, "loss": 0.0529, "step": 62820 }, { "epoch": 0.41, "learning_rate": 0.00023917205057539514, "loss": 0.0561, "step": 62830 }, { "epoch": 0.41, "learning_rate": 0.0002391623692210382, "loss": 0.0643, "step": 62840 }, { "epoch": 0.41, "learning_rate": 0.00023915268786668128, "loss": 0.059, "step": 62850 }, { "epoch": 0.41, "learning_rate": 0.00023914300651232435, "loss": 0.0574, "step": 62860 }, { "epoch": 0.41, "learning_rate": 0.00023913332515796743, "loss": 0.0582, "step": 62870 }, { "epoch": 0.41, "learning_rate": 0.00023912364380361046, "loss": 0.0508, "step": 62880 }, { "epoch": 0.41, "learning_rate": 0.00023911396244925354, "loss": 0.062, "step": 62890 }, { "epoch": 0.41, "learning_rate": 0.00023910428109489662, "loss": 0.0613, "step": 62900 }, { "epoch": 0.41, "learning_rate": 0.00023909459974053967, "loss": 0.0531, "step": 62910 }, { "epoch": 0.41, "learning_rate": 0.00023908491838618275, "loss": 0.0593, "step": 62920 }, { "epoch": 0.41, "learning_rate": 0.00023907523703182583, "loss": 0.0669, "step": 62930 }, { "epoch": 0.41, "learning_rate": 0.0002390655556774689, "loss": 0.0592, "step": 62940 }, { "epoch": 0.41, "learning_rate": 0.00023905587432311194, "loss": 0.0583, "step": 62950 }, { "epoch": 0.41, "learning_rate": 0.00023904619296875502, "loss": 0.0558, "step": 62960 }, { "epoch": 0.41, "learning_rate": 0.0002390365116143981, "loss": 0.0628, "step": 62970 }, { "epoch": 0.41, "learning_rate": 0.00023902683026004115, "loss": 0.0495, "step": 62980 }, { "epoch": 0.41, "learning_rate": 0.00023901714890568423, "loss": 0.0553, "step": 62990 }, { "epoch": 0.41, "learning_rate": 0.0002390074675513273, "loss": 0.0569, "step": 63000 }, { "epoch": 0.41, "eval_cer": 0.919996384589312, "eval_loss": 0.037891894578933716, "eval_runtime": 119.8457, "eval_samples_per_second": 16.688, "eval_steps_per_second": 4.172, "step": 63000 }, { "epoch": 0.41, "learning_rate": 0.0002389977861969704, "loss": 0.0617, "step": 63010 }, { "epoch": 0.41, "learning_rate": 0.00023898810484261341, "loss": 0.061, "step": 63020 }, { "epoch": 0.41, "learning_rate": 0.0002389784234882565, "loss": 0.0576, "step": 63030 }, { "epoch": 0.41, "learning_rate": 0.00023896874213389955, "loss": 0.0585, "step": 63040 }, { "epoch": 0.41, "learning_rate": 0.00023895906077954263, "loss": 0.0544, "step": 63050 }, { "epoch": 0.41, "learning_rate": 0.0002389493794251857, "loss": 0.06, "step": 63060 }, { "epoch": 0.41, "learning_rate": 0.0002389396980708288, "loss": 0.0631, "step": 63070 }, { "epoch": 0.41, "learning_rate": 0.00023893001671647184, "loss": 0.0571, "step": 63080 }, { "epoch": 0.41, "learning_rate": 0.0002389203353621149, "loss": 0.0687, "step": 63090 }, { "epoch": 0.41, "learning_rate": 0.00023891065400775797, "loss": 0.0582, "step": 63100 }, { "epoch": 0.41, "learning_rate": 0.00023890097265340102, "loss": 0.0582, "step": 63110 }, { "epoch": 0.41, "learning_rate": 0.0002388912912990441, "loss": 0.0621, "step": 63120 }, { "epoch": 0.41, "learning_rate": 0.00023888160994468718, "loss": 0.0508, "step": 63130 }, { "epoch": 0.41, "learning_rate": 0.00023887192859033026, "loss": 0.058, "step": 63140 }, { "epoch": 0.41, "learning_rate": 0.00023886224723597332, "loss": 0.0718, "step": 63150 }, { "epoch": 0.41, "learning_rate": 0.00023885256588161637, "loss": 0.0587, "step": 63160 }, { "epoch": 0.41, "learning_rate": 0.00023884288452725945, "loss": 0.056, "step": 63170 }, { "epoch": 0.41, "learning_rate": 0.0002388332031729025, "loss": 0.0503, "step": 63180 }, { "epoch": 0.41, "learning_rate": 0.00023882352181854558, "loss": 0.0592, "step": 63190 }, { "epoch": 0.41, "learning_rate": 0.00023881384046418866, "loss": 0.0532, "step": 63200 }, { "epoch": 0.41, "learning_rate": 0.00023880415910983174, "loss": 0.0574, "step": 63210 }, { "epoch": 0.41, "learning_rate": 0.0002387944777554748, "loss": 0.0617, "step": 63220 }, { "epoch": 0.41, "learning_rate": 0.00023878479640111785, "loss": 0.0608, "step": 63230 }, { "epoch": 0.41, "learning_rate": 0.0002387751150467609, "loss": 0.0676, "step": 63240 }, { "epoch": 0.41, "learning_rate": 0.00023876543369240398, "loss": 0.0566, "step": 63250 }, { "epoch": 0.41, "learning_rate": 0.00023875575233804706, "loss": 0.0643, "step": 63260 }, { "epoch": 0.41, "learning_rate": 0.00023874607098369014, "loss": 0.0611, "step": 63270 }, { "epoch": 0.41, "learning_rate": 0.0002387363896293332, "loss": 0.0572, "step": 63280 }, { "epoch": 0.41, "learning_rate": 0.00023872670827497627, "loss": 0.0585, "step": 63290 }, { "epoch": 0.41, "learning_rate": 0.00023871702692061932, "loss": 0.0579, "step": 63300 }, { "epoch": 0.41, "learning_rate": 0.00023870734556626238, "loss": 0.0557, "step": 63310 }, { "epoch": 0.41, "learning_rate": 0.00023869766421190546, "loss": 0.0567, "step": 63320 }, { "epoch": 0.41, "learning_rate": 0.00023868798285754854, "loss": 0.0634, "step": 63330 }, { "epoch": 0.41, "learning_rate": 0.00023867830150319162, "loss": 0.0607, "step": 63340 }, { "epoch": 0.41, "learning_rate": 0.00023866862014883467, "loss": 0.0588, "step": 63350 }, { "epoch": 0.41, "learning_rate": 0.00023865893879447775, "loss": 0.0625, "step": 63360 }, { "epoch": 0.41, "learning_rate": 0.0002386492574401208, "loss": 0.0587, "step": 63370 }, { "epoch": 0.41, "learning_rate": 0.00023863957608576385, "loss": 0.0581, "step": 63380 }, { "epoch": 0.41, "learning_rate": 0.00023862989473140693, "loss": 0.0589, "step": 63390 }, { "epoch": 0.41, "learning_rate": 0.00023862021337705, "loss": 0.0719, "step": 63400 }, { "epoch": 0.41, "learning_rate": 0.0002386105320226931, "loss": 0.0705, "step": 63410 }, { "epoch": 0.41, "learning_rate": 0.00023860085066833615, "loss": 0.0661, "step": 63420 }, { "epoch": 0.41, "learning_rate": 0.00023859116931397923, "loss": 0.0597, "step": 63430 }, { "epoch": 0.41, "learning_rate": 0.00023858148795962225, "loss": 0.0578, "step": 63440 }, { "epoch": 0.41, "learning_rate": 0.00023857180660526533, "loss": 0.0604, "step": 63450 }, { "epoch": 0.41, "learning_rate": 0.0002385621252509084, "loss": 0.0555, "step": 63460 }, { "epoch": 0.41, "learning_rate": 0.0002385524438965515, "loss": 0.0546, "step": 63470 }, { "epoch": 0.41, "learning_rate": 0.00023854276254219454, "loss": 0.0551, "step": 63480 }, { "epoch": 0.41, "learning_rate": 0.00023853308118783762, "loss": 0.0528, "step": 63490 }, { "epoch": 0.41, "learning_rate": 0.0002385233998334807, "loss": 0.0522, "step": 63500 }, { "epoch": 0.41, "learning_rate": 0.00023851371847912373, "loss": 0.0597, "step": 63510 }, { "epoch": 0.41, "learning_rate": 0.0002385040371247668, "loss": 0.0549, "step": 63520 }, { "epoch": 0.41, "learning_rate": 0.0002384943557704099, "loss": 0.0681, "step": 63530 }, { "epoch": 0.41, "learning_rate": 0.00023848467441605297, "loss": 0.057, "step": 63540 }, { "epoch": 0.41, "learning_rate": 0.00023847499306169602, "loss": 0.0587, "step": 63550 }, { "epoch": 0.41, "learning_rate": 0.0002384653117073391, "loss": 0.0564, "step": 63560 }, { "epoch": 0.41, "learning_rate": 0.00023845563035298218, "loss": 0.0543, "step": 63570 }, { "epoch": 0.41, "learning_rate": 0.0002384459489986252, "loss": 0.0556, "step": 63580 }, { "epoch": 0.41, "learning_rate": 0.00023843626764426829, "loss": 0.0517, "step": 63590 }, { "epoch": 0.41, "learning_rate": 0.00023842658628991136, "loss": 0.0587, "step": 63600 }, { "epoch": 0.41, "learning_rate": 0.00023841690493555444, "loss": 0.0536, "step": 63610 }, { "epoch": 0.41, "learning_rate": 0.0002384072235811975, "loss": 0.0635, "step": 63620 }, { "epoch": 0.41, "learning_rate": 0.00023839754222684058, "loss": 0.0611, "step": 63630 }, { "epoch": 0.41, "learning_rate": 0.00023838786087248366, "loss": 0.054, "step": 63640 }, { "epoch": 0.41, "learning_rate": 0.00023837817951812668, "loss": 0.0665, "step": 63650 }, { "epoch": 0.41, "learning_rate": 0.00023836849816376976, "loss": 0.0588, "step": 63660 }, { "epoch": 0.41, "learning_rate": 0.00023835881680941284, "loss": 0.0506, "step": 63670 }, { "epoch": 0.41, "learning_rate": 0.0002383491354550559, "loss": 0.0543, "step": 63680 }, { "epoch": 0.41, "learning_rate": 0.00023833945410069897, "loss": 0.0577, "step": 63690 }, { "epoch": 0.41, "learning_rate": 0.00023832977274634205, "loss": 0.0677, "step": 63700 }, { "epoch": 0.41, "learning_rate": 0.00023832009139198513, "loss": 0.0576, "step": 63710 }, { "epoch": 0.41, "learning_rate": 0.00023831041003762816, "loss": 0.0664, "step": 63720 }, { "epoch": 0.41, "learning_rate": 0.00023830072868327124, "loss": 0.0627, "step": 63730 }, { "epoch": 0.41, "learning_rate": 0.00023829104732891432, "loss": 0.0565, "step": 63740 }, { "epoch": 0.41, "learning_rate": 0.00023828136597455737, "loss": 0.0582, "step": 63750 }, { "epoch": 0.41, "learning_rate": 0.00023827168462020045, "loss": 0.0586, "step": 63760 }, { "epoch": 0.41, "learning_rate": 0.00023826200326584353, "loss": 0.0556, "step": 63770 }, { "epoch": 0.41, "learning_rate": 0.0002382523219114866, "loss": 0.0582, "step": 63780 }, { "epoch": 0.41, "learning_rate": 0.00023824264055712964, "loss": 0.0593, "step": 63790 }, { "epoch": 0.41, "learning_rate": 0.00023823295920277272, "loss": 0.0671, "step": 63800 }, { "epoch": 0.41, "learning_rate": 0.0002382232778484158, "loss": 0.0596, "step": 63810 }, { "epoch": 0.41, "learning_rate": 0.00023821359649405885, "loss": 0.0509, "step": 63820 }, { "epoch": 0.41, "learning_rate": 0.00023820391513970193, "loss": 0.0552, "step": 63830 }, { "epoch": 0.41, "learning_rate": 0.000238194233785345, "loss": 0.0547, "step": 63840 }, { "epoch": 0.41, "learning_rate": 0.00023818455243098806, "loss": 0.0643, "step": 63850 }, { "epoch": 0.41, "learning_rate": 0.00023817487107663111, "loss": 0.0615, "step": 63860 }, { "epoch": 0.41, "learning_rate": 0.0002381651897222742, "loss": 0.0632, "step": 63870 }, { "epoch": 0.41, "learning_rate": 0.00023815550836791725, "loss": 0.0574, "step": 63880 }, { "epoch": 0.41, "learning_rate": 0.00023814582701356033, "loss": 0.0616, "step": 63890 }, { "epoch": 0.41, "learning_rate": 0.0002381361456592034, "loss": 0.0549, "step": 63900 }, { "epoch": 0.41, "learning_rate": 0.00023812646430484649, "loss": 0.056, "step": 63910 }, { "epoch": 0.41, "learning_rate": 0.00023811678295048954, "loss": 0.0584, "step": 63920 }, { "epoch": 0.41, "learning_rate": 0.0002381071015961326, "loss": 0.0559, "step": 63930 }, { "epoch": 0.41, "learning_rate": 0.00023809742024177567, "loss": 0.0602, "step": 63940 }, { "epoch": 0.41, "learning_rate": 0.00023808773888741872, "loss": 0.0536, "step": 63950 }, { "epoch": 0.41, "learning_rate": 0.0002380780575330618, "loss": 0.054, "step": 63960 }, { "epoch": 0.41, "learning_rate": 0.00023806837617870488, "loss": 0.063, "step": 63970 }, { "epoch": 0.41, "learning_rate": 0.00023805869482434796, "loss": 0.0587, "step": 63980 }, { "epoch": 0.41, "learning_rate": 0.00023804901346999102, "loss": 0.0547, "step": 63990 }, { "epoch": 0.41, "learning_rate": 0.00023803933211563407, "loss": 0.0577, "step": 64000 }, { "epoch": 0.41, "eval_cer": 0.920002711558016, "eval_loss": 0.03821108117699623, "eval_runtime": 119.9562, "eval_samples_per_second": 16.673, "eval_steps_per_second": 4.168, "step": 64000 }, { "epoch": 0.41, "learning_rate": 0.00023802965076127715, "loss": 0.0529, "step": 64010 }, { "epoch": 0.41, "learning_rate": 0.0002380199694069202, "loss": 0.0499, "step": 64020 }, { "epoch": 0.41, "learning_rate": 0.00023801028805256328, "loss": 0.053, "step": 64030 }, { "epoch": 0.41, "learning_rate": 0.00023800060669820636, "loss": 0.0655, "step": 64040 }, { "epoch": 0.41, "learning_rate": 0.0002379909253438494, "loss": 0.0569, "step": 64050 }, { "epoch": 0.41, "learning_rate": 0.0002379812439894925, "loss": 0.0592, "step": 64060 }, { "epoch": 0.41, "learning_rate": 0.00023797156263513555, "loss": 0.0568, "step": 64070 }, { "epoch": 0.41, "learning_rate": 0.0002379618812807786, "loss": 0.0567, "step": 64080 }, { "epoch": 0.41, "learning_rate": 0.00023795219992642168, "loss": 0.0518, "step": 64090 }, { "epoch": 0.41, "learning_rate": 0.00023794251857206476, "loss": 0.0571, "step": 64100 }, { "epoch": 0.41, "learning_rate": 0.00023793283721770784, "loss": 0.0604, "step": 64110 }, { "epoch": 0.41, "learning_rate": 0.0002379231558633509, "loss": 0.0547, "step": 64120 }, { "epoch": 0.41, "learning_rate": 0.00023791347450899397, "loss": 0.0631, "step": 64130 }, { "epoch": 0.41, "learning_rate": 0.00023790379315463702, "loss": 0.0597, "step": 64140 }, { "epoch": 0.41, "learning_rate": 0.00023789411180028008, "loss": 0.0573, "step": 64150 }, { "epoch": 0.41, "learning_rate": 0.00023788443044592316, "loss": 0.0579, "step": 64160 }, { "epoch": 0.41, "learning_rate": 0.00023787474909156624, "loss": 0.0544, "step": 64170 }, { "epoch": 0.41, "learning_rate": 0.00023786506773720932, "loss": 0.0528, "step": 64180 }, { "epoch": 0.41, "learning_rate": 0.00023785538638285237, "loss": 0.0537, "step": 64190 }, { "epoch": 0.41, "learning_rate": 0.00023784570502849545, "loss": 0.0518, "step": 64200 }, { "epoch": 0.41, "learning_rate": 0.0002378360236741385, "loss": 0.0536, "step": 64210 }, { "epoch": 0.41, "learning_rate": 0.00023782634231978155, "loss": 0.0588, "step": 64220 }, { "epoch": 0.41, "learning_rate": 0.00023781666096542463, "loss": 0.0666, "step": 64230 }, { "epoch": 0.41, "learning_rate": 0.0002378069796110677, "loss": 0.0594, "step": 64240 }, { "epoch": 0.41, "learning_rate": 0.00023779729825671077, "loss": 0.0594, "step": 64250 }, { "epoch": 0.41, "learning_rate": 0.00023778761690235385, "loss": 0.0581, "step": 64260 }, { "epoch": 0.41, "learning_rate": 0.00023777793554799692, "loss": 0.0556, "step": 64270 }, { "epoch": 0.41, "learning_rate": 0.00023776825419363995, "loss": 0.054, "step": 64280 }, { "epoch": 0.41, "learning_rate": 0.00023775857283928303, "loss": 0.0639, "step": 64290 }, { "epoch": 0.42, "learning_rate": 0.0002377488914849261, "loss": 0.0545, "step": 64300 }, { "epoch": 0.42, "learning_rate": 0.0002377392101305692, "loss": 0.0555, "step": 64310 }, { "epoch": 0.42, "learning_rate": 0.00023772952877621224, "loss": 0.054, "step": 64320 }, { "epoch": 0.42, "learning_rate": 0.00023771984742185532, "loss": 0.0616, "step": 64330 }, { "epoch": 0.42, "learning_rate": 0.0002377101660674984, "loss": 0.0524, "step": 64340 }, { "epoch": 0.42, "learning_rate": 0.00023770048471314143, "loss": 0.057, "step": 64350 }, { "epoch": 0.42, "learning_rate": 0.0002376908033587845, "loss": 0.0602, "step": 64360 }, { "epoch": 0.42, "learning_rate": 0.0002376811220044276, "loss": 0.0573, "step": 64370 }, { "epoch": 0.42, "learning_rate": 0.00023767144065007067, "loss": 0.0614, "step": 64380 }, { "epoch": 0.42, "learning_rate": 0.00023766175929571372, "loss": 0.0588, "step": 64390 }, { "epoch": 0.42, "learning_rate": 0.0002376520779413568, "loss": 0.0554, "step": 64400 }, { "epoch": 0.42, "learning_rate": 0.00023764239658699988, "loss": 0.0573, "step": 64410 }, { "epoch": 0.42, "learning_rate": 0.0002376327152326429, "loss": 0.0581, "step": 64420 }, { "epoch": 0.42, "learning_rate": 0.00023762303387828598, "loss": 0.0621, "step": 64430 }, { "epoch": 0.42, "learning_rate": 0.00023761335252392906, "loss": 0.0511, "step": 64440 }, { "epoch": 0.42, "learning_rate": 0.00023760367116957212, "loss": 0.0551, "step": 64450 }, { "epoch": 0.42, "learning_rate": 0.0002375939898152152, "loss": 0.0606, "step": 64460 }, { "epoch": 0.42, "learning_rate": 0.00023758430846085828, "loss": 0.062, "step": 64470 }, { "epoch": 0.42, "learning_rate": 0.00023757462710650136, "loss": 0.0573, "step": 64480 }, { "epoch": 0.42, "learning_rate": 0.00023756494575214438, "loss": 0.0609, "step": 64490 }, { "epoch": 0.42, "learning_rate": 0.00023755526439778746, "loss": 0.0653, "step": 64500 }, { "epoch": 0.42, "learning_rate": 0.00023754558304343054, "loss": 0.0599, "step": 64510 }, { "epoch": 0.42, "learning_rate": 0.0002375359016890736, "loss": 0.0555, "step": 64520 }, { "epoch": 0.42, "learning_rate": 0.00023752622033471667, "loss": 0.0534, "step": 64530 }, { "epoch": 0.42, "learning_rate": 0.00023751653898035975, "loss": 0.0512, "step": 64540 }, { "epoch": 0.42, "learning_rate": 0.00023750685762600283, "loss": 0.05, "step": 64550 }, { "epoch": 0.42, "learning_rate": 0.00023749717627164586, "loss": 0.0529, "step": 64560 }, { "epoch": 0.42, "learning_rate": 0.00023748749491728894, "loss": 0.0543, "step": 64570 }, { "epoch": 0.42, "learning_rate": 0.00023747781356293202, "loss": 0.063, "step": 64580 }, { "epoch": 0.42, "learning_rate": 0.00023746813220857507, "loss": 0.062, "step": 64590 }, { "epoch": 0.42, "learning_rate": 0.00023745845085421815, "loss": 0.0624, "step": 64600 }, { "epoch": 0.42, "learning_rate": 0.00023744876949986123, "loss": 0.0689, "step": 64610 }, { "epoch": 0.42, "learning_rate": 0.00023743908814550428, "loss": 0.0552, "step": 64620 }, { "epoch": 0.42, "learning_rate": 0.00023742940679114734, "loss": 0.0581, "step": 64630 }, { "epoch": 0.42, "learning_rate": 0.00023741972543679042, "loss": 0.0553, "step": 64640 }, { "epoch": 0.42, "learning_rate": 0.00023741004408243347, "loss": 0.0599, "step": 64650 }, { "epoch": 0.42, "learning_rate": 0.00023740036272807655, "loss": 0.0591, "step": 64660 }, { "epoch": 0.42, "learning_rate": 0.00023739068137371963, "loss": 0.0536, "step": 64670 }, { "epoch": 0.42, "learning_rate": 0.0002373810000193627, "loss": 0.0525, "step": 64680 }, { "epoch": 0.42, "learning_rate": 0.00023737131866500576, "loss": 0.0571, "step": 64690 }, { "epoch": 0.42, "learning_rate": 0.00023736163731064881, "loss": 0.0622, "step": 64700 }, { "epoch": 0.42, "learning_rate": 0.0002373519559562919, "loss": 0.0529, "step": 64710 }, { "epoch": 0.42, "learning_rate": 0.00023734227460193495, "loss": 0.0591, "step": 64720 }, { "epoch": 0.42, "learning_rate": 0.00023733259324757803, "loss": 0.0582, "step": 64730 }, { "epoch": 0.42, "learning_rate": 0.0002373229118932211, "loss": 0.0659, "step": 64740 }, { "epoch": 0.42, "learning_rate": 0.00023731323053886419, "loss": 0.0553, "step": 64750 }, { "epoch": 0.42, "learning_rate": 0.00023730354918450724, "loss": 0.0647, "step": 64760 }, { "epoch": 0.42, "learning_rate": 0.0002372938678301503, "loss": 0.0614, "step": 64770 }, { "epoch": 0.42, "learning_rate": 0.00023728418647579337, "loss": 0.0549, "step": 64780 }, { "epoch": 0.42, "learning_rate": 0.00023727450512143642, "loss": 0.0621, "step": 64790 }, { "epoch": 0.42, "learning_rate": 0.0002372648237670795, "loss": 0.0616, "step": 64800 }, { "epoch": 0.42, "learning_rate": 0.00023725514241272258, "loss": 0.0568, "step": 64810 }, { "epoch": 0.42, "learning_rate": 0.00023724546105836564, "loss": 0.0575, "step": 64820 }, { "epoch": 0.42, "learning_rate": 0.00023723577970400872, "loss": 0.0625, "step": 64830 }, { "epoch": 0.42, "learning_rate": 0.00023722609834965177, "loss": 0.0571, "step": 64840 }, { "epoch": 0.42, "learning_rate": 0.00023721641699529482, "loss": 0.0554, "step": 64850 }, { "epoch": 0.42, "learning_rate": 0.0002372067356409379, "loss": 0.0562, "step": 64860 }, { "epoch": 0.42, "learning_rate": 0.00023719705428658098, "loss": 0.062, "step": 64870 }, { "epoch": 0.42, "learning_rate": 0.00023718737293222406, "loss": 0.0596, "step": 64880 }, { "epoch": 0.42, "learning_rate": 0.0002371776915778671, "loss": 0.0533, "step": 64890 }, { "epoch": 0.42, "learning_rate": 0.0002371680102235102, "loss": 0.0611, "step": 64900 }, { "epoch": 0.42, "learning_rate": 0.00023715832886915325, "loss": 0.0564, "step": 64910 }, { "epoch": 0.42, "learning_rate": 0.0002371486475147963, "loss": 0.0563, "step": 64920 }, { "epoch": 0.42, "learning_rate": 0.00023713896616043938, "loss": 0.0641, "step": 64930 }, { "epoch": 0.42, "learning_rate": 0.00023712928480608246, "loss": 0.0607, "step": 64940 }, { "epoch": 0.42, "learning_rate": 0.00023711960345172554, "loss": 0.0586, "step": 64950 }, { "epoch": 0.42, "learning_rate": 0.0002371099220973686, "loss": 0.0549, "step": 64960 }, { "epoch": 0.42, "learning_rate": 0.00023710024074301167, "loss": 0.0647, "step": 64970 }, { "epoch": 0.42, "learning_rate": 0.00023709055938865472, "loss": 0.0527, "step": 64980 }, { "epoch": 0.42, "learning_rate": 0.00023708087803429778, "loss": 0.0547, "step": 64990 }, { "epoch": 0.42, "learning_rate": 0.00023707119667994086, "loss": 0.061, "step": 65000 }, { "epoch": 0.42, "eval_cer": 0.9201581742176025, "eval_loss": 0.03896106779575348, "eval_runtime": 120.0403, "eval_samples_per_second": 16.661, "eval_steps_per_second": 4.165, "step": 65000 }, { "epoch": 0.42, "learning_rate": 0.00023706151532558394, "loss": 0.0566, "step": 65010 }, { "epoch": 0.42, "learning_rate": 0.000237051833971227, "loss": 0.0514, "step": 65020 }, { "epoch": 0.42, "learning_rate": 0.00023704215261687007, "loss": 0.0557, "step": 65030 }, { "epoch": 0.42, "learning_rate": 0.00023703247126251315, "loss": 0.0579, "step": 65040 }, { "epoch": 0.42, "learning_rate": 0.00023702278990815617, "loss": 0.0516, "step": 65050 }, { "epoch": 0.42, "learning_rate": 0.00023701310855379925, "loss": 0.0538, "step": 65060 }, { "epoch": 0.42, "learning_rate": 0.00023700342719944233, "loss": 0.0654, "step": 65070 }, { "epoch": 0.42, "learning_rate": 0.0002369937458450854, "loss": 0.0578, "step": 65080 }, { "epoch": 0.42, "learning_rate": 0.00023698406449072846, "loss": 0.069, "step": 65090 }, { "epoch": 0.42, "learning_rate": 0.00023697438313637154, "loss": 0.0604, "step": 65100 }, { "epoch": 0.42, "learning_rate": 0.00023696470178201462, "loss": 0.0567, "step": 65110 }, { "epoch": 0.42, "learning_rate": 0.00023695502042765765, "loss": 0.0551, "step": 65120 }, { "epoch": 0.42, "learning_rate": 0.00023694533907330073, "loss": 0.0539, "step": 65130 }, { "epoch": 0.42, "learning_rate": 0.0002369356577189438, "loss": 0.0572, "step": 65140 }, { "epoch": 0.42, "learning_rate": 0.0002369259763645869, "loss": 0.0525, "step": 65150 }, { "epoch": 0.42, "learning_rate": 0.00023691629501022994, "loss": 0.0507, "step": 65160 }, { "epoch": 0.42, "learning_rate": 0.00023690661365587302, "loss": 0.0624, "step": 65170 }, { "epoch": 0.42, "learning_rate": 0.0002368969323015161, "loss": 0.055, "step": 65180 }, { "epoch": 0.42, "learning_rate": 0.00023688725094715913, "loss": 0.061, "step": 65190 }, { "epoch": 0.42, "learning_rate": 0.0002368775695928022, "loss": 0.0535, "step": 65200 }, { "epoch": 0.42, "learning_rate": 0.0002368678882384453, "loss": 0.0548, "step": 65210 }, { "epoch": 0.42, "learning_rate": 0.00023685820688408834, "loss": 0.0557, "step": 65220 }, { "epoch": 0.42, "learning_rate": 0.00023684852552973142, "loss": 0.0596, "step": 65230 }, { "epoch": 0.42, "learning_rate": 0.0002368388441753745, "loss": 0.0566, "step": 65240 }, { "epoch": 0.42, "learning_rate": 0.00023682916282101758, "loss": 0.0624, "step": 65250 }, { "epoch": 0.42, "learning_rate": 0.0002368194814666606, "loss": 0.0572, "step": 65260 }, { "epoch": 0.42, "learning_rate": 0.00023680980011230368, "loss": 0.0503, "step": 65270 }, { "epoch": 0.42, "learning_rate": 0.00023680011875794676, "loss": 0.0536, "step": 65280 }, { "epoch": 0.42, "learning_rate": 0.00023679043740358982, "loss": 0.0559, "step": 65290 }, { "epoch": 0.42, "learning_rate": 0.0002367807560492329, "loss": 0.0587, "step": 65300 }, { "epoch": 0.42, "learning_rate": 0.00023677107469487598, "loss": 0.0582, "step": 65310 }, { "epoch": 0.42, "learning_rate": 0.00023676139334051906, "loss": 0.0524, "step": 65320 }, { "epoch": 0.42, "learning_rate": 0.00023675171198616208, "loss": 0.0521, "step": 65330 }, { "epoch": 0.42, "learning_rate": 0.00023674203063180516, "loss": 0.0493, "step": 65340 }, { "epoch": 0.42, "learning_rate": 0.00023673234927744824, "loss": 0.0579, "step": 65350 }, { "epoch": 0.42, "learning_rate": 0.0002367226679230913, "loss": 0.059, "step": 65360 }, { "epoch": 0.42, "learning_rate": 0.00023671298656873437, "loss": 0.0566, "step": 65370 }, { "epoch": 0.42, "learning_rate": 0.00023670330521437745, "loss": 0.0522, "step": 65380 }, { "epoch": 0.42, "learning_rate": 0.00023669362386002053, "loss": 0.0559, "step": 65390 }, { "epoch": 0.42, "learning_rate": 0.00023668394250566356, "loss": 0.0592, "step": 65400 }, { "epoch": 0.42, "learning_rate": 0.00023667426115130664, "loss": 0.0543, "step": 65410 }, { "epoch": 0.42, "learning_rate": 0.0002366645797969497, "loss": 0.0576, "step": 65420 }, { "epoch": 0.42, "learning_rate": 0.00023665489844259277, "loss": 0.0588, "step": 65430 }, { "epoch": 0.42, "learning_rate": 0.00023664521708823585, "loss": 0.0579, "step": 65440 }, { "epoch": 0.42, "learning_rate": 0.00023663553573387893, "loss": 0.0636, "step": 65450 }, { "epoch": 0.42, "learning_rate": 0.00023662585437952196, "loss": 0.0508, "step": 65460 }, { "epoch": 0.42, "learning_rate": 0.00023661617302516504, "loss": 0.0707, "step": 65470 }, { "epoch": 0.42, "learning_rate": 0.00023660649167080812, "loss": 0.0563, "step": 65480 }, { "epoch": 0.42, "learning_rate": 0.00023659681031645117, "loss": 0.0556, "step": 65490 }, { "epoch": 0.42, "learning_rate": 0.00023658712896209425, "loss": 0.0619, "step": 65500 }, { "epoch": 0.42, "learning_rate": 0.00023657744760773733, "loss": 0.0719, "step": 65510 }, { "epoch": 0.42, "learning_rate": 0.0002365677662533804, "loss": 0.0653, "step": 65520 }, { "epoch": 0.42, "learning_rate": 0.00023655808489902343, "loss": 0.0626, "step": 65530 }, { "epoch": 0.42, "learning_rate": 0.0002365484035446665, "loss": 0.061, "step": 65540 }, { "epoch": 0.42, "learning_rate": 0.0002365387221903096, "loss": 0.0562, "step": 65550 }, { "epoch": 0.42, "learning_rate": 0.00023652904083595265, "loss": 0.055, "step": 65560 }, { "epoch": 0.42, "learning_rate": 0.00023651935948159573, "loss": 0.0558, "step": 65570 }, { "epoch": 0.42, "learning_rate": 0.0002365096781272388, "loss": 0.0593, "step": 65580 }, { "epoch": 0.42, "learning_rate": 0.00023649999677288189, "loss": 0.0544, "step": 65590 }, { "epoch": 0.42, "learning_rate": 0.0002364903154185249, "loss": 0.0591, "step": 65600 }, { "epoch": 0.42, "learning_rate": 0.000236480634064168, "loss": 0.0515, "step": 65610 }, { "epoch": 0.42, "learning_rate": 0.00023647095270981104, "loss": 0.0554, "step": 65620 }, { "epoch": 0.42, "learning_rate": 0.00023646127135545412, "loss": 0.0703, "step": 65630 }, { "epoch": 0.42, "learning_rate": 0.0002364515900010972, "loss": 0.0597, "step": 65640 }, { "epoch": 0.42, "learning_rate": 0.00023644190864674028, "loss": 0.0589, "step": 65650 }, { "epoch": 0.42, "learning_rate": 0.00023643222729238334, "loss": 0.0532, "step": 65660 }, { "epoch": 0.42, "learning_rate": 0.0002364225459380264, "loss": 0.059, "step": 65670 }, { "epoch": 0.42, "learning_rate": 0.00023641286458366947, "loss": 0.0543, "step": 65680 }, { "epoch": 0.42, "learning_rate": 0.00023640318322931252, "loss": 0.0653, "step": 65690 }, { "epoch": 0.42, "learning_rate": 0.0002363935018749556, "loss": 0.065, "step": 65700 }, { "epoch": 0.42, "learning_rate": 0.00023638382052059868, "loss": 0.0605, "step": 65710 }, { "epoch": 0.42, "learning_rate": 0.00023637413916624176, "loss": 0.0681, "step": 65720 }, { "epoch": 0.42, "learning_rate": 0.0002363644578118848, "loss": 0.0527, "step": 65730 }, { "epoch": 0.42, "learning_rate": 0.00023635477645752787, "loss": 0.0558, "step": 65740 }, { "epoch": 0.42, "learning_rate": 0.00023634509510317095, "loss": 0.0633, "step": 65750 }, { "epoch": 0.42, "learning_rate": 0.000236335413748814, "loss": 0.0612, "step": 65760 }, { "epoch": 0.42, "learning_rate": 0.00023632573239445708, "loss": 0.0596, "step": 65770 }, { "epoch": 0.42, "learning_rate": 0.00023631605104010016, "loss": 0.056, "step": 65780 }, { "epoch": 0.42, "learning_rate": 0.00023630636968574324, "loss": 0.0594, "step": 65790 }, { "epoch": 0.42, "learning_rate": 0.0002362966883313863, "loss": 0.0562, "step": 65800 }, { "epoch": 0.42, "learning_rate": 0.00023628700697702934, "loss": 0.0596, "step": 65810 }, { "epoch": 0.42, "learning_rate": 0.0002362773256226724, "loss": 0.0556, "step": 65820 }, { "epoch": 0.42, "learning_rate": 0.00023626764426831548, "loss": 0.0635, "step": 65830 }, { "epoch": 0.42, "learning_rate": 0.00023625796291395855, "loss": 0.0564, "step": 65840 }, { "epoch": 0.43, "learning_rate": 0.00023624828155960163, "loss": 0.0509, "step": 65850 }, { "epoch": 0.43, "learning_rate": 0.0002362386002052447, "loss": 0.0597, "step": 65860 }, { "epoch": 0.43, "learning_rate": 0.00023622891885088777, "loss": 0.0474, "step": 65870 }, { "epoch": 0.43, "learning_rate": 0.00023621923749653082, "loss": 0.0571, "step": 65880 }, { "epoch": 0.43, "learning_rate": 0.00023620955614217387, "loss": 0.0465, "step": 65890 }, { "epoch": 0.43, "learning_rate": 0.00023619987478781695, "loss": 0.067, "step": 65900 }, { "epoch": 0.43, "learning_rate": 0.00023619019343346003, "loss": 0.0525, "step": 65910 }, { "epoch": 0.43, "learning_rate": 0.0002361805120791031, "loss": 0.0606, "step": 65920 }, { "epoch": 0.43, "learning_rate": 0.00023617083072474616, "loss": 0.0511, "step": 65930 }, { "epoch": 0.43, "learning_rate": 0.00023616114937038924, "loss": 0.0572, "step": 65940 }, { "epoch": 0.43, "learning_rate": 0.0002361514680160323, "loss": 0.0679, "step": 65950 }, { "epoch": 0.43, "learning_rate": 0.00023614178666167535, "loss": 0.0601, "step": 65960 }, { "epoch": 0.43, "learning_rate": 0.00023613210530731843, "loss": 0.0612, "step": 65970 }, { "epoch": 0.43, "learning_rate": 0.0002361224239529615, "loss": 0.0509, "step": 65980 }, { "epoch": 0.43, "learning_rate": 0.0002361127425986046, "loss": 0.0626, "step": 65990 }, { "epoch": 0.43, "learning_rate": 0.00023610306124424764, "loss": 0.0605, "step": 66000 }, { "epoch": 0.43, "eval_cer": 0.9198996723534064, "eval_loss": 0.03807980939745903, "eval_runtime": 120.0579, "eval_samples_per_second": 16.659, "eval_steps_per_second": 4.165, "step": 66000 }, { "epoch": 0.43, "learning_rate": 0.00023609337988989072, "loss": 0.0626, "step": 66010 }, { "epoch": 0.43, "learning_rate": 0.00023608369853553375, "loss": 0.0565, "step": 66020 }, { "epoch": 0.43, "learning_rate": 0.00023607401718117683, "loss": 0.0591, "step": 66030 }, { "epoch": 0.43, "learning_rate": 0.0002360643358268199, "loss": 0.055, "step": 66040 }, { "epoch": 0.43, "learning_rate": 0.000236054654472463, "loss": 0.0614, "step": 66050 }, { "epoch": 0.43, "learning_rate": 0.00023604497311810604, "loss": 0.0514, "step": 66060 }, { "epoch": 0.43, "learning_rate": 0.00023603529176374912, "loss": 0.059, "step": 66070 }, { "epoch": 0.43, "learning_rate": 0.0002360256104093922, "loss": 0.063, "step": 66080 }, { "epoch": 0.43, "learning_rate": 0.00023601592905503522, "loss": 0.0571, "step": 66090 }, { "epoch": 0.43, "learning_rate": 0.0002360062477006783, "loss": 0.0615, "step": 66100 }, { "epoch": 0.43, "learning_rate": 0.00023599656634632138, "loss": 0.0552, "step": 66110 }, { "epoch": 0.43, "learning_rate": 0.00023598688499196446, "loss": 0.0538, "step": 66120 }, { "epoch": 0.43, "learning_rate": 0.00023597720363760752, "loss": 0.0547, "step": 66130 }, { "epoch": 0.43, "learning_rate": 0.0002359675222832506, "loss": 0.0556, "step": 66140 }, { "epoch": 0.43, "learning_rate": 0.00023595784092889368, "loss": 0.0596, "step": 66150 }, { "epoch": 0.43, "learning_rate": 0.0002359481595745367, "loss": 0.0476, "step": 66160 }, { "epoch": 0.43, "learning_rate": 0.00023593847822017978, "loss": 0.0613, "step": 66170 }, { "epoch": 0.43, "learning_rate": 0.00023592879686582286, "loss": 0.0551, "step": 66180 }, { "epoch": 0.43, "learning_rate": 0.00023591911551146594, "loss": 0.0558, "step": 66190 }, { "epoch": 0.43, "learning_rate": 0.000235909434157109, "loss": 0.0576, "step": 66200 }, { "epoch": 0.43, "learning_rate": 0.00023589975280275207, "loss": 0.0547, "step": 66210 }, { "epoch": 0.43, "learning_rate": 0.00023589007144839515, "loss": 0.0589, "step": 66220 }, { "epoch": 0.43, "learning_rate": 0.00023588039009403818, "loss": 0.0587, "step": 66230 }, { "epoch": 0.43, "learning_rate": 0.00023587070873968126, "loss": 0.0619, "step": 66240 }, { "epoch": 0.43, "learning_rate": 0.00023586102738532434, "loss": 0.0695, "step": 66250 }, { "epoch": 0.43, "learning_rate": 0.0002358513460309674, "loss": 0.0587, "step": 66260 }, { "epoch": 0.43, "learning_rate": 0.00023584166467661047, "loss": 0.0608, "step": 66270 }, { "epoch": 0.43, "learning_rate": 0.00023583198332225355, "loss": 0.0639, "step": 66280 }, { "epoch": 0.43, "learning_rate": 0.00023582230196789663, "loss": 0.0585, "step": 66290 }, { "epoch": 0.43, "learning_rate": 0.00023581262061353966, "loss": 0.0587, "step": 66300 }, { "epoch": 0.43, "learning_rate": 0.00023580293925918274, "loss": 0.0509, "step": 66310 }, { "epoch": 0.43, "learning_rate": 0.00023579325790482582, "loss": 0.0502, "step": 66320 }, { "epoch": 0.43, "learning_rate": 0.00023578357655046887, "loss": 0.0529, "step": 66330 }, { "epoch": 0.43, "learning_rate": 0.00023577389519611195, "loss": 0.0548, "step": 66340 }, { "epoch": 0.43, "learning_rate": 0.00023576421384175503, "loss": 0.0536, "step": 66350 }, { "epoch": 0.43, "learning_rate": 0.0002357545324873981, "loss": 0.063, "step": 66360 }, { "epoch": 0.43, "learning_rate": 0.00023574485113304113, "loss": 0.062, "step": 66370 }, { "epoch": 0.43, "learning_rate": 0.0002357351697786842, "loss": 0.061, "step": 66380 }, { "epoch": 0.43, "learning_rate": 0.0002357254884243273, "loss": 0.0604, "step": 66390 }, { "epoch": 0.43, "learning_rate": 0.00023571580706997035, "loss": 0.055, "step": 66400 }, { "epoch": 0.43, "learning_rate": 0.00023570612571561343, "loss": 0.0544, "step": 66410 }, { "epoch": 0.43, "learning_rate": 0.0002356964443612565, "loss": 0.0597, "step": 66420 }, { "epoch": 0.43, "learning_rate": 0.00023568676300689956, "loss": 0.0497, "step": 66430 }, { "epoch": 0.43, "learning_rate": 0.0002356770816525426, "loss": 0.06, "step": 66440 }, { "epoch": 0.43, "learning_rate": 0.0002356674002981857, "loss": 0.0605, "step": 66450 }, { "epoch": 0.43, "learning_rate": 0.00023565771894382874, "loss": 0.0542, "step": 66460 }, { "epoch": 0.43, "learning_rate": 0.00023564803758947182, "loss": 0.0633, "step": 66470 }, { "epoch": 0.43, "learning_rate": 0.0002356383562351149, "loss": 0.0689, "step": 66480 }, { "epoch": 0.43, "learning_rate": 0.00023562867488075798, "loss": 0.0541, "step": 66490 }, { "epoch": 0.43, "learning_rate": 0.00023561899352640104, "loss": 0.0609, "step": 66500 }, { "epoch": 0.43, "learning_rate": 0.0002356093121720441, "loss": 0.0628, "step": 66510 }, { "epoch": 0.43, "learning_rate": 0.00023559963081768717, "loss": 0.0521, "step": 66520 }, { "epoch": 0.43, "learning_rate": 0.00023558994946333022, "loss": 0.0538, "step": 66530 }, { "epoch": 0.43, "learning_rate": 0.0002355802681089733, "loss": 0.0585, "step": 66540 }, { "epoch": 0.43, "learning_rate": 0.00023557058675461638, "loss": 0.0564, "step": 66550 }, { "epoch": 0.43, "learning_rate": 0.00023556090540025946, "loss": 0.0552, "step": 66560 }, { "epoch": 0.43, "learning_rate": 0.0002355512240459025, "loss": 0.0522, "step": 66570 }, { "epoch": 0.43, "learning_rate": 0.00023554154269154556, "loss": 0.0513, "step": 66580 }, { "epoch": 0.43, "learning_rate": 0.00023553186133718864, "loss": 0.0622, "step": 66590 }, { "epoch": 0.43, "learning_rate": 0.0002355221799828317, "loss": 0.0533, "step": 66600 }, { "epoch": 0.43, "learning_rate": 0.00023551249862847478, "loss": 0.0561, "step": 66610 }, { "epoch": 0.43, "learning_rate": 0.00023550281727411786, "loss": 0.0515, "step": 66620 }, { "epoch": 0.43, "learning_rate": 0.0002354931359197609, "loss": 0.0523, "step": 66630 }, { "epoch": 0.43, "learning_rate": 0.000235483454565404, "loss": 0.0557, "step": 66640 }, { "epoch": 0.43, "learning_rate": 0.00023547377321104704, "loss": 0.0566, "step": 66650 }, { "epoch": 0.43, "learning_rate": 0.0002354640918566901, "loss": 0.0558, "step": 66660 }, { "epoch": 0.43, "learning_rate": 0.00023545441050233317, "loss": 0.0539, "step": 66670 }, { "epoch": 0.43, "learning_rate": 0.00023544472914797625, "loss": 0.0523, "step": 66680 }, { "epoch": 0.43, "learning_rate": 0.00023543504779361933, "loss": 0.0569, "step": 66690 }, { "epoch": 0.43, "learning_rate": 0.0002354253664392624, "loss": 0.0587, "step": 66700 }, { "epoch": 0.43, "learning_rate": 0.00023541568508490547, "loss": 0.0476, "step": 66710 }, { "epoch": 0.43, "learning_rate": 0.00023540600373054852, "loss": 0.0497, "step": 66720 }, { "epoch": 0.43, "learning_rate": 0.00023539632237619157, "loss": 0.0526, "step": 66730 }, { "epoch": 0.43, "learning_rate": 0.00023538664102183465, "loss": 0.0614, "step": 66740 }, { "epoch": 0.43, "learning_rate": 0.00023537695966747773, "loss": 0.0529, "step": 66750 }, { "epoch": 0.43, "learning_rate": 0.0002353672783131208, "loss": 0.0526, "step": 66760 }, { "epoch": 0.43, "learning_rate": 0.00023535759695876386, "loss": 0.0583, "step": 66770 }, { "epoch": 0.43, "learning_rate": 0.00023534791560440694, "loss": 0.0525, "step": 66780 }, { "epoch": 0.43, "learning_rate": 0.00023533823425005, "loss": 0.0607, "step": 66790 }, { "epoch": 0.43, "learning_rate": 0.00023532855289569305, "loss": 0.0539, "step": 66800 }, { "epoch": 0.43, "learning_rate": 0.00023531887154133613, "loss": 0.0546, "step": 66810 }, { "epoch": 0.43, "learning_rate": 0.0002353091901869792, "loss": 0.0552, "step": 66820 }, { "epoch": 0.43, "learning_rate": 0.00023529950883262226, "loss": 0.0546, "step": 66830 }, { "epoch": 0.43, "learning_rate": 0.00023528982747826534, "loss": 0.0606, "step": 66840 }, { "epoch": 0.43, "learning_rate": 0.00023528014612390842, "loss": 0.0606, "step": 66850 }, { "epoch": 0.43, "learning_rate": 0.00023527046476955145, "loss": 0.063, "step": 66860 }, { "epoch": 0.43, "learning_rate": 0.00023526078341519453, "loss": 0.0622, "step": 66870 }, { "epoch": 0.43, "learning_rate": 0.0002352511020608376, "loss": 0.0598, "step": 66880 }, { "epoch": 0.43, "learning_rate": 0.00023524142070648069, "loss": 0.058, "step": 66890 }, { "epoch": 0.43, "learning_rate": 0.00023523173935212374, "loss": 0.0589, "step": 66900 }, { "epoch": 0.43, "learning_rate": 0.00023522205799776682, "loss": 0.0546, "step": 66910 }, { "epoch": 0.43, "learning_rate": 0.0002352123766434099, "loss": 0.058, "step": 66920 }, { "epoch": 0.43, "learning_rate": 0.00023520269528905292, "loss": 0.0549, "step": 66930 }, { "epoch": 0.43, "learning_rate": 0.000235193013934696, "loss": 0.056, "step": 66940 }, { "epoch": 0.43, "learning_rate": 0.00023518333258033908, "loss": 0.0592, "step": 66950 }, { "epoch": 0.43, "learning_rate": 0.00023517365122598216, "loss": 0.0549, "step": 66960 }, { "epoch": 0.43, "learning_rate": 0.00023516396987162522, "loss": 0.0613, "step": 66970 }, { "epoch": 0.43, "learning_rate": 0.0002351542885172683, "loss": 0.0532, "step": 66980 }, { "epoch": 0.43, "learning_rate": 0.00023514460716291138, "loss": 0.055, "step": 66990 }, { "epoch": 0.43, "learning_rate": 0.0002351349258085544, "loss": 0.0566, "step": 67000 }, { "epoch": 0.43, "eval_cer": 0.9199828267992317, "eval_loss": 0.03815074265003204, "eval_runtime": 120.3509, "eval_samples_per_second": 16.618, "eval_steps_per_second": 4.155, "step": 67000 }, { "epoch": 0.43, "learning_rate": 0.00023512524445419748, "loss": 0.0598, "step": 67010 }, { "epoch": 0.43, "learning_rate": 0.00023511556309984056, "loss": 0.0573, "step": 67020 }, { "epoch": 0.43, "learning_rate": 0.0002351058817454836, "loss": 0.0583, "step": 67030 }, { "epoch": 0.43, "learning_rate": 0.0002350962003911267, "loss": 0.0672, "step": 67040 }, { "epoch": 0.43, "learning_rate": 0.00023508651903676977, "loss": 0.049, "step": 67050 }, { "epoch": 0.43, "learning_rate": 0.00023507683768241285, "loss": 0.0637, "step": 67060 }, { "epoch": 0.43, "learning_rate": 0.00023506715632805588, "loss": 0.0563, "step": 67070 }, { "epoch": 0.43, "learning_rate": 0.00023505747497369896, "loss": 0.0584, "step": 67080 }, { "epoch": 0.43, "learning_rate": 0.00023504779361934204, "loss": 0.0561, "step": 67090 }, { "epoch": 0.43, "learning_rate": 0.0002350381122649851, "loss": 0.0594, "step": 67100 }, { "epoch": 0.43, "learning_rate": 0.00023502843091062817, "loss": 0.0604, "step": 67110 }, { "epoch": 0.43, "learning_rate": 0.00023501874955627125, "loss": 0.0545, "step": 67120 }, { "epoch": 0.43, "learning_rate": 0.00023500906820191433, "loss": 0.0666, "step": 67130 }, { "epoch": 0.43, "learning_rate": 0.00023499938684755736, "loss": 0.0609, "step": 67140 }, { "epoch": 0.43, "learning_rate": 0.00023498970549320044, "loss": 0.0576, "step": 67150 }, { "epoch": 0.43, "learning_rate": 0.00023498002413884352, "loss": 0.0568, "step": 67160 }, { "epoch": 0.43, "learning_rate": 0.00023497034278448657, "loss": 0.0498, "step": 67170 }, { "epoch": 0.43, "learning_rate": 0.00023496066143012965, "loss": 0.055, "step": 67180 }, { "epoch": 0.43, "learning_rate": 0.00023495098007577273, "loss": 0.0568, "step": 67190 }, { "epoch": 0.43, "learning_rate": 0.0002349412987214158, "loss": 0.0519, "step": 67200 }, { "epoch": 0.43, "learning_rate": 0.00023493161736705883, "loss": 0.0541, "step": 67210 }, { "epoch": 0.43, "learning_rate": 0.0002349219360127019, "loss": 0.0535, "step": 67220 }, { "epoch": 0.43, "learning_rate": 0.00023491225465834497, "loss": 0.0559, "step": 67230 }, { "epoch": 0.43, "learning_rate": 0.00023490257330398805, "loss": 0.0535, "step": 67240 }, { "epoch": 0.43, "learning_rate": 0.00023489289194963112, "loss": 0.0535, "step": 67250 }, { "epoch": 0.43, "learning_rate": 0.0002348832105952742, "loss": 0.0533, "step": 67260 }, { "epoch": 0.43, "learning_rate": 0.00023487352924091726, "loss": 0.0622, "step": 67270 }, { "epoch": 0.43, "learning_rate": 0.0002348638478865603, "loss": 0.0537, "step": 67280 }, { "epoch": 0.43, "learning_rate": 0.0002348541665322034, "loss": 0.0621, "step": 67290 }, { "epoch": 0.43, "learning_rate": 0.00023484448517784644, "loss": 0.0557, "step": 67300 }, { "epoch": 0.43, "learning_rate": 0.00023483480382348952, "loss": 0.0601, "step": 67310 }, { "epoch": 0.43, "learning_rate": 0.0002348251224691326, "loss": 0.0525, "step": 67320 }, { "epoch": 0.43, "learning_rate": 0.00023481544111477568, "loss": 0.0629, "step": 67330 }, { "epoch": 0.43, "learning_rate": 0.00023480575976041873, "loss": 0.0596, "step": 67340 }, { "epoch": 0.43, "learning_rate": 0.0002347960784060618, "loss": 0.0608, "step": 67350 }, { "epoch": 0.43, "learning_rate": 0.00023478639705170487, "loss": 0.0551, "step": 67360 }, { "epoch": 0.43, "learning_rate": 0.00023477671569734792, "loss": 0.0576, "step": 67370 }, { "epoch": 0.43, "learning_rate": 0.000234767034342991, "loss": 0.0582, "step": 67380 }, { "epoch": 0.43, "learning_rate": 0.00023475735298863408, "loss": 0.058, "step": 67390 }, { "epoch": 0.44, "learning_rate": 0.00023474767163427716, "loss": 0.0663, "step": 67400 }, { "epoch": 0.44, "learning_rate": 0.0002347379902799202, "loss": 0.0524, "step": 67410 }, { "epoch": 0.44, "learning_rate": 0.00023472830892556326, "loss": 0.0529, "step": 67420 }, { "epoch": 0.44, "learning_rate": 0.00023471862757120632, "loss": 0.0584, "step": 67430 }, { "epoch": 0.44, "learning_rate": 0.0002347089462168494, "loss": 0.0548, "step": 67440 }, { "epoch": 0.44, "learning_rate": 0.00023469926486249248, "loss": 0.0566, "step": 67450 }, { "epoch": 0.44, "learning_rate": 0.00023468958350813556, "loss": 0.0536, "step": 67460 }, { "epoch": 0.44, "learning_rate": 0.0002346799021537786, "loss": 0.0559, "step": 67470 }, { "epoch": 0.44, "learning_rate": 0.0002346702207994217, "loss": 0.0556, "step": 67480 }, { "epoch": 0.44, "learning_rate": 0.00023466053944506474, "loss": 0.0602, "step": 67490 }, { "epoch": 0.44, "learning_rate": 0.0002346508580907078, "loss": 0.0533, "step": 67500 }, { "epoch": 0.44, "learning_rate": 0.00023464117673635087, "loss": 0.0514, "step": 67510 }, { "epoch": 0.44, "learning_rate": 0.00023463149538199395, "loss": 0.0533, "step": 67520 }, { "epoch": 0.44, "learning_rate": 0.00023462181402763703, "loss": 0.052, "step": 67530 }, { "epoch": 0.44, "learning_rate": 0.0002346121326732801, "loss": 0.053, "step": 67540 }, { "epoch": 0.44, "learning_rate": 0.00023460245131892317, "loss": 0.0568, "step": 67550 }, { "epoch": 0.44, "learning_rate": 0.00023459276996456622, "loss": 0.0509, "step": 67560 }, { "epoch": 0.44, "learning_rate": 0.00023458308861020927, "loss": 0.0537, "step": 67570 }, { "epoch": 0.44, "learning_rate": 0.00023457340725585235, "loss": 0.0551, "step": 67580 }, { "epoch": 0.44, "learning_rate": 0.00023456372590149543, "loss": 0.0572, "step": 67590 }, { "epoch": 0.44, "learning_rate": 0.0002345540445471385, "loss": 0.0614, "step": 67600 }, { "epoch": 0.44, "learning_rate": 0.00023454436319278156, "loss": 0.0599, "step": 67610 }, { "epoch": 0.44, "learning_rate": 0.00023453468183842464, "loss": 0.0543, "step": 67620 }, { "epoch": 0.44, "learning_rate": 0.00023452500048406767, "loss": 0.0543, "step": 67630 }, { "epoch": 0.44, "learning_rate": 0.00023451531912971075, "loss": 0.0632, "step": 67640 }, { "epoch": 0.44, "learning_rate": 0.00023450563777535383, "loss": 0.0636, "step": 67650 }, { "epoch": 0.44, "learning_rate": 0.0002344959564209969, "loss": 0.0528, "step": 67660 }, { "epoch": 0.44, "learning_rate": 0.00023448627506663996, "loss": 0.0623, "step": 67670 }, { "epoch": 0.44, "learning_rate": 0.00023447659371228304, "loss": 0.0648, "step": 67680 }, { "epoch": 0.44, "learning_rate": 0.00023446691235792612, "loss": 0.0548, "step": 67690 }, { "epoch": 0.44, "learning_rate": 0.00023445723100356915, "loss": 0.0534, "step": 67700 }, { "epoch": 0.44, "learning_rate": 0.00023444754964921223, "loss": 0.0528, "step": 67710 }, { "epoch": 0.44, "learning_rate": 0.0002344378682948553, "loss": 0.0655, "step": 67720 }, { "epoch": 0.44, "learning_rate": 0.00023442818694049839, "loss": 0.0704, "step": 67730 }, { "epoch": 0.44, "learning_rate": 0.00023441850558614144, "loss": 0.0585, "step": 67740 }, { "epoch": 0.44, "learning_rate": 0.00023440882423178452, "loss": 0.0551, "step": 67750 }, { "epoch": 0.44, "learning_rate": 0.0002343991428774276, "loss": 0.0629, "step": 67760 }, { "epoch": 0.44, "learning_rate": 0.00023438946152307062, "loss": 0.0563, "step": 67770 }, { "epoch": 0.44, "learning_rate": 0.0002343797801687137, "loss": 0.0551, "step": 67780 }, { "epoch": 0.44, "learning_rate": 0.00023437009881435678, "loss": 0.0529, "step": 67790 }, { "epoch": 0.44, "learning_rate": 0.00023436041745999986, "loss": 0.0505, "step": 67800 }, { "epoch": 0.44, "learning_rate": 0.00023435073610564292, "loss": 0.0555, "step": 67810 }, { "epoch": 0.44, "learning_rate": 0.000234341054751286, "loss": 0.0563, "step": 67820 }, { "epoch": 0.44, "learning_rate": 0.00023433137339692908, "loss": 0.0563, "step": 67830 }, { "epoch": 0.44, "learning_rate": 0.0002343216920425721, "loss": 0.0685, "step": 67840 }, { "epoch": 0.44, "learning_rate": 0.00023431201068821518, "loss": 0.0591, "step": 67850 }, { "epoch": 0.44, "learning_rate": 0.00023430232933385826, "loss": 0.0588, "step": 67860 }, { "epoch": 0.44, "learning_rate": 0.0002342926479795013, "loss": 0.0577, "step": 67870 }, { "epoch": 0.44, "learning_rate": 0.0002342829666251444, "loss": 0.0579, "step": 67880 }, { "epoch": 0.44, "learning_rate": 0.00023427328527078747, "loss": 0.0523, "step": 67890 }, { "epoch": 0.44, "learning_rate": 0.00023426360391643055, "loss": 0.0682, "step": 67900 }, { "epoch": 0.44, "learning_rate": 0.00023425392256207358, "loss": 0.0552, "step": 67910 }, { "epoch": 0.44, "learning_rate": 0.00023424424120771666, "loss": 0.0577, "step": 67920 }, { "epoch": 0.44, "learning_rate": 0.00023423455985335974, "loss": 0.0591, "step": 67930 }, { "epoch": 0.44, "learning_rate": 0.0002342248784990028, "loss": 0.0542, "step": 67940 }, { "epoch": 0.44, "learning_rate": 0.00023421519714464587, "loss": 0.0642, "step": 67950 }, { "epoch": 0.44, "learning_rate": 0.00023420551579028895, "loss": 0.0561, "step": 67960 }, { "epoch": 0.44, "learning_rate": 0.00023419583443593203, "loss": 0.0587, "step": 67970 }, { "epoch": 0.44, "learning_rate": 0.00023418615308157506, "loss": 0.061, "step": 67980 }, { "epoch": 0.44, "learning_rate": 0.00023417647172721814, "loss": 0.0523, "step": 67990 }, { "epoch": 0.44, "learning_rate": 0.00023416679037286121, "loss": 0.0616, "step": 68000 }, { "epoch": 0.44, "eval_cer": 0.9200415772229127, "eval_loss": 0.037961166352033615, "eval_runtime": 120.0353, "eval_samples_per_second": 16.662, "eval_steps_per_second": 4.165, "step": 68000 }, { "epoch": 0.44, "learning_rate": 0.00023415710901850427, "loss": 0.0578, "step": 68010 }, { "epoch": 0.44, "learning_rate": 0.00023414742766414735, "loss": 0.0671, "step": 68020 }, { "epoch": 0.44, "learning_rate": 0.00023413774630979043, "loss": 0.057, "step": 68030 }, { "epoch": 0.44, "learning_rate": 0.00023412806495543348, "loss": 0.0556, "step": 68040 }, { "epoch": 0.44, "learning_rate": 0.00023411838360107653, "loss": 0.0527, "step": 68050 }, { "epoch": 0.44, "learning_rate": 0.0002341087022467196, "loss": 0.0571, "step": 68060 }, { "epoch": 0.44, "learning_rate": 0.00023409902089236266, "loss": 0.0492, "step": 68070 }, { "epoch": 0.44, "learning_rate": 0.00023408933953800574, "loss": 0.0555, "step": 68080 }, { "epoch": 0.44, "learning_rate": 0.00023407965818364882, "loss": 0.0581, "step": 68090 }, { "epoch": 0.44, "learning_rate": 0.0002340699768292919, "loss": 0.0528, "step": 68100 }, { "epoch": 0.44, "learning_rate": 0.00023406029547493496, "loss": 0.0589, "step": 68110 }, { "epoch": 0.44, "learning_rate": 0.000234050614120578, "loss": 0.0609, "step": 68120 }, { "epoch": 0.44, "learning_rate": 0.0002340409327662211, "loss": 0.0625, "step": 68130 }, { "epoch": 0.44, "learning_rate": 0.00023403125141186414, "loss": 0.0516, "step": 68140 }, { "epoch": 0.44, "learning_rate": 0.00023402157005750722, "loss": 0.0582, "step": 68150 }, { "epoch": 0.44, "learning_rate": 0.0002340118887031503, "loss": 0.0571, "step": 68160 }, { "epoch": 0.44, "learning_rate": 0.00023400220734879338, "loss": 0.0572, "step": 68170 }, { "epoch": 0.44, "learning_rate": 0.00023399252599443643, "loss": 0.0534, "step": 68180 }, { "epoch": 0.44, "learning_rate": 0.0002339828446400795, "loss": 0.0546, "step": 68190 }, { "epoch": 0.44, "learning_rate": 0.00023397316328572257, "loss": 0.0589, "step": 68200 }, { "epoch": 0.44, "learning_rate": 0.00023396348193136562, "loss": 0.0536, "step": 68210 }, { "epoch": 0.44, "learning_rate": 0.0002339538005770087, "loss": 0.0562, "step": 68220 }, { "epoch": 0.44, "learning_rate": 0.00023394411922265178, "loss": 0.0606, "step": 68230 }, { "epoch": 0.44, "learning_rate": 0.00023393443786829483, "loss": 0.0552, "step": 68240 }, { "epoch": 0.44, "learning_rate": 0.0002339247565139379, "loss": 0.0787, "step": 68250 }, { "epoch": 0.44, "learning_rate": 0.00023391507515958096, "loss": 0.0532, "step": 68260 }, { "epoch": 0.44, "learning_rate": 0.00023390539380522402, "loss": 0.06, "step": 68270 }, { "epoch": 0.44, "learning_rate": 0.0002338957124508671, "loss": 0.0576, "step": 68280 }, { "epoch": 0.44, "learning_rate": 0.00023388603109651018, "loss": 0.0572, "step": 68290 }, { "epoch": 0.44, "learning_rate": 0.00023387634974215326, "loss": 0.0604, "step": 68300 }, { "epoch": 0.44, "learning_rate": 0.0002338666683877963, "loss": 0.0529, "step": 68310 }, { "epoch": 0.44, "learning_rate": 0.0002338569870334394, "loss": 0.0519, "step": 68320 }, { "epoch": 0.44, "learning_rate": 0.00023384730567908244, "loss": 0.0574, "step": 68330 }, { "epoch": 0.44, "learning_rate": 0.0002338376243247255, "loss": 0.0586, "step": 68340 }, { "epoch": 0.44, "learning_rate": 0.00023382794297036857, "loss": 0.0618, "step": 68350 }, { "epoch": 0.44, "learning_rate": 0.00023381826161601165, "loss": 0.058, "step": 68360 }, { "epoch": 0.44, "learning_rate": 0.00023380858026165473, "loss": 0.0589, "step": 68370 }, { "epoch": 0.44, "learning_rate": 0.00023379889890729779, "loss": 0.0495, "step": 68380 }, { "epoch": 0.44, "learning_rate": 0.00023378921755294087, "loss": 0.0566, "step": 68390 }, { "epoch": 0.44, "learning_rate": 0.00023377953619858392, "loss": 0.0578, "step": 68400 }, { "epoch": 0.44, "learning_rate": 0.00023376985484422697, "loss": 0.0478, "step": 68410 }, { "epoch": 0.44, "learning_rate": 0.00023376017348987005, "loss": 0.0541, "step": 68420 }, { "epoch": 0.44, "learning_rate": 0.00023375049213551313, "loss": 0.0664, "step": 68430 }, { "epoch": 0.44, "learning_rate": 0.00023374081078115618, "loss": 0.058, "step": 68440 }, { "epoch": 0.44, "learning_rate": 0.00023373112942679926, "loss": 0.0531, "step": 68450 }, { "epoch": 0.44, "learning_rate": 0.00023372144807244234, "loss": 0.0541, "step": 68460 }, { "epoch": 0.44, "learning_rate": 0.00023371176671808537, "loss": 0.0587, "step": 68470 }, { "epoch": 0.44, "learning_rate": 0.00023370208536372845, "loss": 0.0557, "step": 68480 }, { "epoch": 0.44, "learning_rate": 0.00023369240400937153, "loss": 0.0504, "step": 68490 }, { "epoch": 0.44, "learning_rate": 0.0002336827226550146, "loss": 0.0594, "step": 68500 }, { "epoch": 0.44, "learning_rate": 0.00023367304130065766, "loss": 0.0472, "step": 68510 }, { "epoch": 0.44, "learning_rate": 0.00023366335994630074, "loss": 0.0519, "step": 68520 }, { "epoch": 0.44, "learning_rate": 0.00023365367859194382, "loss": 0.0583, "step": 68530 }, { "epoch": 0.44, "learning_rate": 0.00023364399723758685, "loss": 0.0664, "step": 68540 }, { "epoch": 0.44, "learning_rate": 0.00023363431588322993, "loss": 0.0581, "step": 68550 }, { "epoch": 0.44, "learning_rate": 0.000233624634528873, "loss": 0.0601, "step": 68560 }, { "epoch": 0.44, "learning_rate": 0.00023361495317451609, "loss": 0.0547, "step": 68570 }, { "epoch": 0.44, "learning_rate": 0.00023360527182015914, "loss": 0.0559, "step": 68580 }, { "epoch": 0.44, "learning_rate": 0.00023359559046580222, "loss": 0.0549, "step": 68590 }, { "epoch": 0.44, "learning_rate": 0.0002335859091114453, "loss": 0.0584, "step": 68600 }, { "epoch": 0.44, "learning_rate": 0.00023357622775708832, "loss": 0.064, "step": 68610 }, { "epoch": 0.44, "learning_rate": 0.0002335665464027314, "loss": 0.0633, "step": 68620 }, { "epoch": 0.44, "learning_rate": 0.00023355686504837448, "loss": 0.0556, "step": 68630 }, { "epoch": 0.44, "learning_rate": 0.00023354718369401754, "loss": 0.0585, "step": 68640 }, { "epoch": 0.44, "learning_rate": 0.00023353750233966062, "loss": 0.0584, "step": 68650 }, { "epoch": 0.44, "learning_rate": 0.0002335278209853037, "loss": 0.0558, "step": 68660 }, { "epoch": 0.44, "learning_rate": 0.00023351813963094677, "loss": 0.0589, "step": 68670 }, { "epoch": 0.44, "learning_rate": 0.0002335084582765898, "loss": 0.053, "step": 68680 }, { "epoch": 0.44, "learning_rate": 0.00023349877692223288, "loss": 0.0546, "step": 68690 }, { "epoch": 0.44, "learning_rate": 0.00023348909556787596, "loss": 0.0588, "step": 68700 }, { "epoch": 0.44, "learning_rate": 0.000233479414213519, "loss": 0.0498, "step": 68710 }, { "epoch": 0.44, "learning_rate": 0.0002334697328591621, "loss": 0.0538, "step": 68720 }, { "epoch": 0.44, "learning_rate": 0.00023346005150480517, "loss": 0.0679, "step": 68730 }, { "epoch": 0.44, "learning_rate": 0.00023345037015044825, "loss": 0.0512, "step": 68740 }, { "epoch": 0.44, "learning_rate": 0.00023344068879609128, "loss": 0.0504, "step": 68750 }, { "epoch": 0.44, "learning_rate": 0.00023343100744173436, "loss": 0.0545, "step": 68760 }, { "epoch": 0.44, "learning_rate": 0.00023342132608737744, "loss": 0.0549, "step": 68770 }, { "epoch": 0.44, "learning_rate": 0.0002334116447330205, "loss": 0.0555, "step": 68780 }, { "epoch": 0.44, "learning_rate": 0.00023340196337866357, "loss": 0.0544, "step": 68790 }, { "epoch": 0.44, "learning_rate": 0.00023339228202430665, "loss": 0.0503, "step": 68800 }, { "epoch": 0.44, "learning_rate": 0.0002333826006699497, "loss": 0.0496, "step": 68810 }, { "epoch": 0.44, "learning_rate": 0.00023337291931559275, "loss": 0.056, "step": 68820 }, { "epoch": 0.44, "learning_rate": 0.00023336323796123583, "loss": 0.0513, "step": 68830 }, { "epoch": 0.44, "learning_rate": 0.0002333535566068789, "loss": 0.0518, "step": 68840 }, { "epoch": 0.44, "learning_rate": 0.00023334387525252197, "loss": 0.0498, "step": 68850 }, { "epoch": 0.44, "learning_rate": 0.00023333419389816505, "loss": 0.057, "step": 68860 }, { "epoch": 0.44, "learning_rate": 0.00023332451254380813, "loss": 0.0604, "step": 68870 }, { "epoch": 0.44, "learning_rate": 0.00023331483118945118, "loss": 0.0599, "step": 68880 }, { "epoch": 0.44, "learning_rate": 0.00023330514983509423, "loss": 0.0609, "step": 68890 }, { "epoch": 0.44, "learning_rate": 0.0002332954684807373, "loss": 0.0557, "step": 68900 }, { "epoch": 0.44, "learning_rate": 0.00023328578712638036, "loss": 0.0592, "step": 68910 }, { "epoch": 0.44, "learning_rate": 0.00023327610577202344, "loss": 0.0638, "step": 68920 }, { "epoch": 0.44, "learning_rate": 0.00023326642441766652, "loss": 0.048, "step": 68930 }, { "epoch": 0.44, "learning_rate": 0.0002332567430633096, "loss": 0.0504, "step": 68940 }, { "epoch": 0.45, "learning_rate": 0.00023324706170895266, "loss": 0.0658, "step": 68950 }, { "epoch": 0.45, "learning_rate": 0.0002332373803545957, "loss": 0.0555, "step": 68960 }, { "epoch": 0.45, "learning_rate": 0.0002332276990002388, "loss": 0.0578, "step": 68970 }, { "epoch": 0.45, "learning_rate": 0.00023321801764588184, "loss": 0.0612, "step": 68980 }, { "epoch": 0.45, "learning_rate": 0.00023320833629152492, "loss": 0.0544, "step": 68990 }, { "epoch": 0.45, "learning_rate": 0.000233198654937168, "loss": 0.0666, "step": 69000 }, { "epoch": 0.45, "eval_cer": 0.9200650773923851, "eval_loss": 0.03810597211122513, "eval_runtime": 120.1331, "eval_samples_per_second": 16.648, "eval_steps_per_second": 4.162, "step": 69000 }, { "epoch": 0.45, "learning_rate": 0.00023318897358281105, "loss": 0.0587, "step": 69010 }, { "epoch": 0.45, "learning_rate": 0.00023317929222845413, "loss": 0.0553, "step": 69020 }, { "epoch": 0.45, "learning_rate": 0.0002331696108740972, "loss": 0.0561, "step": 69030 }, { "epoch": 0.45, "learning_rate": 0.00023315992951974024, "loss": 0.0529, "step": 69040 }, { "epoch": 0.45, "learning_rate": 0.00023315024816538332, "loss": 0.0568, "step": 69050 }, { "epoch": 0.45, "learning_rate": 0.0002331405668110264, "loss": 0.0571, "step": 69060 }, { "epoch": 0.45, "learning_rate": 0.00023313088545666948, "loss": 0.0552, "step": 69070 }, { "epoch": 0.45, "learning_rate": 0.00023312120410231253, "loss": 0.0554, "step": 69080 }, { "epoch": 0.45, "learning_rate": 0.0002331115227479556, "loss": 0.0476, "step": 69090 }, { "epoch": 0.45, "learning_rate": 0.00023310184139359866, "loss": 0.0468, "step": 69100 }, { "epoch": 0.45, "learning_rate": 0.00023309216003924172, "loss": 0.0556, "step": 69110 }, { "epoch": 0.45, "learning_rate": 0.0002330824786848848, "loss": 0.0542, "step": 69120 }, { "epoch": 0.45, "learning_rate": 0.00023307279733052788, "loss": 0.0551, "step": 69130 }, { "epoch": 0.45, "learning_rate": 0.00023306311597617096, "loss": 0.053, "step": 69140 }, { "epoch": 0.45, "learning_rate": 0.000233053434621814, "loss": 0.0623, "step": 69150 }, { "epoch": 0.45, "learning_rate": 0.0002330437532674571, "loss": 0.0535, "step": 69160 }, { "epoch": 0.45, "learning_rate": 0.00023303407191310014, "loss": 0.0609, "step": 69170 }, { "epoch": 0.45, "learning_rate": 0.0002330243905587432, "loss": 0.0489, "step": 69180 }, { "epoch": 0.45, "learning_rate": 0.00023301470920438627, "loss": 0.0572, "step": 69190 }, { "epoch": 0.45, "learning_rate": 0.00023300502785002935, "loss": 0.0567, "step": 69200 }, { "epoch": 0.45, "learning_rate": 0.0002329953464956724, "loss": 0.0587, "step": 69210 }, { "epoch": 0.45, "learning_rate": 0.00023298566514131549, "loss": 0.0486, "step": 69220 }, { "epoch": 0.45, "learning_rate": 0.00023297598378695857, "loss": 0.0524, "step": 69230 }, { "epoch": 0.45, "learning_rate": 0.0002329663024326016, "loss": 0.0528, "step": 69240 }, { "epoch": 0.45, "learning_rate": 0.00023295662107824467, "loss": 0.0525, "step": 69250 }, { "epoch": 0.45, "learning_rate": 0.00023294693972388775, "loss": 0.0505, "step": 69260 }, { "epoch": 0.45, "learning_rate": 0.00023293725836953083, "loss": 0.0529, "step": 69270 }, { "epoch": 0.45, "learning_rate": 0.00023292757701517388, "loss": 0.0539, "step": 69280 }, { "epoch": 0.45, "learning_rate": 0.00023291789566081696, "loss": 0.0517, "step": 69290 }, { "epoch": 0.45, "learning_rate": 0.00023290821430646004, "loss": 0.0502, "step": 69300 }, { "epoch": 0.45, "learning_rate": 0.00023289853295210307, "loss": 0.0524, "step": 69310 }, { "epoch": 0.45, "learning_rate": 0.00023288885159774615, "loss": 0.0645, "step": 69320 }, { "epoch": 0.45, "learning_rate": 0.00023287917024338923, "loss": 0.0584, "step": 69330 }, { "epoch": 0.45, "learning_rate": 0.0002328694888890323, "loss": 0.057, "step": 69340 }, { "epoch": 0.45, "learning_rate": 0.00023285980753467536, "loss": 0.063, "step": 69350 }, { "epoch": 0.45, "learning_rate": 0.00023285012618031844, "loss": 0.0464, "step": 69360 }, { "epoch": 0.45, "learning_rate": 0.00023284044482596152, "loss": 0.0527, "step": 69370 }, { "epoch": 0.45, "learning_rate": 0.00023283076347160455, "loss": 0.0547, "step": 69380 }, { "epoch": 0.45, "learning_rate": 0.00023282108211724763, "loss": 0.0519, "step": 69390 }, { "epoch": 0.45, "learning_rate": 0.0002328114007628907, "loss": 0.0517, "step": 69400 }, { "epoch": 0.45, "learning_rate": 0.00023280171940853376, "loss": 0.0556, "step": 69410 }, { "epoch": 0.45, "learning_rate": 0.00023279203805417684, "loss": 0.0553, "step": 69420 }, { "epoch": 0.45, "learning_rate": 0.00023278235669981992, "loss": 0.0545, "step": 69430 }, { "epoch": 0.45, "learning_rate": 0.000232772675345463, "loss": 0.0557, "step": 69440 }, { "epoch": 0.45, "learning_rate": 0.00023276299399110602, "loss": 0.0585, "step": 69450 }, { "epoch": 0.45, "learning_rate": 0.0002327533126367491, "loss": 0.0521, "step": 69460 }, { "epoch": 0.45, "learning_rate": 0.00023274363128239218, "loss": 0.0526, "step": 69470 }, { "epoch": 0.45, "learning_rate": 0.00023273394992803524, "loss": 0.0474, "step": 69480 }, { "epoch": 0.45, "learning_rate": 0.00023272426857367831, "loss": 0.0556, "step": 69490 }, { "epoch": 0.45, "learning_rate": 0.0002327145872193214, "loss": 0.0562, "step": 69500 }, { "epoch": 0.45, "learning_rate": 0.00023270490586496447, "loss": 0.0521, "step": 69510 }, { "epoch": 0.45, "learning_rate": 0.0002326952245106075, "loss": 0.055, "step": 69520 }, { "epoch": 0.45, "learning_rate": 0.00023268554315625058, "loss": 0.0512, "step": 69530 }, { "epoch": 0.45, "learning_rate": 0.00023267586180189366, "loss": 0.0538, "step": 69540 }, { "epoch": 0.45, "learning_rate": 0.0002326661804475367, "loss": 0.0614, "step": 69550 }, { "epoch": 0.45, "learning_rate": 0.0002326564990931798, "loss": 0.0563, "step": 69560 }, { "epoch": 0.45, "learning_rate": 0.00023264681773882287, "loss": 0.0509, "step": 69570 }, { "epoch": 0.45, "learning_rate": 0.00023263713638446595, "loss": 0.0632, "step": 69580 }, { "epoch": 0.45, "learning_rate": 0.00023262745503010898, "loss": 0.0522, "step": 69590 }, { "epoch": 0.45, "learning_rate": 0.00023261777367575206, "loss": 0.0613, "step": 69600 }, { "epoch": 0.45, "learning_rate": 0.0002326080923213951, "loss": 0.0475, "step": 69610 }, { "epoch": 0.45, "learning_rate": 0.0002325984109670382, "loss": 0.0511, "step": 69620 }, { "epoch": 0.45, "learning_rate": 0.00023258872961268127, "loss": 0.0527, "step": 69630 }, { "epoch": 0.45, "learning_rate": 0.00023257904825832435, "loss": 0.0522, "step": 69640 }, { "epoch": 0.45, "learning_rate": 0.0002325693669039674, "loss": 0.0541, "step": 69650 }, { "epoch": 0.45, "learning_rate": 0.00023255968554961045, "loss": 0.0592, "step": 69660 }, { "epoch": 0.45, "learning_rate": 0.00023255000419525353, "loss": 0.0566, "step": 69670 }, { "epoch": 0.45, "learning_rate": 0.0002325403228408966, "loss": 0.0523, "step": 69680 }, { "epoch": 0.45, "learning_rate": 0.00023253064148653967, "loss": 0.0487, "step": 69690 }, { "epoch": 0.45, "learning_rate": 0.00023252096013218275, "loss": 0.0548, "step": 69700 }, { "epoch": 0.45, "learning_rate": 0.00023251127877782583, "loss": 0.0527, "step": 69710 }, { "epoch": 0.45, "learning_rate": 0.00023250159742346888, "loss": 0.0542, "step": 69720 }, { "epoch": 0.45, "learning_rate": 0.00023249191606911193, "loss": 0.0548, "step": 69730 }, { "epoch": 0.45, "learning_rate": 0.000232482234714755, "loss": 0.0534, "step": 69740 }, { "epoch": 0.45, "learning_rate": 0.00023247255336039806, "loss": 0.0528, "step": 69750 }, { "epoch": 0.45, "learning_rate": 0.00023246287200604114, "loss": 0.059, "step": 69760 }, { "epoch": 0.45, "learning_rate": 0.00023245319065168422, "loss": 0.0542, "step": 69770 }, { "epoch": 0.45, "learning_rate": 0.0002324435092973273, "loss": 0.055, "step": 69780 }, { "epoch": 0.45, "learning_rate": 0.00023243382794297036, "loss": 0.0507, "step": 69790 }, { "epoch": 0.45, "learning_rate": 0.0002324241465886134, "loss": 0.0558, "step": 69800 }, { "epoch": 0.45, "learning_rate": 0.00023241446523425646, "loss": 0.0589, "step": 69810 }, { "epoch": 0.45, "learning_rate": 0.00023240478387989954, "loss": 0.0519, "step": 69820 }, { "epoch": 0.45, "learning_rate": 0.00023239510252554262, "loss": 0.0562, "step": 69830 }, { "epoch": 0.45, "learning_rate": 0.0002323854211711857, "loss": 0.0522, "step": 69840 }, { "epoch": 0.45, "learning_rate": 0.00023237573981682875, "loss": 0.0621, "step": 69850 }, { "epoch": 0.45, "learning_rate": 0.00023236605846247183, "loss": 0.0582, "step": 69860 }, { "epoch": 0.45, "learning_rate": 0.00023235637710811489, "loss": 0.0545, "step": 69870 }, { "epoch": 0.45, "learning_rate": 0.00023234669575375794, "loss": 0.0558, "step": 69880 }, { "epoch": 0.45, "learning_rate": 0.00023233701439940102, "loss": 0.0557, "step": 69890 }, { "epoch": 0.45, "learning_rate": 0.0002323273330450441, "loss": 0.0543, "step": 69900 }, { "epoch": 0.45, "learning_rate": 0.00023231765169068718, "loss": 0.0531, "step": 69910 }, { "epoch": 0.45, "learning_rate": 0.00023230797033633023, "loss": 0.0497, "step": 69920 }, { "epoch": 0.45, "learning_rate": 0.0002322982889819733, "loss": 0.055, "step": 69930 }, { "epoch": 0.45, "learning_rate": 0.00023228860762761636, "loss": 0.0605, "step": 69940 }, { "epoch": 0.45, "learning_rate": 0.00023227892627325942, "loss": 0.0501, "step": 69950 }, { "epoch": 0.45, "learning_rate": 0.0002322692449189025, "loss": 0.0527, "step": 69960 }, { "epoch": 0.45, "learning_rate": 0.00023225956356454558, "loss": 0.0534, "step": 69970 }, { "epoch": 0.45, "learning_rate": 0.00023224988221018866, "loss": 0.0583, "step": 69980 }, { "epoch": 0.45, "learning_rate": 0.0002322402008558317, "loss": 0.0585, "step": 69990 }, { "epoch": 0.45, "learning_rate": 0.0002322305195014748, "loss": 0.052, "step": 70000 }, { "epoch": 0.45, "eval_cer": 0.9199529996610553, "eval_loss": 0.037266287952661514, "eval_runtime": 120.2383, "eval_samples_per_second": 16.634, "eval_steps_per_second": 4.158, "step": 70000 }, { "epoch": 0.45, "learning_rate": 0.0002322208381471178, "loss": 0.0492, "step": 70010 }, { "epoch": 0.45, "learning_rate": 0.0002322111567927609, "loss": 0.0508, "step": 70020 }, { "epoch": 0.45, "learning_rate": 0.00023220147543840397, "loss": 0.0482, "step": 70030 }, { "epoch": 0.45, "learning_rate": 0.00023219179408404705, "loss": 0.0495, "step": 70040 }, { "epoch": 0.45, "learning_rate": 0.0002321821127296901, "loss": 0.0539, "step": 70050 }, { "epoch": 0.45, "learning_rate": 0.00023217243137533319, "loss": 0.0576, "step": 70060 }, { "epoch": 0.45, "learning_rate": 0.00023216275002097627, "loss": 0.0543, "step": 70070 }, { "epoch": 0.45, "learning_rate": 0.0002321530686666193, "loss": 0.0547, "step": 70080 }, { "epoch": 0.45, "learning_rate": 0.00023214338731226237, "loss": 0.0538, "step": 70090 }, { "epoch": 0.45, "learning_rate": 0.00023213370595790545, "loss": 0.0468, "step": 70100 }, { "epoch": 0.45, "learning_rate": 0.00023212402460354853, "loss": 0.0541, "step": 70110 }, { "epoch": 0.45, "learning_rate": 0.00023211434324919158, "loss": 0.0588, "step": 70120 }, { "epoch": 0.45, "learning_rate": 0.00023210466189483466, "loss": 0.0555, "step": 70130 }, { "epoch": 0.45, "learning_rate": 0.00023209498054047774, "loss": 0.0523, "step": 70140 }, { "epoch": 0.45, "learning_rate": 0.00023208529918612077, "loss": 0.0496, "step": 70150 }, { "epoch": 0.45, "learning_rate": 0.00023207561783176385, "loss": 0.0699, "step": 70160 }, { "epoch": 0.45, "learning_rate": 0.00023206593647740693, "loss": 0.0536, "step": 70170 }, { "epoch": 0.45, "learning_rate": 0.00023205625512305, "loss": 0.0567, "step": 70180 }, { "epoch": 0.45, "learning_rate": 0.00023204657376869306, "loss": 0.0514, "step": 70190 }, { "epoch": 0.45, "learning_rate": 0.00023203689241433614, "loss": 0.0629, "step": 70200 }, { "epoch": 0.45, "learning_rate": 0.00023202721105997922, "loss": 0.0614, "step": 70210 }, { "epoch": 0.45, "learning_rate": 0.00023201752970562225, "loss": 0.0562, "step": 70220 }, { "epoch": 0.45, "learning_rate": 0.00023200784835126533, "loss": 0.0663, "step": 70230 }, { "epoch": 0.45, "learning_rate": 0.0002319981669969084, "loss": 0.0492, "step": 70240 }, { "epoch": 0.45, "learning_rate": 0.00023198848564255146, "loss": 0.0512, "step": 70250 }, { "epoch": 0.45, "learning_rate": 0.00023197880428819454, "loss": 0.0486, "step": 70260 }, { "epoch": 0.45, "learning_rate": 0.00023196912293383762, "loss": 0.0493, "step": 70270 }, { "epoch": 0.45, "learning_rate": 0.0002319594415794807, "loss": 0.0683, "step": 70280 }, { "epoch": 0.45, "learning_rate": 0.00023194976022512372, "loss": 0.0629, "step": 70290 }, { "epoch": 0.45, "learning_rate": 0.0002319400788707668, "loss": 0.06, "step": 70300 }, { "epoch": 0.45, "learning_rate": 0.00023193039751640988, "loss": 0.0525, "step": 70310 }, { "epoch": 0.45, "learning_rate": 0.00023192071616205293, "loss": 0.0519, "step": 70320 }, { "epoch": 0.45, "learning_rate": 0.00023191103480769601, "loss": 0.0614, "step": 70330 }, { "epoch": 0.45, "learning_rate": 0.0002319013534533391, "loss": 0.0594, "step": 70340 }, { "epoch": 0.45, "learning_rate": 0.00023189167209898217, "loss": 0.0639, "step": 70350 }, { "epoch": 0.45, "learning_rate": 0.0002318819907446252, "loss": 0.0596, "step": 70360 }, { "epoch": 0.45, "learning_rate": 0.00023187230939026828, "loss": 0.0493, "step": 70370 }, { "epoch": 0.45, "learning_rate": 0.00023186262803591136, "loss": 0.0553, "step": 70380 }, { "epoch": 0.45, "learning_rate": 0.0002318529466815544, "loss": 0.0621, "step": 70390 }, { "epoch": 0.45, "learning_rate": 0.0002318432653271975, "loss": 0.0534, "step": 70400 }, { "epoch": 0.45, "learning_rate": 0.00023183358397284057, "loss": 0.0555, "step": 70410 }, { "epoch": 0.45, "learning_rate": 0.00023182390261848362, "loss": 0.0483, "step": 70420 }, { "epoch": 0.45, "learning_rate": 0.00023181422126412668, "loss": 0.0574, "step": 70430 }, { "epoch": 0.45, "learning_rate": 0.00023180453990976976, "loss": 0.0544, "step": 70440 }, { "epoch": 0.45, "learning_rate": 0.0002317948585554128, "loss": 0.0555, "step": 70450 }, { "epoch": 0.45, "learning_rate": 0.0002317851772010559, "loss": 0.0575, "step": 70460 }, { "epoch": 0.45, "learning_rate": 0.00023177549584669897, "loss": 0.0509, "step": 70470 }, { "epoch": 0.45, "learning_rate": 0.00023176581449234205, "loss": 0.0494, "step": 70480 }, { "epoch": 0.45, "learning_rate": 0.0002317561331379851, "loss": 0.0535, "step": 70490 }, { "epoch": 0.46, "learning_rate": 0.00023174645178362815, "loss": 0.059, "step": 70500 }, { "epoch": 0.46, "learning_rate": 0.00023173677042927123, "loss": 0.0531, "step": 70510 }, { "epoch": 0.46, "learning_rate": 0.0002317270890749143, "loss": 0.0565, "step": 70520 }, { "epoch": 0.46, "learning_rate": 0.00023171740772055737, "loss": 0.0548, "step": 70530 }, { "epoch": 0.46, "learning_rate": 0.00023170772636620045, "loss": 0.0536, "step": 70540 }, { "epoch": 0.46, "learning_rate": 0.00023169804501184353, "loss": 0.0574, "step": 70550 }, { "epoch": 0.46, "learning_rate": 0.00023168836365748658, "loss": 0.062, "step": 70560 }, { "epoch": 0.46, "learning_rate": 0.00023167868230312963, "loss": 0.0518, "step": 70570 }, { "epoch": 0.46, "learning_rate": 0.0002316690009487727, "loss": 0.0581, "step": 70580 }, { "epoch": 0.46, "learning_rate": 0.00023165931959441576, "loss": 0.0618, "step": 70590 }, { "epoch": 0.46, "learning_rate": 0.00023164963824005884, "loss": 0.0569, "step": 70600 }, { "epoch": 0.46, "learning_rate": 0.00023163995688570192, "loss": 0.0578, "step": 70610 }, { "epoch": 0.46, "learning_rate": 0.00023163027553134498, "loss": 0.0548, "step": 70620 }, { "epoch": 0.46, "learning_rate": 0.00023162059417698806, "loss": 0.0598, "step": 70630 }, { "epoch": 0.46, "learning_rate": 0.0002316109128226311, "loss": 0.0625, "step": 70640 }, { "epoch": 0.46, "learning_rate": 0.00023160123146827416, "loss": 0.0569, "step": 70650 }, { "epoch": 0.46, "learning_rate": 0.00023159155011391724, "loss": 0.056, "step": 70660 }, { "epoch": 0.46, "learning_rate": 0.00023158186875956032, "loss": 0.0521, "step": 70670 }, { "epoch": 0.46, "learning_rate": 0.0002315721874052034, "loss": 0.0539, "step": 70680 }, { "epoch": 0.46, "learning_rate": 0.00023156250605084645, "loss": 0.0592, "step": 70690 }, { "epoch": 0.46, "learning_rate": 0.00023155282469648953, "loss": 0.0578, "step": 70700 }, { "epoch": 0.46, "learning_rate": 0.00023154314334213259, "loss": 0.0508, "step": 70710 }, { "epoch": 0.46, "learning_rate": 0.00023153346198777564, "loss": 0.0524, "step": 70720 }, { "epoch": 0.46, "learning_rate": 0.00023152378063341872, "loss": 0.0581, "step": 70730 }, { "epoch": 0.46, "learning_rate": 0.0002315140992790618, "loss": 0.0559, "step": 70740 }, { "epoch": 0.46, "learning_rate": 0.00023150441792470488, "loss": 0.0527, "step": 70750 }, { "epoch": 0.46, "learning_rate": 0.00023149473657034793, "loss": 0.0537, "step": 70760 }, { "epoch": 0.46, "learning_rate": 0.000231485055215991, "loss": 0.0579, "step": 70770 }, { "epoch": 0.46, "learning_rate": 0.00023147537386163406, "loss": 0.0567, "step": 70780 }, { "epoch": 0.46, "learning_rate": 0.00023146569250727712, "loss": 0.0496, "step": 70790 }, { "epoch": 0.46, "learning_rate": 0.0002314560111529202, "loss": 0.0587, "step": 70800 }, { "epoch": 0.46, "learning_rate": 0.00023144632979856328, "loss": 0.0591, "step": 70810 }, { "epoch": 0.46, "learning_rate": 0.00023143664844420633, "loss": 0.0609, "step": 70820 }, { "epoch": 0.46, "learning_rate": 0.0002314269670898494, "loss": 0.0551, "step": 70830 }, { "epoch": 0.46, "learning_rate": 0.0002314172857354925, "loss": 0.0588, "step": 70840 }, { "epoch": 0.46, "learning_rate": 0.0002314076043811355, "loss": 0.0639, "step": 70850 }, { "epoch": 0.46, "learning_rate": 0.0002313979230267786, "loss": 0.0553, "step": 70860 }, { "epoch": 0.46, "learning_rate": 0.00023138824167242167, "loss": 0.0557, "step": 70870 }, { "epoch": 0.46, "learning_rate": 0.00023137856031806475, "loss": 0.0518, "step": 70880 }, { "epoch": 0.46, "learning_rate": 0.0002313688789637078, "loss": 0.0498, "step": 70890 }, { "epoch": 0.46, "learning_rate": 0.00023135919760935089, "loss": 0.0614, "step": 70900 }, { "epoch": 0.46, "learning_rate": 0.00023134951625499396, "loss": 0.0505, "step": 70910 }, { "epoch": 0.46, "learning_rate": 0.000231339834900637, "loss": 0.052, "step": 70920 }, { "epoch": 0.46, "learning_rate": 0.00023133015354628007, "loss": 0.1046, "step": 70930 }, { "epoch": 0.46, "learning_rate": 0.00023132047219192315, "loss": 0.0848, "step": 70940 }, { "epoch": 0.46, "learning_rate": 0.00023131079083756623, "loss": 0.0537, "step": 70950 }, { "epoch": 0.46, "learning_rate": 0.00023130110948320928, "loss": 0.05, "step": 70960 }, { "epoch": 0.46, "learning_rate": 0.00023129142812885236, "loss": 0.0569, "step": 70970 }, { "epoch": 0.46, "learning_rate": 0.00023128174677449544, "loss": 0.0568, "step": 70980 }, { "epoch": 0.46, "learning_rate": 0.00023127206542013847, "loss": 0.0576, "step": 70990 }, { "epoch": 0.46, "learning_rate": 0.00023126238406578155, "loss": 0.0576, "step": 71000 }, { "epoch": 0.46, "eval_cer": 0.9200460964862728, "eval_loss": 0.03755395486950874, "eval_runtime": 119.9894, "eval_samples_per_second": 16.668, "eval_steps_per_second": 4.167, "step": 71000 }, { "epoch": 0.46, "learning_rate": 0.00023125270271142463, "loss": 0.0486, "step": 71010 }, { "epoch": 0.46, "learning_rate": 0.00023124302135706768, "loss": 0.0564, "step": 71020 }, { "epoch": 0.46, "learning_rate": 0.00023123334000271076, "loss": 0.0552, "step": 71030 }, { "epoch": 0.46, "learning_rate": 0.00023122365864835384, "loss": 0.0558, "step": 71040 }, { "epoch": 0.46, "learning_rate": 0.00023121397729399692, "loss": 0.057, "step": 71050 }, { "epoch": 0.46, "learning_rate": 0.00023120429593963994, "loss": 0.0617, "step": 71060 }, { "epoch": 0.46, "learning_rate": 0.00023119461458528302, "loss": 0.0605, "step": 71070 }, { "epoch": 0.46, "learning_rate": 0.0002311849332309261, "loss": 0.0556, "step": 71080 }, { "epoch": 0.46, "learning_rate": 0.00023117525187656916, "loss": 0.056, "step": 71090 }, { "epoch": 0.46, "learning_rate": 0.00023116557052221224, "loss": 0.0506, "step": 71100 }, { "epoch": 0.46, "learning_rate": 0.00023115588916785532, "loss": 0.0555, "step": 71110 }, { "epoch": 0.46, "learning_rate": 0.0002311462078134984, "loss": 0.0535, "step": 71120 }, { "epoch": 0.46, "learning_rate": 0.00023113652645914142, "loss": 0.0532, "step": 71130 }, { "epoch": 0.46, "learning_rate": 0.0002311268451047845, "loss": 0.0447, "step": 71140 }, { "epoch": 0.46, "learning_rate": 0.00023111716375042758, "loss": 0.0543, "step": 71150 }, { "epoch": 0.46, "learning_rate": 0.00023110748239607063, "loss": 0.0534, "step": 71160 }, { "epoch": 0.46, "learning_rate": 0.00023109780104171371, "loss": 0.0568, "step": 71170 }, { "epoch": 0.46, "learning_rate": 0.0002310881196873568, "loss": 0.0564, "step": 71180 }, { "epoch": 0.46, "learning_rate": 0.00023107843833299985, "loss": 0.0506, "step": 71190 }, { "epoch": 0.46, "learning_rate": 0.0002310687569786429, "loss": 0.0592, "step": 71200 }, { "epoch": 0.46, "learning_rate": 0.00023105907562428598, "loss": 0.0532, "step": 71210 }, { "epoch": 0.46, "learning_rate": 0.00023104939426992903, "loss": 0.0536, "step": 71220 }, { "epoch": 0.46, "learning_rate": 0.0002310397129155721, "loss": 0.0517, "step": 71230 }, { "epoch": 0.46, "learning_rate": 0.0002310300315612152, "loss": 0.0599, "step": 71240 }, { "epoch": 0.46, "learning_rate": 0.00023102035020685827, "loss": 0.0611, "step": 71250 }, { "epoch": 0.46, "learning_rate": 0.00023101066885250132, "loss": 0.0539, "step": 71260 }, { "epoch": 0.46, "learning_rate": 0.00023100098749814438, "loss": 0.0524, "step": 71270 }, { "epoch": 0.46, "learning_rate": 0.00023099130614378746, "loss": 0.0546, "step": 71280 }, { "epoch": 0.46, "learning_rate": 0.0002309816247894305, "loss": 0.0481, "step": 71290 }, { "epoch": 0.46, "learning_rate": 0.0002309719434350736, "loss": 0.0477, "step": 71300 }, { "epoch": 0.46, "learning_rate": 0.00023096226208071667, "loss": 0.0576, "step": 71310 }, { "epoch": 0.46, "learning_rate": 0.00023095258072635975, "loss": 0.0612, "step": 71320 }, { "epoch": 0.46, "learning_rate": 0.0002309428993720028, "loss": 0.0506, "step": 71330 }, { "epoch": 0.46, "learning_rate": 0.00023093321801764585, "loss": 0.0528, "step": 71340 }, { "epoch": 0.46, "learning_rate": 0.00023092353666328893, "loss": 0.0513, "step": 71350 }, { "epoch": 0.46, "learning_rate": 0.00023091385530893199, "loss": 0.0504, "step": 71360 }, { "epoch": 0.46, "learning_rate": 0.00023090417395457507, "loss": 0.0593, "step": 71370 }, { "epoch": 0.46, "learning_rate": 0.00023089449260021815, "loss": 0.058, "step": 71380 }, { "epoch": 0.46, "learning_rate": 0.00023088481124586123, "loss": 0.0527, "step": 71390 }, { "epoch": 0.46, "learning_rate": 0.00023087512989150428, "loss": 0.0545, "step": 71400 }, { "epoch": 0.46, "learning_rate": 0.00023086544853714733, "loss": 0.059, "step": 71410 }, { "epoch": 0.46, "learning_rate": 0.00023085576718279038, "loss": 0.0553, "step": 71420 }, { "epoch": 0.46, "learning_rate": 0.00023084608582843346, "loss": 0.0544, "step": 71430 }, { "epoch": 0.46, "learning_rate": 0.00023083640447407654, "loss": 0.0666, "step": 71440 }, { "epoch": 0.46, "learning_rate": 0.00023082672311971962, "loss": 0.0628, "step": 71450 }, { "epoch": 0.46, "learning_rate": 0.00023081704176536268, "loss": 0.0573, "step": 71460 }, { "epoch": 0.46, "learning_rate": 0.00023080736041100576, "loss": 0.0648, "step": 71470 }, { "epoch": 0.46, "learning_rate": 0.0002307976790566488, "loss": 0.0683, "step": 71480 }, { "epoch": 0.46, "learning_rate": 0.00023078799770229186, "loss": 0.0639, "step": 71490 }, { "epoch": 0.46, "learning_rate": 0.00023077831634793494, "loss": 0.0565, "step": 71500 }, { "epoch": 0.46, "learning_rate": 0.00023076863499357802, "loss": 0.0606, "step": 71510 }, { "epoch": 0.46, "learning_rate": 0.0002307589536392211, "loss": 0.0562, "step": 71520 }, { "epoch": 0.46, "learning_rate": 0.00023074927228486415, "loss": 0.0536, "step": 71530 }, { "epoch": 0.46, "learning_rate": 0.00023073959093050723, "loss": 0.0545, "step": 71540 }, { "epoch": 0.46, "learning_rate": 0.00023072990957615029, "loss": 0.0641, "step": 71550 }, { "epoch": 0.46, "learning_rate": 0.00023072022822179334, "loss": 0.0574, "step": 71560 }, { "epoch": 0.46, "learning_rate": 0.00023071054686743642, "loss": 0.0583, "step": 71570 }, { "epoch": 0.46, "learning_rate": 0.0002307008655130795, "loss": 0.052, "step": 71580 }, { "epoch": 0.46, "learning_rate": 0.00023069118415872258, "loss": 0.0501, "step": 71590 }, { "epoch": 0.46, "learning_rate": 0.00023068150280436563, "loss": 0.0633, "step": 71600 }, { "epoch": 0.46, "learning_rate": 0.0002306718214500087, "loss": 0.0538, "step": 71610 }, { "epoch": 0.46, "learning_rate": 0.00023066214009565174, "loss": 0.0529, "step": 71620 }, { "epoch": 0.46, "learning_rate": 0.00023065245874129482, "loss": 0.0532, "step": 71630 }, { "epoch": 0.46, "learning_rate": 0.0002306427773869379, "loss": 0.0538, "step": 71640 }, { "epoch": 0.46, "learning_rate": 0.00023063309603258097, "loss": 0.0625, "step": 71650 }, { "epoch": 0.46, "learning_rate": 0.00023062341467822403, "loss": 0.0589, "step": 71660 }, { "epoch": 0.46, "learning_rate": 0.0002306137333238671, "loss": 0.0583, "step": 71670 }, { "epoch": 0.46, "learning_rate": 0.0002306040519695102, "loss": 0.0579, "step": 71680 }, { "epoch": 0.46, "learning_rate": 0.0002305943706151532, "loss": 0.0568, "step": 71690 }, { "epoch": 0.46, "learning_rate": 0.0002305846892607963, "loss": 0.0635, "step": 71700 }, { "epoch": 0.46, "learning_rate": 0.00023057500790643937, "loss": 0.0594, "step": 71710 }, { "epoch": 0.46, "learning_rate": 0.00023056532655208245, "loss": 0.0556, "step": 71720 }, { "epoch": 0.46, "learning_rate": 0.0002305556451977255, "loss": 0.0531, "step": 71730 }, { "epoch": 0.46, "learning_rate": 0.00023054596384336858, "loss": 0.0506, "step": 71740 }, { "epoch": 0.46, "learning_rate": 0.00023053628248901166, "loss": 0.0668, "step": 71750 }, { "epoch": 0.46, "learning_rate": 0.0002305266011346547, "loss": 0.0539, "step": 71760 }, { "epoch": 0.46, "learning_rate": 0.00023051691978029777, "loss": 0.0624, "step": 71770 }, { "epoch": 0.46, "learning_rate": 0.00023050723842594085, "loss": 0.0541, "step": 71780 }, { "epoch": 0.46, "learning_rate": 0.00023049755707158393, "loss": 0.0552, "step": 71790 }, { "epoch": 0.46, "learning_rate": 0.00023048787571722698, "loss": 0.0531, "step": 71800 }, { "epoch": 0.46, "learning_rate": 0.00023047819436287006, "loss": 0.0567, "step": 71810 }, { "epoch": 0.46, "learning_rate": 0.00023046851300851314, "loss": 0.052, "step": 71820 }, { "epoch": 0.46, "learning_rate": 0.00023045883165415617, "loss": 0.0567, "step": 71830 }, { "epoch": 0.46, "learning_rate": 0.00023044915029979925, "loss": 0.0542, "step": 71840 }, { "epoch": 0.46, "learning_rate": 0.00023043946894544233, "loss": 0.0518, "step": 71850 }, { "epoch": 0.46, "learning_rate": 0.00023042978759108538, "loss": 0.0619, "step": 71860 }, { "epoch": 0.46, "learning_rate": 0.00023042010623672846, "loss": 0.0566, "step": 71870 }, { "epoch": 0.46, "learning_rate": 0.00023041042488237154, "loss": 0.0594, "step": 71880 }, { "epoch": 0.46, "learning_rate": 0.00023040074352801462, "loss": 0.0562, "step": 71890 }, { "epoch": 0.46, "learning_rate": 0.00023039106217365764, "loss": 0.0554, "step": 71900 }, { "epoch": 0.46, "learning_rate": 0.00023038138081930072, "loss": 0.058, "step": 71910 }, { "epoch": 0.46, "learning_rate": 0.0002303716994649438, "loss": 0.0522, "step": 71920 }, { "epoch": 0.46, "learning_rate": 0.00023036201811058686, "loss": 0.0547, "step": 71930 }, { "epoch": 0.46, "learning_rate": 0.00023035233675622994, "loss": 0.0472, "step": 71940 }, { "epoch": 0.46, "learning_rate": 0.00023034265540187302, "loss": 0.0513, "step": 71950 }, { "epoch": 0.46, "learning_rate": 0.0002303329740475161, "loss": 0.0505, "step": 71960 }, { "epoch": 0.46, "learning_rate": 0.00023032329269315912, "loss": 0.0546, "step": 71970 }, { "epoch": 0.46, "learning_rate": 0.0002303136113388022, "loss": 0.0683, "step": 71980 }, { "epoch": 0.46, "learning_rate": 0.00023030392998444528, "loss": 0.0547, "step": 71990 }, { "epoch": 0.46, "learning_rate": 0.00023029424863008833, "loss": 0.0529, "step": 72000 }, { "epoch": 0.46, "eval_cer": 0.9200415772229127, "eval_loss": 0.03651151433587074, "eval_runtime": 120.2459, "eval_samples_per_second": 16.633, "eval_steps_per_second": 4.158, "step": 72000 }, { "epoch": 0.46, "learning_rate": 0.00023028456727573141, "loss": 0.056, "step": 72010 }, { "epoch": 0.46, "learning_rate": 0.0002302748859213745, "loss": 0.062, "step": 72020 }, { "epoch": 0.46, "learning_rate": 0.00023026520456701755, "loss": 0.0505, "step": 72030 }, { "epoch": 0.46, "learning_rate": 0.0002302555232126606, "loss": 0.0575, "step": 72040 }, { "epoch": 0.47, "learning_rate": 0.00023024584185830368, "loss": 0.0597, "step": 72050 }, { "epoch": 0.47, "learning_rate": 0.00023023616050394673, "loss": 0.0579, "step": 72060 }, { "epoch": 0.47, "learning_rate": 0.0002302264791495898, "loss": 0.0499, "step": 72070 }, { "epoch": 0.47, "learning_rate": 0.0002302167977952329, "loss": 0.0533, "step": 72080 }, { "epoch": 0.47, "learning_rate": 0.00023020711644087597, "loss": 0.0536, "step": 72090 }, { "epoch": 0.47, "learning_rate": 0.00023019743508651902, "loss": 0.0576, "step": 72100 }, { "epoch": 0.47, "learning_rate": 0.00023018775373216208, "loss": 0.0574, "step": 72110 }, { "epoch": 0.47, "learning_rate": 0.00023017807237780516, "loss": 0.0566, "step": 72120 }, { "epoch": 0.47, "learning_rate": 0.0002301683910234482, "loss": 0.0541, "step": 72130 }, { "epoch": 0.47, "learning_rate": 0.0002301587096690913, "loss": 0.0581, "step": 72140 }, { "epoch": 0.47, "learning_rate": 0.00023014902831473437, "loss": 0.0504, "step": 72150 }, { "epoch": 0.47, "learning_rate": 0.00023013934696037745, "loss": 0.0574, "step": 72160 }, { "epoch": 0.47, "learning_rate": 0.0002301296656060205, "loss": 0.0599, "step": 72170 }, { "epoch": 0.47, "learning_rate": 0.00023011998425166355, "loss": 0.0518, "step": 72180 }, { "epoch": 0.47, "learning_rate": 0.00023011030289730663, "loss": 0.0582, "step": 72190 }, { "epoch": 0.47, "learning_rate": 0.00023010062154294969, "loss": 0.0464, "step": 72200 }, { "epoch": 0.47, "learning_rate": 0.00023009094018859277, "loss": 0.0564, "step": 72210 }, { "epoch": 0.47, "learning_rate": 0.00023008125883423585, "loss": 0.0642, "step": 72220 }, { "epoch": 0.47, "learning_rate": 0.0002300715774798789, "loss": 0.0532, "step": 72230 }, { "epoch": 0.47, "learning_rate": 0.00023006189612552198, "loss": 0.0499, "step": 72240 }, { "epoch": 0.47, "learning_rate": 0.00023005221477116503, "loss": 0.0542, "step": 72250 }, { "epoch": 0.47, "learning_rate": 0.00023004253341680808, "loss": 0.0539, "step": 72260 }, { "epoch": 0.47, "learning_rate": 0.00023003285206245116, "loss": 0.0526, "step": 72270 }, { "epoch": 0.47, "learning_rate": 0.00023002317070809424, "loss": 0.0582, "step": 72280 }, { "epoch": 0.47, "learning_rate": 0.00023001348935373732, "loss": 0.0513, "step": 72290 }, { "epoch": 0.47, "learning_rate": 0.00023000380799938038, "loss": 0.0534, "step": 72300 }, { "epoch": 0.47, "learning_rate": 0.00022999412664502343, "loss": 0.0594, "step": 72310 }, { "epoch": 0.47, "learning_rate": 0.0002299844452906665, "loss": 0.0601, "step": 72320 }, { "epoch": 0.47, "learning_rate": 0.00022997476393630956, "loss": 0.0608, "step": 72330 }, { "epoch": 0.47, "learning_rate": 0.00022996508258195264, "loss": 0.0512, "step": 72340 }, { "epoch": 0.47, "learning_rate": 0.00022995540122759572, "loss": 0.0533, "step": 72350 }, { "epoch": 0.47, "learning_rate": 0.0002299457198732388, "loss": 0.0526, "step": 72360 }, { "epoch": 0.47, "learning_rate": 0.00022993603851888185, "loss": 0.0543, "step": 72370 }, { "epoch": 0.47, "learning_rate": 0.0002299263571645249, "loss": 0.0566, "step": 72380 }, { "epoch": 0.47, "learning_rate": 0.00022991667581016799, "loss": 0.057, "step": 72390 }, { "epoch": 0.47, "learning_rate": 0.00022990699445581104, "loss": 0.0539, "step": 72400 }, { "epoch": 0.47, "learning_rate": 0.00022989731310145412, "loss": 0.0599, "step": 72410 }, { "epoch": 0.47, "learning_rate": 0.0002298876317470972, "loss": 0.0522, "step": 72420 }, { "epoch": 0.47, "learning_rate": 0.00022987795039274025, "loss": 0.0536, "step": 72430 }, { "epoch": 0.47, "learning_rate": 0.00022986826903838333, "loss": 0.0568, "step": 72440 }, { "epoch": 0.47, "learning_rate": 0.00022985858768402638, "loss": 0.0569, "step": 72450 }, { "epoch": 0.47, "learning_rate": 0.00022984890632966944, "loss": 0.0658, "step": 72460 }, { "epoch": 0.47, "learning_rate": 0.00022983922497531251, "loss": 0.0612, "step": 72470 }, { "epoch": 0.47, "learning_rate": 0.0002298295436209556, "loss": 0.0571, "step": 72480 }, { "epoch": 0.47, "learning_rate": 0.00022981986226659867, "loss": 0.0618, "step": 72490 }, { "epoch": 0.47, "learning_rate": 0.00022981018091224173, "loss": 0.06, "step": 72500 }, { "epoch": 0.47, "learning_rate": 0.0002298004995578848, "loss": 0.0605, "step": 72510 }, { "epoch": 0.47, "learning_rate": 0.00022979081820352786, "loss": 0.065, "step": 72520 }, { "epoch": 0.47, "learning_rate": 0.0002297811368491709, "loss": 0.0487, "step": 72530 }, { "epoch": 0.47, "learning_rate": 0.000229771455494814, "loss": 0.0484, "step": 72540 }, { "epoch": 0.47, "learning_rate": 0.00022976177414045707, "loss": 0.0555, "step": 72550 }, { "epoch": 0.47, "learning_rate": 0.00022975209278610015, "loss": 0.0566, "step": 72560 }, { "epoch": 0.47, "learning_rate": 0.0002297424114317432, "loss": 0.0582, "step": 72570 }, { "epoch": 0.47, "learning_rate": 0.00022973273007738628, "loss": 0.0624, "step": 72580 }, { "epoch": 0.47, "learning_rate": 0.00022972304872302934, "loss": 0.0596, "step": 72590 }, { "epoch": 0.47, "learning_rate": 0.0002297133673686724, "loss": 0.0572, "step": 72600 }, { "epoch": 0.47, "learning_rate": 0.00022970368601431547, "loss": 0.0622, "step": 72610 }, { "epoch": 0.47, "learning_rate": 0.00022969400465995855, "loss": 0.0559, "step": 72620 }, { "epoch": 0.47, "learning_rate": 0.0002296843233056016, "loss": 0.0525, "step": 72630 }, { "epoch": 0.47, "learning_rate": 0.00022967464195124468, "loss": 0.0496, "step": 72640 }, { "epoch": 0.47, "learning_rate": 0.00022966496059688776, "loss": 0.0578, "step": 72650 }, { "epoch": 0.47, "learning_rate": 0.0002296552792425308, "loss": 0.0526, "step": 72660 }, { "epoch": 0.47, "learning_rate": 0.00022964559788817387, "loss": 0.0591, "step": 72670 }, { "epoch": 0.47, "learning_rate": 0.00022963591653381695, "loss": 0.0564, "step": 72680 }, { "epoch": 0.47, "learning_rate": 0.00022962623517946003, "loss": 0.0615, "step": 72690 }, { "epoch": 0.47, "learning_rate": 0.00022961655382510308, "loss": 0.0569, "step": 72700 }, { "epoch": 0.47, "learning_rate": 0.00022960687247074616, "loss": 0.0525, "step": 72710 }, { "epoch": 0.47, "learning_rate": 0.00022959719111638924, "loss": 0.0549, "step": 72720 }, { "epoch": 0.47, "learning_rate": 0.00022958750976203226, "loss": 0.0541, "step": 72730 }, { "epoch": 0.47, "learning_rate": 0.00022957782840767534, "loss": 0.0602, "step": 72740 }, { "epoch": 0.47, "learning_rate": 0.00022956814705331842, "loss": 0.0546, "step": 72750 }, { "epoch": 0.47, "learning_rate": 0.0002295584656989615, "loss": 0.0625, "step": 72760 }, { "epoch": 0.47, "learning_rate": 0.00022954878434460456, "loss": 0.0555, "step": 72770 }, { "epoch": 0.47, "learning_rate": 0.00022953910299024764, "loss": 0.0528, "step": 72780 }, { "epoch": 0.47, "learning_rate": 0.00022952942163589072, "loss": 0.0603, "step": 72790 }, { "epoch": 0.47, "learning_rate": 0.00022951974028153374, "loss": 0.0531, "step": 72800 }, { "epoch": 0.47, "learning_rate": 0.00022951005892717682, "loss": 0.0485, "step": 72810 }, { "epoch": 0.47, "learning_rate": 0.0002295003775728199, "loss": 0.0647, "step": 72820 }, { "epoch": 0.47, "learning_rate": 0.00022949069621846295, "loss": 0.0544, "step": 72830 }, { "epoch": 0.47, "learning_rate": 0.00022948101486410603, "loss": 0.0639, "step": 72840 }, { "epoch": 0.47, "learning_rate": 0.0002294713335097491, "loss": 0.0526, "step": 72850 }, { "epoch": 0.47, "learning_rate": 0.0002294616521553922, "loss": 0.0506, "step": 72860 }, { "epoch": 0.47, "learning_rate": 0.00022945197080103522, "loss": 0.0544, "step": 72870 }, { "epoch": 0.47, "learning_rate": 0.0002294422894466783, "loss": 0.0527, "step": 72880 }, { "epoch": 0.47, "learning_rate": 0.00022943260809232138, "loss": 0.0586, "step": 72890 }, { "epoch": 0.47, "learning_rate": 0.00022942292673796443, "loss": 0.0535, "step": 72900 }, { "epoch": 0.47, "learning_rate": 0.0002294132453836075, "loss": 0.0593, "step": 72910 }, { "epoch": 0.47, "learning_rate": 0.0002294035640292506, "loss": 0.0504, "step": 72920 }, { "epoch": 0.47, "learning_rate": 0.00022939388267489367, "loss": 0.0581, "step": 72930 }, { "epoch": 0.47, "learning_rate": 0.0002293842013205367, "loss": 0.0551, "step": 72940 }, { "epoch": 0.47, "learning_rate": 0.00022937451996617978, "loss": 0.0517, "step": 72950 }, { "epoch": 0.47, "learning_rate": 0.00022936483861182286, "loss": 0.0536, "step": 72960 }, { "epoch": 0.47, "learning_rate": 0.0002293551572574659, "loss": 0.0549, "step": 72970 }, { "epoch": 0.47, "learning_rate": 0.000229345475903109, "loss": 0.0565, "step": 72980 }, { "epoch": 0.47, "learning_rate": 0.00022933579454875207, "loss": 0.0582, "step": 72990 }, { "epoch": 0.47, "learning_rate": 0.00022932611319439512, "loss": 0.0504, "step": 73000 }, { "epoch": 0.47, "eval_cer": 0.9200831544458253, "eval_loss": 0.03714871034026146, "eval_runtime": 120.0036, "eval_samples_per_second": 16.666, "eval_steps_per_second": 4.167, "step": 73000 }, { "epoch": 0.47, "learning_rate": 0.00022931643184003817, "loss": 0.0522, "step": 73010 }, { "epoch": 0.47, "learning_rate": 0.00022930675048568125, "loss": 0.047, "step": 73020 }, { "epoch": 0.47, "learning_rate": 0.0002292970691313243, "loss": 0.069, "step": 73030 }, { "epoch": 0.47, "learning_rate": 0.00022928738777696739, "loss": 0.0583, "step": 73040 }, { "epoch": 0.47, "learning_rate": 0.00022927770642261047, "loss": 0.0568, "step": 73050 }, { "epoch": 0.47, "learning_rate": 0.00022926802506825355, "loss": 0.0563, "step": 73060 }, { "epoch": 0.47, "learning_rate": 0.0002292583437138966, "loss": 0.051, "step": 73070 }, { "epoch": 0.47, "learning_rate": 0.00022924866235953965, "loss": 0.057, "step": 73080 }, { "epoch": 0.47, "learning_rate": 0.00022923898100518273, "loss": 0.0505, "step": 73090 }, { "epoch": 0.47, "learning_rate": 0.00022922929965082578, "loss": 0.0515, "step": 73100 }, { "epoch": 0.47, "learning_rate": 0.00022921961829646886, "loss": 0.0597, "step": 73110 }, { "epoch": 0.47, "learning_rate": 0.00022920993694211194, "loss": 0.0588, "step": 73120 }, { "epoch": 0.47, "learning_rate": 0.00022920025558775502, "loss": 0.0573, "step": 73130 }, { "epoch": 0.47, "learning_rate": 0.00022919057423339807, "loss": 0.0538, "step": 73140 }, { "epoch": 0.47, "learning_rate": 0.00022918089287904113, "loss": 0.0539, "step": 73150 }, { "epoch": 0.47, "learning_rate": 0.0002291712115246842, "loss": 0.0555, "step": 73160 }, { "epoch": 0.47, "learning_rate": 0.00022916153017032726, "loss": 0.0577, "step": 73170 }, { "epoch": 0.47, "learning_rate": 0.00022915184881597034, "loss": 0.0501, "step": 73180 }, { "epoch": 0.47, "learning_rate": 0.00022914216746161342, "loss": 0.057, "step": 73190 }, { "epoch": 0.47, "learning_rate": 0.00022913248610725647, "loss": 0.0595, "step": 73200 }, { "epoch": 0.47, "learning_rate": 0.00022912280475289955, "loss": 0.0502, "step": 73210 }, { "epoch": 0.47, "learning_rate": 0.0002291131233985426, "loss": 0.0549, "step": 73220 }, { "epoch": 0.47, "learning_rate": 0.00022910344204418566, "loss": 0.0526, "step": 73230 }, { "epoch": 0.47, "learning_rate": 0.00022909376068982874, "loss": 0.0544, "step": 73240 }, { "epoch": 0.47, "learning_rate": 0.00022908407933547182, "loss": 0.0554, "step": 73250 }, { "epoch": 0.47, "learning_rate": 0.0002290743979811149, "loss": 0.061, "step": 73260 }, { "epoch": 0.47, "learning_rate": 0.00022906471662675795, "loss": 0.0521, "step": 73270 }, { "epoch": 0.47, "learning_rate": 0.00022905503527240103, "loss": 0.0577, "step": 73280 }, { "epoch": 0.47, "learning_rate": 0.00022904535391804408, "loss": 0.0544, "step": 73290 }, { "epoch": 0.47, "learning_rate": 0.00022903567256368713, "loss": 0.0482, "step": 73300 }, { "epoch": 0.47, "learning_rate": 0.00022902599120933021, "loss": 0.0535, "step": 73310 }, { "epoch": 0.47, "learning_rate": 0.0002290163098549733, "loss": 0.0539, "step": 73320 }, { "epoch": 0.47, "learning_rate": 0.00022900662850061637, "loss": 0.0538, "step": 73330 }, { "epoch": 0.47, "learning_rate": 0.00022899694714625943, "loss": 0.0542, "step": 73340 }, { "epoch": 0.47, "learning_rate": 0.0002289872657919025, "loss": 0.0544, "step": 73350 }, { "epoch": 0.47, "learning_rate": 0.00022897758443754556, "loss": 0.0509, "step": 73360 }, { "epoch": 0.47, "learning_rate": 0.0002289679030831886, "loss": 0.0563, "step": 73370 }, { "epoch": 0.47, "learning_rate": 0.0002289582217288317, "loss": 0.0514, "step": 73380 }, { "epoch": 0.47, "learning_rate": 0.00022894854037447477, "loss": 0.058, "step": 73390 }, { "epoch": 0.47, "learning_rate": 0.00022893885902011782, "loss": 0.0521, "step": 73400 }, { "epoch": 0.47, "learning_rate": 0.0002289291776657609, "loss": 0.0498, "step": 73410 }, { "epoch": 0.47, "learning_rate": 0.00022891949631140398, "loss": 0.0536, "step": 73420 }, { "epoch": 0.47, "learning_rate": 0.000228909814957047, "loss": 0.0515, "step": 73430 }, { "epoch": 0.47, "learning_rate": 0.0002289001336026901, "loss": 0.0557, "step": 73440 }, { "epoch": 0.47, "learning_rate": 0.00022889045224833317, "loss": 0.0576, "step": 73450 }, { "epoch": 0.47, "learning_rate": 0.00022888077089397625, "loss": 0.0558, "step": 73460 }, { "epoch": 0.47, "learning_rate": 0.0002288710895396193, "loss": 0.058, "step": 73470 }, { "epoch": 0.47, "learning_rate": 0.00022886140818526238, "loss": 0.0501, "step": 73480 }, { "epoch": 0.47, "learning_rate": 0.00022885172683090546, "loss": 0.0569, "step": 73490 }, { "epoch": 0.47, "learning_rate": 0.0002288420454765485, "loss": 0.0584, "step": 73500 }, { "epoch": 0.47, "learning_rate": 0.00022883236412219157, "loss": 0.0484, "step": 73510 }, { "epoch": 0.47, "learning_rate": 0.00022882268276783465, "loss": 0.0548, "step": 73520 }, { "epoch": 0.47, "learning_rate": 0.00022881300141347773, "loss": 0.0526, "step": 73530 }, { "epoch": 0.47, "learning_rate": 0.00022880332005912078, "loss": 0.0553, "step": 73540 }, { "epoch": 0.47, "learning_rate": 0.00022879363870476386, "loss": 0.0583, "step": 73550 }, { "epoch": 0.47, "learning_rate": 0.00022878395735040694, "loss": 0.0491, "step": 73560 }, { "epoch": 0.47, "learning_rate": 0.00022877427599604996, "loss": 0.0562, "step": 73570 }, { "epoch": 0.47, "learning_rate": 0.00022876459464169304, "loss": 0.0551, "step": 73580 }, { "epoch": 0.47, "learning_rate": 0.00022875491328733612, "loss": 0.0545, "step": 73590 }, { "epoch": 0.48, "learning_rate": 0.00022874523193297918, "loss": 0.048, "step": 73600 }, { "epoch": 0.48, "learning_rate": 0.00022873555057862226, "loss": 0.057, "step": 73610 }, { "epoch": 0.48, "learning_rate": 0.00022872586922426534, "loss": 0.0571, "step": 73620 }, { "epoch": 0.48, "learning_rate": 0.00022871618786990842, "loss": 0.0631, "step": 73630 }, { "epoch": 0.48, "learning_rate": 0.00022870650651555144, "loss": 0.0541, "step": 73640 }, { "epoch": 0.48, "learning_rate": 0.00022869682516119452, "loss": 0.0573, "step": 73650 }, { "epoch": 0.48, "learning_rate": 0.0002286871438068376, "loss": 0.0491, "step": 73660 }, { "epoch": 0.48, "learning_rate": 0.00022867746245248065, "loss": 0.0582, "step": 73670 }, { "epoch": 0.48, "learning_rate": 0.00022866778109812373, "loss": 0.063, "step": 73680 }, { "epoch": 0.48, "learning_rate": 0.0002286580997437668, "loss": 0.0554, "step": 73690 }, { "epoch": 0.48, "learning_rate": 0.0002286484183894099, "loss": 0.0561, "step": 73700 }, { "epoch": 0.48, "learning_rate": 0.00022863873703505292, "loss": 0.0544, "step": 73710 }, { "epoch": 0.48, "learning_rate": 0.000228629055680696, "loss": 0.054, "step": 73720 }, { "epoch": 0.48, "learning_rate": 0.00022861937432633908, "loss": 0.0543, "step": 73730 }, { "epoch": 0.48, "learning_rate": 0.00022860969297198213, "loss": 0.0499, "step": 73740 }, { "epoch": 0.48, "learning_rate": 0.0002286000116176252, "loss": 0.0584, "step": 73750 }, { "epoch": 0.48, "learning_rate": 0.0002285903302632683, "loss": 0.0535, "step": 73760 }, { "epoch": 0.48, "learning_rate": 0.00022858064890891137, "loss": 0.0472, "step": 73770 }, { "epoch": 0.48, "learning_rate": 0.0002285709675545544, "loss": 0.0563, "step": 73780 }, { "epoch": 0.48, "learning_rate": 0.00022856128620019748, "loss": 0.0524, "step": 73790 }, { "epoch": 0.48, "learning_rate": 0.00022855160484584053, "loss": 0.0512, "step": 73800 }, { "epoch": 0.48, "learning_rate": 0.0002285419234914836, "loss": 0.0581, "step": 73810 }, { "epoch": 0.48, "learning_rate": 0.0002285322421371267, "loss": 0.051, "step": 73820 }, { "epoch": 0.48, "learning_rate": 0.00022852256078276977, "loss": 0.057, "step": 73830 }, { "epoch": 0.48, "learning_rate": 0.00022851287942841282, "loss": 0.0451, "step": 73840 }, { "epoch": 0.48, "learning_rate": 0.00022850319807405587, "loss": 0.0518, "step": 73850 }, { "epoch": 0.48, "learning_rate": 0.00022849351671969895, "loss": 0.0568, "step": 73860 }, { "epoch": 0.48, "learning_rate": 0.000228483835365342, "loss": 0.0531, "step": 73870 }, { "epoch": 0.48, "learning_rate": 0.00022847415401098509, "loss": 0.0546, "step": 73880 }, { "epoch": 0.48, "learning_rate": 0.00022846447265662816, "loss": 0.0586, "step": 73890 }, { "epoch": 0.48, "learning_rate": 0.00022845479130227124, "loss": 0.0475, "step": 73900 }, { "epoch": 0.48, "learning_rate": 0.0002284451099479143, "loss": 0.0598, "step": 73910 }, { "epoch": 0.48, "learning_rate": 0.00022843542859355735, "loss": 0.0513, "step": 73920 }, { "epoch": 0.48, "learning_rate": 0.00022842574723920043, "loss": 0.0524, "step": 73930 }, { "epoch": 0.48, "learning_rate": 0.00022841606588484348, "loss": 0.0587, "step": 73940 }, { "epoch": 0.48, "learning_rate": 0.00022840638453048656, "loss": 0.0553, "step": 73950 }, { "epoch": 0.48, "learning_rate": 0.00022839670317612964, "loss": 0.0563, "step": 73960 }, { "epoch": 0.48, "learning_rate": 0.00022838702182177272, "loss": 0.0698, "step": 73970 }, { "epoch": 0.48, "learning_rate": 0.00022837734046741577, "loss": 0.0551, "step": 73980 }, { "epoch": 0.48, "learning_rate": 0.00022836765911305883, "loss": 0.0566, "step": 73990 }, { "epoch": 0.48, "learning_rate": 0.00022835797775870188, "loss": 0.0499, "step": 74000 }, { "epoch": 0.48, "eval_cer": 0.9200479041916167, "eval_loss": 0.037295423448085785, "eval_runtime": 120.0199, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 74000 }, { "epoch": 0.48, "learning_rate": 0.00022834829640434496, "loss": 0.056, "step": 74010 }, { "epoch": 0.48, "learning_rate": 0.00022833861504998804, "loss": 0.0527, "step": 74020 }, { "epoch": 0.48, "learning_rate": 0.00022832893369563112, "loss": 0.0605, "step": 74030 }, { "epoch": 0.48, "learning_rate": 0.00022831925234127417, "loss": 0.0535, "step": 74040 }, { "epoch": 0.48, "learning_rate": 0.00022830957098691725, "loss": 0.0577, "step": 74050 }, { "epoch": 0.48, "learning_rate": 0.0002282998896325603, "loss": 0.0545, "step": 74060 }, { "epoch": 0.48, "learning_rate": 0.00022829020827820336, "loss": 0.0498, "step": 74070 }, { "epoch": 0.48, "learning_rate": 0.00022828052692384644, "loss": 0.0526, "step": 74080 }, { "epoch": 0.48, "learning_rate": 0.00022827084556948952, "loss": 0.0513, "step": 74090 }, { "epoch": 0.48, "learning_rate": 0.0002282611642151326, "loss": 0.0534, "step": 74100 }, { "epoch": 0.48, "learning_rate": 0.00022825148286077565, "loss": 0.0566, "step": 74110 }, { "epoch": 0.48, "learning_rate": 0.00022824180150641873, "loss": 0.0504, "step": 74120 }, { "epoch": 0.48, "learning_rate": 0.00022823212015206178, "loss": 0.0545, "step": 74130 }, { "epoch": 0.48, "learning_rate": 0.00022822243879770483, "loss": 0.0491, "step": 74140 }, { "epoch": 0.48, "learning_rate": 0.00022821275744334791, "loss": 0.0527, "step": 74150 }, { "epoch": 0.48, "learning_rate": 0.000228203076088991, "loss": 0.0575, "step": 74160 }, { "epoch": 0.48, "learning_rate": 0.00022819339473463407, "loss": 0.0536, "step": 74170 }, { "epoch": 0.48, "learning_rate": 0.00022818371338027713, "loss": 0.0563, "step": 74180 }, { "epoch": 0.48, "learning_rate": 0.0002281740320259202, "loss": 0.0539, "step": 74190 }, { "epoch": 0.48, "learning_rate": 0.00022816435067156323, "loss": 0.0556, "step": 74200 }, { "epoch": 0.48, "learning_rate": 0.0002281546693172063, "loss": 0.0612, "step": 74210 }, { "epoch": 0.48, "learning_rate": 0.0002281449879628494, "loss": 0.0517, "step": 74220 }, { "epoch": 0.48, "learning_rate": 0.00022813530660849247, "loss": 0.0478, "step": 74230 }, { "epoch": 0.48, "learning_rate": 0.00022812562525413552, "loss": 0.0531, "step": 74240 }, { "epoch": 0.48, "learning_rate": 0.0002281159438997786, "loss": 0.0596, "step": 74250 }, { "epoch": 0.48, "learning_rate": 0.00022810626254542168, "loss": 0.0456, "step": 74260 }, { "epoch": 0.48, "learning_rate": 0.0002280965811910647, "loss": 0.0545, "step": 74270 }, { "epoch": 0.48, "learning_rate": 0.0002280868998367078, "loss": 0.049, "step": 74280 }, { "epoch": 0.48, "learning_rate": 0.00022807721848235087, "loss": 0.0517, "step": 74290 }, { "epoch": 0.48, "learning_rate": 0.00022806753712799395, "loss": 0.0546, "step": 74300 }, { "epoch": 0.48, "learning_rate": 0.000228057855773637, "loss": 0.049, "step": 74310 }, { "epoch": 0.48, "learning_rate": 0.00022804817441928008, "loss": 0.051, "step": 74320 }, { "epoch": 0.48, "learning_rate": 0.00022803849306492316, "loss": 0.0512, "step": 74330 }, { "epoch": 0.48, "learning_rate": 0.00022802881171056619, "loss": 0.0483, "step": 74340 }, { "epoch": 0.48, "learning_rate": 0.00022801913035620927, "loss": 0.0562, "step": 74350 }, { "epoch": 0.48, "learning_rate": 0.00022800944900185235, "loss": 0.0539, "step": 74360 }, { "epoch": 0.48, "learning_rate": 0.00022799976764749543, "loss": 0.0572, "step": 74370 }, { "epoch": 0.48, "learning_rate": 0.00022799008629313848, "loss": 0.0554, "step": 74380 }, { "epoch": 0.48, "learning_rate": 0.00022798040493878156, "loss": 0.0524, "step": 74390 }, { "epoch": 0.48, "learning_rate": 0.00022797072358442464, "loss": 0.052, "step": 74400 }, { "epoch": 0.48, "learning_rate": 0.00022796104223006766, "loss": 0.0541, "step": 74410 }, { "epoch": 0.48, "learning_rate": 0.00022795136087571074, "loss": 0.0567, "step": 74420 }, { "epoch": 0.48, "learning_rate": 0.00022794167952135382, "loss": 0.06, "step": 74430 }, { "epoch": 0.48, "learning_rate": 0.00022793199816699688, "loss": 0.0455, "step": 74440 }, { "epoch": 0.48, "learning_rate": 0.00022792231681263996, "loss": 0.0548, "step": 74450 }, { "epoch": 0.48, "learning_rate": 0.00022791263545828304, "loss": 0.0501, "step": 74460 }, { "epoch": 0.48, "learning_rate": 0.00022790295410392612, "loss": 0.053, "step": 74470 }, { "epoch": 0.48, "learning_rate": 0.00022789327274956914, "loss": 0.0502, "step": 74480 }, { "epoch": 0.48, "learning_rate": 0.00022788359139521222, "loss": 0.0553, "step": 74490 }, { "epoch": 0.48, "learning_rate": 0.0002278739100408553, "loss": 0.0483, "step": 74500 }, { "epoch": 0.48, "learning_rate": 0.00022786422868649835, "loss": 0.0596, "step": 74510 }, { "epoch": 0.48, "learning_rate": 0.00022785454733214143, "loss": 0.0538, "step": 74520 }, { "epoch": 0.48, "learning_rate": 0.0002278448659777845, "loss": 0.0546, "step": 74530 }, { "epoch": 0.48, "learning_rate": 0.0002278351846234276, "loss": 0.061, "step": 74540 }, { "epoch": 0.48, "learning_rate": 0.00022782550326907062, "loss": 0.0527, "step": 74550 }, { "epoch": 0.48, "learning_rate": 0.0002278158219147137, "loss": 0.0546, "step": 74560 }, { "epoch": 0.48, "learning_rate": 0.00022780614056035678, "loss": 0.0523, "step": 74570 }, { "epoch": 0.48, "learning_rate": 0.00022779645920599983, "loss": 0.055, "step": 74580 }, { "epoch": 0.48, "learning_rate": 0.0002277867778516429, "loss": 0.0479, "step": 74590 }, { "epoch": 0.48, "learning_rate": 0.000227777096497286, "loss": 0.0514, "step": 74600 }, { "epoch": 0.48, "learning_rate": 0.00022776741514292904, "loss": 0.0563, "step": 74610 }, { "epoch": 0.48, "learning_rate": 0.0002277577337885721, "loss": 0.0494, "step": 74620 }, { "epoch": 0.48, "learning_rate": 0.00022774805243421517, "loss": 0.0484, "step": 74630 }, { "epoch": 0.48, "learning_rate": 0.00022773837107985823, "loss": 0.0515, "step": 74640 }, { "epoch": 0.48, "learning_rate": 0.0002277286897255013, "loss": 0.0615, "step": 74650 }, { "epoch": 0.48, "learning_rate": 0.0002277190083711444, "loss": 0.0649, "step": 74660 }, { "epoch": 0.48, "learning_rate": 0.00022770932701678747, "loss": 0.0555, "step": 74670 }, { "epoch": 0.48, "learning_rate": 0.00022769964566243052, "loss": 0.0526, "step": 74680 }, { "epoch": 0.48, "learning_rate": 0.00022768996430807357, "loss": 0.0501, "step": 74690 }, { "epoch": 0.48, "learning_rate": 0.00022768028295371665, "loss": 0.0533, "step": 74700 }, { "epoch": 0.48, "learning_rate": 0.0002276706015993597, "loss": 0.0597, "step": 74710 }, { "epoch": 0.48, "learning_rate": 0.00022766092024500278, "loss": 0.0533, "step": 74720 }, { "epoch": 0.48, "learning_rate": 0.00022765123889064586, "loss": 0.0506, "step": 74730 }, { "epoch": 0.48, "learning_rate": 0.00022764155753628894, "loss": 0.0579, "step": 74740 }, { "epoch": 0.48, "learning_rate": 0.000227631876181932, "loss": 0.0513, "step": 74750 }, { "epoch": 0.48, "learning_rate": 0.00022762219482757505, "loss": 0.0523, "step": 74760 }, { "epoch": 0.48, "learning_rate": 0.00022761251347321813, "loss": 0.0526, "step": 74770 }, { "epoch": 0.48, "learning_rate": 0.00022760283211886118, "loss": 0.0562, "step": 74780 }, { "epoch": 0.48, "learning_rate": 0.00022759315076450426, "loss": 0.0546, "step": 74790 }, { "epoch": 0.48, "learning_rate": 0.00022758346941014734, "loss": 0.0556, "step": 74800 }, { "epoch": 0.48, "learning_rate": 0.0002275737880557904, "loss": 0.0593, "step": 74810 }, { "epoch": 0.48, "learning_rate": 0.00022756410670143347, "loss": 0.0618, "step": 74820 }, { "epoch": 0.48, "learning_rate": 0.00022755442534707653, "loss": 0.0563, "step": 74830 }, { "epoch": 0.48, "learning_rate": 0.00022754474399271958, "loss": 0.0459, "step": 74840 }, { "epoch": 0.48, "learning_rate": 0.00022753506263836266, "loss": 0.0519, "step": 74850 }, { "epoch": 0.48, "learning_rate": 0.00022752538128400574, "loss": 0.0538, "step": 74860 }, { "epoch": 0.48, "learning_rate": 0.00022751569992964882, "loss": 0.056, "step": 74870 }, { "epoch": 0.48, "learning_rate": 0.00022750601857529187, "loss": 0.0611, "step": 74880 }, { "epoch": 0.48, "learning_rate": 0.00022749633722093495, "loss": 0.0579, "step": 74890 }, { "epoch": 0.48, "learning_rate": 0.000227486655866578, "loss": 0.0526, "step": 74900 }, { "epoch": 0.48, "learning_rate": 0.00022747697451222106, "loss": 0.0614, "step": 74910 }, { "epoch": 0.48, "learning_rate": 0.00022746729315786414, "loss": 0.0516, "step": 74920 }, { "epoch": 0.48, "learning_rate": 0.00022745761180350722, "loss": 0.0579, "step": 74930 }, { "epoch": 0.48, "learning_rate": 0.0002274479304491503, "loss": 0.0581, "step": 74940 }, { "epoch": 0.48, "learning_rate": 0.00022743824909479335, "loss": 0.055, "step": 74950 }, { "epoch": 0.48, "learning_rate": 0.00022742856774043643, "loss": 0.0524, "step": 74960 }, { "epoch": 0.48, "learning_rate": 0.00022741888638607948, "loss": 0.0572, "step": 74970 }, { "epoch": 0.48, "learning_rate": 0.00022740920503172253, "loss": 0.0502, "step": 74980 }, { "epoch": 0.48, "learning_rate": 0.00022739952367736561, "loss": 0.0566, "step": 74990 }, { "epoch": 0.48, "learning_rate": 0.0002273898423230087, "loss": 0.0578, "step": 75000 }, { "epoch": 0.48, "eval_cer": 0.9199900576206078, "eval_loss": 0.03665885701775551, "eval_runtime": 120.0194, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 75000 }, { "epoch": 0.48, "learning_rate": 0.00022738016096865175, "loss": 0.054, "step": 75010 }, { "epoch": 0.48, "learning_rate": 0.00022737047961429483, "loss": 0.0585, "step": 75020 }, { "epoch": 0.48, "learning_rate": 0.0002273607982599379, "loss": 0.0547, "step": 75030 }, { "epoch": 0.48, "learning_rate": 0.00022735111690558093, "loss": 0.0516, "step": 75040 }, { "epoch": 0.48, "learning_rate": 0.000227341435551224, "loss": 0.0554, "step": 75050 }, { "epoch": 0.48, "learning_rate": 0.0002273317541968671, "loss": 0.0527, "step": 75060 }, { "epoch": 0.48, "learning_rate": 0.00022732207284251017, "loss": 0.054, "step": 75070 }, { "epoch": 0.48, "learning_rate": 0.00022731239148815322, "loss": 0.049, "step": 75080 }, { "epoch": 0.48, "learning_rate": 0.0002273027101337963, "loss": 0.0559, "step": 75090 }, { "epoch": 0.48, "learning_rate": 0.00022729302877943938, "loss": 0.0572, "step": 75100 }, { "epoch": 0.48, "learning_rate": 0.0002272833474250824, "loss": 0.0595, "step": 75110 }, { "epoch": 0.48, "learning_rate": 0.0002272736660707255, "loss": 0.0503, "step": 75120 }, { "epoch": 0.48, "learning_rate": 0.00022726398471636857, "loss": 0.051, "step": 75130 }, { "epoch": 0.48, "learning_rate": 0.00022725430336201165, "loss": 0.0582, "step": 75140 }, { "epoch": 0.49, "learning_rate": 0.0002272446220076547, "loss": 0.0549, "step": 75150 }, { "epoch": 0.49, "learning_rate": 0.00022723494065329778, "loss": 0.0525, "step": 75160 }, { "epoch": 0.49, "learning_rate": 0.00022722525929894086, "loss": 0.0538, "step": 75170 }, { "epoch": 0.49, "learning_rate": 0.00022721557794458389, "loss": 0.0595, "step": 75180 }, { "epoch": 0.49, "learning_rate": 0.00022720589659022697, "loss": 0.0555, "step": 75190 }, { "epoch": 0.49, "learning_rate": 0.00022719621523587005, "loss": 0.0495, "step": 75200 }, { "epoch": 0.49, "learning_rate": 0.0002271865338815131, "loss": 0.059, "step": 75210 }, { "epoch": 0.49, "learning_rate": 0.00022717685252715618, "loss": 0.0558, "step": 75220 }, { "epoch": 0.49, "learning_rate": 0.00022716717117279926, "loss": 0.0543, "step": 75230 }, { "epoch": 0.49, "learning_rate": 0.00022715748981844234, "loss": 0.1502, "step": 75240 }, { "epoch": 0.49, "learning_rate": 0.00022714780846408536, "loss": 0.0914, "step": 75250 }, { "epoch": 0.49, "learning_rate": 0.00022713812710972844, "loss": 0.0557, "step": 75260 }, { "epoch": 0.49, "learning_rate": 0.00022712844575537152, "loss": 0.059, "step": 75270 }, { "epoch": 0.49, "learning_rate": 0.00022711876440101458, "loss": 0.0474, "step": 75280 }, { "epoch": 0.49, "learning_rate": 0.00022710908304665766, "loss": 0.0485, "step": 75290 }, { "epoch": 0.49, "learning_rate": 0.00022709940169230073, "loss": 0.0537, "step": 75300 }, { "epoch": 0.49, "learning_rate": 0.00022708972033794381, "loss": 0.0533, "step": 75310 }, { "epoch": 0.49, "learning_rate": 0.00022708003898358684, "loss": 0.0551, "step": 75320 }, { "epoch": 0.49, "learning_rate": 0.00022707035762922992, "loss": 0.0549, "step": 75330 }, { "epoch": 0.49, "learning_rate": 0.000227060676274873, "loss": 0.0545, "step": 75340 }, { "epoch": 0.49, "learning_rate": 0.00022705099492051605, "loss": 0.058, "step": 75350 }, { "epoch": 0.49, "learning_rate": 0.00022704131356615913, "loss": 0.0496, "step": 75360 }, { "epoch": 0.49, "learning_rate": 0.0002270316322118022, "loss": 0.0504, "step": 75370 }, { "epoch": 0.49, "learning_rate": 0.00022702195085744526, "loss": 0.0562, "step": 75380 }, { "epoch": 0.49, "learning_rate": 0.00022701226950308832, "loss": 0.0649, "step": 75390 }, { "epoch": 0.49, "learning_rate": 0.0002270025881487314, "loss": 0.0511, "step": 75400 }, { "epoch": 0.49, "learning_rate": 0.00022699290679437445, "loss": 0.0562, "step": 75410 }, { "epoch": 0.49, "learning_rate": 0.00022698322544001753, "loss": 0.056, "step": 75420 }, { "epoch": 0.49, "learning_rate": 0.0002269735440856606, "loss": 0.054, "step": 75430 }, { "epoch": 0.49, "learning_rate": 0.0002269638627313037, "loss": 0.0617, "step": 75440 }, { "epoch": 0.49, "learning_rate": 0.00022695418137694674, "loss": 0.046, "step": 75450 }, { "epoch": 0.49, "learning_rate": 0.0002269445000225898, "loss": 0.0556, "step": 75460 }, { "epoch": 0.49, "learning_rate": 0.00022693481866823287, "loss": 0.0519, "step": 75470 }, { "epoch": 0.49, "learning_rate": 0.00022692513731387593, "loss": 0.0494, "step": 75480 }, { "epoch": 0.49, "learning_rate": 0.000226915455959519, "loss": 0.059, "step": 75490 }, { "epoch": 0.49, "learning_rate": 0.0002269057746051621, "loss": 0.0546, "step": 75500 }, { "epoch": 0.49, "learning_rate": 0.00022689609325080517, "loss": 0.0557, "step": 75510 }, { "epoch": 0.49, "learning_rate": 0.00022688641189644822, "loss": 0.0471, "step": 75520 }, { "epoch": 0.49, "learning_rate": 0.00022687673054209127, "loss": 0.0625, "step": 75530 }, { "epoch": 0.49, "learning_rate": 0.00022686704918773435, "loss": 0.059, "step": 75540 }, { "epoch": 0.49, "learning_rate": 0.0002268573678333774, "loss": 0.0604, "step": 75550 }, { "epoch": 0.49, "learning_rate": 0.00022684768647902048, "loss": 0.0501, "step": 75560 }, { "epoch": 0.49, "learning_rate": 0.00022683800512466356, "loss": 0.0523, "step": 75570 }, { "epoch": 0.49, "learning_rate": 0.00022682832377030662, "loss": 0.0476, "step": 75580 }, { "epoch": 0.49, "learning_rate": 0.0002268186424159497, "loss": 0.0518, "step": 75590 }, { "epoch": 0.49, "learning_rate": 0.00022680896106159275, "loss": 0.0602, "step": 75600 }, { "epoch": 0.49, "learning_rate": 0.0002267992797072358, "loss": 0.0623, "step": 75610 }, { "epoch": 0.49, "learning_rate": 0.00022678959835287888, "loss": 0.0676, "step": 75620 }, { "epoch": 0.49, "learning_rate": 0.00022677991699852196, "loss": 0.0532, "step": 75630 }, { "epoch": 0.49, "learning_rate": 0.00022677023564416504, "loss": 0.0595, "step": 75640 }, { "epoch": 0.49, "learning_rate": 0.0002267605542898081, "loss": 0.0545, "step": 75650 }, { "epoch": 0.49, "learning_rate": 0.00022675087293545117, "loss": 0.0576, "step": 75660 }, { "epoch": 0.49, "learning_rate": 0.00022674119158109423, "loss": 0.0677, "step": 75670 }, { "epoch": 0.49, "learning_rate": 0.00022673151022673728, "loss": 0.0574, "step": 75680 }, { "epoch": 0.49, "learning_rate": 0.00022672182887238036, "loss": 0.054, "step": 75690 }, { "epoch": 0.49, "learning_rate": 0.00022671214751802344, "loss": 0.0568, "step": 75700 }, { "epoch": 0.49, "learning_rate": 0.00022670246616366652, "loss": 0.0578, "step": 75710 }, { "epoch": 0.49, "learning_rate": 0.00022669278480930957, "loss": 0.056, "step": 75720 }, { "epoch": 0.49, "learning_rate": 0.00022668310345495265, "loss": 0.0456, "step": 75730 }, { "epoch": 0.49, "learning_rate": 0.0002266734221005957, "loss": 0.0558, "step": 75740 }, { "epoch": 0.49, "learning_rate": 0.00022666374074623876, "loss": 0.0599, "step": 75750 }, { "epoch": 0.49, "learning_rate": 0.00022665405939188184, "loss": 0.0534, "step": 75760 }, { "epoch": 0.49, "learning_rate": 0.00022664437803752492, "loss": 0.0601, "step": 75770 }, { "epoch": 0.49, "learning_rate": 0.000226634696683168, "loss": 0.0504, "step": 75780 }, { "epoch": 0.49, "learning_rate": 0.00022662501532881105, "loss": 0.0577, "step": 75790 }, { "epoch": 0.49, "learning_rate": 0.00022661533397445413, "loss": 0.058, "step": 75800 }, { "epoch": 0.49, "learning_rate": 0.00022660565262009715, "loss": 0.0499, "step": 75810 }, { "epoch": 0.49, "learning_rate": 0.00022659597126574023, "loss": 0.0529, "step": 75820 }, { "epoch": 0.49, "learning_rate": 0.0002265862899113833, "loss": 0.0497, "step": 75830 }, { "epoch": 0.49, "learning_rate": 0.0002265766085570264, "loss": 0.0536, "step": 75840 }, { "epoch": 0.49, "learning_rate": 0.00022656692720266945, "loss": 0.0493, "step": 75850 }, { "epoch": 0.49, "learning_rate": 0.00022655724584831253, "loss": 0.0541, "step": 75860 }, { "epoch": 0.49, "learning_rate": 0.0002265475644939556, "loss": 0.0526, "step": 75870 }, { "epoch": 0.49, "learning_rate": 0.00022653788313959863, "loss": 0.0482, "step": 75880 }, { "epoch": 0.49, "learning_rate": 0.0002265282017852417, "loss": 0.0564, "step": 75890 }, { "epoch": 0.49, "learning_rate": 0.0002265185204308848, "loss": 0.0581, "step": 75900 }, { "epoch": 0.49, "learning_rate": 0.00022650883907652787, "loss": 0.0593, "step": 75910 }, { "epoch": 0.49, "learning_rate": 0.00022649915772217092, "loss": 0.0515, "step": 75920 }, { "epoch": 0.49, "learning_rate": 0.000226489476367814, "loss": 0.0597, "step": 75930 }, { "epoch": 0.49, "learning_rate": 0.00022647979501345708, "loss": 0.0484, "step": 75940 }, { "epoch": 0.49, "learning_rate": 0.0002264701136591001, "loss": 0.0507, "step": 75950 }, { "epoch": 0.49, "learning_rate": 0.0002264604323047432, "loss": 0.0467, "step": 75960 }, { "epoch": 0.49, "learning_rate": 0.00022645075095038627, "loss": 0.0555, "step": 75970 }, { "epoch": 0.49, "learning_rate": 0.00022644106959602935, "loss": 0.0618, "step": 75980 }, { "epoch": 0.49, "learning_rate": 0.0002264313882416724, "loss": 0.0501, "step": 75990 }, { "epoch": 0.49, "learning_rate": 0.00022642170688731548, "loss": 0.0545, "step": 76000 }, { "epoch": 0.49, "eval_cer": 0.9200289232855045, "eval_loss": 0.03558797389268875, "eval_runtime": 119.9372, "eval_samples_per_second": 16.675, "eval_steps_per_second": 4.169, "step": 76000 }, { "epoch": 0.49, "learning_rate": 0.00022641202553295856, "loss": 0.0543, "step": 76010 }, { "epoch": 0.49, "learning_rate": 0.00022640234417860159, "loss": 0.0621, "step": 76020 }, { "epoch": 0.49, "learning_rate": 0.00022639266282424467, "loss": 0.0504, "step": 76030 }, { "epoch": 0.49, "learning_rate": 0.00022638298146988775, "loss": 0.0534, "step": 76040 }, { "epoch": 0.49, "learning_rate": 0.0002263733001155308, "loss": 0.0491, "step": 76050 }, { "epoch": 0.49, "learning_rate": 0.00022636361876117388, "loss": 0.049, "step": 76060 }, { "epoch": 0.49, "learning_rate": 0.00022635393740681696, "loss": 0.0533, "step": 76070 }, { "epoch": 0.49, "learning_rate": 0.00022634425605246004, "loss": 0.0558, "step": 76080 }, { "epoch": 0.49, "learning_rate": 0.00022633457469810306, "loss": 0.0512, "step": 76090 }, { "epoch": 0.49, "learning_rate": 0.00022632489334374614, "loss": 0.0539, "step": 76100 }, { "epoch": 0.49, "learning_rate": 0.00022631521198938922, "loss": 0.0552, "step": 76110 }, { "epoch": 0.49, "learning_rate": 0.00022630553063503228, "loss": 0.0526, "step": 76120 }, { "epoch": 0.49, "learning_rate": 0.00022629584928067535, "loss": 0.0588, "step": 76130 }, { "epoch": 0.49, "learning_rate": 0.00022628616792631843, "loss": 0.072, "step": 76140 }, { "epoch": 0.49, "learning_rate": 0.00022627648657196151, "loss": 0.0562, "step": 76150 }, { "epoch": 0.49, "learning_rate": 0.00022626680521760454, "loss": 0.0586, "step": 76160 }, { "epoch": 0.49, "learning_rate": 0.00022625712386324762, "loss": 0.0588, "step": 76170 }, { "epoch": 0.49, "learning_rate": 0.0002262474425088907, "loss": 0.056, "step": 76180 }, { "epoch": 0.49, "learning_rate": 0.00022623776115453375, "loss": 0.0603, "step": 76190 }, { "epoch": 0.49, "learning_rate": 0.00022622807980017683, "loss": 0.0538, "step": 76200 }, { "epoch": 0.49, "learning_rate": 0.0002262183984458199, "loss": 0.0555, "step": 76210 }, { "epoch": 0.49, "learning_rate": 0.00022620871709146296, "loss": 0.056, "step": 76220 }, { "epoch": 0.49, "learning_rate": 0.00022619903573710602, "loss": 0.0541, "step": 76230 }, { "epoch": 0.49, "learning_rate": 0.0002261893543827491, "loss": 0.0484, "step": 76240 }, { "epoch": 0.49, "learning_rate": 0.00022617967302839215, "loss": 0.0491, "step": 76250 }, { "epoch": 0.49, "learning_rate": 0.00022616999167403523, "loss": 0.0569, "step": 76260 }, { "epoch": 0.49, "learning_rate": 0.0002261603103196783, "loss": 0.0563, "step": 76270 }, { "epoch": 0.49, "learning_rate": 0.0002261506289653214, "loss": 0.0526, "step": 76280 }, { "epoch": 0.49, "learning_rate": 0.00022614094761096444, "loss": 0.0548, "step": 76290 }, { "epoch": 0.49, "learning_rate": 0.0002261312662566075, "loss": 0.057, "step": 76300 }, { "epoch": 0.49, "learning_rate": 0.00022612158490225057, "loss": 0.0477, "step": 76310 }, { "epoch": 0.49, "learning_rate": 0.00022611190354789363, "loss": 0.0554, "step": 76320 }, { "epoch": 0.49, "learning_rate": 0.0002261022221935367, "loss": 0.055, "step": 76330 }, { "epoch": 0.49, "learning_rate": 0.0002260925408391798, "loss": 0.0539, "step": 76340 }, { "epoch": 0.49, "learning_rate": 0.00022608285948482287, "loss": 0.0511, "step": 76350 }, { "epoch": 0.49, "learning_rate": 0.00022607317813046592, "loss": 0.059, "step": 76360 }, { "epoch": 0.49, "learning_rate": 0.00022606349677610897, "loss": 0.0528, "step": 76370 }, { "epoch": 0.49, "learning_rate": 0.00022605381542175205, "loss": 0.0517, "step": 76380 }, { "epoch": 0.49, "learning_rate": 0.0002260441340673951, "loss": 0.0514, "step": 76390 }, { "epoch": 0.49, "learning_rate": 0.00022603445271303818, "loss": 0.0495, "step": 76400 }, { "epoch": 0.49, "learning_rate": 0.00022602477135868126, "loss": 0.0522, "step": 76410 }, { "epoch": 0.49, "learning_rate": 0.00022601509000432432, "loss": 0.0545, "step": 76420 }, { "epoch": 0.49, "learning_rate": 0.0002260054086499674, "loss": 0.056, "step": 76430 }, { "epoch": 0.49, "learning_rate": 0.00022599572729561045, "loss": 0.0689, "step": 76440 }, { "epoch": 0.49, "learning_rate": 0.0002259860459412535, "loss": 0.0554, "step": 76450 }, { "epoch": 0.49, "learning_rate": 0.00022597636458689658, "loss": 0.058, "step": 76460 }, { "epoch": 0.49, "learning_rate": 0.00022596668323253966, "loss": 0.0557, "step": 76470 }, { "epoch": 0.49, "learning_rate": 0.00022595700187818274, "loss": 0.0617, "step": 76480 }, { "epoch": 0.49, "learning_rate": 0.0002259473205238258, "loss": 0.0552, "step": 76490 }, { "epoch": 0.49, "learning_rate": 0.00022593763916946887, "loss": 0.0612, "step": 76500 }, { "epoch": 0.49, "learning_rate": 0.00022592795781511193, "loss": 0.0526, "step": 76510 }, { "epoch": 0.49, "learning_rate": 0.00022591827646075498, "loss": 0.0536, "step": 76520 }, { "epoch": 0.49, "learning_rate": 0.00022590859510639806, "loss": 0.0617, "step": 76530 }, { "epoch": 0.49, "learning_rate": 0.00022589891375204114, "loss": 0.0522, "step": 76540 }, { "epoch": 0.49, "learning_rate": 0.00022588923239768422, "loss": 0.0505, "step": 76550 }, { "epoch": 0.49, "learning_rate": 0.00022587955104332727, "loss": 0.0578, "step": 76560 }, { "epoch": 0.49, "learning_rate": 0.00022586986968897035, "loss": 0.057, "step": 76570 }, { "epoch": 0.49, "learning_rate": 0.0002258601883346134, "loss": 0.0523, "step": 76580 }, { "epoch": 0.49, "learning_rate": 0.00022585050698025646, "loss": 0.0553, "step": 76590 }, { "epoch": 0.49, "learning_rate": 0.00022584082562589954, "loss": 0.0615, "step": 76600 }, { "epoch": 0.49, "learning_rate": 0.00022583114427154262, "loss": 0.0545, "step": 76610 }, { "epoch": 0.49, "learning_rate": 0.00022582146291718567, "loss": 0.0537, "step": 76620 }, { "epoch": 0.49, "learning_rate": 0.00022581178156282875, "loss": 0.0532, "step": 76630 }, { "epoch": 0.49, "learning_rate": 0.00022580210020847183, "loss": 0.0609, "step": 76640 }, { "epoch": 0.49, "learning_rate": 0.00022579241885411485, "loss": 0.0489, "step": 76650 }, { "epoch": 0.49, "learning_rate": 0.00022578273749975793, "loss": 0.0487, "step": 76660 }, { "epoch": 0.49, "learning_rate": 0.000225773056145401, "loss": 0.0557, "step": 76670 }, { "epoch": 0.49, "learning_rate": 0.0002257633747910441, "loss": 0.0538, "step": 76680 }, { "epoch": 0.49, "learning_rate": 0.00022575369343668715, "loss": 0.0593, "step": 76690 }, { "epoch": 0.5, "learning_rate": 0.00022574401208233023, "loss": 0.0544, "step": 76700 }, { "epoch": 0.5, "learning_rate": 0.0002257343307279733, "loss": 0.058, "step": 76710 }, { "epoch": 0.5, "learning_rate": 0.00022572464937361633, "loss": 0.0564, "step": 76720 }, { "epoch": 0.5, "learning_rate": 0.0002257149680192594, "loss": 0.0499, "step": 76730 }, { "epoch": 0.5, "learning_rate": 0.0002257052866649025, "loss": 0.0558, "step": 76740 }, { "epoch": 0.5, "learning_rate": 0.00022569560531054557, "loss": 0.0538, "step": 76750 }, { "epoch": 0.5, "learning_rate": 0.00022568592395618862, "loss": 0.0591, "step": 76760 }, { "epoch": 0.5, "learning_rate": 0.0002256762426018317, "loss": 0.0547, "step": 76770 }, { "epoch": 0.5, "learning_rate": 0.00022566656124747478, "loss": 0.054, "step": 76780 }, { "epoch": 0.5, "learning_rate": 0.0002256568798931178, "loss": 0.0555, "step": 76790 }, { "epoch": 0.5, "learning_rate": 0.0002256471985387609, "loss": 0.0576, "step": 76800 }, { "epoch": 0.5, "learning_rate": 0.00022563751718440397, "loss": 0.0504, "step": 76810 }, { "epoch": 0.5, "learning_rate": 0.00022562783583004702, "loss": 0.0558, "step": 76820 }, { "epoch": 0.5, "learning_rate": 0.0002256181544756901, "loss": 0.0621, "step": 76830 }, { "epoch": 0.5, "learning_rate": 0.00022560847312133318, "loss": 0.0476, "step": 76840 }, { "epoch": 0.5, "learning_rate": 0.00022559879176697626, "loss": 0.0575, "step": 76850 }, { "epoch": 0.5, "learning_rate": 0.00022558911041261929, "loss": 0.055, "step": 76860 }, { "epoch": 0.5, "learning_rate": 0.00022557942905826236, "loss": 0.0576, "step": 76870 }, { "epoch": 0.5, "learning_rate": 0.00022556974770390544, "loss": 0.0578, "step": 76880 }, { "epoch": 0.5, "learning_rate": 0.0002255600663495485, "loss": 0.056, "step": 76890 }, { "epoch": 0.5, "learning_rate": 0.00022555038499519158, "loss": 0.0536, "step": 76900 }, { "epoch": 0.5, "learning_rate": 0.00022554070364083466, "loss": 0.0541, "step": 76910 }, { "epoch": 0.5, "learning_rate": 0.00022553102228647774, "loss": 0.0534, "step": 76920 }, { "epoch": 0.5, "learning_rate": 0.00022552134093212076, "loss": 0.0511, "step": 76930 }, { "epoch": 0.5, "learning_rate": 0.00022551165957776384, "loss": 0.0543, "step": 76940 }, { "epoch": 0.5, "learning_rate": 0.00022550197822340692, "loss": 0.0615, "step": 76950 }, { "epoch": 0.5, "learning_rate": 0.00022549229686904997, "loss": 0.0624, "step": 76960 }, { "epoch": 0.5, "learning_rate": 0.00022548261551469305, "loss": 0.0485, "step": 76970 }, { "epoch": 0.5, "learning_rate": 0.00022547293416033613, "loss": 0.0648, "step": 76980 }, { "epoch": 0.5, "learning_rate": 0.0002254632528059792, "loss": 0.0631, "step": 76990 }, { "epoch": 0.5, "learning_rate": 0.00022545357145162224, "loss": 0.0527, "step": 77000 }, { "epoch": 0.5, "eval_cer": 0.9199611343351034, "eval_loss": 0.03577205166220665, "eval_runtime": 120.0009, "eval_samples_per_second": 16.667, "eval_steps_per_second": 4.167, "step": 77000 }, { "epoch": 0.5, "learning_rate": 0.00022544389009726532, "loss": 0.0537, "step": 77010 }, { "epoch": 0.5, "learning_rate": 0.00022543420874290837, "loss": 0.0506, "step": 77020 }, { "epoch": 0.5, "learning_rate": 0.00022542452738855145, "loss": 0.0523, "step": 77030 }, { "epoch": 0.5, "learning_rate": 0.00022541484603419453, "loss": 0.0516, "step": 77040 }, { "epoch": 0.5, "learning_rate": 0.0002254051646798376, "loss": 0.048, "step": 77050 }, { "epoch": 0.5, "learning_rate": 0.00022539548332548066, "loss": 0.0593, "step": 77060 }, { "epoch": 0.5, "learning_rate": 0.00022538580197112372, "loss": 0.0545, "step": 77070 }, { "epoch": 0.5, "learning_rate": 0.0002253761206167668, "loss": 0.0482, "step": 77080 }, { "epoch": 0.5, "learning_rate": 0.00022536643926240985, "loss": 0.0561, "step": 77090 }, { "epoch": 0.5, "learning_rate": 0.00022535675790805293, "loss": 0.052, "step": 77100 }, { "epoch": 0.5, "learning_rate": 0.000225347076553696, "loss": 0.0526, "step": 77110 }, { "epoch": 0.5, "learning_rate": 0.0002253373951993391, "loss": 0.0482, "step": 77120 }, { "epoch": 0.5, "learning_rate": 0.00022532771384498214, "loss": 0.0563, "step": 77130 }, { "epoch": 0.5, "learning_rate": 0.0002253180324906252, "loss": 0.0539, "step": 77140 }, { "epoch": 0.5, "learning_rate": 0.00022530835113626827, "loss": 0.0481, "step": 77150 }, { "epoch": 0.5, "learning_rate": 0.00022529866978191133, "loss": 0.0489, "step": 77160 }, { "epoch": 0.5, "learning_rate": 0.0002252889884275544, "loss": 0.0543, "step": 77170 }, { "epoch": 0.5, "learning_rate": 0.00022527930707319749, "loss": 0.0615, "step": 77180 }, { "epoch": 0.5, "learning_rate": 0.00022526962571884054, "loss": 0.0543, "step": 77190 }, { "epoch": 0.5, "learning_rate": 0.00022525994436448362, "loss": 0.0532, "step": 77200 }, { "epoch": 0.5, "learning_rate": 0.00022525026301012667, "loss": 0.0538, "step": 77210 }, { "epoch": 0.5, "learning_rate": 0.00022524058165576972, "loss": 0.0543, "step": 77220 }, { "epoch": 0.5, "learning_rate": 0.0002252309003014128, "loss": 0.054, "step": 77230 }, { "epoch": 0.5, "learning_rate": 0.00022522121894705588, "loss": 0.0475, "step": 77240 }, { "epoch": 0.5, "learning_rate": 0.00022521153759269896, "loss": 0.0579, "step": 77250 }, { "epoch": 0.5, "learning_rate": 0.00022520185623834202, "loss": 0.0516, "step": 77260 }, { "epoch": 0.5, "learning_rate": 0.0002251921748839851, "loss": 0.047, "step": 77270 }, { "epoch": 0.5, "learning_rate": 0.00022518249352962815, "loss": 0.0545, "step": 77280 }, { "epoch": 0.5, "learning_rate": 0.0002251728121752712, "loss": 0.0613, "step": 77290 }, { "epoch": 0.5, "learning_rate": 0.00022516313082091428, "loss": 0.0527, "step": 77300 }, { "epoch": 0.5, "learning_rate": 0.00022515344946655736, "loss": 0.0531, "step": 77310 }, { "epoch": 0.5, "learning_rate": 0.00022514376811220044, "loss": 0.0541, "step": 77320 }, { "epoch": 0.5, "learning_rate": 0.0002251340867578435, "loss": 0.0523, "step": 77330 }, { "epoch": 0.5, "learning_rate": 0.00022512440540348657, "loss": 0.0531, "step": 77340 }, { "epoch": 0.5, "learning_rate": 0.00022511472404912963, "loss": 0.0526, "step": 77350 }, { "epoch": 0.5, "learning_rate": 0.00022510504269477268, "loss": 0.0547, "step": 77360 }, { "epoch": 0.5, "learning_rate": 0.00022509536134041576, "loss": 0.0492, "step": 77370 }, { "epoch": 0.5, "learning_rate": 0.00022508567998605884, "loss": 0.0518, "step": 77380 }, { "epoch": 0.5, "learning_rate": 0.0002250759986317019, "loss": 0.0508, "step": 77390 }, { "epoch": 0.5, "learning_rate": 0.00022506631727734497, "loss": 0.0573, "step": 77400 }, { "epoch": 0.5, "learning_rate": 0.00022505663592298805, "loss": 0.0528, "step": 77410 }, { "epoch": 0.5, "learning_rate": 0.00022504695456863108, "loss": 0.049, "step": 77420 }, { "epoch": 0.5, "learning_rate": 0.00022503727321427416, "loss": 0.0501, "step": 77430 }, { "epoch": 0.5, "learning_rate": 0.00022502759185991724, "loss": 0.054, "step": 77440 }, { "epoch": 0.5, "learning_rate": 0.00022501791050556032, "loss": 0.0543, "step": 77450 }, { "epoch": 0.5, "learning_rate": 0.00022500822915120337, "loss": 0.0494, "step": 77460 }, { "epoch": 0.5, "learning_rate": 0.00022499854779684645, "loss": 0.0514, "step": 77470 }, { "epoch": 0.5, "learning_rate": 0.00022498886644248953, "loss": 0.0611, "step": 77480 }, { "epoch": 0.5, "learning_rate": 0.00022497918508813255, "loss": 0.0496, "step": 77490 }, { "epoch": 0.5, "learning_rate": 0.00022496950373377563, "loss": 0.0527, "step": 77500 }, { "epoch": 0.5, "learning_rate": 0.0002249598223794187, "loss": 0.0531, "step": 77510 }, { "epoch": 0.5, "learning_rate": 0.0002249501410250618, "loss": 0.0581, "step": 77520 }, { "epoch": 0.5, "learning_rate": 0.00022494045967070485, "loss": 0.0553, "step": 77530 }, { "epoch": 0.5, "learning_rate": 0.00022493077831634792, "loss": 0.0548, "step": 77540 }, { "epoch": 0.5, "learning_rate": 0.000224921096961991, "loss": 0.0529, "step": 77550 }, { "epoch": 0.5, "learning_rate": 0.00022491141560763403, "loss": 0.0521, "step": 77560 }, { "epoch": 0.5, "learning_rate": 0.0002249017342532771, "loss": 0.0496, "step": 77570 }, { "epoch": 0.5, "learning_rate": 0.0002248920528989202, "loss": 0.0515, "step": 77580 }, { "epoch": 0.5, "learning_rate": 0.00022488237154456324, "loss": 0.0498, "step": 77590 }, { "epoch": 0.5, "learning_rate": 0.00022487269019020632, "loss": 0.0521, "step": 77600 }, { "epoch": 0.5, "learning_rate": 0.0002248630088358494, "loss": 0.053, "step": 77610 }, { "epoch": 0.5, "learning_rate": 0.00022485332748149248, "loss": 0.0591, "step": 77620 }, { "epoch": 0.5, "learning_rate": 0.0002248436461271355, "loss": 0.0555, "step": 77630 }, { "epoch": 0.5, "learning_rate": 0.0002248339647727786, "loss": 0.0499, "step": 77640 }, { "epoch": 0.5, "learning_rate": 0.00022482428341842167, "loss": 0.0634, "step": 77650 }, { "epoch": 0.5, "learning_rate": 0.00022481460206406472, "loss": 0.0507, "step": 77660 }, { "epoch": 0.5, "learning_rate": 0.0002248049207097078, "loss": 0.0571, "step": 77670 }, { "epoch": 0.5, "learning_rate": 0.00022479523935535088, "loss": 0.0535, "step": 77680 }, { "epoch": 0.5, "learning_rate": 0.00022478555800099396, "loss": 0.0557, "step": 77690 }, { "epoch": 0.5, "learning_rate": 0.00022477587664663698, "loss": 0.0524, "step": 77700 }, { "epoch": 0.5, "learning_rate": 0.00022476619529228006, "loss": 0.0552, "step": 77710 }, { "epoch": 0.5, "learning_rate": 0.00022475651393792314, "loss": 0.0572, "step": 77720 }, { "epoch": 0.5, "learning_rate": 0.0002247468325835662, "loss": 0.0541, "step": 77730 }, { "epoch": 0.5, "learning_rate": 0.00022473715122920928, "loss": 0.062, "step": 77740 }, { "epoch": 0.5, "learning_rate": 0.00022472746987485236, "loss": 0.0582, "step": 77750 }, { "epoch": 0.5, "learning_rate": 0.00022471778852049544, "loss": 0.0499, "step": 77760 }, { "epoch": 0.5, "learning_rate": 0.00022470810716613846, "loss": 0.0595, "step": 77770 }, { "epoch": 0.5, "learning_rate": 0.00022469842581178154, "loss": 0.05, "step": 77780 }, { "epoch": 0.5, "learning_rate": 0.0002246887444574246, "loss": 0.0532, "step": 77790 }, { "epoch": 0.5, "learning_rate": 0.00022467906310306767, "loss": 0.0506, "step": 77800 }, { "epoch": 0.5, "learning_rate": 0.00022466938174871075, "loss": 0.0598, "step": 77810 }, { "epoch": 0.5, "learning_rate": 0.00022465970039435383, "loss": 0.055, "step": 77820 }, { "epoch": 0.5, "learning_rate": 0.0002246500190399969, "loss": 0.0481, "step": 77830 }, { "epoch": 0.5, "learning_rate": 0.00022464033768563994, "loss": 0.0557, "step": 77840 }, { "epoch": 0.5, "learning_rate": 0.00022463065633128302, "loss": 0.058, "step": 77850 }, { "epoch": 0.5, "learning_rate": 0.00022462097497692607, "loss": 0.0509, "step": 77860 }, { "epoch": 0.5, "learning_rate": 0.00022461129362256915, "loss": 0.0435, "step": 77870 }, { "epoch": 0.5, "learning_rate": 0.00022460161226821223, "loss": 0.0584, "step": 77880 }, { "epoch": 0.5, "learning_rate": 0.0002245919309138553, "loss": 0.062, "step": 77890 }, { "epoch": 0.5, "learning_rate": 0.00022458224955949836, "loss": 0.0557, "step": 77900 }, { "epoch": 0.5, "learning_rate": 0.00022457256820514142, "loss": 0.0621, "step": 77910 }, { "epoch": 0.5, "learning_rate": 0.0002245628868507845, "loss": 0.0515, "step": 77920 }, { "epoch": 0.5, "learning_rate": 0.00022455320549642755, "loss": 0.0485, "step": 77930 }, { "epoch": 0.5, "learning_rate": 0.00022454352414207063, "loss": 0.0491, "step": 77940 }, { "epoch": 0.5, "learning_rate": 0.0002245338427877137, "loss": 0.0563, "step": 77950 }, { "epoch": 0.5, "learning_rate": 0.0002245241614333568, "loss": 0.0542, "step": 77960 }, { "epoch": 0.5, "learning_rate": 0.00022451448007899984, "loss": 0.0547, "step": 77970 }, { "epoch": 0.5, "learning_rate": 0.0002245047987246429, "loss": 0.0487, "step": 77980 }, { "epoch": 0.5, "learning_rate": 0.00022449511737028595, "loss": 0.0508, "step": 77990 }, { "epoch": 0.5, "learning_rate": 0.00022448543601592903, "loss": 0.0464, "step": 78000 }, { "epoch": 0.5, "eval_cer": 0.9201102700259858, "eval_loss": 0.03538144752383232, "eval_runtime": 120.2717, "eval_samples_per_second": 16.629, "eval_steps_per_second": 4.157, "step": 78000 }, { "epoch": 0.5, "learning_rate": 0.0002244757546615721, "loss": 0.0577, "step": 78010 }, { "epoch": 0.5, "learning_rate": 0.00022446607330721519, "loss": 0.0517, "step": 78020 }, { "epoch": 0.5, "learning_rate": 0.00022445639195285824, "loss": 0.0542, "step": 78030 }, { "epoch": 0.5, "learning_rate": 0.00022444671059850132, "loss": 0.0448, "step": 78040 }, { "epoch": 0.5, "learning_rate": 0.00022443702924414437, "loss": 0.0612, "step": 78050 }, { "epoch": 0.5, "learning_rate": 0.00022442734788978742, "loss": 0.0519, "step": 78060 }, { "epoch": 0.5, "learning_rate": 0.0002244176665354305, "loss": 0.0493, "step": 78070 }, { "epoch": 0.5, "learning_rate": 0.00022440798518107358, "loss": 0.054, "step": 78080 }, { "epoch": 0.5, "learning_rate": 0.00022439830382671666, "loss": 0.049, "step": 78090 }, { "epoch": 0.5, "learning_rate": 0.00022438862247235972, "loss": 0.0589, "step": 78100 }, { "epoch": 0.5, "learning_rate": 0.0002243789411180028, "loss": 0.0572, "step": 78110 }, { "epoch": 0.5, "learning_rate": 0.00022436925976364585, "loss": 0.0501, "step": 78120 }, { "epoch": 0.5, "learning_rate": 0.0002243595784092889, "loss": 0.0516, "step": 78130 }, { "epoch": 0.5, "learning_rate": 0.00022434989705493198, "loss": 0.0522, "step": 78140 }, { "epoch": 0.5, "learning_rate": 0.00022434021570057506, "loss": 0.0517, "step": 78150 }, { "epoch": 0.5, "learning_rate": 0.00022433053434621814, "loss": 0.0571, "step": 78160 }, { "epoch": 0.5, "learning_rate": 0.0002243208529918612, "loss": 0.0476, "step": 78170 }, { "epoch": 0.5, "learning_rate": 0.00022431117163750427, "loss": 0.0594, "step": 78180 }, { "epoch": 0.5, "learning_rate": 0.0002243014902831473, "loss": 0.0538, "step": 78190 }, { "epoch": 0.5, "learning_rate": 0.00022429180892879038, "loss": 0.051, "step": 78200 }, { "epoch": 0.5, "learning_rate": 0.00022428212757443346, "loss": 0.0528, "step": 78210 }, { "epoch": 0.5, "learning_rate": 0.00022427244622007654, "loss": 0.0524, "step": 78220 }, { "epoch": 0.5, "learning_rate": 0.0002242627648657196, "loss": 0.0595, "step": 78230 }, { "epoch": 0.5, "learning_rate": 0.00022425308351136267, "loss": 0.0519, "step": 78240 }, { "epoch": 0.51, "learning_rate": 0.00022424340215700575, "loss": 0.0504, "step": 78250 }, { "epoch": 0.51, "learning_rate": 0.00022423372080264878, "loss": 0.0538, "step": 78260 }, { "epoch": 0.51, "learning_rate": 0.00022422403944829186, "loss": 0.0468, "step": 78270 }, { "epoch": 0.51, "learning_rate": 0.00022421435809393494, "loss": 0.0525, "step": 78280 }, { "epoch": 0.51, "learning_rate": 0.00022420467673957801, "loss": 0.0545, "step": 78290 }, { "epoch": 0.51, "learning_rate": 0.00022419499538522107, "loss": 0.0521, "step": 78300 }, { "epoch": 0.51, "learning_rate": 0.00022418531403086415, "loss": 0.0536, "step": 78310 }, { "epoch": 0.51, "learning_rate": 0.00022417563267650723, "loss": 0.0488, "step": 78320 }, { "epoch": 0.51, "learning_rate": 0.00022416595132215025, "loss": 0.0451, "step": 78330 }, { "epoch": 0.51, "learning_rate": 0.00022415626996779333, "loss": 0.0559, "step": 78340 }, { "epoch": 0.51, "learning_rate": 0.0002241465886134364, "loss": 0.0551, "step": 78350 }, { "epoch": 0.51, "learning_rate": 0.0002241369072590795, "loss": 0.0514, "step": 78360 }, { "epoch": 0.51, "learning_rate": 0.00022412722590472254, "loss": 0.045, "step": 78370 }, { "epoch": 0.51, "learning_rate": 0.00022411754455036562, "loss": 0.054, "step": 78380 }, { "epoch": 0.51, "learning_rate": 0.0002241078631960087, "loss": 0.061, "step": 78390 }, { "epoch": 0.51, "learning_rate": 0.00022409818184165173, "loss": 0.053, "step": 78400 }, { "epoch": 0.51, "learning_rate": 0.0002240885004872948, "loss": 0.043, "step": 78410 }, { "epoch": 0.51, "learning_rate": 0.0002240788191329379, "loss": 0.0484, "step": 78420 }, { "epoch": 0.51, "learning_rate": 0.00022406913777858094, "loss": 0.0541, "step": 78430 }, { "epoch": 0.51, "learning_rate": 0.00022405945642422402, "loss": 0.0464, "step": 78440 }, { "epoch": 0.51, "learning_rate": 0.0002240497750698671, "loss": 0.0536, "step": 78450 }, { "epoch": 0.51, "learning_rate": 0.00022404009371551018, "loss": 0.052, "step": 78460 }, { "epoch": 0.51, "learning_rate": 0.0002240304123611532, "loss": 0.048, "step": 78470 }, { "epoch": 0.51, "learning_rate": 0.0002240207310067963, "loss": 0.0559, "step": 78480 }, { "epoch": 0.51, "learning_rate": 0.00022401104965243937, "loss": 0.0714, "step": 78490 }, { "epoch": 0.51, "learning_rate": 0.00022400136829808242, "loss": 0.0551, "step": 78500 }, { "epoch": 0.51, "learning_rate": 0.0002239916869437255, "loss": 0.0511, "step": 78510 }, { "epoch": 0.51, "learning_rate": 0.00022398200558936858, "loss": 0.0507, "step": 78520 }, { "epoch": 0.51, "learning_rate": 0.00022397232423501166, "loss": 0.0467, "step": 78530 }, { "epoch": 0.51, "learning_rate": 0.00022396264288065468, "loss": 0.0608, "step": 78540 }, { "epoch": 0.51, "learning_rate": 0.00022395296152629776, "loss": 0.069, "step": 78550 }, { "epoch": 0.51, "learning_rate": 0.00022394328017194084, "loss": 0.049, "step": 78560 }, { "epoch": 0.51, "learning_rate": 0.0002239335988175839, "loss": 0.0596, "step": 78570 }, { "epoch": 0.51, "learning_rate": 0.00022392391746322698, "loss": 0.0496, "step": 78580 }, { "epoch": 0.51, "learning_rate": 0.00022391423610887006, "loss": 0.0581, "step": 78590 }, { "epoch": 0.51, "learning_rate": 0.0002239045547545131, "loss": 0.0497, "step": 78600 }, { "epoch": 0.51, "learning_rate": 0.00022389487340015616, "loss": 0.0553, "step": 78610 }, { "epoch": 0.51, "learning_rate": 0.00022388519204579924, "loss": 0.045, "step": 78620 }, { "epoch": 0.51, "learning_rate": 0.0002238755106914423, "loss": 0.0527, "step": 78630 }, { "epoch": 0.51, "learning_rate": 0.00022386582933708537, "loss": 0.0469, "step": 78640 }, { "epoch": 0.51, "learning_rate": 0.00022385614798272845, "loss": 0.0505, "step": 78650 }, { "epoch": 0.51, "learning_rate": 0.00022384646662837153, "loss": 0.0496, "step": 78660 }, { "epoch": 0.51, "learning_rate": 0.00022383678527401459, "loss": 0.0486, "step": 78670 }, { "epoch": 0.51, "learning_rate": 0.00022382710391965764, "loss": 0.0517, "step": 78680 }, { "epoch": 0.51, "learning_rate": 0.00022381742256530072, "loss": 0.0552, "step": 78690 }, { "epoch": 0.51, "learning_rate": 0.00022380774121094377, "loss": 0.047, "step": 78700 }, { "epoch": 0.51, "learning_rate": 0.00022379805985658685, "loss": 0.0541, "step": 78710 }, { "epoch": 0.51, "learning_rate": 0.00022378837850222993, "loss": 0.0477, "step": 78720 }, { "epoch": 0.51, "learning_rate": 0.000223778697147873, "loss": 0.0499, "step": 78730 }, { "epoch": 0.51, "learning_rate": 0.00022376901579351606, "loss": 0.0534, "step": 78740 }, { "epoch": 0.51, "learning_rate": 0.00022375933443915912, "loss": 0.0534, "step": 78750 }, { "epoch": 0.51, "learning_rate": 0.0002237496530848022, "loss": 0.054, "step": 78760 }, { "epoch": 0.51, "learning_rate": 0.00022373997173044525, "loss": 0.0543, "step": 78770 }, { "epoch": 0.51, "learning_rate": 0.00022373029037608833, "loss": 0.0493, "step": 78780 }, { "epoch": 0.51, "learning_rate": 0.0002237206090217314, "loss": 0.0525, "step": 78790 }, { "epoch": 0.51, "learning_rate": 0.00022371092766737446, "loss": 0.0459, "step": 78800 }, { "epoch": 0.51, "learning_rate": 0.00022370124631301754, "loss": 0.0509, "step": 78810 }, { "epoch": 0.51, "learning_rate": 0.0002236915649586606, "loss": 0.0608, "step": 78820 }, { "epoch": 0.51, "learning_rate": 0.00022368188360430365, "loss": 0.0525, "step": 78830 }, { "epoch": 0.51, "learning_rate": 0.00022367220224994673, "loss": 0.0597, "step": 78840 }, { "epoch": 0.51, "learning_rate": 0.0002236625208955898, "loss": 0.0518, "step": 78850 }, { "epoch": 0.51, "learning_rate": 0.00022365283954123289, "loss": 0.0544, "step": 78860 }, { "epoch": 0.51, "learning_rate": 0.00022364315818687594, "loss": 0.0477, "step": 78870 }, { "epoch": 0.51, "learning_rate": 0.00022363347683251902, "loss": 0.0487, "step": 78880 }, { "epoch": 0.51, "learning_rate": 0.00022362379547816207, "loss": 0.0489, "step": 78890 }, { "epoch": 0.51, "learning_rate": 0.00022361411412380512, "loss": 0.0505, "step": 78900 }, { "epoch": 0.51, "learning_rate": 0.0002236044327694482, "loss": 0.0534, "step": 78910 }, { "epoch": 0.51, "learning_rate": 0.00022359475141509128, "loss": 0.0527, "step": 78920 }, { "epoch": 0.51, "learning_rate": 0.00022358507006073436, "loss": 0.0519, "step": 78930 }, { "epoch": 0.51, "learning_rate": 0.00022357538870637742, "loss": 0.0493, "step": 78940 }, { "epoch": 0.51, "learning_rate": 0.0002235657073520205, "loss": 0.0545, "step": 78950 }, { "epoch": 0.51, "learning_rate": 0.00022355602599766355, "loss": 0.0523, "step": 78960 }, { "epoch": 0.51, "learning_rate": 0.0002235463446433066, "loss": 0.0512, "step": 78970 }, { "epoch": 0.51, "learning_rate": 0.00022353666328894968, "loss": 0.055, "step": 78980 }, { "epoch": 0.51, "learning_rate": 0.00022352698193459276, "loss": 0.0533, "step": 78990 }, { "epoch": 0.51, "learning_rate": 0.0002235173005802358, "loss": 0.0546, "step": 79000 }, { "epoch": 0.51, "eval_cer": 0.9200325386961925, "eval_loss": 0.0354156568646431, "eval_runtime": 120.0383, "eval_samples_per_second": 16.661, "eval_steps_per_second": 4.165, "step": 79000 }, { "epoch": 0.51, "learning_rate": 0.0002235076192258789, "loss": 0.0533, "step": 79010 }, { "epoch": 0.51, "learning_rate": 0.00022349793787152197, "loss": 0.0535, "step": 79020 }, { "epoch": 0.51, "learning_rate": 0.000223488256517165, "loss": 0.05, "step": 79030 }, { "epoch": 0.51, "learning_rate": 0.00022347857516280808, "loss": 0.0549, "step": 79040 }, { "epoch": 0.51, "learning_rate": 0.00022346889380845116, "loss": 0.0607, "step": 79050 }, { "epoch": 0.51, "learning_rate": 0.00022345921245409424, "loss": 0.0474, "step": 79060 }, { "epoch": 0.51, "learning_rate": 0.0002234495310997373, "loss": 0.053, "step": 79070 }, { "epoch": 0.51, "learning_rate": 0.00022343984974538037, "loss": 0.0514, "step": 79080 }, { "epoch": 0.51, "learning_rate": 0.00022343016839102345, "loss": 0.1657, "step": 79090 }, { "epoch": 0.51, "learning_rate": 0.00022342048703666648, "loss": 0.057, "step": 79100 }, { "epoch": 0.51, "learning_rate": 0.00022341080568230955, "loss": 0.053, "step": 79110 }, { "epoch": 0.51, "learning_rate": 0.00022340112432795263, "loss": 0.0523, "step": 79120 }, { "epoch": 0.51, "learning_rate": 0.00022339144297359571, "loss": 0.0527, "step": 79130 }, { "epoch": 0.51, "learning_rate": 0.00022338176161923877, "loss": 0.0567, "step": 79140 }, { "epoch": 0.51, "learning_rate": 0.00022337208026488185, "loss": 0.0542, "step": 79150 }, { "epoch": 0.51, "learning_rate": 0.00022336239891052493, "loss": 0.0516, "step": 79160 }, { "epoch": 0.51, "learning_rate": 0.00022335271755616795, "loss": 0.0525, "step": 79170 }, { "epoch": 0.51, "learning_rate": 0.00022334303620181103, "loss": 0.0508, "step": 79180 }, { "epoch": 0.51, "learning_rate": 0.0002233333548474541, "loss": 0.0457, "step": 79190 }, { "epoch": 0.51, "learning_rate": 0.00022332367349309716, "loss": 0.0472, "step": 79200 }, { "epoch": 0.51, "learning_rate": 0.00022331399213874024, "loss": 0.0512, "step": 79210 }, { "epoch": 0.51, "learning_rate": 0.00022330431078438332, "loss": 0.0524, "step": 79220 }, { "epoch": 0.51, "learning_rate": 0.00022329462943002635, "loss": 0.0473, "step": 79230 }, { "epoch": 0.51, "learning_rate": 0.00022328494807566943, "loss": 0.049, "step": 79240 }, { "epoch": 0.51, "learning_rate": 0.0002232752667213125, "loss": 0.0519, "step": 79250 }, { "epoch": 0.51, "learning_rate": 0.0002232655853669556, "loss": 0.0474, "step": 79260 }, { "epoch": 0.51, "learning_rate": 0.00022325590401259864, "loss": 0.0595, "step": 79270 }, { "epoch": 0.51, "learning_rate": 0.00022324622265824172, "loss": 0.05, "step": 79280 }, { "epoch": 0.51, "learning_rate": 0.0002232365413038848, "loss": 0.048, "step": 79290 }, { "epoch": 0.51, "learning_rate": 0.00022322685994952783, "loss": 0.0495, "step": 79300 }, { "epoch": 0.51, "learning_rate": 0.0002232171785951709, "loss": 0.0582, "step": 79310 }, { "epoch": 0.51, "learning_rate": 0.000223207497240814, "loss": 0.0521, "step": 79320 }, { "epoch": 0.51, "learning_rate": 0.00022319781588645707, "loss": 0.056, "step": 79330 }, { "epoch": 0.51, "learning_rate": 0.00022318813453210012, "loss": 0.0556, "step": 79340 }, { "epoch": 0.51, "learning_rate": 0.0002231784531777432, "loss": 0.0479, "step": 79350 }, { "epoch": 0.51, "learning_rate": 0.00022316877182338628, "loss": 0.0537, "step": 79360 }, { "epoch": 0.51, "learning_rate": 0.0002231590904690293, "loss": 0.0522, "step": 79370 }, { "epoch": 0.51, "learning_rate": 0.00022314940911467238, "loss": 0.0516, "step": 79380 }, { "epoch": 0.51, "learning_rate": 0.00022313972776031546, "loss": 0.0595, "step": 79390 }, { "epoch": 0.51, "learning_rate": 0.00022313004640595852, "loss": 0.059, "step": 79400 }, { "epoch": 0.51, "learning_rate": 0.0002231203650516016, "loss": 0.0542, "step": 79410 }, { "epoch": 0.51, "learning_rate": 0.00022311068369724468, "loss": 0.0505, "step": 79420 }, { "epoch": 0.51, "learning_rate": 0.00022310100234288776, "loss": 0.0521, "step": 79430 }, { "epoch": 0.51, "learning_rate": 0.00022309132098853078, "loss": 0.0479, "step": 79440 }, { "epoch": 0.51, "learning_rate": 0.00022308163963417386, "loss": 0.0508, "step": 79450 }, { "epoch": 0.51, "learning_rate": 0.00022307195827981694, "loss": 0.0486, "step": 79460 }, { "epoch": 0.51, "learning_rate": 0.00022306227692546, "loss": 0.052, "step": 79470 }, { "epoch": 0.51, "learning_rate": 0.00022305259557110307, "loss": 0.0506, "step": 79480 }, { "epoch": 0.51, "learning_rate": 0.00022304291421674615, "loss": 0.0499, "step": 79490 }, { "epoch": 0.51, "learning_rate": 0.00022303323286238923, "loss": 0.0534, "step": 79500 }, { "epoch": 0.51, "learning_rate": 0.00022302355150803226, "loss": 0.0503, "step": 79510 }, { "epoch": 0.51, "learning_rate": 0.00022301387015367534, "loss": 0.0561, "step": 79520 }, { "epoch": 0.51, "learning_rate": 0.00022300418879931842, "loss": 0.0486, "step": 79530 }, { "epoch": 0.51, "learning_rate": 0.00022299450744496147, "loss": 0.0559, "step": 79540 }, { "epoch": 0.51, "learning_rate": 0.00022298482609060455, "loss": 0.0552, "step": 79550 }, { "epoch": 0.51, "learning_rate": 0.00022297514473624763, "loss": 0.0468, "step": 79560 }, { "epoch": 0.51, "learning_rate": 0.00022296546338189068, "loss": 0.0506, "step": 79570 }, { "epoch": 0.51, "learning_rate": 0.00022295578202753374, "loss": 0.0518, "step": 79580 }, { "epoch": 0.51, "learning_rate": 0.00022294610067317682, "loss": 0.0503, "step": 79590 }, { "epoch": 0.51, "learning_rate": 0.00022293641931881987, "loss": 0.0578, "step": 79600 }, { "epoch": 0.51, "learning_rate": 0.00022292673796446295, "loss": 0.0491, "step": 79610 }, { "epoch": 0.51, "learning_rate": 0.00022291705661010603, "loss": 0.0516, "step": 79620 }, { "epoch": 0.51, "learning_rate": 0.0002229073752557491, "loss": 0.0509, "step": 79630 }, { "epoch": 0.51, "learning_rate": 0.00022289769390139216, "loss": 0.0616, "step": 79640 }, { "epoch": 0.51, "learning_rate": 0.0002228880125470352, "loss": 0.0529, "step": 79650 }, { "epoch": 0.51, "learning_rate": 0.0002228783311926783, "loss": 0.0625, "step": 79660 }, { "epoch": 0.51, "learning_rate": 0.00022286864983832135, "loss": 0.069, "step": 79670 }, { "epoch": 0.51, "learning_rate": 0.00022285896848396443, "loss": 0.0505, "step": 79680 }, { "epoch": 0.51, "learning_rate": 0.0002228492871296075, "loss": 0.0499, "step": 79690 }, { "epoch": 0.51, "learning_rate": 0.00022283960577525058, "loss": 0.0488, "step": 79700 }, { "epoch": 0.51, "learning_rate": 0.00022282992442089364, "loss": 0.0491, "step": 79710 }, { "epoch": 0.51, "learning_rate": 0.0002228202430665367, "loss": 0.0606, "step": 79720 }, { "epoch": 0.51, "learning_rate": 0.00022281056171217977, "loss": 0.0573, "step": 79730 }, { "epoch": 0.51, "learning_rate": 0.00022280088035782282, "loss": 0.05, "step": 79740 }, { "epoch": 0.51, "learning_rate": 0.0002227911990034659, "loss": 0.0645, "step": 79750 }, { "epoch": 0.51, "learning_rate": 0.00022278151764910898, "loss": 0.0572, "step": 79760 }, { "epoch": 0.51, "learning_rate": 0.00022277183629475204, "loss": 0.052, "step": 79770 }, { "epoch": 0.51, "learning_rate": 0.00022276215494039511, "loss": 0.0524, "step": 79780 }, { "epoch": 0.51, "learning_rate": 0.00022275247358603817, "loss": 0.0589, "step": 79790 }, { "epoch": 0.52, "learning_rate": 0.00022274279223168122, "loss": 0.0538, "step": 79800 }, { "epoch": 0.52, "learning_rate": 0.0002227331108773243, "loss": 0.0531, "step": 79810 }, { "epoch": 0.52, "learning_rate": 0.00022272342952296738, "loss": 0.0549, "step": 79820 }, { "epoch": 0.52, "learning_rate": 0.00022271374816861046, "loss": 0.0565, "step": 79830 }, { "epoch": 0.52, "learning_rate": 0.0002227040668142535, "loss": 0.057, "step": 79840 }, { "epoch": 0.52, "learning_rate": 0.0002226943854598966, "loss": 0.0609, "step": 79850 }, { "epoch": 0.52, "learning_rate": 0.00022268470410553964, "loss": 0.0578, "step": 79860 }, { "epoch": 0.52, "learning_rate": 0.0002226750227511827, "loss": 0.0512, "step": 79870 }, { "epoch": 0.52, "learning_rate": 0.00022266534139682578, "loss": 0.0577, "step": 79880 }, { "epoch": 0.52, "learning_rate": 0.00022265566004246886, "loss": 0.0538, "step": 79890 }, { "epoch": 0.52, "learning_rate": 0.00022264597868811194, "loss": 0.062, "step": 79900 }, { "epoch": 0.52, "learning_rate": 0.000222636297333755, "loss": 0.0553, "step": 79910 }, { "epoch": 0.52, "learning_rate": 0.00022262661597939807, "loss": 0.0476, "step": 79920 }, { "epoch": 0.52, "learning_rate": 0.00022261693462504112, "loss": 0.054, "step": 79930 }, { "epoch": 0.52, "learning_rate": 0.00022260725327068417, "loss": 0.0524, "step": 79940 }, { "epoch": 0.52, "learning_rate": 0.00022259757191632725, "loss": 0.0543, "step": 79950 }, { "epoch": 0.52, "learning_rate": 0.00022258789056197033, "loss": 0.0609, "step": 79960 }, { "epoch": 0.52, "learning_rate": 0.0002225782092076134, "loss": 0.0496, "step": 79970 }, { "epoch": 0.52, "learning_rate": 0.00022256852785325647, "loss": 0.0477, "step": 79980 }, { "epoch": 0.52, "learning_rate": 0.00022255884649889955, "loss": 0.0562, "step": 79990 }, { "epoch": 0.52, "learning_rate": 0.00022254916514454257, "loss": 0.0536, "step": 80000 }, { "epoch": 0.52, "eval_cer": 0.9199647497457915, "eval_loss": 0.03456534445285797, "eval_runtime": 119.9236, "eval_samples_per_second": 16.677, "eval_steps_per_second": 4.169, "step": 80000 }, { "epoch": 0.52, "learning_rate": 0.00022253948379018565, "loss": 0.0641, "step": 80010 }, { "epoch": 0.52, "learning_rate": 0.00022252980243582873, "loss": 0.0488, "step": 80020 }, { "epoch": 0.52, "learning_rate": 0.0002225201210814718, "loss": 0.0487, "step": 80030 }, { "epoch": 0.52, "learning_rate": 0.00022251043972711486, "loss": 0.0517, "step": 80040 }, { "epoch": 0.52, "learning_rate": 0.00022250075837275794, "loss": 0.0533, "step": 80050 }, { "epoch": 0.52, "learning_rate": 0.00022249107701840102, "loss": 0.0528, "step": 80060 }, { "epoch": 0.52, "learning_rate": 0.00022248139566404405, "loss": 0.0473, "step": 80070 }, { "epoch": 0.52, "learning_rate": 0.00022247171430968713, "loss": 0.0528, "step": 80080 }, { "epoch": 0.52, "learning_rate": 0.0002224620329553302, "loss": 0.056, "step": 80090 }, { "epoch": 0.52, "learning_rate": 0.0002224523516009733, "loss": 0.0533, "step": 80100 }, { "epoch": 0.52, "learning_rate": 0.00022244267024661634, "loss": 0.0593, "step": 80110 }, { "epoch": 0.52, "learning_rate": 0.00022243298889225942, "loss": 0.0605, "step": 80120 }, { "epoch": 0.52, "learning_rate": 0.0002224233075379025, "loss": 0.0491, "step": 80130 }, { "epoch": 0.52, "learning_rate": 0.00022241362618354553, "loss": 0.051, "step": 80140 }, { "epoch": 0.52, "learning_rate": 0.0002224039448291886, "loss": 0.0529, "step": 80150 }, { "epoch": 0.52, "learning_rate": 0.00022239426347483169, "loss": 0.0556, "step": 80160 }, { "epoch": 0.52, "learning_rate": 0.00022238458212047477, "loss": 0.0517, "step": 80170 }, { "epoch": 0.52, "learning_rate": 0.00022237490076611782, "loss": 0.0646, "step": 80180 }, { "epoch": 0.52, "learning_rate": 0.0002223652194117609, "loss": 0.0545, "step": 80190 }, { "epoch": 0.52, "learning_rate": 0.00022235553805740398, "loss": 0.0488, "step": 80200 }, { "epoch": 0.52, "learning_rate": 0.000222345856703047, "loss": 0.0525, "step": 80210 }, { "epoch": 0.52, "learning_rate": 0.00022233617534869008, "loss": 0.0567, "step": 80220 }, { "epoch": 0.52, "learning_rate": 0.00022232649399433316, "loss": 0.0448, "step": 80230 }, { "epoch": 0.52, "learning_rate": 0.00022231681263997622, "loss": 0.0492, "step": 80240 }, { "epoch": 0.52, "learning_rate": 0.0002223071312856193, "loss": 0.051, "step": 80250 }, { "epoch": 0.52, "learning_rate": 0.00022229744993126238, "loss": 0.0451, "step": 80260 }, { "epoch": 0.52, "learning_rate": 0.00022228776857690546, "loss": 0.0485, "step": 80270 }, { "epoch": 0.52, "learning_rate": 0.00022227808722254848, "loss": 0.0519, "step": 80280 }, { "epoch": 0.52, "learning_rate": 0.00022226840586819156, "loss": 0.0552, "step": 80290 }, { "epoch": 0.52, "learning_rate": 0.00022225872451383464, "loss": 0.0598, "step": 80300 }, { "epoch": 0.52, "learning_rate": 0.0002222490431594777, "loss": 0.0481, "step": 80310 }, { "epoch": 0.52, "learning_rate": 0.00022223936180512077, "loss": 0.0521, "step": 80320 }, { "epoch": 0.52, "learning_rate": 0.00022222968045076385, "loss": 0.0528, "step": 80330 }, { "epoch": 0.52, "learning_rate": 0.00022221999909640693, "loss": 0.0475, "step": 80340 }, { "epoch": 0.52, "learning_rate": 0.00022221031774204996, "loss": 0.0544, "step": 80350 }, { "epoch": 0.52, "learning_rate": 0.00022220063638769304, "loss": 0.061, "step": 80360 }, { "epoch": 0.52, "learning_rate": 0.00022219095503333612, "loss": 0.054, "step": 80370 }, { "epoch": 0.52, "learning_rate": 0.00022218127367897917, "loss": 0.0535, "step": 80380 }, { "epoch": 0.52, "learning_rate": 0.00022217159232462225, "loss": 0.0536, "step": 80390 }, { "epoch": 0.52, "learning_rate": 0.00022216191097026533, "loss": 0.05, "step": 80400 }, { "epoch": 0.52, "learning_rate": 0.00022215222961590838, "loss": 0.0475, "step": 80410 }, { "epoch": 0.52, "learning_rate": 0.00022214254826155144, "loss": 0.0543, "step": 80420 }, { "epoch": 0.52, "learning_rate": 0.00022213286690719452, "loss": 0.0506, "step": 80430 }, { "epoch": 0.52, "learning_rate": 0.00022212318555283757, "loss": 0.0489, "step": 80440 }, { "epoch": 0.52, "learning_rate": 0.00022211350419848065, "loss": 0.0594, "step": 80450 }, { "epoch": 0.52, "learning_rate": 0.00022210382284412373, "loss": 0.0516, "step": 80460 }, { "epoch": 0.52, "learning_rate": 0.0002220941414897668, "loss": 0.0513, "step": 80470 }, { "epoch": 0.52, "learning_rate": 0.00022208446013540986, "loss": 0.0563, "step": 80480 }, { "epoch": 0.52, "learning_rate": 0.0002220747787810529, "loss": 0.0568, "step": 80490 }, { "epoch": 0.52, "learning_rate": 0.000222065097426696, "loss": 0.0532, "step": 80500 }, { "epoch": 0.52, "learning_rate": 0.00022205541607233905, "loss": 0.0533, "step": 80510 }, { "epoch": 0.52, "learning_rate": 0.00022204573471798212, "loss": 0.064, "step": 80520 }, { "epoch": 0.52, "learning_rate": 0.0002220360533636252, "loss": 0.0501, "step": 80530 }, { "epoch": 0.52, "learning_rate": 0.00022202637200926828, "loss": 0.0591, "step": 80540 }, { "epoch": 0.52, "learning_rate": 0.00022201669065491134, "loss": 0.0454, "step": 80550 }, { "epoch": 0.52, "learning_rate": 0.0002220070093005544, "loss": 0.0514, "step": 80560 }, { "epoch": 0.52, "learning_rate": 0.00022199732794619747, "loss": 0.0493, "step": 80570 }, { "epoch": 0.52, "learning_rate": 0.00022198764659184052, "loss": 0.0481, "step": 80580 }, { "epoch": 0.52, "learning_rate": 0.0002219779652374836, "loss": 0.0474, "step": 80590 }, { "epoch": 0.52, "learning_rate": 0.00022196828388312668, "loss": 0.05, "step": 80600 }, { "epoch": 0.52, "learning_rate": 0.00022195860252876973, "loss": 0.0455, "step": 80610 }, { "epoch": 0.52, "learning_rate": 0.00022194892117441281, "loss": 0.0493, "step": 80620 }, { "epoch": 0.52, "learning_rate": 0.00022193923982005587, "loss": 0.0513, "step": 80630 }, { "epoch": 0.52, "learning_rate": 0.00022192955846569892, "loss": 0.0448, "step": 80640 }, { "epoch": 0.52, "learning_rate": 0.000221919877111342, "loss": 0.0461, "step": 80650 }, { "epoch": 0.52, "learning_rate": 0.00022191019575698508, "loss": 0.05, "step": 80660 }, { "epoch": 0.52, "learning_rate": 0.00022190051440262816, "loss": 0.0514, "step": 80670 }, { "epoch": 0.52, "learning_rate": 0.0002218908330482712, "loss": 0.0515, "step": 80680 }, { "epoch": 0.52, "learning_rate": 0.0002218811516939143, "loss": 0.0485, "step": 80690 }, { "epoch": 0.52, "learning_rate": 0.00022187147033955734, "loss": 0.049, "step": 80700 }, { "epoch": 0.52, "learning_rate": 0.0002218617889852004, "loss": 0.0489, "step": 80710 }, { "epoch": 0.52, "learning_rate": 0.00022185210763084348, "loss": 0.0537, "step": 80720 }, { "epoch": 0.52, "learning_rate": 0.00022184242627648656, "loss": 0.0529, "step": 80730 }, { "epoch": 0.52, "learning_rate": 0.00022183274492212964, "loss": 0.0562, "step": 80740 }, { "epoch": 0.52, "learning_rate": 0.0002218230635677727, "loss": 0.05, "step": 80750 }, { "epoch": 0.52, "learning_rate": 0.00022181338221341577, "loss": 0.0521, "step": 80760 }, { "epoch": 0.52, "learning_rate": 0.00022180370085905882, "loss": 0.0473, "step": 80770 }, { "epoch": 0.52, "learning_rate": 0.00022179401950470187, "loss": 0.0475, "step": 80780 }, { "epoch": 0.52, "learning_rate": 0.00022178433815034495, "loss": 0.0504, "step": 80790 }, { "epoch": 0.52, "learning_rate": 0.00022177465679598803, "loss": 0.0516, "step": 80800 }, { "epoch": 0.52, "learning_rate": 0.0002217649754416311, "loss": 0.0519, "step": 80810 }, { "epoch": 0.52, "learning_rate": 0.00022175529408727417, "loss": 0.0618, "step": 80820 }, { "epoch": 0.52, "learning_rate": 0.00022174561273291725, "loss": 0.0492, "step": 80830 }, { "epoch": 0.52, "learning_rate": 0.00022173593137856027, "loss": 0.0557, "step": 80840 }, { "epoch": 0.52, "learning_rate": 0.00022172625002420335, "loss": 0.0457, "step": 80850 }, { "epoch": 0.52, "learning_rate": 0.00022171656866984643, "loss": 0.0432, "step": 80860 }, { "epoch": 0.52, "learning_rate": 0.0002217068873154895, "loss": 0.0525, "step": 80870 }, { "epoch": 0.52, "learning_rate": 0.00022169720596113256, "loss": 0.0435, "step": 80880 }, { "epoch": 0.52, "learning_rate": 0.00022168752460677564, "loss": 0.0463, "step": 80890 }, { "epoch": 0.52, "learning_rate": 0.00022167784325241872, "loss": 0.0485, "step": 80900 }, { "epoch": 0.52, "learning_rate": 0.00022166816189806175, "loss": 0.0481, "step": 80910 }, { "epoch": 0.52, "learning_rate": 0.00022165848054370483, "loss": 0.0508, "step": 80920 }, { "epoch": 0.52, "learning_rate": 0.0002216487991893479, "loss": 0.0629, "step": 80930 }, { "epoch": 0.52, "learning_rate": 0.000221639117834991, "loss": 0.049, "step": 80940 }, { "epoch": 0.52, "learning_rate": 0.00022162943648063404, "loss": 0.0491, "step": 80950 }, { "epoch": 0.52, "learning_rate": 0.00022161975512627712, "loss": 0.0483, "step": 80960 }, { "epoch": 0.52, "learning_rate": 0.0002216100737719202, "loss": 0.0541, "step": 80970 }, { "epoch": 0.52, "learning_rate": 0.00022160039241756323, "loss": 0.0552, "step": 80980 }, { "epoch": 0.52, "learning_rate": 0.0002215907110632063, "loss": 0.0471, "step": 80990 }, { "epoch": 0.52, "learning_rate": 0.00022158102970884939, "loss": 0.0568, "step": 81000 }, { "epoch": 0.52, "eval_cer": 0.9199439611343351, "eval_loss": 0.0355331152677536, "eval_runtime": 120.0549, "eval_samples_per_second": 16.659, "eval_steps_per_second": 4.165, "step": 81000 }, { "epoch": 0.52, "learning_rate": 0.00022157134835449244, "loss": 0.0538, "step": 81010 }, { "epoch": 0.52, "learning_rate": 0.00022156166700013552, "loss": 0.0606, "step": 81020 }, { "epoch": 0.52, "learning_rate": 0.0002215519856457786, "loss": 0.0529, "step": 81030 }, { "epoch": 0.52, "learning_rate": 0.00022154230429142168, "loss": 0.0556, "step": 81040 }, { "epoch": 0.52, "learning_rate": 0.0002215326229370647, "loss": 0.0502, "step": 81050 }, { "epoch": 0.52, "learning_rate": 0.00022152294158270778, "loss": 0.0505, "step": 81060 }, { "epoch": 0.52, "learning_rate": 0.00022151326022835086, "loss": 0.053, "step": 81070 }, { "epoch": 0.52, "learning_rate": 0.00022150357887399392, "loss": 0.0491, "step": 81080 }, { "epoch": 0.52, "learning_rate": 0.000221493897519637, "loss": 0.0528, "step": 81090 }, { "epoch": 0.52, "learning_rate": 0.00022148421616528008, "loss": 0.0614, "step": 81100 }, { "epoch": 0.52, "learning_rate": 0.00022147453481092316, "loss": 0.0537, "step": 81110 }, { "epoch": 0.52, "learning_rate": 0.00022146485345656618, "loss": 0.0541, "step": 81120 }, { "epoch": 0.52, "learning_rate": 0.00022145517210220926, "loss": 0.0515, "step": 81130 }, { "epoch": 0.52, "learning_rate": 0.00022144549074785234, "loss": 0.051, "step": 81140 }, { "epoch": 0.52, "learning_rate": 0.0002214358093934954, "loss": 0.0531, "step": 81150 }, { "epoch": 0.52, "learning_rate": 0.00022142612803913847, "loss": 0.0615, "step": 81160 }, { "epoch": 0.52, "learning_rate": 0.00022141644668478155, "loss": 0.053, "step": 81170 }, { "epoch": 0.52, "learning_rate": 0.0002214067653304246, "loss": 0.0436, "step": 81180 }, { "epoch": 0.52, "learning_rate": 0.00022139708397606766, "loss": 0.0557, "step": 81190 }, { "epoch": 0.52, "learning_rate": 0.00022138740262171074, "loss": 0.0536, "step": 81200 }, { "epoch": 0.52, "learning_rate": 0.0002213777212673538, "loss": 0.0523, "step": 81210 }, { "epoch": 0.52, "learning_rate": 0.00022136803991299687, "loss": 0.0515, "step": 81220 }, { "epoch": 0.52, "learning_rate": 0.00022135835855863995, "loss": 0.0515, "step": 81230 }, { "epoch": 0.52, "learning_rate": 0.00022134867720428303, "loss": 0.0524, "step": 81240 }, { "epoch": 0.52, "learning_rate": 0.00022133899584992608, "loss": 0.0498, "step": 81250 }, { "epoch": 0.52, "learning_rate": 0.00022132931449556914, "loss": 0.0462, "step": 81260 }, { "epoch": 0.52, "learning_rate": 0.00022131963314121221, "loss": 0.0487, "step": 81270 }, { "epoch": 0.52, "learning_rate": 0.00022130995178685527, "loss": 0.0525, "step": 81280 }, { "epoch": 0.52, "learning_rate": 0.00022130027043249835, "loss": 0.0481, "step": 81290 }, { "epoch": 0.52, "learning_rate": 0.00022129058907814143, "loss": 0.0568, "step": 81300 }, { "epoch": 0.52, "learning_rate": 0.0002212809077237845, "loss": 0.0516, "step": 81310 }, { "epoch": 0.52, "learning_rate": 0.00022127122636942756, "loss": 0.0519, "step": 81320 }, { "epoch": 0.52, "learning_rate": 0.0002212615450150706, "loss": 0.0561, "step": 81330 }, { "epoch": 0.52, "learning_rate": 0.0002212518636607137, "loss": 0.0487, "step": 81340 }, { "epoch": 0.53, "learning_rate": 0.00022124218230635674, "loss": 0.0579, "step": 81350 }, { "epoch": 0.53, "learning_rate": 0.00022123250095199982, "loss": 0.0523, "step": 81360 }, { "epoch": 0.53, "learning_rate": 0.0002212228195976429, "loss": 0.0571, "step": 81370 }, { "epoch": 0.53, "learning_rate": 0.00022121313824328596, "loss": 0.0454, "step": 81380 }, { "epoch": 0.53, "learning_rate": 0.00022120345688892904, "loss": 0.0458, "step": 81390 }, { "epoch": 0.53, "learning_rate": 0.0002211937755345721, "loss": 0.0607, "step": 81400 }, { "epoch": 0.53, "learning_rate": 0.00022118409418021514, "loss": 0.0487, "step": 81410 }, { "epoch": 0.53, "learning_rate": 0.00022117441282585822, "loss": 0.0519, "step": 81420 }, { "epoch": 0.53, "learning_rate": 0.0002211647314715013, "loss": 0.0634, "step": 81430 }, { "epoch": 0.53, "learning_rate": 0.00022115505011714438, "loss": 0.0475, "step": 81440 }, { "epoch": 0.53, "learning_rate": 0.00022114536876278743, "loss": 0.0577, "step": 81450 }, { "epoch": 0.53, "learning_rate": 0.00022113568740843051, "loss": 0.0516, "step": 81460 }, { "epoch": 0.53, "learning_rate": 0.00022112600605407357, "loss": 0.0603, "step": 81470 }, { "epoch": 0.53, "learning_rate": 0.00022111632469971662, "loss": 0.0465, "step": 81480 }, { "epoch": 0.53, "learning_rate": 0.0002211066433453597, "loss": 0.0478, "step": 81490 }, { "epoch": 0.53, "learning_rate": 0.00022109696199100278, "loss": 0.0497, "step": 81500 }, { "epoch": 0.53, "learning_rate": 0.00022108728063664586, "loss": 0.0535, "step": 81510 }, { "epoch": 0.53, "learning_rate": 0.0002210775992822889, "loss": 0.0523, "step": 81520 }, { "epoch": 0.53, "learning_rate": 0.000221067917927932, "loss": 0.0639, "step": 81530 }, { "epoch": 0.53, "learning_rate": 0.00022105823657357504, "loss": 0.0515, "step": 81540 }, { "epoch": 0.53, "learning_rate": 0.0002210485552192181, "loss": 0.0516, "step": 81550 }, { "epoch": 0.53, "learning_rate": 0.00022103887386486118, "loss": 0.0494, "step": 81560 }, { "epoch": 0.53, "learning_rate": 0.00022102919251050426, "loss": 0.0496, "step": 81570 }, { "epoch": 0.53, "learning_rate": 0.0002210195111561473, "loss": 0.0542, "step": 81580 }, { "epoch": 0.53, "learning_rate": 0.0002210098298017904, "loss": 0.0542, "step": 81590 }, { "epoch": 0.53, "learning_rate": 0.00022100014844743347, "loss": 0.0519, "step": 81600 }, { "epoch": 0.53, "learning_rate": 0.0002209904670930765, "loss": 0.0476, "step": 81610 }, { "epoch": 0.53, "learning_rate": 0.00022098078573871957, "loss": 0.0527, "step": 81620 }, { "epoch": 0.53, "learning_rate": 0.00022097110438436265, "loss": 0.0481, "step": 81630 }, { "epoch": 0.53, "learning_rate": 0.00022096142303000573, "loss": 0.0486, "step": 81640 }, { "epoch": 0.53, "learning_rate": 0.00022095174167564879, "loss": 0.0584, "step": 81650 }, { "epoch": 0.53, "learning_rate": 0.00022094206032129187, "loss": 0.0502, "step": 81660 }, { "epoch": 0.53, "learning_rate": 0.00022093237896693495, "loss": 0.0488, "step": 81670 }, { "epoch": 0.53, "learning_rate": 0.00022092269761257797, "loss": 0.0529, "step": 81680 }, { "epoch": 0.53, "learning_rate": 0.00022091301625822105, "loss": 0.0493, "step": 81690 }, { "epoch": 0.53, "learning_rate": 0.00022090333490386413, "loss": 0.0492, "step": 81700 }, { "epoch": 0.53, "learning_rate": 0.0002208936535495072, "loss": 0.0502, "step": 81710 }, { "epoch": 0.53, "learning_rate": 0.00022088397219515026, "loss": 0.0567, "step": 81720 }, { "epoch": 0.53, "learning_rate": 0.00022087429084079334, "loss": 0.0524, "step": 81730 }, { "epoch": 0.53, "learning_rate": 0.00022086460948643642, "loss": 0.054, "step": 81740 }, { "epoch": 0.53, "learning_rate": 0.00022085492813207945, "loss": 0.0536, "step": 81750 }, { "epoch": 0.53, "learning_rate": 0.00022084524677772253, "loss": 0.0531, "step": 81760 }, { "epoch": 0.53, "learning_rate": 0.0002208355654233656, "loss": 0.0686, "step": 81770 }, { "epoch": 0.53, "learning_rate": 0.00022082588406900866, "loss": 0.0572, "step": 81780 }, { "epoch": 0.53, "learning_rate": 0.00022081620271465174, "loss": 0.0511, "step": 81790 }, { "epoch": 0.53, "learning_rate": 0.00022080652136029482, "loss": 0.0511, "step": 81800 }, { "epoch": 0.53, "learning_rate": 0.0002207968400059379, "loss": 0.0528, "step": 81810 }, { "epoch": 0.53, "learning_rate": 0.00022078715865158093, "loss": 0.0476, "step": 81820 }, { "epoch": 0.53, "learning_rate": 0.000220777477297224, "loss": 0.055, "step": 81830 }, { "epoch": 0.53, "learning_rate": 0.00022076779594286709, "loss": 0.0526, "step": 81840 }, { "epoch": 0.53, "learning_rate": 0.00022075811458851014, "loss": 0.048, "step": 81850 }, { "epoch": 0.53, "learning_rate": 0.00022074843323415322, "loss": 0.0499, "step": 81860 }, { "epoch": 0.53, "learning_rate": 0.0002207387518797963, "loss": 0.0472, "step": 81870 }, { "epoch": 0.53, "learning_rate": 0.00022072907052543938, "loss": 0.0528, "step": 81880 }, { "epoch": 0.53, "learning_rate": 0.0002207193891710824, "loss": 0.0472, "step": 81890 }, { "epoch": 0.53, "learning_rate": 0.00022070970781672548, "loss": 0.0523, "step": 81900 }, { "epoch": 0.53, "learning_rate": 0.00022070002646236856, "loss": 0.0604, "step": 81910 }, { "epoch": 0.53, "learning_rate": 0.00022069034510801162, "loss": 0.05, "step": 81920 }, { "epoch": 0.53, "learning_rate": 0.0002206806637536547, "loss": 0.0501, "step": 81930 }, { "epoch": 0.53, "learning_rate": 0.00022067098239929777, "loss": 0.0475, "step": 81940 }, { "epoch": 0.53, "learning_rate": 0.00022066130104494085, "loss": 0.0499, "step": 81950 }, { "epoch": 0.53, "learning_rate": 0.00022065161969058388, "loss": 0.056, "step": 81960 }, { "epoch": 0.53, "learning_rate": 0.00022064193833622696, "loss": 0.0471, "step": 81970 }, { "epoch": 0.53, "learning_rate": 0.00022063225698187, "loss": 0.0555, "step": 81980 }, { "epoch": 0.53, "learning_rate": 0.0002206225756275131, "loss": 0.0568, "step": 81990 }, { "epoch": 0.53, "learning_rate": 0.00022061289427315617, "loss": 0.0486, "step": 82000 }, { "epoch": 0.53, "eval_cer": 0.9199421534289911, "eval_loss": 0.03461761400103569, "eval_runtime": 120.0302, "eval_samples_per_second": 16.662, "eval_steps_per_second": 4.166, "step": 82000 }, { "epoch": 0.53, "learning_rate": 0.00022060321291879925, "loss": 0.0555, "step": 82010 }, { "epoch": 0.53, "learning_rate": 0.0002205935315644423, "loss": 0.0497, "step": 82020 }, { "epoch": 0.53, "learning_rate": 0.00022058385021008536, "loss": 0.0472, "step": 82030 }, { "epoch": 0.53, "learning_rate": 0.00022057416885572844, "loss": 0.0553, "step": 82040 }, { "epoch": 0.53, "learning_rate": 0.0002205644875013715, "loss": 0.062, "step": 82050 }, { "epoch": 0.53, "learning_rate": 0.00022055480614701457, "loss": 0.0539, "step": 82060 }, { "epoch": 0.53, "learning_rate": 0.00022054512479265765, "loss": 0.0505, "step": 82070 }, { "epoch": 0.53, "learning_rate": 0.00022053544343830073, "loss": 0.0493, "step": 82080 }, { "epoch": 0.53, "learning_rate": 0.00022052576208394378, "loss": 0.0463, "step": 82090 }, { "epoch": 0.53, "learning_rate": 0.00022051608072958683, "loss": 0.0541, "step": 82100 }, { "epoch": 0.53, "learning_rate": 0.00022050639937522991, "loss": 0.0531, "step": 82110 }, { "epoch": 0.53, "learning_rate": 0.00022049671802087297, "loss": 0.0475, "step": 82120 }, { "epoch": 0.53, "learning_rate": 0.00022048703666651605, "loss": 0.0541, "step": 82130 }, { "epoch": 0.53, "learning_rate": 0.00022047735531215913, "loss": 0.0505, "step": 82140 }, { "epoch": 0.53, "learning_rate": 0.0002204676739578022, "loss": 0.0497, "step": 82150 }, { "epoch": 0.53, "learning_rate": 0.00022045799260344526, "loss": 0.0507, "step": 82160 }, { "epoch": 0.53, "learning_rate": 0.0002204483112490883, "loss": 0.0551, "step": 82170 }, { "epoch": 0.53, "learning_rate": 0.00022043862989473136, "loss": 0.0481, "step": 82180 }, { "epoch": 0.53, "learning_rate": 0.00022042894854037444, "loss": 0.046, "step": 82190 }, { "epoch": 0.53, "learning_rate": 0.00022041926718601752, "loss": 0.0567, "step": 82200 }, { "epoch": 0.53, "learning_rate": 0.0002204095858316606, "loss": 0.0481, "step": 82210 }, { "epoch": 0.53, "learning_rate": 0.00022039990447730366, "loss": 0.0495, "step": 82220 }, { "epoch": 0.53, "learning_rate": 0.00022039022312294674, "loss": 0.057, "step": 82230 }, { "epoch": 0.53, "learning_rate": 0.0002203805417685898, "loss": 0.051, "step": 82240 }, { "epoch": 0.53, "learning_rate": 0.00022037086041423284, "loss": 0.0546, "step": 82250 }, { "epoch": 0.53, "learning_rate": 0.00022036117905987592, "loss": 0.0457, "step": 82260 }, { "epoch": 0.53, "learning_rate": 0.000220351497705519, "loss": 0.0463, "step": 82270 }, { "epoch": 0.53, "learning_rate": 0.00022034181635116208, "loss": 0.048, "step": 82280 }, { "epoch": 0.53, "learning_rate": 0.00022033213499680513, "loss": 0.0486, "step": 82290 }, { "epoch": 0.53, "learning_rate": 0.00022032245364244821, "loss": 0.0541, "step": 82300 }, { "epoch": 0.53, "learning_rate": 0.00022031277228809127, "loss": 0.0569, "step": 82310 }, { "epoch": 0.53, "learning_rate": 0.00022030309093373432, "loss": 0.0471, "step": 82320 }, { "epoch": 0.53, "learning_rate": 0.0002202934095793774, "loss": 0.0494, "step": 82330 }, { "epoch": 0.53, "learning_rate": 0.00022028372822502048, "loss": 0.0527, "step": 82340 }, { "epoch": 0.53, "learning_rate": 0.00022027404687066356, "loss": 0.0513, "step": 82350 }, { "epoch": 0.53, "learning_rate": 0.0002202643655163066, "loss": 0.0551, "step": 82360 }, { "epoch": 0.53, "learning_rate": 0.0002202546841619497, "loss": 0.045, "step": 82370 }, { "epoch": 0.53, "learning_rate": 0.00022024500280759272, "loss": 0.0513, "step": 82380 }, { "epoch": 0.53, "learning_rate": 0.0002202353214532358, "loss": 0.0455, "step": 82390 }, { "epoch": 0.53, "learning_rate": 0.00022022564009887888, "loss": 0.0472, "step": 82400 }, { "epoch": 0.53, "learning_rate": 0.00022021595874452196, "loss": 0.0485, "step": 82410 }, { "epoch": 0.53, "learning_rate": 0.000220206277390165, "loss": 0.0503, "step": 82420 }, { "epoch": 0.53, "learning_rate": 0.0002201965960358081, "loss": 0.051, "step": 82430 }, { "epoch": 0.53, "learning_rate": 0.00022018691468145117, "loss": 0.0496, "step": 82440 }, { "epoch": 0.53, "learning_rate": 0.0002201772333270942, "loss": 0.0435, "step": 82450 }, { "epoch": 0.53, "learning_rate": 0.00022016755197273727, "loss": 0.0535, "step": 82460 }, { "epoch": 0.53, "learning_rate": 0.00022015787061838035, "loss": 0.0479, "step": 82470 }, { "epoch": 0.53, "learning_rate": 0.00022014818926402343, "loss": 0.0654, "step": 82480 }, { "epoch": 0.53, "learning_rate": 0.00022013850790966649, "loss": 0.0512, "step": 82490 }, { "epoch": 0.53, "learning_rate": 0.00022012882655530957, "loss": 0.0513, "step": 82500 }, { "epoch": 0.53, "learning_rate": 0.00022011914520095265, "loss": 0.046, "step": 82510 }, { "epoch": 0.53, "learning_rate": 0.00022010946384659567, "loss": 0.0514, "step": 82520 }, { "epoch": 0.53, "learning_rate": 0.00022009978249223875, "loss": 0.0524, "step": 82530 }, { "epoch": 0.53, "learning_rate": 0.00022009010113788183, "loss": 0.0562, "step": 82540 }, { "epoch": 0.53, "learning_rate": 0.0002200804197835249, "loss": 0.0465, "step": 82550 }, { "epoch": 0.53, "learning_rate": 0.00022007073842916796, "loss": 0.0454, "step": 82560 }, { "epoch": 0.53, "learning_rate": 0.00022006105707481104, "loss": 0.0541, "step": 82570 }, { "epoch": 0.53, "learning_rate": 0.00022005137572045412, "loss": 0.0517, "step": 82580 }, { "epoch": 0.53, "learning_rate": 0.00022004169436609715, "loss": 0.0503, "step": 82590 }, { "epoch": 0.53, "learning_rate": 0.00022003201301174023, "loss": 0.0578, "step": 82600 }, { "epoch": 0.53, "learning_rate": 0.0002200223316573833, "loss": 0.0613, "step": 82610 }, { "epoch": 0.53, "learning_rate": 0.00022001265030302636, "loss": 0.0479, "step": 82620 }, { "epoch": 0.53, "learning_rate": 0.00022000296894866944, "loss": 0.0515, "step": 82630 }, { "epoch": 0.53, "learning_rate": 0.00021999328759431252, "loss": 0.0479, "step": 82640 }, { "epoch": 0.53, "learning_rate": 0.0002199836062399556, "loss": 0.0486, "step": 82650 }, { "epoch": 0.53, "learning_rate": 0.00021997392488559863, "loss": 0.0481, "step": 82660 }, { "epoch": 0.53, "learning_rate": 0.0002199642435312417, "loss": 0.0601, "step": 82670 }, { "epoch": 0.53, "learning_rate": 0.00021995456217688478, "loss": 0.0491, "step": 82680 }, { "epoch": 0.53, "learning_rate": 0.00021994488082252784, "loss": 0.0525, "step": 82690 }, { "epoch": 0.53, "learning_rate": 0.00021993519946817092, "loss": 0.0461, "step": 82700 }, { "epoch": 0.53, "learning_rate": 0.000219925518113814, "loss": 0.0514, "step": 82710 }, { "epoch": 0.53, "learning_rate": 0.00021991583675945708, "loss": 0.0481, "step": 82720 }, { "epoch": 0.53, "learning_rate": 0.0002199061554051001, "loss": 0.0513, "step": 82730 }, { "epoch": 0.53, "learning_rate": 0.00021989647405074318, "loss": 0.0565, "step": 82740 }, { "epoch": 0.53, "learning_rate": 0.00021988679269638626, "loss": 0.0498, "step": 82750 }, { "epoch": 0.53, "learning_rate": 0.00021987711134202931, "loss": 0.0535, "step": 82760 }, { "epoch": 0.53, "learning_rate": 0.0002198674299876724, "loss": 0.0527, "step": 82770 }, { "epoch": 0.53, "learning_rate": 0.00021985774863331547, "loss": 0.0526, "step": 82780 }, { "epoch": 0.53, "learning_rate": 0.00021984806727895853, "loss": 0.0515, "step": 82790 }, { "epoch": 0.53, "learning_rate": 0.00021983838592460158, "loss": 0.0483, "step": 82800 }, { "epoch": 0.53, "learning_rate": 0.00021982870457024466, "loss": 0.0538, "step": 82810 }, { "epoch": 0.53, "learning_rate": 0.0002198190232158877, "loss": 0.0535, "step": 82820 }, { "epoch": 0.53, "learning_rate": 0.0002198093418615308, "loss": 0.0515, "step": 82830 }, { "epoch": 0.53, "learning_rate": 0.00021979966050717387, "loss": 0.0505, "step": 82840 }, { "epoch": 0.53, "learning_rate": 0.00021978997915281695, "loss": 0.0555, "step": 82850 }, { "epoch": 0.53, "learning_rate": 0.00021978029779846, "loss": 0.0534, "step": 82860 }, { "epoch": 0.53, "learning_rate": 0.00021977061644410306, "loss": 0.0493, "step": 82870 }, { "epoch": 0.53, "learning_rate": 0.00021976093508974614, "loss": 0.0505, "step": 82880 }, { "epoch": 0.53, "learning_rate": 0.0002197512537353892, "loss": 0.0492, "step": 82890 }, { "epoch": 0.54, "learning_rate": 0.00021974157238103227, "loss": 0.049, "step": 82900 }, { "epoch": 0.54, "learning_rate": 0.00021973189102667535, "loss": 0.0492, "step": 82910 }, { "epoch": 0.54, "learning_rate": 0.00021972220967231843, "loss": 0.0491, "step": 82920 }, { "epoch": 0.54, "learning_rate": 0.00021971252831796148, "loss": 0.0528, "step": 82930 }, { "epoch": 0.54, "learning_rate": 0.00021970284696360453, "loss": 0.0541, "step": 82940 }, { "epoch": 0.54, "learning_rate": 0.00021969316560924761, "loss": 0.0519, "step": 82950 }, { "epoch": 0.54, "learning_rate": 0.00021968348425489067, "loss": 0.0515, "step": 82960 }, { "epoch": 0.54, "learning_rate": 0.00021967380290053375, "loss": 0.0549, "step": 82970 }, { "epoch": 0.54, "learning_rate": 0.00021966412154617683, "loss": 0.0527, "step": 82980 }, { "epoch": 0.54, "learning_rate": 0.00021965444019181988, "loss": 0.0502, "step": 82990 }, { "epoch": 0.54, "learning_rate": 0.00021964475883746296, "loss": 0.0571, "step": 83000 }, { "epoch": 0.54, "eval_cer": 0.9200235001694724, "eval_loss": 0.03383234888315201, "eval_runtime": 120.0102, "eval_samples_per_second": 16.665, "eval_steps_per_second": 4.166, "step": 83000 }, { "epoch": 0.54, "learning_rate": 0.000219635077483106, "loss": 0.0469, "step": 83010 }, { "epoch": 0.54, "learning_rate": 0.00021962539612874906, "loss": 0.0574, "step": 83020 }, { "epoch": 0.54, "learning_rate": 0.00021961571477439214, "loss": 0.0527, "step": 83030 }, { "epoch": 0.54, "learning_rate": 0.00021960603342003522, "loss": 0.0436, "step": 83040 }, { "epoch": 0.54, "learning_rate": 0.0002195963520656783, "loss": 0.0538, "step": 83050 }, { "epoch": 0.54, "learning_rate": 0.00021958667071132136, "loss": 0.049, "step": 83060 }, { "epoch": 0.54, "learning_rate": 0.00021957698935696444, "loss": 0.0495, "step": 83070 }, { "epoch": 0.54, "learning_rate": 0.0002195673080026075, "loss": 0.0481, "step": 83080 }, { "epoch": 0.54, "learning_rate": 0.00021955762664825054, "loss": 0.0503, "step": 83090 }, { "epoch": 0.54, "learning_rate": 0.00021954794529389362, "loss": 0.0495, "step": 83100 }, { "epoch": 0.54, "learning_rate": 0.0002195382639395367, "loss": 0.0428, "step": 83110 }, { "epoch": 0.54, "learning_rate": 0.00021952858258517978, "loss": 0.0496, "step": 83120 }, { "epoch": 0.54, "learning_rate": 0.00021951890123082283, "loss": 0.0514, "step": 83130 }, { "epoch": 0.54, "learning_rate": 0.0002195092198764659, "loss": 0.0517, "step": 83140 }, { "epoch": 0.54, "learning_rate": 0.00021949953852210897, "loss": 0.0597, "step": 83150 }, { "epoch": 0.54, "learning_rate": 0.00021948985716775202, "loss": 0.0489, "step": 83160 }, { "epoch": 0.54, "learning_rate": 0.0002194801758133951, "loss": 0.0569, "step": 83170 }, { "epoch": 0.54, "learning_rate": 0.00021947049445903818, "loss": 0.0459, "step": 83180 }, { "epoch": 0.54, "learning_rate": 0.00021946081310468123, "loss": 0.0603, "step": 83190 }, { "epoch": 0.54, "learning_rate": 0.0002194511317503243, "loss": 0.0538, "step": 83200 }, { "epoch": 0.54, "learning_rate": 0.0002194414503959674, "loss": 0.0531, "step": 83210 }, { "epoch": 0.54, "learning_rate": 0.00021943176904161042, "loss": 0.0453, "step": 83220 }, { "epoch": 0.54, "learning_rate": 0.0002194220876872535, "loss": 0.046, "step": 83230 }, { "epoch": 0.54, "learning_rate": 0.00021941240633289658, "loss": 0.0528, "step": 83240 }, { "epoch": 0.54, "learning_rate": 0.00021940272497853966, "loss": 0.0551, "step": 83250 }, { "epoch": 0.54, "learning_rate": 0.0002193930436241827, "loss": 0.0547, "step": 83260 }, { "epoch": 0.54, "learning_rate": 0.0002193833622698258, "loss": 0.0514, "step": 83270 }, { "epoch": 0.54, "learning_rate": 0.00021937368091546887, "loss": 0.0462, "step": 83280 }, { "epoch": 0.54, "learning_rate": 0.0002193639995611119, "loss": 0.0453, "step": 83290 }, { "epoch": 0.54, "learning_rate": 0.00021935431820675497, "loss": 0.0458, "step": 83300 }, { "epoch": 0.54, "learning_rate": 0.00021934463685239805, "loss": 0.0518, "step": 83310 }, { "epoch": 0.54, "learning_rate": 0.00021933495549804113, "loss": 0.0552, "step": 83320 }, { "epoch": 0.54, "learning_rate": 0.00021932527414368419, "loss": 0.0596, "step": 83330 }, { "epoch": 0.54, "learning_rate": 0.00021931559278932727, "loss": 0.0502, "step": 83340 }, { "epoch": 0.54, "learning_rate": 0.00021930591143497034, "loss": 0.0516, "step": 83350 }, { "epoch": 0.54, "learning_rate": 0.00021929623008061337, "loss": 0.0501, "step": 83360 }, { "epoch": 0.54, "learning_rate": 0.00021928654872625645, "loss": 0.0517, "step": 83370 }, { "epoch": 0.54, "learning_rate": 0.00021927686737189953, "loss": 0.0552, "step": 83380 }, { "epoch": 0.54, "learning_rate": 0.00021926718601754258, "loss": 0.0559, "step": 83390 }, { "epoch": 0.54, "learning_rate": 0.00021925750466318566, "loss": 0.0575, "step": 83400 }, { "epoch": 0.54, "learning_rate": 0.00021924782330882874, "loss": 0.0473, "step": 83410 }, { "epoch": 0.54, "learning_rate": 0.00021923814195447182, "loss": 0.0526, "step": 83420 }, { "epoch": 0.54, "learning_rate": 0.00021922846060011485, "loss": 0.0553, "step": 83430 }, { "epoch": 0.54, "learning_rate": 0.00021921877924575793, "loss": 0.0532, "step": 83440 }, { "epoch": 0.54, "learning_rate": 0.000219209097891401, "loss": 0.0499, "step": 83450 }, { "epoch": 0.54, "learning_rate": 0.00021919941653704406, "loss": 0.0603, "step": 83460 }, { "epoch": 0.54, "learning_rate": 0.00021918973518268714, "loss": 0.053, "step": 83470 }, { "epoch": 0.54, "learning_rate": 0.00021918005382833022, "loss": 0.0525, "step": 83480 }, { "epoch": 0.54, "learning_rate": 0.0002191703724739733, "loss": 0.0548, "step": 83490 }, { "epoch": 0.54, "learning_rate": 0.00021916069111961633, "loss": 0.0545, "step": 83500 }, { "epoch": 0.54, "learning_rate": 0.0002191510097652594, "loss": 0.0479, "step": 83510 }, { "epoch": 0.54, "learning_rate": 0.00021914132841090248, "loss": 0.05, "step": 83520 }, { "epoch": 0.54, "learning_rate": 0.00021913164705654554, "loss": 0.0489, "step": 83530 }, { "epoch": 0.54, "learning_rate": 0.00021912196570218862, "loss": 0.0486, "step": 83540 }, { "epoch": 0.54, "learning_rate": 0.0002191122843478317, "loss": 0.048, "step": 83550 }, { "epoch": 0.54, "learning_rate": 0.00021910260299347475, "loss": 0.0514, "step": 83560 }, { "epoch": 0.54, "learning_rate": 0.0002190929216391178, "loss": 0.0538, "step": 83570 }, { "epoch": 0.54, "learning_rate": 0.00021908324028476088, "loss": 0.0485, "step": 83580 }, { "epoch": 0.54, "learning_rate": 0.00021907355893040393, "loss": 0.0593, "step": 83590 }, { "epoch": 0.54, "learning_rate": 0.00021906387757604701, "loss": 0.0515, "step": 83600 }, { "epoch": 0.54, "learning_rate": 0.0002190541962216901, "loss": 0.0563, "step": 83610 }, { "epoch": 0.54, "learning_rate": 0.00021904451486733317, "loss": 0.0499, "step": 83620 }, { "epoch": 0.54, "learning_rate": 0.00021903483351297623, "loss": 0.0497, "step": 83630 }, { "epoch": 0.54, "learning_rate": 0.00021902515215861928, "loss": 0.0542, "step": 83640 }, { "epoch": 0.54, "learning_rate": 0.00021901547080426236, "loss": 0.0476, "step": 83650 }, { "epoch": 0.54, "learning_rate": 0.0002190057894499054, "loss": 0.0495, "step": 83660 }, { "epoch": 0.54, "learning_rate": 0.0002189961080955485, "loss": 0.0506, "step": 83670 }, { "epoch": 0.54, "learning_rate": 0.00021898642674119157, "loss": 0.0467, "step": 83680 }, { "epoch": 0.54, "learning_rate": 0.00021897674538683465, "loss": 0.0505, "step": 83690 }, { "epoch": 0.54, "learning_rate": 0.0002189670640324777, "loss": 0.0426, "step": 83700 }, { "epoch": 0.54, "learning_rate": 0.00021895738267812076, "loss": 0.0519, "step": 83710 }, { "epoch": 0.54, "learning_rate": 0.00021894770132376384, "loss": 0.0476, "step": 83720 }, { "epoch": 0.54, "learning_rate": 0.0002189380199694069, "loss": 0.0551, "step": 83730 }, { "epoch": 0.54, "learning_rate": 0.00021892833861504997, "loss": 0.0504, "step": 83740 }, { "epoch": 0.54, "learning_rate": 0.00021891865726069305, "loss": 0.0487, "step": 83750 }, { "epoch": 0.54, "learning_rate": 0.0002189089759063361, "loss": 0.0481, "step": 83760 }, { "epoch": 0.54, "learning_rate": 0.00021889929455197918, "loss": 0.0518, "step": 83770 }, { "epoch": 0.54, "learning_rate": 0.00021888961319762223, "loss": 0.0488, "step": 83780 }, { "epoch": 0.54, "learning_rate": 0.0002188799318432653, "loss": 0.0567, "step": 83790 }, { "epoch": 0.54, "learning_rate": 0.00021887025048890837, "loss": 0.047, "step": 83800 }, { "epoch": 0.54, "learning_rate": 0.00021886056913455145, "loss": 0.0571, "step": 83810 }, { "epoch": 0.54, "learning_rate": 0.00021885088778019453, "loss": 0.0588, "step": 83820 }, { "epoch": 0.54, "learning_rate": 0.00021884120642583758, "loss": 0.0546, "step": 83830 }, { "epoch": 0.54, "learning_rate": 0.00021883152507148066, "loss": 0.054, "step": 83840 }, { "epoch": 0.54, "learning_rate": 0.0002188218437171237, "loss": 0.052, "step": 83850 }, { "epoch": 0.54, "learning_rate": 0.00021881216236276676, "loss": 0.0539, "step": 83860 }, { "epoch": 0.54, "learning_rate": 0.00021880248100840984, "loss": 0.0576, "step": 83870 }, { "epoch": 0.54, "learning_rate": 0.00021879279965405292, "loss": 0.0533, "step": 83880 }, { "epoch": 0.54, "learning_rate": 0.000218783118299696, "loss": 0.0493, "step": 83890 }, { "epoch": 0.54, "learning_rate": 0.00021877343694533906, "loss": 0.0488, "step": 83900 }, { "epoch": 0.54, "learning_rate": 0.00021876375559098214, "loss": 0.0507, "step": 83910 }, { "epoch": 0.54, "learning_rate": 0.0002187540742366252, "loss": 0.0512, "step": 83920 }, { "epoch": 0.54, "learning_rate": 0.00021874439288226824, "loss": 0.061, "step": 83930 }, { "epoch": 0.54, "learning_rate": 0.00021873471152791132, "loss": 0.0542, "step": 83940 }, { "epoch": 0.54, "learning_rate": 0.0002187250301735544, "loss": 0.0523, "step": 83950 }, { "epoch": 0.54, "learning_rate": 0.00021871534881919745, "loss": 0.0485, "step": 83960 }, { "epoch": 0.54, "learning_rate": 0.00021870566746484053, "loss": 0.0475, "step": 83970 }, { "epoch": 0.54, "learning_rate": 0.0002186959861104836, "loss": 0.0459, "step": 83980 }, { "epoch": 0.54, "learning_rate": 0.00021868630475612664, "loss": 0.0504, "step": 83990 }, { "epoch": 0.54, "learning_rate": 0.00021867662340176972, "loss": 0.0526, "step": 84000 }, { "epoch": 0.54, "eval_cer": 0.9200343464015366, "eval_loss": 0.033935271203517914, "eval_runtime": 120.0158, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 84000 }, { "epoch": 0.54, "learning_rate": 0.0002186669420474128, "loss": 0.0611, "step": 84010 }, { "epoch": 0.54, "learning_rate": 0.00021865726069305588, "loss": 0.0523, "step": 84020 }, { "epoch": 0.54, "learning_rate": 0.00021864757933869893, "loss": 0.047, "step": 84030 }, { "epoch": 0.54, "learning_rate": 0.000218637897984342, "loss": 0.0557, "step": 84040 }, { "epoch": 0.54, "learning_rate": 0.0002186282166299851, "loss": 0.0476, "step": 84050 }, { "epoch": 0.54, "learning_rate": 0.00021861853527562812, "loss": 0.0577, "step": 84060 }, { "epoch": 0.54, "learning_rate": 0.0002186088539212712, "loss": 0.0547, "step": 84070 }, { "epoch": 0.54, "learning_rate": 0.00021859917256691428, "loss": 0.0524, "step": 84080 }, { "epoch": 0.54, "learning_rate": 0.00021858949121255736, "loss": 0.049, "step": 84090 }, { "epoch": 0.54, "learning_rate": 0.0002185798098582004, "loss": 0.0487, "step": 84100 }, { "epoch": 0.54, "learning_rate": 0.0002185701285038435, "loss": 0.0493, "step": 84110 }, { "epoch": 0.54, "learning_rate": 0.00021856044714948657, "loss": 0.0487, "step": 84120 }, { "epoch": 0.54, "learning_rate": 0.0002185507657951296, "loss": 0.0519, "step": 84130 }, { "epoch": 0.54, "learning_rate": 0.00021854108444077267, "loss": 0.0542, "step": 84140 }, { "epoch": 0.54, "learning_rate": 0.00021853140308641575, "loss": 0.048, "step": 84150 }, { "epoch": 0.54, "learning_rate": 0.0002185217217320588, "loss": 0.0484, "step": 84160 }, { "epoch": 0.54, "learning_rate": 0.00021851204037770189, "loss": 0.0466, "step": 84170 }, { "epoch": 0.54, "learning_rate": 0.00021850235902334496, "loss": 0.0492, "step": 84180 }, { "epoch": 0.54, "learning_rate": 0.00021849267766898804, "loss": 0.0482, "step": 84190 }, { "epoch": 0.54, "learning_rate": 0.00021848299631463107, "loss": 0.0551, "step": 84200 }, { "epoch": 0.54, "learning_rate": 0.00021847331496027415, "loss": 0.0535, "step": 84210 }, { "epoch": 0.54, "learning_rate": 0.00021846363360591723, "loss": 0.0534, "step": 84220 }, { "epoch": 0.54, "learning_rate": 0.00021845395225156028, "loss": 0.0467, "step": 84230 }, { "epoch": 0.54, "learning_rate": 0.00021844427089720336, "loss": 0.0582, "step": 84240 }, { "epoch": 0.54, "learning_rate": 0.00021843458954284644, "loss": 0.0562, "step": 84250 }, { "epoch": 0.54, "learning_rate": 0.00021842490818848952, "loss": 0.0523, "step": 84260 }, { "epoch": 0.54, "learning_rate": 0.00021841522683413255, "loss": 0.0611, "step": 84270 }, { "epoch": 0.54, "learning_rate": 0.00021840554547977563, "loss": 0.053, "step": 84280 }, { "epoch": 0.54, "learning_rate": 0.0002183958641254187, "loss": 0.0504, "step": 84290 }, { "epoch": 0.54, "learning_rate": 0.00021838618277106176, "loss": 0.0468, "step": 84300 }, { "epoch": 0.54, "learning_rate": 0.00021837650141670484, "loss": 0.057, "step": 84310 }, { "epoch": 0.54, "learning_rate": 0.00021836682006234792, "loss": 0.0475, "step": 84320 }, { "epoch": 0.54, "learning_rate": 0.000218357138707991, "loss": 0.056, "step": 84330 }, { "epoch": 0.54, "learning_rate": 0.00021834745735363402, "loss": 0.0429, "step": 84340 }, { "epoch": 0.54, "learning_rate": 0.0002183377759992771, "loss": 0.0516, "step": 84350 }, { "epoch": 0.54, "learning_rate": 0.00021832809464492018, "loss": 0.0547, "step": 84360 }, { "epoch": 0.54, "learning_rate": 0.00021831841329056324, "loss": 0.0452, "step": 84370 }, { "epoch": 0.54, "learning_rate": 0.00021830873193620632, "loss": 0.0489, "step": 84380 }, { "epoch": 0.54, "learning_rate": 0.0002182990505818494, "loss": 0.0506, "step": 84390 }, { "epoch": 0.54, "learning_rate": 0.00021828936922749245, "loss": 0.0589, "step": 84400 }, { "epoch": 0.54, "learning_rate": 0.0002182796878731355, "loss": 0.0479, "step": 84410 }, { "epoch": 0.54, "learning_rate": 0.00021827000651877858, "loss": 0.0445, "step": 84420 }, { "epoch": 0.54, "learning_rate": 0.00021826032516442163, "loss": 0.0492, "step": 84430 }, { "epoch": 0.54, "learning_rate": 0.00021825064381006471, "loss": 0.048, "step": 84440 }, { "epoch": 0.55, "learning_rate": 0.0002182409624557078, "loss": 0.0515, "step": 84450 }, { "epoch": 0.55, "learning_rate": 0.00021823128110135087, "loss": 0.0533, "step": 84460 }, { "epoch": 0.55, "learning_rate": 0.00021822159974699393, "loss": 0.05, "step": 84470 }, { "epoch": 0.55, "learning_rate": 0.00021821191839263698, "loss": 0.0503, "step": 84480 }, { "epoch": 0.55, "learning_rate": 0.00021820223703828006, "loss": 0.0515, "step": 84490 }, { "epoch": 0.55, "learning_rate": 0.0002181925556839231, "loss": 0.05, "step": 84500 }, { "epoch": 0.55, "learning_rate": 0.0002181828743295662, "loss": 0.0513, "step": 84510 }, { "epoch": 0.55, "learning_rate": 0.00021817319297520927, "loss": 0.054, "step": 84520 }, { "epoch": 0.55, "learning_rate": 0.00021816351162085235, "loss": 0.0498, "step": 84530 }, { "epoch": 0.55, "learning_rate": 0.0002181538302664954, "loss": 0.0545, "step": 84540 }, { "epoch": 0.55, "learning_rate": 0.00021814414891213846, "loss": 0.048, "step": 84550 }, { "epoch": 0.55, "learning_rate": 0.00021813446755778154, "loss": 0.0543, "step": 84560 }, { "epoch": 0.55, "learning_rate": 0.0002181247862034246, "loss": 0.0533, "step": 84570 }, { "epoch": 0.55, "learning_rate": 0.00021811510484906767, "loss": 0.0518, "step": 84580 }, { "epoch": 0.55, "learning_rate": 0.00021810542349471075, "loss": 0.061, "step": 84590 }, { "epoch": 0.55, "learning_rate": 0.0002180957421403538, "loss": 0.0457, "step": 84600 }, { "epoch": 0.55, "learning_rate": 0.00021808606078599688, "loss": 0.0518, "step": 84610 }, { "epoch": 0.55, "learning_rate": 0.00021807637943163993, "loss": 0.0532, "step": 84620 }, { "epoch": 0.55, "learning_rate": 0.00021806669807728299, "loss": 0.0514, "step": 84630 }, { "epoch": 0.55, "learning_rate": 0.00021805701672292607, "loss": 0.0516, "step": 84640 }, { "epoch": 0.55, "learning_rate": 0.00021804733536856915, "loss": 0.0442, "step": 84650 }, { "epoch": 0.55, "learning_rate": 0.00021803765401421223, "loss": 0.0509, "step": 84660 }, { "epoch": 0.55, "learning_rate": 0.00021802797265985528, "loss": 0.0482, "step": 84670 }, { "epoch": 0.55, "learning_rate": 0.00021801829130549836, "loss": 0.0477, "step": 84680 }, { "epoch": 0.55, "learning_rate": 0.0002180086099511414, "loss": 0.0531, "step": 84690 }, { "epoch": 0.55, "learning_rate": 0.00021799892859678446, "loss": 0.0505, "step": 84700 }, { "epoch": 0.55, "learning_rate": 0.00021798924724242754, "loss": 0.0487, "step": 84710 }, { "epoch": 0.55, "learning_rate": 0.00021797956588807062, "loss": 0.0457, "step": 84720 }, { "epoch": 0.55, "learning_rate": 0.0002179698845337137, "loss": 0.0519, "step": 84730 }, { "epoch": 0.55, "learning_rate": 0.00021796020317935676, "loss": 0.0497, "step": 84740 }, { "epoch": 0.55, "learning_rate": 0.00021795052182499984, "loss": 0.0474, "step": 84750 }, { "epoch": 0.55, "learning_rate": 0.0002179408404706429, "loss": 0.0611, "step": 84760 }, { "epoch": 0.55, "learning_rate": 0.00021793115911628594, "loss": 0.0519, "step": 84770 }, { "epoch": 0.55, "learning_rate": 0.00021792147776192902, "loss": 0.0521, "step": 84780 }, { "epoch": 0.55, "learning_rate": 0.0002179117964075721, "loss": 0.0488, "step": 84790 }, { "epoch": 0.55, "learning_rate": 0.00021790211505321515, "loss": 0.049, "step": 84800 }, { "epoch": 0.55, "learning_rate": 0.00021789243369885823, "loss": 0.0504, "step": 84810 }, { "epoch": 0.55, "learning_rate": 0.0002178827523445013, "loss": 0.0447, "step": 84820 }, { "epoch": 0.55, "learning_rate": 0.00021787307099014434, "loss": 0.0485, "step": 84830 }, { "epoch": 0.55, "learning_rate": 0.00021786338963578742, "loss": 0.0443, "step": 84840 }, { "epoch": 0.55, "learning_rate": 0.0002178537082814305, "loss": 0.0549, "step": 84850 }, { "epoch": 0.55, "learning_rate": 0.00021784402692707358, "loss": 0.0551, "step": 84860 }, { "epoch": 0.55, "learning_rate": 0.00021783434557271663, "loss": 0.0572, "step": 84870 }, { "epoch": 0.55, "learning_rate": 0.0002178246642183597, "loss": 0.045, "step": 84880 }, { "epoch": 0.55, "learning_rate": 0.0002178149828640028, "loss": 0.0578, "step": 84890 }, { "epoch": 0.55, "learning_rate": 0.00021780530150964582, "loss": 0.055, "step": 84900 }, { "epoch": 0.55, "learning_rate": 0.0002177956201552889, "loss": 0.0549, "step": 84910 }, { "epoch": 0.55, "learning_rate": 0.00021778593880093197, "loss": 0.0457, "step": 84920 }, { "epoch": 0.55, "learning_rate": 0.00021777625744657505, "loss": 0.0565, "step": 84930 }, { "epoch": 0.55, "learning_rate": 0.0002177665760922181, "loss": 0.0468, "step": 84940 }, { "epoch": 0.55, "learning_rate": 0.0002177568947378612, "loss": 0.0526, "step": 84950 }, { "epoch": 0.55, "learning_rate": 0.00021774721338350427, "loss": 0.0502, "step": 84960 }, { "epoch": 0.55, "learning_rate": 0.0002177375320291473, "loss": 0.0627, "step": 84970 }, { "epoch": 0.55, "learning_rate": 0.00021772785067479037, "loss": 0.0537, "step": 84980 }, { "epoch": 0.55, "learning_rate": 0.00021771816932043345, "loss": 0.0468, "step": 84990 }, { "epoch": 0.55, "learning_rate": 0.0002177084879660765, "loss": 0.0485, "step": 85000 }, { "epoch": 0.55, "eval_cer": 0.9199746921251836, "eval_loss": 0.033818814903497696, "eval_runtime": 120.0068, "eval_samples_per_second": 16.666, "eval_steps_per_second": 4.166, "step": 85000 }, { "epoch": 0.55, "learning_rate": 0.00021769880661171958, "loss": 0.0553, "step": 85010 }, { "epoch": 0.55, "learning_rate": 0.00021768912525736266, "loss": 0.0487, "step": 85020 }, { "epoch": 0.55, "learning_rate": 0.00021767944390300574, "loss": 0.0495, "step": 85030 }, { "epoch": 0.55, "learning_rate": 0.00021766976254864877, "loss": 0.0514, "step": 85040 }, { "epoch": 0.55, "learning_rate": 0.00021766008119429185, "loss": 0.0576, "step": 85050 }, { "epoch": 0.55, "learning_rate": 0.00021765039983993493, "loss": 0.0525, "step": 85060 }, { "epoch": 0.55, "learning_rate": 0.00021764071848557798, "loss": 0.0502, "step": 85070 }, { "epoch": 0.55, "learning_rate": 0.00021763103713122106, "loss": 0.0519, "step": 85080 }, { "epoch": 0.55, "learning_rate": 0.00021762135577686414, "loss": 0.0524, "step": 85090 }, { "epoch": 0.55, "learning_rate": 0.00021761167442250722, "loss": 0.0583, "step": 85100 }, { "epoch": 0.55, "learning_rate": 0.00021760199306815025, "loss": 0.0433, "step": 85110 }, { "epoch": 0.55, "learning_rate": 0.00021759231171379333, "loss": 0.0537, "step": 85120 }, { "epoch": 0.55, "learning_rate": 0.0002175826303594364, "loss": 0.0552, "step": 85130 }, { "epoch": 0.55, "learning_rate": 0.00021757294900507946, "loss": 0.0569, "step": 85140 }, { "epoch": 0.55, "learning_rate": 0.00021756326765072254, "loss": 0.0494, "step": 85150 }, { "epoch": 0.55, "learning_rate": 0.00021755358629636562, "loss": 0.0748, "step": 85160 }, { "epoch": 0.55, "learning_rate": 0.00021754390494200867, "loss": 0.0764, "step": 85170 }, { "epoch": 0.55, "learning_rate": 0.00021753422358765172, "loss": 0.0512, "step": 85180 }, { "epoch": 0.55, "learning_rate": 0.0002175245422332948, "loss": 0.049, "step": 85190 }, { "epoch": 0.55, "learning_rate": 0.00021751486087893786, "loss": 0.054, "step": 85200 }, { "epoch": 0.55, "learning_rate": 0.00021750517952458094, "loss": 0.0496, "step": 85210 }, { "epoch": 0.55, "learning_rate": 0.00021749549817022402, "loss": 0.0595, "step": 85220 }, { "epoch": 0.55, "learning_rate": 0.0002174858168158671, "loss": 0.0558, "step": 85230 }, { "epoch": 0.55, "learning_rate": 0.00021747613546151015, "loss": 0.0496, "step": 85240 }, { "epoch": 0.55, "learning_rate": 0.0002174664541071532, "loss": 0.0486, "step": 85250 }, { "epoch": 0.55, "learning_rate": 0.00021745677275279628, "loss": 0.0558, "step": 85260 }, { "epoch": 0.55, "learning_rate": 0.00021744709139843933, "loss": 0.0515, "step": 85270 }, { "epoch": 0.55, "learning_rate": 0.00021743741004408241, "loss": 0.053, "step": 85280 }, { "epoch": 0.55, "learning_rate": 0.0002174277286897255, "loss": 0.0518, "step": 85290 }, { "epoch": 0.55, "learning_rate": 0.00021741804733536857, "loss": 0.0567, "step": 85300 }, { "epoch": 0.55, "learning_rate": 0.00021740836598101163, "loss": 0.0505, "step": 85310 }, { "epoch": 0.55, "learning_rate": 0.00021739868462665468, "loss": 0.0476, "step": 85320 }, { "epoch": 0.55, "learning_rate": 0.00021738900327229776, "loss": 0.0489, "step": 85330 }, { "epoch": 0.55, "learning_rate": 0.0002173793219179408, "loss": 0.0532, "step": 85340 }, { "epoch": 0.55, "learning_rate": 0.0002173696405635839, "loss": 0.0627, "step": 85350 }, { "epoch": 0.55, "learning_rate": 0.00021735995920922697, "loss": 0.0552, "step": 85360 }, { "epoch": 0.55, "learning_rate": 0.00021735027785487002, "loss": 0.0488, "step": 85370 }, { "epoch": 0.55, "learning_rate": 0.0002173405965005131, "loss": 0.0508, "step": 85380 }, { "epoch": 0.55, "learning_rate": 0.00021733091514615616, "loss": 0.0501, "step": 85390 }, { "epoch": 0.55, "learning_rate": 0.0002173212337917992, "loss": 0.0459, "step": 85400 }, { "epoch": 0.55, "learning_rate": 0.0002173115524374423, "loss": 0.0444, "step": 85410 }, { "epoch": 0.55, "learning_rate": 0.00021730187108308537, "loss": 0.0494, "step": 85420 }, { "epoch": 0.55, "learning_rate": 0.00021729218972872845, "loss": 0.05, "step": 85430 }, { "epoch": 0.55, "learning_rate": 0.0002172825083743715, "loss": 0.0483, "step": 85440 }, { "epoch": 0.55, "learning_rate": 0.00021727282702001458, "loss": 0.0509, "step": 85450 }, { "epoch": 0.55, "learning_rate": 0.00021726314566565763, "loss": 0.0536, "step": 85460 }, { "epoch": 0.55, "learning_rate": 0.00021725346431130069, "loss": 0.0496, "step": 85470 }, { "epoch": 0.55, "learning_rate": 0.00021724378295694377, "loss": 0.0559, "step": 85480 }, { "epoch": 0.55, "learning_rate": 0.00021723410160258685, "loss": 0.0507, "step": 85490 }, { "epoch": 0.55, "learning_rate": 0.00021722442024822993, "loss": 0.0461, "step": 85500 }, { "epoch": 0.55, "learning_rate": 0.00021721473889387298, "loss": 0.0538, "step": 85510 }, { "epoch": 0.55, "learning_rate": 0.00021720505753951606, "loss": 0.0473, "step": 85520 }, { "epoch": 0.55, "learning_rate": 0.0002171953761851591, "loss": 0.0594, "step": 85530 }, { "epoch": 0.55, "learning_rate": 0.00021718569483080216, "loss": 0.0496, "step": 85540 }, { "epoch": 0.55, "learning_rate": 0.00021717601347644524, "loss": 0.047, "step": 85550 }, { "epoch": 0.55, "learning_rate": 0.00021716633212208832, "loss": 0.0606, "step": 85560 }, { "epoch": 0.55, "learning_rate": 0.00021715665076773138, "loss": 0.0481, "step": 85570 }, { "epoch": 0.55, "learning_rate": 0.00021714696941337446, "loss": 0.0475, "step": 85580 }, { "epoch": 0.55, "learning_rate": 0.00021713728805901753, "loss": 0.0449, "step": 85590 }, { "epoch": 0.55, "learning_rate": 0.00021712760670466056, "loss": 0.0537, "step": 85600 }, { "epoch": 0.55, "learning_rate": 0.00021711792535030364, "loss": 0.0509, "step": 85610 }, { "epoch": 0.55, "learning_rate": 0.00021710824399594672, "loss": 0.0452, "step": 85620 }, { "epoch": 0.55, "learning_rate": 0.0002170985626415898, "loss": 0.0518, "step": 85630 }, { "epoch": 0.55, "learning_rate": 0.00021708888128723285, "loss": 0.047, "step": 85640 }, { "epoch": 0.55, "learning_rate": 0.00021707919993287593, "loss": 0.0594, "step": 85650 }, { "epoch": 0.55, "learning_rate": 0.000217069518578519, "loss": 0.0538, "step": 85660 }, { "epoch": 0.55, "learning_rate": 0.00021705983722416204, "loss": 0.0504, "step": 85670 }, { "epoch": 0.55, "learning_rate": 0.00021705015586980512, "loss": 0.0524, "step": 85680 }, { "epoch": 0.55, "learning_rate": 0.0002170404745154482, "loss": 0.0551, "step": 85690 }, { "epoch": 0.55, "learning_rate": 0.00021703079316109128, "loss": 0.0479, "step": 85700 }, { "epoch": 0.55, "learning_rate": 0.00021702111180673433, "loss": 0.0482, "step": 85710 }, { "epoch": 0.55, "learning_rate": 0.0002170114304523774, "loss": 0.0489, "step": 85720 }, { "epoch": 0.55, "learning_rate": 0.0002170017490980205, "loss": 0.0482, "step": 85730 }, { "epoch": 0.55, "learning_rate": 0.00021699206774366351, "loss": 0.0493, "step": 85740 }, { "epoch": 0.55, "learning_rate": 0.0002169823863893066, "loss": 0.05, "step": 85750 }, { "epoch": 0.55, "learning_rate": 0.00021697270503494967, "loss": 0.0474, "step": 85760 }, { "epoch": 0.55, "learning_rate": 0.00021696302368059273, "loss": 0.0458, "step": 85770 }, { "epoch": 0.55, "learning_rate": 0.0002169533423262358, "loss": 0.052, "step": 85780 }, { "epoch": 0.55, "learning_rate": 0.0002169436609718789, "loss": 0.0481, "step": 85790 }, { "epoch": 0.55, "learning_rate": 0.00021693397961752197, "loss": 0.0524, "step": 85800 }, { "epoch": 0.55, "learning_rate": 0.000216924298263165, "loss": 0.0546, "step": 85810 }, { "epoch": 0.55, "learning_rate": 0.00021691461690880807, "loss": 0.0483, "step": 85820 }, { "epoch": 0.55, "learning_rate": 0.00021690493555445115, "loss": 0.0513, "step": 85830 }, { "epoch": 0.55, "learning_rate": 0.0002168952542000942, "loss": 0.0491, "step": 85840 }, { "epoch": 0.55, "learning_rate": 0.00021688557284573728, "loss": 0.0507, "step": 85850 }, { "epoch": 0.55, "learning_rate": 0.00021687589149138036, "loss": 0.0519, "step": 85860 }, { "epoch": 0.55, "learning_rate": 0.00021686621013702344, "loss": 0.0507, "step": 85870 }, { "epoch": 0.55, "learning_rate": 0.00021685652878266647, "loss": 0.0459, "step": 85880 }, { "epoch": 0.55, "learning_rate": 0.00021684684742830955, "loss": 0.059, "step": 85890 }, { "epoch": 0.55, "learning_rate": 0.00021683716607395263, "loss": 0.0446, "step": 85900 }, { "epoch": 0.55, "learning_rate": 0.00021682748471959568, "loss": 0.0495, "step": 85910 }, { "epoch": 0.55, "learning_rate": 0.00021681780336523876, "loss": 0.0519, "step": 85920 }, { "epoch": 0.55, "learning_rate": 0.00021680812201088184, "loss": 0.0582, "step": 85930 }, { "epoch": 0.55, "learning_rate": 0.00021679844065652492, "loss": 0.0511, "step": 85940 }, { "epoch": 0.55, "learning_rate": 0.00021678875930216795, "loss": 0.0464, "step": 85950 }, { "epoch": 0.55, "learning_rate": 0.00021677907794781103, "loss": 0.048, "step": 85960 }, { "epoch": 0.55, "learning_rate": 0.00021676939659345408, "loss": 0.0539, "step": 85970 }, { "epoch": 0.55, "learning_rate": 0.00021675971523909716, "loss": 0.0509, "step": 85980 }, { "epoch": 0.55, "learning_rate": 0.00021675003388474024, "loss": 0.0466, "step": 85990 }, { "epoch": 0.56, "learning_rate": 0.00021674035253038332, "loss": 0.0489, "step": 86000 }, { "epoch": 0.56, "eval_cer": 0.9199322110495989, "eval_loss": 0.03454515337944031, "eval_runtime": 120.4354, "eval_samples_per_second": 16.606, "eval_steps_per_second": 4.152, "step": 86000 }, { "epoch": 0.56, "learning_rate": 0.00021673067117602637, "loss": 0.0495, "step": 86010 }, { "epoch": 0.56, "learning_rate": 0.00021672098982166942, "loss": 0.0477, "step": 86020 }, { "epoch": 0.56, "learning_rate": 0.0002167113084673125, "loss": 0.0555, "step": 86030 }, { "epoch": 0.56, "learning_rate": 0.00021670162711295556, "loss": 0.0603, "step": 86040 }, { "epoch": 0.56, "learning_rate": 0.00021669194575859864, "loss": 0.049, "step": 86050 }, { "epoch": 0.56, "learning_rate": 0.00021668226440424172, "loss": 0.0533, "step": 86060 }, { "epoch": 0.56, "learning_rate": 0.0002166725830498848, "loss": 0.0547, "step": 86070 }, { "epoch": 0.56, "learning_rate": 0.00021666290169552782, "loss": 0.0583, "step": 86080 }, { "epoch": 0.56, "learning_rate": 0.0002166532203411709, "loss": 0.0493, "step": 86090 }, { "epoch": 0.56, "learning_rate": 0.00021664353898681398, "loss": 0.0558, "step": 86100 }, { "epoch": 0.56, "learning_rate": 0.00021663385763245703, "loss": 0.0515, "step": 86110 }, { "epoch": 0.56, "learning_rate": 0.0002166241762781001, "loss": 0.0532, "step": 86120 }, { "epoch": 0.56, "learning_rate": 0.0002166144949237432, "loss": 0.0486, "step": 86130 }, { "epoch": 0.56, "learning_rate": 0.00021660481356938627, "loss": 0.0521, "step": 86140 }, { "epoch": 0.56, "learning_rate": 0.0002165951322150293, "loss": 0.0427, "step": 86150 }, { "epoch": 0.56, "learning_rate": 0.00021658545086067238, "loss": 0.0454, "step": 86160 }, { "epoch": 0.56, "learning_rate": 0.00021657576950631543, "loss": 0.049, "step": 86170 }, { "epoch": 0.56, "learning_rate": 0.0002165660881519585, "loss": 0.052, "step": 86180 }, { "epoch": 0.56, "learning_rate": 0.0002165564067976016, "loss": 0.0552, "step": 86190 }, { "epoch": 0.56, "learning_rate": 0.00021654672544324467, "loss": 0.0474, "step": 86200 }, { "epoch": 0.56, "learning_rate": 0.00021653704408888772, "loss": 0.0553, "step": 86210 }, { "epoch": 0.56, "learning_rate": 0.00021652736273453078, "loss": 0.0538, "step": 86220 }, { "epoch": 0.56, "learning_rate": 0.00021651768138017386, "loss": 0.0544, "step": 86230 }, { "epoch": 0.56, "learning_rate": 0.0002165080000258169, "loss": 0.0511, "step": 86240 }, { "epoch": 0.56, "learning_rate": 0.00021649831867146, "loss": 0.05, "step": 86250 }, { "epoch": 0.56, "learning_rate": 0.00021648863731710307, "loss": 0.0489, "step": 86260 }, { "epoch": 0.56, "learning_rate": 0.00021647895596274615, "loss": 0.05, "step": 86270 }, { "epoch": 0.56, "learning_rate": 0.0002164692746083892, "loss": 0.0531, "step": 86280 }, { "epoch": 0.56, "learning_rate": 0.00021645959325403225, "loss": 0.0489, "step": 86290 }, { "epoch": 0.56, "learning_rate": 0.00021644991189967533, "loss": 0.0526, "step": 86300 }, { "epoch": 0.56, "learning_rate": 0.00021644023054531839, "loss": 0.0482, "step": 86310 }, { "epoch": 0.56, "learning_rate": 0.00021643054919096147, "loss": 0.0488, "step": 86320 }, { "epoch": 0.56, "learning_rate": 0.00021642086783660455, "loss": 0.0475, "step": 86330 }, { "epoch": 0.56, "learning_rate": 0.00021641118648224762, "loss": 0.0588, "step": 86340 }, { "epoch": 0.56, "learning_rate": 0.00021640150512789068, "loss": 0.0484, "step": 86350 }, { "epoch": 0.56, "learning_rate": 0.00021639182377353373, "loss": 0.0564, "step": 86360 }, { "epoch": 0.56, "learning_rate": 0.00021638214241917678, "loss": 0.0518, "step": 86370 }, { "epoch": 0.56, "learning_rate": 0.00021637246106481986, "loss": 0.0489, "step": 86380 }, { "epoch": 0.56, "learning_rate": 0.00021636277971046294, "loss": 0.0516, "step": 86390 }, { "epoch": 0.56, "learning_rate": 0.00021635309835610602, "loss": 0.0605, "step": 86400 }, { "epoch": 0.56, "learning_rate": 0.00021634341700174907, "loss": 0.0553, "step": 86410 }, { "epoch": 0.56, "learning_rate": 0.00021633373564739215, "loss": 0.0513, "step": 86420 }, { "epoch": 0.56, "learning_rate": 0.0002163240542930352, "loss": 0.0614, "step": 86430 }, { "epoch": 0.56, "learning_rate": 0.00021631437293867826, "loss": 0.05, "step": 86440 }, { "epoch": 0.56, "learning_rate": 0.00021630469158432134, "loss": 0.0498, "step": 86450 }, { "epoch": 0.56, "learning_rate": 0.00021629501022996442, "loss": 0.0491, "step": 86460 }, { "epoch": 0.56, "learning_rate": 0.0002162853288756075, "loss": 0.048, "step": 86470 }, { "epoch": 0.56, "learning_rate": 0.00021627564752125055, "loss": 0.046, "step": 86480 }, { "epoch": 0.56, "learning_rate": 0.00021626596616689363, "loss": 0.0525, "step": 86490 }, { "epoch": 0.56, "learning_rate": 0.00021625628481253668, "loss": 0.0489, "step": 86500 }, { "epoch": 0.56, "learning_rate": 0.00021624660345817974, "loss": 0.0513, "step": 86510 }, { "epoch": 0.56, "learning_rate": 0.00021623692210382282, "loss": 0.0522, "step": 86520 }, { "epoch": 0.56, "learning_rate": 0.0002162272407494659, "loss": 0.0497, "step": 86530 }, { "epoch": 0.56, "learning_rate": 0.00021621755939510898, "loss": 0.0504, "step": 86540 }, { "epoch": 0.56, "learning_rate": 0.00021620787804075203, "loss": 0.0493, "step": 86550 }, { "epoch": 0.56, "learning_rate": 0.0002161981966863951, "loss": 0.0474, "step": 86560 }, { "epoch": 0.56, "learning_rate": 0.00021618851533203813, "loss": 0.0484, "step": 86570 }, { "epoch": 0.56, "learning_rate": 0.00021617883397768121, "loss": 0.0512, "step": 86580 }, { "epoch": 0.56, "learning_rate": 0.0002161691526233243, "loss": 0.0484, "step": 86590 }, { "epoch": 0.56, "learning_rate": 0.00021615947126896737, "loss": 0.0402, "step": 86600 }, { "epoch": 0.56, "learning_rate": 0.00021614978991461043, "loss": 0.0515, "step": 86610 }, { "epoch": 0.56, "learning_rate": 0.0002161401085602535, "loss": 0.0487, "step": 86620 }, { "epoch": 0.56, "learning_rate": 0.00021613042720589659, "loss": 0.0471, "step": 86630 }, { "epoch": 0.56, "learning_rate": 0.0002161207458515396, "loss": 0.048, "step": 86640 }, { "epoch": 0.56, "learning_rate": 0.0002161110644971827, "loss": 0.0538, "step": 86650 }, { "epoch": 0.56, "learning_rate": 0.00021610138314282577, "loss": 0.0447, "step": 86660 }, { "epoch": 0.56, "learning_rate": 0.00021609170178846885, "loss": 0.0562, "step": 86670 }, { "epoch": 0.56, "learning_rate": 0.0002160820204341119, "loss": 0.0494, "step": 86680 }, { "epoch": 0.56, "learning_rate": 0.00021607233907975498, "loss": 0.0509, "step": 86690 }, { "epoch": 0.56, "learning_rate": 0.00021606265772539806, "loss": 0.0541, "step": 86700 }, { "epoch": 0.56, "learning_rate": 0.0002160529763710411, "loss": 0.0454, "step": 86710 }, { "epoch": 0.56, "learning_rate": 0.00021604329501668417, "loss": 0.054, "step": 86720 }, { "epoch": 0.56, "learning_rate": 0.00021603361366232725, "loss": 0.0613, "step": 86730 }, { "epoch": 0.56, "learning_rate": 0.00021602393230797033, "loss": 0.0486, "step": 86740 }, { "epoch": 0.56, "learning_rate": 0.00021601425095361338, "loss": 0.0711, "step": 86750 }, { "epoch": 0.56, "learning_rate": 0.00021600456959925646, "loss": 0.0554, "step": 86760 }, { "epoch": 0.56, "learning_rate": 0.00021599488824489954, "loss": 0.049, "step": 86770 }, { "epoch": 0.56, "learning_rate": 0.00021598520689054257, "loss": 0.0465, "step": 86780 }, { "epoch": 0.56, "learning_rate": 0.00021597552553618565, "loss": 0.0499, "step": 86790 }, { "epoch": 0.56, "learning_rate": 0.00021596584418182873, "loss": 0.0487, "step": 86800 }, { "epoch": 0.56, "learning_rate": 0.00021595616282747178, "loss": 0.0516, "step": 86810 }, { "epoch": 0.56, "learning_rate": 0.00021594648147311486, "loss": 0.0486, "step": 86820 }, { "epoch": 0.56, "learning_rate": 0.00021593680011875794, "loss": 0.0545, "step": 86830 }, { "epoch": 0.56, "learning_rate": 0.00021592711876440102, "loss": 0.0491, "step": 86840 }, { "epoch": 0.56, "learning_rate": 0.00021591743741004404, "loss": 0.057, "step": 86850 }, { "epoch": 0.56, "learning_rate": 0.00021590775605568712, "loss": 0.0519, "step": 86860 }, { "epoch": 0.56, "learning_rate": 0.0002158980747013302, "loss": 0.0481, "step": 86870 }, { "epoch": 0.56, "learning_rate": 0.00021588839334697326, "loss": 0.055, "step": 86880 }, { "epoch": 0.56, "learning_rate": 0.00021587871199261634, "loss": 0.0504, "step": 86890 }, { "epoch": 0.56, "learning_rate": 0.00021586903063825942, "loss": 0.0538, "step": 86900 }, { "epoch": 0.56, "learning_rate": 0.0002158593492839025, "loss": 0.0548, "step": 86910 }, { "epoch": 0.56, "learning_rate": 0.00021584966792954552, "loss": 0.0528, "step": 86920 }, { "epoch": 0.56, "learning_rate": 0.0002158399865751886, "loss": 0.0525, "step": 86930 }, { "epoch": 0.56, "learning_rate": 0.00021583030522083168, "loss": 0.0494, "step": 86940 }, { "epoch": 0.56, "learning_rate": 0.00021582062386647473, "loss": 0.049, "step": 86950 }, { "epoch": 0.56, "learning_rate": 0.0002158109425121178, "loss": 0.048, "step": 86960 }, { "epoch": 0.56, "learning_rate": 0.0002158012611577609, "loss": 0.0422, "step": 86970 }, { "epoch": 0.56, "learning_rate": 0.00021579157980340395, "loss": 0.051, "step": 86980 }, { "epoch": 0.56, "learning_rate": 0.000215781898449047, "loss": 0.051, "step": 86990 }, { "epoch": 0.56, "learning_rate": 0.00021577221709469008, "loss": 0.0473, "step": 87000 }, { "epoch": 0.56, "eval_cer": 0.9200949045305615, "eval_loss": 0.033820219337940216, "eval_runtime": 119.8564, "eval_samples_per_second": 16.687, "eval_steps_per_second": 4.172, "step": 87000 }, { "epoch": 0.56, "learning_rate": 0.00021576253574033313, "loss": 0.0527, "step": 87010 }, { "epoch": 0.56, "learning_rate": 0.0002157528543859762, "loss": 0.0451, "step": 87020 }, { "epoch": 0.56, "learning_rate": 0.0002157431730316193, "loss": 0.0548, "step": 87030 }, { "epoch": 0.56, "learning_rate": 0.00021573349167726237, "loss": 0.0487, "step": 87040 }, { "epoch": 0.56, "learning_rate": 0.00021572381032290542, "loss": 0.0535, "step": 87050 }, { "epoch": 0.56, "learning_rate": 0.00021571412896854848, "loss": 0.0517, "step": 87060 }, { "epoch": 0.56, "learning_rate": 0.00021570444761419156, "loss": 0.0513, "step": 87070 }, { "epoch": 0.56, "learning_rate": 0.0002156947662598346, "loss": 0.056, "step": 87080 }, { "epoch": 0.56, "learning_rate": 0.0002156850849054777, "loss": 0.0534, "step": 87090 }, { "epoch": 0.56, "learning_rate": 0.00021567540355112077, "loss": 0.0483, "step": 87100 }, { "epoch": 0.56, "learning_rate": 0.00021566572219676385, "loss": 0.0455, "step": 87110 }, { "epoch": 0.56, "learning_rate": 0.0002156560408424069, "loss": 0.0572, "step": 87120 }, { "epoch": 0.56, "learning_rate": 0.00021564635948804995, "loss": 0.0582, "step": 87130 }, { "epoch": 0.56, "learning_rate": 0.00021563667813369303, "loss": 0.0464, "step": 87140 }, { "epoch": 0.56, "learning_rate": 0.00021562699677933609, "loss": 0.054, "step": 87150 }, { "epoch": 0.56, "learning_rate": 0.00021561731542497916, "loss": 0.0445, "step": 87160 }, { "epoch": 0.56, "learning_rate": 0.00021560763407062224, "loss": 0.0489, "step": 87170 }, { "epoch": 0.56, "learning_rate": 0.0002155979527162653, "loss": 0.0592, "step": 87180 }, { "epoch": 0.56, "learning_rate": 0.00021558827136190838, "loss": 0.0507, "step": 87190 }, { "epoch": 0.56, "learning_rate": 0.00021557859000755143, "loss": 0.0487, "step": 87200 }, { "epoch": 0.56, "learning_rate": 0.00021556890865319448, "loss": 0.0508, "step": 87210 }, { "epoch": 0.56, "learning_rate": 0.00021555922729883756, "loss": 0.0437, "step": 87220 }, { "epoch": 0.56, "learning_rate": 0.00021554954594448064, "loss": 0.0557, "step": 87230 }, { "epoch": 0.56, "learning_rate": 0.00021553986459012372, "loss": 0.0448, "step": 87240 }, { "epoch": 0.56, "learning_rate": 0.00021553018323576677, "loss": 0.0466, "step": 87250 }, { "epoch": 0.56, "learning_rate": 0.00021552050188140985, "loss": 0.0442, "step": 87260 }, { "epoch": 0.56, "learning_rate": 0.0002155108205270529, "loss": 0.0493, "step": 87270 }, { "epoch": 0.56, "learning_rate": 0.00021550113917269596, "loss": 0.0443, "step": 87280 }, { "epoch": 0.56, "learning_rate": 0.00021549145781833904, "loss": 0.0517, "step": 87290 }, { "epoch": 0.56, "learning_rate": 0.00021548177646398212, "loss": 0.0503, "step": 87300 }, { "epoch": 0.56, "learning_rate": 0.0002154720951096252, "loss": 0.0582, "step": 87310 }, { "epoch": 0.56, "learning_rate": 0.00021546241375526825, "loss": 0.0552, "step": 87320 }, { "epoch": 0.56, "learning_rate": 0.00021545273240091133, "loss": 0.0592, "step": 87330 }, { "epoch": 0.56, "learning_rate": 0.00021544305104655438, "loss": 0.0571, "step": 87340 }, { "epoch": 0.56, "learning_rate": 0.00021543336969219744, "loss": 0.051, "step": 87350 }, { "epoch": 0.56, "learning_rate": 0.00021542368833784052, "loss": 0.0594, "step": 87360 }, { "epoch": 0.56, "learning_rate": 0.0002154140069834836, "loss": 0.0453, "step": 87370 }, { "epoch": 0.56, "learning_rate": 0.00021540432562912665, "loss": 0.0583, "step": 87380 }, { "epoch": 0.56, "learning_rate": 0.00021539464427476973, "loss": 0.0571, "step": 87390 }, { "epoch": 0.56, "learning_rate": 0.0002153849629204128, "loss": 0.0474, "step": 87400 }, { "epoch": 0.56, "learning_rate": 0.00021537528156605583, "loss": 0.053, "step": 87410 }, { "epoch": 0.56, "learning_rate": 0.00021536560021169891, "loss": 0.0545, "step": 87420 }, { "epoch": 0.56, "learning_rate": 0.000215355918857342, "loss": 0.0521, "step": 87430 }, { "epoch": 0.56, "learning_rate": 0.00021534623750298507, "loss": 0.0503, "step": 87440 }, { "epoch": 0.56, "learning_rate": 0.00021533655614862813, "loss": 0.0504, "step": 87450 }, { "epoch": 0.56, "learning_rate": 0.0002153268747942712, "loss": 0.0535, "step": 87460 }, { "epoch": 0.56, "learning_rate": 0.00021531719343991429, "loss": 0.0488, "step": 87470 }, { "epoch": 0.56, "learning_rate": 0.0002153075120855573, "loss": 0.0514, "step": 87480 }, { "epoch": 0.56, "learning_rate": 0.0002152978307312004, "loss": 0.0463, "step": 87490 }, { "epoch": 0.56, "learning_rate": 0.00021528814937684347, "loss": 0.0473, "step": 87500 }, { "epoch": 0.56, "learning_rate": 0.00021527846802248655, "loss": 0.0452, "step": 87510 }, { "epoch": 0.56, "learning_rate": 0.0002152687866681296, "loss": 0.0492, "step": 87520 }, { "epoch": 0.56, "learning_rate": 0.00021525910531377268, "loss": 0.0656, "step": 87530 }, { "epoch": 0.57, "learning_rate": 0.00021524942395941576, "loss": 0.0516, "step": 87540 }, { "epoch": 0.57, "learning_rate": 0.0002152397426050588, "loss": 0.0464, "step": 87550 }, { "epoch": 0.57, "learning_rate": 0.00021523006125070187, "loss": 0.0437, "step": 87560 }, { "epoch": 0.57, "learning_rate": 0.00021522037989634495, "loss": 0.0487, "step": 87570 }, { "epoch": 0.57, "learning_rate": 0.000215210698541988, "loss": 0.0499, "step": 87580 }, { "epoch": 0.57, "learning_rate": 0.00021520101718763108, "loss": 0.0465, "step": 87590 }, { "epoch": 0.57, "learning_rate": 0.00021519133583327416, "loss": 0.0503, "step": 87600 }, { "epoch": 0.57, "learning_rate": 0.00021518165447891724, "loss": 0.0468, "step": 87610 }, { "epoch": 0.57, "learning_rate": 0.00021517197312456027, "loss": 0.0546, "step": 87620 }, { "epoch": 0.57, "learning_rate": 0.00021516229177020335, "loss": 0.052, "step": 87630 }, { "epoch": 0.57, "learning_rate": 0.00021515261041584643, "loss": 0.0444, "step": 87640 }, { "epoch": 0.57, "learning_rate": 0.00021514292906148948, "loss": 0.052, "step": 87650 }, { "epoch": 0.57, "learning_rate": 0.00021513324770713256, "loss": 0.0528, "step": 87660 }, { "epoch": 0.57, "learning_rate": 0.00021512356635277564, "loss": 0.046, "step": 87670 }, { "epoch": 0.57, "learning_rate": 0.00021511388499841872, "loss": 0.0544, "step": 87680 }, { "epoch": 0.57, "learning_rate": 0.00021510420364406174, "loss": 0.0505, "step": 87690 }, { "epoch": 0.57, "learning_rate": 0.00021509452228970482, "loss": 0.0638, "step": 87700 }, { "epoch": 0.57, "learning_rate": 0.0002150848409353479, "loss": 0.0509, "step": 87710 }, { "epoch": 0.57, "learning_rate": 0.00021507515958099096, "loss": 0.0538, "step": 87720 }, { "epoch": 0.57, "learning_rate": 0.00021506547822663404, "loss": 0.0516, "step": 87730 }, { "epoch": 0.57, "learning_rate": 0.00021505579687227712, "loss": 0.0458, "step": 87740 }, { "epoch": 0.57, "learning_rate": 0.00021504611551792017, "loss": 0.0484, "step": 87750 }, { "epoch": 0.57, "learning_rate": 0.00021503643416356322, "loss": 0.0486, "step": 87760 }, { "epoch": 0.57, "learning_rate": 0.0002150267528092063, "loss": 0.0514, "step": 87770 }, { "epoch": 0.57, "learning_rate": 0.00021501707145484935, "loss": 0.0505, "step": 87780 }, { "epoch": 0.57, "learning_rate": 0.00021500739010049243, "loss": 0.0664, "step": 87790 }, { "epoch": 0.57, "learning_rate": 0.0002149977087461355, "loss": 0.0526, "step": 87800 }, { "epoch": 0.57, "learning_rate": 0.0002149880273917786, "loss": 0.0528, "step": 87810 }, { "epoch": 0.57, "learning_rate": 0.00021497834603742165, "loss": 0.0495, "step": 87820 }, { "epoch": 0.57, "learning_rate": 0.0002149686646830647, "loss": 0.0544, "step": 87830 }, { "epoch": 0.57, "learning_rate": 0.00021495898332870778, "loss": 0.0529, "step": 87840 }, { "epoch": 0.57, "learning_rate": 0.00021494930197435083, "loss": 0.0443, "step": 87850 }, { "epoch": 0.57, "learning_rate": 0.0002149396206199939, "loss": 0.054, "step": 87860 }, { "epoch": 0.57, "learning_rate": 0.000214929939265637, "loss": 0.054, "step": 87870 }, { "epoch": 0.57, "learning_rate": 0.00021492025791128007, "loss": 0.0426, "step": 87880 }, { "epoch": 0.57, "learning_rate": 0.00021491057655692312, "loss": 0.0438, "step": 87890 }, { "epoch": 0.57, "learning_rate": 0.00021490089520256617, "loss": 0.0519, "step": 87900 }, { "epoch": 0.57, "learning_rate": 0.00021489121384820925, "loss": 0.0497, "step": 87910 }, { "epoch": 0.57, "learning_rate": 0.0002148815324938523, "loss": 0.05, "step": 87920 }, { "epoch": 0.57, "learning_rate": 0.0002148718511394954, "loss": 0.0486, "step": 87930 }, { "epoch": 0.57, "learning_rate": 0.00021486216978513847, "loss": 0.0567, "step": 87940 }, { "epoch": 0.57, "learning_rate": 0.00021485248843078152, "loss": 0.0535, "step": 87950 }, { "epoch": 0.57, "learning_rate": 0.0002148428070764246, "loss": 0.0468, "step": 87960 }, { "epoch": 0.57, "learning_rate": 0.00021483312572206765, "loss": 0.0447, "step": 87970 }, { "epoch": 0.57, "learning_rate": 0.0002148234443677107, "loss": 0.0585, "step": 87980 }, { "epoch": 0.57, "learning_rate": 0.00021481376301335378, "loss": 0.0522, "step": 87990 }, { "epoch": 0.57, "learning_rate": 0.00021480408165899686, "loss": 0.0449, "step": 88000 }, { "epoch": 0.57, "eval_cer": 0.9198897299740142, "eval_loss": 0.033422499895095825, "eval_runtime": 119.8447, "eval_samples_per_second": 16.688, "eval_steps_per_second": 4.172, "step": 88000 }, { "epoch": 0.57, "learning_rate": 0.00021479440030463994, "loss": 0.0464, "step": 88010 }, { "epoch": 0.57, "learning_rate": 0.000214784718950283, "loss": 0.0526, "step": 88020 }, { "epoch": 0.57, "learning_rate": 0.00021477503759592608, "loss": 0.0547, "step": 88030 }, { "epoch": 0.57, "learning_rate": 0.00021476535624156913, "loss": 0.0522, "step": 88040 }, { "epoch": 0.57, "learning_rate": 0.00021475567488721218, "loss": 0.0485, "step": 88050 }, { "epoch": 0.57, "learning_rate": 0.00021474599353285526, "loss": 0.047, "step": 88060 }, { "epoch": 0.57, "learning_rate": 0.00021473631217849834, "loss": 0.05, "step": 88070 }, { "epoch": 0.57, "learning_rate": 0.00021472663082414142, "loss": 0.05, "step": 88080 }, { "epoch": 0.57, "learning_rate": 0.00021471694946978447, "loss": 0.052, "step": 88090 }, { "epoch": 0.57, "learning_rate": 0.00021470726811542755, "loss": 0.0432, "step": 88100 }, { "epoch": 0.57, "learning_rate": 0.0002146975867610706, "loss": 0.0523, "step": 88110 }, { "epoch": 0.57, "learning_rate": 0.00021468790540671366, "loss": 0.0449, "step": 88120 }, { "epoch": 0.57, "learning_rate": 0.00021467822405235674, "loss": 0.0498, "step": 88130 }, { "epoch": 0.57, "learning_rate": 0.00021466854269799982, "loss": 0.0489, "step": 88140 }, { "epoch": 0.57, "learning_rate": 0.00021465886134364287, "loss": 0.0532, "step": 88150 }, { "epoch": 0.57, "learning_rate": 0.00021464917998928595, "loss": 0.0495, "step": 88160 }, { "epoch": 0.57, "learning_rate": 0.00021463949863492903, "loss": 0.0549, "step": 88170 }, { "epoch": 0.57, "learning_rate": 0.00021462981728057206, "loss": 0.0512, "step": 88180 }, { "epoch": 0.57, "learning_rate": 0.00021462013592621514, "loss": 0.0484, "step": 88190 }, { "epoch": 0.57, "learning_rate": 0.00021461045457185822, "loss": 0.0504, "step": 88200 }, { "epoch": 0.57, "learning_rate": 0.0002146007732175013, "loss": 0.0471, "step": 88210 }, { "epoch": 0.57, "learning_rate": 0.00021459109186314435, "loss": 0.055, "step": 88220 }, { "epoch": 0.57, "learning_rate": 0.00021458141050878743, "loss": 0.0478, "step": 88230 }, { "epoch": 0.57, "learning_rate": 0.0002145717291544305, "loss": 0.0471, "step": 88240 }, { "epoch": 0.57, "learning_rate": 0.00021456204780007353, "loss": 0.0532, "step": 88250 }, { "epoch": 0.57, "learning_rate": 0.00021455236644571661, "loss": 0.0517, "step": 88260 }, { "epoch": 0.57, "learning_rate": 0.0002145426850913597, "loss": 0.0551, "step": 88270 }, { "epoch": 0.57, "learning_rate": 0.00021453300373700277, "loss": 0.0498, "step": 88280 }, { "epoch": 0.57, "learning_rate": 0.00021452332238264583, "loss": 0.0456, "step": 88290 }, { "epoch": 0.57, "learning_rate": 0.0002145136410282889, "loss": 0.0592, "step": 88300 }, { "epoch": 0.57, "learning_rate": 0.00021450395967393199, "loss": 0.0457, "step": 88310 }, { "epoch": 0.57, "learning_rate": 0.000214494278319575, "loss": 0.049, "step": 88320 }, { "epoch": 0.57, "learning_rate": 0.0002144845969652181, "loss": 0.0446, "step": 88330 }, { "epoch": 0.57, "learning_rate": 0.00021447491561086117, "loss": 0.0556, "step": 88340 }, { "epoch": 0.57, "learning_rate": 0.00021446523425650422, "loss": 0.0535, "step": 88350 }, { "epoch": 0.57, "learning_rate": 0.0002144555529021473, "loss": 0.0484, "step": 88360 }, { "epoch": 0.57, "learning_rate": 0.00021444587154779038, "loss": 0.0448, "step": 88370 }, { "epoch": 0.57, "learning_rate": 0.00021443619019343346, "loss": 0.0528, "step": 88380 }, { "epoch": 0.57, "learning_rate": 0.0002144265088390765, "loss": 0.0482, "step": 88390 }, { "epoch": 0.57, "learning_rate": 0.00021441682748471957, "loss": 0.0558, "step": 88400 }, { "epoch": 0.57, "learning_rate": 0.00021440714613036265, "loss": 0.0587, "step": 88410 }, { "epoch": 0.57, "learning_rate": 0.0002143974647760057, "loss": 0.0577, "step": 88420 }, { "epoch": 0.57, "learning_rate": 0.00021438778342164878, "loss": 0.0505, "step": 88430 }, { "epoch": 0.57, "learning_rate": 0.00021437810206729186, "loss": 0.0469, "step": 88440 }, { "epoch": 0.57, "learning_rate": 0.00021436842071293494, "loss": 0.0503, "step": 88450 }, { "epoch": 0.57, "learning_rate": 0.00021435873935857797, "loss": 0.0448, "step": 88460 }, { "epoch": 0.57, "learning_rate": 0.00021434905800422105, "loss": 0.0559, "step": 88470 }, { "epoch": 0.57, "learning_rate": 0.00021433937664986413, "loss": 0.0517, "step": 88480 }, { "epoch": 0.57, "learning_rate": 0.00021432969529550718, "loss": 0.1163, "step": 88490 }, { "epoch": 0.57, "learning_rate": 0.00021432001394115026, "loss": 0.0504, "step": 88500 }, { "epoch": 0.57, "learning_rate": 0.00021431033258679334, "loss": 0.0451, "step": 88510 }, { "epoch": 0.57, "learning_rate": 0.00021430065123243642, "loss": 0.0537, "step": 88520 }, { "epoch": 0.57, "learning_rate": 0.00021429096987807944, "loss": 0.049, "step": 88530 }, { "epoch": 0.57, "learning_rate": 0.00021428128852372252, "loss": 0.0489, "step": 88540 }, { "epoch": 0.57, "learning_rate": 0.00021427160716936558, "loss": 0.0418, "step": 88550 }, { "epoch": 0.57, "learning_rate": 0.00021426192581500866, "loss": 0.0468, "step": 88560 }, { "epoch": 0.57, "learning_rate": 0.00021425224446065173, "loss": 0.0465, "step": 88570 }, { "epoch": 0.57, "learning_rate": 0.00021424256310629481, "loss": 0.0432, "step": 88580 }, { "epoch": 0.57, "learning_rate": 0.00021423288175193787, "loss": 0.0567, "step": 88590 }, { "epoch": 0.57, "learning_rate": 0.00021422320039758092, "loss": 0.0526, "step": 88600 }, { "epoch": 0.57, "learning_rate": 0.000214213519043224, "loss": 0.0483, "step": 88610 }, { "epoch": 0.57, "learning_rate": 0.00021420383768886705, "loss": 0.0448, "step": 88620 }, { "epoch": 0.57, "learning_rate": 0.00021419415633451013, "loss": 0.0469, "step": 88630 }, { "epoch": 0.57, "learning_rate": 0.0002141844749801532, "loss": 0.0476, "step": 88640 }, { "epoch": 0.57, "learning_rate": 0.0002141747936257963, "loss": 0.0408, "step": 88650 }, { "epoch": 0.57, "learning_rate": 0.00021416511227143934, "loss": 0.0503, "step": 88660 }, { "epoch": 0.57, "learning_rate": 0.0002141554309170824, "loss": 0.0593, "step": 88670 }, { "epoch": 0.57, "learning_rate": 0.00021414574956272548, "loss": 0.0624, "step": 88680 }, { "epoch": 0.57, "learning_rate": 0.00021413606820836853, "loss": 0.0556, "step": 88690 }, { "epoch": 0.57, "learning_rate": 0.0002141263868540116, "loss": 0.044, "step": 88700 }, { "epoch": 0.57, "learning_rate": 0.0002141167054996547, "loss": 0.05, "step": 88710 }, { "epoch": 0.57, "learning_rate": 0.00021410702414529777, "loss": 0.0497, "step": 88720 }, { "epoch": 0.57, "learning_rate": 0.00021409734279094082, "loss": 0.0502, "step": 88730 }, { "epoch": 0.57, "learning_rate": 0.00021408766143658387, "loss": 0.0459, "step": 88740 }, { "epoch": 0.57, "learning_rate": 0.00021407798008222695, "loss": 0.0549, "step": 88750 }, { "epoch": 0.57, "learning_rate": 0.00021406829872787, "loss": 0.0516, "step": 88760 }, { "epoch": 0.57, "learning_rate": 0.0002140586173735131, "loss": 0.0519, "step": 88770 }, { "epoch": 0.57, "learning_rate": 0.00021404893601915617, "loss": 0.0472, "step": 88780 }, { "epoch": 0.57, "learning_rate": 0.00021403925466479922, "loss": 0.0476, "step": 88790 }, { "epoch": 0.57, "learning_rate": 0.0002140295733104423, "loss": 0.0503, "step": 88800 }, { "epoch": 0.57, "learning_rate": 0.00021401989195608535, "loss": 0.0544, "step": 88810 }, { "epoch": 0.57, "learning_rate": 0.0002140102106017284, "loss": 0.0512, "step": 88820 }, { "epoch": 0.57, "learning_rate": 0.00021400052924737148, "loss": 0.0436, "step": 88830 }, { "epoch": 0.57, "learning_rate": 0.00021399084789301456, "loss": 0.0572, "step": 88840 }, { "epoch": 0.57, "learning_rate": 0.00021398116653865764, "loss": 0.0486, "step": 88850 }, { "epoch": 0.57, "learning_rate": 0.0002139714851843007, "loss": 0.0566, "step": 88860 }, { "epoch": 0.57, "learning_rate": 0.00021396180382994378, "loss": 0.057, "step": 88870 }, { "epoch": 0.57, "learning_rate": 0.00021395212247558683, "loss": 0.05, "step": 88880 }, { "epoch": 0.57, "learning_rate": 0.00021394244112122988, "loss": 0.048, "step": 88890 }, { "epoch": 0.57, "learning_rate": 0.00021393275976687296, "loss": 0.0551, "step": 88900 }, { "epoch": 0.57, "learning_rate": 0.00021392307841251604, "loss": 0.0545, "step": 88910 }, { "epoch": 0.57, "learning_rate": 0.00021391339705815912, "loss": 0.0476, "step": 88920 }, { "epoch": 0.57, "learning_rate": 0.00021390371570380217, "loss": 0.0507, "step": 88930 }, { "epoch": 0.57, "learning_rate": 0.00021389403434944525, "loss": 0.061, "step": 88940 }, { "epoch": 0.57, "learning_rate": 0.0002138843529950883, "loss": 0.0531, "step": 88950 }, { "epoch": 0.57, "learning_rate": 0.00021387467164073136, "loss": 0.0464, "step": 88960 }, { "epoch": 0.57, "learning_rate": 0.00021386499028637444, "loss": 0.0531, "step": 88970 }, { "epoch": 0.57, "learning_rate": 0.00021385530893201752, "loss": 0.0444, "step": 88980 }, { "epoch": 0.57, "learning_rate": 0.00021384562757766057, "loss": 0.0478, "step": 88990 }, { "epoch": 0.57, "learning_rate": 0.00021383594622330365, "loss": 0.0516, "step": 89000 }, { "epoch": 0.57, "eval_cer": 0.919940345723647, "eval_loss": 0.0331486351788044, "eval_runtime": 120.3849, "eval_samples_per_second": 16.613, "eval_steps_per_second": 4.153, "step": 89000 }, { "epoch": 0.57, "learning_rate": 0.00021382626486894673, "loss": 0.0438, "step": 89010 }, { "epoch": 0.57, "learning_rate": 0.00021381658351458976, "loss": 0.0481, "step": 89020 }, { "epoch": 0.57, "learning_rate": 0.00021380690216023284, "loss": 0.042, "step": 89030 }, { "epoch": 0.57, "learning_rate": 0.00021379722080587592, "loss": 0.0482, "step": 89040 }, { "epoch": 0.57, "learning_rate": 0.000213787539451519, "loss": 0.0517, "step": 89050 }, { "epoch": 0.57, "learning_rate": 0.00021377785809716205, "loss": 0.0447, "step": 89060 }, { "epoch": 0.57, "learning_rate": 0.00021376817674280513, "loss": 0.0501, "step": 89070 }, { "epoch": 0.57, "learning_rate": 0.0002137584953884482, "loss": 0.0514, "step": 89080 }, { "epoch": 0.58, "learning_rate": 0.00021374881403409123, "loss": 0.0523, "step": 89090 }, { "epoch": 0.58, "learning_rate": 0.0002137391326797343, "loss": 0.0483, "step": 89100 }, { "epoch": 0.58, "learning_rate": 0.0002137294513253774, "loss": 0.0572, "step": 89110 }, { "epoch": 0.58, "learning_rate": 0.00021371976997102047, "loss": 0.0533, "step": 89120 }, { "epoch": 0.58, "learning_rate": 0.00021371008861666353, "loss": 0.0492, "step": 89130 }, { "epoch": 0.58, "learning_rate": 0.0002137004072623066, "loss": 0.0538, "step": 89140 }, { "epoch": 0.58, "learning_rate": 0.00021369072590794969, "loss": 0.057, "step": 89150 }, { "epoch": 0.58, "learning_rate": 0.0002136810445535927, "loss": 0.0537, "step": 89160 }, { "epoch": 0.58, "learning_rate": 0.0002136713631992358, "loss": 0.0451, "step": 89170 }, { "epoch": 0.58, "learning_rate": 0.00021366168184487887, "loss": 0.0501, "step": 89180 }, { "epoch": 0.58, "learning_rate": 0.00021365200049052192, "loss": 0.0439, "step": 89190 }, { "epoch": 0.58, "learning_rate": 0.000213642319136165, "loss": 0.0529, "step": 89200 }, { "epoch": 0.58, "learning_rate": 0.00021363263778180808, "loss": 0.044, "step": 89210 }, { "epoch": 0.58, "learning_rate": 0.00021362295642745116, "loss": 0.0455, "step": 89220 }, { "epoch": 0.58, "learning_rate": 0.0002136132750730942, "loss": 0.0539, "step": 89230 }, { "epoch": 0.58, "learning_rate": 0.00021360359371873727, "loss": 0.0425, "step": 89240 }, { "epoch": 0.58, "learning_rate": 0.00021359391236438035, "loss": 0.0447, "step": 89250 }, { "epoch": 0.58, "learning_rate": 0.0002135842310100234, "loss": 0.049, "step": 89260 }, { "epoch": 0.58, "learning_rate": 0.00021357454965566648, "loss": 0.05, "step": 89270 }, { "epoch": 0.58, "learning_rate": 0.00021356486830130956, "loss": 0.0505, "step": 89280 }, { "epoch": 0.58, "learning_rate": 0.00021355518694695264, "loss": 0.0449, "step": 89290 }, { "epoch": 0.58, "learning_rate": 0.00021354550559259567, "loss": 0.0501, "step": 89300 }, { "epoch": 0.58, "learning_rate": 0.00021353582423823875, "loss": 0.0443, "step": 89310 }, { "epoch": 0.58, "learning_rate": 0.00021352614288388182, "loss": 0.0478, "step": 89320 }, { "epoch": 0.58, "learning_rate": 0.00021351646152952488, "loss": 0.0536, "step": 89330 }, { "epoch": 0.58, "learning_rate": 0.00021350678017516796, "loss": 0.0638, "step": 89340 }, { "epoch": 0.58, "learning_rate": 0.00021349709882081104, "loss": 0.0515, "step": 89350 }, { "epoch": 0.58, "learning_rate": 0.0002134874174664541, "loss": 0.0458, "step": 89360 }, { "epoch": 0.58, "learning_rate": 0.00021347773611209714, "loss": 0.0497, "step": 89370 }, { "epoch": 0.58, "learning_rate": 0.00021346805475774022, "loss": 0.0471, "step": 89380 }, { "epoch": 0.58, "learning_rate": 0.00021345837340338327, "loss": 0.0479, "step": 89390 }, { "epoch": 0.58, "learning_rate": 0.00021344869204902635, "loss": 0.0452, "step": 89400 }, { "epoch": 0.58, "learning_rate": 0.00021343901069466943, "loss": 0.04, "step": 89410 }, { "epoch": 0.58, "learning_rate": 0.00021342932934031251, "loss": 0.0482, "step": 89420 }, { "epoch": 0.58, "learning_rate": 0.00021341964798595557, "loss": 0.0575, "step": 89430 }, { "epoch": 0.58, "learning_rate": 0.00021340996663159862, "loss": 0.048, "step": 89440 }, { "epoch": 0.58, "learning_rate": 0.0002134002852772417, "loss": 0.0497, "step": 89450 }, { "epoch": 0.58, "learning_rate": 0.00021339060392288475, "loss": 0.0513, "step": 89460 }, { "epoch": 0.58, "learning_rate": 0.00021338092256852783, "loss": 0.0529, "step": 89470 }, { "epoch": 0.58, "learning_rate": 0.0002133712412141709, "loss": 0.0537, "step": 89480 }, { "epoch": 0.58, "learning_rate": 0.000213361559859814, "loss": 0.0507, "step": 89490 }, { "epoch": 0.58, "learning_rate": 0.00021335187850545704, "loss": 0.0535, "step": 89500 }, { "epoch": 0.58, "learning_rate": 0.0002133421971511001, "loss": 0.0499, "step": 89510 }, { "epoch": 0.58, "learning_rate": 0.00021333251579674318, "loss": 0.0537, "step": 89520 }, { "epoch": 0.58, "learning_rate": 0.00021332283444238623, "loss": 0.0521, "step": 89530 }, { "epoch": 0.58, "learning_rate": 0.0002133131530880293, "loss": 0.0481, "step": 89540 }, { "epoch": 0.58, "learning_rate": 0.0002133034717336724, "loss": 0.0475, "step": 89550 }, { "epoch": 0.58, "learning_rate": 0.00021329379037931544, "loss": 0.0481, "step": 89560 }, { "epoch": 0.58, "learning_rate": 0.00021328410902495852, "loss": 0.0476, "step": 89570 }, { "epoch": 0.58, "learning_rate": 0.00021327442767060157, "loss": 0.059, "step": 89580 }, { "epoch": 0.58, "learning_rate": 0.00021326474631624463, "loss": 0.0473, "step": 89590 }, { "epoch": 0.58, "learning_rate": 0.0002132550649618877, "loss": 0.0578, "step": 89600 }, { "epoch": 0.58, "learning_rate": 0.0002132453836075308, "loss": 0.0483, "step": 89610 }, { "epoch": 0.58, "learning_rate": 0.00021323570225317387, "loss": 0.0484, "step": 89620 }, { "epoch": 0.58, "learning_rate": 0.00021322602089881692, "loss": 0.06, "step": 89630 }, { "epoch": 0.58, "learning_rate": 0.00021321633954446, "loss": 0.0464, "step": 89640 }, { "epoch": 0.58, "learning_rate": 0.00021320665819010305, "loss": 0.0454, "step": 89650 }, { "epoch": 0.58, "learning_rate": 0.0002131969768357461, "loss": 0.0541, "step": 89660 }, { "epoch": 0.58, "learning_rate": 0.00021318729548138918, "loss": 0.0554, "step": 89670 }, { "epoch": 0.58, "learning_rate": 0.00021317761412703226, "loss": 0.0464, "step": 89680 }, { "epoch": 0.58, "learning_rate": 0.00021316793277267534, "loss": 0.0485, "step": 89690 }, { "epoch": 0.58, "learning_rate": 0.0002131582514183184, "loss": 0.0474, "step": 89700 }, { "epoch": 0.58, "learning_rate": 0.00021314857006396148, "loss": 0.0523, "step": 89710 }, { "epoch": 0.58, "learning_rate": 0.00021313888870960453, "loss": 0.0531, "step": 89720 }, { "epoch": 0.58, "learning_rate": 0.00021312920735524758, "loss": 0.0479, "step": 89730 }, { "epoch": 0.58, "learning_rate": 0.00021311952600089066, "loss": 0.045, "step": 89740 }, { "epoch": 0.58, "learning_rate": 0.00021310984464653374, "loss": 0.0457, "step": 89750 }, { "epoch": 0.58, "learning_rate": 0.0002131001632921768, "loss": 0.0488, "step": 89760 }, { "epoch": 0.58, "learning_rate": 0.00021309048193781987, "loss": 0.0575, "step": 89770 }, { "epoch": 0.58, "learning_rate": 0.00021308080058346295, "loss": 0.0511, "step": 89780 }, { "epoch": 0.58, "learning_rate": 0.00021307111922910598, "loss": 0.0524, "step": 89790 }, { "epoch": 0.58, "learning_rate": 0.00021306143787474906, "loss": 0.0504, "step": 89800 }, { "epoch": 0.58, "learning_rate": 0.00021305175652039214, "loss": 0.0492, "step": 89810 }, { "epoch": 0.58, "learning_rate": 0.00021304207516603522, "loss": 0.0521, "step": 89820 }, { "epoch": 0.58, "learning_rate": 0.00021303239381167827, "loss": 0.0517, "step": 89830 }, { "epoch": 0.58, "learning_rate": 0.00021302271245732135, "loss": 0.0474, "step": 89840 }, { "epoch": 0.58, "learning_rate": 0.00021301303110296443, "loss": 0.0559, "step": 89850 }, { "epoch": 0.58, "learning_rate": 0.00021300334974860746, "loss": 0.0526, "step": 89860 }, { "epoch": 0.58, "learning_rate": 0.00021299366839425054, "loss": 0.054, "step": 89870 }, { "epoch": 0.58, "learning_rate": 0.00021298398703989362, "loss": 0.0497, "step": 89880 }, { "epoch": 0.58, "learning_rate": 0.0002129743056855367, "loss": 0.0537, "step": 89890 }, { "epoch": 0.58, "learning_rate": 0.00021296462433117975, "loss": 0.0481, "step": 89900 }, { "epoch": 0.58, "learning_rate": 0.00021295494297682283, "loss": 0.0457, "step": 89910 }, { "epoch": 0.58, "learning_rate": 0.0002129452616224659, "loss": 0.0505, "step": 89920 }, { "epoch": 0.58, "learning_rate": 0.00021293558026810893, "loss": 0.0466, "step": 89930 }, { "epoch": 0.58, "learning_rate": 0.000212925898913752, "loss": 0.0525, "step": 89940 }, { "epoch": 0.58, "learning_rate": 0.0002129162175593951, "loss": 0.0482, "step": 89950 }, { "epoch": 0.58, "learning_rate": 0.00021290653620503815, "loss": 0.068, "step": 89960 }, { "epoch": 0.58, "learning_rate": 0.00021289685485068123, "loss": 0.0501, "step": 89970 }, { "epoch": 0.58, "learning_rate": 0.0002128871734963243, "loss": 0.0417, "step": 89980 }, { "epoch": 0.58, "learning_rate": 0.00021287749214196738, "loss": 0.0546, "step": 89990 }, { "epoch": 0.58, "learning_rate": 0.0002128678107876104, "loss": 0.0537, "step": 90000 }, { "epoch": 0.58, "eval_cer": 0.9199249802282228, "eval_loss": 0.03311315178871155, "eval_runtime": 119.7145, "eval_samples_per_second": 16.706, "eval_steps_per_second": 4.177, "step": 90000 }, { "epoch": 0.58, "learning_rate": 0.0002128581294332535, "loss": 0.0477, "step": 90010 }, { "epoch": 0.58, "learning_rate": 0.00021284844807889657, "loss": 0.057, "step": 90020 }, { "epoch": 0.58, "learning_rate": 0.00021283876672453962, "loss": 0.0535, "step": 90030 }, { "epoch": 0.58, "learning_rate": 0.0002128290853701827, "loss": 0.0485, "step": 90040 }, { "epoch": 0.58, "learning_rate": 0.00021281940401582578, "loss": 0.0517, "step": 90050 }, { "epoch": 0.58, "learning_rate": 0.00021280972266146886, "loss": 0.0503, "step": 90060 }, { "epoch": 0.58, "learning_rate": 0.0002128000413071119, "loss": 0.0543, "step": 90070 }, { "epoch": 0.58, "learning_rate": 0.00021279035995275497, "loss": 0.0519, "step": 90080 }, { "epoch": 0.58, "learning_rate": 0.00021278067859839805, "loss": 0.0541, "step": 90090 }, { "epoch": 0.58, "learning_rate": 0.0002127709972440411, "loss": 0.0505, "step": 90100 }, { "epoch": 0.58, "learning_rate": 0.00021276131588968418, "loss": 0.048, "step": 90110 }, { "epoch": 0.58, "learning_rate": 0.00021275163453532726, "loss": 0.0522, "step": 90120 }, { "epoch": 0.58, "learning_rate": 0.00021274195318097034, "loss": 0.0512, "step": 90130 }, { "epoch": 0.58, "learning_rate": 0.00021273227182661336, "loss": 0.0437, "step": 90140 }, { "epoch": 0.58, "learning_rate": 0.00021272259047225644, "loss": 0.0542, "step": 90150 }, { "epoch": 0.58, "learning_rate": 0.0002127129091178995, "loss": 0.0521, "step": 90160 }, { "epoch": 0.58, "learning_rate": 0.00021270322776354258, "loss": 0.0516, "step": 90170 }, { "epoch": 0.58, "learning_rate": 0.00021269354640918566, "loss": 0.0454, "step": 90180 }, { "epoch": 0.58, "learning_rate": 0.00021268386505482874, "loss": 0.0542, "step": 90190 }, { "epoch": 0.58, "learning_rate": 0.0002126741837004718, "loss": 0.0483, "step": 90200 }, { "epoch": 0.58, "learning_rate": 0.00021266450234611484, "loss": 0.0497, "step": 90210 }, { "epoch": 0.58, "learning_rate": 0.00021265482099175792, "loss": 0.0517, "step": 90220 }, { "epoch": 0.58, "learning_rate": 0.00021264513963740097, "loss": 0.0515, "step": 90230 }, { "epoch": 0.58, "learning_rate": 0.00021263545828304405, "loss": 0.0488, "step": 90240 }, { "epoch": 0.58, "learning_rate": 0.00021262577692868713, "loss": 0.0493, "step": 90250 }, { "epoch": 0.58, "learning_rate": 0.00021261609557433021, "loss": 0.0463, "step": 90260 }, { "epoch": 0.58, "learning_rate": 0.00021260641421997327, "loss": 0.0461, "step": 90270 }, { "epoch": 0.58, "learning_rate": 0.00021259673286561632, "loss": 0.0532, "step": 90280 }, { "epoch": 0.58, "learning_rate": 0.0002125870515112594, "loss": 0.0472, "step": 90290 }, { "epoch": 0.58, "learning_rate": 0.00021257737015690245, "loss": 0.0452, "step": 90300 }, { "epoch": 0.58, "learning_rate": 0.00021256768880254553, "loss": 0.0578, "step": 90310 }, { "epoch": 0.58, "learning_rate": 0.0002125580074481886, "loss": 0.0577, "step": 90320 }, { "epoch": 0.58, "learning_rate": 0.0002125483260938317, "loss": 0.0534, "step": 90330 }, { "epoch": 0.58, "learning_rate": 0.00021253864473947474, "loss": 0.0518, "step": 90340 }, { "epoch": 0.58, "learning_rate": 0.0002125289633851178, "loss": 0.0528, "step": 90350 }, { "epoch": 0.58, "learning_rate": 0.00021251928203076085, "loss": 0.0554, "step": 90360 }, { "epoch": 0.58, "learning_rate": 0.00021250960067640393, "loss": 0.0505, "step": 90370 }, { "epoch": 0.58, "learning_rate": 0.000212499919322047, "loss": 0.0485, "step": 90380 }, { "epoch": 0.58, "learning_rate": 0.0002124902379676901, "loss": 0.0504, "step": 90390 }, { "epoch": 0.58, "learning_rate": 0.00021248055661333314, "loss": 0.0462, "step": 90400 }, { "epoch": 0.58, "learning_rate": 0.00021247087525897622, "loss": 0.0508, "step": 90410 }, { "epoch": 0.58, "learning_rate": 0.00021246119390461927, "loss": 0.0552, "step": 90420 }, { "epoch": 0.58, "learning_rate": 0.00021245151255026233, "loss": 0.0415, "step": 90430 }, { "epoch": 0.58, "learning_rate": 0.0002124418311959054, "loss": 0.0486, "step": 90440 }, { "epoch": 0.58, "learning_rate": 0.00021243214984154849, "loss": 0.052, "step": 90450 }, { "epoch": 0.58, "learning_rate": 0.00021242246848719157, "loss": 0.0517, "step": 90460 }, { "epoch": 0.58, "learning_rate": 0.00021241278713283462, "loss": 0.0559, "step": 90470 }, { "epoch": 0.58, "learning_rate": 0.0002124031057784777, "loss": 0.05, "step": 90480 }, { "epoch": 0.58, "learning_rate": 0.00021239342442412075, "loss": 0.0508, "step": 90490 }, { "epoch": 0.58, "learning_rate": 0.0002123837430697638, "loss": 0.0454, "step": 90500 }, { "epoch": 0.58, "learning_rate": 0.00021237406171540688, "loss": 0.0501, "step": 90510 }, { "epoch": 0.58, "learning_rate": 0.00021236438036104996, "loss": 0.0474, "step": 90520 }, { "epoch": 0.58, "learning_rate": 0.00021235469900669304, "loss": 0.0457, "step": 90530 }, { "epoch": 0.58, "learning_rate": 0.0002123450176523361, "loss": 0.049, "step": 90540 }, { "epoch": 0.58, "learning_rate": 0.00021233533629797918, "loss": 0.0512, "step": 90550 }, { "epoch": 0.58, "learning_rate": 0.0002123256549436222, "loss": 0.0469, "step": 90560 }, { "epoch": 0.58, "learning_rate": 0.00021231597358926528, "loss": 0.0553, "step": 90570 }, { "epoch": 0.58, "learning_rate": 0.00021230629223490836, "loss": 0.0468, "step": 90580 }, { "epoch": 0.58, "learning_rate": 0.00021229661088055144, "loss": 0.0458, "step": 90590 }, { "epoch": 0.58, "learning_rate": 0.0002122869295261945, "loss": 0.0467, "step": 90600 }, { "epoch": 0.58, "learning_rate": 0.00021227724817183757, "loss": 0.0498, "step": 90610 }, { "epoch": 0.58, "learning_rate": 0.00021226756681748065, "loss": 0.0591, "step": 90620 }, { "epoch": 0.58, "learning_rate": 0.00021225788546312368, "loss": 0.0484, "step": 90630 }, { "epoch": 0.59, "learning_rate": 0.00021224820410876676, "loss": 0.0445, "step": 90640 }, { "epoch": 0.59, "learning_rate": 0.00021223852275440984, "loss": 0.0564, "step": 90650 }, { "epoch": 0.59, "learning_rate": 0.00021222884140005292, "loss": 0.0522, "step": 90660 }, { "epoch": 0.59, "learning_rate": 0.00021221916004569597, "loss": 0.0515, "step": 90670 }, { "epoch": 0.59, "learning_rate": 0.00021220947869133905, "loss": 0.0505, "step": 90680 }, { "epoch": 0.59, "learning_rate": 0.00021219979733698213, "loss": 0.0424, "step": 90690 }, { "epoch": 0.59, "learning_rate": 0.00021219011598262516, "loss": 0.0464, "step": 90700 }, { "epoch": 0.59, "learning_rate": 0.00021218043462826824, "loss": 0.0443, "step": 90710 }, { "epoch": 0.59, "learning_rate": 0.00021217075327391132, "loss": 0.0468, "step": 90720 }, { "epoch": 0.59, "learning_rate": 0.0002121610719195544, "loss": 0.0441, "step": 90730 }, { "epoch": 0.59, "learning_rate": 0.00021215139056519745, "loss": 0.0515, "step": 90740 }, { "epoch": 0.59, "learning_rate": 0.00021214170921084053, "loss": 0.0489, "step": 90750 }, { "epoch": 0.59, "learning_rate": 0.0002121320278564836, "loss": 0.0552, "step": 90760 }, { "epoch": 0.59, "learning_rate": 0.00021212234650212663, "loss": 0.0487, "step": 90770 }, { "epoch": 0.59, "learning_rate": 0.0002121126651477697, "loss": 0.0467, "step": 90780 }, { "epoch": 0.59, "learning_rate": 0.0002121029837934128, "loss": 0.0475, "step": 90790 }, { "epoch": 0.59, "learning_rate": 0.00021209330243905585, "loss": 0.0526, "step": 90800 }, { "epoch": 0.59, "learning_rate": 0.00021208362108469892, "loss": 0.0482, "step": 90810 }, { "epoch": 0.59, "learning_rate": 0.000212073939730342, "loss": 0.0457, "step": 90820 }, { "epoch": 0.59, "learning_rate": 0.00021206425837598508, "loss": 0.0469, "step": 90830 }, { "epoch": 0.59, "learning_rate": 0.0002120545770216281, "loss": 0.0524, "step": 90840 }, { "epoch": 0.59, "learning_rate": 0.0002120448956672712, "loss": 0.0576, "step": 90850 }, { "epoch": 0.59, "learning_rate": 0.00021203521431291427, "loss": 0.0503, "step": 90860 }, { "epoch": 0.59, "learning_rate": 0.00021202553295855732, "loss": 0.0461, "step": 90870 }, { "epoch": 0.59, "learning_rate": 0.0002120158516042004, "loss": 0.0451, "step": 90880 }, { "epoch": 0.59, "learning_rate": 0.00021200617024984348, "loss": 0.0511, "step": 90890 }, { "epoch": 0.59, "learning_rate": 0.00021199648889548656, "loss": 0.0453, "step": 90900 }, { "epoch": 0.59, "learning_rate": 0.0002119868075411296, "loss": 0.047, "step": 90910 }, { "epoch": 0.59, "learning_rate": 0.00021197712618677267, "loss": 0.0459, "step": 90920 }, { "epoch": 0.59, "learning_rate": 0.00021196744483241575, "loss": 0.0481, "step": 90930 }, { "epoch": 0.59, "learning_rate": 0.0002119577634780588, "loss": 0.0467, "step": 90940 }, { "epoch": 0.59, "learning_rate": 0.00021194808212370188, "loss": 0.0501, "step": 90950 }, { "epoch": 0.59, "learning_rate": 0.00021193840076934496, "loss": 0.0442, "step": 90960 }, { "epoch": 0.59, "learning_rate": 0.000211928719414988, "loss": 0.0472, "step": 90970 }, { "epoch": 0.59, "learning_rate": 0.00021191903806063106, "loss": 0.0452, "step": 90980 }, { "epoch": 0.59, "learning_rate": 0.00021190935670627414, "loss": 0.0497, "step": 90990 }, { "epoch": 0.59, "learning_rate": 0.0002118996753519172, "loss": 0.0477, "step": 91000 }, { "epoch": 0.59, "eval_cer": 0.9199819229465597, "eval_loss": 0.03264106065034866, "eval_runtime": 119.6718, "eval_samples_per_second": 16.712, "eval_steps_per_second": 4.178, "step": 91000 }, { "epoch": 0.59, "learning_rate": 0.00021188999399756028, "loss": 0.056, "step": 91010 }, { "epoch": 0.59, "learning_rate": 0.00021188031264320336, "loss": 0.0529, "step": 91020 }, { "epoch": 0.59, "learning_rate": 0.00021187063128884644, "loss": 0.0468, "step": 91030 }, { "epoch": 0.59, "learning_rate": 0.0002118609499344895, "loss": 0.0472, "step": 91040 }, { "epoch": 0.59, "learning_rate": 0.00021185126858013254, "loss": 0.0527, "step": 91050 }, { "epoch": 0.59, "learning_rate": 0.00021184158722577562, "loss": 0.0541, "step": 91060 }, { "epoch": 0.59, "learning_rate": 0.00021183190587141867, "loss": 0.0429, "step": 91070 }, { "epoch": 0.59, "learning_rate": 0.00021182222451706175, "loss": 0.0446, "step": 91080 }, { "epoch": 0.59, "learning_rate": 0.00021181254316270483, "loss": 0.0524, "step": 91090 }, { "epoch": 0.59, "learning_rate": 0.00021180286180834791, "loss": 0.0433, "step": 91100 }, { "epoch": 0.59, "learning_rate": 0.00021179318045399097, "loss": 0.0505, "step": 91110 }, { "epoch": 0.59, "learning_rate": 0.00021178349909963402, "loss": 0.054, "step": 91120 }, { "epoch": 0.59, "learning_rate": 0.0002117738177452771, "loss": 0.0486, "step": 91130 }, { "epoch": 0.59, "learning_rate": 0.00021176413639092015, "loss": 0.0462, "step": 91140 }, { "epoch": 0.59, "learning_rate": 0.00021175445503656323, "loss": 0.0481, "step": 91150 }, { "epoch": 0.59, "learning_rate": 0.0002117447736822063, "loss": 0.0505, "step": 91160 }, { "epoch": 0.59, "learning_rate": 0.00021173509232784936, "loss": 0.0531, "step": 91170 }, { "epoch": 0.59, "learning_rate": 0.00021172541097349244, "loss": 0.0476, "step": 91180 }, { "epoch": 0.59, "learning_rate": 0.0002117157296191355, "loss": 0.0498, "step": 91190 }, { "epoch": 0.59, "learning_rate": 0.00021170604826477855, "loss": 0.0485, "step": 91200 }, { "epoch": 0.59, "learning_rate": 0.00021169636691042163, "loss": 0.0466, "step": 91210 }, { "epoch": 0.59, "learning_rate": 0.0002116866855560647, "loss": 0.0466, "step": 91220 }, { "epoch": 0.59, "learning_rate": 0.0002116770042017078, "loss": 0.0501, "step": 91230 }, { "epoch": 0.59, "learning_rate": 0.00021166732284735084, "loss": 0.0461, "step": 91240 }, { "epoch": 0.59, "learning_rate": 0.00021165764149299392, "loss": 0.0438, "step": 91250 }, { "epoch": 0.59, "learning_rate": 0.00021164796013863697, "loss": 0.0458, "step": 91260 }, { "epoch": 0.59, "learning_rate": 0.00021163827878428003, "loss": 0.0465, "step": 91270 }, { "epoch": 0.59, "learning_rate": 0.0002116285974299231, "loss": 0.0528, "step": 91280 }, { "epoch": 0.59, "learning_rate": 0.00021161891607556619, "loss": 0.0629, "step": 91290 }, { "epoch": 0.59, "learning_rate": 0.00021160923472120927, "loss": 0.0443, "step": 91300 }, { "epoch": 0.59, "learning_rate": 0.00021159955336685232, "loss": 0.0418, "step": 91310 }, { "epoch": 0.59, "learning_rate": 0.0002115898720124954, "loss": 0.051, "step": 91320 }, { "epoch": 0.59, "learning_rate": 0.00021158019065813845, "loss": 0.0489, "step": 91330 }, { "epoch": 0.59, "learning_rate": 0.0002115705093037815, "loss": 0.0514, "step": 91340 }, { "epoch": 0.59, "learning_rate": 0.00021156082794942458, "loss": 0.0498, "step": 91350 }, { "epoch": 0.59, "learning_rate": 0.00021155114659506766, "loss": 0.0522, "step": 91360 }, { "epoch": 0.59, "learning_rate": 0.00021154146524071072, "loss": 0.0533, "step": 91370 }, { "epoch": 0.59, "learning_rate": 0.0002115317838863538, "loss": 0.0489, "step": 91380 }, { "epoch": 0.59, "learning_rate": 0.00021152210253199688, "loss": 0.0494, "step": 91390 }, { "epoch": 0.59, "learning_rate": 0.0002115124211776399, "loss": 0.0494, "step": 91400 }, { "epoch": 0.59, "learning_rate": 0.00021150273982328298, "loss": 0.0682, "step": 91410 }, { "epoch": 0.59, "learning_rate": 0.00021149305846892606, "loss": 0.0581, "step": 91420 }, { "epoch": 0.59, "learning_rate": 0.00021148337711456914, "loss": 0.0529, "step": 91430 }, { "epoch": 0.59, "learning_rate": 0.0002114736957602122, "loss": 0.0519, "step": 91440 }, { "epoch": 0.59, "learning_rate": 0.00021146401440585527, "loss": 0.048, "step": 91450 }, { "epoch": 0.59, "learning_rate": 0.00021145433305149835, "loss": 0.0517, "step": 91460 }, { "epoch": 0.59, "learning_rate": 0.00021144465169714138, "loss": 0.0518, "step": 91470 }, { "epoch": 0.59, "learning_rate": 0.00021143497034278446, "loss": 0.0509, "step": 91480 }, { "epoch": 0.59, "learning_rate": 0.00021142528898842754, "loss": 0.054, "step": 91490 }, { "epoch": 0.59, "learning_rate": 0.00021141560763407062, "loss": 0.0419, "step": 91500 }, { "epoch": 0.59, "learning_rate": 0.00021140592627971367, "loss": 0.049, "step": 91510 }, { "epoch": 0.59, "learning_rate": 0.00021139624492535675, "loss": 0.048, "step": 91520 }, { "epoch": 0.59, "learning_rate": 0.00021138656357099983, "loss": 0.0517, "step": 91530 }, { "epoch": 0.59, "learning_rate": 0.00021137688221664286, "loss": 0.0512, "step": 91540 }, { "epoch": 0.59, "learning_rate": 0.00021136720086228594, "loss": 0.0492, "step": 91550 }, { "epoch": 0.59, "learning_rate": 0.00021135751950792901, "loss": 0.0592, "step": 91560 }, { "epoch": 0.59, "learning_rate": 0.00021134783815357207, "loss": 0.0502, "step": 91570 }, { "epoch": 0.59, "learning_rate": 0.00021133815679921515, "loss": 0.0492, "step": 91580 }, { "epoch": 0.59, "learning_rate": 0.00021132847544485823, "loss": 0.0541, "step": 91590 }, { "epoch": 0.59, "learning_rate": 0.0002113187940905013, "loss": 0.0474, "step": 91600 }, { "epoch": 0.59, "learning_rate": 0.00021130911273614433, "loss": 0.0472, "step": 91610 }, { "epoch": 0.59, "learning_rate": 0.0002112994313817874, "loss": 0.0542, "step": 91620 }, { "epoch": 0.59, "learning_rate": 0.0002112897500274305, "loss": 0.0559, "step": 91630 }, { "epoch": 0.59, "learning_rate": 0.00021128006867307354, "loss": 0.0537, "step": 91640 }, { "epoch": 0.59, "learning_rate": 0.00021127038731871662, "loss": 0.0525, "step": 91650 }, { "epoch": 0.59, "learning_rate": 0.0002112607059643597, "loss": 0.0582, "step": 91660 }, { "epoch": 0.59, "learning_rate": 0.00021125102461000278, "loss": 0.0511, "step": 91670 }, { "epoch": 0.59, "learning_rate": 0.0002112413432556458, "loss": 0.0542, "step": 91680 }, { "epoch": 0.59, "learning_rate": 0.0002112316619012889, "loss": 0.052, "step": 91690 }, { "epoch": 0.59, "learning_rate": 0.00021122198054693197, "loss": 0.046, "step": 91700 }, { "epoch": 0.59, "learning_rate": 0.00021121229919257502, "loss": 0.0452, "step": 91710 }, { "epoch": 0.59, "learning_rate": 0.0002112026178382181, "loss": 0.0485, "step": 91720 }, { "epoch": 0.59, "learning_rate": 0.00021119293648386118, "loss": 0.046, "step": 91730 }, { "epoch": 0.59, "learning_rate": 0.00021118325512950423, "loss": 0.0452, "step": 91740 }, { "epoch": 0.59, "learning_rate": 0.0002111735737751473, "loss": 0.0517, "step": 91750 }, { "epoch": 0.59, "learning_rate": 0.00021116389242079037, "loss": 0.0489, "step": 91760 }, { "epoch": 0.59, "learning_rate": 0.00021115421106643342, "loss": 0.0497, "step": 91770 }, { "epoch": 0.59, "learning_rate": 0.0002111445297120765, "loss": 0.0536, "step": 91780 }, { "epoch": 0.59, "learning_rate": 0.00021113484835771958, "loss": 0.0472, "step": 91790 }, { "epoch": 0.59, "learning_rate": 0.00021112516700336266, "loss": 0.0498, "step": 91800 }, { "epoch": 0.59, "learning_rate": 0.0002111154856490057, "loss": 0.0537, "step": 91810 }, { "epoch": 0.59, "learning_rate": 0.00021110580429464876, "loss": 0.0404, "step": 91820 }, { "epoch": 0.59, "learning_rate": 0.00021109612294029184, "loss": 0.0606, "step": 91830 }, { "epoch": 0.59, "learning_rate": 0.0002110864415859349, "loss": 0.0515, "step": 91840 }, { "epoch": 0.59, "learning_rate": 0.00021107676023157798, "loss": 0.0516, "step": 91850 }, { "epoch": 0.59, "learning_rate": 0.00021106707887722106, "loss": 0.0461, "step": 91860 }, { "epoch": 0.59, "learning_rate": 0.00021105739752286414, "loss": 0.0633, "step": 91870 }, { "epoch": 0.59, "learning_rate": 0.0002110477161685072, "loss": 0.0486, "step": 91880 }, { "epoch": 0.59, "learning_rate": 0.00021103803481415024, "loss": 0.048, "step": 91890 }, { "epoch": 0.59, "learning_rate": 0.00021102835345979332, "loss": 0.0479, "step": 91900 }, { "epoch": 0.59, "learning_rate": 0.00021101867210543637, "loss": 0.0496, "step": 91910 }, { "epoch": 0.59, "learning_rate": 0.00021100899075107945, "loss": 0.0539, "step": 91920 }, { "epoch": 0.59, "learning_rate": 0.00021099930939672253, "loss": 0.049, "step": 91930 }, { "epoch": 0.59, "learning_rate": 0.00021098962804236559, "loss": 0.0505, "step": 91940 }, { "epoch": 0.59, "learning_rate": 0.00021097994668800867, "loss": 0.0507, "step": 91950 }, { "epoch": 0.59, "learning_rate": 0.00021097026533365172, "loss": 0.0503, "step": 91960 }, { "epoch": 0.59, "learning_rate": 0.00021096058397929477, "loss": 0.0507, "step": 91970 }, { "epoch": 0.59, "learning_rate": 0.00021095090262493785, "loss": 0.0574, "step": 91980 }, { "epoch": 0.59, "learning_rate": 0.00021094122127058093, "loss": 0.0533, "step": 91990 }, { "epoch": 0.59, "learning_rate": 0.000210931539916224, "loss": 0.046, "step": 92000 }, { "epoch": 0.59, "eval_cer": 0.9200949045305615, "eval_loss": 0.03254178166389465, "eval_runtime": 119.8756, "eval_samples_per_second": 16.684, "eval_steps_per_second": 4.171, "step": 92000 }, { "epoch": 0.59, "learning_rate": 0.00021092185856186706, "loss": 0.0445, "step": 92010 }, { "epoch": 0.59, "learning_rate": 0.00021091217720751014, "loss": 0.0458, "step": 92020 }, { "epoch": 0.59, "learning_rate": 0.0002109024958531532, "loss": 0.0502, "step": 92030 }, { "epoch": 0.59, "learning_rate": 0.00021089281449879625, "loss": 0.0528, "step": 92040 }, { "epoch": 0.59, "learning_rate": 0.00021088313314443933, "loss": 0.0521, "step": 92050 }, { "epoch": 0.59, "learning_rate": 0.0002108734517900824, "loss": 0.0571, "step": 92060 }, { "epoch": 0.59, "learning_rate": 0.0002108637704357255, "loss": 0.0488, "step": 92070 }, { "epoch": 0.59, "learning_rate": 0.00021085408908136854, "loss": 0.0457, "step": 92080 }, { "epoch": 0.59, "learning_rate": 0.00021084440772701162, "loss": 0.0514, "step": 92090 }, { "epoch": 0.59, "learning_rate": 0.00021083472637265467, "loss": 0.0479, "step": 92100 }, { "epoch": 0.59, "learning_rate": 0.00021082504501829773, "loss": 0.0509, "step": 92110 }, { "epoch": 0.59, "learning_rate": 0.0002108153636639408, "loss": 0.0438, "step": 92120 }, { "epoch": 0.59, "learning_rate": 0.00021080568230958389, "loss": 0.0483, "step": 92130 }, { "epoch": 0.59, "learning_rate": 0.00021079600095522694, "loss": 0.0515, "step": 92140 }, { "epoch": 0.59, "learning_rate": 0.00021078631960087002, "loss": 0.0504, "step": 92150 }, { "epoch": 0.59, "learning_rate": 0.0002107766382465131, "loss": 0.0476, "step": 92160 }, { "epoch": 0.59, "learning_rate": 0.00021076695689215612, "loss": 0.0458, "step": 92170 }, { "epoch": 0.59, "learning_rate": 0.0002107572755377992, "loss": 0.049, "step": 92180 }, { "epoch": 0.6, "learning_rate": 0.00021074759418344228, "loss": 0.0449, "step": 92190 }, { "epoch": 0.6, "learning_rate": 0.00021073791282908536, "loss": 0.0426, "step": 92200 }, { "epoch": 0.6, "learning_rate": 0.00021072823147472842, "loss": 0.0565, "step": 92210 }, { "epoch": 0.6, "learning_rate": 0.0002107185501203715, "loss": 0.0472, "step": 92220 }, { "epoch": 0.6, "learning_rate": 0.00021070886876601457, "loss": 0.0489, "step": 92230 }, { "epoch": 0.6, "learning_rate": 0.0002106991874116576, "loss": 0.0495, "step": 92240 }, { "epoch": 0.6, "learning_rate": 0.00021068950605730068, "loss": 0.049, "step": 92250 }, { "epoch": 0.6, "learning_rate": 0.00021067982470294376, "loss": 0.0475, "step": 92260 }, { "epoch": 0.6, "learning_rate": 0.00021067014334858684, "loss": 0.043, "step": 92270 }, { "epoch": 0.6, "learning_rate": 0.0002106604619942299, "loss": 0.0543, "step": 92280 }, { "epoch": 0.6, "learning_rate": 0.00021065078063987297, "loss": 0.0463, "step": 92290 }, { "epoch": 0.6, "learning_rate": 0.00021064109928551605, "loss": 0.0455, "step": 92300 }, { "epoch": 0.6, "learning_rate": 0.00021063141793115908, "loss": 0.0449, "step": 92310 }, { "epoch": 0.6, "learning_rate": 0.00021062173657680216, "loss": 0.0604, "step": 92320 }, { "epoch": 0.6, "learning_rate": 0.00021061205522244524, "loss": 0.0475, "step": 92330 }, { "epoch": 0.6, "learning_rate": 0.0002106023738680883, "loss": 0.0466, "step": 92340 }, { "epoch": 0.6, "learning_rate": 0.00021059269251373137, "loss": 0.0513, "step": 92350 }, { "epoch": 0.6, "learning_rate": 0.00021058301115937445, "loss": 0.0567, "step": 92360 }, { "epoch": 0.6, "learning_rate": 0.00021057332980501753, "loss": 0.0552, "step": 92370 }, { "epoch": 0.6, "learning_rate": 0.00021056364845066055, "loss": 0.0534, "step": 92380 }, { "epoch": 0.6, "learning_rate": 0.00021055396709630363, "loss": 0.0448, "step": 92390 }, { "epoch": 0.6, "learning_rate": 0.00021054428574194671, "loss": 0.0477, "step": 92400 }, { "epoch": 0.6, "learning_rate": 0.00021053460438758977, "loss": 0.0485, "step": 92410 }, { "epoch": 0.6, "learning_rate": 0.00021052492303323285, "loss": 0.0528, "step": 92420 }, { "epoch": 0.6, "learning_rate": 0.00021051524167887593, "loss": 0.0484, "step": 92430 }, { "epoch": 0.6, "learning_rate": 0.000210505560324519, "loss": 0.049, "step": 92440 }, { "epoch": 0.6, "learning_rate": 0.00021049587897016203, "loss": 0.0463, "step": 92450 }, { "epoch": 0.6, "learning_rate": 0.0002104861976158051, "loss": 0.0531, "step": 92460 }, { "epoch": 0.6, "learning_rate": 0.0002104765162614482, "loss": 0.0471, "step": 92470 }, { "epoch": 0.6, "learning_rate": 0.00021046683490709124, "loss": 0.0473, "step": 92480 }, { "epoch": 0.6, "learning_rate": 0.00021045715355273432, "loss": 0.0518, "step": 92490 }, { "epoch": 0.6, "learning_rate": 0.0002104474721983774, "loss": 0.053, "step": 92500 }, { "epoch": 0.6, "learning_rate": 0.00021043779084402048, "loss": 0.0507, "step": 92510 }, { "epoch": 0.6, "learning_rate": 0.0002104281094896635, "loss": 0.0484, "step": 92520 }, { "epoch": 0.6, "learning_rate": 0.0002104184281353066, "loss": 0.0447, "step": 92530 }, { "epoch": 0.6, "learning_rate": 0.00021040874678094964, "loss": 0.0584, "step": 92540 }, { "epoch": 0.6, "learning_rate": 0.00021039906542659272, "loss": 0.0502, "step": 92550 }, { "epoch": 0.6, "learning_rate": 0.0002103893840722358, "loss": 0.0454, "step": 92560 }, { "epoch": 0.6, "learning_rate": 0.00021037970271787888, "loss": 0.0462, "step": 92570 }, { "epoch": 0.6, "learning_rate": 0.00021037002136352193, "loss": 0.0464, "step": 92580 }, { "epoch": 0.6, "learning_rate": 0.000210360340009165, "loss": 0.045, "step": 92590 }, { "epoch": 0.6, "learning_rate": 0.00021035065865480807, "loss": 0.0529, "step": 92600 }, { "epoch": 0.6, "learning_rate": 0.00021034097730045112, "loss": 0.0531, "step": 92610 }, { "epoch": 0.6, "learning_rate": 0.0002103312959460942, "loss": 0.0426, "step": 92620 }, { "epoch": 0.6, "learning_rate": 0.00021032161459173728, "loss": 0.0457, "step": 92630 }, { "epoch": 0.6, "learning_rate": 0.00021031193323738036, "loss": 0.0523, "step": 92640 }, { "epoch": 0.6, "learning_rate": 0.0002103022518830234, "loss": 0.0678, "step": 92650 }, { "epoch": 0.6, "learning_rate": 0.00021029257052866646, "loss": 0.0532, "step": 92660 }, { "epoch": 0.6, "learning_rate": 0.00021028288917430954, "loss": 0.0492, "step": 92670 }, { "epoch": 0.6, "learning_rate": 0.0002102732078199526, "loss": 0.0506, "step": 92680 }, { "epoch": 0.6, "learning_rate": 0.00021026352646559568, "loss": 0.0488, "step": 92690 }, { "epoch": 0.6, "learning_rate": 0.00021025384511123876, "loss": 0.0459, "step": 92700 }, { "epoch": 0.6, "learning_rate": 0.00021024416375688184, "loss": 0.0559, "step": 92710 }, { "epoch": 0.6, "learning_rate": 0.0002102344824025249, "loss": 0.0514, "step": 92720 }, { "epoch": 0.6, "learning_rate": 0.00021022480104816794, "loss": 0.0515, "step": 92730 }, { "epoch": 0.6, "learning_rate": 0.000210215119693811, "loss": 0.0467, "step": 92740 }, { "epoch": 0.6, "learning_rate": 0.00021020543833945407, "loss": 0.043, "step": 92750 }, { "epoch": 0.6, "learning_rate": 0.00021019575698509715, "loss": 0.0517, "step": 92760 }, { "epoch": 0.6, "learning_rate": 0.00021018607563074023, "loss": 0.052, "step": 92770 }, { "epoch": 0.6, "learning_rate": 0.00021017639427638329, "loss": 0.0475, "step": 92780 }, { "epoch": 0.6, "learning_rate": 0.00021016671292202637, "loss": 0.0493, "step": 92790 }, { "epoch": 0.6, "learning_rate": 0.00021015703156766942, "loss": 0.0417, "step": 92800 }, { "epoch": 0.6, "learning_rate": 0.00021014735021331247, "loss": 0.046, "step": 92810 }, { "epoch": 0.6, "learning_rate": 0.00021013766885895555, "loss": 0.0434, "step": 92820 }, { "epoch": 0.6, "learning_rate": 0.00021012798750459863, "loss": 0.045, "step": 92830 }, { "epoch": 0.6, "learning_rate": 0.0002101183061502417, "loss": 0.0453, "step": 92840 }, { "epoch": 0.6, "learning_rate": 0.00021010862479588476, "loss": 0.0497, "step": 92850 }, { "epoch": 0.6, "learning_rate": 0.00021009894344152784, "loss": 0.0501, "step": 92860 }, { "epoch": 0.6, "learning_rate": 0.0002100892620871709, "loss": 0.0499, "step": 92870 }, { "epoch": 0.6, "learning_rate": 0.00021007958073281395, "loss": 0.0563, "step": 92880 }, { "epoch": 0.6, "learning_rate": 0.00021006989937845703, "loss": 0.0472, "step": 92890 }, { "epoch": 0.6, "learning_rate": 0.0002100602180241001, "loss": 0.0569, "step": 92900 }, { "epoch": 0.6, "learning_rate": 0.0002100505366697432, "loss": 0.0529, "step": 92910 }, { "epoch": 0.6, "learning_rate": 0.00021004085531538624, "loss": 0.0555, "step": 92920 }, { "epoch": 0.6, "learning_rate": 0.00021003117396102932, "loss": 0.0436, "step": 92930 }, { "epoch": 0.6, "learning_rate": 0.00021002149260667237, "loss": 0.0453, "step": 92940 }, { "epoch": 0.6, "learning_rate": 0.00021001181125231543, "loss": 0.0428, "step": 92950 }, { "epoch": 0.6, "learning_rate": 0.0002100021298979585, "loss": 0.0493, "step": 92960 }, { "epoch": 0.6, "learning_rate": 0.00020999244854360158, "loss": 0.0481, "step": 92970 }, { "epoch": 0.6, "learning_rate": 0.00020998276718924464, "loss": 0.0458, "step": 92980 }, { "epoch": 0.6, "learning_rate": 0.00020997308583488772, "loss": 0.0525, "step": 92990 }, { "epoch": 0.6, "learning_rate": 0.00020996340448053077, "loss": 0.0545, "step": 93000 }, { "epoch": 0.6, "eval_cer": 0.9199846345045758, "eval_loss": 0.032582107931375504, "eval_runtime": 120.1286, "eval_samples_per_second": 16.649, "eval_steps_per_second": 4.162, "step": 93000 }, { "epoch": 0.6, "learning_rate": 0.00020995372312617382, "loss": 0.0485, "step": 93010 }, { "epoch": 0.6, "learning_rate": 0.0002099440417718169, "loss": 0.0466, "step": 93020 }, { "epoch": 0.6, "learning_rate": 0.00020993436041745998, "loss": 0.0516, "step": 93030 }, { "epoch": 0.6, "learning_rate": 0.00020992467906310306, "loss": 0.0437, "step": 93040 }, { "epoch": 0.6, "learning_rate": 0.00020991499770874611, "loss": 0.0578, "step": 93050 }, { "epoch": 0.6, "learning_rate": 0.0002099053163543892, "loss": 0.0552, "step": 93060 }, { "epoch": 0.6, "learning_rate": 0.00020989563500003225, "loss": 0.0467, "step": 93070 }, { "epoch": 0.6, "learning_rate": 0.0002098859536456753, "loss": 0.0512, "step": 93080 }, { "epoch": 0.6, "learning_rate": 0.00020987627229131838, "loss": 0.0482, "step": 93090 }, { "epoch": 0.6, "learning_rate": 0.00020986659093696146, "loss": 0.0494, "step": 93100 }, { "epoch": 0.6, "learning_rate": 0.00020985690958260454, "loss": 0.0499, "step": 93110 }, { "epoch": 0.6, "learning_rate": 0.0002098472282282476, "loss": 0.0539, "step": 93120 }, { "epoch": 0.6, "learning_rate": 0.00020983754687389067, "loss": 0.0462, "step": 93130 }, { "epoch": 0.6, "learning_rate": 0.00020982786551953372, "loss": 0.0451, "step": 93140 }, { "epoch": 0.6, "learning_rate": 0.00020981818416517678, "loss": 0.0465, "step": 93150 }, { "epoch": 0.6, "learning_rate": 0.00020980850281081986, "loss": 0.0497, "step": 93160 }, { "epoch": 0.6, "learning_rate": 0.00020979882145646294, "loss": 0.0473, "step": 93170 }, { "epoch": 0.6, "learning_rate": 0.000209789140102106, "loss": 0.0426, "step": 93180 }, { "epoch": 0.6, "learning_rate": 0.00020977945874774907, "loss": 0.0486, "step": 93190 }, { "epoch": 0.6, "learning_rate": 0.00020976977739339215, "loss": 0.0478, "step": 93200 }, { "epoch": 0.6, "learning_rate": 0.00020976009603903517, "loss": 0.0504, "step": 93210 }, { "epoch": 0.6, "learning_rate": 0.00020975041468467825, "loss": 0.0478, "step": 93220 }, { "epoch": 0.6, "learning_rate": 0.00020974073333032133, "loss": 0.0476, "step": 93230 }, { "epoch": 0.6, "learning_rate": 0.00020973105197596441, "loss": 0.0446, "step": 93240 }, { "epoch": 0.6, "learning_rate": 0.00020972137062160747, "loss": 0.0489, "step": 93250 }, { "epoch": 0.6, "learning_rate": 0.00020971168926725055, "loss": 0.0434, "step": 93260 }, { "epoch": 0.6, "learning_rate": 0.00020970200791289363, "loss": 0.0527, "step": 93270 }, { "epoch": 0.6, "learning_rate": 0.00020969232655853665, "loss": 0.0471, "step": 93280 }, { "epoch": 0.6, "learning_rate": 0.00020968264520417973, "loss": 0.0532, "step": 93290 }, { "epoch": 0.6, "learning_rate": 0.0002096729638498228, "loss": 0.0472, "step": 93300 }, { "epoch": 0.6, "learning_rate": 0.0002096632824954659, "loss": 0.0506, "step": 93310 }, { "epoch": 0.6, "learning_rate": 0.00020965360114110894, "loss": 0.0429, "step": 93320 }, { "epoch": 0.6, "learning_rate": 0.00020964391978675202, "loss": 0.0497, "step": 93330 }, { "epoch": 0.6, "learning_rate": 0.0002096342384323951, "loss": 0.0468, "step": 93340 }, { "epoch": 0.6, "learning_rate": 0.00020962455707803813, "loss": 0.0456, "step": 93350 }, { "epoch": 0.6, "learning_rate": 0.0002096148757236812, "loss": 0.0515, "step": 93360 }, { "epoch": 0.6, "learning_rate": 0.0002096051943693243, "loss": 0.0552, "step": 93370 }, { "epoch": 0.6, "learning_rate": 0.00020959551301496734, "loss": 0.0444, "step": 93380 }, { "epoch": 0.6, "learning_rate": 0.00020958583166061042, "loss": 0.0413, "step": 93390 }, { "epoch": 0.6, "learning_rate": 0.0002095761503062535, "loss": 0.0435, "step": 93400 }, { "epoch": 0.6, "learning_rate": 0.00020956646895189658, "loss": 0.0472, "step": 93410 }, { "epoch": 0.6, "learning_rate": 0.0002095567875975396, "loss": 0.0498, "step": 93420 }, { "epoch": 0.6, "learning_rate": 0.00020954710624318269, "loss": 0.044, "step": 93430 }, { "epoch": 0.6, "learning_rate": 0.00020953742488882577, "loss": 0.0432, "step": 93440 }, { "epoch": 0.6, "learning_rate": 0.00020952774353446882, "loss": 0.05, "step": 93450 }, { "epoch": 0.6, "learning_rate": 0.0002095180621801119, "loss": 0.0461, "step": 93460 }, { "epoch": 0.6, "learning_rate": 0.00020950838082575498, "loss": 0.0469, "step": 93470 }, { "epoch": 0.6, "learning_rate": 0.00020949869947139806, "loss": 0.0506, "step": 93480 }, { "epoch": 0.6, "learning_rate": 0.00020948901811704108, "loss": 0.0404, "step": 93490 }, { "epoch": 0.6, "learning_rate": 0.00020947933676268416, "loss": 0.0529, "step": 93500 }, { "epoch": 0.6, "learning_rate": 0.00020946965540832724, "loss": 0.0501, "step": 93510 }, { "epoch": 0.6, "learning_rate": 0.0002094599740539703, "loss": 0.0453, "step": 93520 }, { "epoch": 0.6, "learning_rate": 0.00020945029269961338, "loss": 0.0504, "step": 93530 }, { "epoch": 0.6, "learning_rate": 0.00020944061134525646, "loss": 0.0497, "step": 93540 }, { "epoch": 0.6, "learning_rate": 0.0002094309299908995, "loss": 0.0523, "step": 93550 }, { "epoch": 0.6, "learning_rate": 0.00020942124863654256, "loss": 0.0538, "step": 93560 }, { "epoch": 0.6, "learning_rate": 0.00020941156728218564, "loss": 0.0496, "step": 93570 }, { "epoch": 0.6, "learning_rate": 0.0002094018859278287, "loss": 0.045, "step": 93580 }, { "epoch": 0.6, "learning_rate": 0.00020939220457347177, "loss": 0.0509, "step": 93590 }, { "epoch": 0.6, "learning_rate": 0.00020938252321911485, "loss": 0.0492, "step": 93600 }, { "epoch": 0.6, "learning_rate": 0.00020937284186475793, "loss": 0.0528, "step": 93610 }, { "epoch": 0.6, "learning_rate": 0.00020936316051040099, "loss": 0.0524, "step": 93620 }, { "epoch": 0.6, "learning_rate": 0.00020935347915604404, "loss": 0.0452, "step": 93630 }, { "epoch": 0.6, "learning_rate": 0.00020934379780168712, "loss": 0.0497, "step": 93640 }, { "epoch": 0.6, "learning_rate": 0.00020933411644733017, "loss": 0.0479, "step": 93650 }, { "epoch": 0.6, "learning_rate": 0.00020932443509297325, "loss": 0.0486, "step": 93660 }, { "epoch": 0.6, "learning_rate": 0.00020931475373861633, "loss": 0.0582, "step": 93670 }, { "epoch": 0.6, "learning_rate": 0.0002093050723842594, "loss": 0.0484, "step": 93680 }, { "epoch": 0.6, "learning_rate": 0.00020929539102990246, "loss": 0.0523, "step": 93690 }, { "epoch": 0.6, "learning_rate": 0.00020928570967554552, "loss": 0.0514, "step": 93700 }, { "epoch": 0.6, "learning_rate": 0.0002092760283211886, "loss": 0.0475, "step": 93710 }, { "epoch": 0.6, "learning_rate": 0.00020926634696683165, "loss": 0.0447, "step": 93720 }, { "epoch": 0.6, "learning_rate": 0.00020925666561247473, "loss": 0.0442, "step": 93730 }, { "epoch": 0.61, "learning_rate": 0.0002092469842581178, "loss": 0.0457, "step": 93740 }, { "epoch": 0.61, "learning_rate": 0.00020923730290376086, "loss": 0.0476, "step": 93750 }, { "epoch": 0.61, "learning_rate": 0.00020922762154940394, "loss": 0.0557, "step": 93760 }, { "epoch": 0.61, "learning_rate": 0.000209217940195047, "loss": 0.0442, "step": 93770 }, { "epoch": 0.61, "learning_rate": 0.00020920825884069005, "loss": 0.0426, "step": 93780 }, { "epoch": 0.61, "learning_rate": 0.00020919857748633312, "loss": 0.0437, "step": 93790 }, { "epoch": 0.61, "learning_rate": 0.0002091888961319762, "loss": 0.0464, "step": 93800 }, { "epoch": 0.61, "learning_rate": 0.00020917921477761928, "loss": 0.0566, "step": 93810 }, { "epoch": 0.61, "learning_rate": 0.00020916953342326234, "loss": 0.0411, "step": 93820 }, { "epoch": 0.61, "learning_rate": 0.00020915985206890542, "loss": 0.0572, "step": 93830 }, { "epoch": 0.61, "learning_rate": 0.00020915017071454847, "loss": 0.0462, "step": 93840 }, { "epoch": 0.61, "learning_rate": 0.00020914048936019152, "loss": 0.0505, "step": 93850 }, { "epoch": 0.61, "learning_rate": 0.0002091308080058346, "loss": 0.0532, "step": 93860 }, { "epoch": 0.61, "learning_rate": 0.00020912112665147768, "loss": 0.0642, "step": 93870 }, { "epoch": 0.61, "learning_rate": 0.00020911144529712076, "loss": 0.0502, "step": 93880 }, { "epoch": 0.61, "learning_rate": 0.00020910176394276381, "loss": 0.0464, "step": 93890 }, { "epoch": 0.61, "learning_rate": 0.0002090920825884069, "loss": 0.0494, "step": 93900 }, { "epoch": 0.61, "learning_rate": 0.00020908240123404995, "loss": 0.053, "step": 93910 }, { "epoch": 0.61, "learning_rate": 0.000209072719879693, "loss": 0.0442, "step": 93920 }, { "epoch": 0.61, "learning_rate": 0.00020906303852533608, "loss": 0.0465, "step": 93930 }, { "epoch": 0.61, "learning_rate": 0.00020905335717097916, "loss": 0.0621, "step": 93940 }, { "epoch": 0.61, "learning_rate": 0.0002090436758166222, "loss": 0.0483, "step": 93950 }, { "epoch": 0.61, "learning_rate": 0.0002090339944622653, "loss": 0.0527, "step": 93960 }, { "epoch": 0.61, "learning_rate": 0.00020902431310790837, "loss": 0.0465, "step": 93970 }, { "epoch": 0.61, "learning_rate": 0.0002090146317535514, "loss": 0.0564, "step": 93980 }, { "epoch": 0.61, "learning_rate": 0.00020900495039919448, "loss": 0.0523, "step": 93990 }, { "epoch": 0.61, "learning_rate": 0.00020899526904483756, "loss": 0.0473, "step": 94000 }, { "epoch": 0.61, "eval_cer": 0.920060558129025, "eval_loss": 0.03265640139579773, "eval_runtime": 119.8353, "eval_samples_per_second": 16.69, "eval_steps_per_second": 4.172, "step": 94000 }, { "epoch": 0.61, "learning_rate": 0.00020898558769048064, "loss": 0.052, "step": 94010 }, { "epoch": 0.61, "learning_rate": 0.0002089759063361237, "loss": 0.0431, "step": 94020 }, { "epoch": 0.61, "learning_rate": 0.00020896622498176677, "loss": 0.0509, "step": 94030 }, { "epoch": 0.61, "learning_rate": 0.00020895654362740985, "loss": 0.05, "step": 94040 }, { "epoch": 0.61, "learning_rate": 0.00020894686227305287, "loss": 0.0506, "step": 94050 }, { "epoch": 0.61, "learning_rate": 0.00020893718091869595, "loss": 0.0515, "step": 94060 }, { "epoch": 0.61, "learning_rate": 0.00020892749956433903, "loss": 0.05, "step": 94070 }, { "epoch": 0.61, "learning_rate": 0.00020891781820998211, "loss": 0.0521, "step": 94080 }, { "epoch": 0.61, "learning_rate": 0.00020890813685562517, "loss": 0.0495, "step": 94090 }, { "epoch": 0.61, "learning_rate": 0.00020889845550126825, "loss": 0.0478, "step": 94100 }, { "epoch": 0.61, "learning_rate": 0.00020888877414691133, "loss": 0.0556, "step": 94110 }, { "epoch": 0.61, "learning_rate": 0.00020887909279255435, "loss": 0.0469, "step": 94120 }, { "epoch": 0.61, "learning_rate": 0.00020886941143819743, "loss": 0.0485, "step": 94130 }, { "epoch": 0.61, "learning_rate": 0.0002088597300838405, "loss": 0.0493, "step": 94140 }, { "epoch": 0.61, "learning_rate": 0.00020885004872948356, "loss": 0.0518, "step": 94150 }, { "epoch": 0.61, "learning_rate": 0.00020884036737512664, "loss": 0.0532, "step": 94160 }, { "epoch": 0.61, "learning_rate": 0.00020883068602076972, "loss": 0.0538, "step": 94170 }, { "epoch": 0.61, "learning_rate": 0.0002088210046664128, "loss": 0.0549, "step": 94180 }, { "epoch": 0.61, "learning_rate": 0.00020881132331205583, "loss": 0.0483, "step": 94190 }, { "epoch": 0.61, "learning_rate": 0.0002088016419576989, "loss": 0.0467, "step": 94200 }, { "epoch": 0.61, "learning_rate": 0.000208791960603342, "loss": 0.0541, "step": 94210 }, { "epoch": 0.61, "learning_rate": 0.00020878227924898504, "loss": 0.0426, "step": 94220 }, { "epoch": 0.61, "learning_rate": 0.00020877259789462812, "loss": 0.0496, "step": 94230 }, { "epoch": 0.61, "learning_rate": 0.0002087629165402712, "loss": 0.0547, "step": 94240 }, { "epoch": 0.61, "learning_rate": 0.00020875323518591428, "loss": 0.048, "step": 94250 }, { "epoch": 0.61, "learning_rate": 0.0002087435538315573, "loss": 0.0454, "step": 94260 }, { "epoch": 0.61, "learning_rate": 0.00020873387247720039, "loss": 0.0496, "step": 94270 }, { "epoch": 0.61, "learning_rate": 0.00020872419112284347, "loss": 0.0596, "step": 94280 }, { "epoch": 0.61, "learning_rate": 0.00020871450976848652, "loss": 0.0453, "step": 94290 }, { "epoch": 0.61, "learning_rate": 0.0002087048284141296, "loss": 0.0519, "step": 94300 }, { "epoch": 0.61, "learning_rate": 0.00020869514705977268, "loss": 0.0484, "step": 94310 }, { "epoch": 0.61, "learning_rate": 0.00020868546570541576, "loss": 0.0497, "step": 94320 }, { "epoch": 0.61, "learning_rate": 0.00020867578435105878, "loss": 0.0439, "step": 94330 }, { "epoch": 0.61, "learning_rate": 0.00020866610299670186, "loss": 0.0548, "step": 94340 }, { "epoch": 0.61, "learning_rate": 0.00020865642164234492, "loss": 0.0517, "step": 94350 }, { "epoch": 0.61, "learning_rate": 0.000208646740287988, "loss": 0.0487, "step": 94360 }, { "epoch": 0.61, "learning_rate": 0.00020863705893363108, "loss": 0.0433, "step": 94370 }, { "epoch": 0.61, "learning_rate": 0.00020862737757927416, "loss": 0.0566, "step": 94380 }, { "epoch": 0.61, "learning_rate": 0.0002086176962249172, "loss": 0.0479, "step": 94390 }, { "epoch": 0.61, "learning_rate": 0.00020860801487056026, "loss": 0.05, "step": 94400 }, { "epoch": 0.61, "learning_rate": 0.00020859833351620334, "loss": 0.0505, "step": 94410 }, { "epoch": 0.61, "learning_rate": 0.0002085886521618464, "loss": 0.0516, "step": 94420 }, { "epoch": 0.61, "learning_rate": 0.00020857897080748947, "loss": 0.0455, "step": 94430 }, { "epoch": 0.61, "learning_rate": 0.00020856928945313255, "loss": 0.0502, "step": 94440 }, { "epoch": 0.61, "learning_rate": 0.00020855960809877563, "loss": 0.0543, "step": 94450 }, { "epoch": 0.61, "learning_rate": 0.00020854992674441868, "loss": 0.0518, "step": 94460 }, { "epoch": 0.61, "learning_rate": 0.00020854024539006174, "loss": 0.0477, "step": 94470 }, { "epoch": 0.61, "learning_rate": 0.00020853056403570482, "loss": 0.0445, "step": 94480 }, { "epoch": 0.61, "learning_rate": 0.00020852088268134787, "loss": 0.0496, "step": 94490 }, { "epoch": 0.61, "learning_rate": 0.00020851120132699095, "loss": 0.0489, "step": 94500 }, { "epoch": 0.61, "learning_rate": 0.00020850151997263403, "loss": 0.0438, "step": 94510 }, { "epoch": 0.61, "learning_rate": 0.0002084918386182771, "loss": 0.0533, "step": 94520 }, { "epoch": 0.61, "learning_rate": 0.00020848215726392016, "loss": 0.0485, "step": 94530 }, { "epoch": 0.61, "learning_rate": 0.00020847247590956321, "loss": 0.055, "step": 94540 }, { "epoch": 0.61, "learning_rate": 0.00020846279455520627, "loss": 0.0498, "step": 94550 }, { "epoch": 0.61, "learning_rate": 0.00020845311320084935, "loss": 0.0512, "step": 94560 }, { "epoch": 0.61, "learning_rate": 0.00020844343184649243, "loss": 0.052, "step": 94570 }, { "epoch": 0.61, "learning_rate": 0.0002084337504921355, "loss": 0.0493, "step": 94580 }, { "epoch": 0.61, "learning_rate": 0.00020842406913777856, "loss": 0.0571, "step": 94590 }, { "epoch": 0.61, "learning_rate": 0.00020841438778342164, "loss": 0.0525, "step": 94600 }, { "epoch": 0.61, "learning_rate": 0.0002084047064290647, "loss": 0.0498, "step": 94610 }, { "epoch": 0.61, "learning_rate": 0.00020839502507470774, "loss": 0.0529, "step": 94620 }, { "epoch": 0.61, "learning_rate": 0.00020838534372035082, "loss": 0.0473, "step": 94630 }, { "epoch": 0.61, "learning_rate": 0.0002083756623659939, "loss": 0.0476, "step": 94640 }, { "epoch": 0.61, "learning_rate": 0.00020836598101163698, "loss": 0.0433, "step": 94650 }, { "epoch": 0.61, "learning_rate": 0.00020835629965728004, "loss": 0.0443, "step": 94660 }, { "epoch": 0.61, "learning_rate": 0.00020834661830292312, "loss": 0.0473, "step": 94670 }, { "epoch": 0.61, "learning_rate": 0.00020833693694856617, "loss": 0.049, "step": 94680 }, { "epoch": 0.61, "learning_rate": 0.00020832725559420922, "loss": 0.0505, "step": 94690 }, { "epoch": 0.61, "learning_rate": 0.0002083175742398523, "loss": 0.0535, "step": 94700 }, { "epoch": 0.61, "learning_rate": 0.00020830789288549538, "loss": 0.0577, "step": 94710 }, { "epoch": 0.61, "learning_rate": 0.00020829821153113846, "loss": 0.0528, "step": 94720 }, { "epoch": 0.61, "learning_rate": 0.00020828853017678151, "loss": 0.0523, "step": 94730 }, { "epoch": 0.61, "learning_rate": 0.0002082788488224246, "loss": 0.0452, "step": 94740 }, { "epoch": 0.61, "learning_rate": 0.00020826916746806762, "loss": 0.0472, "step": 94750 }, { "epoch": 0.61, "learning_rate": 0.0002082594861137107, "loss": 0.0548, "step": 94760 }, { "epoch": 0.61, "learning_rate": 0.00020824980475935378, "loss": 0.0472, "step": 94770 }, { "epoch": 0.61, "learning_rate": 0.00020824012340499686, "loss": 0.0466, "step": 94780 }, { "epoch": 0.61, "learning_rate": 0.0002082304420506399, "loss": 0.0472, "step": 94790 }, { "epoch": 0.61, "learning_rate": 0.000208220760696283, "loss": 0.0534, "step": 94800 }, { "epoch": 0.61, "learning_rate": 0.00020821107934192607, "loss": 0.0546, "step": 94810 }, { "epoch": 0.61, "learning_rate": 0.0002082013979875691, "loss": 0.0452, "step": 94820 }, { "epoch": 0.61, "learning_rate": 0.00020819171663321218, "loss": 0.0442, "step": 94830 }, { "epoch": 0.61, "learning_rate": 0.00020818203527885526, "loss": 0.0509, "step": 94840 }, { "epoch": 0.61, "learning_rate": 0.00020817235392449834, "loss": 0.0488, "step": 94850 }, { "epoch": 0.61, "learning_rate": 0.0002081626725701414, "loss": 0.0504, "step": 94860 }, { "epoch": 0.61, "learning_rate": 0.00020815299121578447, "loss": 0.0469, "step": 94870 }, { "epoch": 0.61, "learning_rate": 0.00020814330986142755, "loss": 0.0565, "step": 94880 }, { "epoch": 0.61, "learning_rate": 0.00020813362850707057, "loss": 0.0489, "step": 94890 }, { "epoch": 0.61, "learning_rate": 0.00020812394715271365, "loss": 0.0584, "step": 94900 }, { "epoch": 0.61, "learning_rate": 0.00020811426579835673, "loss": 0.0402, "step": 94910 }, { "epoch": 0.61, "learning_rate": 0.0002081045844439998, "loss": 0.0478, "step": 94920 }, { "epoch": 0.61, "learning_rate": 0.00020809490308964287, "loss": 0.048, "step": 94930 }, { "epoch": 0.61, "learning_rate": 0.00020808522173528595, "loss": 0.0471, "step": 94940 }, { "epoch": 0.61, "learning_rate": 0.00020807554038092903, "loss": 0.0402, "step": 94950 }, { "epoch": 0.61, "learning_rate": 0.00020806585902657205, "loss": 0.0445, "step": 94960 }, { "epoch": 0.61, "learning_rate": 0.00020805617767221513, "loss": 0.0478, "step": 94970 }, { "epoch": 0.61, "learning_rate": 0.0002080464963178582, "loss": 0.0475, "step": 94980 }, { "epoch": 0.61, "learning_rate": 0.00020803681496350126, "loss": 0.0556, "step": 94990 }, { "epoch": 0.61, "learning_rate": 0.00020802713360914434, "loss": 0.0558, "step": 95000 }, { "epoch": 0.61, "eval_cer": 0.9198942492373743, "eval_loss": 0.032361067831516266, "eval_runtime": 119.7802, "eval_samples_per_second": 16.697, "eval_steps_per_second": 4.174, "step": 95000 }, { "epoch": 0.61, "learning_rate": 0.00020801745225478742, "loss": 0.0497, "step": 95010 }, { "epoch": 0.61, "learning_rate": 0.0002080077709004305, "loss": 0.0482, "step": 95020 }, { "epoch": 0.61, "learning_rate": 0.00020799808954607353, "loss": 0.0471, "step": 95030 }, { "epoch": 0.61, "learning_rate": 0.0002079884081917166, "loss": 0.051, "step": 95040 }, { "epoch": 0.61, "learning_rate": 0.0002079787268373597, "loss": 0.0508, "step": 95050 }, { "epoch": 0.61, "learning_rate": 0.00020796904548300274, "loss": 0.0464, "step": 95060 }, { "epoch": 0.61, "learning_rate": 0.00020795936412864582, "loss": 0.0461, "step": 95070 }, { "epoch": 0.61, "learning_rate": 0.0002079496827742889, "loss": 0.054, "step": 95080 }, { "epoch": 0.61, "learning_rate": 0.00020794000141993198, "loss": 0.0533, "step": 95090 }, { "epoch": 0.61, "learning_rate": 0.000207930320065575, "loss": 0.049, "step": 95100 }, { "epoch": 0.61, "learning_rate": 0.00020792063871121809, "loss": 0.0538, "step": 95110 }, { "epoch": 0.61, "learning_rate": 0.00020791095735686117, "loss": 0.0467, "step": 95120 }, { "epoch": 0.61, "learning_rate": 0.00020790127600250422, "loss": 0.0458, "step": 95130 }, { "epoch": 0.61, "learning_rate": 0.0002078915946481473, "loss": 0.0494, "step": 95140 }, { "epoch": 0.61, "learning_rate": 0.00020788191329379038, "loss": 0.0464, "step": 95150 }, { "epoch": 0.61, "learning_rate": 0.00020787223193943343, "loss": 0.0524, "step": 95160 }, { "epoch": 0.61, "learning_rate": 0.00020786255058507648, "loss": 0.0468, "step": 95170 }, { "epoch": 0.61, "learning_rate": 0.00020785286923071956, "loss": 0.0474, "step": 95180 }, { "epoch": 0.61, "learning_rate": 0.00020784318787636262, "loss": 0.0433, "step": 95190 }, { "epoch": 0.61, "learning_rate": 0.0002078335065220057, "loss": 0.0484, "step": 95200 }, { "epoch": 0.61, "learning_rate": 0.00020782382516764877, "loss": 0.0421, "step": 95210 }, { "epoch": 0.61, "learning_rate": 0.00020781414381329185, "loss": 0.0593, "step": 95220 }, { "epoch": 0.61, "learning_rate": 0.0002078044624589349, "loss": 0.0488, "step": 95230 }, { "epoch": 0.61, "learning_rate": 0.00020779478110457796, "loss": 0.0494, "step": 95240 }, { "epoch": 0.61, "learning_rate": 0.00020778509975022104, "loss": 0.0425, "step": 95250 }, { "epoch": 0.61, "learning_rate": 0.0002077754183958641, "loss": 0.0542, "step": 95260 }, { "epoch": 0.61, "learning_rate": 0.00020776573704150717, "loss": 0.0502, "step": 95270 }, { "epoch": 0.61, "learning_rate": 0.00020775605568715025, "loss": 0.0414, "step": 95280 }, { "epoch": 0.62, "learning_rate": 0.00020774637433279333, "loss": 0.0474, "step": 95290 }, { "epoch": 0.62, "learning_rate": 0.00020773669297843638, "loss": 0.0454, "step": 95300 }, { "epoch": 0.62, "learning_rate": 0.00020772701162407944, "loss": 0.047, "step": 95310 }, { "epoch": 0.62, "learning_rate": 0.00020771733026972252, "loss": 0.0514, "step": 95320 }, { "epoch": 0.62, "learning_rate": 0.00020770764891536557, "loss": 0.0447, "step": 95330 }, { "epoch": 0.62, "learning_rate": 0.00020769796756100865, "loss": 0.0501, "step": 95340 }, { "epoch": 0.62, "learning_rate": 0.00020768828620665173, "loss": 0.0457, "step": 95350 }, { "epoch": 0.62, "learning_rate": 0.00020767860485229478, "loss": 0.0497, "step": 95360 }, { "epoch": 0.62, "learning_rate": 0.00020766892349793786, "loss": 0.0437, "step": 95370 }, { "epoch": 0.62, "learning_rate": 0.00020765924214358091, "loss": 0.0487, "step": 95380 }, { "epoch": 0.62, "learning_rate": 0.00020764956078922397, "loss": 0.0509, "step": 95390 }, { "epoch": 0.62, "learning_rate": 0.00020763987943486705, "loss": 0.0455, "step": 95400 }, { "epoch": 0.62, "learning_rate": 0.00020763019808051013, "loss": 0.0466, "step": 95410 }, { "epoch": 0.62, "learning_rate": 0.0002076205167261532, "loss": 0.0484, "step": 95420 }, { "epoch": 0.62, "learning_rate": 0.00020761083537179626, "loss": 0.0387, "step": 95430 }, { "epoch": 0.62, "learning_rate": 0.00020760115401743934, "loss": 0.048, "step": 95440 }, { "epoch": 0.62, "learning_rate": 0.0002075914726630824, "loss": 0.0443, "step": 95450 }, { "epoch": 0.62, "learning_rate": 0.00020758179130872544, "loss": 0.0458, "step": 95460 }, { "epoch": 0.62, "learning_rate": 0.00020757210995436852, "loss": 0.0438, "step": 95470 }, { "epoch": 0.62, "learning_rate": 0.0002075624286000116, "loss": 0.0489, "step": 95480 }, { "epoch": 0.62, "learning_rate": 0.00020755274724565468, "loss": 0.0486, "step": 95490 }, { "epoch": 0.62, "learning_rate": 0.00020754306589129774, "loss": 0.0404, "step": 95500 }, { "epoch": 0.62, "learning_rate": 0.00020753338453694082, "loss": 0.0457, "step": 95510 }, { "epoch": 0.62, "learning_rate": 0.00020752370318258387, "loss": 0.0515, "step": 95520 }, { "epoch": 0.62, "learning_rate": 0.00020751402182822692, "loss": 0.0484, "step": 95530 }, { "epoch": 0.62, "learning_rate": 0.00020750434047387, "loss": 0.0443, "step": 95540 }, { "epoch": 0.62, "learning_rate": 0.00020749465911951308, "loss": 0.0426, "step": 95550 }, { "epoch": 0.62, "learning_rate": 0.00020748497776515613, "loss": 0.049, "step": 95560 }, { "epoch": 0.62, "learning_rate": 0.00020747529641079921, "loss": 0.047, "step": 95570 }, { "epoch": 0.62, "learning_rate": 0.0002074656150564423, "loss": 0.0508, "step": 95580 }, { "epoch": 0.62, "learning_rate": 0.00020745593370208532, "loss": 0.0471, "step": 95590 }, { "epoch": 0.62, "learning_rate": 0.0002074462523477284, "loss": 0.0467, "step": 95600 }, { "epoch": 0.62, "learning_rate": 0.00020743657099337148, "loss": 0.0468, "step": 95610 }, { "epoch": 0.62, "learning_rate": 0.00020742688963901456, "loss": 0.0495, "step": 95620 }, { "epoch": 0.62, "learning_rate": 0.0002074172082846576, "loss": 0.0488, "step": 95630 }, { "epoch": 0.62, "learning_rate": 0.0002074075269303007, "loss": 0.0444, "step": 95640 }, { "epoch": 0.62, "learning_rate": 0.00020739784557594377, "loss": 0.0443, "step": 95650 }, { "epoch": 0.62, "learning_rate": 0.0002073881642215868, "loss": 0.0481, "step": 95660 }, { "epoch": 0.62, "learning_rate": 0.00020737848286722988, "loss": 0.0543, "step": 95670 }, { "epoch": 0.62, "learning_rate": 0.00020736880151287296, "loss": 0.0462, "step": 95680 }, { "epoch": 0.62, "learning_rate": 0.00020735912015851604, "loss": 0.0464, "step": 95690 }, { "epoch": 0.62, "learning_rate": 0.0002073494388041591, "loss": 0.0509, "step": 95700 }, { "epoch": 0.62, "learning_rate": 0.00020733975744980217, "loss": 0.0508, "step": 95710 }, { "epoch": 0.62, "learning_rate": 0.00020733007609544525, "loss": 0.0503, "step": 95720 }, { "epoch": 0.62, "learning_rate": 0.00020732039474108827, "loss": 0.0507, "step": 95730 }, { "epoch": 0.62, "learning_rate": 0.00020731071338673135, "loss": 0.0464, "step": 95740 }, { "epoch": 0.62, "learning_rate": 0.00020730103203237443, "loss": 0.0449, "step": 95750 }, { "epoch": 0.62, "learning_rate": 0.00020729135067801749, "loss": 0.0467, "step": 95760 }, { "epoch": 0.62, "learning_rate": 0.00020728166932366057, "loss": 0.0469, "step": 95770 }, { "epoch": 0.62, "learning_rate": 0.00020727198796930365, "loss": 0.0466, "step": 95780 }, { "epoch": 0.62, "learning_rate": 0.00020726230661494673, "loss": 0.06, "step": 95790 }, { "epoch": 0.62, "learning_rate": 0.00020725262526058975, "loss": 0.0534, "step": 95800 }, { "epoch": 0.62, "learning_rate": 0.00020724294390623283, "loss": 0.0512, "step": 95810 }, { "epoch": 0.62, "learning_rate": 0.0002072332625518759, "loss": 0.0521, "step": 95820 }, { "epoch": 0.62, "learning_rate": 0.00020722358119751896, "loss": 0.0515, "step": 95830 }, { "epoch": 0.62, "learning_rate": 0.00020721389984316204, "loss": 0.051, "step": 95840 }, { "epoch": 0.62, "learning_rate": 0.00020720421848880512, "loss": 0.059, "step": 95850 }, { "epoch": 0.62, "learning_rate": 0.0002071945371344482, "loss": 0.0495, "step": 95860 }, { "epoch": 0.62, "learning_rate": 0.00020718485578009123, "loss": 0.0516, "step": 95870 }, { "epoch": 0.62, "learning_rate": 0.0002071751744257343, "loss": 0.0564, "step": 95880 }, { "epoch": 0.62, "learning_rate": 0.0002071654930713774, "loss": 0.0491, "step": 95890 }, { "epoch": 0.62, "learning_rate": 0.00020715581171702044, "loss": 0.0542, "step": 95900 }, { "epoch": 0.62, "learning_rate": 0.00020714613036266352, "loss": 0.0465, "step": 95910 }, { "epoch": 0.62, "learning_rate": 0.0002071364490083066, "loss": 0.044, "step": 95920 }, { "epoch": 0.62, "learning_rate": 0.00020712676765394965, "loss": 0.0424, "step": 95930 }, { "epoch": 0.62, "learning_rate": 0.0002071170862995927, "loss": 0.0548, "step": 95940 }, { "epoch": 0.62, "learning_rate": 0.00020710740494523578, "loss": 0.0477, "step": 95950 }, { "epoch": 0.62, "learning_rate": 0.00020709772359087884, "loss": 0.05, "step": 95960 }, { "epoch": 0.62, "learning_rate": 0.00020708804223652192, "loss": 0.0559, "step": 95970 }, { "epoch": 0.62, "learning_rate": 0.000207078360882165, "loss": 0.0466, "step": 95980 }, { "epoch": 0.62, "learning_rate": 0.00020706867952780808, "loss": 0.046, "step": 95990 }, { "epoch": 0.62, "learning_rate": 0.00020705899817345113, "loss": 0.0428, "step": 96000 }, { "epoch": 0.62, "eval_cer": 0.9199810190938877, "eval_loss": 0.03174648433923721, "eval_runtime": 120.4054, "eval_samples_per_second": 16.611, "eval_steps_per_second": 4.153, "step": 96000 }, { "epoch": 0.62, "learning_rate": 0.00020704931681909418, "loss": 0.051, "step": 96010 }, { "epoch": 0.62, "learning_rate": 0.00020703963546473726, "loss": 0.0442, "step": 96020 }, { "epoch": 0.62, "learning_rate": 0.00020702995411038031, "loss": 0.0422, "step": 96030 }, { "epoch": 0.62, "learning_rate": 0.0002070202727560234, "loss": 0.0429, "step": 96040 }, { "epoch": 0.62, "learning_rate": 0.00020701059140166647, "loss": 0.056, "step": 96050 }, { "epoch": 0.62, "learning_rate": 0.00020700091004730955, "loss": 0.0473, "step": 96060 }, { "epoch": 0.62, "learning_rate": 0.0002069912286929526, "loss": 0.0483, "step": 96070 }, { "epoch": 0.62, "learning_rate": 0.00020698154733859566, "loss": 0.0554, "step": 96080 }, { "epoch": 0.62, "learning_rate": 0.00020697186598423874, "loss": 0.0527, "step": 96090 }, { "epoch": 0.62, "learning_rate": 0.0002069621846298818, "loss": 0.0518, "step": 96100 }, { "epoch": 0.62, "learning_rate": 0.00020695250327552487, "loss": 0.0602, "step": 96110 }, { "epoch": 0.62, "learning_rate": 0.00020694282192116795, "loss": 0.0469, "step": 96120 }, { "epoch": 0.62, "learning_rate": 0.000206933140566811, "loss": 0.0523, "step": 96130 }, { "epoch": 0.62, "learning_rate": 0.00020692345921245408, "loss": 0.0508, "step": 96140 }, { "epoch": 0.62, "learning_rate": 0.00020691377785809714, "loss": 0.0484, "step": 96150 }, { "epoch": 0.62, "learning_rate": 0.0002069040965037402, "loss": 0.0551, "step": 96160 }, { "epoch": 0.62, "learning_rate": 0.00020689441514938327, "loss": 0.0461, "step": 96170 }, { "epoch": 0.62, "learning_rate": 0.00020688473379502635, "loss": 0.0524, "step": 96180 }, { "epoch": 0.62, "learning_rate": 0.00020687505244066943, "loss": 0.0503, "step": 96190 }, { "epoch": 0.62, "learning_rate": 0.00020686537108631248, "loss": 0.0449, "step": 96200 }, { "epoch": 0.62, "learning_rate": 0.00020685568973195556, "loss": 0.0493, "step": 96210 }, { "epoch": 0.62, "learning_rate": 0.00020684600837759861, "loss": 0.0451, "step": 96220 }, { "epoch": 0.62, "learning_rate": 0.00020683632702324167, "loss": 0.0518, "step": 96230 }, { "epoch": 0.62, "learning_rate": 0.00020682664566888475, "loss": 0.0516, "step": 96240 }, { "epoch": 0.62, "learning_rate": 0.00020681696431452783, "loss": 0.0592, "step": 96250 }, { "epoch": 0.62, "learning_rate": 0.0002068072829601709, "loss": 0.0432, "step": 96260 }, { "epoch": 0.62, "learning_rate": 0.00020679760160581396, "loss": 0.0436, "step": 96270 }, { "epoch": 0.62, "learning_rate": 0.00020678792025145704, "loss": 0.0475, "step": 96280 }, { "epoch": 0.62, "learning_rate": 0.0002067782388971001, "loss": 0.0489, "step": 96290 }, { "epoch": 0.62, "learning_rate": 0.00020676855754274314, "loss": 0.0475, "step": 96300 }, { "epoch": 0.62, "learning_rate": 0.00020675887618838622, "loss": 0.0427, "step": 96310 }, { "epoch": 0.62, "learning_rate": 0.0002067491948340293, "loss": 0.0445, "step": 96320 }, { "epoch": 0.62, "learning_rate": 0.00020673951347967236, "loss": 0.0449, "step": 96330 }, { "epoch": 0.62, "learning_rate": 0.00020672983212531544, "loss": 0.0467, "step": 96340 }, { "epoch": 0.62, "learning_rate": 0.00020672015077095852, "loss": 0.0558, "step": 96350 }, { "epoch": 0.62, "learning_rate": 0.00020671046941660154, "loss": 0.0419, "step": 96360 }, { "epoch": 0.62, "learning_rate": 0.00020670078806224462, "loss": 0.0509, "step": 96370 }, { "epoch": 0.62, "learning_rate": 0.0002066911067078877, "loss": 0.0469, "step": 96380 }, { "epoch": 0.62, "learning_rate": 0.00020668142535353078, "loss": 0.0533, "step": 96390 }, { "epoch": 0.62, "learning_rate": 0.00020667174399917383, "loss": 0.0451, "step": 96400 }, { "epoch": 0.62, "learning_rate": 0.0002066620626448169, "loss": 0.0465, "step": 96410 }, { "epoch": 0.62, "learning_rate": 0.00020665238129046, "loss": 0.048, "step": 96420 }, { "epoch": 0.62, "learning_rate": 0.00020664269993610302, "loss": 0.059, "step": 96430 }, { "epoch": 0.62, "learning_rate": 0.0002066330185817461, "loss": 0.045, "step": 96440 }, { "epoch": 0.62, "learning_rate": 0.00020662333722738918, "loss": 0.0479, "step": 96450 }, { "epoch": 0.62, "learning_rate": 0.00020661365587303226, "loss": 0.0484, "step": 96460 }, { "epoch": 0.62, "learning_rate": 0.0002066039745186753, "loss": 0.0527, "step": 96470 }, { "epoch": 0.62, "learning_rate": 0.0002065942931643184, "loss": 0.0511, "step": 96480 }, { "epoch": 0.62, "learning_rate": 0.00020658461180996147, "loss": 0.0463, "step": 96490 }, { "epoch": 0.62, "learning_rate": 0.0002065749304556045, "loss": 0.0482, "step": 96500 }, { "epoch": 0.62, "learning_rate": 0.00020656524910124758, "loss": 0.0566, "step": 96510 }, { "epoch": 0.62, "learning_rate": 0.00020655556774689066, "loss": 0.0579, "step": 96520 }, { "epoch": 0.62, "learning_rate": 0.0002065458863925337, "loss": 0.0491, "step": 96530 }, { "epoch": 0.62, "learning_rate": 0.0002065362050381768, "loss": 0.0432, "step": 96540 }, { "epoch": 0.62, "learning_rate": 0.00020652652368381987, "loss": 0.0444, "step": 96550 }, { "epoch": 0.62, "learning_rate": 0.00020651684232946295, "loss": 0.0471, "step": 96560 }, { "epoch": 0.62, "learning_rate": 0.00020650716097510597, "loss": 0.0486, "step": 96570 }, { "epoch": 0.62, "learning_rate": 0.00020649747962074905, "loss": 0.0491, "step": 96580 }, { "epoch": 0.62, "learning_rate": 0.00020648779826639213, "loss": 0.0573, "step": 96590 }, { "epoch": 0.62, "learning_rate": 0.00020647811691203519, "loss": 0.0497, "step": 96600 }, { "epoch": 0.62, "learning_rate": 0.00020646843555767827, "loss": 0.0475, "step": 96610 }, { "epoch": 0.62, "learning_rate": 0.00020645875420332134, "loss": 0.0442, "step": 96620 }, { "epoch": 0.62, "learning_rate": 0.00020644907284896442, "loss": 0.053, "step": 96630 }, { "epoch": 0.62, "learning_rate": 0.00020643939149460745, "loss": 0.056, "step": 96640 }, { "epoch": 0.62, "learning_rate": 0.00020642971014025053, "loss": 0.053, "step": 96650 }, { "epoch": 0.62, "learning_rate": 0.0002064200287858936, "loss": 0.0436, "step": 96660 }, { "epoch": 0.62, "learning_rate": 0.00020641034743153666, "loss": 0.0444, "step": 96670 }, { "epoch": 0.62, "learning_rate": 0.00020640066607717974, "loss": 0.0504, "step": 96680 }, { "epoch": 0.62, "learning_rate": 0.00020639098472282282, "loss": 0.0569, "step": 96690 }, { "epoch": 0.62, "learning_rate": 0.0002063813033684659, "loss": 0.0485, "step": 96700 }, { "epoch": 0.62, "learning_rate": 0.00020637162201410893, "loss": 0.0472, "step": 96710 }, { "epoch": 0.62, "learning_rate": 0.000206361940659752, "loss": 0.0508, "step": 96720 }, { "epoch": 0.62, "learning_rate": 0.00020635225930539506, "loss": 0.0497, "step": 96730 }, { "epoch": 0.62, "learning_rate": 0.00020634257795103814, "loss": 0.0491, "step": 96740 }, { "epoch": 0.62, "learning_rate": 0.00020633289659668122, "loss": 0.0435, "step": 96750 }, { "epoch": 0.62, "learning_rate": 0.0002063232152423243, "loss": 0.0487, "step": 96760 }, { "epoch": 0.62, "learning_rate": 0.00020631353388796735, "loss": 0.0544, "step": 96770 }, { "epoch": 0.62, "learning_rate": 0.0002063038525336104, "loss": 0.0504, "step": 96780 }, { "epoch": 0.62, "learning_rate": 0.00020629417117925348, "loss": 0.0352, "step": 96790 }, { "epoch": 0.62, "learning_rate": 0.00020628448982489654, "loss": 0.0436, "step": 96800 }, { "epoch": 0.62, "learning_rate": 0.00020627480847053962, "loss": 0.0494, "step": 96810 }, { "epoch": 0.62, "learning_rate": 0.0002062651271161827, "loss": 0.0509, "step": 96820 }, { "epoch": 0.62, "learning_rate": 0.00020625544576182578, "loss": 0.0494, "step": 96830 }, { "epoch": 0.63, "learning_rate": 0.00020624576440746883, "loss": 0.0428, "step": 96840 }, { "epoch": 0.63, "learning_rate": 0.00020623608305311188, "loss": 0.0541, "step": 96850 }, { "epoch": 0.63, "learning_rate": 0.00020622640169875496, "loss": 0.0451, "step": 96860 }, { "epoch": 0.63, "learning_rate": 0.00020621672034439801, "loss": 0.05, "step": 96870 }, { "epoch": 0.63, "learning_rate": 0.0002062070389900411, "loss": 0.0437, "step": 96880 }, { "epoch": 0.63, "learning_rate": 0.00020619735763568417, "loss": 0.0576, "step": 96890 }, { "epoch": 0.63, "learning_rate": 0.00020618767628132725, "loss": 0.0505, "step": 96900 }, { "epoch": 0.63, "learning_rate": 0.0002061779949269703, "loss": 0.0491, "step": 96910 }, { "epoch": 0.63, "learning_rate": 0.00020616831357261336, "loss": 0.0487, "step": 96920 }, { "epoch": 0.63, "learning_rate": 0.0002061586322182564, "loss": 0.0514, "step": 96930 }, { "epoch": 0.63, "learning_rate": 0.0002061489508638995, "loss": 0.0471, "step": 96940 }, { "epoch": 0.63, "learning_rate": 0.00020613926950954257, "loss": 0.0534, "step": 96950 }, { "epoch": 0.63, "learning_rate": 0.00020612958815518565, "loss": 0.0542, "step": 96960 }, { "epoch": 0.63, "learning_rate": 0.0002061199068008287, "loss": 0.0501, "step": 96970 }, { "epoch": 0.63, "learning_rate": 0.00020611022544647178, "loss": 0.0416, "step": 96980 }, { "epoch": 0.63, "learning_rate": 0.00020610054409211484, "loss": 0.0542, "step": 96990 }, { "epoch": 0.63, "learning_rate": 0.0002060908627377579, "loss": 0.0596, "step": 97000 }, { "epoch": 0.63, "eval_cer": 0.9199656535984635, "eval_loss": 0.03143526241183281, "eval_runtime": 119.7543, "eval_samples_per_second": 16.701, "eval_steps_per_second": 4.175, "step": 97000 }, { "epoch": 0.63, "learning_rate": 0.00020608118138340097, "loss": 0.0548, "step": 97010 }, { "epoch": 0.63, "learning_rate": 0.00020607150002904405, "loss": 0.0474, "step": 97020 }, { "epoch": 0.63, "learning_rate": 0.00020606181867468713, "loss": 0.0456, "step": 97030 }, { "epoch": 0.63, "learning_rate": 0.00020605213732033018, "loss": 0.0412, "step": 97040 }, { "epoch": 0.63, "learning_rate": 0.00020604245596597326, "loss": 0.052, "step": 97050 }, { "epoch": 0.63, "learning_rate": 0.00020603277461161631, "loss": 0.0492, "step": 97060 }, { "epoch": 0.63, "learning_rate": 0.00020602309325725937, "loss": 0.0521, "step": 97070 }, { "epoch": 0.63, "learning_rate": 0.00020601341190290245, "loss": 0.0481, "step": 97080 }, { "epoch": 0.63, "learning_rate": 0.00020600373054854553, "loss": 0.05, "step": 97090 }, { "epoch": 0.63, "learning_rate": 0.0002059940491941886, "loss": 0.0501, "step": 97100 }, { "epoch": 0.63, "learning_rate": 0.00020598436783983166, "loss": 0.0458, "step": 97110 }, { "epoch": 0.63, "learning_rate": 0.00020597468648547474, "loss": 0.0567, "step": 97120 }, { "epoch": 0.63, "learning_rate": 0.00020596500513111776, "loss": 0.0485, "step": 97130 }, { "epoch": 0.63, "learning_rate": 0.00020595532377676084, "loss": 0.0453, "step": 97140 }, { "epoch": 0.63, "learning_rate": 0.00020594564242240392, "loss": 0.0426, "step": 97150 }, { "epoch": 0.63, "learning_rate": 0.000205935961068047, "loss": 0.0449, "step": 97160 }, { "epoch": 0.63, "learning_rate": 0.00020592627971369006, "loss": 0.0394, "step": 97170 }, { "epoch": 0.63, "learning_rate": 0.00020591659835933314, "loss": 0.0435, "step": 97180 }, { "epoch": 0.63, "learning_rate": 0.00020590691700497622, "loss": 0.0556, "step": 97190 }, { "epoch": 0.63, "learning_rate": 0.00020589723565061924, "loss": 0.0482, "step": 97200 }, { "epoch": 0.63, "learning_rate": 0.00020588755429626232, "loss": 0.0484, "step": 97210 }, { "epoch": 0.63, "learning_rate": 0.0002058778729419054, "loss": 0.055, "step": 97220 }, { "epoch": 0.63, "learning_rate": 0.00020586819158754848, "loss": 0.0455, "step": 97230 }, { "epoch": 0.63, "learning_rate": 0.00020585851023319153, "loss": 0.0533, "step": 97240 }, { "epoch": 0.63, "learning_rate": 0.0002058488288788346, "loss": 0.0487, "step": 97250 }, { "epoch": 0.63, "learning_rate": 0.0002058391475244777, "loss": 0.051, "step": 97260 }, { "epoch": 0.63, "learning_rate": 0.00020582946617012072, "loss": 0.0416, "step": 97270 }, { "epoch": 0.63, "learning_rate": 0.0002058197848157638, "loss": 0.0572, "step": 97280 }, { "epoch": 0.63, "learning_rate": 0.00020581010346140688, "loss": 0.05, "step": 97290 }, { "epoch": 0.63, "learning_rate": 0.00020580042210704996, "loss": 0.0443, "step": 97300 }, { "epoch": 0.63, "learning_rate": 0.000205790740752693, "loss": 0.0472, "step": 97310 }, { "epoch": 0.63, "learning_rate": 0.0002057810593983361, "loss": 0.0498, "step": 97320 }, { "epoch": 0.63, "learning_rate": 0.00020577137804397917, "loss": 0.0465, "step": 97330 }, { "epoch": 0.63, "learning_rate": 0.0002057616966896222, "loss": 0.0519, "step": 97340 }, { "epoch": 0.63, "learning_rate": 0.00020575201533526528, "loss": 0.0467, "step": 97350 }, { "epoch": 0.63, "learning_rate": 0.00020574233398090836, "loss": 0.0531, "step": 97360 }, { "epoch": 0.63, "learning_rate": 0.0002057326526265514, "loss": 0.052, "step": 97370 }, { "epoch": 0.63, "learning_rate": 0.0002057229712721945, "loss": 0.0476, "step": 97380 }, { "epoch": 0.63, "learning_rate": 0.00020571328991783757, "loss": 0.0519, "step": 97390 }, { "epoch": 0.63, "learning_rate": 0.00020570360856348065, "loss": 0.0399, "step": 97400 }, { "epoch": 0.63, "learning_rate": 0.00020569392720912367, "loss": 0.0501, "step": 97410 }, { "epoch": 0.63, "learning_rate": 0.00020568424585476675, "loss": 0.0435, "step": 97420 }, { "epoch": 0.63, "learning_rate": 0.00020567456450040983, "loss": 0.0456, "step": 97430 }, { "epoch": 0.63, "learning_rate": 0.00020566488314605289, "loss": 0.0445, "step": 97440 }, { "epoch": 0.63, "learning_rate": 0.00020565520179169596, "loss": 0.0452, "step": 97450 }, { "epoch": 0.63, "learning_rate": 0.00020564552043733904, "loss": 0.0524, "step": 97460 }, { "epoch": 0.63, "learning_rate": 0.00020563583908298212, "loss": 0.0454, "step": 97470 }, { "epoch": 0.63, "learning_rate": 0.00020562615772862515, "loss": 0.0461, "step": 97480 }, { "epoch": 0.63, "learning_rate": 0.00020561647637426823, "loss": 0.0425, "step": 97490 }, { "epoch": 0.63, "learning_rate": 0.0002056067950199113, "loss": 0.047, "step": 97500 }, { "epoch": 0.63, "learning_rate": 0.00020559711366555436, "loss": 0.0455, "step": 97510 }, { "epoch": 0.63, "learning_rate": 0.00020558743231119744, "loss": 0.0613, "step": 97520 }, { "epoch": 0.63, "learning_rate": 0.00020557775095684052, "loss": 0.0464, "step": 97530 }, { "epoch": 0.63, "learning_rate": 0.00020556806960248357, "loss": 0.0572, "step": 97540 }, { "epoch": 0.63, "learning_rate": 0.00020555838824812663, "loss": 0.0429, "step": 97550 }, { "epoch": 0.63, "learning_rate": 0.0002055487068937697, "loss": 0.0461, "step": 97560 }, { "epoch": 0.63, "learning_rate": 0.00020553902553941276, "loss": 0.0505, "step": 97570 }, { "epoch": 0.63, "learning_rate": 0.00020552934418505584, "loss": 0.0502, "step": 97580 }, { "epoch": 0.63, "learning_rate": 0.00020551966283069892, "loss": 0.0458, "step": 97590 }, { "epoch": 0.63, "learning_rate": 0.000205509981476342, "loss": 0.0481, "step": 97600 }, { "epoch": 0.63, "learning_rate": 0.00020550030012198505, "loss": 0.0472, "step": 97610 }, { "epoch": 0.63, "learning_rate": 0.0002054906187676281, "loss": 0.0531, "step": 97620 }, { "epoch": 0.63, "learning_rate": 0.00020548093741327118, "loss": 0.0597, "step": 97630 }, { "epoch": 0.63, "learning_rate": 0.00020547125605891424, "loss": 0.045, "step": 97640 }, { "epoch": 0.63, "learning_rate": 0.00020546157470455732, "loss": 0.0601, "step": 97650 }, { "epoch": 0.63, "learning_rate": 0.0002054518933502004, "loss": 0.0496, "step": 97660 }, { "epoch": 0.63, "learning_rate": 0.00020544221199584348, "loss": 0.0511, "step": 97670 }, { "epoch": 0.63, "learning_rate": 0.00020543253064148653, "loss": 0.049, "step": 97680 }, { "epoch": 0.63, "learning_rate": 0.00020542284928712958, "loss": 0.0469, "step": 97690 }, { "epoch": 0.63, "learning_rate": 0.00020541316793277266, "loss": 0.0496, "step": 97700 }, { "epoch": 0.63, "learning_rate": 0.00020540348657841571, "loss": 0.0507, "step": 97710 }, { "epoch": 0.63, "learning_rate": 0.0002053938052240588, "loss": 0.0453, "step": 97720 }, { "epoch": 0.63, "learning_rate": 0.00020538412386970187, "loss": 0.0446, "step": 97730 }, { "epoch": 0.63, "learning_rate": 0.00020537444251534493, "loss": 0.0486, "step": 97740 }, { "epoch": 0.63, "learning_rate": 0.000205364761160988, "loss": 0.0488, "step": 97750 }, { "epoch": 0.63, "learning_rate": 0.00020535507980663106, "loss": 0.0445, "step": 97760 }, { "epoch": 0.63, "learning_rate": 0.0002053453984522741, "loss": 0.0518, "step": 97770 }, { "epoch": 0.63, "learning_rate": 0.0002053357170979172, "loss": 0.0543, "step": 97780 }, { "epoch": 0.63, "learning_rate": 0.00020532603574356027, "loss": 0.0393, "step": 97790 }, { "epoch": 0.63, "learning_rate": 0.00020531635438920335, "loss": 0.0579, "step": 97800 }, { "epoch": 0.63, "learning_rate": 0.0002053066730348464, "loss": 0.0514, "step": 97810 }, { "epoch": 0.63, "learning_rate": 0.00020529699168048948, "loss": 0.0494, "step": 97820 }, { "epoch": 0.63, "learning_rate": 0.00020528731032613254, "loss": 0.0472, "step": 97830 }, { "epoch": 0.63, "learning_rate": 0.0002052776289717756, "loss": 0.0454, "step": 97840 }, { "epoch": 0.63, "learning_rate": 0.00020526794761741867, "loss": 0.0432, "step": 97850 }, { "epoch": 0.63, "learning_rate": 0.00020525826626306175, "loss": 0.0518, "step": 97860 }, { "epoch": 0.63, "learning_rate": 0.00020524858490870483, "loss": 0.0429, "step": 97870 }, { "epoch": 0.63, "learning_rate": 0.00020523890355434788, "loss": 0.0499, "step": 97880 }, { "epoch": 0.63, "learning_rate": 0.00020522922219999096, "loss": 0.0494, "step": 97890 }, { "epoch": 0.63, "learning_rate": 0.000205219540845634, "loss": 0.0502, "step": 97900 }, { "epoch": 0.63, "learning_rate": 0.00020520985949127707, "loss": 0.0528, "step": 97910 }, { "epoch": 0.63, "learning_rate": 0.00020520017813692015, "loss": 0.0549, "step": 97920 }, { "epoch": 0.63, "learning_rate": 0.00020519049678256323, "loss": 0.0453, "step": 97930 }, { "epoch": 0.63, "learning_rate": 0.00020518081542820628, "loss": 0.0441, "step": 97940 }, { "epoch": 0.63, "learning_rate": 0.00020517113407384936, "loss": 0.043, "step": 97950 }, { "epoch": 0.63, "learning_rate": 0.00020516145271949244, "loss": 0.0487, "step": 97960 }, { "epoch": 0.63, "learning_rate": 0.00020515177136513546, "loss": 0.0453, "step": 97970 }, { "epoch": 0.63, "learning_rate": 0.00020514209001077854, "loss": 0.0484, "step": 97980 }, { "epoch": 0.63, "learning_rate": 0.00020513240865642162, "loss": 0.0405, "step": 97990 }, { "epoch": 0.63, "learning_rate": 0.0002051227273020647, "loss": 0.0449, "step": 98000 }, { "epoch": 0.63, "eval_cer": 0.920000903852672, "eval_loss": 0.03220009431242943, "eval_runtime": 120.0197, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 98000 }, { "epoch": 0.63, "learning_rate": 0.00020511304594770776, "loss": 0.043, "step": 98010 }, { "epoch": 0.63, "learning_rate": 0.00020510336459335084, "loss": 0.0485, "step": 98020 }, { "epoch": 0.63, "learning_rate": 0.00020509368323899392, "loss": 0.0456, "step": 98030 }, { "epoch": 0.63, "learning_rate": 0.00020508400188463694, "loss": 0.0481, "step": 98040 }, { "epoch": 0.63, "learning_rate": 0.00020507432053028002, "loss": 0.0455, "step": 98050 }, { "epoch": 0.63, "learning_rate": 0.0002050646391759231, "loss": 0.0482, "step": 98060 }, { "epoch": 0.63, "learning_rate": 0.00020505495782156618, "loss": 0.0381, "step": 98070 }, { "epoch": 0.63, "learning_rate": 0.00020504527646720923, "loss": 0.0417, "step": 98080 }, { "epoch": 0.63, "learning_rate": 0.0002050355951128523, "loss": 0.0404, "step": 98090 }, { "epoch": 0.63, "learning_rate": 0.0002050259137584954, "loss": 0.0457, "step": 98100 }, { "epoch": 0.63, "learning_rate": 0.00020501623240413842, "loss": 0.0467, "step": 98110 }, { "epoch": 0.63, "learning_rate": 0.0002050065510497815, "loss": 0.052, "step": 98120 }, { "epoch": 0.63, "learning_rate": 0.00020499686969542458, "loss": 0.0446, "step": 98130 }, { "epoch": 0.63, "learning_rate": 0.00020498718834106763, "loss": 0.0449, "step": 98140 }, { "epoch": 0.63, "learning_rate": 0.0002049775069867107, "loss": 0.0481, "step": 98150 }, { "epoch": 0.63, "learning_rate": 0.0002049678256323538, "loss": 0.0447, "step": 98160 }, { "epoch": 0.63, "learning_rate": 0.00020495814427799687, "loss": 0.0543, "step": 98170 }, { "epoch": 0.63, "learning_rate": 0.0002049484629236399, "loss": 0.0556, "step": 98180 }, { "epoch": 0.63, "learning_rate": 0.00020493878156928297, "loss": 0.0458, "step": 98190 }, { "epoch": 0.63, "learning_rate": 0.00020492910021492605, "loss": 0.0418, "step": 98200 }, { "epoch": 0.63, "learning_rate": 0.0002049194188605691, "loss": 0.049, "step": 98210 }, { "epoch": 0.63, "learning_rate": 0.0002049097375062122, "loss": 0.0488, "step": 98220 }, { "epoch": 0.63, "learning_rate": 0.00020490005615185527, "loss": 0.0489, "step": 98230 }, { "epoch": 0.63, "learning_rate": 0.00020489037479749835, "loss": 0.0493, "step": 98240 }, { "epoch": 0.63, "learning_rate": 0.00020488069344314137, "loss": 0.0485, "step": 98250 }, { "epoch": 0.63, "learning_rate": 0.00020487101208878445, "loss": 0.0517, "step": 98260 }, { "epoch": 0.63, "learning_rate": 0.00020486133073442753, "loss": 0.0428, "step": 98270 }, { "epoch": 0.63, "learning_rate": 0.00020485164938007058, "loss": 0.0493, "step": 98280 }, { "epoch": 0.63, "learning_rate": 0.00020484196802571366, "loss": 0.0418, "step": 98290 }, { "epoch": 0.63, "learning_rate": 0.00020483228667135674, "loss": 0.0514, "step": 98300 }, { "epoch": 0.63, "learning_rate": 0.00020482260531699982, "loss": 0.0442, "step": 98310 }, { "epoch": 0.63, "learning_rate": 0.00020481292396264285, "loss": 0.05, "step": 98320 }, { "epoch": 0.63, "learning_rate": 0.00020480324260828593, "loss": 0.0453, "step": 98330 }, { "epoch": 0.63, "learning_rate": 0.00020479356125392898, "loss": 0.0429, "step": 98340 }, { "epoch": 0.63, "learning_rate": 0.00020478387989957206, "loss": 0.0461, "step": 98350 }, { "epoch": 0.63, "learning_rate": 0.00020477419854521514, "loss": 0.0458, "step": 98360 }, { "epoch": 0.63, "learning_rate": 0.00020476451719085822, "loss": 0.045, "step": 98370 }, { "epoch": 0.63, "learning_rate": 0.00020475483583650127, "loss": 0.0465, "step": 98380 }, { "epoch": 0.64, "learning_rate": 0.00020474515448214433, "loss": 0.0466, "step": 98390 }, { "epoch": 0.64, "learning_rate": 0.0002047354731277874, "loss": 0.0434, "step": 98400 }, { "epoch": 0.64, "learning_rate": 0.00020472579177343046, "loss": 0.0447, "step": 98410 }, { "epoch": 0.64, "learning_rate": 0.00020471611041907354, "loss": 0.0483, "step": 98420 }, { "epoch": 0.64, "learning_rate": 0.00020470642906471662, "loss": 0.0509, "step": 98430 }, { "epoch": 0.64, "learning_rate": 0.0002046967477103597, "loss": 0.0433, "step": 98440 }, { "epoch": 0.64, "learning_rate": 0.00020468706635600275, "loss": 0.0487, "step": 98450 }, { "epoch": 0.64, "learning_rate": 0.0002046773850016458, "loss": 0.0474, "step": 98460 }, { "epoch": 0.64, "learning_rate": 0.00020466770364728888, "loss": 0.0533, "step": 98470 }, { "epoch": 0.64, "learning_rate": 0.00020465802229293194, "loss": 0.0476, "step": 98480 }, { "epoch": 0.64, "learning_rate": 0.00020464834093857502, "loss": 0.0491, "step": 98490 }, { "epoch": 0.64, "learning_rate": 0.0002046386595842181, "loss": 0.0455, "step": 98500 }, { "epoch": 0.64, "learning_rate": 0.00020462897822986118, "loss": 0.0526, "step": 98510 }, { "epoch": 0.64, "learning_rate": 0.00020461929687550423, "loss": 0.0479, "step": 98520 }, { "epoch": 0.64, "learning_rate": 0.00020460961552114728, "loss": 0.0476, "step": 98530 }, { "epoch": 0.64, "learning_rate": 0.00020459993416679033, "loss": 0.0516, "step": 98540 }, { "epoch": 0.64, "learning_rate": 0.00020459025281243341, "loss": 0.0484, "step": 98550 }, { "epoch": 0.64, "learning_rate": 0.0002045805714580765, "loss": 0.0525, "step": 98560 }, { "epoch": 0.64, "learning_rate": 0.00020457089010371957, "loss": 0.0496, "step": 98570 }, { "epoch": 0.64, "learning_rate": 0.00020456120874936263, "loss": 0.0442, "step": 98580 }, { "epoch": 0.64, "learning_rate": 0.0002045515273950057, "loss": 0.0482, "step": 98590 }, { "epoch": 0.64, "learning_rate": 0.00020454184604064876, "loss": 0.0488, "step": 98600 }, { "epoch": 0.64, "learning_rate": 0.0002045321646862918, "loss": 0.0519, "step": 98610 }, { "epoch": 0.64, "learning_rate": 0.0002045224833319349, "loss": 0.05, "step": 98620 }, { "epoch": 0.64, "learning_rate": 0.00020451280197757797, "loss": 0.0433, "step": 98630 }, { "epoch": 0.64, "learning_rate": 0.00020450312062322105, "loss": 0.0445, "step": 98640 }, { "epoch": 0.64, "learning_rate": 0.0002044934392688641, "loss": 0.048, "step": 98650 }, { "epoch": 0.64, "learning_rate": 0.00020448375791450718, "loss": 0.0476, "step": 98660 }, { "epoch": 0.64, "learning_rate": 0.00020447407656015024, "loss": 0.0441, "step": 98670 }, { "epoch": 0.64, "learning_rate": 0.0002044643952057933, "loss": 0.0441, "step": 98680 }, { "epoch": 0.64, "learning_rate": 0.00020445471385143637, "loss": 0.0404, "step": 98690 }, { "epoch": 0.64, "learning_rate": 0.00020444503249707945, "loss": 0.0442, "step": 98700 }, { "epoch": 0.64, "learning_rate": 0.00020443535114272253, "loss": 0.0461, "step": 98710 }, { "epoch": 0.64, "learning_rate": 0.00020442566978836558, "loss": 0.0492, "step": 98720 }, { "epoch": 0.64, "learning_rate": 0.00020441598843400866, "loss": 0.0456, "step": 98730 }, { "epoch": 0.64, "learning_rate": 0.00020440630707965169, "loss": 0.0501, "step": 98740 }, { "epoch": 0.64, "learning_rate": 0.00020439662572529477, "loss": 0.0418, "step": 98750 }, { "epoch": 0.64, "learning_rate": 0.00020438694437093785, "loss": 0.0413, "step": 98760 }, { "epoch": 0.64, "learning_rate": 0.00020437726301658093, "loss": 0.0482, "step": 98770 }, { "epoch": 0.64, "learning_rate": 0.00020436758166222398, "loss": 0.0524, "step": 98780 }, { "epoch": 0.64, "learning_rate": 0.00020435790030786706, "loss": 0.0442, "step": 98790 }, { "epoch": 0.64, "learning_rate": 0.00020434821895351014, "loss": 0.051, "step": 98800 }, { "epoch": 0.64, "learning_rate": 0.00020433853759915316, "loss": 0.0427, "step": 98810 }, { "epoch": 0.64, "learning_rate": 0.00020432885624479624, "loss": 0.0445, "step": 98820 }, { "epoch": 0.64, "learning_rate": 0.00020431917489043932, "loss": 0.0493, "step": 98830 }, { "epoch": 0.64, "learning_rate": 0.0002043094935360824, "loss": 0.0458, "step": 98840 }, { "epoch": 0.64, "learning_rate": 0.00020429981218172546, "loss": 0.0565, "step": 98850 }, { "epoch": 0.64, "learning_rate": 0.00020429013082736853, "loss": 0.054, "step": 98860 }, { "epoch": 0.64, "learning_rate": 0.00020428044947301161, "loss": 0.046, "step": 98870 }, { "epoch": 0.64, "learning_rate": 0.00020427076811865464, "loss": 0.0451, "step": 98880 }, { "epoch": 0.64, "learning_rate": 0.00020426108676429772, "loss": 0.0492, "step": 98890 }, { "epoch": 0.64, "learning_rate": 0.0002042514054099408, "loss": 0.0461, "step": 98900 }, { "epoch": 0.64, "learning_rate": 0.00020424172405558388, "loss": 0.047, "step": 98910 }, { "epoch": 0.64, "learning_rate": 0.00020423204270122693, "loss": 0.0456, "step": 98920 }, { "epoch": 0.64, "learning_rate": 0.00020422236134687, "loss": 0.0457, "step": 98930 }, { "epoch": 0.64, "learning_rate": 0.0002042126799925131, "loss": 0.0439, "step": 98940 }, { "epoch": 0.64, "learning_rate": 0.00020420299863815612, "loss": 0.0442, "step": 98950 }, { "epoch": 0.64, "learning_rate": 0.0002041933172837992, "loss": 0.0476, "step": 98960 }, { "epoch": 0.64, "learning_rate": 0.00020418363592944228, "loss": 0.0525, "step": 98970 }, { "epoch": 0.64, "learning_rate": 0.00020417395457508533, "loss": 0.0444, "step": 98980 }, { "epoch": 0.64, "learning_rate": 0.0002041642732207284, "loss": 0.0536, "step": 98990 }, { "epoch": 0.64, "learning_rate": 0.0002041545918663715, "loss": 0.041, "step": 99000 }, { "epoch": 0.64, "eval_cer": 0.9199168455541746, "eval_loss": 0.031374961137771606, "eval_runtime": 119.7911, "eval_samples_per_second": 16.696, "eval_steps_per_second": 4.174, "step": 99000 }, { "epoch": 0.64, "learning_rate": 0.00020414491051201457, "loss": 0.0421, "step": 99010 }, { "epoch": 0.64, "learning_rate": 0.0002041352291576576, "loss": 0.052, "step": 99020 }, { "epoch": 0.64, "learning_rate": 0.00020412554780330067, "loss": 0.055, "step": 99030 }, { "epoch": 0.64, "learning_rate": 0.00020411586644894375, "loss": 0.0496, "step": 99040 }, { "epoch": 0.64, "learning_rate": 0.0002041061850945868, "loss": 0.0434, "step": 99050 }, { "epoch": 0.64, "learning_rate": 0.0002040965037402299, "loss": 0.0449, "step": 99060 }, { "epoch": 0.64, "learning_rate": 0.00020408682238587297, "loss": 0.0464, "step": 99070 }, { "epoch": 0.64, "learning_rate": 0.00020407714103151605, "loss": 0.05, "step": 99080 }, { "epoch": 0.64, "learning_rate": 0.00020406745967715907, "loss": 0.0438, "step": 99090 }, { "epoch": 0.64, "learning_rate": 0.00020405777832280215, "loss": 0.052, "step": 99100 }, { "epoch": 0.64, "learning_rate": 0.00020404809696844523, "loss": 0.043, "step": 99110 }, { "epoch": 0.64, "learning_rate": 0.00020403841561408828, "loss": 0.0469, "step": 99120 }, { "epoch": 0.64, "learning_rate": 0.00020402873425973136, "loss": 0.0458, "step": 99130 }, { "epoch": 0.64, "learning_rate": 0.00020401905290537444, "loss": 0.0505, "step": 99140 }, { "epoch": 0.64, "learning_rate": 0.0002040093715510175, "loss": 0.0452, "step": 99150 }, { "epoch": 0.64, "learning_rate": 0.00020399969019666055, "loss": 0.044, "step": 99160 }, { "epoch": 0.64, "learning_rate": 0.00020399000884230363, "loss": 0.0562, "step": 99170 }, { "epoch": 0.64, "learning_rate": 0.00020398032748794668, "loss": 0.0437, "step": 99180 }, { "epoch": 0.64, "learning_rate": 0.00020397064613358976, "loss": 0.0437, "step": 99190 }, { "epoch": 0.64, "learning_rate": 0.00020396096477923284, "loss": 0.0531, "step": 99200 }, { "epoch": 0.64, "learning_rate": 0.00020395128342487592, "loss": 0.0487, "step": 99210 }, { "epoch": 0.64, "learning_rate": 0.00020394160207051897, "loss": 0.0442, "step": 99220 }, { "epoch": 0.64, "learning_rate": 0.00020393192071616203, "loss": 0.0418, "step": 99230 }, { "epoch": 0.64, "learning_rate": 0.0002039222393618051, "loss": 0.0455, "step": 99240 }, { "epoch": 0.64, "learning_rate": 0.00020391255800744816, "loss": 0.0404, "step": 99250 }, { "epoch": 0.64, "learning_rate": 0.00020390287665309124, "loss": 0.0446, "step": 99260 }, { "epoch": 0.64, "learning_rate": 0.00020389319529873432, "loss": 0.0501, "step": 99270 }, { "epoch": 0.64, "learning_rate": 0.0002038835139443774, "loss": 0.0462, "step": 99280 }, { "epoch": 0.64, "learning_rate": 0.00020387383259002045, "loss": 0.0435, "step": 99290 }, { "epoch": 0.64, "learning_rate": 0.0002038641512356635, "loss": 0.0411, "step": 99300 }, { "epoch": 0.64, "learning_rate": 0.00020385446988130658, "loss": 0.0448, "step": 99310 }, { "epoch": 0.64, "learning_rate": 0.00020384478852694964, "loss": 0.0513, "step": 99320 }, { "epoch": 0.64, "learning_rate": 0.00020383510717259272, "loss": 0.0451, "step": 99330 }, { "epoch": 0.64, "learning_rate": 0.0002038254258182358, "loss": 0.0423, "step": 99340 }, { "epoch": 0.64, "learning_rate": 0.00020381574446387885, "loss": 0.0548, "step": 99350 }, { "epoch": 0.64, "learning_rate": 0.00020380606310952193, "loss": 0.0534, "step": 99360 }, { "epoch": 0.64, "learning_rate": 0.00020379638175516498, "loss": 0.0445, "step": 99370 }, { "epoch": 0.64, "learning_rate": 0.00020378670040080803, "loss": 0.0425, "step": 99380 }, { "epoch": 0.64, "learning_rate": 0.0002037770190464511, "loss": 0.044, "step": 99390 }, { "epoch": 0.64, "learning_rate": 0.0002037673376920942, "loss": 0.0484, "step": 99400 }, { "epoch": 0.64, "learning_rate": 0.00020375765633773727, "loss": 0.0431, "step": 99410 }, { "epoch": 0.64, "learning_rate": 0.00020374797498338033, "loss": 0.0464, "step": 99420 }, { "epoch": 0.64, "learning_rate": 0.0002037382936290234, "loss": 0.0525, "step": 99430 }, { "epoch": 0.64, "learning_rate": 0.00020372861227466646, "loss": 0.0483, "step": 99440 }, { "epoch": 0.64, "learning_rate": 0.0002037189309203095, "loss": 0.0471, "step": 99450 }, { "epoch": 0.64, "learning_rate": 0.0002037092495659526, "loss": 0.0454, "step": 99460 }, { "epoch": 0.64, "learning_rate": 0.00020369956821159567, "loss": 0.0464, "step": 99470 }, { "epoch": 0.64, "learning_rate": 0.00020368988685723875, "loss": 0.0515, "step": 99480 }, { "epoch": 0.64, "learning_rate": 0.0002036802055028818, "loss": 0.0463, "step": 99490 }, { "epoch": 0.64, "learning_rate": 0.00020367052414852488, "loss": 0.0513, "step": 99500 }, { "epoch": 0.64, "learning_rate": 0.00020366084279416794, "loss": 0.0452, "step": 99510 }, { "epoch": 0.64, "learning_rate": 0.000203651161439811, "loss": 0.0462, "step": 99520 }, { "epoch": 0.64, "learning_rate": 0.00020364148008545407, "loss": 0.0465, "step": 99530 }, { "epoch": 0.64, "learning_rate": 0.00020363179873109715, "loss": 0.0484, "step": 99540 }, { "epoch": 0.64, "learning_rate": 0.0002036221173767402, "loss": 0.0482, "step": 99550 }, { "epoch": 0.64, "learning_rate": 0.00020361243602238328, "loss": 0.0533, "step": 99560 }, { "epoch": 0.64, "learning_rate": 0.00020360275466802636, "loss": 0.049, "step": 99570 }, { "epoch": 0.64, "learning_rate": 0.00020359307331366939, "loss": 0.052, "step": 99580 }, { "epoch": 0.64, "learning_rate": 0.00020358339195931247, "loss": 0.046, "step": 99590 }, { "epoch": 0.64, "learning_rate": 0.00020357371060495555, "loss": 0.0468, "step": 99600 }, { "epoch": 0.64, "learning_rate": 0.00020356402925059862, "loss": 0.0473, "step": 99610 }, { "epoch": 0.64, "learning_rate": 0.00020355434789624168, "loss": 0.0488, "step": 99620 }, { "epoch": 0.64, "learning_rate": 0.00020354466654188476, "loss": 0.0472, "step": 99630 }, { "epoch": 0.64, "learning_rate": 0.00020353498518752784, "loss": 0.0508, "step": 99640 }, { "epoch": 0.64, "learning_rate": 0.00020352530383317086, "loss": 0.0458, "step": 99650 }, { "epoch": 0.64, "learning_rate": 0.00020351562247881394, "loss": 0.0429, "step": 99660 }, { "epoch": 0.64, "learning_rate": 0.00020350594112445702, "loss": 0.053, "step": 99670 }, { "epoch": 0.64, "learning_rate": 0.0002034962597701001, "loss": 0.0543, "step": 99680 }, { "epoch": 0.64, "learning_rate": 0.00020348657841574315, "loss": 0.0457, "step": 99690 }, { "epoch": 0.64, "learning_rate": 0.00020347689706138623, "loss": 0.0441, "step": 99700 }, { "epoch": 0.64, "learning_rate": 0.00020346721570702931, "loss": 0.0499, "step": 99710 }, { "epoch": 0.64, "learning_rate": 0.00020345753435267234, "loss": 0.0405, "step": 99720 }, { "epoch": 0.64, "learning_rate": 0.00020344785299831542, "loss": 0.0452, "step": 99730 }, { "epoch": 0.64, "learning_rate": 0.0002034381716439585, "loss": 0.0442, "step": 99740 }, { "epoch": 0.64, "learning_rate": 0.00020342849028960155, "loss": 0.0453, "step": 99750 }, { "epoch": 0.64, "learning_rate": 0.00020341880893524463, "loss": 0.046, "step": 99760 }, { "epoch": 0.64, "learning_rate": 0.0002034091275808877, "loss": 0.047, "step": 99770 }, { "epoch": 0.64, "learning_rate": 0.0002033994462265308, "loss": 0.0488, "step": 99780 }, { "epoch": 0.64, "learning_rate": 0.00020338976487217382, "loss": 0.0508, "step": 99790 }, { "epoch": 0.64, "learning_rate": 0.0002033800835178169, "loss": 0.0525, "step": 99800 }, { "epoch": 0.64, "learning_rate": 0.00020337040216345998, "loss": 0.0474, "step": 99810 }, { "epoch": 0.64, "learning_rate": 0.00020336072080910303, "loss": 0.05, "step": 99820 }, { "epoch": 0.64, "learning_rate": 0.0002033510394547461, "loss": 0.0409, "step": 99830 }, { "epoch": 0.64, "learning_rate": 0.0002033413581003892, "loss": 0.0426, "step": 99840 }, { "epoch": 0.64, "learning_rate": 0.00020333167674603221, "loss": 0.0485, "step": 99850 }, { "epoch": 0.64, "learning_rate": 0.0002033219953916753, "loss": 0.0488, "step": 99860 }, { "epoch": 0.64, "learning_rate": 0.00020331231403731837, "loss": 0.048, "step": 99870 }, { "epoch": 0.64, "learning_rate": 0.00020330263268296145, "loss": 0.0496, "step": 99880 }, { "epoch": 0.64, "learning_rate": 0.0002032929513286045, "loss": 0.045, "step": 99890 }, { "epoch": 0.64, "learning_rate": 0.00020328326997424759, "loss": 0.0524, "step": 99900 }, { "epoch": 0.64, "learning_rate": 0.00020327358861989067, "loss": 0.049, "step": 99910 }, { "epoch": 0.64, "learning_rate": 0.0002032639072655337, "loss": 0.0527, "step": 99920 }, { "epoch": 0.64, "learning_rate": 0.00020325422591117677, "loss": 0.0494, "step": 99930 }, { "epoch": 0.65, "learning_rate": 0.00020324454455681985, "loss": 0.0595, "step": 99940 }, { "epoch": 0.65, "learning_rate": 0.0002032348632024629, "loss": 0.0497, "step": 99950 }, { "epoch": 0.65, "learning_rate": 0.00020322518184810598, "loss": 0.0456, "step": 99960 }, { "epoch": 0.65, "learning_rate": 0.00020321550049374906, "loss": 0.049, "step": 99970 }, { "epoch": 0.65, "learning_rate": 0.00020320581913939214, "loss": 0.0575, "step": 99980 }, { "epoch": 0.65, "learning_rate": 0.00020319613778503517, "loss": 0.0502, "step": 99990 }, { "epoch": 0.65, "learning_rate": 0.00020318645643067825, "loss": 0.0464, "step": 100000 }, { "epoch": 0.65, "eval_cer": 0.9199602304824314, "eval_loss": 0.031852345913648605, "eval_runtime": 119.8085, "eval_samples_per_second": 16.693, "eval_steps_per_second": 4.173, "step": 100000 }, { "epoch": 0.65, "learning_rate": 0.00020317677507632133, "loss": 0.0428, "step": 100010 }, { "epoch": 0.65, "learning_rate": 0.00020316709372196438, "loss": 0.0554, "step": 100020 }, { "epoch": 0.65, "learning_rate": 0.00020315741236760746, "loss": 0.0511, "step": 100030 }, { "epoch": 0.65, "learning_rate": 0.00020314773101325054, "loss": 0.0443, "step": 100040 }, { "epoch": 0.65, "learning_rate": 0.00020313804965889362, "loss": 0.0414, "step": 100050 }, { "epoch": 0.65, "learning_rate": 0.00020312836830453665, "loss": 0.0453, "step": 100060 }, { "epoch": 0.65, "learning_rate": 0.00020311868695017973, "loss": 0.0445, "step": 100070 }, { "epoch": 0.65, "learning_rate": 0.0002031090055958228, "loss": 0.0548, "step": 100080 }, { "epoch": 0.65, "learning_rate": 0.00020309932424146586, "loss": 0.0541, "step": 100090 }, { "epoch": 0.65, "learning_rate": 0.00020308964288710894, "loss": 0.0486, "step": 100100 }, { "epoch": 0.65, "learning_rate": 0.00020307996153275202, "loss": 0.0559, "step": 100110 }, { "epoch": 0.65, "learning_rate": 0.00020307028017839507, "loss": 0.052, "step": 100120 }, { "epoch": 0.65, "learning_rate": 0.00020306059882403812, "loss": 0.0437, "step": 100130 }, { "epoch": 0.65, "learning_rate": 0.0002030509174696812, "loss": 0.047, "step": 100140 }, { "epoch": 0.65, "learning_rate": 0.00020304123611532426, "loss": 0.0514, "step": 100150 }, { "epoch": 0.65, "learning_rate": 0.00020303155476096734, "loss": 0.0514, "step": 100160 }, { "epoch": 0.65, "learning_rate": 0.00020302187340661042, "loss": 0.0455, "step": 100170 }, { "epoch": 0.65, "learning_rate": 0.0002030121920522535, "loss": 0.0497, "step": 100180 }, { "epoch": 0.65, "learning_rate": 0.00020300251069789655, "loss": 0.0497, "step": 100190 }, { "epoch": 0.65, "learning_rate": 0.0002029928293435396, "loss": 0.0506, "step": 100200 }, { "epoch": 0.65, "learning_rate": 0.00020298314798918268, "loss": 0.045, "step": 100210 }, { "epoch": 0.65, "learning_rate": 0.00020297346663482573, "loss": 0.0523, "step": 100220 }, { "epoch": 0.65, "learning_rate": 0.0002029637852804688, "loss": 0.0544, "step": 100230 }, { "epoch": 0.65, "learning_rate": 0.0002029541039261119, "loss": 0.0438, "step": 100240 }, { "epoch": 0.65, "learning_rate": 0.00020294442257175497, "loss": 0.0459, "step": 100250 }, { "epoch": 0.65, "learning_rate": 0.00020293474121739803, "loss": 0.0476, "step": 100260 }, { "epoch": 0.65, "learning_rate": 0.00020292505986304108, "loss": 0.0431, "step": 100270 }, { "epoch": 0.65, "learning_rate": 0.00020291537850868416, "loss": 0.0439, "step": 100280 }, { "epoch": 0.65, "learning_rate": 0.0002029056971543272, "loss": 0.045, "step": 100290 }, { "epoch": 0.65, "learning_rate": 0.0002028960157999703, "loss": 0.0543, "step": 100300 }, { "epoch": 0.65, "learning_rate": 0.00020288633444561337, "loss": 0.048, "step": 100310 }, { "epoch": 0.65, "learning_rate": 0.00020287665309125642, "loss": 0.0411, "step": 100320 }, { "epoch": 0.65, "learning_rate": 0.0002028669717368995, "loss": 0.044, "step": 100330 }, { "epoch": 0.65, "learning_rate": 0.00020285729038254256, "loss": 0.0529, "step": 100340 }, { "epoch": 0.65, "learning_rate": 0.0002028476090281856, "loss": 0.045, "step": 100350 }, { "epoch": 0.65, "learning_rate": 0.0002028379276738287, "loss": 0.0443, "step": 100360 }, { "epoch": 0.65, "learning_rate": 0.00020282824631947177, "loss": 0.0456, "step": 100370 }, { "epoch": 0.65, "learning_rate": 0.00020281856496511485, "loss": 0.0499, "step": 100380 }, { "epoch": 0.65, "learning_rate": 0.0002028088836107579, "loss": 0.0487, "step": 100390 }, { "epoch": 0.65, "learning_rate": 0.00020279920225640098, "loss": 0.0576, "step": 100400 }, { "epoch": 0.65, "learning_rate": 0.00020278952090204403, "loss": 0.0486, "step": 100410 }, { "epoch": 0.65, "learning_rate": 0.00020277983954768709, "loss": 0.0443, "step": 100420 }, { "epoch": 0.65, "learning_rate": 0.00020277015819333016, "loss": 0.0468, "step": 100430 }, { "epoch": 0.65, "learning_rate": 0.00020276047683897324, "loss": 0.0493, "step": 100440 }, { "epoch": 0.65, "learning_rate": 0.00020275079548461632, "loss": 0.0523, "step": 100450 }, { "epoch": 0.65, "learning_rate": 0.00020274111413025938, "loss": 0.0506, "step": 100460 }, { "epoch": 0.65, "learning_rate": 0.00020273143277590246, "loss": 0.0417, "step": 100470 }, { "epoch": 0.65, "learning_rate": 0.0002027217514215455, "loss": 0.0403, "step": 100480 }, { "epoch": 0.65, "learning_rate": 0.00020271207006718856, "loss": 0.0601, "step": 100490 }, { "epoch": 0.65, "learning_rate": 0.00020270238871283164, "loss": 0.0448, "step": 100500 }, { "epoch": 0.65, "learning_rate": 0.00020269270735847472, "loss": 0.0474, "step": 100510 }, { "epoch": 0.65, "learning_rate": 0.00020268302600411777, "loss": 0.0451, "step": 100520 }, { "epoch": 0.65, "learning_rate": 0.00020267334464976085, "loss": 0.0433, "step": 100530 }, { "epoch": 0.65, "learning_rate": 0.00020266366329540393, "loss": 0.0482, "step": 100540 }, { "epoch": 0.65, "learning_rate": 0.00020265398194104696, "loss": 0.0442, "step": 100550 }, { "epoch": 0.65, "learning_rate": 0.00020264430058669004, "loss": 0.0504, "step": 100560 }, { "epoch": 0.65, "learning_rate": 0.00020263461923233312, "loss": 0.0479, "step": 100570 }, { "epoch": 0.65, "learning_rate": 0.0002026249378779762, "loss": 0.0538, "step": 100580 }, { "epoch": 0.65, "learning_rate": 0.00020261525652361925, "loss": 0.0466, "step": 100590 }, { "epoch": 0.65, "learning_rate": 0.00020260557516926233, "loss": 0.0458, "step": 100600 }, { "epoch": 0.65, "learning_rate": 0.0002025958938149054, "loss": 0.0468, "step": 100610 }, { "epoch": 0.65, "learning_rate": 0.00020258621246054844, "loss": 0.0568, "step": 100620 }, { "epoch": 0.65, "learning_rate": 0.00020257653110619152, "loss": 0.0486, "step": 100630 }, { "epoch": 0.65, "learning_rate": 0.0002025668497518346, "loss": 0.0468, "step": 100640 }, { "epoch": 0.65, "learning_rate": 0.00020255716839747768, "loss": 0.0455, "step": 100650 }, { "epoch": 0.65, "learning_rate": 0.00020254748704312073, "loss": 0.0515, "step": 100660 }, { "epoch": 0.65, "learning_rate": 0.0002025378056887638, "loss": 0.0435, "step": 100670 }, { "epoch": 0.65, "learning_rate": 0.0002025281243344069, "loss": 0.0456, "step": 100680 }, { "epoch": 0.65, "learning_rate": 0.00020251844298004991, "loss": 0.0408, "step": 100690 }, { "epoch": 0.65, "learning_rate": 0.000202508761625693, "loss": 0.0528, "step": 100700 }, { "epoch": 0.65, "learning_rate": 0.00020249908027133607, "loss": 0.0402, "step": 100710 }, { "epoch": 0.65, "learning_rate": 0.00020248939891697913, "loss": 0.0497, "step": 100720 }, { "epoch": 0.65, "learning_rate": 0.0002024797175626222, "loss": 0.0427, "step": 100730 }, { "epoch": 0.65, "learning_rate": 0.00020247003620826529, "loss": 0.0526, "step": 100740 }, { "epoch": 0.65, "learning_rate": 0.00020246035485390837, "loss": 0.041, "step": 100750 }, { "epoch": 0.65, "learning_rate": 0.0002024506734995514, "loss": 0.0444, "step": 100760 }, { "epoch": 0.65, "learning_rate": 0.00020244099214519447, "loss": 0.0448, "step": 100770 }, { "epoch": 0.65, "learning_rate": 0.00020243131079083755, "loss": 0.0482, "step": 100780 }, { "epoch": 0.65, "learning_rate": 0.0002024216294364806, "loss": 0.0457, "step": 100790 }, { "epoch": 0.65, "learning_rate": 0.00020241194808212368, "loss": 0.0468, "step": 100800 }, { "epoch": 0.65, "learning_rate": 0.00020240226672776676, "loss": 0.0431, "step": 100810 }, { "epoch": 0.65, "learning_rate": 0.00020239258537340984, "loss": 0.0416, "step": 100820 }, { "epoch": 0.65, "learning_rate": 0.00020238290401905287, "loss": 0.0398, "step": 100830 }, { "epoch": 0.65, "learning_rate": 0.00020237322266469595, "loss": 0.0487, "step": 100840 }, { "epoch": 0.65, "learning_rate": 0.00020236354131033903, "loss": 0.0479, "step": 100850 }, { "epoch": 0.65, "learning_rate": 0.00020235385995598208, "loss": 0.0425, "step": 100860 }, { "epoch": 0.65, "learning_rate": 0.00020234417860162516, "loss": 0.0442, "step": 100870 }, { "epoch": 0.65, "learning_rate": 0.00020233449724726824, "loss": 0.0416, "step": 100880 }, { "epoch": 0.65, "learning_rate": 0.00020232481589291132, "loss": 0.048, "step": 100890 }, { "epoch": 0.65, "learning_rate": 0.00020231513453855435, "loss": 0.0416, "step": 100900 }, { "epoch": 0.65, "learning_rate": 0.00020230545318419743, "loss": 0.0426, "step": 100910 }, { "epoch": 0.65, "learning_rate": 0.00020229577182984048, "loss": 0.0442, "step": 100920 }, { "epoch": 0.65, "learning_rate": 0.00020228609047548356, "loss": 0.0427, "step": 100930 }, { "epoch": 0.65, "learning_rate": 0.00020227640912112664, "loss": 0.0494, "step": 100940 }, { "epoch": 0.65, "learning_rate": 0.00020226672776676972, "loss": 0.0436, "step": 100950 }, { "epoch": 0.65, "learning_rate": 0.00020225704641241277, "loss": 0.0447, "step": 100960 }, { "epoch": 0.65, "learning_rate": 0.00020224736505805582, "loss": 0.0379, "step": 100970 }, { "epoch": 0.65, "learning_rate": 0.0002022376837036989, "loss": 0.0522, "step": 100980 }, { "epoch": 0.65, "learning_rate": 0.00020222800234934196, "loss": 0.0512, "step": 100990 }, { "epoch": 0.65, "learning_rate": 0.00020221832099498504, "loss": 0.0519, "step": 101000 }, { "epoch": 0.65, "eval_cer": 0.9199032877640945, "eval_loss": 0.030138300731778145, "eval_runtime": 119.833, "eval_samples_per_second": 16.69, "eval_steps_per_second": 4.172, "step": 101000 }, { "epoch": 0.65, "learning_rate": 0.00020220863964062812, "loss": 0.0599, "step": 101010 }, { "epoch": 0.65, "learning_rate": 0.0002021989582862712, "loss": 0.0476, "step": 101020 }, { "epoch": 0.65, "learning_rate": 0.00020218927693191425, "loss": 0.0482, "step": 101030 }, { "epoch": 0.65, "learning_rate": 0.0002021795955775573, "loss": 0.0523, "step": 101040 }, { "epoch": 0.65, "learning_rate": 0.00020216991422320038, "loss": 0.0426, "step": 101050 }, { "epoch": 0.65, "learning_rate": 0.00020216023286884343, "loss": 0.0457, "step": 101060 }, { "epoch": 0.65, "learning_rate": 0.0002021505515144865, "loss": 0.046, "step": 101070 }, { "epoch": 0.65, "learning_rate": 0.0002021408701601296, "loss": 0.0539, "step": 101080 }, { "epoch": 0.65, "learning_rate": 0.00020213118880577267, "loss": 0.0463, "step": 101090 }, { "epoch": 0.65, "learning_rate": 0.00020212150745141572, "loss": 0.0446, "step": 101100 }, { "epoch": 0.65, "learning_rate": 0.00020211182609705878, "loss": 0.0498, "step": 101110 }, { "epoch": 0.65, "learning_rate": 0.00020210214474270183, "loss": 0.0477, "step": 101120 }, { "epoch": 0.65, "learning_rate": 0.0002020924633883449, "loss": 0.059, "step": 101130 }, { "epoch": 0.65, "learning_rate": 0.000202082782033988, "loss": 0.0476, "step": 101140 }, { "epoch": 0.65, "learning_rate": 0.00020207310067963107, "loss": 0.0507, "step": 101150 }, { "epoch": 0.65, "learning_rate": 0.00020206341932527412, "loss": 0.0497, "step": 101160 }, { "epoch": 0.65, "learning_rate": 0.0002020537379709172, "loss": 0.0494, "step": 101170 }, { "epoch": 0.65, "learning_rate": 0.00020204405661656025, "loss": 0.0454, "step": 101180 }, { "epoch": 0.65, "learning_rate": 0.0002020343752622033, "loss": 0.0415, "step": 101190 }, { "epoch": 0.65, "learning_rate": 0.0002020246939078464, "loss": 0.0486, "step": 101200 }, { "epoch": 0.65, "learning_rate": 0.00020201501255348947, "loss": 0.0479, "step": 101210 }, { "epoch": 0.65, "learning_rate": 0.00020200533119913255, "loss": 0.0552, "step": 101220 }, { "epoch": 0.65, "learning_rate": 0.0002019956498447756, "loss": 0.049, "step": 101230 }, { "epoch": 0.65, "learning_rate": 0.00020198596849041868, "loss": 0.0444, "step": 101240 }, { "epoch": 0.65, "learning_rate": 0.00020197628713606173, "loss": 0.0546, "step": 101250 }, { "epoch": 0.65, "learning_rate": 0.00020196660578170478, "loss": 0.0489, "step": 101260 }, { "epoch": 0.65, "learning_rate": 0.00020195692442734786, "loss": 0.0573, "step": 101270 }, { "epoch": 0.65, "learning_rate": 0.00020194724307299094, "loss": 0.0459, "step": 101280 }, { "epoch": 0.65, "learning_rate": 0.00020193756171863402, "loss": 0.0447, "step": 101290 }, { "epoch": 0.65, "learning_rate": 0.00020192788036427708, "loss": 0.044, "step": 101300 }, { "epoch": 0.65, "learning_rate": 0.00020191819900992016, "loss": 0.041, "step": 101310 }, { "epoch": 0.65, "learning_rate": 0.00020190851765556318, "loss": 0.0466, "step": 101320 }, { "epoch": 0.65, "learning_rate": 0.00020189883630120626, "loss": 0.0431, "step": 101330 }, { "epoch": 0.65, "learning_rate": 0.00020188915494684934, "loss": 0.046, "step": 101340 }, { "epoch": 0.65, "learning_rate": 0.00020187947359249242, "loss": 0.0419, "step": 101350 }, { "epoch": 0.65, "learning_rate": 0.00020186979223813547, "loss": 0.0424, "step": 101360 }, { "epoch": 0.65, "learning_rate": 0.00020186011088377855, "loss": 0.0457, "step": 101370 }, { "epoch": 0.65, "learning_rate": 0.00020185042952942163, "loss": 0.0436, "step": 101380 }, { "epoch": 0.65, "learning_rate": 0.00020184074817506466, "loss": 0.0501, "step": 101390 }, { "epoch": 0.65, "learning_rate": 0.00020183106682070774, "loss": 0.0508, "step": 101400 }, { "epoch": 0.65, "learning_rate": 0.00020182138546635082, "loss": 0.044, "step": 101410 }, { "epoch": 0.65, "learning_rate": 0.0002018117041119939, "loss": 0.0464, "step": 101420 }, { "epoch": 0.65, "learning_rate": 0.00020180202275763695, "loss": 0.0426, "step": 101430 }, { "epoch": 0.65, "learning_rate": 0.00020179234140328003, "loss": 0.0502, "step": 101440 }, { "epoch": 0.65, "learning_rate": 0.0002017826600489231, "loss": 0.0464, "step": 101450 }, { "epoch": 0.65, "learning_rate": 0.00020177297869456614, "loss": 0.052, "step": 101460 }, { "epoch": 0.65, "learning_rate": 0.00020176329734020922, "loss": 0.0515, "step": 101470 }, { "epoch": 0.65, "learning_rate": 0.0002017536159858523, "loss": 0.0408, "step": 101480 }, { "epoch": 0.66, "learning_rate": 0.00020174393463149538, "loss": 0.0485, "step": 101490 }, { "epoch": 0.66, "learning_rate": 0.00020173425327713843, "loss": 0.0456, "step": 101500 }, { "epoch": 0.66, "learning_rate": 0.0002017245719227815, "loss": 0.0555, "step": 101510 }, { "epoch": 0.66, "learning_rate": 0.0002017148905684246, "loss": 0.053, "step": 101520 }, { "epoch": 0.66, "learning_rate": 0.00020170520921406761, "loss": 0.0429, "step": 101530 }, { "epoch": 0.66, "learning_rate": 0.0002016955278597107, "loss": 0.0441, "step": 101540 }, { "epoch": 0.66, "learning_rate": 0.00020168584650535377, "loss": 0.0464, "step": 101550 }, { "epoch": 0.66, "learning_rate": 0.00020167616515099683, "loss": 0.0408, "step": 101560 }, { "epoch": 0.66, "learning_rate": 0.0002016664837966399, "loss": 0.0533, "step": 101570 }, { "epoch": 0.66, "learning_rate": 0.00020165680244228299, "loss": 0.0524, "step": 101580 }, { "epoch": 0.66, "learning_rate": 0.00020164712108792607, "loss": 0.0496, "step": 101590 }, { "epoch": 0.66, "learning_rate": 0.0002016374397335691, "loss": 0.0488, "step": 101600 }, { "epoch": 0.66, "learning_rate": 0.00020162775837921217, "loss": 0.0467, "step": 101610 }, { "epoch": 0.66, "learning_rate": 0.00020161807702485525, "loss": 0.0403, "step": 101620 }, { "epoch": 0.66, "learning_rate": 0.0002016083956704983, "loss": 0.0476, "step": 101630 }, { "epoch": 0.66, "learning_rate": 0.00020159871431614138, "loss": 0.0473, "step": 101640 }, { "epoch": 0.66, "learning_rate": 0.00020158903296178446, "loss": 0.0501, "step": 101650 }, { "epoch": 0.66, "learning_rate": 0.00020157935160742754, "loss": 0.0409, "step": 101660 }, { "epoch": 0.66, "learning_rate": 0.00020156967025307057, "loss": 0.0457, "step": 101670 }, { "epoch": 0.66, "learning_rate": 0.00020155998889871365, "loss": 0.0567, "step": 101680 }, { "epoch": 0.66, "learning_rate": 0.00020155030754435673, "loss": 0.0499, "step": 101690 }, { "epoch": 0.66, "learning_rate": 0.00020154062618999978, "loss": 0.049, "step": 101700 }, { "epoch": 0.66, "learning_rate": 0.00020153094483564286, "loss": 0.0486, "step": 101710 }, { "epoch": 0.66, "learning_rate": 0.00020152126348128594, "loss": 0.041, "step": 101720 }, { "epoch": 0.66, "learning_rate": 0.000201511582126929, "loss": 0.0416, "step": 101730 }, { "epoch": 0.66, "learning_rate": 0.00020150190077257205, "loss": 0.0488, "step": 101740 }, { "epoch": 0.66, "learning_rate": 0.00020149221941821513, "loss": 0.0576, "step": 101750 }, { "epoch": 0.66, "learning_rate": 0.00020148253806385818, "loss": 0.0483, "step": 101760 }, { "epoch": 0.66, "learning_rate": 0.00020147285670950126, "loss": 0.0514, "step": 101770 }, { "epoch": 0.66, "learning_rate": 0.00020146317535514434, "loss": 0.0441, "step": 101780 }, { "epoch": 0.66, "learning_rate": 0.00020145349400078742, "loss": 0.0463, "step": 101790 }, { "epoch": 0.66, "learning_rate": 0.00020144381264643047, "loss": 0.0533, "step": 101800 }, { "epoch": 0.66, "learning_rate": 0.00020143413129207352, "loss": 0.0484, "step": 101810 }, { "epoch": 0.66, "learning_rate": 0.0002014244499377166, "loss": 0.0462, "step": 101820 }, { "epoch": 0.66, "learning_rate": 0.00020141476858335966, "loss": 0.048, "step": 101830 }, { "epoch": 0.66, "learning_rate": 0.00020140508722900273, "loss": 0.0459, "step": 101840 }, { "epoch": 0.66, "learning_rate": 0.00020139540587464581, "loss": 0.0627, "step": 101850 }, { "epoch": 0.66, "learning_rate": 0.0002013857245202889, "loss": 0.0418, "step": 101860 }, { "epoch": 0.66, "learning_rate": 0.00020137604316593195, "loss": 0.0499, "step": 101870 }, { "epoch": 0.66, "learning_rate": 0.000201366361811575, "loss": 0.046, "step": 101880 }, { "epoch": 0.66, "learning_rate": 0.00020135668045721808, "loss": 0.0447, "step": 101890 }, { "epoch": 0.66, "learning_rate": 0.00020134699910286113, "loss": 0.0471, "step": 101900 }, { "epoch": 0.66, "learning_rate": 0.0002013373177485042, "loss": 0.0522, "step": 101910 }, { "epoch": 0.66, "learning_rate": 0.0002013276363941473, "loss": 0.0463, "step": 101920 }, { "epoch": 0.66, "learning_rate": 0.00020131795503979034, "loss": 0.0388, "step": 101930 }, { "epoch": 0.66, "learning_rate": 0.00020130827368543342, "loss": 0.0439, "step": 101940 }, { "epoch": 0.66, "learning_rate": 0.00020129859233107648, "loss": 0.0471, "step": 101950 }, { "epoch": 0.66, "learning_rate": 0.00020128891097671953, "loss": 0.0507, "step": 101960 }, { "epoch": 0.66, "learning_rate": 0.0002012792296223626, "loss": 0.0431, "step": 101970 }, { "epoch": 0.66, "learning_rate": 0.0002012695482680057, "loss": 0.0494, "step": 101980 }, { "epoch": 0.66, "learning_rate": 0.00020125986691364877, "loss": 0.0458, "step": 101990 }, { "epoch": 0.66, "learning_rate": 0.00020125018555929182, "loss": 0.0417, "step": 102000 }, { "epoch": 0.66, "eval_cer": 0.9199168455541746, "eval_loss": 0.030525721609592438, "eval_runtime": 119.742, "eval_samples_per_second": 16.703, "eval_steps_per_second": 4.176, "step": 102000 }, { "epoch": 0.66, "learning_rate": 0.0002012405042049349, "loss": 0.05, "step": 102010 }, { "epoch": 0.66, "learning_rate": 0.00020123082285057795, "loss": 0.0474, "step": 102020 }, { "epoch": 0.66, "learning_rate": 0.000201221141496221, "loss": 0.0494, "step": 102030 }, { "epoch": 0.66, "learning_rate": 0.0002012114601418641, "loss": 0.0406, "step": 102040 }, { "epoch": 0.66, "learning_rate": 0.00020120177878750717, "loss": 0.0457, "step": 102050 }, { "epoch": 0.66, "learning_rate": 0.00020119209743315025, "loss": 0.0478, "step": 102060 }, { "epoch": 0.66, "learning_rate": 0.0002011824160787933, "loss": 0.0457, "step": 102070 }, { "epoch": 0.66, "learning_rate": 0.00020117273472443638, "loss": 0.0444, "step": 102080 }, { "epoch": 0.66, "learning_rate": 0.00020116305337007943, "loss": 0.0518, "step": 102090 }, { "epoch": 0.66, "learning_rate": 0.00020115337201572248, "loss": 0.0436, "step": 102100 }, { "epoch": 0.66, "learning_rate": 0.00020114369066136556, "loss": 0.0449, "step": 102110 }, { "epoch": 0.66, "learning_rate": 0.00020113400930700864, "loss": 0.0486, "step": 102120 }, { "epoch": 0.66, "learning_rate": 0.0002011243279526517, "loss": 0.0433, "step": 102130 }, { "epoch": 0.66, "learning_rate": 0.00020111464659829478, "loss": 0.0478, "step": 102140 }, { "epoch": 0.66, "learning_rate": 0.00020110496524393786, "loss": 0.0522, "step": 102150 }, { "epoch": 0.66, "learning_rate": 0.00020109528388958088, "loss": 0.0468, "step": 102160 }, { "epoch": 0.66, "learning_rate": 0.00020108560253522396, "loss": 0.0452, "step": 102170 }, { "epoch": 0.66, "learning_rate": 0.00020107592118086704, "loss": 0.0551, "step": 102180 }, { "epoch": 0.66, "learning_rate": 0.00020106623982651012, "loss": 0.0455, "step": 102190 }, { "epoch": 0.66, "learning_rate": 0.00020105655847215317, "loss": 0.0429, "step": 102200 }, { "epoch": 0.66, "learning_rate": 0.00020104687711779625, "loss": 0.0448, "step": 102210 }, { "epoch": 0.66, "learning_rate": 0.00020103719576343933, "loss": 0.0562, "step": 102220 }, { "epoch": 0.66, "learning_rate": 0.00020102751440908236, "loss": 0.0449, "step": 102230 }, { "epoch": 0.66, "learning_rate": 0.00020101783305472544, "loss": 0.0485, "step": 102240 }, { "epoch": 0.66, "learning_rate": 0.00020100815170036852, "loss": 0.0474, "step": 102250 }, { "epoch": 0.66, "learning_rate": 0.0002009984703460116, "loss": 0.0434, "step": 102260 }, { "epoch": 0.66, "learning_rate": 0.00020098878899165465, "loss": 0.0497, "step": 102270 }, { "epoch": 0.66, "learning_rate": 0.00020097910763729773, "loss": 0.0483, "step": 102280 }, { "epoch": 0.66, "learning_rate": 0.0002009694262829408, "loss": 0.0473, "step": 102290 }, { "epoch": 0.66, "learning_rate": 0.00020095974492858384, "loss": 0.0439, "step": 102300 }, { "epoch": 0.66, "learning_rate": 0.00020095006357422692, "loss": 0.0493, "step": 102310 }, { "epoch": 0.66, "learning_rate": 0.00020094038221987, "loss": 0.0524, "step": 102320 }, { "epoch": 0.66, "learning_rate": 0.00020093070086551305, "loss": 0.0437, "step": 102330 }, { "epoch": 0.66, "learning_rate": 0.00020092101951115613, "loss": 0.0463, "step": 102340 }, { "epoch": 0.66, "learning_rate": 0.0002009113381567992, "loss": 0.0506, "step": 102350 }, { "epoch": 0.66, "learning_rate": 0.0002009016568024423, "loss": 0.0425, "step": 102360 }, { "epoch": 0.66, "learning_rate": 0.0002008919754480853, "loss": 0.0461, "step": 102370 }, { "epoch": 0.66, "learning_rate": 0.0002008822940937284, "loss": 0.0437, "step": 102380 }, { "epoch": 0.66, "learning_rate": 0.00020087261273937147, "loss": 0.0471, "step": 102390 }, { "epoch": 0.66, "learning_rate": 0.00020086293138501453, "loss": 0.0465, "step": 102400 }, { "epoch": 0.66, "learning_rate": 0.0002008532500306576, "loss": 0.0482, "step": 102410 }, { "epoch": 0.66, "learning_rate": 0.00020084356867630069, "loss": 0.039, "step": 102420 }, { "epoch": 0.66, "learning_rate": 0.00020083388732194377, "loss": 0.0457, "step": 102430 }, { "epoch": 0.66, "learning_rate": 0.0002008242059675868, "loss": 0.0401, "step": 102440 }, { "epoch": 0.66, "learning_rate": 0.00020081452461322987, "loss": 0.052, "step": 102450 }, { "epoch": 0.66, "learning_rate": 0.00020080484325887295, "loss": 0.047, "step": 102460 }, { "epoch": 0.66, "learning_rate": 0.000200795161904516, "loss": 0.0437, "step": 102470 }, { "epoch": 0.66, "learning_rate": 0.00020078548055015908, "loss": 0.044, "step": 102480 }, { "epoch": 0.66, "learning_rate": 0.00020077579919580216, "loss": 0.0462, "step": 102490 }, { "epoch": 0.66, "learning_rate": 0.00020076611784144522, "loss": 0.0457, "step": 102500 }, { "epoch": 0.66, "learning_rate": 0.00020075643648708827, "loss": 0.0513, "step": 102510 }, { "epoch": 0.66, "learning_rate": 0.00020074675513273135, "loss": 0.0517, "step": 102520 }, { "epoch": 0.66, "learning_rate": 0.0002007370737783744, "loss": 0.0463, "step": 102530 }, { "epoch": 0.66, "learning_rate": 0.00020072739242401748, "loss": 0.0493, "step": 102540 }, { "epoch": 0.66, "learning_rate": 0.00020071771106966056, "loss": 0.0418, "step": 102550 }, { "epoch": 0.66, "learning_rate": 0.00020070802971530364, "loss": 0.0437, "step": 102560 }, { "epoch": 0.66, "learning_rate": 0.0002006983483609467, "loss": 0.0427, "step": 102570 }, { "epoch": 0.66, "learning_rate": 0.00020068866700658975, "loss": 0.0472, "step": 102580 }, { "epoch": 0.66, "learning_rate": 0.00020067898565223282, "loss": 0.0449, "step": 102590 }, { "epoch": 0.66, "learning_rate": 0.00020066930429787588, "loss": 0.0486, "step": 102600 }, { "epoch": 0.66, "learning_rate": 0.00020065962294351896, "loss": 0.0511, "step": 102610 }, { "epoch": 0.66, "learning_rate": 0.00020064994158916204, "loss": 0.0461, "step": 102620 }, { "epoch": 0.66, "learning_rate": 0.00020064026023480512, "loss": 0.0518, "step": 102630 }, { "epoch": 0.66, "learning_rate": 0.00020063057888044817, "loss": 0.0511, "step": 102640 }, { "epoch": 0.66, "learning_rate": 0.00020062089752609122, "loss": 0.0422, "step": 102650 }, { "epoch": 0.66, "learning_rate": 0.0002006112161717343, "loss": 0.0449, "step": 102660 }, { "epoch": 0.66, "learning_rate": 0.00020060153481737735, "loss": 0.0436, "step": 102670 }, { "epoch": 0.66, "learning_rate": 0.00020059185346302043, "loss": 0.049, "step": 102680 }, { "epoch": 0.66, "learning_rate": 0.00020058217210866351, "loss": 0.0406, "step": 102690 }, { "epoch": 0.66, "learning_rate": 0.0002005724907543066, "loss": 0.0473, "step": 102700 }, { "epoch": 0.66, "learning_rate": 0.00020056280939994965, "loss": 0.0431, "step": 102710 }, { "epoch": 0.66, "learning_rate": 0.0002005531280455927, "loss": 0.0457, "step": 102720 }, { "epoch": 0.66, "learning_rate": 0.00020054344669123575, "loss": 0.0441, "step": 102730 }, { "epoch": 0.66, "learning_rate": 0.00020053376533687883, "loss": 0.0397, "step": 102740 }, { "epoch": 0.66, "learning_rate": 0.0002005240839825219, "loss": 0.0469, "step": 102750 }, { "epoch": 0.66, "learning_rate": 0.000200514402628165, "loss": 0.0437, "step": 102760 }, { "epoch": 0.66, "learning_rate": 0.00020050472127380804, "loss": 0.0456, "step": 102770 }, { "epoch": 0.66, "learning_rate": 0.00020049503991945112, "loss": 0.0407, "step": 102780 }, { "epoch": 0.66, "learning_rate": 0.00020048535856509418, "loss": 0.0487, "step": 102790 }, { "epoch": 0.66, "learning_rate": 0.00020047567721073723, "loss": 0.0377, "step": 102800 }, { "epoch": 0.66, "learning_rate": 0.0002004659958563803, "loss": 0.0434, "step": 102810 }, { "epoch": 0.66, "learning_rate": 0.0002004563145020234, "loss": 0.046, "step": 102820 }, { "epoch": 0.66, "learning_rate": 0.00020044663314766647, "loss": 0.0498, "step": 102830 }, { "epoch": 0.66, "learning_rate": 0.00020043695179330952, "loss": 0.0477, "step": 102840 }, { "epoch": 0.66, "learning_rate": 0.0002004272704389526, "loss": 0.0487, "step": 102850 }, { "epoch": 0.66, "learning_rate": 0.00020041758908459565, "loss": 0.0491, "step": 102860 }, { "epoch": 0.66, "learning_rate": 0.0002004079077302387, "loss": 0.0535, "step": 102870 }, { "epoch": 0.66, "learning_rate": 0.0002003982263758818, "loss": 0.045, "step": 102880 }, { "epoch": 0.66, "learning_rate": 0.00020038854502152487, "loss": 0.0431, "step": 102890 }, { "epoch": 0.66, "learning_rate": 0.00020037886366716795, "loss": 0.0458, "step": 102900 }, { "epoch": 0.66, "learning_rate": 0.000200369182312811, "loss": 0.045, "step": 102910 }, { "epoch": 0.66, "learning_rate": 0.00020035950095845408, "loss": 0.0491, "step": 102920 }, { "epoch": 0.66, "learning_rate": 0.0002003498196040971, "loss": 0.0508, "step": 102930 }, { "epoch": 0.66, "learning_rate": 0.00020034013824974018, "loss": 0.0462, "step": 102940 }, { "epoch": 0.66, "learning_rate": 0.00020033045689538326, "loss": 0.0458, "step": 102950 }, { "epoch": 0.66, "learning_rate": 0.00020032077554102634, "loss": 0.0471, "step": 102960 }, { "epoch": 0.66, "learning_rate": 0.0002003110941866694, "loss": 0.0428, "step": 102970 }, { "epoch": 0.66, "learning_rate": 0.00020030141283231248, "loss": 0.0529, "step": 102980 }, { "epoch": 0.66, "learning_rate": 0.00020029173147795556, "loss": 0.053, "step": 102990 }, { "epoch": 0.66, "learning_rate": 0.00020028205012359858, "loss": 0.0456, "step": 103000 }, { "epoch": 0.66, "eval_cer": 0.919939441870975, "eval_loss": 0.030785538256168365, "eval_runtime": 119.6928, "eval_samples_per_second": 16.709, "eval_steps_per_second": 4.177, "step": 103000 }, { "epoch": 0.66, "learning_rate": 0.00020027236876924166, "loss": 0.0453, "step": 103010 }, { "epoch": 0.66, "learning_rate": 0.00020026268741488474, "loss": 0.0431, "step": 103020 }, { "epoch": 0.66, "learning_rate": 0.00020025300606052782, "loss": 0.0539, "step": 103030 }, { "epoch": 0.67, "learning_rate": 0.00020024332470617087, "loss": 0.0385, "step": 103040 }, { "epoch": 0.67, "learning_rate": 0.00020023364335181395, "loss": 0.0449, "step": 103050 }, { "epoch": 0.67, "learning_rate": 0.00020022396199745703, "loss": 0.053, "step": 103060 }, { "epoch": 0.67, "learning_rate": 0.00020021428064310006, "loss": 0.0456, "step": 103070 }, { "epoch": 0.67, "learning_rate": 0.00020020459928874314, "loss": 0.0492, "step": 103080 }, { "epoch": 0.67, "learning_rate": 0.00020019491793438622, "loss": 0.043, "step": 103090 }, { "epoch": 0.67, "learning_rate": 0.0002001852365800293, "loss": 0.0574, "step": 103100 }, { "epoch": 0.67, "learning_rate": 0.00020017555522567235, "loss": 0.0475, "step": 103110 }, { "epoch": 0.67, "learning_rate": 0.00020016587387131543, "loss": 0.0429, "step": 103120 }, { "epoch": 0.67, "learning_rate": 0.0002001561925169585, "loss": 0.0534, "step": 103130 }, { "epoch": 0.67, "learning_rate": 0.00020014651116260154, "loss": 0.046, "step": 103140 }, { "epoch": 0.67, "learning_rate": 0.00020013682980824462, "loss": 0.0478, "step": 103150 }, { "epoch": 0.67, "learning_rate": 0.0002001271484538877, "loss": 0.0435, "step": 103160 }, { "epoch": 0.67, "learning_rate": 0.00020011746709953075, "loss": 0.0449, "step": 103170 }, { "epoch": 0.67, "learning_rate": 0.00020010778574517383, "loss": 0.0477, "step": 103180 }, { "epoch": 0.67, "learning_rate": 0.0002000981043908169, "loss": 0.0385, "step": 103190 }, { "epoch": 0.67, "learning_rate": 0.00020008842303646, "loss": 0.0444, "step": 103200 }, { "epoch": 0.67, "learning_rate": 0.000200078741682103, "loss": 0.045, "step": 103210 }, { "epoch": 0.67, "learning_rate": 0.0002000690603277461, "loss": 0.0497, "step": 103220 }, { "epoch": 0.67, "learning_rate": 0.00020005937897338917, "loss": 0.0449, "step": 103230 }, { "epoch": 0.67, "learning_rate": 0.00020004969761903223, "loss": 0.0404, "step": 103240 }, { "epoch": 0.67, "learning_rate": 0.0002000400162646753, "loss": 0.0503, "step": 103250 }, { "epoch": 0.67, "learning_rate": 0.00020003033491031838, "loss": 0.0449, "step": 103260 }, { "epoch": 0.67, "learning_rate": 0.00020002065355596146, "loss": 0.0496, "step": 103270 }, { "epoch": 0.67, "learning_rate": 0.0002000109722016045, "loss": 0.0493, "step": 103280 }, { "epoch": 0.67, "learning_rate": 0.00020000129084724757, "loss": 0.0462, "step": 103290 }, { "epoch": 0.67, "learning_rate": 0.00019999160949289065, "loss": 0.0509, "step": 103300 }, { "epoch": 0.67, "learning_rate": 0.0001999819281385337, "loss": 0.0542, "step": 103310 }, { "epoch": 0.67, "learning_rate": 0.00019997224678417678, "loss": 0.0417, "step": 103320 }, { "epoch": 0.67, "learning_rate": 0.00019996256542981986, "loss": 0.0477, "step": 103330 }, { "epoch": 0.67, "learning_rate": 0.00019995288407546291, "loss": 0.0455, "step": 103340 }, { "epoch": 0.67, "learning_rate": 0.00019994320272110597, "loss": 0.0551, "step": 103350 }, { "epoch": 0.67, "learning_rate": 0.00019993352136674905, "loss": 0.0482, "step": 103360 }, { "epoch": 0.67, "learning_rate": 0.0001999238400123921, "loss": 0.05, "step": 103370 }, { "epoch": 0.67, "learning_rate": 0.00019991415865803518, "loss": 0.0518, "step": 103380 }, { "epoch": 0.67, "learning_rate": 0.00019990447730367826, "loss": 0.0447, "step": 103390 }, { "epoch": 0.67, "learning_rate": 0.00019989479594932134, "loss": 0.0438, "step": 103400 }, { "epoch": 0.67, "learning_rate": 0.0001998851145949644, "loss": 0.0516, "step": 103410 }, { "epoch": 0.67, "learning_rate": 0.00019987543324060744, "loss": 0.0451, "step": 103420 }, { "epoch": 0.67, "learning_rate": 0.00019986575188625052, "loss": 0.0448, "step": 103430 }, { "epoch": 0.67, "learning_rate": 0.00019985607053189358, "loss": 0.0439, "step": 103440 }, { "epoch": 0.67, "learning_rate": 0.00019984638917753666, "loss": 0.043, "step": 103450 }, { "epoch": 0.67, "learning_rate": 0.00019983670782317974, "loss": 0.0479, "step": 103460 }, { "epoch": 0.67, "learning_rate": 0.00019982702646882282, "loss": 0.0421, "step": 103470 }, { "epoch": 0.67, "learning_rate": 0.00019981734511446587, "loss": 0.0508, "step": 103480 }, { "epoch": 0.67, "learning_rate": 0.00019980766376010892, "loss": 0.0456, "step": 103490 }, { "epoch": 0.67, "learning_rate": 0.000199797982405752, "loss": 0.0461, "step": 103500 }, { "epoch": 0.67, "learning_rate": 0.00019978830105139505, "loss": 0.0471, "step": 103510 }, { "epoch": 0.67, "learning_rate": 0.00019977861969703813, "loss": 0.0466, "step": 103520 }, { "epoch": 0.67, "learning_rate": 0.00019976893834268121, "loss": 0.0526, "step": 103530 }, { "epoch": 0.67, "learning_rate": 0.00019975925698832427, "loss": 0.0476, "step": 103540 }, { "epoch": 0.67, "learning_rate": 0.00019974957563396735, "loss": 0.0433, "step": 103550 }, { "epoch": 0.67, "learning_rate": 0.0001997398942796104, "loss": 0.0464, "step": 103560 }, { "epoch": 0.67, "learning_rate": 0.00019973021292525345, "loss": 0.043, "step": 103570 }, { "epoch": 0.67, "learning_rate": 0.00019972053157089653, "loss": 0.0409, "step": 103580 }, { "epoch": 0.67, "learning_rate": 0.0001997108502165396, "loss": 0.0412, "step": 103590 }, { "epoch": 0.67, "learning_rate": 0.0001997011688621827, "loss": 0.0462, "step": 103600 }, { "epoch": 0.67, "learning_rate": 0.00019969148750782574, "loss": 0.0477, "step": 103610 }, { "epoch": 0.67, "learning_rate": 0.00019968180615346882, "loss": 0.049, "step": 103620 }, { "epoch": 0.67, "learning_rate": 0.00019967212479911188, "loss": 0.0448, "step": 103630 }, { "epoch": 0.67, "learning_rate": 0.00019966244344475493, "loss": 0.0502, "step": 103640 }, { "epoch": 0.67, "learning_rate": 0.000199652762090398, "loss": 0.0501, "step": 103650 }, { "epoch": 0.67, "learning_rate": 0.0001996430807360411, "loss": 0.0457, "step": 103660 }, { "epoch": 0.67, "learning_rate": 0.00019963339938168417, "loss": 0.0539, "step": 103670 }, { "epoch": 0.67, "learning_rate": 0.00019962371802732722, "loss": 0.0468, "step": 103680 }, { "epoch": 0.67, "learning_rate": 0.0001996140366729703, "loss": 0.0504, "step": 103690 }, { "epoch": 0.67, "learning_rate": 0.00019960435531861335, "loss": 0.0448, "step": 103700 }, { "epoch": 0.67, "learning_rate": 0.0001995946739642564, "loss": 0.0468, "step": 103710 }, { "epoch": 0.67, "learning_rate": 0.00019958499260989949, "loss": 0.0459, "step": 103720 }, { "epoch": 0.67, "learning_rate": 0.00019957531125554257, "loss": 0.045, "step": 103730 }, { "epoch": 0.67, "learning_rate": 0.00019956562990118562, "loss": 0.0521, "step": 103740 }, { "epoch": 0.67, "learning_rate": 0.0001995559485468287, "loss": 0.046, "step": 103750 }, { "epoch": 0.67, "learning_rate": 0.00019954626719247178, "loss": 0.0451, "step": 103760 }, { "epoch": 0.67, "learning_rate": 0.0001995365858381148, "loss": 0.0448, "step": 103770 }, { "epoch": 0.67, "learning_rate": 0.00019952690448375788, "loss": 0.0449, "step": 103780 }, { "epoch": 0.67, "learning_rate": 0.00019951722312940096, "loss": 0.0422, "step": 103790 }, { "epoch": 0.67, "learning_rate": 0.00019950754177504404, "loss": 0.0552, "step": 103800 }, { "epoch": 0.67, "learning_rate": 0.0001994978604206871, "loss": 0.0502, "step": 103810 }, { "epoch": 0.67, "learning_rate": 0.00019948817906633018, "loss": 0.0495, "step": 103820 }, { "epoch": 0.67, "learning_rate": 0.00019947849771197326, "loss": 0.0425, "step": 103830 }, { "epoch": 0.67, "learning_rate": 0.00019946881635761628, "loss": 0.0587, "step": 103840 }, { "epoch": 0.67, "learning_rate": 0.00019945913500325936, "loss": 0.0421, "step": 103850 }, { "epoch": 0.67, "learning_rate": 0.00019944945364890244, "loss": 0.0538, "step": 103860 }, { "epoch": 0.67, "learning_rate": 0.00019943977229454552, "loss": 0.0457, "step": 103870 }, { "epoch": 0.67, "learning_rate": 0.00019943009094018857, "loss": 0.0452, "step": 103880 }, { "epoch": 0.67, "learning_rate": 0.00019942040958583165, "loss": 0.0477, "step": 103890 }, { "epoch": 0.67, "learning_rate": 0.00019941072823147473, "loss": 0.0479, "step": 103900 }, { "epoch": 0.67, "learning_rate": 0.00019940104687711776, "loss": 0.0428, "step": 103910 }, { "epoch": 0.67, "learning_rate": 0.00019939136552276084, "loss": 0.0481, "step": 103920 }, { "epoch": 0.67, "learning_rate": 0.00019938168416840392, "loss": 0.0473, "step": 103930 }, { "epoch": 0.67, "learning_rate": 0.00019937200281404697, "loss": 0.0503, "step": 103940 }, { "epoch": 0.67, "learning_rate": 0.00019936232145969005, "loss": 0.0473, "step": 103950 }, { "epoch": 0.67, "learning_rate": 0.00019935264010533313, "loss": 0.0426, "step": 103960 }, { "epoch": 0.67, "learning_rate": 0.0001993429587509762, "loss": 0.0507, "step": 103970 }, { "epoch": 0.67, "learning_rate": 0.00019933327739661924, "loss": 0.0548, "step": 103980 }, { "epoch": 0.67, "learning_rate": 0.00019932359604226232, "loss": 0.0506, "step": 103990 }, { "epoch": 0.67, "learning_rate": 0.0001993139146879054, "loss": 0.046, "step": 104000 }, { "epoch": 0.67, "eval_cer": 0.9198345949610214, "eval_loss": 0.03151978179812431, "eval_runtime": 120.1984, "eval_samples_per_second": 16.639, "eval_steps_per_second": 4.16, "step": 104000 }, { "epoch": 0.67, "learning_rate": 0.00019930423333354845, "loss": 0.0484, "step": 104010 }, { "epoch": 0.67, "learning_rate": 0.00019929455197919153, "loss": 0.0488, "step": 104020 }, { "epoch": 0.67, "learning_rate": 0.0001992848706248346, "loss": 0.0434, "step": 104030 }, { "epoch": 0.67, "learning_rate": 0.0001992751892704777, "loss": 0.0429, "step": 104040 }, { "epoch": 0.67, "learning_rate": 0.0001992655079161207, "loss": 0.0523, "step": 104050 }, { "epoch": 0.67, "learning_rate": 0.0001992558265617638, "loss": 0.0472, "step": 104060 }, { "epoch": 0.67, "learning_rate": 0.00019924614520740687, "loss": 0.0426, "step": 104070 }, { "epoch": 0.67, "learning_rate": 0.00019923646385304992, "loss": 0.0503, "step": 104080 }, { "epoch": 0.67, "learning_rate": 0.000199226782498693, "loss": 0.0488, "step": 104090 }, { "epoch": 0.67, "learning_rate": 0.00019921710114433608, "loss": 0.0456, "step": 104100 }, { "epoch": 0.67, "learning_rate": 0.00019920741978997914, "loss": 0.0545, "step": 104110 }, { "epoch": 0.67, "learning_rate": 0.0001991977384356222, "loss": 0.0459, "step": 104120 }, { "epoch": 0.67, "learning_rate": 0.00019918805708126527, "loss": 0.0473, "step": 104130 }, { "epoch": 0.67, "learning_rate": 0.00019917837572690832, "loss": 0.0519, "step": 104140 }, { "epoch": 0.67, "learning_rate": 0.0001991686943725514, "loss": 0.0419, "step": 104150 }, { "epoch": 0.67, "learning_rate": 0.00019915901301819448, "loss": 0.0441, "step": 104160 }, { "epoch": 0.67, "learning_rate": 0.00019914933166383756, "loss": 0.0503, "step": 104170 }, { "epoch": 0.67, "learning_rate": 0.00019913965030948061, "loss": 0.0429, "step": 104180 }, { "epoch": 0.67, "learning_rate": 0.00019912996895512367, "loss": 0.0415, "step": 104190 }, { "epoch": 0.67, "learning_rate": 0.00019912028760076675, "loss": 0.0483, "step": 104200 }, { "epoch": 0.67, "learning_rate": 0.0001991106062464098, "loss": 0.0472, "step": 104210 }, { "epoch": 0.67, "learning_rate": 0.00019910092489205288, "loss": 0.0502, "step": 104220 }, { "epoch": 0.67, "learning_rate": 0.00019909124353769596, "loss": 0.0432, "step": 104230 }, { "epoch": 0.67, "learning_rate": 0.00019908156218333904, "loss": 0.0469, "step": 104240 }, { "epoch": 0.67, "learning_rate": 0.0001990718808289821, "loss": 0.0381, "step": 104250 }, { "epoch": 0.67, "learning_rate": 0.00019906219947462514, "loss": 0.0454, "step": 104260 }, { "epoch": 0.67, "learning_rate": 0.00019905251812026822, "loss": 0.0431, "step": 104270 }, { "epoch": 0.67, "learning_rate": 0.00019904283676591128, "loss": 0.0448, "step": 104280 }, { "epoch": 0.67, "learning_rate": 0.00019903315541155436, "loss": 0.0461, "step": 104290 }, { "epoch": 0.67, "learning_rate": 0.00019902347405719744, "loss": 0.0426, "step": 104300 }, { "epoch": 0.67, "learning_rate": 0.0001990137927028405, "loss": 0.0491, "step": 104310 }, { "epoch": 0.67, "learning_rate": 0.00019900411134848357, "loss": 0.0424, "step": 104320 }, { "epoch": 0.67, "learning_rate": 0.00019899442999412662, "loss": 0.0415, "step": 104330 }, { "epoch": 0.67, "learning_rate": 0.00019898474863976967, "loss": 0.0472, "step": 104340 }, { "epoch": 0.67, "learning_rate": 0.00019897506728541275, "loss": 0.0414, "step": 104350 }, { "epoch": 0.67, "learning_rate": 0.00019896538593105583, "loss": 0.0419, "step": 104360 }, { "epoch": 0.67, "learning_rate": 0.00019895570457669891, "loss": 0.0448, "step": 104370 }, { "epoch": 0.67, "learning_rate": 0.00019894602322234197, "loss": 0.0532, "step": 104380 }, { "epoch": 0.67, "learning_rate": 0.00019893634186798505, "loss": 0.0494, "step": 104390 }, { "epoch": 0.67, "learning_rate": 0.0001989266605136281, "loss": 0.043, "step": 104400 }, { "epoch": 0.67, "learning_rate": 0.00019891697915927115, "loss": 0.0467, "step": 104410 }, { "epoch": 0.67, "learning_rate": 0.00019890729780491423, "loss": 0.0483, "step": 104420 }, { "epoch": 0.67, "learning_rate": 0.0001988976164505573, "loss": 0.046, "step": 104430 }, { "epoch": 0.67, "learning_rate": 0.0001988879350962004, "loss": 0.059, "step": 104440 }, { "epoch": 0.67, "learning_rate": 0.00019887825374184344, "loss": 0.0463, "step": 104450 }, { "epoch": 0.67, "learning_rate": 0.00019886857238748652, "loss": 0.052, "step": 104460 }, { "epoch": 0.67, "learning_rate": 0.00019885889103312958, "loss": 0.0453, "step": 104470 }, { "epoch": 0.67, "learning_rate": 0.00019884920967877263, "loss": 0.0435, "step": 104480 }, { "epoch": 0.67, "learning_rate": 0.0001988395283244157, "loss": 0.0487, "step": 104490 }, { "epoch": 0.67, "learning_rate": 0.0001988298469700588, "loss": 0.0392, "step": 104500 }, { "epoch": 0.67, "learning_rate": 0.00019882016561570184, "loss": 0.0453, "step": 104510 }, { "epoch": 0.67, "learning_rate": 0.00019881048426134492, "loss": 0.0477, "step": 104520 }, { "epoch": 0.67, "learning_rate": 0.000198800802906988, "loss": 0.0454, "step": 104530 }, { "epoch": 0.67, "learning_rate": 0.00019879112155263103, "loss": 0.0488, "step": 104540 }, { "epoch": 0.67, "learning_rate": 0.0001987814401982741, "loss": 0.0453, "step": 104550 }, { "epoch": 0.67, "learning_rate": 0.00019877175884391719, "loss": 0.043, "step": 104560 }, { "epoch": 0.67, "learning_rate": 0.00019876207748956027, "loss": 0.0474, "step": 104570 }, { "epoch": 0.67, "learning_rate": 0.00019875239613520332, "loss": 0.0489, "step": 104580 }, { "epoch": 0.68, "learning_rate": 0.0001987427147808464, "loss": 0.045, "step": 104590 }, { "epoch": 0.68, "learning_rate": 0.00019873303342648948, "loss": 0.049, "step": 104600 }, { "epoch": 0.68, "learning_rate": 0.0001987233520721325, "loss": 0.0406, "step": 104610 }, { "epoch": 0.68, "learning_rate": 0.00019871367071777558, "loss": 0.0459, "step": 104620 }, { "epoch": 0.68, "learning_rate": 0.00019870398936341866, "loss": 0.0438, "step": 104630 }, { "epoch": 0.68, "learning_rate": 0.00019869430800906174, "loss": 0.05, "step": 104640 }, { "epoch": 0.68, "learning_rate": 0.0001986846266547048, "loss": 0.0446, "step": 104650 }, { "epoch": 0.68, "learning_rate": 0.00019867494530034788, "loss": 0.0481, "step": 104660 }, { "epoch": 0.68, "learning_rate": 0.00019866526394599095, "loss": 0.0437, "step": 104670 }, { "epoch": 0.68, "learning_rate": 0.00019865558259163398, "loss": 0.0435, "step": 104680 }, { "epoch": 0.68, "learning_rate": 0.00019864590123727706, "loss": 0.0496, "step": 104690 }, { "epoch": 0.68, "learning_rate": 0.00019863621988292014, "loss": 0.0501, "step": 104700 }, { "epoch": 0.68, "learning_rate": 0.0001986265385285632, "loss": 0.0471, "step": 104710 }, { "epoch": 0.68, "learning_rate": 0.00019861685717420627, "loss": 0.0542, "step": 104720 }, { "epoch": 0.68, "learning_rate": 0.00019860717581984935, "loss": 0.0464, "step": 104730 }, { "epoch": 0.68, "learning_rate": 0.00019859749446549243, "loss": 0.0493, "step": 104740 }, { "epoch": 0.68, "learning_rate": 0.00019858781311113546, "loss": 0.0648, "step": 104750 }, { "epoch": 0.68, "learning_rate": 0.00019857813175677854, "loss": 0.0541, "step": 104760 }, { "epoch": 0.68, "learning_rate": 0.00019856845040242162, "loss": 0.0464, "step": 104770 }, { "epoch": 0.68, "learning_rate": 0.00019855876904806467, "loss": 0.0438, "step": 104780 }, { "epoch": 0.68, "learning_rate": 0.00019854908769370775, "loss": 0.0574, "step": 104790 }, { "epoch": 0.68, "learning_rate": 0.00019853940633935083, "loss": 0.0437, "step": 104800 }, { "epoch": 0.68, "learning_rate": 0.0001985297249849939, "loss": 0.047, "step": 104810 }, { "epoch": 0.68, "learning_rate": 0.00019852004363063694, "loss": 0.0438, "step": 104820 }, { "epoch": 0.68, "learning_rate": 0.00019851036227628001, "loss": 0.0442, "step": 104830 }, { "epoch": 0.68, "learning_rate": 0.0001985006809219231, "loss": 0.0443, "step": 104840 }, { "epoch": 0.68, "learning_rate": 0.00019849099956756615, "loss": 0.046, "step": 104850 }, { "epoch": 0.68, "learning_rate": 0.00019848131821320923, "loss": 0.0413, "step": 104860 }, { "epoch": 0.68, "learning_rate": 0.0001984716368588523, "loss": 0.0451, "step": 104870 }, { "epoch": 0.68, "learning_rate": 0.0001984619555044954, "loss": 0.0453, "step": 104880 }, { "epoch": 0.68, "learning_rate": 0.0001984522741501384, "loss": 0.0459, "step": 104890 }, { "epoch": 0.68, "learning_rate": 0.0001984425927957815, "loss": 0.049, "step": 104900 }, { "epoch": 0.68, "learning_rate": 0.00019843291144142454, "loss": 0.0482, "step": 104910 }, { "epoch": 0.68, "learning_rate": 0.00019842323008706762, "loss": 0.0448, "step": 104920 }, { "epoch": 0.68, "learning_rate": 0.0001984135487327107, "loss": 0.0473, "step": 104930 }, { "epoch": 0.68, "learning_rate": 0.00019840386737835378, "loss": 0.0512, "step": 104940 }, { "epoch": 0.68, "learning_rate": 0.00019839418602399684, "loss": 0.0436, "step": 104950 }, { "epoch": 0.68, "learning_rate": 0.0001983845046696399, "loss": 0.0489, "step": 104960 }, { "epoch": 0.68, "learning_rate": 0.00019837482331528297, "loss": 0.0526, "step": 104970 }, { "epoch": 0.68, "learning_rate": 0.00019836514196092602, "loss": 0.0395, "step": 104980 }, { "epoch": 0.68, "learning_rate": 0.0001983554606065691, "loss": 0.0449, "step": 104990 }, { "epoch": 0.68, "learning_rate": 0.00019834577925221218, "loss": 0.0462, "step": 105000 }, { "epoch": 0.68, "eval_cer": 0.9199078070274546, "eval_loss": 0.03056810237467289, "eval_runtime": 119.7885, "eval_samples_per_second": 16.696, "eval_steps_per_second": 4.174, "step": 105000 }, { "epoch": 0.68, "learning_rate": 0.00019833609789785526, "loss": 0.0445, "step": 105010 }, { "epoch": 0.68, "learning_rate": 0.00019832641654349831, "loss": 0.044, "step": 105020 }, { "epoch": 0.68, "learning_rate": 0.00019831673518914137, "loss": 0.0484, "step": 105030 }, { "epoch": 0.68, "learning_rate": 0.00019830705383478445, "loss": 0.042, "step": 105040 }, { "epoch": 0.68, "learning_rate": 0.0001982973724804275, "loss": 0.0496, "step": 105050 }, { "epoch": 0.68, "learning_rate": 0.00019828769112607058, "loss": 0.0528, "step": 105060 }, { "epoch": 0.68, "learning_rate": 0.00019827800977171366, "loss": 0.052, "step": 105070 }, { "epoch": 0.68, "learning_rate": 0.00019826832841735674, "loss": 0.0502, "step": 105080 }, { "epoch": 0.68, "learning_rate": 0.0001982586470629998, "loss": 0.0518, "step": 105090 }, { "epoch": 0.68, "learning_rate": 0.00019824896570864284, "loss": 0.0435, "step": 105100 }, { "epoch": 0.68, "learning_rate": 0.0001982392843542859, "loss": 0.0513, "step": 105110 }, { "epoch": 0.68, "learning_rate": 0.00019822960299992898, "loss": 0.0521, "step": 105120 }, { "epoch": 0.68, "learning_rate": 0.00019821992164557206, "loss": 0.0479, "step": 105130 }, { "epoch": 0.68, "learning_rate": 0.00019821024029121514, "loss": 0.0433, "step": 105140 }, { "epoch": 0.68, "learning_rate": 0.0001982005589368582, "loss": 0.0464, "step": 105150 }, { "epoch": 0.68, "learning_rate": 0.00019819087758250127, "loss": 0.0426, "step": 105160 }, { "epoch": 0.68, "learning_rate": 0.00019818119622814432, "loss": 0.0509, "step": 105170 }, { "epoch": 0.68, "learning_rate": 0.00019817151487378737, "loss": 0.0454, "step": 105180 }, { "epoch": 0.68, "learning_rate": 0.00019816183351943045, "loss": 0.0409, "step": 105190 }, { "epoch": 0.68, "learning_rate": 0.00019815215216507353, "loss": 0.0365, "step": 105200 }, { "epoch": 0.68, "learning_rate": 0.0001981424708107166, "loss": 0.042, "step": 105210 }, { "epoch": 0.68, "learning_rate": 0.00019813278945635967, "loss": 0.0501, "step": 105220 }, { "epoch": 0.68, "learning_rate": 0.00019812310810200275, "loss": 0.0458, "step": 105230 }, { "epoch": 0.68, "learning_rate": 0.0001981134267476458, "loss": 0.049, "step": 105240 }, { "epoch": 0.68, "learning_rate": 0.00019810374539328885, "loss": 0.0502, "step": 105250 }, { "epoch": 0.68, "learning_rate": 0.00019809406403893193, "loss": 0.0521, "step": 105260 }, { "epoch": 0.68, "learning_rate": 0.000198084382684575, "loss": 0.0469, "step": 105270 }, { "epoch": 0.68, "learning_rate": 0.0001980747013302181, "loss": 0.0429, "step": 105280 }, { "epoch": 0.68, "learning_rate": 0.00019806501997586114, "loss": 0.0412, "step": 105290 }, { "epoch": 0.68, "learning_rate": 0.00019805533862150422, "loss": 0.0457, "step": 105300 }, { "epoch": 0.68, "learning_rate": 0.00019804565726714725, "loss": 0.0476, "step": 105310 }, { "epoch": 0.68, "learning_rate": 0.00019803597591279033, "loss": 0.0517, "step": 105320 }, { "epoch": 0.68, "learning_rate": 0.0001980262945584334, "loss": 0.0448, "step": 105330 }, { "epoch": 0.68, "learning_rate": 0.0001980166132040765, "loss": 0.0541, "step": 105340 }, { "epoch": 0.68, "learning_rate": 0.00019800693184971954, "loss": 0.0424, "step": 105350 }, { "epoch": 0.68, "learning_rate": 0.00019799725049536262, "loss": 0.0456, "step": 105360 }, { "epoch": 0.68, "learning_rate": 0.0001979875691410057, "loss": 0.0446, "step": 105370 }, { "epoch": 0.68, "learning_rate": 0.00019797788778664873, "loss": 0.0518, "step": 105380 }, { "epoch": 0.68, "learning_rate": 0.0001979682064322918, "loss": 0.0506, "step": 105390 }, { "epoch": 0.68, "learning_rate": 0.00019795852507793489, "loss": 0.0506, "step": 105400 }, { "epoch": 0.68, "learning_rate": 0.00019794884372357797, "loss": 0.0509, "step": 105410 }, { "epoch": 0.68, "learning_rate": 0.00019793916236922102, "loss": 0.0425, "step": 105420 }, { "epoch": 0.68, "learning_rate": 0.0001979294810148641, "loss": 0.0419, "step": 105430 }, { "epoch": 0.68, "learning_rate": 0.00019791979966050718, "loss": 0.0399, "step": 105440 }, { "epoch": 0.68, "learning_rate": 0.0001979101183061502, "loss": 0.0511, "step": 105450 }, { "epoch": 0.68, "learning_rate": 0.00019790043695179328, "loss": 0.0478, "step": 105460 }, { "epoch": 0.68, "learning_rate": 0.00019789075559743636, "loss": 0.0446, "step": 105470 }, { "epoch": 0.68, "learning_rate": 0.00019788107424307944, "loss": 0.0486, "step": 105480 }, { "epoch": 0.68, "learning_rate": 0.0001978713928887225, "loss": 0.0412, "step": 105490 }, { "epoch": 0.68, "learning_rate": 0.00019786171153436557, "loss": 0.0442, "step": 105500 }, { "epoch": 0.68, "learning_rate": 0.00019785203018000865, "loss": 0.0457, "step": 105510 }, { "epoch": 0.68, "learning_rate": 0.00019784234882565168, "loss": 0.0432, "step": 105520 }, { "epoch": 0.68, "learning_rate": 0.00019783266747129476, "loss": 0.0508, "step": 105530 }, { "epoch": 0.68, "learning_rate": 0.00019782298611693784, "loss": 0.0436, "step": 105540 }, { "epoch": 0.68, "learning_rate": 0.0001978133047625809, "loss": 0.0444, "step": 105550 }, { "epoch": 0.68, "learning_rate": 0.00019780362340822397, "loss": 0.0447, "step": 105560 }, { "epoch": 0.68, "learning_rate": 0.00019779394205386705, "loss": 0.0464, "step": 105570 }, { "epoch": 0.68, "learning_rate": 0.00019778426069951013, "loss": 0.044, "step": 105580 }, { "epoch": 0.68, "learning_rate": 0.00019777457934515316, "loss": 0.0476, "step": 105590 }, { "epoch": 0.68, "learning_rate": 0.00019776489799079624, "loss": 0.0448, "step": 105600 }, { "epoch": 0.68, "learning_rate": 0.00019775521663643932, "loss": 0.0463, "step": 105610 }, { "epoch": 0.68, "learning_rate": 0.00019774553528208237, "loss": 0.0431, "step": 105620 }, { "epoch": 0.68, "learning_rate": 0.00019773585392772545, "loss": 0.0436, "step": 105630 }, { "epoch": 0.68, "learning_rate": 0.00019772617257336853, "loss": 0.0422, "step": 105640 }, { "epoch": 0.68, "learning_rate": 0.0001977164912190116, "loss": 0.0436, "step": 105650 }, { "epoch": 0.68, "learning_rate": 0.00019770680986465463, "loss": 0.0449, "step": 105660 }, { "epoch": 0.68, "learning_rate": 0.00019769712851029771, "loss": 0.0476, "step": 105670 }, { "epoch": 0.68, "learning_rate": 0.0001976874471559408, "loss": 0.0415, "step": 105680 }, { "epoch": 0.68, "learning_rate": 0.00019767776580158385, "loss": 0.0437, "step": 105690 }, { "epoch": 0.68, "learning_rate": 0.00019766808444722693, "loss": 0.0412, "step": 105700 }, { "epoch": 0.68, "learning_rate": 0.00019765840309287, "loss": 0.0442, "step": 105710 }, { "epoch": 0.68, "learning_rate": 0.00019764872173851306, "loss": 0.0374, "step": 105720 }, { "epoch": 0.68, "learning_rate": 0.0001976390403841561, "loss": 0.0426, "step": 105730 }, { "epoch": 0.68, "learning_rate": 0.0001976293590297992, "loss": 0.0382, "step": 105740 }, { "epoch": 0.68, "learning_rate": 0.00019761967767544224, "loss": 0.0536, "step": 105750 }, { "epoch": 0.68, "learning_rate": 0.00019760999632108532, "loss": 0.0467, "step": 105760 }, { "epoch": 0.68, "learning_rate": 0.0001976003149667284, "loss": 0.0438, "step": 105770 }, { "epoch": 0.68, "learning_rate": 0.00019759063361237148, "loss": 0.0414, "step": 105780 }, { "epoch": 0.68, "learning_rate": 0.00019758095225801454, "loss": 0.0432, "step": 105790 }, { "epoch": 0.68, "learning_rate": 0.0001975712709036576, "loss": 0.0428, "step": 105800 }, { "epoch": 0.68, "learning_rate": 0.00019756158954930067, "loss": 0.0461, "step": 105810 }, { "epoch": 0.68, "learning_rate": 0.00019755190819494372, "loss": 0.0384, "step": 105820 }, { "epoch": 0.68, "learning_rate": 0.0001975422268405868, "loss": 0.0476, "step": 105830 }, { "epoch": 0.68, "learning_rate": 0.00019753254548622988, "loss": 0.0458, "step": 105840 }, { "epoch": 0.68, "learning_rate": 0.00019752286413187296, "loss": 0.0425, "step": 105850 }, { "epoch": 0.68, "learning_rate": 0.00019751318277751601, "loss": 0.0498, "step": 105860 }, { "epoch": 0.68, "learning_rate": 0.00019750350142315907, "loss": 0.0381, "step": 105870 }, { "epoch": 0.68, "learning_rate": 0.00019749382006880215, "loss": 0.0466, "step": 105880 }, { "epoch": 0.68, "learning_rate": 0.0001974841387144452, "loss": 0.05, "step": 105890 }, { "epoch": 0.68, "learning_rate": 0.00019747445736008828, "loss": 0.0443, "step": 105900 }, { "epoch": 0.68, "learning_rate": 0.00019746477600573136, "loss": 0.0505, "step": 105910 }, { "epoch": 0.68, "learning_rate": 0.0001974550946513744, "loss": 0.0454, "step": 105920 }, { "epoch": 0.68, "learning_rate": 0.0001974454132970175, "loss": 0.045, "step": 105930 }, { "epoch": 0.68, "learning_rate": 0.00019743573194266054, "loss": 0.0447, "step": 105940 }, { "epoch": 0.68, "learning_rate": 0.0001974260505883036, "loss": 0.0446, "step": 105950 }, { "epoch": 0.68, "learning_rate": 0.00019741636923394668, "loss": 0.0502, "step": 105960 }, { "epoch": 0.68, "learning_rate": 0.00019740668787958976, "loss": 0.0462, "step": 105970 }, { "epoch": 0.68, "learning_rate": 0.00019739700652523284, "loss": 0.0506, "step": 105980 }, { "epoch": 0.68, "learning_rate": 0.0001973873251708759, "loss": 0.0446, "step": 105990 }, { "epoch": 0.68, "learning_rate": 0.00019737764381651897, "loss": 0.0478, "step": 106000 }, { "epoch": 0.68, "eval_cer": 0.9198834030053101, "eval_loss": 0.03057784214615822, "eval_runtime": 119.7766, "eval_samples_per_second": 16.698, "eval_steps_per_second": 4.174, "step": 106000 }, { "epoch": 0.68, "learning_rate": 0.00019736796246216202, "loss": 0.0508, "step": 106010 }, { "epoch": 0.68, "learning_rate": 0.00019735828110780507, "loss": 0.0506, "step": 106020 }, { "epoch": 0.68, "learning_rate": 0.00019734859975344815, "loss": 0.0585, "step": 106030 }, { "epoch": 0.68, "learning_rate": 0.00019733891839909123, "loss": 0.0429, "step": 106040 }, { "epoch": 0.68, "learning_rate": 0.0001973292370447343, "loss": 0.0612, "step": 106050 }, { "epoch": 0.68, "learning_rate": 0.00019731955569037737, "loss": 0.0439, "step": 106060 }, { "epoch": 0.68, "learning_rate": 0.00019730987433602045, "loss": 0.0429, "step": 106070 }, { "epoch": 0.68, "learning_rate": 0.0001973001929816635, "loss": 0.049, "step": 106080 }, { "epoch": 0.68, "learning_rate": 0.00019729051162730655, "loss": 0.0503, "step": 106090 }, { "epoch": 0.68, "learning_rate": 0.00019728083027294963, "loss": 0.0428, "step": 106100 }, { "epoch": 0.68, "learning_rate": 0.0001972711489185927, "loss": 0.0523, "step": 106110 }, { "epoch": 0.68, "learning_rate": 0.00019726146756423576, "loss": 0.0468, "step": 106120 }, { "epoch": 0.68, "learning_rate": 0.00019725178620987884, "loss": 0.0592, "step": 106130 }, { "epoch": 0.69, "learning_rate": 0.00019724210485552192, "loss": 0.0529, "step": 106140 }, { "epoch": 0.69, "learning_rate": 0.00019723242350116495, "loss": 0.0456, "step": 106150 }, { "epoch": 0.69, "learning_rate": 0.00019722274214680803, "loss": 0.0392, "step": 106160 }, { "epoch": 0.69, "learning_rate": 0.0001972130607924511, "loss": 0.0455, "step": 106170 }, { "epoch": 0.69, "learning_rate": 0.0001972033794380942, "loss": 0.0412, "step": 106180 }, { "epoch": 0.69, "learning_rate": 0.00019719369808373724, "loss": 0.0545, "step": 106190 }, { "epoch": 0.69, "learning_rate": 0.00019718401672938032, "loss": 0.0455, "step": 106200 }, { "epoch": 0.69, "learning_rate": 0.0001971743353750234, "loss": 0.045, "step": 106210 }, { "epoch": 0.69, "learning_rate": 0.00019716465402066643, "loss": 0.0501, "step": 106220 }, { "epoch": 0.69, "learning_rate": 0.0001971549726663095, "loss": 0.0429, "step": 106230 }, { "epoch": 0.69, "learning_rate": 0.00019714529131195258, "loss": 0.0431, "step": 106240 }, { "epoch": 0.69, "learning_rate": 0.00019713560995759566, "loss": 0.0506, "step": 106250 }, { "epoch": 0.69, "learning_rate": 0.00019712592860323872, "loss": 0.0416, "step": 106260 }, { "epoch": 0.69, "learning_rate": 0.0001971162472488818, "loss": 0.0491, "step": 106270 }, { "epoch": 0.69, "learning_rate": 0.00019710656589452488, "loss": 0.0544, "step": 106280 }, { "epoch": 0.69, "learning_rate": 0.0001970968845401679, "loss": 0.0469, "step": 106290 }, { "epoch": 0.69, "learning_rate": 0.00019708720318581098, "loss": 0.0618, "step": 106300 }, { "epoch": 0.69, "learning_rate": 0.00019707752183145406, "loss": 0.0434, "step": 106310 }, { "epoch": 0.69, "learning_rate": 0.00019706784047709711, "loss": 0.0393, "step": 106320 }, { "epoch": 0.69, "learning_rate": 0.0001970581591227402, "loss": 0.0445, "step": 106330 }, { "epoch": 0.69, "learning_rate": 0.00019704847776838327, "loss": 0.0399, "step": 106340 }, { "epoch": 0.69, "learning_rate": 0.00019703879641402635, "loss": 0.0418, "step": 106350 }, { "epoch": 0.69, "learning_rate": 0.00019702911505966938, "loss": 0.0479, "step": 106360 }, { "epoch": 0.69, "learning_rate": 0.00019701943370531246, "loss": 0.052, "step": 106370 }, { "epoch": 0.69, "learning_rate": 0.00019700975235095554, "loss": 0.0491, "step": 106380 }, { "epoch": 0.69, "learning_rate": 0.0001970000709965986, "loss": 0.0462, "step": 106390 }, { "epoch": 0.69, "learning_rate": 0.00019699038964224167, "loss": 0.0465, "step": 106400 }, { "epoch": 0.69, "learning_rate": 0.00019698070828788475, "loss": 0.0498, "step": 106410 }, { "epoch": 0.69, "learning_rate": 0.00019697102693352783, "loss": 0.0431, "step": 106420 }, { "epoch": 0.69, "learning_rate": 0.00019696134557917086, "loss": 0.0543, "step": 106430 }, { "epoch": 0.69, "learning_rate": 0.00019695166422481394, "loss": 0.0443, "step": 106440 }, { "epoch": 0.69, "learning_rate": 0.00019694198287045702, "loss": 0.0451, "step": 106450 }, { "epoch": 0.69, "learning_rate": 0.00019693230151610007, "loss": 0.0453, "step": 106460 }, { "epoch": 0.69, "learning_rate": 0.00019692262016174315, "loss": 0.0432, "step": 106470 }, { "epoch": 0.69, "learning_rate": 0.00019691293880738623, "loss": 0.0466, "step": 106480 }, { "epoch": 0.69, "learning_rate": 0.00019690325745302928, "loss": 0.0459, "step": 106490 }, { "epoch": 0.69, "learning_rate": 0.00019689357609867233, "loss": 0.046, "step": 106500 }, { "epoch": 0.69, "learning_rate": 0.00019688389474431541, "loss": 0.0432, "step": 106510 }, { "epoch": 0.69, "learning_rate": 0.00019687421338995847, "loss": 0.0447, "step": 106520 }, { "epoch": 0.69, "learning_rate": 0.00019686453203560155, "loss": 0.0431, "step": 106530 }, { "epoch": 0.69, "learning_rate": 0.00019685485068124463, "loss": 0.0478, "step": 106540 }, { "epoch": 0.69, "learning_rate": 0.0001968451693268877, "loss": 0.0414, "step": 106550 }, { "epoch": 0.69, "learning_rate": 0.00019683548797253076, "loss": 0.0518, "step": 106560 }, { "epoch": 0.69, "learning_rate": 0.0001968258066181738, "loss": 0.0495, "step": 106570 }, { "epoch": 0.69, "learning_rate": 0.0001968161252638169, "loss": 0.0461, "step": 106580 }, { "epoch": 0.69, "learning_rate": 0.00019680644390945994, "loss": 0.0522, "step": 106590 }, { "epoch": 0.69, "learning_rate": 0.00019679676255510302, "loss": 0.0511, "step": 106600 }, { "epoch": 0.69, "learning_rate": 0.0001967870812007461, "loss": 0.0493, "step": 106610 }, { "epoch": 0.69, "learning_rate": 0.00019677739984638918, "loss": 0.0489, "step": 106620 }, { "epoch": 0.69, "learning_rate": 0.00019676771849203224, "loss": 0.0434, "step": 106630 }, { "epoch": 0.69, "learning_rate": 0.0001967580371376753, "loss": 0.0419, "step": 106640 }, { "epoch": 0.69, "learning_rate": 0.00019674835578331837, "loss": 0.0449, "step": 106650 }, { "epoch": 0.69, "learning_rate": 0.00019673867442896142, "loss": 0.0512, "step": 106660 }, { "epoch": 0.69, "learning_rate": 0.0001967289930746045, "loss": 0.0501, "step": 106670 }, { "epoch": 0.69, "learning_rate": 0.00019671931172024758, "loss": 0.0555, "step": 106680 }, { "epoch": 0.69, "learning_rate": 0.00019670963036589063, "loss": 0.0446, "step": 106690 }, { "epoch": 0.69, "learning_rate": 0.0001966999490115337, "loss": 0.0518, "step": 106700 }, { "epoch": 0.69, "learning_rate": 0.00019669026765717677, "loss": 0.045, "step": 106710 }, { "epoch": 0.69, "learning_rate": 0.00019668058630281982, "loss": 0.0484, "step": 106720 }, { "epoch": 0.69, "learning_rate": 0.0001966709049484629, "loss": 0.0467, "step": 106730 }, { "epoch": 0.69, "learning_rate": 0.00019666122359410598, "loss": 0.041, "step": 106740 }, { "epoch": 0.69, "learning_rate": 0.00019665154223974906, "loss": 0.0454, "step": 106750 }, { "epoch": 0.69, "learning_rate": 0.0001966418608853921, "loss": 0.0439, "step": 106760 }, { "epoch": 0.69, "learning_rate": 0.00019663217953103516, "loss": 0.0424, "step": 106770 }, { "epoch": 0.69, "learning_rate": 0.00019662249817667824, "loss": 0.0413, "step": 106780 }, { "epoch": 0.69, "learning_rate": 0.0001966128168223213, "loss": 0.0457, "step": 106790 }, { "epoch": 0.69, "learning_rate": 0.00019660313546796438, "loss": 0.0395, "step": 106800 }, { "epoch": 0.69, "learning_rate": 0.00019659345411360746, "loss": 0.0538, "step": 106810 }, { "epoch": 0.69, "learning_rate": 0.00019658377275925054, "loss": 0.0418, "step": 106820 }, { "epoch": 0.69, "learning_rate": 0.0001965740914048936, "loss": 0.046, "step": 106830 }, { "epoch": 0.69, "learning_rate": 0.00019656441005053664, "loss": 0.0454, "step": 106840 }, { "epoch": 0.69, "learning_rate": 0.00019655472869617972, "loss": 0.0533, "step": 106850 }, { "epoch": 0.69, "learning_rate": 0.00019654504734182277, "loss": 0.0457, "step": 106860 }, { "epoch": 0.69, "learning_rate": 0.00019653536598746585, "loss": 0.1217, "step": 106870 }, { "epoch": 0.69, "learning_rate": 0.00019652568463310893, "loss": 0.0501, "step": 106880 }, { "epoch": 0.69, "learning_rate": 0.000196516003278752, "loss": 0.0533, "step": 106890 }, { "epoch": 0.69, "learning_rate": 0.00019650632192439507, "loss": 0.0463, "step": 106900 }, { "epoch": 0.69, "learning_rate": 0.00019649664057003812, "loss": 0.0432, "step": 106910 }, { "epoch": 0.69, "learning_rate": 0.00019648695921568117, "loss": 0.0494, "step": 106920 }, { "epoch": 0.69, "learning_rate": 0.00019647727786132425, "loss": 0.0406, "step": 106930 }, { "epoch": 0.69, "learning_rate": 0.00019646759650696733, "loss": 0.0508, "step": 106940 }, { "epoch": 0.69, "learning_rate": 0.0001964579151526104, "loss": 0.0455, "step": 106950 }, { "epoch": 0.69, "learning_rate": 0.00019644823379825346, "loss": 0.0402, "step": 106960 }, { "epoch": 0.69, "learning_rate": 0.00019643855244389654, "loss": 0.0482, "step": 106970 }, { "epoch": 0.69, "learning_rate": 0.0001964288710895396, "loss": 0.0958, "step": 106980 }, { "epoch": 0.69, "learning_rate": 0.00019641918973518265, "loss": 0.056, "step": 106990 }, { "epoch": 0.69, "learning_rate": 0.00019640950838082573, "loss": 0.0456, "step": 107000 }, { "epoch": 0.69, "eval_cer": 0.9199249802282228, "eval_loss": 0.03076346032321453, "eval_runtime": 119.7637, "eval_samples_per_second": 16.7, "eval_steps_per_second": 4.175, "step": 107000 }, { "epoch": 0.69, "learning_rate": 0.0001963998270264688, "loss": 0.0391, "step": 107010 }, { "epoch": 0.69, "learning_rate": 0.0001963901456721119, "loss": 0.0503, "step": 107020 }, { "epoch": 0.69, "learning_rate": 0.00019638046431775494, "loss": 0.0497, "step": 107030 }, { "epoch": 0.69, "learning_rate": 0.00019637078296339802, "loss": 0.0553, "step": 107040 }, { "epoch": 0.69, "learning_rate": 0.00019636110160904107, "loss": 0.0503, "step": 107050 }, { "epoch": 0.69, "learning_rate": 0.00019635142025468412, "loss": 0.0498, "step": 107060 }, { "epoch": 0.69, "learning_rate": 0.0001963417389003272, "loss": 0.0547, "step": 107070 }, { "epoch": 0.69, "learning_rate": 0.00019633205754597028, "loss": 0.0447, "step": 107080 }, { "epoch": 0.69, "learning_rate": 0.00019632237619161336, "loss": 0.0471, "step": 107090 }, { "epoch": 0.69, "learning_rate": 0.00019631269483725642, "loss": 0.0451, "step": 107100 }, { "epoch": 0.69, "learning_rate": 0.0001963030134828995, "loss": 0.0459, "step": 107110 }, { "epoch": 0.69, "learning_rate": 0.00019629333212854252, "loss": 0.0442, "step": 107120 }, { "epoch": 0.69, "learning_rate": 0.0001962836507741856, "loss": 0.0466, "step": 107130 }, { "epoch": 0.69, "learning_rate": 0.00019627396941982868, "loss": 0.0467, "step": 107140 }, { "epoch": 0.69, "learning_rate": 0.00019626428806547176, "loss": 0.0502, "step": 107150 }, { "epoch": 0.69, "learning_rate": 0.00019625460671111481, "loss": 0.046, "step": 107160 }, { "epoch": 0.69, "learning_rate": 0.0001962449253567579, "loss": 0.0436, "step": 107170 }, { "epoch": 0.69, "learning_rate": 0.00019623524400240097, "loss": 0.0418, "step": 107180 }, { "epoch": 0.69, "learning_rate": 0.000196225562648044, "loss": 0.0431, "step": 107190 }, { "epoch": 0.69, "learning_rate": 0.00019621588129368708, "loss": 0.0433, "step": 107200 }, { "epoch": 0.69, "learning_rate": 0.00019620619993933016, "loss": 0.0463, "step": 107210 }, { "epoch": 0.69, "learning_rate": 0.00019619651858497324, "loss": 0.0439, "step": 107220 }, { "epoch": 0.69, "learning_rate": 0.0001961868372306163, "loss": 0.0467, "step": 107230 }, { "epoch": 0.69, "learning_rate": 0.00019617715587625937, "loss": 0.0598, "step": 107240 }, { "epoch": 0.69, "learning_rate": 0.00019616747452190245, "loss": 0.0482, "step": 107250 }, { "epoch": 0.69, "learning_rate": 0.00019615779316754548, "loss": 0.0456, "step": 107260 }, { "epoch": 0.69, "learning_rate": 0.00019614811181318856, "loss": 0.0545, "step": 107270 }, { "epoch": 0.69, "learning_rate": 0.00019613843045883164, "loss": 0.0454, "step": 107280 }, { "epoch": 0.69, "learning_rate": 0.00019612874910447472, "loss": 0.04, "step": 107290 }, { "epoch": 0.69, "learning_rate": 0.00019611906775011777, "loss": 0.0416, "step": 107300 }, { "epoch": 0.69, "learning_rate": 0.00019610938639576085, "loss": 0.0554, "step": 107310 }, { "epoch": 0.69, "learning_rate": 0.00019609970504140393, "loss": 0.0473, "step": 107320 }, { "epoch": 0.69, "learning_rate": 0.00019609002368704695, "loss": 0.046, "step": 107330 }, { "epoch": 0.69, "learning_rate": 0.00019608034233269003, "loss": 0.044, "step": 107340 }, { "epoch": 0.69, "learning_rate": 0.00019607066097833311, "loss": 0.0415, "step": 107350 }, { "epoch": 0.69, "learning_rate": 0.00019606097962397617, "loss": 0.0453, "step": 107360 }, { "epoch": 0.69, "learning_rate": 0.00019605129826961925, "loss": 0.0457, "step": 107370 }, { "epoch": 0.69, "learning_rate": 0.00019604161691526233, "loss": 0.0437, "step": 107380 }, { "epoch": 0.69, "learning_rate": 0.0001960319355609054, "loss": 0.045, "step": 107390 }, { "epoch": 0.69, "learning_rate": 0.00019602225420654843, "loss": 0.0422, "step": 107400 }, { "epoch": 0.69, "learning_rate": 0.0001960125728521915, "loss": 0.0469, "step": 107410 }, { "epoch": 0.69, "learning_rate": 0.0001960028914978346, "loss": 0.0472, "step": 107420 }, { "epoch": 0.69, "learning_rate": 0.00019599321014347764, "loss": 0.0535, "step": 107430 }, { "epoch": 0.69, "learning_rate": 0.00019598352878912072, "loss": 0.0453, "step": 107440 }, { "epoch": 0.69, "learning_rate": 0.0001959738474347638, "loss": 0.0432, "step": 107450 }, { "epoch": 0.69, "learning_rate": 0.00019596416608040688, "loss": 0.051, "step": 107460 }, { "epoch": 0.69, "learning_rate": 0.0001959544847260499, "loss": 0.0443, "step": 107470 }, { "epoch": 0.69, "learning_rate": 0.000195944803371693, "loss": 0.043, "step": 107480 }, { "epoch": 0.69, "learning_rate": 0.00019593512201733607, "loss": 0.0442, "step": 107490 }, { "epoch": 0.69, "learning_rate": 0.00019592544066297912, "loss": 0.0516, "step": 107500 }, { "epoch": 0.69, "learning_rate": 0.0001959157593086222, "loss": 0.043, "step": 107510 }, { "epoch": 0.69, "learning_rate": 0.00019590607795426528, "loss": 0.0432, "step": 107520 }, { "epoch": 0.69, "learning_rate": 0.00019589639659990833, "loss": 0.0405, "step": 107530 }, { "epoch": 0.69, "learning_rate": 0.00019588671524555139, "loss": 0.0459, "step": 107540 }, { "epoch": 0.69, "learning_rate": 0.00019587703389119447, "loss": 0.0482, "step": 107550 }, { "epoch": 0.69, "learning_rate": 0.00019586735253683752, "loss": 0.0427, "step": 107560 }, { "epoch": 0.69, "learning_rate": 0.0001958576711824806, "loss": 0.0536, "step": 107570 }, { "epoch": 0.69, "learning_rate": 0.00019584798982812368, "loss": 0.0398, "step": 107580 }, { "epoch": 0.69, "learning_rate": 0.00019583830847376676, "loss": 0.0457, "step": 107590 }, { "epoch": 0.69, "learning_rate": 0.0001958286271194098, "loss": 0.0677, "step": 107600 }, { "epoch": 0.69, "learning_rate": 0.00019581894576505286, "loss": 0.0438, "step": 107610 }, { "epoch": 0.69, "learning_rate": 0.00019580926441069594, "loss": 0.047, "step": 107620 }, { "epoch": 0.69, "learning_rate": 0.000195799583056339, "loss": 0.0427, "step": 107630 }, { "epoch": 0.69, "learning_rate": 0.00019578990170198208, "loss": 0.0457, "step": 107640 }, { "epoch": 0.69, "learning_rate": 0.00019578022034762516, "loss": 0.0456, "step": 107650 }, { "epoch": 0.69, "learning_rate": 0.00019577053899326823, "loss": 0.0555, "step": 107660 }, { "epoch": 0.69, "learning_rate": 0.0001957608576389113, "loss": 0.049, "step": 107670 }, { "epoch": 0.69, "learning_rate": 0.00019575117628455434, "loss": 0.0445, "step": 107680 }, { "epoch": 0.7, "learning_rate": 0.00019574149493019742, "loss": 0.0455, "step": 107690 }, { "epoch": 0.7, "learning_rate": 0.00019573181357584047, "loss": 0.0425, "step": 107700 }, { "epoch": 0.7, "learning_rate": 0.00019572213222148355, "loss": 0.0489, "step": 107710 }, { "epoch": 0.7, "learning_rate": 0.00019571245086712663, "loss": 0.0452, "step": 107720 }, { "epoch": 0.7, "learning_rate": 0.00019570276951276968, "loss": 0.0449, "step": 107730 }, { "epoch": 0.7, "learning_rate": 0.00019569308815841276, "loss": 0.062, "step": 107740 }, { "epoch": 0.7, "learning_rate": 0.00019568340680405582, "loss": 0.0558, "step": 107750 }, { "epoch": 0.7, "learning_rate": 0.00019567372544969887, "loss": 0.0446, "step": 107760 }, { "epoch": 0.7, "learning_rate": 0.00019566404409534195, "loss": 0.0442, "step": 107770 }, { "epoch": 0.7, "learning_rate": 0.00019565436274098503, "loss": 0.0446, "step": 107780 }, { "epoch": 0.7, "learning_rate": 0.0001956446813866281, "loss": 0.0386, "step": 107790 }, { "epoch": 0.7, "learning_rate": 0.00019563500003227116, "loss": 0.0495, "step": 107800 }, { "epoch": 0.7, "learning_rate": 0.00019562531867791424, "loss": 0.0402, "step": 107810 }, { "epoch": 0.7, "learning_rate": 0.0001956156373235573, "loss": 0.0413, "step": 107820 }, { "epoch": 0.7, "learning_rate": 0.00019560595596920035, "loss": 0.0529, "step": 107830 }, { "epoch": 0.7, "learning_rate": 0.00019559627461484343, "loss": 0.0431, "step": 107840 }, { "epoch": 0.7, "learning_rate": 0.0001955865932604865, "loss": 0.0563, "step": 107850 }, { "epoch": 0.7, "learning_rate": 0.0001955769119061296, "loss": 0.0563, "step": 107860 }, { "epoch": 0.7, "learning_rate": 0.00019556723055177264, "loss": 0.0424, "step": 107870 }, { "epoch": 0.7, "learning_rate": 0.00019555754919741572, "loss": 0.0392, "step": 107880 }, { "epoch": 0.7, "learning_rate": 0.00019554786784305877, "loss": 0.0493, "step": 107890 }, { "epoch": 0.7, "learning_rate": 0.00019553818648870182, "loss": 0.0463, "step": 107900 }, { "epoch": 0.7, "learning_rate": 0.0001955285051343449, "loss": 0.043, "step": 107910 }, { "epoch": 0.7, "learning_rate": 0.00019551882377998798, "loss": 0.0525, "step": 107920 }, { "epoch": 0.7, "learning_rate": 0.00019550914242563104, "loss": 0.0453, "step": 107930 }, { "epoch": 0.7, "learning_rate": 0.00019549946107127412, "loss": 0.0496, "step": 107940 }, { "epoch": 0.7, "learning_rate": 0.0001954897797169172, "loss": 0.0443, "step": 107950 }, { "epoch": 0.7, "learning_rate": 0.00019548009836256022, "loss": 0.0442, "step": 107960 }, { "epoch": 0.7, "learning_rate": 0.0001954704170082033, "loss": 0.0589, "step": 107970 }, { "epoch": 0.7, "learning_rate": 0.00019546073565384638, "loss": 0.0403, "step": 107980 }, { "epoch": 0.7, "learning_rate": 0.00019545105429948946, "loss": 0.043, "step": 107990 }, { "epoch": 0.7, "learning_rate": 0.00019544137294513251, "loss": 0.0433, "step": 108000 }, { "epoch": 0.7, "eval_cer": 0.9200207886114563, "eval_loss": 0.030186787247657776, "eval_runtime": 119.9054, "eval_samples_per_second": 16.68, "eval_steps_per_second": 4.17, "step": 108000 }, { "epoch": 0.7, "learning_rate": 0.0001954316915907756, "loss": 0.0465, "step": 108010 }, { "epoch": 0.7, "learning_rate": 0.00019542201023641867, "loss": 0.0443, "step": 108020 }, { "epoch": 0.7, "learning_rate": 0.0001954123288820617, "loss": 0.0405, "step": 108030 }, { "epoch": 0.7, "learning_rate": 0.00019540264752770478, "loss": 0.0418, "step": 108040 }, { "epoch": 0.7, "learning_rate": 0.00019539296617334786, "loss": 0.0472, "step": 108050 }, { "epoch": 0.7, "learning_rate": 0.00019538328481899094, "loss": 0.0409, "step": 108060 }, { "epoch": 0.7, "learning_rate": 0.000195373603464634, "loss": 0.0472, "step": 108070 }, { "epoch": 0.7, "learning_rate": 0.00019536392211027707, "loss": 0.0436, "step": 108080 }, { "epoch": 0.7, "learning_rate": 0.00019535424075592015, "loss": 0.0471, "step": 108090 }, { "epoch": 0.7, "learning_rate": 0.00019534455940156318, "loss": 0.0443, "step": 108100 }, { "epoch": 0.7, "learning_rate": 0.00019533487804720626, "loss": 0.0473, "step": 108110 }, { "epoch": 0.7, "learning_rate": 0.00019532519669284934, "loss": 0.0452, "step": 108120 }, { "epoch": 0.7, "learning_rate": 0.0001953155153384924, "loss": 0.0505, "step": 108130 }, { "epoch": 0.7, "learning_rate": 0.00019530583398413547, "loss": 0.0456, "step": 108140 }, { "epoch": 0.7, "learning_rate": 0.00019529615262977855, "loss": 0.0455, "step": 108150 }, { "epoch": 0.7, "learning_rate": 0.00019528647127542163, "loss": 0.0414, "step": 108160 }, { "epoch": 0.7, "learning_rate": 0.00019527678992106465, "loss": 0.0433, "step": 108170 }, { "epoch": 0.7, "learning_rate": 0.00019526710856670773, "loss": 0.0397, "step": 108180 }, { "epoch": 0.7, "learning_rate": 0.0001952574272123508, "loss": 0.0482, "step": 108190 }, { "epoch": 0.7, "learning_rate": 0.00019524774585799387, "loss": 0.0464, "step": 108200 }, { "epoch": 0.7, "learning_rate": 0.00019523806450363695, "loss": 0.0442, "step": 108210 }, { "epoch": 0.7, "learning_rate": 0.00019522838314928003, "loss": 0.0598, "step": 108220 }, { "epoch": 0.7, "learning_rate": 0.0001952187017949231, "loss": 0.0421, "step": 108230 }, { "epoch": 0.7, "learning_rate": 0.00019520902044056613, "loss": 0.0427, "step": 108240 }, { "epoch": 0.7, "learning_rate": 0.0001951993390862092, "loss": 0.0499, "step": 108250 }, { "epoch": 0.7, "learning_rate": 0.0001951896577318523, "loss": 0.054, "step": 108260 }, { "epoch": 0.7, "learning_rate": 0.00019517997637749534, "loss": 0.053, "step": 108270 }, { "epoch": 0.7, "learning_rate": 0.00019517029502313842, "loss": 0.0446, "step": 108280 }, { "epoch": 0.7, "learning_rate": 0.0001951606136687815, "loss": 0.0442, "step": 108290 }, { "epoch": 0.7, "learning_rate": 0.00019515093231442456, "loss": 0.0542, "step": 108300 }, { "epoch": 0.7, "learning_rate": 0.0001951412509600676, "loss": 0.05, "step": 108310 }, { "epoch": 0.7, "learning_rate": 0.0001951315696057107, "loss": 0.0442, "step": 108320 }, { "epoch": 0.7, "learning_rate": 0.00019512188825135374, "loss": 0.0403, "step": 108330 }, { "epoch": 0.7, "learning_rate": 0.00019511220689699682, "loss": 0.0435, "step": 108340 }, { "epoch": 0.7, "learning_rate": 0.0001951025255426399, "loss": 0.041, "step": 108350 }, { "epoch": 0.7, "learning_rate": 0.00019509284418828298, "loss": 0.0455, "step": 108360 }, { "epoch": 0.7, "learning_rate": 0.00019508316283392603, "loss": 0.0439, "step": 108370 }, { "epoch": 0.7, "learning_rate": 0.00019507348147956909, "loss": 0.0426, "step": 108380 }, { "epoch": 0.7, "learning_rate": 0.00019506380012521217, "loss": 0.0454, "step": 108390 }, { "epoch": 0.7, "learning_rate": 0.00019505411877085522, "loss": 0.0466, "step": 108400 }, { "epoch": 0.7, "learning_rate": 0.0001950444374164983, "loss": 0.0445, "step": 108410 }, { "epoch": 0.7, "learning_rate": 0.00019503475606214138, "loss": 0.0436, "step": 108420 }, { "epoch": 0.7, "learning_rate": 0.00019502507470778446, "loss": 0.0428, "step": 108430 }, { "epoch": 0.7, "learning_rate": 0.0001950153933534275, "loss": 0.0439, "step": 108440 }, { "epoch": 0.7, "learning_rate": 0.00019500571199907056, "loss": 0.0427, "step": 108450 }, { "epoch": 0.7, "learning_rate": 0.00019499603064471364, "loss": 0.0552, "step": 108460 }, { "epoch": 0.7, "learning_rate": 0.0001949863492903567, "loss": 0.0447, "step": 108470 }, { "epoch": 0.7, "learning_rate": 0.00019497666793599977, "loss": 0.042, "step": 108480 }, { "epoch": 0.7, "learning_rate": 0.00019496698658164285, "loss": 0.0468, "step": 108490 }, { "epoch": 0.7, "learning_rate": 0.0001949573052272859, "loss": 0.0542, "step": 108500 }, { "epoch": 0.7, "learning_rate": 0.000194947623872929, "loss": 0.0579, "step": 108510 }, { "epoch": 0.7, "learning_rate": 0.00019493794251857204, "loss": 0.0489, "step": 108520 }, { "epoch": 0.7, "learning_rate": 0.0001949282611642151, "loss": 0.0478, "step": 108530 }, { "epoch": 0.7, "learning_rate": 0.00019491857980985817, "loss": 0.0593, "step": 108540 }, { "epoch": 0.7, "learning_rate": 0.00019490889845550125, "loss": 0.0502, "step": 108550 }, { "epoch": 0.7, "learning_rate": 0.00019489921710114433, "loss": 0.0473, "step": 108560 }, { "epoch": 0.7, "learning_rate": 0.00019488953574678738, "loss": 0.0459, "step": 108570 }, { "epoch": 0.7, "learning_rate": 0.00019487985439243046, "loss": 0.0483, "step": 108580 }, { "epoch": 0.7, "learning_rate": 0.00019487017303807352, "loss": 0.0596, "step": 108590 }, { "epoch": 0.7, "learning_rate": 0.00019486049168371657, "loss": 0.0416, "step": 108600 }, { "epoch": 0.7, "learning_rate": 0.00019485081032935965, "loss": 0.0439, "step": 108610 }, { "epoch": 0.7, "learning_rate": 0.00019484112897500273, "loss": 0.0489, "step": 108620 }, { "epoch": 0.7, "learning_rate": 0.0001948314476206458, "loss": 0.0441, "step": 108630 }, { "epoch": 0.7, "learning_rate": 0.00019482176626628886, "loss": 0.0441, "step": 108640 }, { "epoch": 0.7, "learning_rate": 0.00019481208491193194, "loss": 0.0512, "step": 108650 }, { "epoch": 0.7, "learning_rate": 0.000194802403557575, "loss": 0.0438, "step": 108660 }, { "epoch": 0.7, "learning_rate": 0.00019479272220321805, "loss": 0.0451, "step": 108670 }, { "epoch": 0.7, "learning_rate": 0.00019478304084886113, "loss": 0.0467, "step": 108680 }, { "epoch": 0.7, "learning_rate": 0.0001947733594945042, "loss": 0.0405, "step": 108690 }, { "epoch": 0.7, "learning_rate": 0.00019476367814014726, "loss": 0.0518, "step": 108700 }, { "epoch": 0.7, "learning_rate": 0.00019475399678579034, "loss": 0.0486, "step": 108710 }, { "epoch": 0.7, "learning_rate": 0.00019474431543143342, "loss": 0.0474, "step": 108720 }, { "epoch": 0.7, "learning_rate": 0.00019473463407707644, "loss": 0.0381, "step": 108730 }, { "epoch": 0.7, "learning_rate": 0.00019472495272271952, "loss": 0.0455, "step": 108740 }, { "epoch": 0.7, "learning_rate": 0.0001947152713683626, "loss": 0.0521, "step": 108750 }, { "epoch": 0.7, "learning_rate": 0.00019470559001400568, "loss": 0.0405, "step": 108760 }, { "epoch": 0.7, "learning_rate": 0.00019469590865964874, "loss": 0.0482, "step": 108770 }, { "epoch": 0.7, "learning_rate": 0.00019468622730529182, "loss": 0.0408, "step": 108780 }, { "epoch": 0.7, "learning_rate": 0.0001946765459509349, "loss": 0.0498, "step": 108790 }, { "epoch": 0.7, "learning_rate": 0.00019466686459657792, "loss": 0.0428, "step": 108800 }, { "epoch": 0.7, "learning_rate": 0.000194657183242221, "loss": 0.0442, "step": 108810 }, { "epoch": 0.7, "learning_rate": 0.00019464750188786408, "loss": 0.0456, "step": 108820 }, { "epoch": 0.7, "learning_rate": 0.00019463782053350716, "loss": 0.048, "step": 108830 }, { "epoch": 0.7, "learning_rate": 0.00019462813917915021, "loss": 0.0477, "step": 108840 }, { "epoch": 0.7, "learning_rate": 0.0001946184578247933, "loss": 0.0567, "step": 108850 }, { "epoch": 0.7, "learning_rate": 0.00019460877647043637, "loss": 0.0451, "step": 108860 }, { "epoch": 0.7, "learning_rate": 0.0001945990951160794, "loss": 0.047, "step": 108870 }, { "epoch": 0.7, "learning_rate": 0.00019458941376172248, "loss": 0.0414, "step": 108880 }, { "epoch": 0.7, "learning_rate": 0.00019457973240736556, "loss": 0.0427, "step": 108890 }, { "epoch": 0.7, "learning_rate": 0.0001945700510530086, "loss": 0.046, "step": 108900 }, { "epoch": 0.7, "learning_rate": 0.0001945603696986517, "loss": 0.045, "step": 108910 }, { "epoch": 0.7, "learning_rate": 0.00019455068834429477, "loss": 0.0528, "step": 108920 }, { "epoch": 0.7, "learning_rate": 0.00019454100698993785, "loss": 0.0459, "step": 108930 }, { "epoch": 0.7, "learning_rate": 0.00019453132563558088, "loss": 0.0386, "step": 108940 }, { "epoch": 0.7, "learning_rate": 0.00019452164428122396, "loss": 0.0472, "step": 108950 }, { "epoch": 0.7, "learning_rate": 0.00019451196292686704, "loss": 0.0456, "step": 108960 }, { "epoch": 0.7, "learning_rate": 0.0001945022815725101, "loss": 0.0564, "step": 108970 }, { "epoch": 0.7, "learning_rate": 0.00019449260021815317, "loss": 0.0496, "step": 108980 }, { "epoch": 0.7, "learning_rate": 0.00019448291886379625, "loss": 0.0491, "step": 108990 }, { "epoch": 0.7, "learning_rate": 0.00019447323750943933, "loss": 0.0498, "step": 109000 }, { "epoch": 0.7, "eval_cer": 0.9199918653259519, "eval_loss": 0.029607662931084633, "eval_runtime": 119.9769, "eval_samples_per_second": 16.67, "eval_steps_per_second": 4.167, "step": 109000 }, { "epoch": 0.7, "learning_rate": 0.00019446355615508235, "loss": 0.0528, "step": 109010 }, { "epoch": 0.7, "learning_rate": 0.00019445387480072543, "loss": 0.0442, "step": 109020 }, { "epoch": 0.7, "learning_rate": 0.0001944441934463685, "loss": 0.0491, "step": 109030 }, { "epoch": 0.7, "learning_rate": 0.00019443451209201157, "loss": 0.0482, "step": 109040 }, { "epoch": 0.7, "learning_rate": 0.00019442483073765465, "loss": 0.0472, "step": 109050 }, { "epoch": 0.7, "learning_rate": 0.00019441514938329773, "loss": 0.0502, "step": 109060 }, { "epoch": 0.7, "learning_rate": 0.0001944054680289408, "loss": 0.0439, "step": 109070 }, { "epoch": 0.7, "learning_rate": 0.00019439578667458383, "loss": 0.0465, "step": 109080 }, { "epoch": 0.7, "learning_rate": 0.0001943861053202269, "loss": 0.049, "step": 109090 }, { "epoch": 0.7, "learning_rate": 0.00019437642396586996, "loss": 0.0409, "step": 109100 }, { "epoch": 0.7, "learning_rate": 0.00019436674261151304, "loss": 0.0475, "step": 109110 }, { "epoch": 0.7, "learning_rate": 0.00019435706125715612, "loss": 0.0451, "step": 109120 }, { "epoch": 0.7, "learning_rate": 0.0001943473799027992, "loss": 0.0473, "step": 109130 }, { "epoch": 0.7, "learning_rate": 0.00019433769854844226, "loss": 0.0415, "step": 109140 }, { "epoch": 0.7, "learning_rate": 0.0001943280171940853, "loss": 0.0438, "step": 109150 }, { "epoch": 0.7, "learning_rate": 0.0001943183358397284, "loss": 0.0478, "step": 109160 }, { "epoch": 0.7, "learning_rate": 0.00019430865448537144, "loss": 0.0409, "step": 109170 }, { "epoch": 0.7, "learning_rate": 0.00019429897313101452, "loss": 0.0411, "step": 109180 }, { "epoch": 0.7, "learning_rate": 0.0001942892917766576, "loss": 0.0472, "step": 109190 }, { "epoch": 0.7, "learning_rate": 0.00019427961042230068, "loss": 0.0402, "step": 109200 }, { "epoch": 0.7, "learning_rate": 0.00019426992906794373, "loss": 0.037, "step": 109210 }, { "epoch": 0.7, "learning_rate": 0.00019426024771358678, "loss": 0.0575, "step": 109220 }, { "epoch": 0.7, "learning_rate": 0.00019425056635922986, "loss": 0.0434, "step": 109230 }, { "epoch": 0.71, "learning_rate": 0.00019424088500487292, "loss": 0.0483, "step": 109240 }, { "epoch": 0.71, "learning_rate": 0.000194231203650516, "loss": 0.045, "step": 109250 }, { "epoch": 0.71, "learning_rate": 0.00019422152229615908, "loss": 0.0456, "step": 109260 }, { "epoch": 0.71, "learning_rate": 0.00019421184094180216, "loss": 0.04, "step": 109270 }, { "epoch": 0.71, "learning_rate": 0.0001942021595874452, "loss": 0.0437, "step": 109280 }, { "epoch": 0.71, "learning_rate": 0.00019419247823308826, "loss": 0.0465, "step": 109290 }, { "epoch": 0.71, "learning_rate": 0.00019418279687873131, "loss": 0.0493, "step": 109300 }, { "epoch": 0.71, "learning_rate": 0.0001941731155243744, "loss": 0.0401, "step": 109310 }, { "epoch": 0.71, "learning_rate": 0.00019416343417001747, "loss": 0.0469, "step": 109320 }, { "epoch": 0.71, "learning_rate": 0.00019415375281566055, "loss": 0.0452, "step": 109330 }, { "epoch": 0.71, "learning_rate": 0.0001941440714613036, "loss": 0.048, "step": 109340 }, { "epoch": 0.71, "learning_rate": 0.0001941343901069467, "loss": 0.0446, "step": 109350 }, { "epoch": 0.71, "learning_rate": 0.00019412470875258974, "loss": 0.0439, "step": 109360 }, { "epoch": 0.71, "learning_rate": 0.0001941150273982328, "loss": 0.0436, "step": 109370 }, { "epoch": 0.71, "learning_rate": 0.00019410534604387587, "loss": 0.0428, "step": 109380 }, { "epoch": 0.71, "learning_rate": 0.00019409566468951895, "loss": 0.0441, "step": 109390 }, { "epoch": 0.71, "learning_rate": 0.00019408598333516203, "loss": 0.0452, "step": 109400 }, { "epoch": 0.71, "learning_rate": 0.00019407630198080508, "loss": 0.0535, "step": 109410 }, { "epoch": 0.71, "learning_rate": 0.00019406662062644816, "loss": 0.0437, "step": 109420 }, { "epoch": 0.71, "learning_rate": 0.00019405693927209122, "loss": 0.0414, "step": 109430 }, { "epoch": 0.71, "learning_rate": 0.00019404725791773427, "loss": 0.0478, "step": 109440 }, { "epoch": 0.71, "learning_rate": 0.00019403757656337735, "loss": 0.0475, "step": 109450 }, { "epoch": 0.71, "learning_rate": 0.00019402789520902043, "loss": 0.0453, "step": 109460 }, { "epoch": 0.71, "learning_rate": 0.0001940182138546635, "loss": 0.0451, "step": 109470 }, { "epoch": 0.71, "learning_rate": 0.00019400853250030656, "loss": 0.0429, "step": 109480 }, { "epoch": 0.71, "learning_rate": 0.00019399885114594964, "loss": 0.0477, "step": 109490 }, { "epoch": 0.71, "learning_rate": 0.00019398916979159267, "loss": 0.0436, "step": 109500 }, { "epoch": 0.71, "learning_rate": 0.00019397948843723575, "loss": 0.0439, "step": 109510 }, { "epoch": 0.71, "learning_rate": 0.00019396980708287883, "loss": 0.0513, "step": 109520 }, { "epoch": 0.71, "learning_rate": 0.0001939601257285219, "loss": 0.0403, "step": 109530 }, { "epoch": 0.71, "learning_rate": 0.00019395044437416496, "loss": 0.0436, "step": 109540 }, { "epoch": 0.71, "learning_rate": 0.00019394076301980804, "loss": 0.0428, "step": 109550 }, { "epoch": 0.71, "learning_rate": 0.00019393108166545112, "loss": 0.0418, "step": 109560 }, { "epoch": 0.71, "learning_rate": 0.00019392140031109414, "loss": 0.0461, "step": 109570 }, { "epoch": 0.71, "learning_rate": 0.00019391171895673722, "loss": 0.043, "step": 109580 }, { "epoch": 0.71, "learning_rate": 0.0001939020376023803, "loss": 0.0503, "step": 109590 }, { "epoch": 0.71, "learning_rate": 0.00019389235624802338, "loss": 0.0462, "step": 109600 }, { "epoch": 0.71, "learning_rate": 0.00019388267489366644, "loss": 0.0442, "step": 109610 }, { "epoch": 0.71, "learning_rate": 0.00019387299353930952, "loss": 0.0473, "step": 109620 }, { "epoch": 0.71, "learning_rate": 0.0001938633121849526, "loss": 0.0449, "step": 109630 }, { "epoch": 0.71, "learning_rate": 0.00019385363083059562, "loss": 0.043, "step": 109640 }, { "epoch": 0.71, "learning_rate": 0.0001938439494762387, "loss": 0.05, "step": 109650 }, { "epoch": 0.71, "learning_rate": 0.00019383426812188178, "loss": 0.0477, "step": 109660 }, { "epoch": 0.71, "learning_rate": 0.00019382458676752486, "loss": 0.0442, "step": 109670 }, { "epoch": 0.71, "learning_rate": 0.0001938149054131679, "loss": 0.0544, "step": 109680 }, { "epoch": 0.71, "learning_rate": 0.000193805224058811, "loss": 0.0467, "step": 109690 }, { "epoch": 0.71, "learning_rate": 0.00019379554270445407, "loss": 0.0454, "step": 109700 }, { "epoch": 0.71, "learning_rate": 0.0001937858613500971, "loss": 0.0363, "step": 109710 }, { "epoch": 0.71, "learning_rate": 0.00019377617999574018, "loss": 0.0465, "step": 109720 }, { "epoch": 0.71, "learning_rate": 0.00019376649864138326, "loss": 0.0532, "step": 109730 }, { "epoch": 0.71, "learning_rate": 0.0001937568172870263, "loss": 0.0488, "step": 109740 }, { "epoch": 0.71, "learning_rate": 0.0001937471359326694, "loss": 0.0425, "step": 109750 }, { "epoch": 0.71, "learning_rate": 0.00019373745457831247, "loss": 0.0417, "step": 109760 }, { "epoch": 0.71, "learning_rate": 0.00019372777322395555, "loss": 0.0455, "step": 109770 }, { "epoch": 0.71, "learning_rate": 0.00019371809186959858, "loss": 0.0434, "step": 109780 }, { "epoch": 0.71, "learning_rate": 0.00019370841051524166, "loss": 0.0473, "step": 109790 }, { "epoch": 0.71, "learning_rate": 0.00019369872916088474, "loss": 0.0492, "step": 109800 }, { "epoch": 0.71, "learning_rate": 0.0001936890478065278, "loss": 0.0462, "step": 109810 }, { "epoch": 0.71, "learning_rate": 0.00019367936645217087, "loss": 0.0459, "step": 109820 }, { "epoch": 0.71, "learning_rate": 0.00019366968509781395, "loss": 0.0463, "step": 109830 }, { "epoch": 0.71, "learning_rate": 0.00019366000374345703, "loss": 0.0465, "step": 109840 }, { "epoch": 0.71, "learning_rate": 0.00019365032238910005, "loss": 0.0424, "step": 109850 }, { "epoch": 0.71, "learning_rate": 0.00019364064103474313, "loss": 0.0487, "step": 109860 }, { "epoch": 0.71, "learning_rate": 0.0001936309596803862, "loss": 0.0479, "step": 109870 }, { "epoch": 0.71, "learning_rate": 0.00019362127832602927, "loss": 0.0448, "step": 109880 }, { "epoch": 0.71, "learning_rate": 0.00019361159697167234, "loss": 0.0443, "step": 109890 }, { "epoch": 0.71, "learning_rate": 0.00019360191561731542, "loss": 0.0416, "step": 109900 }, { "epoch": 0.71, "learning_rate": 0.00019359223426295848, "loss": 0.0449, "step": 109910 }, { "epoch": 0.71, "learning_rate": 0.00019358255290860153, "loss": 0.0525, "step": 109920 }, { "epoch": 0.71, "learning_rate": 0.0001935728715542446, "loss": 0.0449, "step": 109930 }, { "epoch": 0.71, "learning_rate": 0.00019356319019988766, "loss": 0.0482, "step": 109940 }, { "epoch": 0.71, "learning_rate": 0.00019355350884553074, "loss": 0.0433, "step": 109950 }, { "epoch": 0.71, "learning_rate": 0.00019354382749117382, "loss": 0.0441, "step": 109960 }, { "epoch": 0.71, "learning_rate": 0.0001935341461368169, "loss": 0.0452, "step": 109970 }, { "epoch": 0.71, "learning_rate": 0.00019352446478245995, "loss": 0.0496, "step": 109980 }, { "epoch": 0.71, "learning_rate": 0.000193514783428103, "loss": 0.0451, "step": 109990 }, { "epoch": 0.71, "learning_rate": 0.0001935051020737461, "loss": 0.0438, "step": 110000 }, { "epoch": 0.71, "eval_cer": 0.9199584227770873, "eval_loss": 0.03002985194325447, "eval_runtime": 120.0419, "eval_samples_per_second": 16.661, "eval_steps_per_second": 4.165, "step": 110000 }, { "epoch": 0.71, "learning_rate": 0.00019349542071938914, "loss": 0.0396, "step": 110010 }, { "epoch": 0.71, "learning_rate": 0.00019348573936503222, "loss": 0.0466, "step": 110020 }, { "epoch": 0.71, "learning_rate": 0.0001934760580106753, "loss": 0.0454, "step": 110030 }, { "epoch": 0.71, "learning_rate": 0.00019346637665631838, "loss": 0.0444, "step": 110040 }, { "epoch": 0.71, "learning_rate": 0.00019345669530196143, "loss": 0.0507, "step": 110050 }, { "epoch": 0.71, "learning_rate": 0.00019344701394760448, "loss": 0.044, "step": 110060 }, { "epoch": 0.71, "learning_rate": 0.00019343733259324756, "loss": 0.0466, "step": 110070 }, { "epoch": 0.71, "learning_rate": 0.00019342765123889062, "loss": 0.0463, "step": 110080 }, { "epoch": 0.71, "learning_rate": 0.0001934179698845337, "loss": 0.0482, "step": 110090 }, { "epoch": 0.71, "learning_rate": 0.00019340828853017678, "loss": 0.0388, "step": 110100 }, { "epoch": 0.71, "learning_rate": 0.00019339860717581983, "loss": 0.0411, "step": 110110 }, { "epoch": 0.71, "learning_rate": 0.0001933889258214629, "loss": 0.0433, "step": 110120 }, { "epoch": 0.71, "learning_rate": 0.00019337924446710596, "loss": 0.0462, "step": 110130 }, { "epoch": 0.71, "learning_rate": 0.00019336956311274901, "loss": 0.0451, "step": 110140 }, { "epoch": 0.71, "learning_rate": 0.0001933598817583921, "loss": 0.0431, "step": 110150 }, { "epoch": 0.71, "learning_rate": 0.00019335020040403517, "loss": 0.0468, "step": 110160 }, { "epoch": 0.71, "learning_rate": 0.00019334051904967825, "loss": 0.0383, "step": 110170 }, { "epoch": 0.71, "learning_rate": 0.0001933308376953213, "loss": 0.0474, "step": 110180 }, { "epoch": 0.71, "learning_rate": 0.00019332115634096439, "loss": 0.0518, "step": 110190 }, { "epoch": 0.71, "learning_rate": 0.00019331147498660744, "loss": 0.0441, "step": 110200 }, { "epoch": 0.71, "learning_rate": 0.0001933017936322505, "loss": 0.0443, "step": 110210 }, { "epoch": 0.71, "learning_rate": 0.00019329211227789357, "loss": 0.0388, "step": 110220 }, { "epoch": 0.71, "learning_rate": 0.00019328243092353665, "loss": 0.0473, "step": 110230 }, { "epoch": 0.71, "learning_rate": 0.00019327274956917973, "loss": 0.0465, "step": 110240 }, { "epoch": 0.71, "learning_rate": 0.00019326306821482278, "loss": 0.0501, "step": 110250 }, { "epoch": 0.71, "learning_rate": 0.00019325338686046586, "loss": 0.0412, "step": 110260 }, { "epoch": 0.71, "learning_rate": 0.00019324370550610892, "loss": 0.0447, "step": 110270 }, { "epoch": 0.71, "learning_rate": 0.00019323402415175197, "loss": 0.0488, "step": 110280 }, { "epoch": 0.71, "learning_rate": 0.00019322434279739505, "loss": 0.0419, "step": 110290 }, { "epoch": 0.71, "learning_rate": 0.00019321466144303813, "loss": 0.0418, "step": 110300 }, { "epoch": 0.71, "learning_rate": 0.00019320498008868118, "loss": 0.0406, "step": 110310 }, { "epoch": 0.71, "learning_rate": 0.00019319529873432426, "loss": 0.0432, "step": 110320 }, { "epoch": 0.71, "learning_rate": 0.00019318561737996734, "loss": 0.047, "step": 110330 }, { "epoch": 0.71, "learning_rate": 0.00019317593602561037, "loss": 0.0459, "step": 110340 }, { "epoch": 0.71, "learning_rate": 0.00019316625467125345, "loss": 0.0427, "step": 110350 }, { "epoch": 0.71, "learning_rate": 0.00019315657331689653, "loss": 0.0523, "step": 110360 }, { "epoch": 0.71, "learning_rate": 0.0001931468919625396, "loss": 0.0417, "step": 110370 }, { "epoch": 0.71, "learning_rate": 0.00019313721060818266, "loss": 0.0483, "step": 110380 }, { "epoch": 0.71, "learning_rate": 0.00019312752925382574, "loss": 0.0418, "step": 110390 }, { "epoch": 0.71, "learning_rate": 0.00019311784789946882, "loss": 0.0415, "step": 110400 }, { "epoch": 0.71, "learning_rate": 0.00019310816654511184, "loss": 0.0433, "step": 110410 }, { "epoch": 0.71, "learning_rate": 0.00019309848519075492, "loss": 0.0446, "step": 110420 }, { "epoch": 0.71, "learning_rate": 0.000193088803836398, "loss": 0.0409, "step": 110430 }, { "epoch": 0.71, "learning_rate": 0.00019307912248204108, "loss": 0.0446, "step": 110440 }, { "epoch": 0.71, "learning_rate": 0.00019306944112768414, "loss": 0.0416, "step": 110450 }, { "epoch": 0.71, "learning_rate": 0.00019305975977332722, "loss": 0.0485, "step": 110460 }, { "epoch": 0.71, "learning_rate": 0.0001930500784189703, "loss": 0.0475, "step": 110470 }, { "epoch": 0.71, "learning_rate": 0.00019304039706461332, "loss": 0.0458, "step": 110480 }, { "epoch": 0.71, "learning_rate": 0.0001930307157102564, "loss": 0.0489, "step": 110490 }, { "epoch": 0.71, "learning_rate": 0.00019302103435589948, "loss": 0.05, "step": 110500 }, { "epoch": 0.71, "learning_rate": 0.00019301135300154253, "loss": 0.0462, "step": 110510 }, { "epoch": 0.71, "learning_rate": 0.0001930016716471856, "loss": 0.0541, "step": 110520 }, { "epoch": 0.71, "learning_rate": 0.0001929919902928287, "loss": 0.0507, "step": 110530 }, { "epoch": 0.71, "learning_rate": 0.00019298230893847177, "loss": 0.0448, "step": 110540 }, { "epoch": 0.71, "learning_rate": 0.0001929726275841148, "loss": 0.0495, "step": 110550 }, { "epoch": 0.71, "learning_rate": 0.00019296294622975788, "loss": 0.0449, "step": 110560 }, { "epoch": 0.71, "learning_rate": 0.00019295326487540096, "loss": 0.0409, "step": 110570 }, { "epoch": 0.71, "learning_rate": 0.000192943583521044, "loss": 0.045, "step": 110580 }, { "epoch": 0.71, "learning_rate": 0.0001929339021666871, "loss": 0.0416, "step": 110590 }, { "epoch": 0.71, "learning_rate": 0.00019292422081233017, "loss": 0.0423, "step": 110600 }, { "epoch": 0.71, "learning_rate": 0.00019291453945797325, "loss": 0.0483, "step": 110610 }, { "epoch": 0.71, "learning_rate": 0.00019290485810361628, "loss": 0.0465, "step": 110620 }, { "epoch": 0.71, "learning_rate": 0.00019289517674925936, "loss": 0.0421, "step": 110630 }, { "epoch": 0.71, "learning_rate": 0.00019288549539490243, "loss": 0.045, "step": 110640 }, { "epoch": 0.71, "learning_rate": 0.0001928758140405455, "loss": 0.0443, "step": 110650 }, { "epoch": 0.71, "learning_rate": 0.00019286613268618857, "loss": 0.0508, "step": 110660 }, { "epoch": 0.71, "learning_rate": 0.00019285645133183165, "loss": 0.0437, "step": 110670 }, { "epoch": 0.71, "learning_rate": 0.0001928467699774747, "loss": 0.0412, "step": 110680 }, { "epoch": 0.71, "learning_rate": 0.00019283708862311775, "loss": 0.0423, "step": 110690 }, { "epoch": 0.71, "learning_rate": 0.00019282740726876083, "loss": 0.0502, "step": 110700 }, { "epoch": 0.71, "learning_rate": 0.00019281772591440389, "loss": 0.0432, "step": 110710 }, { "epoch": 0.71, "learning_rate": 0.00019280804456004696, "loss": 0.048, "step": 110720 }, { "epoch": 0.71, "learning_rate": 0.00019279836320569004, "loss": 0.0437, "step": 110730 }, { "epoch": 0.71, "learning_rate": 0.00019278868185133312, "loss": 0.0429, "step": 110740 }, { "epoch": 0.71, "learning_rate": 0.00019277900049697618, "loss": 0.0432, "step": 110750 }, { "epoch": 0.71, "learning_rate": 0.00019276931914261923, "loss": 0.0437, "step": 110760 }, { "epoch": 0.71, "learning_rate": 0.0001927596377882623, "loss": 0.0428, "step": 110770 }, { "epoch": 0.71, "learning_rate": 0.00019274995643390536, "loss": 0.0472, "step": 110780 }, { "epoch": 0.72, "learning_rate": 0.00019274027507954844, "loss": 0.0481, "step": 110790 }, { "epoch": 0.72, "learning_rate": 0.00019273059372519152, "loss": 0.041, "step": 110800 }, { "epoch": 0.72, "learning_rate": 0.0001927209123708346, "loss": 0.0449, "step": 110810 }, { "epoch": 0.72, "learning_rate": 0.00019271123101647765, "loss": 0.0432, "step": 110820 }, { "epoch": 0.72, "learning_rate": 0.0001927015496621207, "loss": 0.0447, "step": 110830 }, { "epoch": 0.72, "learning_rate": 0.0001926918683077638, "loss": 0.049, "step": 110840 }, { "epoch": 0.72, "learning_rate": 0.00019268218695340684, "loss": 0.0471, "step": 110850 }, { "epoch": 0.72, "learning_rate": 0.00019267250559904992, "loss": 0.0501, "step": 110860 }, { "epoch": 0.72, "learning_rate": 0.000192662824244693, "loss": 0.0427, "step": 110870 }, { "epoch": 0.72, "learning_rate": 0.00019265314289033605, "loss": 0.0418, "step": 110880 }, { "epoch": 0.72, "learning_rate": 0.00019264346153597913, "loss": 0.0426, "step": 110890 }, { "epoch": 0.72, "learning_rate": 0.00019263378018162218, "loss": 0.0437, "step": 110900 }, { "epoch": 0.72, "learning_rate": 0.00019262409882726524, "loss": 0.0497, "step": 110910 }, { "epoch": 0.72, "learning_rate": 0.00019261441747290832, "loss": 0.0482, "step": 110920 }, { "epoch": 0.72, "learning_rate": 0.0001926047361185514, "loss": 0.051, "step": 110930 }, { "epoch": 0.72, "learning_rate": 0.00019259505476419448, "loss": 0.0467, "step": 110940 }, { "epoch": 0.72, "learning_rate": 0.00019258537340983753, "loss": 0.048, "step": 110950 }, { "epoch": 0.72, "learning_rate": 0.0001925756920554806, "loss": 0.0423, "step": 110960 }, { "epoch": 0.72, "learning_rate": 0.00019256601070112366, "loss": 0.0476, "step": 110970 }, { "epoch": 0.72, "learning_rate": 0.00019255632934676671, "loss": 0.0432, "step": 110980 }, { "epoch": 0.72, "learning_rate": 0.0001925466479924098, "loss": 0.0551, "step": 110990 }, { "epoch": 0.72, "learning_rate": 0.00019253696663805287, "loss": 0.0394, "step": 111000 }, { "epoch": 0.72, "eval_cer": 0.9198192294655971, "eval_loss": 0.029867488890886307, "eval_runtime": 119.9464, "eval_samples_per_second": 16.674, "eval_steps_per_second": 4.169, "step": 111000 }, { "epoch": 0.72, "learning_rate": 0.00019252728528369595, "loss": 0.0482, "step": 111010 }, { "epoch": 0.72, "learning_rate": 0.000192517603929339, "loss": 0.041, "step": 111020 }, { "epoch": 0.72, "learning_rate": 0.00019250792257498209, "loss": 0.0401, "step": 111030 }, { "epoch": 0.72, "learning_rate": 0.00019249824122062514, "loss": 0.0507, "step": 111040 }, { "epoch": 0.72, "learning_rate": 0.0001924885598662682, "loss": 0.0426, "step": 111050 }, { "epoch": 0.72, "learning_rate": 0.00019247887851191127, "loss": 0.0454, "step": 111060 }, { "epoch": 0.72, "learning_rate": 0.00019246919715755435, "loss": 0.0521, "step": 111070 }, { "epoch": 0.72, "learning_rate": 0.0001924595158031974, "loss": 0.0407, "step": 111080 }, { "epoch": 0.72, "learning_rate": 0.00019244983444884048, "loss": 0.044, "step": 111090 }, { "epoch": 0.72, "learning_rate": 0.00019244015309448356, "loss": 0.0473, "step": 111100 }, { "epoch": 0.72, "learning_rate": 0.0001924304717401266, "loss": 0.0464, "step": 111110 }, { "epoch": 0.72, "learning_rate": 0.00019242079038576967, "loss": 0.0527, "step": 111120 }, { "epoch": 0.72, "learning_rate": 0.00019241110903141275, "loss": 0.0479, "step": 111130 }, { "epoch": 0.72, "learning_rate": 0.00019240142767705583, "loss": 0.0479, "step": 111140 }, { "epoch": 0.72, "learning_rate": 0.00019239174632269888, "loss": 0.0453, "step": 111150 }, { "epoch": 0.72, "learning_rate": 0.00019238206496834196, "loss": 0.0494, "step": 111160 }, { "epoch": 0.72, "learning_rate": 0.00019237238361398504, "loss": 0.0415, "step": 111170 }, { "epoch": 0.72, "learning_rate": 0.00019236270225962807, "loss": 0.0482, "step": 111180 }, { "epoch": 0.72, "learning_rate": 0.00019235302090527115, "loss": 0.0453, "step": 111190 }, { "epoch": 0.72, "learning_rate": 0.00019234333955091423, "loss": 0.0416, "step": 111200 }, { "epoch": 0.72, "learning_rate": 0.0001923336581965573, "loss": 0.0468, "step": 111210 }, { "epoch": 0.72, "learning_rate": 0.00019232397684220036, "loss": 0.0448, "step": 111220 }, { "epoch": 0.72, "learning_rate": 0.00019231429548784344, "loss": 0.0545, "step": 111230 }, { "epoch": 0.72, "learning_rate": 0.00019230461413348652, "loss": 0.04, "step": 111240 }, { "epoch": 0.72, "learning_rate": 0.00019229493277912954, "loss": 0.044, "step": 111250 }, { "epoch": 0.72, "learning_rate": 0.00019228525142477262, "loss": 0.0456, "step": 111260 }, { "epoch": 0.72, "learning_rate": 0.0001922755700704157, "loss": 0.0393, "step": 111270 }, { "epoch": 0.72, "learning_rate": 0.00019226588871605878, "loss": 0.0394, "step": 111280 }, { "epoch": 0.72, "learning_rate": 0.00019225620736170184, "loss": 0.0564, "step": 111290 }, { "epoch": 0.72, "learning_rate": 0.00019224652600734492, "loss": 0.0453, "step": 111300 }, { "epoch": 0.72, "learning_rate": 0.000192236844652988, "loss": 0.042, "step": 111310 }, { "epoch": 0.72, "learning_rate": 0.00019222716329863102, "loss": 0.0411, "step": 111320 }, { "epoch": 0.72, "learning_rate": 0.0001922174819442741, "loss": 0.0421, "step": 111330 }, { "epoch": 0.72, "learning_rate": 0.00019220780058991718, "loss": 0.0418, "step": 111340 }, { "epoch": 0.72, "learning_rate": 0.00019219811923556023, "loss": 0.046, "step": 111350 }, { "epoch": 0.72, "learning_rate": 0.0001921884378812033, "loss": 0.046, "step": 111360 }, { "epoch": 0.72, "learning_rate": 0.0001921787565268464, "loss": 0.0443, "step": 111370 }, { "epoch": 0.72, "learning_rate": 0.00019216907517248947, "loss": 0.0417, "step": 111380 }, { "epoch": 0.72, "learning_rate": 0.0001921593938181325, "loss": 0.0499, "step": 111390 }, { "epoch": 0.72, "learning_rate": 0.00019214971246377558, "loss": 0.0461, "step": 111400 }, { "epoch": 0.72, "learning_rate": 0.00019214003110941866, "loss": 0.04, "step": 111410 }, { "epoch": 0.72, "learning_rate": 0.0001921303497550617, "loss": 0.0452, "step": 111420 }, { "epoch": 0.72, "learning_rate": 0.0001921206684007048, "loss": 0.0442, "step": 111430 }, { "epoch": 0.72, "learning_rate": 0.00019211098704634787, "loss": 0.0406, "step": 111440 }, { "epoch": 0.72, "learning_rate": 0.00019210130569199095, "loss": 0.043, "step": 111450 }, { "epoch": 0.72, "learning_rate": 0.00019209162433763397, "loss": 0.0434, "step": 111460 }, { "epoch": 0.72, "learning_rate": 0.00019208194298327705, "loss": 0.0499, "step": 111470 }, { "epoch": 0.72, "learning_rate": 0.00019207226162892013, "loss": 0.0451, "step": 111480 }, { "epoch": 0.72, "learning_rate": 0.0001920625802745632, "loss": 0.0395, "step": 111490 }, { "epoch": 0.72, "learning_rate": 0.00019205289892020627, "loss": 0.0427, "step": 111500 }, { "epoch": 0.72, "learning_rate": 0.00019204321756584935, "loss": 0.0431, "step": 111510 }, { "epoch": 0.72, "learning_rate": 0.0001920335362114924, "loss": 0.0497, "step": 111520 }, { "epoch": 0.72, "learning_rate": 0.00019202385485713545, "loss": 0.0433, "step": 111530 }, { "epoch": 0.72, "learning_rate": 0.00019201417350277853, "loss": 0.0469, "step": 111540 }, { "epoch": 0.72, "learning_rate": 0.00019200449214842158, "loss": 0.0428, "step": 111550 }, { "epoch": 0.72, "learning_rate": 0.00019199481079406466, "loss": 0.0448, "step": 111560 }, { "epoch": 0.72, "learning_rate": 0.00019198512943970774, "loss": 0.0434, "step": 111570 }, { "epoch": 0.72, "learning_rate": 0.00019197544808535082, "loss": 0.0435, "step": 111580 }, { "epoch": 0.72, "learning_rate": 0.00019196576673099388, "loss": 0.0423, "step": 111590 }, { "epoch": 0.72, "learning_rate": 0.00019195608537663693, "loss": 0.049, "step": 111600 }, { "epoch": 0.72, "learning_rate": 0.00019194640402228, "loss": 0.0428, "step": 111610 }, { "epoch": 0.72, "learning_rate": 0.00019193672266792306, "loss": 0.0417, "step": 111620 }, { "epoch": 0.72, "learning_rate": 0.00019192704131356614, "loss": 0.0598, "step": 111630 }, { "epoch": 0.72, "learning_rate": 0.00019191735995920922, "loss": 0.0422, "step": 111640 }, { "epoch": 0.72, "learning_rate": 0.0001919076786048523, "loss": 0.0484, "step": 111650 }, { "epoch": 0.72, "learning_rate": 0.00019189799725049535, "loss": 0.0389, "step": 111660 }, { "epoch": 0.72, "learning_rate": 0.0001918883158961384, "loss": 0.0385, "step": 111670 }, { "epoch": 0.72, "learning_rate": 0.00019187863454178149, "loss": 0.0472, "step": 111680 }, { "epoch": 0.72, "learning_rate": 0.00019186895318742454, "loss": 0.0393, "step": 111690 }, { "epoch": 0.72, "learning_rate": 0.00019185927183306762, "loss": 0.0452, "step": 111700 }, { "epoch": 0.72, "learning_rate": 0.0001918495904787107, "loss": 0.0441, "step": 111710 }, { "epoch": 0.72, "learning_rate": 0.00019183990912435375, "loss": 0.0437, "step": 111720 }, { "epoch": 0.72, "learning_rate": 0.00019183022776999683, "loss": 0.04, "step": 111730 }, { "epoch": 0.72, "learning_rate": 0.00019182054641563988, "loss": 0.0408, "step": 111740 }, { "epoch": 0.72, "learning_rate": 0.00019181086506128294, "loss": 0.0435, "step": 111750 }, { "epoch": 0.72, "learning_rate": 0.00019180118370692602, "loss": 0.04, "step": 111760 }, { "epoch": 0.72, "learning_rate": 0.0001917915023525691, "loss": 0.0442, "step": 111770 }, { "epoch": 0.72, "learning_rate": 0.00019178182099821218, "loss": 0.0456, "step": 111780 }, { "epoch": 0.72, "learning_rate": 0.00019177213964385523, "loss": 0.0445, "step": 111790 }, { "epoch": 0.72, "learning_rate": 0.0001917624582894983, "loss": 0.0428, "step": 111800 }, { "epoch": 0.72, "learning_rate": 0.00019175277693514136, "loss": 0.0394, "step": 111810 }, { "epoch": 0.72, "learning_rate": 0.00019174309558078441, "loss": 0.0453, "step": 111820 }, { "epoch": 0.72, "learning_rate": 0.0001917334142264275, "loss": 0.0555, "step": 111830 }, { "epoch": 0.72, "learning_rate": 0.00019172373287207057, "loss": 0.0481, "step": 111840 }, { "epoch": 0.72, "learning_rate": 0.00019171405151771365, "loss": 0.0483, "step": 111850 }, { "epoch": 0.72, "learning_rate": 0.0001917043701633567, "loss": 0.0435, "step": 111860 }, { "epoch": 0.72, "learning_rate": 0.00019169468880899979, "loss": 0.0461, "step": 111870 }, { "epoch": 0.72, "learning_rate": 0.00019168500745464284, "loss": 0.0487, "step": 111880 }, { "epoch": 0.72, "learning_rate": 0.0001916753261002859, "loss": 0.0439, "step": 111890 }, { "epoch": 0.72, "learning_rate": 0.00019166564474592897, "loss": 0.0557, "step": 111900 }, { "epoch": 0.72, "learning_rate": 0.00019165596339157205, "loss": 0.0461, "step": 111910 }, { "epoch": 0.72, "learning_rate": 0.0001916462820372151, "loss": 0.0546, "step": 111920 }, { "epoch": 0.72, "learning_rate": 0.00019163660068285818, "loss": 0.0468, "step": 111930 }, { "epoch": 0.72, "learning_rate": 0.00019162691932850126, "loss": 0.0425, "step": 111940 }, { "epoch": 0.72, "learning_rate": 0.0001916172379741443, "loss": 0.0417, "step": 111950 }, { "epoch": 0.72, "learning_rate": 0.00019160755661978737, "loss": 0.0421, "step": 111960 }, { "epoch": 0.72, "learning_rate": 0.00019159787526543045, "loss": 0.0493, "step": 111970 }, { "epoch": 0.72, "learning_rate": 0.00019158819391107353, "loss": 0.0441, "step": 111980 }, { "epoch": 0.72, "learning_rate": 0.00019157851255671658, "loss": 0.0409, "step": 111990 }, { "epoch": 0.72, "learning_rate": 0.00019156883120235966, "loss": 0.0451, "step": 112000 }, { "epoch": 0.72, "eval_cer": 0.9199602304824314, "eval_loss": 0.029715538024902344, "eval_runtime": 120.0538, "eval_samples_per_second": 16.659, "eval_steps_per_second": 4.165, "step": 112000 }, { "epoch": 0.72, "learning_rate": 0.00019155914984800274, "loss": 0.0462, "step": 112010 }, { "epoch": 0.72, "learning_rate": 0.00019154946849364577, "loss": 0.0536, "step": 112020 }, { "epoch": 0.72, "learning_rate": 0.00019153978713928885, "loss": 0.0446, "step": 112030 }, { "epoch": 0.72, "learning_rate": 0.00019153010578493193, "loss": 0.0476, "step": 112040 }, { "epoch": 0.72, "learning_rate": 0.000191520424430575, "loss": 0.0523, "step": 112050 }, { "epoch": 0.72, "learning_rate": 0.00019151074307621806, "loss": 0.045, "step": 112060 }, { "epoch": 0.72, "learning_rate": 0.00019150106172186114, "loss": 0.0439, "step": 112070 }, { "epoch": 0.72, "learning_rate": 0.00019149138036750422, "loss": 0.0482, "step": 112080 }, { "epoch": 0.72, "learning_rate": 0.00019148169901314724, "loss": 0.0447, "step": 112090 }, { "epoch": 0.72, "learning_rate": 0.00019147201765879032, "loss": 0.0439, "step": 112100 }, { "epoch": 0.72, "learning_rate": 0.0001914623363044334, "loss": 0.0449, "step": 112110 }, { "epoch": 0.72, "learning_rate": 0.00019145265495007646, "loss": 0.0432, "step": 112120 }, { "epoch": 0.72, "learning_rate": 0.00019144297359571953, "loss": 0.0432, "step": 112130 }, { "epoch": 0.72, "learning_rate": 0.00019143329224136261, "loss": 0.0442, "step": 112140 }, { "epoch": 0.72, "learning_rate": 0.0001914236108870057, "loss": 0.0463, "step": 112150 }, { "epoch": 0.72, "learning_rate": 0.00019141392953264872, "loss": 0.0494, "step": 112160 }, { "epoch": 0.72, "learning_rate": 0.0001914042481782918, "loss": 0.0464, "step": 112170 }, { "epoch": 0.72, "learning_rate": 0.00019139456682393488, "loss": 0.0424, "step": 112180 }, { "epoch": 0.72, "learning_rate": 0.00019138488546957793, "loss": 0.0448, "step": 112190 }, { "epoch": 0.72, "learning_rate": 0.000191375204115221, "loss": 0.0446, "step": 112200 }, { "epoch": 0.72, "learning_rate": 0.0001913655227608641, "loss": 0.0409, "step": 112210 }, { "epoch": 0.72, "learning_rate": 0.00019135584140650717, "loss": 0.0517, "step": 112220 }, { "epoch": 0.72, "learning_rate": 0.0001913461600521502, "loss": 0.0401, "step": 112230 }, { "epoch": 0.72, "learning_rate": 0.00019133647869779328, "loss": 0.0436, "step": 112240 }, { "epoch": 0.72, "learning_rate": 0.00019132679734343636, "loss": 0.0416, "step": 112250 }, { "epoch": 0.72, "learning_rate": 0.0001913171159890794, "loss": 0.0534, "step": 112260 }, { "epoch": 0.72, "learning_rate": 0.0001913074346347225, "loss": 0.0433, "step": 112270 }, { "epoch": 0.72, "learning_rate": 0.00019129775328036557, "loss": 0.0518, "step": 112280 }, { "epoch": 0.72, "learning_rate": 0.00019128807192600862, "loss": 0.046, "step": 112290 }, { "epoch": 0.72, "learning_rate": 0.00019127839057165167, "loss": 0.0449, "step": 112300 }, { "epoch": 0.72, "learning_rate": 0.00019126870921729475, "loss": 0.0435, "step": 112310 }, { "epoch": 0.72, "learning_rate": 0.0001912590278629378, "loss": 0.0392, "step": 112320 }, { "epoch": 0.73, "learning_rate": 0.0001912493465085809, "loss": 0.0417, "step": 112330 }, { "epoch": 0.73, "learning_rate": 0.00019123966515422397, "loss": 0.0398, "step": 112340 }, { "epoch": 0.73, "learning_rate": 0.00019122998379986705, "loss": 0.0474, "step": 112350 }, { "epoch": 0.73, "learning_rate": 0.0001912203024455101, "loss": 0.0491, "step": 112360 }, { "epoch": 0.73, "learning_rate": 0.00019121062109115315, "loss": 0.039, "step": 112370 }, { "epoch": 0.73, "learning_rate": 0.00019120093973679623, "loss": 0.0477, "step": 112380 }, { "epoch": 0.73, "learning_rate": 0.00019119125838243928, "loss": 0.049, "step": 112390 }, { "epoch": 0.73, "learning_rate": 0.00019118157702808236, "loss": 0.0463, "step": 112400 }, { "epoch": 0.73, "learning_rate": 0.00019117189567372544, "loss": 0.0444, "step": 112410 }, { "epoch": 0.73, "learning_rate": 0.00019116221431936852, "loss": 0.0479, "step": 112420 }, { "epoch": 0.73, "learning_rate": 0.00019115253296501158, "loss": 0.0426, "step": 112430 }, { "epoch": 0.73, "learning_rate": 0.00019114285161065463, "loss": 0.0439, "step": 112440 }, { "epoch": 0.73, "learning_rate": 0.0001911331702562977, "loss": 0.0426, "step": 112450 }, { "epoch": 0.73, "learning_rate": 0.00019112348890194076, "loss": 0.0419, "step": 112460 }, { "epoch": 0.73, "learning_rate": 0.00019111380754758384, "loss": 0.0389, "step": 112470 }, { "epoch": 0.73, "learning_rate": 0.00019110412619322692, "loss": 0.0431, "step": 112480 }, { "epoch": 0.73, "learning_rate": 0.00019109444483886997, "loss": 0.0423, "step": 112490 }, { "epoch": 0.73, "learning_rate": 0.00019108476348451305, "loss": 0.0494, "step": 112500 }, { "epoch": 0.73, "learning_rate": 0.0001910750821301561, "loss": 0.0417, "step": 112510 }, { "epoch": 0.73, "learning_rate": 0.00019106540077579916, "loss": 0.0474, "step": 112520 }, { "epoch": 0.73, "learning_rate": 0.00019105571942144224, "loss": 0.0408, "step": 112530 }, { "epoch": 0.73, "learning_rate": 0.00019104603806708532, "loss": 0.0489, "step": 112540 }, { "epoch": 0.73, "learning_rate": 0.0001910363567127284, "loss": 0.0456, "step": 112550 }, { "epoch": 0.73, "learning_rate": 0.00019102667535837145, "loss": 0.0409, "step": 112560 }, { "epoch": 0.73, "learning_rate": 0.00019101699400401453, "loss": 0.0479, "step": 112570 }, { "epoch": 0.73, "learning_rate": 0.00019100731264965758, "loss": 0.0423, "step": 112580 }, { "epoch": 0.73, "learning_rate": 0.00019099763129530064, "loss": 0.0472, "step": 112590 }, { "epoch": 0.73, "learning_rate": 0.00019098794994094372, "loss": 0.0415, "step": 112600 }, { "epoch": 0.73, "learning_rate": 0.0001909782685865868, "loss": 0.0419, "step": 112610 }, { "epoch": 0.73, "learning_rate": 0.00019096858723222988, "loss": 0.0424, "step": 112620 }, { "epoch": 0.73, "learning_rate": 0.00019095890587787293, "loss": 0.0436, "step": 112630 }, { "epoch": 0.73, "learning_rate": 0.000190949224523516, "loss": 0.0462, "step": 112640 }, { "epoch": 0.73, "learning_rate": 0.00019093954316915906, "loss": 0.0474, "step": 112650 }, { "epoch": 0.73, "learning_rate": 0.0001909298618148021, "loss": 0.0434, "step": 112660 }, { "epoch": 0.73, "learning_rate": 0.0001909201804604452, "loss": 0.0443, "step": 112670 }, { "epoch": 0.73, "learning_rate": 0.00019091049910608827, "loss": 0.0509, "step": 112680 }, { "epoch": 0.73, "learning_rate": 0.00019090081775173133, "loss": 0.047, "step": 112690 }, { "epoch": 0.73, "learning_rate": 0.0001908911363973744, "loss": 0.0544, "step": 112700 }, { "epoch": 0.73, "learning_rate": 0.00019088145504301749, "loss": 0.0463, "step": 112710 }, { "epoch": 0.73, "learning_rate": 0.0001908717736886605, "loss": 0.0474, "step": 112720 }, { "epoch": 0.73, "learning_rate": 0.0001908620923343036, "loss": 0.0454, "step": 112730 }, { "epoch": 0.73, "learning_rate": 0.00019085241097994667, "loss": 0.0431, "step": 112740 }, { "epoch": 0.73, "learning_rate": 0.00019084272962558975, "loss": 0.0498, "step": 112750 }, { "epoch": 0.73, "learning_rate": 0.0001908330482712328, "loss": 0.0457, "step": 112760 }, { "epoch": 0.73, "learning_rate": 0.00019082336691687588, "loss": 0.0456, "step": 112770 }, { "epoch": 0.73, "learning_rate": 0.00019081368556251896, "loss": 0.0478, "step": 112780 }, { "epoch": 0.73, "learning_rate": 0.000190804004208162, "loss": 0.0431, "step": 112790 }, { "epoch": 0.73, "learning_rate": 0.00019079432285380507, "loss": 0.0408, "step": 112800 }, { "epoch": 0.73, "learning_rate": 0.00019078464149944815, "loss": 0.043, "step": 112810 }, { "epoch": 0.73, "learning_rate": 0.00019077496014509123, "loss": 0.0449, "step": 112820 }, { "epoch": 0.73, "learning_rate": 0.00019076527879073428, "loss": 0.0409, "step": 112830 }, { "epoch": 0.73, "learning_rate": 0.00019075559743637736, "loss": 0.0495, "step": 112840 }, { "epoch": 0.73, "learning_rate": 0.00019074591608202044, "loss": 0.0418, "step": 112850 }, { "epoch": 0.73, "learning_rate": 0.00019073623472766347, "loss": 0.0437, "step": 112860 }, { "epoch": 0.73, "learning_rate": 0.00019072655337330655, "loss": 0.0569, "step": 112870 }, { "epoch": 0.73, "learning_rate": 0.00019071687201894962, "loss": 0.0431, "step": 112880 }, { "epoch": 0.73, "learning_rate": 0.00019070719066459268, "loss": 0.0464, "step": 112890 }, { "epoch": 0.73, "learning_rate": 0.00019069750931023576, "loss": 0.048, "step": 112900 }, { "epoch": 0.73, "learning_rate": 0.00019068782795587884, "loss": 0.0527, "step": 112910 }, { "epoch": 0.73, "learning_rate": 0.00019067814660152192, "loss": 0.0505, "step": 112920 }, { "epoch": 0.73, "learning_rate": 0.00019066846524716494, "loss": 0.0491, "step": 112930 }, { "epoch": 0.73, "learning_rate": 0.00019065878389280802, "loss": 0.0478, "step": 112940 }, { "epoch": 0.73, "learning_rate": 0.0001906491025384511, "loss": 0.0469, "step": 112950 }, { "epoch": 0.73, "learning_rate": 0.00019063942118409415, "loss": 0.0416, "step": 112960 }, { "epoch": 0.73, "learning_rate": 0.00019062973982973723, "loss": 0.0427, "step": 112970 }, { "epoch": 0.73, "learning_rate": 0.00019062005847538031, "loss": 0.0413, "step": 112980 }, { "epoch": 0.73, "learning_rate": 0.0001906103771210234, "loss": 0.049, "step": 112990 }, { "epoch": 0.73, "learning_rate": 0.00019060069576666642, "loss": 0.0413, "step": 113000 }, { "epoch": 0.73, "eval_cer": 0.9199014800587504, "eval_loss": 0.02950255572795868, "eval_runtime": 119.9456, "eval_samples_per_second": 16.674, "eval_steps_per_second": 4.169, "step": 113000 }, { "epoch": 0.73, "learning_rate": 0.0001905910144123095, "loss": 0.0461, "step": 113010 }, { "epoch": 0.73, "learning_rate": 0.00019058133305795258, "loss": 0.0446, "step": 113020 }, { "epoch": 0.73, "learning_rate": 0.00019057165170359563, "loss": 0.0394, "step": 113030 }, { "epoch": 0.73, "learning_rate": 0.0001905619703492387, "loss": 0.0436, "step": 113040 }, { "epoch": 0.73, "learning_rate": 0.0001905522889948818, "loss": 0.0434, "step": 113050 }, { "epoch": 0.73, "learning_rate": 0.00019054260764052487, "loss": 0.0493, "step": 113060 }, { "epoch": 0.73, "learning_rate": 0.0001905329262861679, "loss": 0.0428, "step": 113070 }, { "epoch": 0.73, "learning_rate": 0.00019052324493181098, "loss": 0.0406, "step": 113080 }, { "epoch": 0.73, "learning_rate": 0.00019051356357745403, "loss": 0.0519, "step": 113090 }, { "epoch": 0.73, "learning_rate": 0.0001905038822230971, "loss": 0.0481, "step": 113100 }, { "epoch": 0.73, "learning_rate": 0.0001904942008687402, "loss": 0.0429, "step": 113110 }, { "epoch": 0.73, "learning_rate": 0.00019048451951438327, "loss": 0.0403, "step": 113120 }, { "epoch": 0.73, "learning_rate": 0.00019047483816002632, "loss": 0.0461, "step": 113130 }, { "epoch": 0.73, "learning_rate": 0.00019046515680566937, "loss": 0.0431, "step": 113140 }, { "epoch": 0.73, "learning_rate": 0.00019045547545131245, "loss": 0.052, "step": 113150 }, { "epoch": 0.73, "learning_rate": 0.0001904457940969555, "loss": 0.0483, "step": 113160 }, { "epoch": 0.73, "learning_rate": 0.00019043611274259859, "loss": 0.0449, "step": 113170 }, { "epoch": 0.73, "learning_rate": 0.00019042643138824167, "loss": 0.0469, "step": 113180 }, { "epoch": 0.73, "learning_rate": 0.00019041675003388475, "loss": 0.0405, "step": 113190 }, { "epoch": 0.73, "learning_rate": 0.0001904070686795278, "loss": 0.0426, "step": 113200 }, { "epoch": 0.73, "learning_rate": 0.00019039738732517085, "loss": 0.0412, "step": 113210 }, { "epoch": 0.73, "learning_rate": 0.00019038770597081393, "loss": 0.0488, "step": 113220 }, { "epoch": 0.73, "learning_rate": 0.00019037802461645698, "loss": 0.0483, "step": 113230 }, { "epoch": 0.73, "learning_rate": 0.00019036834326210006, "loss": 0.0421, "step": 113240 }, { "epoch": 0.73, "learning_rate": 0.00019035866190774314, "loss": 0.0421, "step": 113250 }, { "epoch": 0.73, "learning_rate": 0.00019034898055338622, "loss": 0.0416, "step": 113260 }, { "epoch": 0.73, "learning_rate": 0.00019033929919902928, "loss": 0.0399, "step": 113270 }, { "epoch": 0.73, "learning_rate": 0.00019032961784467233, "loss": 0.0455, "step": 113280 }, { "epoch": 0.73, "learning_rate": 0.00019031993649031538, "loss": 0.0448, "step": 113290 }, { "epoch": 0.73, "learning_rate": 0.00019031025513595846, "loss": 0.0431, "step": 113300 }, { "epoch": 0.73, "learning_rate": 0.00019030057378160154, "loss": 0.0416, "step": 113310 }, { "epoch": 0.73, "learning_rate": 0.00019029089242724462, "loss": 0.0463, "step": 113320 }, { "epoch": 0.73, "learning_rate": 0.00019028121107288767, "loss": 0.0501, "step": 113330 }, { "epoch": 0.73, "learning_rate": 0.00019027152971853075, "loss": 0.0403, "step": 113340 }, { "epoch": 0.73, "learning_rate": 0.0001902618483641738, "loss": 0.0465, "step": 113350 }, { "epoch": 0.73, "learning_rate": 0.00019025216700981686, "loss": 0.0416, "step": 113360 }, { "epoch": 0.73, "learning_rate": 0.00019024248565545994, "loss": 0.0438, "step": 113370 }, { "epoch": 0.73, "learning_rate": 0.00019023280430110302, "loss": 0.051, "step": 113380 }, { "epoch": 0.73, "learning_rate": 0.0001902231229467461, "loss": 0.0412, "step": 113390 }, { "epoch": 0.73, "learning_rate": 0.00019021344159238915, "loss": 0.0448, "step": 113400 }, { "epoch": 0.73, "learning_rate": 0.00019020376023803223, "loss": 0.0447, "step": 113410 }, { "epoch": 0.73, "learning_rate": 0.00019019407888367528, "loss": 0.0407, "step": 113420 }, { "epoch": 0.73, "learning_rate": 0.00019018439752931834, "loss": 0.043, "step": 113430 }, { "epoch": 0.73, "learning_rate": 0.00019017471617496142, "loss": 0.0373, "step": 113440 }, { "epoch": 0.73, "learning_rate": 0.0001901650348206045, "loss": 0.0446, "step": 113450 }, { "epoch": 0.73, "learning_rate": 0.00019015535346624758, "loss": 0.0412, "step": 113460 }, { "epoch": 0.73, "learning_rate": 0.00019014567211189063, "loss": 0.0451, "step": 113470 }, { "epoch": 0.73, "learning_rate": 0.0001901359907575337, "loss": 0.0383, "step": 113480 }, { "epoch": 0.73, "learning_rate": 0.00019012630940317673, "loss": 0.0376, "step": 113490 }, { "epoch": 0.73, "learning_rate": 0.0001901166280488198, "loss": 0.0385, "step": 113500 }, { "epoch": 0.73, "learning_rate": 0.0001901069466944629, "loss": 0.0401, "step": 113510 }, { "epoch": 0.73, "learning_rate": 0.00019009726534010597, "loss": 0.0406, "step": 113520 }, { "epoch": 0.73, "learning_rate": 0.00019008758398574903, "loss": 0.0491, "step": 113530 }, { "epoch": 0.73, "learning_rate": 0.0001900779026313921, "loss": 0.0417, "step": 113540 }, { "epoch": 0.73, "learning_rate": 0.00019006822127703518, "loss": 0.0382, "step": 113550 }, { "epoch": 0.73, "learning_rate": 0.0001900585399226782, "loss": 0.0489, "step": 113560 }, { "epoch": 0.73, "learning_rate": 0.0001900488585683213, "loss": 0.0379, "step": 113570 }, { "epoch": 0.73, "learning_rate": 0.00019003917721396437, "loss": 0.0403, "step": 113580 }, { "epoch": 0.73, "learning_rate": 0.00019002949585960745, "loss": 0.0394, "step": 113590 }, { "epoch": 0.73, "learning_rate": 0.0001900198145052505, "loss": 0.043, "step": 113600 }, { "epoch": 0.73, "learning_rate": 0.00019001013315089358, "loss": 0.0554, "step": 113610 }, { "epoch": 0.73, "learning_rate": 0.00019000045179653666, "loss": 0.0467, "step": 113620 }, { "epoch": 0.73, "learning_rate": 0.0001899907704421797, "loss": 0.0468, "step": 113630 }, { "epoch": 0.73, "learning_rate": 0.00018998108908782277, "loss": 0.0505, "step": 113640 }, { "epoch": 0.73, "learning_rate": 0.00018997140773346585, "loss": 0.0403, "step": 113650 }, { "epoch": 0.73, "learning_rate": 0.00018996172637910893, "loss": 0.041, "step": 113660 }, { "epoch": 0.73, "learning_rate": 0.00018995204502475198, "loss": 0.0463, "step": 113670 }, { "epoch": 0.73, "learning_rate": 0.00018994236367039506, "loss": 0.0495, "step": 113680 }, { "epoch": 0.73, "learning_rate": 0.00018993268231603809, "loss": 0.0407, "step": 113690 }, { "epoch": 0.73, "learning_rate": 0.00018992300096168116, "loss": 0.0423, "step": 113700 }, { "epoch": 0.73, "learning_rate": 0.00018991331960732424, "loss": 0.0434, "step": 113710 }, { "epoch": 0.73, "learning_rate": 0.00018990363825296732, "loss": 0.0444, "step": 113720 }, { "epoch": 0.73, "learning_rate": 0.00018989395689861038, "loss": 0.0476, "step": 113730 }, { "epoch": 0.73, "learning_rate": 0.00018988427554425346, "loss": 0.0462, "step": 113740 }, { "epoch": 0.73, "learning_rate": 0.00018987459418989654, "loss": 0.0426, "step": 113750 }, { "epoch": 0.73, "learning_rate": 0.00018986491283553956, "loss": 0.0457, "step": 113760 }, { "epoch": 0.73, "learning_rate": 0.00018985523148118264, "loss": 0.0472, "step": 113770 }, { "epoch": 0.73, "learning_rate": 0.00018984555012682572, "loss": 0.0495, "step": 113780 }, { "epoch": 0.73, "learning_rate": 0.0001898358687724688, "loss": 0.0497, "step": 113790 }, { "epoch": 0.73, "learning_rate": 0.00018982618741811185, "loss": 0.0449, "step": 113800 }, { "epoch": 0.73, "learning_rate": 0.00018981650606375493, "loss": 0.0418, "step": 113810 }, { "epoch": 0.73, "learning_rate": 0.00018980682470939801, "loss": 0.0524, "step": 113820 }, { "epoch": 0.73, "learning_rate": 0.00018979714335504104, "loss": 0.046, "step": 113830 }, { "epoch": 0.73, "learning_rate": 0.00018978746200068412, "loss": 0.0441, "step": 113840 }, { "epoch": 0.73, "learning_rate": 0.0001897777806463272, "loss": 0.0424, "step": 113850 }, { "epoch": 0.73, "learning_rate": 0.00018976809929197028, "loss": 0.0403, "step": 113860 }, { "epoch": 0.73, "learning_rate": 0.00018975841793761333, "loss": 0.0441, "step": 113870 }, { "epoch": 0.74, "learning_rate": 0.0001897487365832564, "loss": 0.0366, "step": 113880 }, { "epoch": 0.74, "learning_rate": 0.0001897390552288995, "loss": 0.041, "step": 113890 }, { "epoch": 0.74, "learning_rate": 0.00018972937387454252, "loss": 0.0433, "step": 113900 }, { "epoch": 0.74, "learning_rate": 0.0001897196925201856, "loss": 0.0511, "step": 113910 }, { "epoch": 0.74, "learning_rate": 0.00018971001116582868, "loss": 0.042, "step": 113920 }, { "epoch": 0.74, "learning_rate": 0.00018970032981147173, "loss": 0.0406, "step": 113930 }, { "epoch": 0.74, "learning_rate": 0.0001896906484571148, "loss": 0.0406, "step": 113940 }, { "epoch": 0.74, "learning_rate": 0.0001896809671027579, "loss": 0.0443, "step": 113950 }, { "epoch": 0.74, "learning_rate": 0.00018967128574840097, "loss": 0.0384, "step": 113960 }, { "epoch": 0.74, "learning_rate": 0.000189661604394044, "loss": 0.0426, "step": 113970 }, { "epoch": 0.74, "learning_rate": 0.00018965192303968707, "loss": 0.0432, "step": 113980 }, { "epoch": 0.74, "learning_rate": 0.00018964224168533015, "loss": 0.0369, "step": 113990 }, { "epoch": 0.74, "learning_rate": 0.0001896325603309732, "loss": 0.0461, "step": 114000 }, { "epoch": 0.74, "eval_cer": 0.919810190938877, "eval_loss": 0.030083321034908295, "eval_runtime": 119.8896, "eval_samples_per_second": 16.682, "eval_steps_per_second": 4.171, "step": 114000 }, { "epoch": 0.74, "learning_rate": 0.00018962287897661629, "loss": 0.043, "step": 114010 }, { "epoch": 0.74, "learning_rate": 0.00018961319762225937, "loss": 0.047, "step": 114020 }, { "epoch": 0.74, "learning_rate": 0.00018960351626790245, "loss": 0.0419, "step": 114030 }, { "epoch": 0.74, "learning_rate": 0.00018959383491354547, "loss": 0.0448, "step": 114040 }, { "epoch": 0.74, "learning_rate": 0.00018958415355918855, "loss": 0.0412, "step": 114050 }, { "epoch": 0.74, "learning_rate": 0.00018957447220483163, "loss": 0.0393, "step": 114060 }, { "epoch": 0.74, "learning_rate": 0.00018956479085047468, "loss": 0.0463, "step": 114070 }, { "epoch": 0.74, "learning_rate": 0.00018955510949611776, "loss": 0.0368, "step": 114080 }, { "epoch": 0.74, "learning_rate": 0.00018954542814176084, "loss": 0.0632, "step": 114090 }, { "epoch": 0.74, "learning_rate": 0.0001895357467874039, "loss": 0.0382, "step": 114100 }, { "epoch": 0.74, "learning_rate": 0.00018952606543304695, "loss": 0.0487, "step": 114110 }, { "epoch": 0.74, "learning_rate": 0.00018951638407869003, "loss": 0.0396, "step": 114120 }, { "epoch": 0.74, "learning_rate": 0.00018950670272433308, "loss": 0.0452, "step": 114130 }, { "epoch": 0.74, "learning_rate": 0.00018949702136997616, "loss": 0.0442, "step": 114140 }, { "epoch": 0.74, "learning_rate": 0.00018948734001561924, "loss": 0.0398, "step": 114150 }, { "epoch": 0.74, "learning_rate": 0.00018947765866126232, "loss": 0.0459, "step": 114160 }, { "epoch": 0.74, "learning_rate": 0.00018946797730690537, "loss": 0.0428, "step": 114170 }, { "epoch": 0.74, "learning_rate": 0.00018945829595254843, "loss": 0.0535, "step": 114180 }, { "epoch": 0.74, "learning_rate": 0.0001894486145981915, "loss": 0.0451, "step": 114190 }, { "epoch": 0.74, "learning_rate": 0.00018943893324383456, "loss": 0.0481, "step": 114200 }, { "epoch": 0.74, "learning_rate": 0.00018942925188947764, "loss": 0.0446, "step": 114210 }, { "epoch": 0.74, "learning_rate": 0.00018941957053512072, "loss": 0.0477, "step": 114220 }, { "epoch": 0.74, "learning_rate": 0.0001894098891807638, "loss": 0.0409, "step": 114230 }, { "epoch": 0.74, "learning_rate": 0.00018940020782640685, "loss": 0.0461, "step": 114240 }, { "epoch": 0.74, "learning_rate": 0.0001893905264720499, "loss": 0.0428, "step": 114250 }, { "epoch": 0.74, "learning_rate": 0.00018938084511769298, "loss": 0.0426, "step": 114260 }, { "epoch": 0.74, "learning_rate": 0.00018937116376333604, "loss": 0.0399, "step": 114270 }, { "epoch": 0.74, "learning_rate": 0.00018936148240897912, "loss": 0.0461, "step": 114280 }, { "epoch": 0.74, "learning_rate": 0.0001893518010546222, "loss": 0.049, "step": 114290 }, { "epoch": 0.74, "learning_rate": 0.00018934211970026525, "loss": 0.0514, "step": 114300 }, { "epoch": 0.74, "learning_rate": 0.00018933243834590833, "loss": 0.0391, "step": 114310 }, { "epoch": 0.74, "learning_rate": 0.00018932275699155138, "loss": 0.0509, "step": 114320 }, { "epoch": 0.74, "learning_rate": 0.00018931307563719443, "loss": 0.0451, "step": 114330 }, { "epoch": 0.74, "learning_rate": 0.0001893033942828375, "loss": 0.0438, "step": 114340 }, { "epoch": 0.74, "learning_rate": 0.0001892937129284806, "loss": 0.0445, "step": 114350 }, { "epoch": 0.74, "learning_rate": 0.00018928403157412367, "loss": 0.0493, "step": 114360 }, { "epoch": 0.74, "learning_rate": 0.00018927435021976672, "loss": 0.0483, "step": 114370 }, { "epoch": 0.74, "learning_rate": 0.0001892646688654098, "loss": 0.0398, "step": 114380 }, { "epoch": 0.74, "learning_rate": 0.00018925498751105286, "loss": 0.0444, "step": 114390 }, { "epoch": 0.74, "learning_rate": 0.0001892453061566959, "loss": 0.0422, "step": 114400 }, { "epoch": 0.74, "learning_rate": 0.000189235624802339, "loss": 0.0403, "step": 114410 }, { "epoch": 0.74, "learning_rate": 0.00018922594344798207, "loss": 0.0392, "step": 114420 }, { "epoch": 0.74, "learning_rate": 0.00018921626209362515, "loss": 0.0517, "step": 114430 }, { "epoch": 0.74, "learning_rate": 0.0001892065807392682, "loss": 0.045, "step": 114440 }, { "epoch": 0.74, "learning_rate": 0.00018919689938491128, "loss": 0.0538, "step": 114450 }, { "epoch": 0.74, "learning_rate": 0.00018918721803055433, "loss": 0.0467, "step": 114460 }, { "epoch": 0.74, "learning_rate": 0.0001891775366761974, "loss": 0.0509, "step": 114470 }, { "epoch": 0.74, "learning_rate": 0.00018916785532184047, "loss": 0.0479, "step": 114480 }, { "epoch": 0.74, "learning_rate": 0.00018915817396748355, "loss": 0.0428, "step": 114490 }, { "epoch": 0.74, "learning_rate": 0.0001891484926131266, "loss": 0.0495, "step": 114500 }, { "epoch": 0.74, "learning_rate": 0.00018913881125876968, "loss": 0.0413, "step": 114510 }, { "epoch": 0.74, "learning_rate": 0.00018912912990441276, "loss": 0.0413, "step": 114520 }, { "epoch": 0.74, "learning_rate": 0.00018911944855005578, "loss": 0.0484, "step": 114530 }, { "epoch": 0.74, "learning_rate": 0.00018910976719569886, "loss": 0.0516, "step": 114540 }, { "epoch": 0.74, "learning_rate": 0.00018910008584134194, "loss": 0.0468, "step": 114550 }, { "epoch": 0.74, "learning_rate": 0.00018909040448698502, "loss": 0.045, "step": 114560 }, { "epoch": 0.74, "learning_rate": 0.00018908072313262808, "loss": 0.043, "step": 114570 }, { "epoch": 0.74, "learning_rate": 0.00018907104177827116, "loss": 0.0516, "step": 114580 }, { "epoch": 0.74, "learning_rate": 0.00018906136042391424, "loss": 0.0496, "step": 114590 }, { "epoch": 0.74, "learning_rate": 0.00018905167906955726, "loss": 0.0509, "step": 114600 }, { "epoch": 0.74, "learning_rate": 0.00018904199771520034, "loss": 0.046, "step": 114610 }, { "epoch": 0.74, "learning_rate": 0.00018903231636084342, "loss": 0.0445, "step": 114620 }, { "epoch": 0.74, "learning_rate": 0.0001890226350064865, "loss": 0.0404, "step": 114630 }, { "epoch": 0.74, "learning_rate": 0.00018901295365212955, "loss": 0.0417, "step": 114640 }, { "epoch": 0.74, "learning_rate": 0.00018900327229777263, "loss": 0.04, "step": 114650 }, { "epoch": 0.74, "learning_rate": 0.0001889935909434157, "loss": 0.0488, "step": 114660 }, { "epoch": 0.74, "learning_rate": 0.00018898390958905874, "loss": 0.0461, "step": 114670 }, { "epoch": 0.74, "learning_rate": 0.00018897422823470182, "loss": 0.0481, "step": 114680 }, { "epoch": 0.74, "learning_rate": 0.0001889645468803449, "loss": 0.0499, "step": 114690 }, { "epoch": 0.74, "learning_rate": 0.00018895486552598795, "loss": 0.0456, "step": 114700 }, { "epoch": 0.74, "learning_rate": 0.00018894518417163103, "loss": 0.0498, "step": 114710 }, { "epoch": 0.74, "learning_rate": 0.0001889355028172741, "loss": 0.0417, "step": 114720 }, { "epoch": 0.74, "learning_rate": 0.0001889258214629172, "loss": 0.0477, "step": 114730 }, { "epoch": 0.74, "learning_rate": 0.00018891614010856022, "loss": 0.0527, "step": 114740 }, { "epoch": 0.74, "learning_rate": 0.0001889064587542033, "loss": 0.0482, "step": 114750 }, { "epoch": 0.74, "learning_rate": 0.00018889677739984638, "loss": 0.0468, "step": 114760 }, { "epoch": 0.74, "learning_rate": 0.00018888709604548943, "loss": 0.045, "step": 114770 }, { "epoch": 0.74, "learning_rate": 0.0001888774146911325, "loss": 0.0511, "step": 114780 }, { "epoch": 0.74, "learning_rate": 0.0001888677333367756, "loss": 0.0407, "step": 114790 }, { "epoch": 0.74, "learning_rate": 0.00018885805198241867, "loss": 0.0477, "step": 114800 }, { "epoch": 0.74, "learning_rate": 0.0001888483706280617, "loss": 0.0479, "step": 114810 }, { "epoch": 0.74, "learning_rate": 0.00018883868927370477, "loss": 0.0411, "step": 114820 }, { "epoch": 0.74, "learning_rate": 0.00018882900791934785, "loss": 0.0439, "step": 114830 }, { "epoch": 0.74, "learning_rate": 0.0001888193265649909, "loss": 0.0388, "step": 114840 }, { "epoch": 0.74, "learning_rate": 0.00018880964521063399, "loss": 0.0457, "step": 114850 }, { "epoch": 0.74, "learning_rate": 0.00018879996385627707, "loss": 0.0504, "step": 114860 }, { "epoch": 0.74, "learning_rate": 0.00018879028250192012, "loss": 0.0406, "step": 114870 }, { "epoch": 0.74, "learning_rate": 0.00018878060114756317, "loss": 0.0495, "step": 114880 }, { "epoch": 0.74, "learning_rate": 0.00018877091979320625, "loss": 0.0457, "step": 114890 }, { "epoch": 0.74, "learning_rate": 0.0001887612384388493, "loss": 0.0446, "step": 114900 }, { "epoch": 0.74, "learning_rate": 0.00018875155708449238, "loss": 0.0382, "step": 114910 }, { "epoch": 0.74, "learning_rate": 0.00018874187573013546, "loss": 0.0447, "step": 114920 }, { "epoch": 0.74, "learning_rate": 0.00018873219437577854, "loss": 0.0382, "step": 114930 }, { "epoch": 0.74, "learning_rate": 0.0001887225130214216, "loss": 0.0511, "step": 114940 }, { "epoch": 0.74, "learning_rate": 0.00018871283166706465, "loss": 0.0477, "step": 114950 }, { "epoch": 0.74, "learning_rate": 0.00018870315031270773, "loss": 0.0494, "step": 114960 }, { "epoch": 0.74, "learning_rate": 0.00018869346895835078, "loss": 0.0484, "step": 114970 }, { "epoch": 0.74, "learning_rate": 0.00018868378760399386, "loss": 0.0438, "step": 114980 }, { "epoch": 0.74, "learning_rate": 0.00018867410624963694, "loss": 0.0483, "step": 114990 }, { "epoch": 0.74, "learning_rate": 0.00018866442489528002, "loss": 0.0501, "step": 115000 }, { "epoch": 0.74, "eval_cer": 0.9198960569427184, "eval_loss": 0.02958066016435623, "eval_runtime": 119.869, "eval_samples_per_second": 16.685, "eval_steps_per_second": 4.171, "step": 115000 }, { "epoch": 0.74, "learning_rate": 0.00018865474354092307, "loss": 0.0397, "step": 115010 }, { "epoch": 0.74, "learning_rate": 0.00018864506218656613, "loss": 0.0429, "step": 115020 }, { "epoch": 0.74, "learning_rate": 0.0001886353808322092, "loss": 0.0451, "step": 115030 }, { "epoch": 0.74, "learning_rate": 0.00018862569947785226, "loss": 0.0384, "step": 115040 }, { "epoch": 0.74, "learning_rate": 0.00018861601812349534, "loss": 0.0432, "step": 115050 }, { "epoch": 0.74, "learning_rate": 0.00018860633676913842, "loss": 0.0445, "step": 115060 }, { "epoch": 0.74, "learning_rate": 0.00018859665541478147, "loss": 0.0467, "step": 115070 }, { "epoch": 0.74, "learning_rate": 0.00018858697406042455, "loss": 0.04, "step": 115080 }, { "epoch": 0.74, "learning_rate": 0.0001885772927060676, "loss": 0.0439, "step": 115090 }, { "epoch": 0.74, "learning_rate": 0.00018856761135171066, "loss": 0.0527, "step": 115100 }, { "epoch": 0.74, "learning_rate": 0.00018855792999735373, "loss": 0.0473, "step": 115110 }, { "epoch": 0.74, "learning_rate": 0.00018854824864299681, "loss": 0.0397, "step": 115120 }, { "epoch": 0.74, "learning_rate": 0.0001885385672886399, "loss": 0.0505, "step": 115130 }, { "epoch": 0.74, "learning_rate": 0.00018852888593428295, "loss": 0.0391, "step": 115140 }, { "epoch": 0.74, "learning_rate": 0.00018851920457992603, "loss": 0.0433, "step": 115150 }, { "epoch": 0.74, "learning_rate": 0.00018850952322556908, "loss": 0.0507, "step": 115160 }, { "epoch": 0.74, "learning_rate": 0.00018849984187121213, "loss": 0.0483, "step": 115170 }, { "epoch": 0.74, "learning_rate": 0.0001884901605168552, "loss": 0.0472, "step": 115180 }, { "epoch": 0.74, "learning_rate": 0.0001884804791624983, "loss": 0.0446, "step": 115190 }, { "epoch": 0.74, "learning_rate": 0.00018847079780814137, "loss": 0.0463, "step": 115200 }, { "epoch": 0.74, "learning_rate": 0.00018846111645378442, "loss": 0.0422, "step": 115210 }, { "epoch": 0.74, "learning_rate": 0.0001884514350994275, "loss": 0.0499, "step": 115220 }, { "epoch": 0.74, "learning_rate": 0.00018844175374507056, "loss": 0.0483, "step": 115230 }, { "epoch": 0.74, "learning_rate": 0.0001884320723907136, "loss": 0.0414, "step": 115240 }, { "epoch": 0.74, "learning_rate": 0.0001884223910363567, "loss": 0.0419, "step": 115250 }, { "epoch": 0.74, "learning_rate": 0.00018841270968199977, "loss": 0.0492, "step": 115260 }, { "epoch": 0.74, "learning_rate": 0.00018840302832764282, "loss": 0.0414, "step": 115270 }, { "epoch": 0.74, "learning_rate": 0.0001883933469732859, "loss": 0.048, "step": 115280 }, { "epoch": 0.74, "learning_rate": 0.00018838366561892898, "loss": 0.04, "step": 115290 }, { "epoch": 0.74, "learning_rate": 0.000188373984264572, "loss": 0.0416, "step": 115300 }, { "epoch": 0.74, "learning_rate": 0.0001883643029102151, "loss": 0.0432, "step": 115310 }, { "epoch": 0.74, "learning_rate": 0.00018835462155585817, "loss": 0.0421, "step": 115320 }, { "epoch": 0.74, "learning_rate": 0.00018834494020150125, "loss": 0.0477, "step": 115330 }, { "epoch": 0.74, "learning_rate": 0.0001883352588471443, "loss": 0.0457, "step": 115340 }, { "epoch": 0.74, "learning_rate": 0.00018832557749278738, "loss": 0.046, "step": 115350 }, { "epoch": 0.74, "learning_rate": 0.00018831589613843046, "loss": 0.0444, "step": 115360 }, { "epoch": 0.74, "learning_rate": 0.00018830621478407348, "loss": 0.0462, "step": 115370 }, { "epoch": 0.74, "learning_rate": 0.00018829653342971656, "loss": 0.0431, "step": 115380 }, { "epoch": 0.74, "learning_rate": 0.00018828685207535964, "loss": 0.0475, "step": 115390 }, { "epoch": 0.74, "learning_rate": 0.00018827717072100272, "loss": 0.0464, "step": 115400 }, { "epoch": 0.74, "learning_rate": 0.00018826748936664578, "loss": 0.0423, "step": 115410 }, { "epoch": 0.74, "learning_rate": 0.00018825780801228886, "loss": 0.0482, "step": 115420 }, { "epoch": 0.75, "learning_rate": 0.00018824812665793194, "loss": 0.0393, "step": 115430 }, { "epoch": 0.75, "learning_rate": 0.00018823844530357496, "loss": 0.0445, "step": 115440 }, { "epoch": 0.75, "learning_rate": 0.00018822876394921804, "loss": 0.0425, "step": 115450 }, { "epoch": 0.75, "learning_rate": 0.00018821908259486112, "loss": 0.0476, "step": 115460 }, { "epoch": 0.75, "learning_rate": 0.0001882094012405042, "loss": 0.0526, "step": 115470 }, { "epoch": 0.75, "learning_rate": 0.00018819971988614725, "loss": 0.0416, "step": 115480 }, { "epoch": 0.75, "learning_rate": 0.00018819003853179033, "loss": 0.0514, "step": 115490 }, { "epoch": 0.75, "learning_rate": 0.0001881803571774334, "loss": 0.0465, "step": 115500 }, { "epoch": 0.75, "learning_rate": 0.00018817067582307644, "loss": 0.045, "step": 115510 }, { "epoch": 0.75, "learning_rate": 0.00018816099446871952, "loss": 0.0482, "step": 115520 }, { "epoch": 0.75, "learning_rate": 0.0001881513131143626, "loss": 0.0514, "step": 115530 }, { "epoch": 0.75, "learning_rate": 0.00018814163176000565, "loss": 0.0459, "step": 115540 }, { "epoch": 0.75, "learning_rate": 0.00018813195040564873, "loss": 0.0449, "step": 115550 }, { "epoch": 0.75, "learning_rate": 0.0001881222690512918, "loss": 0.043, "step": 115560 }, { "epoch": 0.75, "learning_rate": 0.0001881125876969349, "loss": 0.046, "step": 115570 }, { "epoch": 0.75, "learning_rate": 0.00018810290634257792, "loss": 0.0459, "step": 115580 }, { "epoch": 0.75, "learning_rate": 0.000188093224988221, "loss": 0.0473, "step": 115590 }, { "epoch": 0.75, "learning_rate": 0.00018808354363386408, "loss": 0.0404, "step": 115600 }, { "epoch": 0.75, "learning_rate": 0.00018807386227950713, "loss": 0.0473, "step": 115610 }, { "epoch": 0.75, "learning_rate": 0.0001880641809251502, "loss": 0.0466, "step": 115620 }, { "epoch": 0.75, "learning_rate": 0.0001880544995707933, "loss": 0.0427, "step": 115630 }, { "epoch": 0.75, "learning_rate": 0.00018804481821643637, "loss": 0.0524, "step": 115640 }, { "epoch": 0.75, "learning_rate": 0.0001880351368620794, "loss": 0.0413, "step": 115650 }, { "epoch": 0.75, "learning_rate": 0.00018802545550772247, "loss": 0.0413, "step": 115660 }, { "epoch": 0.75, "learning_rate": 0.00018801577415336555, "loss": 0.0433, "step": 115670 }, { "epoch": 0.75, "learning_rate": 0.0001880060927990086, "loss": 0.0379, "step": 115680 }, { "epoch": 0.75, "learning_rate": 0.00018799641144465169, "loss": 0.0432, "step": 115690 }, { "epoch": 0.75, "learning_rate": 0.00018798673009029477, "loss": 0.0468, "step": 115700 }, { "epoch": 0.75, "learning_rate": 0.00018797704873593782, "loss": 0.0406, "step": 115710 }, { "epoch": 0.75, "learning_rate": 0.00018796736738158087, "loss": 0.0444, "step": 115720 }, { "epoch": 0.75, "learning_rate": 0.00018795768602722395, "loss": 0.0411, "step": 115730 }, { "epoch": 0.75, "learning_rate": 0.000187948004672867, "loss": 0.0423, "step": 115740 }, { "epoch": 0.75, "learning_rate": 0.00018793832331851008, "loss": 0.0471, "step": 115750 }, { "epoch": 0.75, "learning_rate": 0.00018792864196415316, "loss": 0.0498, "step": 115760 }, { "epoch": 0.75, "learning_rate": 0.00018791896060979624, "loss": 0.0404, "step": 115770 }, { "epoch": 0.75, "learning_rate": 0.0001879092792554393, "loss": 0.0396, "step": 115780 }, { "epoch": 0.75, "learning_rate": 0.00018789959790108235, "loss": 0.0469, "step": 115790 }, { "epoch": 0.75, "learning_rate": 0.00018788991654672543, "loss": 0.0474, "step": 115800 }, { "epoch": 0.75, "learning_rate": 0.00018788023519236848, "loss": 0.0468, "step": 115810 }, { "epoch": 0.75, "learning_rate": 0.00018787055383801156, "loss": 0.0456, "step": 115820 }, { "epoch": 0.75, "learning_rate": 0.00018786087248365464, "loss": 0.0463, "step": 115830 }, { "epoch": 0.75, "learning_rate": 0.00018785119112929772, "loss": 0.0398, "step": 115840 }, { "epoch": 0.75, "learning_rate": 0.00018784150977494077, "loss": 0.0417, "step": 115850 }, { "epoch": 0.75, "learning_rate": 0.00018783182842058382, "loss": 0.0508, "step": 115860 }, { "epoch": 0.75, "learning_rate": 0.0001878221470662269, "loss": 0.0364, "step": 115870 }, { "epoch": 0.75, "learning_rate": 0.00018781246571186996, "loss": 0.0465, "step": 115880 }, { "epoch": 0.75, "learning_rate": 0.00018780278435751304, "loss": 0.0414, "step": 115890 }, { "epoch": 0.75, "learning_rate": 0.00018779310300315612, "loss": 0.0414, "step": 115900 }, { "epoch": 0.75, "learning_rate": 0.00018778342164879917, "loss": 0.042, "step": 115910 }, { "epoch": 0.75, "learning_rate": 0.00018777374029444225, "loss": 0.0505, "step": 115920 }, { "epoch": 0.75, "learning_rate": 0.0001877640589400853, "loss": 0.0379, "step": 115930 }, { "epoch": 0.75, "learning_rate": 0.00018775437758572835, "loss": 0.038, "step": 115940 }, { "epoch": 0.75, "learning_rate": 0.00018774469623137143, "loss": 0.0413, "step": 115950 }, { "epoch": 0.75, "learning_rate": 0.00018773501487701451, "loss": 0.04, "step": 115960 }, { "epoch": 0.75, "learning_rate": 0.0001877253335226576, "loss": 0.0433, "step": 115970 }, { "epoch": 0.75, "learning_rate": 0.00018771565216830065, "loss": 0.0449, "step": 115980 }, { "epoch": 0.75, "learning_rate": 0.00018770597081394373, "loss": 0.0453, "step": 115990 }, { "epoch": 0.75, "learning_rate": 0.00018769628945958678, "loss": 0.0387, "step": 116000 }, { "epoch": 0.75, "eval_cer": 0.9199774036831997, "eval_loss": 0.029281143099069595, "eval_runtime": 119.7604, "eval_samples_per_second": 16.7, "eval_steps_per_second": 4.175, "step": 116000 }, { "epoch": 0.75, "learning_rate": 0.00018768660810522983, "loss": 0.0402, "step": 116010 }, { "epoch": 0.75, "learning_rate": 0.0001876769267508729, "loss": 0.045, "step": 116020 }, { "epoch": 0.75, "learning_rate": 0.000187667245396516, "loss": 0.0432, "step": 116030 }, { "epoch": 0.75, "learning_rate": 0.00018765756404215907, "loss": 0.0524, "step": 116040 }, { "epoch": 0.75, "learning_rate": 0.00018764788268780212, "loss": 0.0421, "step": 116050 }, { "epoch": 0.75, "learning_rate": 0.0001876382013334452, "loss": 0.0395, "step": 116060 }, { "epoch": 0.75, "learning_rate": 0.00018762851997908826, "loss": 0.052, "step": 116070 }, { "epoch": 0.75, "learning_rate": 0.0001876188386247313, "loss": 0.0378, "step": 116080 }, { "epoch": 0.75, "learning_rate": 0.0001876091572703744, "loss": 0.0413, "step": 116090 }, { "epoch": 0.75, "learning_rate": 0.00018759947591601747, "loss": 0.0499, "step": 116100 }, { "epoch": 0.75, "learning_rate": 0.00018758979456166052, "loss": 0.0428, "step": 116110 }, { "epoch": 0.75, "learning_rate": 0.0001875801132073036, "loss": 0.044, "step": 116120 }, { "epoch": 0.75, "learning_rate": 0.00018757043185294668, "loss": 0.0529, "step": 116130 }, { "epoch": 0.75, "learning_rate": 0.0001875607504985897, "loss": 0.0461, "step": 116140 }, { "epoch": 0.75, "learning_rate": 0.0001875510691442328, "loss": 0.0361, "step": 116150 }, { "epoch": 0.75, "learning_rate": 0.00018754138778987587, "loss": 0.0396, "step": 116160 }, { "epoch": 0.75, "learning_rate": 0.00018753170643551895, "loss": 0.0433, "step": 116170 }, { "epoch": 0.75, "learning_rate": 0.000187522025081162, "loss": 0.0437, "step": 116180 }, { "epoch": 0.75, "learning_rate": 0.00018751234372680508, "loss": 0.0519, "step": 116190 }, { "epoch": 0.75, "learning_rate": 0.00018750266237244816, "loss": 0.0477, "step": 116200 }, { "epoch": 0.75, "learning_rate": 0.00018749298101809118, "loss": 0.0389, "step": 116210 }, { "epoch": 0.75, "learning_rate": 0.00018748329966373426, "loss": 0.048, "step": 116220 }, { "epoch": 0.75, "learning_rate": 0.00018747361830937734, "loss": 0.0411, "step": 116230 }, { "epoch": 0.75, "learning_rate": 0.00018746393695502042, "loss": 0.049, "step": 116240 }, { "epoch": 0.75, "learning_rate": 0.00018745425560066348, "loss": 0.0421, "step": 116250 }, { "epoch": 0.75, "learning_rate": 0.00018744457424630656, "loss": 0.0441, "step": 116260 }, { "epoch": 0.75, "learning_rate": 0.00018743489289194964, "loss": 0.043, "step": 116270 }, { "epoch": 0.75, "learning_rate": 0.00018742521153759266, "loss": 0.0435, "step": 116280 }, { "epoch": 0.75, "learning_rate": 0.00018741553018323574, "loss": 0.0413, "step": 116290 }, { "epoch": 0.75, "learning_rate": 0.00018740584882887882, "loss": 0.0423, "step": 116300 }, { "epoch": 0.75, "learning_rate": 0.00018739616747452187, "loss": 0.0456, "step": 116310 }, { "epoch": 0.75, "learning_rate": 0.00018738648612016495, "loss": 0.0456, "step": 116320 }, { "epoch": 0.75, "learning_rate": 0.00018737680476580803, "loss": 0.0479, "step": 116330 }, { "epoch": 0.75, "learning_rate": 0.0001873671234114511, "loss": 0.0504, "step": 116340 }, { "epoch": 0.75, "learning_rate": 0.00018735744205709414, "loss": 0.0391, "step": 116350 }, { "epoch": 0.75, "learning_rate": 0.00018734776070273722, "loss": 0.0438, "step": 116360 }, { "epoch": 0.75, "learning_rate": 0.0001873380793483803, "loss": 0.0468, "step": 116370 }, { "epoch": 0.75, "learning_rate": 0.00018732839799402335, "loss": 0.0447, "step": 116380 }, { "epoch": 0.75, "learning_rate": 0.00018731871663966643, "loss": 0.0428, "step": 116390 }, { "epoch": 0.75, "learning_rate": 0.0001873090352853095, "loss": 0.0439, "step": 116400 }, { "epoch": 0.75, "learning_rate": 0.0001872993539309526, "loss": 0.0468, "step": 116410 }, { "epoch": 0.75, "learning_rate": 0.00018728967257659562, "loss": 0.0399, "step": 116420 }, { "epoch": 0.75, "learning_rate": 0.0001872799912222387, "loss": 0.0414, "step": 116430 }, { "epoch": 0.75, "learning_rate": 0.00018727030986788178, "loss": 0.0476, "step": 116440 }, { "epoch": 0.75, "learning_rate": 0.00018726062851352483, "loss": 0.0436, "step": 116450 }, { "epoch": 0.75, "learning_rate": 0.0001872509471591679, "loss": 0.0384, "step": 116460 }, { "epoch": 0.75, "learning_rate": 0.000187241265804811, "loss": 0.0354, "step": 116470 }, { "epoch": 0.75, "learning_rate": 0.00018723158445045404, "loss": 0.0459, "step": 116480 }, { "epoch": 0.75, "learning_rate": 0.0001872219030960971, "loss": 0.046, "step": 116490 }, { "epoch": 0.75, "learning_rate": 0.00018721222174174017, "loss": 0.0444, "step": 116500 }, { "epoch": 0.75, "learning_rate": 0.00018720254038738323, "loss": 0.0393, "step": 116510 }, { "epoch": 0.75, "learning_rate": 0.0001871928590330263, "loss": 0.0445, "step": 116520 }, { "epoch": 0.75, "learning_rate": 0.00018718317767866938, "loss": 0.0433, "step": 116530 }, { "epoch": 0.75, "learning_rate": 0.00018717349632431246, "loss": 0.042, "step": 116540 }, { "epoch": 0.75, "learning_rate": 0.00018716381496995552, "loss": 0.0393, "step": 116550 }, { "epoch": 0.75, "learning_rate": 0.00018715413361559857, "loss": 0.0366, "step": 116560 }, { "epoch": 0.75, "learning_rate": 0.00018714445226124165, "loss": 0.0467, "step": 116570 }, { "epoch": 0.75, "learning_rate": 0.0001871347709068847, "loss": 0.0381, "step": 116580 }, { "epoch": 0.75, "learning_rate": 0.00018712508955252778, "loss": 0.0444, "step": 116590 }, { "epoch": 0.75, "learning_rate": 0.00018711540819817086, "loss": 0.0478, "step": 116600 }, { "epoch": 0.75, "learning_rate": 0.00018710572684381394, "loss": 0.0406, "step": 116610 }, { "epoch": 0.75, "learning_rate": 0.000187096045489457, "loss": 0.0491, "step": 116620 }, { "epoch": 0.75, "learning_rate": 0.00018708636413510005, "loss": 0.0446, "step": 116630 }, { "epoch": 0.75, "learning_rate": 0.00018707668278074313, "loss": 0.037, "step": 116640 }, { "epoch": 0.75, "learning_rate": 0.00018706700142638618, "loss": 0.0441, "step": 116650 }, { "epoch": 0.75, "learning_rate": 0.00018705732007202926, "loss": 0.0381, "step": 116660 }, { "epoch": 0.75, "learning_rate": 0.00018704763871767234, "loss": 0.0453, "step": 116670 }, { "epoch": 0.75, "learning_rate": 0.0001870379573633154, "loss": 0.0459, "step": 116680 }, { "epoch": 0.75, "learning_rate": 0.00018702827600895847, "loss": 0.0397, "step": 116690 }, { "epoch": 0.75, "learning_rate": 0.00018701859465460152, "loss": 0.0481, "step": 116700 }, { "epoch": 0.75, "learning_rate": 0.00018700891330024458, "loss": 0.0413, "step": 116710 }, { "epoch": 0.75, "learning_rate": 0.00018699923194588766, "loss": 0.0415, "step": 116720 }, { "epoch": 0.75, "learning_rate": 0.00018698955059153074, "loss": 0.0406, "step": 116730 }, { "epoch": 0.75, "learning_rate": 0.00018697986923717382, "loss": 0.0417, "step": 116740 }, { "epoch": 0.75, "learning_rate": 0.00018697018788281687, "loss": 0.041, "step": 116750 }, { "epoch": 0.75, "learning_rate": 0.00018696050652845995, "loss": 0.042, "step": 116760 }, { "epoch": 0.75, "learning_rate": 0.000186950825174103, "loss": 0.0483, "step": 116770 }, { "epoch": 0.75, "learning_rate": 0.00018694114381974605, "loss": 0.046, "step": 116780 }, { "epoch": 0.75, "learning_rate": 0.00018693146246538913, "loss": 0.0394, "step": 116790 }, { "epoch": 0.75, "learning_rate": 0.00018692178111103221, "loss": 0.0408, "step": 116800 }, { "epoch": 0.75, "learning_rate": 0.0001869120997566753, "loss": 0.0405, "step": 116810 }, { "epoch": 0.75, "learning_rate": 0.00018690241840231835, "loss": 0.0521, "step": 116820 }, { "epoch": 0.75, "learning_rate": 0.00018689273704796143, "loss": 0.0416, "step": 116830 }, { "epoch": 0.75, "learning_rate": 0.00018688305569360448, "loss": 0.0521, "step": 116840 }, { "epoch": 0.75, "learning_rate": 0.00018687337433924753, "loss": 0.0496, "step": 116850 }, { "epoch": 0.75, "learning_rate": 0.0001868636929848906, "loss": 0.0513, "step": 116860 }, { "epoch": 0.75, "learning_rate": 0.0001868540116305337, "loss": 0.0521, "step": 116870 }, { "epoch": 0.75, "learning_rate": 0.00018684433027617674, "loss": 0.0493, "step": 116880 }, { "epoch": 0.75, "learning_rate": 0.00018683464892181982, "loss": 0.041, "step": 116890 }, { "epoch": 0.75, "learning_rate": 0.0001868249675674629, "loss": 0.048, "step": 116900 }, { "epoch": 0.75, "learning_rate": 0.00018681528621310593, "loss": 0.0402, "step": 116910 }, { "epoch": 0.75, "learning_rate": 0.000186805604858749, "loss": 0.0411, "step": 116920 }, { "epoch": 0.75, "learning_rate": 0.0001867959235043921, "loss": 0.0395, "step": 116930 }, { "epoch": 0.75, "learning_rate": 0.00018678624215003517, "loss": 0.0436, "step": 116940 }, { "epoch": 0.75, "learning_rate": 0.00018677656079567822, "loss": 0.0396, "step": 116950 }, { "epoch": 0.75, "learning_rate": 0.0001867668794413213, "loss": 0.0487, "step": 116960 }, { "epoch": 0.75, "learning_rate": 0.00018675719808696438, "loss": 0.0385, "step": 116970 }, { "epoch": 0.76, "learning_rate": 0.0001867475167326074, "loss": 0.0423, "step": 116980 }, { "epoch": 0.76, "learning_rate": 0.00018673783537825049, "loss": 0.0463, "step": 116990 }, { "epoch": 0.76, "learning_rate": 0.00018672815402389357, "loss": 0.0384, "step": 117000 }, { "epoch": 0.76, "eval_cer": 0.9199240763755507, "eval_loss": 0.02930784970521927, "eval_runtime": 120.0533, "eval_samples_per_second": 16.659, "eval_steps_per_second": 4.165, "step": 117000 }, { "epoch": 0.76, "learning_rate": 0.00018671847266953665, "loss": 0.0382, "step": 117010 }, { "epoch": 0.76, "learning_rate": 0.0001867087913151797, "loss": 0.0464, "step": 117020 }, { "epoch": 0.76, "learning_rate": 0.00018669910996082278, "loss": 0.0417, "step": 117030 }, { "epoch": 0.76, "learning_rate": 0.00018668942860646586, "loss": 0.0434, "step": 117040 }, { "epoch": 0.76, "learning_rate": 0.00018667974725210888, "loss": 0.0404, "step": 117050 }, { "epoch": 0.76, "learning_rate": 0.00018667006589775196, "loss": 0.0386, "step": 117060 }, { "epoch": 0.76, "learning_rate": 0.00018666038454339504, "loss": 0.0434, "step": 117070 }, { "epoch": 0.76, "learning_rate": 0.0001866507031890381, "loss": 0.043, "step": 117080 }, { "epoch": 0.76, "learning_rate": 0.00018664102183468118, "loss": 0.0431, "step": 117090 }, { "epoch": 0.76, "learning_rate": 0.00018663134048032426, "loss": 0.0397, "step": 117100 }, { "epoch": 0.76, "learning_rate": 0.00018662165912596734, "loss": 0.0447, "step": 117110 }, { "epoch": 0.76, "learning_rate": 0.00018661197777161036, "loss": 0.0444, "step": 117120 }, { "epoch": 0.76, "learning_rate": 0.00018660229641725344, "loss": 0.0466, "step": 117130 }, { "epoch": 0.76, "learning_rate": 0.00018659261506289652, "loss": 0.0473, "step": 117140 }, { "epoch": 0.76, "learning_rate": 0.00018658293370853957, "loss": 0.0521, "step": 117150 }, { "epoch": 0.76, "learning_rate": 0.00018657325235418265, "loss": 0.0432, "step": 117160 }, { "epoch": 0.76, "learning_rate": 0.00018656357099982573, "loss": 0.0385, "step": 117170 }, { "epoch": 0.76, "learning_rate": 0.0001865538896454688, "loss": 0.0412, "step": 117180 }, { "epoch": 0.76, "learning_rate": 0.00018654420829111184, "loss": 0.0438, "step": 117190 }, { "epoch": 0.76, "learning_rate": 0.00018653452693675492, "loss": 0.0441, "step": 117200 }, { "epoch": 0.76, "learning_rate": 0.000186524845582398, "loss": 0.0477, "step": 117210 }, { "epoch": 0.76, "learning_rate": 0.00018651516422804105, "loss": 0.0519, "step": 117220 }, { "epoch": 0.76, "learning_rate": 0.00018650548287368413, "loss": 0.0382, "step": 117230 }, { "epoch": 0.76, "learning_rate": 0.0001864958015193272, "loss": 0.0411, "step": 117240 }, { "epoch": 0.76, "learning_rate": 0.0001864861201649703, "loss": 0.0424, "step": 117250 }, { "epoch": 0.76, "learning_rate": 0.00018647643881061332, "loss": 0.046, "step": 117260 }, { "epoch": 0.76, "learning_rate": 0.0001864667574562564, "loss": 0.0488, "step": 117270 }, { "epoch": 0.76, "learning_rate": 0.00018645707610189945, "loss": 0.0421, "step": 117280 }, { "epoch": 0.76, "learning_rate": 0.00018644739474754253, "loss": 0.0431, "step": 117290 }, { "epoch": 0.76, "learning_rate": 0.0001864377133931856, "loss": 0.0444, "step": 117300 }, { "epoch": 0.76, "learning_rate": 0.0001864280320388287, "loss": 0.0451, "step": 117310 }, { "epoch": 0.76, "learning_rate": 0.00018641835068447174, "loss": 0.0473, "step": 117320 }, { "epoch": 0.76, "learning_rate": 0.0001864086693301148, "loss": 0.0425, "step": 117330 }, { "epoch": 0.76, "learning_rate": 0.00018639898797575787, "loss": 0.0415, "step": 117340 }, { "epoch": 0.76, "learning_rate": 0.00018638930662140092, "loss": 0.0433, "step": 117350 }, { "epoch": 0.76, "learning_rate": 0.000186379625267044, "loss": 0.0424, "step": 117360 }, { "epoch": 0.76, "learning_rate": 0.00018636994391268708, "loss": 0.0372, "step": 117370 }, { "epoch": 0.76, "learning_rate": 0.00018636026255833016, "loss": 0.0391, "step": 117380 }, { "epoch": 0.76, "learning_rate": 0.00018635058120397322, "loss": 0.0411, "step": 117390 }, { "epoch": 0.76, "learning_rate": 0.00018634089984961627, "loss": 0.0462, "step": 117400 }, { "epoch": 0.76, "learning_rate": 0.00018633121849525935, "loss": 0.0426, "step": 117410 }, { "epoch": 0.76, "learning_rate": 0.0001863215371409024, "loss": 0.0452, "step": 117420 }, { "epoch": 0.76, "learning_rate": 0.00018631185578654548, "loss": 0.051, "step": 117430 }, { "epoch": 0.76, "learning_rate": 0.00018630217443218856, "loss": 0.0562, "step": 117440 }, { "epoch": 0.76, "learning_rate": 0.00018629249307783164, "loss": 0.0427, "step": 117450 }, { "epoch": 0.76, "learning_rate": 0.0001862828117234747, "loss": 0.044, "step": 117460 }, { "epoch": 0.76, "learning_rate": 0.00018627313036911775, "loss": 0.044, "step": 117470 }, { "epoch": 0.76, "learning_rate": 0.0001862634490147608, "loss": 0.0383, "step": 117480 }, { "epoch": 0.76, "learning_rate": 0.00018625376766040388, "loss": 0.0543, "step": 117490 }, { "epoch": 0.76, "learning_rate": 0.00018624408630604696, "loss": 0.0384, "step": 117500 }, { "epoch": 0.76, "learning_rate": 0.00018623440495169004, "loss": 0.046, "step": 117510 }, { "epoch": 0.76, "learning_rate": 0.0001862247235973331, "loss": 0.0426, "step": 117520 }, { "epoch": 0.76, "learning_rate": 0.00018621504224297617, "loss": 0.0499, "step": 117530 }, { "epoch": 0.76, "learning_rate": 0.00018620536088861922, "loss": 0.0437, "step": 117540 }, { "epoch": 0.76, "learning_rate": 0.00018619567953426228, "loss": 0.0583, "step": 117550 }, { "epoch": 0.76, "learning_rate": 0.00018618599817990536, "loss": 0.0443, "step": 117560 }, { "epoch": 0.76, "learning_rate": 0.00018617631682554844, "loss": 0.045, "step": 117570 }, { "epoch": 0.76, "learning_rate": 0.00018616663547119152, "loss": 0.0378, "step": 117580 }, { "epoch": 0.76, "learning_rate": 0.00018615695411683457, "loss": 0.0478, "step": 117590 }, { "epoch": 0.76, "learning_rate": 0.00018614727276247765, "loss": 0.0473, "step": 117600 }, { "epoch": 0.76, "learning_rate": 0.0001861375914081207, "loss": 0.0443, "step": 117610 }, { "epoch": 0.76, "learning_rate": 0.00018612791005376375, "loss": 0.0472, "step": 117620 }, { "epoch": 0.76, "learning_rate": 0.00018611822869940683, "loss": 0.0409, "step": 117630 }, { "epoch": 0.76, "learning_rate": 0.00018610854734504991, "loss": 0.0441, "step": 117640 }, { "epoch": 0.76, "learning_rate": 0.000186098865990693, "loss": 0.0395, "step": 117650 }, { "epoch": 0.76, "learning_rate": 0.00018608918463633605, "loss": 0.0418, "step": 117660 }, { "epoch": 0.76, "learning_rate": 0.00018607950328197913, "loss": 0.0422, "step": 117670 }, { "epoch": 0.76, "learning_rate": 0.00018606982192762215, "loss": 0.0488, "step": 117680 }, { "epoch": 0.76, "learning_rate": 0.00018606014057326523, "loss": 0.0452, "step": 117690 }, { "epoch": 0.76, "learning_rate": 0.0001860504592189083, "loss": 0.0408, "step": 117700 }, { "epoch": 0.76, "learning_rate": 0.0001860407778645514, "loss": 0.0354, "step": 117710 }, { "epoch": 0.76, "learning_rate": 0.00018603109651019444, "loss": 0.0531, "step": 117720 }, { "epoch": 0.76, "learning_rate": 0.00018602141515583752, "loss": 0.0456, "step": 117730 }, { "epoch": 0.76, "learning_rate": 0.0001860117338014806, "loss": 0.0456, "step": 117740 }, { "epoch": 0.76, "learning_rate": 0.00018600205244712363, "loss": 0.042, "step": 117750 }, { "epoch": 0.76, "learning_rate": 0.0001859923710927667, "loss": 0.0388, "step": 117760 }, { "epoch": 0.76, "learning_rate": 0.0001859826897384098, "loss": 0.0413, "step": 117770 }, { "epoch": 0.76, "learning_rate": 0.00018597300838405287, "loss": 0.0447, "step": 117780 }, { "epoch": 0.76, "learning_rate": 0.00018596332702969592, "loss": 0.041, "step": 117790 }, { "epoch": 0.76, "learning_rate": 0.000185953645675339, "loss": 0.0432, "step": 117800 }, { "epoch": 0.76, "learning_rate": 0.00018594396432098208, "loss": 0.0474, "step": 117810 }, { "epoch": 0.76, "learning_rate": 0.0001859342829666251, "loss": 0.0431, "step": 117820 }, { "epoch": 0.76, "learning_rate": 0.00018592460161226819, "loss": 0.0608, "step": 117830 }, { "epoch": 0.76, "learning_rate": 0.00018591492025791127, "loss": 0.0547, "step": 117840 }, { "epoch": 0.76, "learning_rate": 0.00018590523890355435, "loss": 0.0451, "step": 117850 }, { "epoch": 0.76, "learning_rate": 0.0001858955575491974, "loss": 0.0447, "step": 117860 }, { "epoch": 0.76, "learning_rate": 0.00018588587619484048, "loss": 0.038, "step": 117870 }, { "epoch": 0.76, "learning_rate": 0.00018587619484048356, "loss": 0.0479, "step": 117880 }, { "epoch": 0.76, "learning_rate": 0.00018586651348612658, "loss": 0.0391, "step": 117890 }, { "epoch": 0.76, "learning_rate": 0.00018585683213176966, "loss": 0.0398, "step": 117900 }, { "epoch": 0.76, "learning_rate": 0.00018584715077741274, "loss": 0.0389, "step": 117910 }, { "epoch": 0.76, "learning_rate": 0.0001858374694230558, "loss": 0.0533, "step": 117920 }, { "epoch": 0.76, "learning_rate": 0.00018582778806869888, "loss": 0.0398, "step": 117930 }, { "epoch": 0.76, "learning_rate": 0.00018581810671434195, "loss": 0.0422, "step": 117940 }, { "epoch": 0.76, "learning_rate": 0.00018580842535998503, "loss": 0.0522, "step": 117950 }, { "epoch": 0.76, "learning_rate": 0.00018579874400562806, "loss": 0.0393, "step": 117960 }, { "epoch": 0.76, "learning_rate": 0.00018578906265127114, "loss": 0.0408, "step": 117970 }, { "epoch": 0.76, "learning_rate": 0.00018577938129691422, "loss": 0.0437, "step": 117980 }, { "epoch": 0.76, "learning_rate": 0.00018576969994255727, "loss": 0.0415, "step": 117990 }, { "epoch": 0.76, "learning_rate": 0.00018576001858820035, "loss": 0.0492, "step": 118000 }, { "epoch": 0.76, "eval_cer": 0.9199322110495989, "eval_loss": 0.029090311378240585, "eval_runtime": 119.8047, "eval_samples_per_second": 16.694, "eval_steps_per_second": 4.173, "step": 118000 }, { "epoch": 0.76, "learning_rate": 0.00018575033723384343, "loss": 0.0435, "step": 118010 }, { "epoch": 0.76, "learning_rate": 0.0001857406558794865, "loss": 0.0426, "step": 118020 }, { "epoch": 0.76, "learning_rate": 0.00018573097452512954, "loss": 0.0415, "step": 118030 }, { "epoch": 0.76, "learning_rate": 0.00018572129317077262, "loss": 0.0477, "step": 118040 }, { "epoch": 0.76, "learning_rate": 0.0001857116118164157, "loss": 0.0418, "step": 118050 }, { "epoch": 0.76, "learning_rate": 0.00018570193046205875, "loss": 0.0453, "step": 118060 }, { "epoch": 0.76, "learning_rate": 0.00018569224910770183, "loss": 0.046, "step": 118070 }, { "epoch": 0.76, "learning_rate": 0.0001856825677533449, "loss": 0.0414, "step": 118080 }, { "epoch": 0.76, "learning_rate": 0.00018567288639898796, "loss": 0.0435, "step": 118090 }, { "epoch": 0.76, "learning_rate": 0.00018566320504463101, "loss": 0.0465, "step": 118100 }, { "epoch": 0.76, "learning_rate": 0.0001856535236902741, "loss": 0.0512, "step": 118110 }, { "epoch": 0.76, "learning_rate": 0.00018564384233591715, "loss": 0.0528, "step": 118120 }, { "epoch": 0.76, "learning_rate": 0.00018563416098156023, "loss": 0.0521, "step": 118130 }, { "epoch": 0.76, "learning_rate": 0.0001856244796272033, "loss": 0.0455, "step": 118140 }, { "epoch": 0.76, "learning_rate": 0.0001856147982728464, "loss": 0.041, "step": 118150 }, { "epoch": 0.76, "learning_rate": 0.00018560511691848944, "loss": 0.044, "step": 118160 }, { "epoch": 0.76, "learning_rate": 0.0001855954355641325, "loss": 0.0421, "step": 118170 }, { "epoch": 0.76, "learning_rate": 0.00018558575420977557, "loss": 0.0497, "step": 118180 }, { "epoch": 0.76, "learning_rate": 0.00018557607285541862, "loss": 0.0517, "step": 118190 }, { "epoch": 0.76, "learning_rate": 0.0001855663915010617, "loss": 0.0433, "step": 118200 }, { "epoch": 0.76, "learning_rate": 0.00018555671014670478, "loss": 0.0603, "step": 118210 }, { "epoch": 0.76, "learning_rate": 0.00018554702879234786, "loss": 0.0479, "step": 118220 }, { "epoch": 0.76, "learning_rate": 0.00018553734743799092, "loss": 0.0471, "step": 118230 }, { "epoch": 0.76, "learning_rate": 0.00018552766608363397, "loss": 0.054, "step": 118240 }, { "epoch": 0.76, "learning_rate": 0.00018551798472927705, "loss": 0.045, "step": 118250 }, { "epoch": 0.76, "learning_rate": 0.0001855083033749201, "loss": 0.0401, "step": 118260 }, { "epoch": 0.76, "learning_rate": 0.00018549862202056318, "loss": 0.0431, "step": 118270 }, { "epoch": 0.76, "learning_rate": 0.00018548894066620626, "loss": 0.0488, "step": 118280 }, { "epoch": 0.76, "learning_rate": 0.00018547925931184931, "loss": 0.0384, "step": 118290 }, { "epoch": 0.76, "learning_rate": 0.0001854695779574924, "loss": 0.0424, "step": 118300 }, { "epoch": 0.76, "learning_rate": 0.00018545989660313545, "loss": 0.04, "step": 118310 }, { "epoch": 0.76, "learning_rate": 0.0001854502152487785, "loss": 0.0378, "step": 118320 }, { "epoch": 0.76, "learning_rate": 0.00018544053389442158, "loss": 0.0416, "step": 118330 }, { "epoch": 0.76, "learning_rate": 0.00018543085254006466, "loss": 0.043, "step": 118340 }, { "epoch": 0.76, "learning_rate": 0.00018542117118570774, "loss": 0.0455, "step": 118350 }, { "epoch": 0.76, "learning_rate": 0.0001854114898313508, "loss": 0.0387, "step": 118360 }, { "epoch": 0.76, "learning_rate": 0.00018540180847699387, "loss": 0.0437, "step": 118370 }, { "epoch": 0.76, "learning_rate": 0.00018539212712263692, "loss": 0.0407, "step": 118380 }, { "epoch": 0.76, "learning_rate": 0.00018538244576827998, "loss": 0.0458, "step": 118390 }, { "epoch": 0.76, "learning_rate": 0.00018537276441392306, "loss": 0.0424, "step": 118400 }, { "epoch": 0.76, "learning_rate": 0.00018536308305956614, "loss": 0.0467, "step": 118410 }, { "epoch": 0.76, "learning_rate": 0.00018535340170520922, "loss": 0.0434, "step": 118420 }, { "epoch": 0.76, "learning_rate": 0.00018534372035085227, "loss": 0.0372, "step": 118430 }, { "epoch": 0.76, "learning_rate": 0.00018533403899649535, "loss": 0.0411, "step": 118440 }, { "epoch": 0.76, "learning_rate": 0.0001853243576421384, "loss": 0.045, "step": 118450 }, { "epoch": 0.76, "learning_rate": 0.00018531467628778145, "loss": 0.0583, "step": 118460 }, { "epoch": 0.76, "learning_rate": 0.00018530499493342453, "loss": 0.046, "step": 118470 }, { "epoch": 0.76, "learning_rate": 0.0001852953135790676, "loss": 0.0453, "step": 118480 }, { "epoch": 0.76, "learning_rate": 0.00018528563222471067, "loss": 0.045, "step": 118490 }, { "epoch": 0.76, "learning_rate": 0.00018527595087035375, "loss": 0.0463, "step": 118500 }, { "epoch": 0.76, "learning_rate": 0.00018526626951599683, "loss": 0.0422, "step": 118510 }, { "epoch": 0.76, "learning_rate": 0.00018525658816163985, "loss": 0.043, "step": 118520 }, { "epoch": 0.77, "learning_rate": 0.00018524690680728293, "loss": 0.0469, "step": 118530 }, { "epoch": 0.77, "learning_rate": 0.000185237225452926, "loss": 0.0519, "step": 118540 }, { "epoch": 0.77, "learning_rate": 0.0001852275440985691, "loss": 0.043, "step": 118550 }, { "epoch": 0.77, "learning_rate": 0.00018521786274421214, "loss": 0.0503, "step": 118560 }, { "epoch": 0.77, "learning_rate": 0.00018520818138985522, "loss": 0.0489, "step": 118570 }, { "epoch": 0.77, "learning_rate": 0.0001851985000354983, "loss": 0.0428, "step": 118580 }, { "epoch": 0.77, "learning_rate": 0.00018518881868114133, "loss": 0.0446, "step": 118590 }, { "epoch": 0.77, "learning_rate": 0.0001851791373267844, "loss": 0.0462, "step": 118600 }, { "epoch": 0.77, "learning_rate": 0.0001851694559724275, "loss": 0.0415, "step": 118610 }, { "epoch": 0.77, "learning_rate": 0.00018515977461807057, "loss": 0.0438, "step": 118620 }, { "epoch": 0.77, "learning_rate": 0.00018515009326371362, "loss": 0.0414, "step": 118630 }, { "epoch": 0.77, "learning_rate": 0.0001851404119093567, "loss": 0.0468, "step": 118640 }, { "epoch": 0.77, "learning_rate": 0.00018513073055499978, "loss": 0.0438, "step": 118650 }, { "epoch": 0.77, "learning_rate": 0.0001851210492006428, "loss": 0.0411, "step": 118660 }, { "epoch": 0.77, "learning_rate": 0.00018511136784628589, "loss": 0.045, "step": 118670 }, { "epoch": 0.77, "learning_rate": 0.00018510168649192897, "loss": 0.0432, "step": 118680 }, { "epoch": 0.77, "learning_rate": 0.00018509200513757202, "loss": 0.0497, "step": 118690 }, { "epoch": 0.77, "learning_rate": 0.0001850823237832151, "loss": 0.0428, "step": 118700 }, { "epoch": 0.77, "learning_rate": 0.00018507264242885818, "loss": 0.0393, "step": 118710 }, { "epoch": 0.77, "learning_rate": 0.00018506296107450126, "loss": 0.0512, "step": 118720 }, { "epoch": 0.77, "learning_rate": 0.00018505327972014428, "loss": 0.0447, "step": 118730 }, { "epoch": 0.77, "learning_rate": 0.00018504359836578736, "loss": 0.0483, "step": 118740 }, { "epoch": 0.77, "learning_rate": 0.00018503391701143044, "loss": 0.0393, "step": 118750 }, { "epoch": 0.77, "learning_rate": 0.0001850242356570735, "loss": 0.0478, "step": 118760 }, { "epoch": 0.77, "learning_rate": 0.00018501455430271657, "loss": 0.0441, "step": 118770 }, { "epoch": 0.77, "learning_rate": 0.00018500487294835965, "loss": 0.0389, "step": 118780 }, { "epoch": 0.77, "learning_rate": 0.00018499519159400273, "loss": 0.0435, "step": 118790 }, { "epoch": 0.77, "learning_rate": 0.00018498551023964576, "loss": 0.0473, "step": 118800 }, { "epoch": 0.77, "learning_rate": 0.00018497582888528884, "loss": 0.0438, "step": 118810 }, { "epoch": 0.77, "learning_rate": 0.00018496614753093192, "loss": 0.0374, "step": 118820 }, { "epoch": 0.77, "learning_rate": 0.00018495646617657497, "loss": 0.0466, "step": 118830 }, { "epoch": 0.77, "learning_rate": 0.00018494678482221805, "loss": 0.0459, "step": 118840 }, { "epoch": 0.77, "learning_rate": 0.00018493710346786113, "loss": 0.0539, "step": 118850 }, { "epoch": 0.77, "learning_rate": 0.00018492742211350418, "loss": 0.0438, "step": 118860 }, { "epoch": 0.77, "learning_rate": 0.00018491774075914724, "loss": 0.0448, "step": 118870 }, { "epoch": 0.77, "learning_rate": 0.00018490805940479032, "loss": 0.0432, "step": 118880 }, { "epoch": 0.77, "learning_rate": 0.00018489837805043337, "loss": 0.0405, "step": 118890 }, { "epoch": 0.77, "learning_rate": 0.00018488869669607645, "loss": 0.0406, "step": 118900 }, { "epoch": 0.77, "learning_rate": 0.00018487901534171953, "loss": 0.0547, "step": 118910 }, { "epoch": 0.77, "learning_rate": 0.0001848693339873626, "loss": 0.0437, "step": 118920 }, { "epoch": 0.77, "learning_rate": 0.00018485965263300566, "loss": 0.0448, "step": 118930 }, { "epoch": 0.77, "learning_rate": 0.00018484997127864871, "loss": 0.0355, "step": 118940 }, { "epoch": 0.77, "learning_rate": 0.0001848402899242918, "loss": 0.0403, "step": 118950 }, { "epoch": 0.77, "learning_rate": 0.00018483060856993485, "loss": 0.0423, "step": 118960 }, { "epoch": 0.77, "learning_rate": 0.00018482092721557793, "loss": 0.0421, "step": 118970 }, { "epoch": 0.77, "learning_rate": 0.000184811245861221, "loss": 0.0431, "step": 118980 }, { "epoch": 0.77, "learning_rate": 0.00018480156450686409, "loss": 0.0418, "step": 118990 }, { "epoch": 0.77, "learning_rate": 0.00018479188315250714, "loss": 0.0415, "step": 119000 }, { "epoch": 0.77, "eval_cer": 0.9199755959778556, "eval_loss": 0.028800196945667267, "eval_runtime": 119.8883, "eval_samples_per_second": 16.682, "eval_steps_per_second": 4.171, "step": 119000 }, { "epoch": 0.77, "learning_rate": 0.0001847822017981502, "loss": 0.0439, "step": 119010 }, { "epoch": 0.77, "learning_rate": 0.00018477252044379327, "loss": 0.044, "step": 119020 }, { "epoch": 0.77, "learning_rate": 0.00018476283908943632, "loss": 0.0408, "step": 119030 }, { "epoch": 0.77, "learning_rate": 0.0001847531577350794, "loss": 0.0408, "step": 119040 }, { "epoch": 0.77, "learning_rate": 0.00018474347638072248, "loss": 0.0431, "step": 119050 }, { "epoch": 0.77, "learning_rate": 0.00018473379502636554, "loss": 0.0401, "step": 119060 }, { "epoch": 0.77, "learning_rate": 0.00018472411367200862, "loss": 0.0385, "step": 119070 }, { "epoch": 0.77, "learning_rate": 0.00018471443231765167, "loss": 0.0437, "step": 119080 }, { "epoch": 0.77, "learning_rate": 0.00018470475096329472, "loss": 0.0423, "step": 119090 }, { "epoch": 0.77, "learning_rate": 0.0001846950696089378, "loss": 0.0455, "step": 119100 }, { "epoch": 0.77, "learning_rate": 0.00018468538825458088, "loss": 0.0437, "step": 119110 }, { "epoch": 0.77, "learning_rate": 0.00018467570690022396, "loss": 0.0447, "step": 119120 }, { "epoch": 0.77, "learning_rate": 0.00018466602554586701, "loss": 0.0416, "step": 119130 }, { "epoch": 0.77, "learning_rate": 0.0001846563441915101, "loss": 0.038, "step": 119140 }, { "epoch": 0.77, "learning_rate": 0.00018464666283715315, "loss": 0.0391, "step": 119150 }, { "epoch": 0.77, "learning_rate": 0.0001846369814827962, "loss": 0.0428, "step": 119160 }, { "epoch": 0.77, "learning_rate": 0.00018462730012843928, "loss": 0.0433, "step": 119170 }, { "epoch": 0.77, "learning_rate": 0.00018461761877408236, "loss": 0.0441, "step": 119180 }, { "epoch": 0.77, "learning_rate": 0.00018460793741972544, "loss": 0.0464, "step": 119190 }, { "epoch": 0.77, "learning_rate": 0.0001845982560653685, "loss": 0.0408, "step": 119200 }, { "epoch": 0.77, "learning_rate": 0.00018458857471101157, "loss": 0.0419, "step": 119210 }, { "epoch": 0.77, "learning_rate": 0.00018457889335665462, "loss": 0.0447, "step": 119220 }, { "epoch": 0.77, "learning_rate": 0.00018456921200229768, "loss": 0.0444, "step": 119230 }, { "epoch": 0.77, "learning_rate": 0.00018455953064794076, "loss": 0.0401, "step": 119240 }, { "epoch": 0.77, "learning_rate": 0.00018454984929358384, "loss": 0.0387, "step": 119250 }, { "epoch": 0.77, "learning_rate": 0.0001845401679392269, "loss": 0.0465, "step": 119260 }, { "epoch": 0.77, "learning_rate": 0.00018453048658486997, "loss": 0.0402, "step": 119270 }, { "epoch": 0.77, "learning_rate": 0.00018452080523051305, "loss": 0.0386, "step": 119280 }, { "epoch": 0.77, "learning_rate": 0.00018451112387615607, "loss": 0.0392, "step": 119290 }, { "epoch": 0.77, "learning_rate": 0.00018450144252179915, "loss": 0.0488, "step": 119300 }, { "epoch": 0.77, "learning_rate": 0.00018449176116744223, "loss": 0.0429, "step": 119310 }, { "epoch": 0.77, "learning_rate": 0.0001844820798130853, "loss": 0.0446, "step": 119320 }, { "epoch": 0.77, "learning_rate": 0.00018447239845872837, "loss": 0.035, "step": 119330 }, { "epoch": 0.77, "learning_rate": 0.00018446271710437145, "loss": 0.0398, "step": 119340 }, { "epoch": 0.77, "learning_rate": 0.00018445303575001453, "loss": 0.0471, "step": 119350 }, { "epoch": 0.77, "learning_rate": 0.00018444335439565755, "loss": 0.0451, "step": 119360 }, { "epoch": 0.77, "learning_rate": 0.00018443367304130063, "loss": 0.0419, "step": 119370 }, { "epoch": 0.77, "learning_rate": 0.0001844239916869437, "loss": 0.0416, "step": 119380 }, { "epoch": 0.77, "learning_rate": 0.0001844143103325868, "loss": 0.0407, "step": 119390 }, { "epoch": 0.77, "learning_rate": 0.00018440462897822984, "loss": 0.0445, "step": 119400 }, { "epoch": 0.77, "learning_rate": 0.00018439494762387292, "loss": 0.0442, "step": 119410 }, { "epoch": 0.77, "learning_rate": 0.000184385266269516, "loss": 0.0394, "step": 119420 }, { "epoch": 0.77, "learning_rate": 0.00018437558491515903, "loss": 0.0458, "step": 119430 }, { "epoch": 0.77, "learning_rate": 0.0001843659035608021, "loss": 0.0444, "step": 119440 }, { "epoch": 0.77, "learning_rate": 0.0001843562222064452, "loss": 0.0406, "step": 119450 }, { "epoch": 0.77, "learning_rate": 0.00018434654085208824, "loss": 0.0389, "step": 119460 }, { "epoch": 0.77, "learning_rate": 0.00018433685949773132, "loss": 0.0453, "step": 119470 }, { "epoch": 0.77, "learning_rate": 0.0001843271781433744, "loss": 0.0468, "step": 119480 }, { "epoch": 0.77, "learning_rate": 0.00018431749678901748, "loss": 0.0529, "step": 119490 }, { "epoch": 0.77, "learning_rate": 0.0001843078154346605, "loss": 0.0412, "step": 119500 }, { "epoch": 0.77, "learning_rate": 0.00018429813408030358, "loss": 0.0408, "step": 119510 }, { "epoch": 0.77, "learning_rate": 0.00018428845272594666, "loss": 0.0407, "step": 119520 }, { "epoch": 0.77, "learning_rate": 0.00018427877137158972, "loss": 0.0403, "step": 119530 }, { "epoch": 0.77, "learning_rate": 0.0001842690900172328, "loss": 0.0407, "step": 119540 }, { "epoch": 0.77, "learning_rate": 0.00018425940866287588, "loss": 0.0432, "step": 119550 }, { "epoch": 0.77, "learning_rate": 0.00018424972730851896, "loss": 0.0482, "step": 119560 }, { "epoch": 0.77, "learning_rate": 0.00018424004595416198, "loss": 0.0417, "step": 119570 }, { "epoch": 0.77, "learning_rate": 0.00018423036459980506, "loss": 0.047, "step": 119580 }, { "epoch": 0.77, "learning_rate": 0.00018422068324544814, "loss": 0.0403, "step": 119590 }, { "epoch": 0.77, "learning_rate": 0.0001842110018910912, "loss": 0.0501, "step": 119600 }, { "epoch": 0.77, "learning_rate": 0.00018420132053673427, "loss": 0.0431, "step": 119610 }, { "epoch": 0.77, "learning_rate": 0.00018419163918237735, "loss": 0.0411, "step": 119620 }, { "epoch": 0.77, "learning_rate": 0.00018418195782802043, "loss": 0.0434, "step": 119630 }, { "epoch": 0.77, "learning_rate": 0.00018417227647366346, "loss": 0.0391, "step": 119640 }, { "epoch": 0.77, "learning_rate": 0.00018416259511930654, "loss": 0.0386, "step": 119650 }, { "epoch": 0.77, "learning_rate": 0.0001841529137649496, "loss": 0.0431, "step": 119660 }, { "epoch": 0.77, "learning_rate": 0.00018414323241059267, "loss": 0.0377, "step": 119670 }, { "epoch": 0.77, "learning_rate": 0.00018413355105623575, "loss": 0.0356, "step": 119680 }, { "epoch": 0.77, "learning_rate": 0.00018412386970187883, "loss": 0.0535, "step": 119690 }, { "epoch": 0.77, "learning_rate": 0.00018411418834752188, "loss": 0.0403, "step": 119700 }, { "epoch": 0.77, "learning_rate": 0.00018410450699316494, "loss": 0.0427, "step": 119710 }, { "epoch": 0.77, "learning_rate": 0.00018409482563880802, "loss": 0.0442, "step": 119720 }, { "epoch": 0.77, "learning_rate": 0.00018408514428445107, "loss": 0.0417, "step": 119730 }, { "epoch": 0.77, "learning_rate": 0.00018407546293009415, "loss": 0.0468, "step": 119740 }, { "epoch": 0.77, "learning_rate": 0.00018406578157573723, "loss": 0.0422, "step": 119750 }, { "epoch": 0.77, "learning_rate": 0.0001840561002213803, "loss": 0.0376, "step": 119760 }, { "epoch": 0.77, "learning_rate": 0.00018404641886702336, "loss": 0.0436, "step": 119770 }, { "epoch": 0.77, "learning_rate": 0.00018403673751266641, "loss": 0.0403, "step": 119780 }, { "epoch": 0.77, "learning_rate": 0.0001840270561583095, "loss": 0.0389, "step": 119790 }, { "epoch": 0.77, "learning_rate": 0.00018401737480395255, "loss": 0.0385, "step": 119800 }, { "epoch": 0.77, "learning_rate": 0.00018400769344959563, "loss": 0.0416, "step": 119810 }, { "epoch": 0.77, "learning_rate": 0.0001839980120952387, "loss": 0.0406, "step": 119820 }, { "epoch": 0.77, "learning_rate": 0.00018398833074088179, "loss": 0.038, "step": 119830 }, { "epoch": 0.77, "learning_rate": 0.00018397864938652484, "loss": 0.0409, "step": 119840 }, { "epoch": 0.77, "learning_rate": 0.0001839689680321679, "loss": 0.0442, "step": 119850 }, { "epoch": 0.77, "learning_rate": 0.00018395928667781097, "loss": 0.0424, "step": 119860 }, { "epoch": 0.77, "learning_rate": 0.00018394960532345402, "loss": 0.05, "step": 119870 }, { "epoch": 0.77, "learning_rate": 0.0001839399239690971, "loss": 0.0394, "step": 119880 }, { "epoch": 0.77, "learning_rate": 0.00018393024261474018, "loss": 0.0418, "step": 119890 }, { "epoch": 0.77, "learning_rate": 0.00018392056126038324, "loss": 0.0464, "step": 119900 }, { "epoch": 0.77, "learning_rate": 0.00018391087990602632, "loss": 0.0416, "step": 119910 }, { "epoch": 0.77, "learning_rate": 0.00018390119855166937, "loss": 0.0459, "step": 119920 }, { "epoch": 0.77, "learning_rate": 0.00018389151719731242, "loss": 0.0351, "step": 119930 }, { "epoch": 0.77, "learning_rate": 0.0001838818358429555, "loss": 0.0469, "step": 119940 }, { "epoch": 0.77, "learning_rate": 0.00018387215448859858, "loss": 0.0426, "step": 119950 }, { "epoch": 0.77, "learning_rate": 0.00018386247313424166, "loss": 0.0497, "step": 119960 }, { "epoch": 0.77, "learning_rate": 0.0001838527917798847, "loss": 0.0409, "step": 119970 }, { "epoch": 0.77, "learning_rate": 0.0001838431104255278, "loss": 0.0435, "step": 119980 }, { "epoch": 0.77, "learning_rate": 0.00018383342907117085, "loss": 0.0447, "step": 119990 }, { "epoch": 0.77, "learning_rate": 0.0001838237477168139, "loss": 0.0435, "step": 120000 }, { "epoch": 0.77, "eval_cer": 0.9199069031747825, "eval_loss": 0.028599528595805168, "eval_runtime": 120.0989, "eval_samples_per_second": 16.653, "eval_steps_per_second": 4.163, "step": 120000 }, { "epoch": 0.77, "learning_rate": 0.00018381406636245698, "loss": 0.0421, "step": 120010 }, { "epoch": 0.77, "learning_rate": 0.00018380438500810006, "loss": 0.0465, "step": 120020 }, { "epoch": 0.77, "learning_rate": 0.00018379470365374314, "loss": 0.0458, "step": 120030 }, { "epoch": 0.77, "learning_rate": 0.0001837850222993862, "loss": 0.0456, "step": 120040 }, { "epoch": 0.77, "learning_rate": 0.00018377534094502927, "loss": 0.0451, "step": 120050 }, { "epoch": 0.77, "learning_rate": 0.00018376565959067232, "loss": 0.0485, "step": 120060 }, { "epoch": 0.77, "learning_rate": 0.00018375597823631538, "loss": 0.0418, "step": 120070 }, { "epoch": 0.78, "learning_rate": 0.00018374629688195846, "loss": 0.0393, "step": 120080 }, { "epoch": 0.78, "learning_rate": 0.00018373661552760154, "loss": 0.042, "step": 120090 }, { "epoch": 0.78, "learning_rate": 0.0001837269341732446, "loss": 0.0386, "step": 120100 }, { "epoch": 0.78, "learning_rate": 0.00018371725281888767, "loss": 0.0398, "step": 120110 }, { "epoch": 0.78, "learning_rate": 0.00018370757146453075, "loss": 0.0373, "step": 120120 }, { "epoch": 0.78, "learning_rate": 0.00018369789011017377, "loss": 0.0463, "step": 120130 }, { "epoch": 0.78, "learning_rate": 0.00018368820875581685, "loss": 0.0454, "step": 120140 }, { "epoch": 0.78, "learning_rate": 0.00018367852740145993, "loss": 0.0419, "step": 120150 }, { "epoch": 0.78, "learning_rate": 0.000183668846047103, "loss": 0.0388, "step": 120160 }, { "epoch": 0.78, "learning_rate": 0.00018365916469274607, "loss": 0.0431, "step": 120170 }, { "epoch": 0.78, "learning_rate": 0.00018364948333838914, "loss": 0.0445, "step": 120180 }, { "epoch": 0.78, "learning_rate": 0.00018363980198403222, "loss": 0.0395, "step": 120190 }, { "epoch": 0.78, "learning_rate": 0.00018363012062967525, "loss": 0.0383, "step": 120200 }, { "epoch": 0.78, "learning_rate": 0.00018362043927531833, "loss": 0.0493, "step": 120210 }, { "epoch": 0.78, "learning_rate": 0.0001836107579209614, "loss": 0.0434, "step": 120220 }, { "epoch": 0.78, "learning_rate": 0.0001836010765666045, "loss": 0.0404, "step": 120230 }, { "epoch": 0.78, "learning_rate": 0.00018359139521224754, "loss": 0.0461, "step": 120240 }, { "epoch": 0.78, "learning_rate": 0.00018358171385789062, "loss": 0.0441, "step": 120250 }, { "epoch": 0.78, "learning_rate": 0.0001835720325035337, "loss": 0.0421, "step": 120260 }, { "epoch": 0.78, "learning_rate": 0.00018356235114917673, "loss": 0.039, "step": 120270 }, { "epoch": 0.78, "learning_rate": 0.0001835526697948198, "loss": 0.0417, "step": 120280 }, { "epoch": 0.78, "learning_rate": 0.0001835429884404629, "loss": 0.0475, "step": 120290 }, { "epoch": 0.78, "learning_rate": 0.00018353330708610594, "loss": 0.0524, "step": 120300 }, { "epoch": 0.78, "learning_rate": 0.00018352362573174902, "loss": 0.0438, "step": 120310 }, { "epoch": 0.78, "learning_rate": 0.0001835139443773921, "loss": 0.0386, "step": 120320 }, { "epoch": 0.78, "learning_rate": 0.00018350426302303518, "loss": 0.0415, "step": 120330 }, { "epoch": 0.78, "learning_rate": 0.0001834945816686782, "loss": 0.0424, "step": 120340 }, { "epoch": 0.78, "learning_rate": 0.00018348490031432128, "loss": 0.0435, "step": 120350 }, { "epoch": 0.78, "learning_rate": 0.00018347521895996436, "loss": 0.0423, "step": 120360 }, { "epoch": 0.78, "learning_rate": 0.00018346553760560742, "loss": 0.046, "step": 120370 }, { "epoch": 0.78, "learning_rate": 0.0001834558562512505, "loss": 0.0389, "step": 120380 }, { "epoch": 0.78, "learning_rate": 0.00018344617489689358, "loss": 0.0478, "step": 120390 }, { "epoch": 0.78, "learning_rate": 0.00018343649354253666, "loss": 0.047, "step": 120400 }, { "epoch": 0.78, "learning_rate": 0.00018342681218817968, "loss": 0.0405, "step": 120410 }, { "epoch": 0.78, "learning_rate": 0.00018341713083382276, "loss": 0.0445, "step": 120420 }, { "epoch": 0.78, "learning_rate": 0.00018340744947946584, "loss": 0.0454, "step": 120430 }, { "epoch": 0.78, "learning_rate": 0.0001833977681251089, "loss": 0.0451, "step": 120440 }, { "epoch": 0.78, "learning_rate": 0.00018338808677075197, "loss": 0.0466, "step": 120450 }, { "epoch": 0.78, "learning_rate": 0.00018337840541639505, "loss": 0.0361, "step": 120460 }, { "epoch": 0.78, "learning_rate": 0.0001833687240620381, "loss": 0.0453, "step": 120470 }, { "epoch": 0.78, "learning_rate": 0.00018335904270768116, "loss": 0.0406, "step": 120480 }, { "epoch": 0.78, "learning_rate": 0.00018334936135332424, "loss": 0.0453, "step": 120490 }, { "epoch": 0.78, "learning_rate": 0.0001833396799989673, "loss": 0.0433, "step": 120500 }, { "epoch": 0.78, "learning_rate": 0.00018332999864461037, "loss": 0.0478, "step": 120510 }, { "epoch": 0.78, "learning_rate": 0.00018332031729025345, "loss": 0.0473, "step": 120520 }, { "epoch": 0.78, "learning_rate": 0.00018331063593589653, "loss": 0.0444, "step": 120530 }, { "epoch": 0.78, "learning_rate": 0.00018330095458153956, "loss": 0.043, "step": 120540 }, { "epoch": 0.78, "learning_rate": 0.00018329127322718264, "loss": 0.0421, "step": 120550 }, { "epoch": 0.78, "learning_rate": 0.00018328159187282572, "loss": 0.0354, "step": 120560 }, { "epoch": 0.78, "learning_rate": 0.00018327191051846877, "loss": 0.0417, "step": 120570 }, { "epoch": 0.78, "learning_rate": 0.00018326222916411185, "loss": 0.0408, "step": 120580 }, { "epoch": 0.78, "learning_rate": 0.00018325254780975493, "loss": 0.045, "step": 120590 }, { "epoch": 0.78, "learning_rate": 0.000183242866455398, "loss": 0.0446, "step": 120600 }, { "epoch": 0.78, "learning_rate": 0.00018323318510104103, "loss": 0.052, "step": 120610 }, { "epoch": 0.78, "learning_rate": 0.00018322350374668411, "loss": 0.0372, "step": 120620 }, { "epoch": 0.78, "learning_rate": 0.0001832138223923272, "loss": 0.0393, "step": 120630 }, { "epoch": 0.78, "learning_rate": 0.00018320414103797025, "loss": 0.0402, "step": 120640 }, { "epoch": 0.78, "learning_rate": 0.00018319445968361333, "loss": 0.0486, "step": 120650 }, { "epoch": 0.78, "learning_rate": 0.0001831847783292564, "loss": 0.0431, "step": 120660 }, { "epoch": 0.78, "learning_rate": 0.00018317509697489946, "loss": 0.0469, "step": 120670 }, { "epoch": 0.78, "learning_rate": 0.0001831654156205425, "loss": 0.0467, "step": 120680 }, { "epoch": 0.78, "learning_rate": 0.0001831557342661856, "loss": 0.0468, "step": 120690 }, { "epoch": 0.78, "learning_rate": 0.00018314605291182864, "loss": 0.0485, "step": 120700 }, { "epoch": 0.78, "learning_rate": 0.00018313637155747172, "loss": 0.0464, "step": 120710 }, { "epoch": 0.78, "learning_rate": 0.0001831266902031148, "loss": 0.0428, "step": 120720 }, { "epoch": 0.78, "learning_rate": 0.00018311700884875788, "loss": 0.0424, "step": 120730 }, { "epoch": 0.78, "learning_rate": 0.00018310732749440094, "loss": 0.0468, "step": 120740 }, { "epoch": 0.78, "learning_rate": 0.000183097646140044, "loss": 0.0537, "step": 120750 }, { "epoch": 0.78, "learning_rate": 0.00018308796478568707, "loss": 0.0419, "step": 120760 }, { "epoch": 0.78, "learning_rate": 0.00018307828343133012, "loss": 0.0457, "step": 120770 }, { "epoch": 0.78, "learning_rate": 0.0001830686020769732, "loss": 0.0401, "step": 120780 }, { "epoch": 0.78, "learning_rate": 0.00018305892072261628, "loss": 0.0433, "step": 120790 }, { "epoch": 0.78, "learning_rate": 0.00018304923936825936, "loss": 0.0417, "step": 120800 }, { "epoch": 0.78, "learning_rate": 0.0001830395580139024, "loss": 0.0378, "step": 120810 }, { "epoch": 0.78, "learning_rate": 0.00018302987665954547, "loss": 0.0405, "step": 120820 }, { "epoch": 0.78, "learning_rate": 0.00018302019530518855, "loss": 0.0407, "step": 120830 }, { "epoch": 0.78, "learning_rate": 0.0001830105139508316, "loss": 0.0481, "step": 120840 }, { "epoch": 0.78, "learning_rate": 0.00018300083259647468, "loss": 0.0488, "step": 120850 }, { "epoch": 0.78, "learning_rate": 0.00018299115124211776, "loss": 0.0399, "step": 120860 }, { "epoch": 0.78, "learning_rate": 0.0001829814698877608, "loss": 0.0413, "step": 120870 }, { "epoch": 0.78, "learning_rate": 0.0001829717885334039, "loss": 0.0407, "step": 120880 }, { "epoch": 0.78, "learning_rate": 0.00018296210717904694, "loss": 0.0456, "step": 120890 }, { "epoch": 0.78, "learning_rate": 0.00018295242582469, "loss": 0.0399, "step": 120900 }, { "epoch": 0.78, "learning_rate": 0.00018294274447033308, "loss": 0.039, "step": 120910 }, { "epoch": 0.78, "learning_rate": 0.00018293306311597616, "loss": 0.0428, "step": 120920 }, { "epoch": 0.78, "learning_rate": 0.00018292338176161923, "loss": 0.0397, "step": 120930 }, { "epoch": 0.78, "learning_rate": 0.0001829137004072623, "loss": 0.0413, "step": 120940 }, { "epoch": 0.78, "learning_rate": 0.00018290401905290537, "loss": 0.0439, "step": 120950 }, { "epoch": 0.78, "learning_rate": 0.00018289433769854842, "loss": 0.0413, "step": 120960 }, { "epoch": 0.78, "learning_rate": 0.00018288465634419147, "loss": 0.0514, "step": 120970 }, { "epoch": 0.78, "learning_rate": 0.00018287497498983455, "loss": 0.0476, "step": 120980 }, { "epoch": 0.78, "learning_rate": 0.00018286529363547763, "loss": 0.0417, "step": 120990 }, { "epoch": 0.78, "learning_rate": 0.0001828556122811207, "loss": 0.0423, "step": 121000 }, { "epoch": 0.78, "eval_cer": 0.9198309795503333, "eval_loss": 0.02841617912054062, "eval_runtime": 120.0158, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 121000 }, { "epoch": 0.78, "learning_rate": 0.00018284593092676376, "loss": 0.0425, "step": 121010 }, { "epoch": 0.78, "learning_rate": 0.00018283624957240684, "loss": 0.0448, "step": 121020 }, { "epoch": 0.78, "learning_rate": 0.0001828265682180499, "loss": 0.0514, "step": 121030 }, { "epoch": 0.78, "learning_rate": 0.00018281688686369295, "loss": 0.0408, "step": 121040 }, { "epoch": 0.78, "learning_rate": 0.00018280720550933603, "loss": 0.0441, "step": 121050 }, { "epoch": 0.78, "learning_rate": 0.0001827975241549791, "loss": 0.0437, "step": 121060 }, { "epoch": 0.78, "learning_rate": 0.00018278784280062216, "loss": 0.0405, "step": 121070 }, { "epoch": 0.78, "learning_rate": 0.00018277816144626524, "loss": 0.048, "step": 121080 }, { "epoch": 0.78, "learning_rate": 0.00018276848009190832, "loss": 0.0421, "step": 121090 }, { "epoch": 0.78, "learning_rate": 0.00018275879873755135, "loss": 0.0439, "step": 121100 }, { "epoch": 0.78, "learning_rate": 0.00018274911738319443, "loss": 0.0408, "step": 121110 }, { "epoch": 0.78, "learning_rate": 0.0001827394360288375, "loss": 0.0439, "step": 121120 }, { "epoch": 0.78, "learning_rate": 0.0001827297546744806, "loss": 0.0491, "step": 121130 }, { "epoch": 0.78, "learning_rate": 0.00018272007332012364, "loss": 0.0431, "step": 121140 }, { "epoch": 0.78, "learning_rate": 0.00018271039196576672, "loss": 0.0407, "step": 121150 }, { "epoch": 0.78, "learning_rate": 0.0001827007106114098, "loss": 0.0556, "step": 121160 }, { "epoch": 0.78, "learning_rate": 0.00018269102925705282, "loss": 0.0461, "step": 121170 }, { "epoch": 0.78, "learning_rate": 0.0001826813479026959, "loss": 0.0419, "step": 121180 }, { "epoch": 0.78, "learning_rate": 0.00018267166654833898, "loss": 0.0469, "step": 121190 }, { "epoch": 0.78, "learning_rate": 0.00018266198519398206, "loss": 0.0383, "step": 121200 }, { "epoch": 0.78, "learning_rate": 0.00018265230383962512, "loss": 0.0427, "step": 121210 }, { "epoch": 0.78, "learning_rate": 0.0001826426224852682, "loss": 0.0391, "step": 121220 }, { "epoch": 0.78, "learning_rate": 0.00018263294113091128, "loss": 0.0412, "step": 121230 }, { "epoch": 0.78, "learning_rate": 0.0001826232597765543, "loss": 0.0437, "step": 121240 }, { "epoch": 0.78, "learning_rate": 0.00018261357842219738, "loss": 0.0408, "step": 121250 }, { "epoch": 0.78, "learning_rate": 0.00018260389706784046, "loss": 0.0429, "step": 121260 }, { "epoch": 0.78, "learning_rate": 0.00018259421571348351, "loss": 0.0444, "step": 121270 }, { "epoch": 0.78, "learning_rate": 0.0001825845343591266, "loss": 0.04, "step": 121280 }, { "epoch": 0.78, "learning_rate": 0.00018257485300476967, "loss": 0.0409, "step": 121290 }, { "epoch": 0.78, "learning_rate": 0.00018256517165041275, "loss": 0.0427, "step": 121300 }, { "epoch": 0.78, "learning_rate": 0.00018255549029605578, "loss": 0.0383, "step": 121310 }, { "epoch": 0.78, "learning_rate": 0.00018254580894169886, "loss": 0.0467, "step": 121320 }, { "epoch": 0.78, "learning_rate": 0.00018253612758734194, "loss": 0.0352, "step": 121330 }, { "epoch": 0.78, "learning_rate": 0.000182526446232985, "loss": 0.0466, "step": 121340 }, { "epoch": 0.78, "learning_rate": 0.00018251676487862807, "loss": 0.0392, "step": 121350 }, { "epoch": 0.78, "learning_rate": 0.00018250708352427115, "loss": 0.0391, "step": 121360 }, { "epoch": 0.78, "learning_rate": 0.00018249740216991423, "loss": 0.0451, "step": 121370 }, { "epoch": 0.78, "learning_rate": 0.00018248772081555726, "loss": 0.0386, "step": 121380 }, { "epoch": 0.78, "learning_rate": 0.00018247803946120034, "loss": 0.0392, "step": 121390 }, { "epoch": 0.78, "learning_rate": 0.00018246835810684342, "loss": 0.0516, "step": 121400 }, { "epoch": 0.78, "learning_rate": 0.00018245867675248647, "loss": 0.0395, "step": 121410 }, { "epoch": 0.78, "learning_rate": 0.00018244899539812955, "loss": 0.0409, "step": 121420 }, { "epoch": 0.78, "learning_rate": 0.00018243931404377263, "loss": 0.047, "step": 121430 }, { "epoch": 0.78, "learning_rate": 0.0001824296326894157, "loss": 0.044, "step": 121440 }, { "epoch": 0.78, "learning_rate": 0.00018241995133505873, "loss": 0.0477, "step": 121450 }, { "epoch": 0.78, "learning_rate": 0.0001824102699807018, "loss": 0.0414, "step": 121460 }, { "epoch": 0.78, "learning_rate": 0.00018240058862634487, "loss": 0.0412, "step": 121470 }, { "epoch": 0.78, "learning_rate": 0.00018239090727198795, "loss": 0.0418, "step": 121480 }, { "epoch": 0.78, "learning_rate": 0.00018238122591763103, "loss": 0.0406, "step": 121490 }, { "epoch": 0.78, "learning_rate": 0.0001823715445632741, "loss": 0.0404, "step": 121500 }, { "epoch": 0.78, "learning_rate": 0.00018236186320891716, "loss": 0.0428, "step": 121510 }, { "epoch": 0.78, "learning_rate": 0.0001823521818545602, "loss": 0.0447, "step": 121520 }, { "epoch": 0.78, "learning_rate": 0.0001823425005002033, "loss": 0.0426, "step": 121530 }, { "epoch": 0.78, "learning_rate": 0.00018233281914584634, "loss": 0.0383, "step": 121540 }, { "epoch": 0.78, "learning_rate": 0.00018232313779148942, "loss": 0.0409, "step": 121550 }, { "epoch": 0.78, "learning_rate": 0.0001823134564371325, "loss": 0.0405, "step": 121560 }, { "epoch": 0.78, "learning_rate": 0.00018230377508277558, "loss": 0.037, "step": 121570 }, { "epoch": 0.78, "learning_rate": 0.00018229409372841864, "loss": 0.0405, "step": 121580 }, { "epoch": 0.78, "learning_rate": 0.0001822844123740617, "loss": 0.0409, "step": 121590 }, { "epoch": 0.78, "learning_rate": 0.00018227473101970477, "loss": 0.0355, "step": 121600 }, { "epoch": 0.78, "learning_rate": 0.00018226504966534782, "loss": 0.0528, "step": 121610 }, { "epoch": 0.78, "learning_rate": 0.0001822553683109909, "loss": 0.0413, "step": 121620 }, { "epoch": 0.79, "learning_rate": 0.00018224568695663398, "loss": 0.0371, "step": 121630 }, { "epoch": 0.79, "learning_rate": 0.00018223600560227706, "loss": 0.0406, "step": 121640 }, { "epoch": 0.79, "learning_rate": 0.0001822263242479201, "loss": 0.0398, "step": 121650 }, { "epoch": 0.79, "learning_rate": 0.00018221664289356317, "loss": 0.0439, "step": 121660 }, { "epoch": 0.79, "learning_rate": 0.00018220696153920622, "loss": 0.0466, "step": 121670 }, { "epoch": 0.79, "learning_rate": 0.0001821972801848493, "loss": 0.0405, "step": 121680 }, { "epoch": 0.79, "learning_rate": 0.00018218759883049238, "loss": 0.0435, "step": 121690 }, { "epoch": 0.79, "learning_rate": 0.00018217791747613546, "loss": 0.0404, "step": 121700 }, { "epoch": 0.79, "learning_rate": 0.0001821682361217785, "loss": 0.0472, "step": 121710 }, { "epoch": 0.79, "learning_rate": 0.0001821585547674216, "loss": 0.0403, "step": 121720 }, { "epoch": 0.79, "learning_rate": 0.00018214887341306464, "loss": 0.0425, "step": 121730 }, { "epoch": 0.79, "learning_rate": 0.0001821391920587077, "loss": 0.0447, "step": 121740 }, { "epoch": 0.79, "learning_rate": 0.00018212951070435077, "loss": 0.0375, "step": 121750 }, { "epoch": 0.79, "learning_rate": 0.00018211982934999385, "loss": 0.0417, "step": 121760 }, { "epoch": 0.79, "learning_rate": 0.00018211014799563693, "loss": 0.0444, "step": 121770 }, { "epoch": 0.79, "learning_rate": 0.00018210046664128, "loss": 0.0414, "step": 121780 }, { "epoch": 0.79, "learning_rate": 0.00018209078528692307, "loss": 0.0475, "step": 121790 }, { "epoch": 0.79, "learning_rate": 0.00018208110393256612, "loss": 0.0436, "step": 121800 }, { "epoch": 0.79, "learning_rate": 0.00018207142257820917, "loss": 0.0433, "step": 121810 }, { "epoch": 0.79, "learning_rate": 0.00018206174122385225, "loss": 0.0383, "step": 121820 }, { "epoch": 0.79, "learning_rate": 0.00018205205986949533, "loss": 0.0402, "step": 121830 }, { "epoch": 0.79, "learning_rate": 0.0001820423785151384, "loss": 0.0479, "step": 121840 }, { "epoch": 0.79, "learning_rate": 0.00018203269716078146, "loss": 0.0493, "step": 121850 }, { "epoch": 0.79, "learning_rate": 0.00018202301580642454, "loss": 0.0417, "step": 121860 }, { "epoch": 0.79, "learning_rate": 0.00018201333445206757, "loss": 0.0447, "step": 121870 }, { "epoch": 0.79, "learning_rate": 0.00018200365309771065, "loss": 0.046, "step": 121880 }, { "epoch": 0.79, "learning_rate": 0.00018199397174335373, "loss": 0.0388, "step": 121890 }, { "epoch": 0.79, "learning_rate": 0.0001819842903889968, "loss": 0.0429, "step": 121900 }, { "epoch": 0.79, "learning_rate": 0.00018197460903463986, "loss": 0.043, "step": 121910 }, { "epoch": 0.79, "learning_rate": 0.00018196492768028294, "loss": 0.0409, "step": 121920 }, { "epoch": 0.79, "learning_rate": 0.00018195524632592602, "loss": 0.0413, "step": 121930 }, { "epoch": 0.79, "learning_rate": 0.00018194556497156905, "loss": 0.036, "step": 121940 }, { "epoch": 0.79, "learning_rate": 0.00018193588361721213, "loss": 0.0408, "step": 121950 }, { "epoch": 0.79, "learning_rate": 0.0001819262022628552, "loss": 0.0478, "step": 121960 }, { "epoch": 0.79, "learning_rate": 0.00018191652090849829, "loss": 0.044, "step": 121970 }, { "epoch": 0.79, "learning_rate": 0.00018190683955414134, "loss": 0.0502, "step": 121980 }, { "epoch": 0.79, "learning_rate": 0.00018189715819978442, "loss": 0.0409, "step": 121990 }, { "epoch": 0.79, "learning_rate": 0.0001818874768454275, "loss": 0.0437, "step": 122000 }, { "epoch": 0.79, "eval_cer": 0.9198617105411818, "eval_loss": 0.028577525168657303, "eval_runtime": 120.1701, "eval_samples_per_second": 16.643, "eval_steps_per_second": 4.161, "step": 122000 }, { "epoch": 0.79, "learning_rate": 0.00018187779549107052, "loss": 0.0392, "step": 122010 }, { "epoch": 0.79, "learning_rate": 0.0001818681141367136, "loss": 0.0412, "step": 122020 }, { "epoch": 0.79, "learning_rate": 0.00018185843278235668, "loss": 0.0414, "step": 122030 }, { "epoch": 0.79, "learning_rate": 0.00018184875142799976, "loss": 0.049, "step": 122040 }, { "epoch": 0.79, "learning_rate": 0.00018183907007364282, "loss": 0.038, "step": 122050 }, { "epoch": 0.79, "learning_rate": 0.0001818293887192859, "loss": 0.0456, "step": 122060 }, { "epoch": 0.79, "learning_rate": 0.00018181970736492898, "loss": 0.0418, "step": 122070 }, { "epoch": 0.79, "learning_rate": 0.000181810026010572, "loss": 0.0422, "step": 122080 }, { "epoch": 0.79, "learning_rate": 0.00018180034465621508, "loss": 0.0392, "step": 122090 }, { "epoch": 0.79, "learning_rate": 0.00018179066330185816, "loss": 0.0377, "step": 122100 }, { "epoch": 0.79, "learning_rate": 0.00018178098194750121, "loss": 0.0398, "step": 122110 }, { "epoch": 0.79, "learning_rate": 0.0001817713005931443, "loss": 0.0417, "step": 122120 }, { "epoch": 0.79, "learning_rate": 0.00018176161923878737, "loss": 0.0403, "step": 122130 }, { "epoch": 0.79, "learning_rate": 0.00018175193788443045, "loss": 0.0431, "step": 122140 }, { "epoch": 0.79, "learning_rate": 0.00018174225653007348, "loss": 0.0439, "step": 122150 }, { "epoch": 0.79, "learning_rate": 0.00018173257517571656, "loss": 0.0469, "step": 122160 }, { "epoch": 0.79, "learning_rate": 0.00018172289382135964, "loss": 0.0407, "step": 122170 }, { "epoch": 0.79, "learning_rate": 0.0001817132124670027, "loss": 0.0426, "step": 122180 }, { "epoch": 0.79, "learning_rate": 0.00018170353111264577, "loss": 0.0447, "step": 122190 }, { "epoch": 0.79, "learning_rate": 0.00018169384975828885, "loss": 0.0438, "step": 122200 }, { "epoch": 0.79, "learning_rate": 0.00018168416840393193, "loss": 0.04, "step": 122210 }, { "epoch": 0.79, "learning_rate": 0.00018167448704957496, "loss": 0.0423, "step": 122220 }, { "epoch": 0.79, "learning_rate": 0.00018166480569521804, "loss": 0.0494, "step": 122230 }, { "epoch": 0.79, "learning_rate": 0.00018165512434086112, "loss": 0.0421, "step": 122240 }, { "epoch": 0.79, "learning_rate": 0.00018164544298650417, "loss": 0.0453, "step": 122250 }, { "epoch": 0.79, "learning_rate": 0.00018163576163214725, "loss": 0.0417, "step": 122260 }, { "epoch": 0.79, "learning_rate": 0.00018162608027779033, "loss": 0.0451, "step": 122270 }, { "epoch": 0.79, "learning_rate": 0.00018161639892343338, "loss": 0.0361, "step": 122280 }, { "epoch": 0.79, "learning_rate": 0.00018160671756907643, "loss": 0.0395, "step": 122290 }, { "epoch": 0.79, "learning_rate": 0.0001815970362147195, "loss": 0.0419, "step": 122300 }, { "epoch": 0.79, "learning_rate": 0.00018158735486036257, "loss": 0.0433, "step": 122310 }, { "epoch": 0.79, "learning_rate": 0.00018157767350600565, "loss": 0.0469, "step": 122320 }, { "epoch": 0.79, "learning_rate": 0.00018156799215164873, "loss": 0.0382, "step": 122330 }, { "epoch": 0.79, "learning_rate": 0.0001815583107972918, "loss": 0.041, "step": 122340 }, { "epoch": 0.79, "learning_rate": 0.00018154862944293486, "loss": 0.0466, "step": 122350 }, { "epoch": 0.79, "learning_rate": 0.0001815389480885779, "loss": 0.0423, "step": 122360 }, { "epoch": 0.79, "learning_rate": 0.000181529266734221, "loss": 0.0409, "step": 122370 }, { "epoch": 0.79, "learning_rate": 0.00018151958537986404, "loss": 0.0368, "step": 122380 }, { "epoch": 0.79, "learning_rate": 0.00018150990402550712, "loss": 0.0403, "step": 122390 }, { "epoch": 0.79, "learning_rate": 0.0001815002226711502, "loss": 0.0406, "step": 122400 }, { "epoch": 0.79, "learning_rate": 0.00018149054131679328, "loss": 0.0427, "step": 122410 }, { "epoch": 0.79, "learning_rate": 0.00018148085996243633, "loss": 0.0399, "step": 122420 }, { "epoch": 0.79, "learning_rate": 0.0001814711786080794, "loss": 0.0492, "step": 122430 }, { "epoch": 0.79, "learning_rate": 0.00018146149725372247, "loss": 0.0457, "step": 122440 }, { "epoch": 0.79, "learning_rate": 0.00018145181589936552, "loss": 0.0567, "step": 122450 }, { "epoch": 0.79, "learning_rate": 0.0001814421345450086, "loss": 0.0425, "step": 122460 }, { "epoch": 0.79, "learning_rate": 0.00018143245319065168, "loss": 0.0411, "step": 122470 }, { "epoch": 0.79, "learning_rate": 0.00018142277183629473, "loss": 0.0401, "step": 122480 }, { "epoch": 0.79, "learning_rate": 0.0001814130904819378, "loss": 0.0471, "step": 122490 }, { "epoch": 0.79, "learning_rate": 0.00018140340912758086, "loss": 0.044, "step": 122500 }, { "epoch": 0.79, "learning_rate": 0.00018139372777322392, "loss": 0.0362, "step": 122510 }, { "epoch": 0.79, "learning_rate": 0.000181384046418867, "loss": 0.0564, "step": 122520 }, { "epoch": 0.79, "learning_rate": 0.00018137436506451008, "loss": 0.0446, "step": 122530 }, { "epoch": 0.79, "learning_rate": 0.00018136468371015316, "loss": 0.0444, "step": 122540 }, { "epoch": 0.79, "learning_rate": 0.0001813550023557962, "loss": 0.0431, "step": 122550 }, { "epoch": 0.79, "learning_rate": 0.0001813453210014393, "loss": 0.0413, "step": 122560 }, { "epoch": 0.79, "learning_rate": 0.00018133563964708234, "loss": 0.0418, "step": 122570 }, { "epoch": 0.79, "learning_rate": 0.0001813259582927254, "loss": 0.05, "step": 122580 }, { "epoch": 0.79, "learning_rate": 0.00018131627693836847, "loss": 0.044, "step": 122590 }, { "epoch": 0.79, "learning_rate": 0.00018130659558401155, "loss": 0.0391, "step": 122600 }, { "epoch": 0.79, "learning_rate": 0.00018129691422965463, "loss": 0.0466, "step": 122610 }, { "epoch": 0.79, "learning_rate": 0.0001812872328752977, "loss": 0.0549, "step": 122620 }, { "epoch": 0.79, "learning_rate": 0.00018127755152094077, "loss": 0.0499, "step": 122630 }, { "epoch": 0.79, "learning_rate": 0.00018126787016658382, "loss": 0.0438, "step": 122640 }, { "epoch": 0.79, "learning_rate": 0.00018125818881222687, "loss": 0.0403, "step": 122650 }, { "epoch": 0.79, "learning_rate": 0.00018124850745786995, "loss": 0.0416, "step": 122660 }, { "epoch": 0.79, "learning_rate": 0.00018123882610351303, "loss": 0.035, "step": 122670 }, { "epoch": 0.79, "learning_rate": 0.00018122914474915608, "loss": 0.0451, "step": 122680 }, { "epoch": 0.79, "learning_rate": 0.00018121946339479916, "loss": 0.0402, "step": 122690 }, { "epoch": 0.79, "learning_rate": 0.00018120978204044224, "loss": 0.0413, "step": 122700 }, { "epoch": 0.79, "learning_rate": 0.00018120010068608527, "loss": 0.0393, "step": 122710 }, { "epoch": 0.79, "learning_rate": 0.00018119041933172835, "loss": 0.0445, "step": 122720 }, { "epoch": 0.79, "learning_rate": 0.00018118073797737143, "loss": 0.0408, "step": 122730 }, { "epoch": 0.79, "learning_rate": 0.0001811710566230145, "loss": 0.038, "step": 122740 }, { "epoch": 0.79, "learning_rate": 0.00018116137526865756, "loss": 0.042, "step": 122750 }, { "epoch": 0.79, "learning_rate": 0.00018115169391430064, "loss": 0.0491, "step": 122760 }, { "epoch": 0.79, "learning_rate": 0.00018114201255994372, "loss": 0.0413, "step": 122770 }, { "epoch": 0.79, "learning_rate": 0.00018113233120558675, "loss": 0.0562, "step": 122780 }, { "epoch": 0.79, "learning_rate": 0.00018112264985122983, "loss": 0.0416, "step": 122790 }, { "epoch": 0.79, "learning_rate": 0.0001811129684968729, "loss": 0.0394, "step": 122800 }, { "epoch": 0.79, "learning_rate": 0.00018110328714251599, "loss": 0.04, "step": 122810 }, { "epoch": 0.79, "learning_rate": 0.00018109360578815904, "loss": 0.0432, "step": 122820 }, { "epoch": 0.79, "learning_rate": 0.00018108392443380212, "loss": 0.0475, "step": 122830 }, { "epoch": 0.79, "learning_rate": 0.0001810742430794452, "loss": 0.0402, "step": 122840 }, { "epoch": 0.79, "learning_rate": 0.00018106456172508822, "loss": 0.0397, "step": 122850 }, { "epoch": 0.79, "learning_rate": 0.0001810548803707313, "loss": 0.0455, "step": 122860 }, { "epoch": 0.79, "learning_rate": 0.00018104519901637438, "loss": 0.0462, "step": 122870 }, { "epoch": 0.79, "learning_rate": 0.00018103551766201744, "loss": 0.0453, "step": 122880 }, { "epoch": 0.79, "learning_rate": 0.00018102583630766052, "loss": 0.0509, "step": 122890 }, { "epoch": 0.79, "learning_rate": 0.0001810161549533036, "loss": 0.0442, "step": 122900 }, { "epoch": 0.79, "learning_rate": 0.00018100647359894668, "loss": 0.0431, "step": 122910 }, { "epoch": 0.79, "learning_rate": 0.0001809967922445897, "loss": 0.042, "step": 122920 }, { "epoch": 0.79, "learning_rate": 0.00018098711089023278, "loss": 0.0471, "step": 122930 }, { "epoch": 0.79, "learning_rate": 0.00018097742953587586, "loss": 0.0413, "step": 122940 }, { "epoch": 0.79, "learning_rate": 0.0001809677481815189, "loss": 0.0395, "step": 122950 }, { "epoch": 0.79, "learning_rate": 0.000180958066827162, "loss": 0.0459, "step": 122960 }, { "epoch": 0.79, "learning_rate": 0.00018094838547280507, "loss": 0.0457, "step": 122970 }, { "epoch": 0.79, "learning_rate": 0.00018093870411844815, "loss": 0.0395, "step": 122980 }, { "epoch": 0.79, "learning_rate": 0.00018092902276409118, "loss": 0.0393, "step": 122990 }, { "epoch": 0.79, "learning_rate": 0.00018091934140973426, "loss": 0.0512, "step": 123000 }, { "epoch": 0.79, "eval_cer": 0.9199557112190713, "eval_loss": 0.028470169752836227, "eval_runtime": 120.5044, "eval_samples_per_second": 16.597, "eval_steps_per_second": 4.149, "step": 123000 }, { "epoch": 0.79, "learning_rate": 0.00018090966005537734, "loss": 0.0497, "step": 123010 }, { "epoch": 0.79, "learning_rate": 0.0001808999787010204, "loss": 0.0392, "step": 123020 }, { "epoch": 0.79, "learning_rate": 0.00018089029734666347, "loss": 0.041, "step": 123030 }, { "epoch": 0.79, "learning_rate": 0.00018088061599230655, "loss": 0.0441, "step": 123040 }, { "epoch": 0.79, "learning_rate": 0.0001808709346379496, "loss": 0.0418, "step": 123050 }, { "epoch": 0.79, "learning_rate": 0.00018086125328359266, "loss": 0.0438, "step": 123060 }, { "epoch": 0.79, "learning_rate": 0.00018085157192923574, "loss": 0.0466, "step": 123070 }, { "epoch": 0.79, "learning_rate": 0.0001808418905748788, "loss": 0.0421, "step": 123080 }, { "epoch": 0.79, "learning_rate": 0.00018083220922052187, "loss": 0.039, "step": 123090 }, { "epoch": 0.79, "learning_rate": 0.00018082252786616495, "loss": 0.0419, "step": 123100 }, { "epoch": 0.79, "learning_rate": 0.00018081284651180803, "loss": 0.0413, "step": 123110 }, { "epoch": 0.79, "learning_rate": 0.00018080316515745108, "loss": 0.0429, "step": 123120 }, { "epoch": 0.79, "learning_rate": 0.00018079348380309413, "loss": 0.0419, "step": 123130 }, { "epoch": 0.79, "learning_rate": 0.0001807838024487372, "loss": 0.0502, "step": 123140 }, { "epoch": 0.79, "learning_rate": 0.00018077412109438027, "loss": 0.0367, "step": 123150 }, { "epoch": 0.79, "learning_rate": 0.00018076443974002334, "loss": 0.0345, "step": 123160 }, { "epoch": 0.79, "learning_rate": 0.00018075475838566642, "loss": 0.037, "step": 123170 }, { "epoch": 0.8, "learning_rate": 0.0001807450770313095, "loss": 0.0378, "step": 123180 }, { "epoch": 0.8, "learning_rate": 0.00018073539567695256, "loss": 0.0434, "step": 123190 }, { "epoch": 0.8, "learning_rate": 0.0001807257143225956, "loss": 0.0393, "step": 123200 }, { "epoch": 0.8, "learning_rate": 0.0001807160329682387, "loss": 0.0417, "step": 123210 }, { "epoch": 0.8, "learning_rate": 0.00018070635161388174, "loss": 0.0395, "step": 123220 }, { "epoch": 0.8, "learning_rate": 0.00018069667025952482, "loss": 0.0413, "step": 123230 }, { "epoch": 0.8, "learning_rate": 0.0001806869889051679, "loss": 0.0443, "step": 123240 }, { "epoch": 0.8, "learning_rate": 0.00018067730755081095, "loss": 0.0431, "step": 123250 }, { "epoch": 0.8, "learning_rate": 0.00018066762619645403, "loss": 0.0407, "step": 123260 }, { "epoch": 0.8, "learning_rate": 0.0001806579448420971, "loss": 0.0443, "step": 123270 }, { "epoch": 0.8, "learning_rate": 0.00018064826348774014, "loss": 0.0403, "step": 123280 }, { "epoch": 0.8, "learning_rate": 0.00018063858213338322, "loss": 0.0446, "step": 123290 }, { "epoch": 0.8, "learning_rate": 0.0001806289007790263, "loss": 0.0427, "step": 123300 }, { "epoch": 0.8, "learning_rate": 0.00018061921942466938, "loss": 0.0539, "step": 123310 }, { "epoch": 0.8, "learning_rate": 0.00018060953807031243, "loss": 0.0481, "step": 123320 }, { "epoch": 0.8, "learning_rate": 0.0001805998567159555, "loss": 0.0467, "step": 123330 }, { "epoch": 0.8, "learning_rate": 0.00018059017536159856, "loss": 0.0444, "step": 123340 }, { "epoch": 0.8, "learning_rate": 0.00018058049400724162, "loss": 0.0419, "step": 123350 }, { "epoch": 0.8, "learning_rate": 0.0001805708126528847, "loss": 0.0467, "step": 123360 }, { "epoch": 0.8, "learning_rate": 0.00018056113129852778, "loss": 0.0411, "step": 123370 }, { "epoch": 0.8, "learning_rate": 0.00018055144994417086, "loss": 0.0427, "step": 123380 }, { "epoch": 0.8, "learning_rate": 0.0001805417685898139, "loss": 0.0398, "step": 123390 }, { "epoch": 0.8, "learning_rate": 0.000180532087235457, "loss": 0.0514, "step": 123400 }, { "epoch": 0.8, "learning_rate": 0.00018052240588110004, "loss": 0.0387, "step": 123410 }, { "epoch": 0.8, "learning_rate": 0.0001805127245267431, "loss": 0.0464, "step": 123420 }, { "epoch": 0.8, "learning_rate": 0.00018050304317238617, "loss": 0.0445, "step": 123430 }, { "epoch": 0.8, "learning_rate": 0.00018049336181802925, "loss": 0.042, "step": 123440 }, { "epoch": 0.8, "learning_rate": 0.0001804836804636723, "loss": 0.0413, "step": 123450 }, { "epoch": 0.8, "learning_rate": 0.00018047399910931539, "loss": 0.0454, "step": 123460 }, { "epoch": 0.8, "learning_rate": 0.00018046431775495847, "loss": 0.0383, "step": 123470 }, { "epoch": 0.8, "learning_rate": 0.0001804546364006015, "loss": 0.0393, "step": 123480 }, { "epoch": 0.8, "learning_rate": 0.00018044495504624457, "loss": 0.0388, "step": 123490 }, { "epoch": 0.8, "learning_rate": 0.00018043527369188765, "loss": 0.0455, "step": 123500 }, { "epoch": 0.8, "learning_rate": 0.00018042559233753073, "loss": 0.0487, "step": 123510 }, { "epoch": 0.8, "learning_rate": 0.00018041591098317378, "loss": 0.0377, "step": 123520 }, { "epoch": 0.8, "learning_rate": 0.00018040622962881686, "loss": 0.0405, "step": 123530 }, { "epoch": 0.8, "learning_rate": 0.00018039654827445994, "loss": 0.0439, "step": 123540 }, { "epoch": 0.8, "learning_rate": 0.00018038686692010297, "loss": 0.0545, "step": 123550 }, { "epoch": 0.8, "learning_rate": 0.00018037718556574605, "loss": 0.0394, "step": 123560 }, { "epoch": 0.8, "learning_rate": 0.00018036750421138913, "loss": 0.042, "step": 123570 }, { "epoch": 0.8, "learning_rate": 0.0001803578228570322, "loss": 0.0477, "step": 123580 }, { "epoch": 0.8, "learning_rate": 0.00018034814150267526, "loss": 0.045, "step": 123590 }, { "epoch": 0.8, "learning_rate": 0.00018033846014831834, "loss": 0.0394, "step": 123600 }, { "epoch": 0.8, "learning_rate": 0.00018032877879396142, "loss": 0.0461, "step": 123610 }, { "epoch": 0.8, "learning_rate": 0.00018031909743960445, "loss": 0.0422, "step": 123620 }, { "epoch": 0.8, "learning_rate": 0.00018030941608524753, "loss": 0.0426, "step": 123630 }, { "epoch": 0.8, "learning_rate": 0.0001802997347308906, "loss": 0.04, "step": 123640 }, { "epoch": 0.8, "learning_rate": 0.00018029005337653366, "loss": 0.0424, "step": 123650 }, { "epoch": 0.8, "learning_rate": 0.00018028037202217674, "loss": 0.048, "step": 123660 }, { "epoch": 0.8, "learning_rate": 0.00018027069066781982, "loss": 0.0471, "step": 123670 }, { "epoch": 0.8, "learning_rate": 0.0001802610093134629, "loss": 0.0413, "step": 123680 }, { "epoch": 0.8, "learning_rate": 0.00018025132795910592, "loss": 0.0395, "step": 123690 }, { "epoch": 0.8, "learning_rate": 0.000180241646604749, "loss": 0.0398, "step": 123700 }, { "epoch": 0.8, "learning_rate": 0.00018023196525039208, "loss": 0.0429, "step": 123710 }, { "epoch": 0.8, "learning_rate": 0.00018022228389603514, "loss": 0.0391, "step": 123720 }, { "epoch": 0.8, "learning_rate": 0.00018021260254167822, "loss": 0.0376, "step": 123730 }, { "epoch": 0.8, "learning_rate": 0.0001802029211873213, "loss": 0.0422, "step": 123740 }, { "epoch": 0.8, "learning_rate": 0.00018019323983296438, "loss": 0.0425, "step": 123750 }, { "epoch": 0.8, "learning_rate": 0.0001801835584786074, "loss": 0.0378, "step": 123760 }, { "epoch": 0.8, "learning_rate": 0.00018017387712425048, "loss": 0.0423, "step": 123770 }, { "epoch": 0.8, "learning_rate": 0.00018016419576989356, "loss": 0.0435, "step": 123780 }, { "epoch": 0.8, "learning_rate": 0.0001801545144155366, "loss": 0.047, "step": 123790 }, { "epoch": 0.8, "learning_rate": 0.0001801448330611797, "loss": 0.0393, "step": 123800 }, { "epoch": 0.8, "learning_rate": 0.00018013515170682277, "loss": 0.0401, "step": 123810 }, { "epoch": 0.8, "learning_rate": 0.00018012547035246585, "loss": 0.0382, "step": 123820 }, { "epoch": 0.8, "learning_rate": 0.00018011578899810888, "loss": 0.0439, "step": 123830 }, { "epoch": 0.8, "learning_rate": 0.00018010610764375196, "loss": 0.0571, "step": 123840 }, { "epoch": 0.8, "learning_rate": 0.000180096426289395, "loss": 0.052, "step": 123850 }, { "epoch": 0.8, "learning_rate": 0.0001800867449350381, "loss": 0.0403, "step": 123860 }, { "epoch": 0.8, "learning_rate": 0.00018007706358068117, "loss": 0.0421, "step": 123870 }, { "epoch": 0.8, "learning_rate": 0.00018006738222632425, "loss": 0.041, "step": 123880 }, { "epoch": 0.8, "learning_rate": 0.0001800577008719673, "loss": 0.0447, "step": 123890 }, { "epoch": 0.8, "learning_rate": 0.00018004801951761036, "loss": 0.0358, "step": 123900 }, { "epoch": 0.8, "learning_rate": 0.00018003833816325343, "loss": 0.0426, "step": 123910 }, { "epoch": 0.8, "learning_rate": 0.0001800286568088965, "loss": 0.0456, "step": 123920 }, { "epoch": 0.8, "learning_rate": 0.00018001897545453957, "loss": 0.0377, "step": 123930 }, { "epoch": 0.8, "learning_rate": 0.00018000929410018265, "loss": 0.0432, "step": 123940 }, { "epoch": 0.8, "learning_rate": 0.00017999961274582573, "loss": 0.048, "step": 123950 }, { "epoch": 0.8, "learning_rate": 0.00017998993139146878, "loss": 0.04, "step": 123960 }, { "epoch": 0.8, "learning_rate": 0.00017998025003711183, "loss": 0.0436, "step": 123970 }, { "epoch": 0.8, "learning_rate": 0.0001799705686827549, "loss": 0.0347, "step": 123980 }, { "epoch": 0.8, "learning_rate": 0.00017996088732839796, "loss": 0.0524, "step": 123990 }, { "epoch": 0.8, "learning_rate": 0.00017995120597404104, "loss": 0.0427, "step": 124000 }, { "epoch": 0.8, "eval_cer": 0.9199322110495989, "eval_loss": 0.02851358987390995, "eval_runtime": 120.0347, "eval_samples_per_second": 16.662, "eval_steps_per_second": 4.165, "step": 124000 }, { "epoch": 0.8, "learning_rate": 0.00017994152461968412, "loss": 0.0427, "step": 124010 }, { "epoch": 0.8, "learning_rate": 0.0001799318432653272, "loss": 0.0406, "step": 124020 }, { "epoch": 0.8, "learning_rate": 0.00017992216191097026, "loss": 0.0433, "step": 124030 }, { "epoch": 0.8, "learning_rate": 0.0001799124805566133, "loss": 0.0464, "step": 124040 }, { "epoch": 0.8, "learning_rate": 0.0001799027992022564, "loss": 0.0488, "step": 124050 }, { "epoch": 0.8, "learning_rate": 0.00017989311784789944, "loss": 0.0359, "step": 124060 }, { "epoch": 0.8, "learning_rate": 0.00017988343649354252, "loss": 0.0368, "step": 124070 }, { "epoch": 0.8, "learning_rate": 0.0001798737551391856, "loss": 0.0484, "step": 124080 }, { "epoch": 0.8, "learning_rate": 0.00017986407378482865, "loss": 0.0388, "step": 124090 }, { "epoch": 0.8, "learning_rate": 0.00017985439243047173, "loss": 0.0451, "step": 124100 }, { "epoch": 0.8, "learning_rate": 0.0001798447110761148, "loss": 0.04, "step": 124110 }, { "epoch": 0.8, "learning_rate": 0.00017983502972175784, "loss": 0.0372, "step": 124120 }, { "epoch": 0.8, "learning_rate": 0.00017982534836740092, "loss": 0.0458, "step": 124130 }, { "epoch": 0.8, "learning_rate": 0.000179815667013044, "loss": 0.0421, "step": 124140 }, { "epoch": 0.8, "learning_rate": 0.00017980598565868708, "loss": 0.039, "step": 124150 }, { "epoch": 0.8, "learning_rate": 0.00017979630430433013, "loss": 0.0429, "step": 124160 }, { "epoch": 0.8, "learning_rate": 0.0001797866229499732, "loss": 0.0469, "step": 124170 }, { "epoch": 0.8, "learning_rate": 0.00017977694159561626, "loss": 0.0422, "step": 124180 }, { "epoch": 0.8, "learning_rate": 0.00017976726024125932, "loss": 0.041, "step": 124190 }, { "epoch": 0.8, "learning_rate": 0.0001797575788869024, "loss": 0.0453, "step": 124200 }, { "epoch": 0.8, "learning_rate": 0.00017974789753254548, "loss": 0.0416, "step": 124210 }, { "epoch": 0.8, "learning_rate": 0.00017973821617818856, "loss": 0.0487, "step": 124220 }, { "epoch": 0.8, "learning_rate": 0.0001797285348238316, "loss": 0.0436, "step": 124230 }, { "epoch": 0.8, "learning_rate": 0.0001797188534694747, "loss": 0.0462, "step": 124240 }, { "epoch": 0.8, "learning_rate": 0.00017970917211511774, "loss": 0.0436, "step": 124250 }, { "epoch": 0.8, "learning_rate": 0.0001796994907607608, "loss": 0.0456, "step": 124260 }, { "epoch": 0.8, "learning_rate": 0.00017968980940640387, "loss": 0.0457, "step": 124270 }, { "epoch": 0.8, "learning_rate": 0.00017968012805204695, "loss": 0.0408, "step": 124280 }, { "epoch": 0.8, "learning_rate": 0.00017967044669769, "loss": 0.0421, "step": 124290 }, { "epoch": 0.8, "learning_rate": 0.00017966076534333309, "loss": 0.0431, "step": 124300 }, { "epoch": 0.8, "learning_rate": 0.00017965108398897617, "loss": 0.0403, "step": 124310 }, { "epoch": 0.8, "learning_rate": 0.0001796414026346192, "loss": 0.0445, "step": 124320 }, { "epoch": 0.8, "learning_rate": 0.00017963172128026227, "loss": 0.0405, "step": 124330 }, { "epoch": 0.8, "learning_rate": 0.00017962203992590535, "loss": 0.0401, "step": 124340 }, { "epoch": 0.8, "learning_rate": 0.00017961235857154843, "loss": 0.04, "step": 124350 }, { "epoch": 0.8, "learning_rate": 0.00017960267721719148, "loss": 0.0392, "step": 124360 }, { "epoch": 0.8, "learning_rate": 0.00017959299586283456, "loss": 0.0405, "step": 124370 }, { "epoch": 0.8, "learning_rate": 0.00017958331450847764, "loss": 0.0501, "step": 124380 }, { "epoch": 0.8, "learning_rate": 0.00017957363315412067, "loss": 0.0421, "step": 124390 }, { "epoch": 0.8, "learning_rate": 0.00017956395179976375, "loss": 0.0413, "step": 124400 }, { "epoch": 0.8, "learning_rate": 0.00017955427044540683, "loss": 0.0385, "step": 124410 }, { "epoch": 0.8, "learning_rate": 0.0001795445890910499, "loss": 0.045, "step": 124420 }, { "epoch": 0.8, "learning_rate": 0.00017953490773669296, "loss": 0.0403, "step": 124430 }, { "epoch": 0.8, "learning_rate": 0.00017952522638233604, "loss": 0.0437, "step": 124440 }, { "epoch": 0.8, "learning_rate": 0.00017951554502797912, "loss": 0.0403, "step": 124450 }, { "epoch": 0.8, "learning_rate": 0.00017950586367362215, "loss": 0.0444, "step": 124460 }, { "epoch": 0.8, "learning_rate": 0.00017949618231926523, "loss": 0.0474, "step": 124470 }, { "epoch": 0.8, "learning_rate": 0.0001794865009649083, "loss": 0.0477, "step": 124480 }, { "epoch": 0.8, "learning_rate": 0.00017947681961055136, "loss": 0.0481, "step": 124490 }, { "epoch": 0.8, "learning_rate": 0.00017946713825619444, "loss": 0.0429, "step": 124500 }, { "epoch": 0.8, "learning_rate": 0.00017945745690183752, "loss": 0.044, "step": 124510 }, { "epoch": 0.8, "learning_rate": 0.0001794477755474806, "loss": 0.0468, "step": 124520 }, { "epoch": 0.8, "learning_rate": 0.00017943809419312362, "loss": 0.0445, "step": 124530 }, { "epoch": 0.8, "learning_rate": 0.0001794284128387667, "loss": 0.0368, "step": 124540 }, { "epoch": 0.8, "learning_rate": 0.00017941873148440978, "loss": 0.0411, "step": 124550 }, { "epoch": 0.8, "learning_rate": 0.00017940905013005284, "loss": 0.0366, "step": 124560 }, { "epoch": 0.8, "learning_rate": 0.00017939936877569592, "loss": 0.0438, "step": 124570 }, { "epoch": 0.8, "learning_rate": 0.000179389687421339, "loss": 0.0437, "step": 124580 }, { "epoch": 0.8, "learning_rate": 0.00017938000606698207, "loss": 0.0402, "step": 124590 }, { "epoch": 0.8, "learning_rate": 0.0001793703247126251, "loss": 0.0423, "step": 124600 }, { "epoch": 0.8, "learning_rate": 0.00017936064335826818, "loss": 0.0489, "step": 124610 }, { "epoch": 0.8, "learning_rate": 0.00017935096200391126, "loss": 0.0469, "step": 124620 }, { "epoch": 0.8, "learning_rate": 0.0001793412806495543, "loss": 0.0451, "step": 124630 }, { "epoch": 0.8, "learning_rate": 0.0001793315992951974, "loss": 0.0426, "step": 124640 }, { "epoch": 0.8, "learning_rate": 0.00017932191794084047, "loss": 0.0435, "step": 124650 }, { "epoch": 0.8, "learning_rate": 0.00017931223658648352, "loss": 0.0416, "step": 124660 }, { "epoch": 0.8, "learning_rate": 0.00017930255523212658, "loss": 0.042, "step": 124670 }, { "epoch": 0.8, "learning_rate": 0.00017929287387776966, "loss": 0.0523, "step": 124680 }, { "epoch": 0.8, "learning_rate": 0.0001792831925234127, "loss": 0.0401, "step": 124690 }, { "epoch": 0.8, "learning_rate": 0.0001792735111690558, "loss": 0.0499, "step": 124700 }, { "epoch": 0.8, "learning_rate": 0.00017926382981469887, "loss": 0.0482, "step": 124710 }, { "epoch": 0.8, "learning_rate": 0.00017925414846034195, "loss": 0.0429, "step": 124720 }, { "epoch": 0.81, "learning_rate": 0.000179244467105985, "loss": 0.0513, "step": 124730 }, { "epoch": 0.81, "learning_rate": 0.00017923478575162805, "loss": 0.0387, "step": 124740 }, { "epoch": 0.81, "learning_rate": 0.00017922510439727113, "loss": 0.0408, "step": 124750 }, { "epoch": 0.81, "learning_rate": 0.0001792154230429142, "loss": 0.0388, "step": 124760 }, { "epoch": 0.81, "learning_rate": 0.00017920574168855727, "loss": 0.0441, "step": 124770 }, { "epoch": 0.81, "learning_rate": 0.00017919606033420035, "loss": 0.0433, "step": 124780 }, { "epoch": 0.81, "learning_rate": 0.00017918637897984343, "loss": 0.0525, "step": 124790 }, { "epoch": 0.81, "learning_rate": 0.00017917669762548648, "loss": 0.0428, "step": 124800 }, { "epoch": 0.81, "learning_rate": 0.00017916701627112953, "loss": 0.0408, "step": 124810 }, { "epoch": 0.81, "learning_rate": 0.0001791573349167726, "loss": 0.0453, "step": 124820 }, { "epoch": 0.81, "learning_rate": 0.00017914765356241566, "loss": 0.0426, "step": 124830 }, { "epoch": 0.81, "learning_rate": 0.00017913797220805874, "loss": 0.0424, "step": 124840 }, { "epoch": 0.81, "learning_rate": 0.00017912829085370182, "loss": 0.0411, "step": 124850 }, { "epoch": 0.81, "learning_rate": 0.00017911860949934488, "loss": 0.0396, "step": 124860 }, { "epoch": 0.81, "learning_rate": 0.00017910892814498796, "loss": 0.039, "step": 124870 }, { "epoch": 0.81, "learning_rate": 0.000179099246790631, "loss": 0.0395, "step": 124880 }, { "epoch": 0.81, "learning_rate": 0.00017908956543627406, "loss": 0.0391, "step": 124890 }, { "epoch": 0.81, "learning_rate": 0.00017907988408191714, "loss": 0.0425, "step": 124900 }, { "epoch": 0.81, "learning_rate": 0.00017907020272756022, "loss": 0.0445, "step": 124910 }, { "epoch": 0.81, "learning_rate": 0.0001790605213732033, "loss": 0.0444, "step": 124920 }, { "epoch": 0.81, "learning_rate": 0.00017905084001884635, "loss": 0.0433, "step": 124930 }, { "epoch": 0.81, "learning_rate": 0.00017904115866448943, "loss": 0.0423, "step": 124940 }, { "epoch": 0.81, "learning_rate": 0.00017903147731013249, "loss": 0.0402, "step": 124950 }, { "epoch": 0.81, "learning_rate": 0.00017902179595577554, "loss": 0.0404, "step": 124960 }, { "epoch": 0.81, "learning_rate": 0.00017901211460141862, "loss": 0.0447, "step": 124970 }, { "epoch": 0.81, "learning_rate": 0.0001790024332470617, "loss": 0.0517, "step": 124980 }, { "epoch": 0.81, "learning_rate": 0.00017899275189270478, "loss": 0.0411, "step": 124990 }, { "epoch": 0.81, "learning_rate": 0.00017898307053834783, "loss": 0.0461, "step": 125000 }, { "epoch": 0.81, "eval_cer": 0.919931307196927, "eval_loss": 0.028672238811850548, "eval_runtime": 120.0797, "eval_samples_per_second": 16.656, "eval_steps_per_second": 4.164, "step": 125000 }, { "epoch": 0.81, "learning_rate": 0.0001789733891839909, "loss": 0.0371, "step": 125010 }, { "epoch": 0.81, "learning_rate": 0.00017896370782963396, "loss": 0.0457, "step": 125020 }, { "epoch": 0.81, "learning_rate": 0.00017895402647527702, "loss": 0.0354, "step": 125030 }, { "epoch": 0.81, "learning_rate": 0.0001789443451209201, "loss": 0.0426, "step": 125040 }, { "epoch": 0.81, "learning_rate": 0.00017893466376656318, "loss": 0.0381, "step": 125050 }, { "epoch": 0.81, "learning_rate": 0.00017892498241220623, "loss": 0.0444, "step": 125060 }, { "epoch": 0.81, "learning_rate": 0.0001789153010578493, "loss": 0.0395, "step": 125070 }, { "epoch": 0.81, "learning_rate": 0.0001789056197034924, "loss": 0.042, "step": 125080 }, { "epoch": 0.81, "learning_rate": 0.00017889593834913541, "loss": 0.0374, "step": 125090 }, { "epoch": 0.81, "learning_rate": 0.0001788862569947785, "loss": 0.0452, "step": 125100 }, { "epoch": 0.81, "learning_rate": 0.00017887657564042157, "loss": 0.0428, "step": 125110 }, { "epoch": 0.81, "learning_rate": 0.00017886689428606465, "loss": 0.041, "step": 125120 }, { "epoch": 0.81, "learning_rate": 0.0001788572129317077, "loss": 0.0412, "step": 125130 }, { "epoch": 0.81, "learning_rate": 0.00017884753157735079, "loss": 0.0368, "step": 125140 }, { "epoch": 0.81, "learning_rate": 0.00017883785022299387, "loss": 0.0437, "step": 125150 }, { "epoch": 0.81, "learning_rate": 0.0001788281688686369, "loss": 0.0453, "step": 125160 }, { "epoch": 0.81, "learning_rate": 0.00017881848751427997, "loss": 0.0439, "step": 125170 }, { "epoch": 0.81, "learning_rate": 0.00017880880615992305, "loss": 0.0397, "step": 125180 }, { "epoch": 0.81, "learning_rate": 0.00017879912480556613, "loss": 0.0423, "step": 125190 }, { "epoch": 0.81, "learning_rate": 0.00017878944345120918, "loss": 0.0392, "step": 125200 }, { "epoch": 0.81, "learning_rate": 0.00017877976209685226, "loss": 0.0431, "step": 125210 }, { "epoch": 0.81, "learning_rate": 0.00017877008074249534, "loss": 0.0365, "step": 125220 }, { "epoch": 0.81, "learning_rate": 0.00017876039938813837, "loss": 0.0379, "step": 125230 }, { "epoch": 0.81, "learning_rate": 0.00017875071803378145, "loss": 0.0404, "step": 125240 }, { "epoch": 0.81, "learning_rate": 0.00017874103667942453, "loss": 0.047, "step": 125250 }, { "epoch": 0.81, "learning_rate": 0.00017873135532506758, "loss": 0.0412, "step": 125260 }, { "epoch": 0.81, "learning_rate": 0.00017872167397071066, "loss": 0.0474, "step": 125270 }, { "epoch": 0.81, "learning_rate": 0.00017871199261635374, "loss": 0.0445, "step": 125280 }, { "epoch": 0.81, "learning_rate": 0.00017870231126199682, "loss": 0.0489, "step": 125290 }, { "epoch": 0.81, "learning_rate": 0.00017869262990763985, "loss": 0.0441, "step": 125300 }, { "epoch": 0.81, "learning_rate": 0.00017868294855328293, "loss": 0.0384, "step": 125310 }, { "epoch": 0.81, "learning_rate": 0.000178673267198926, "loss": 0.0399, "step": 125320 }, { "epoch": 0.81, "learning_rate": 0.00017866358584456906, "loss": 0.0445, "step": 125330 }, { "epoch": 0.81, "learning_rate": 0.00017865390449021214, "loss": 0.0402, "step": 125340 }, { "epoch": 0.81, "learning_rate": 0.00017864422313585522, "loss": 0.0436, "step": 125350 }, { "epoch": 0.81, "learning_rate": 0.0001786345417814983, "loss": 0.0434, "step": 125360 }, { "epoch": 0.81, "learning_rate": 0.00017862486042714132, "loss": 0.04, "step": 125370 }, { "epoch": 0.81, "learning_rate": 0.0001786151790727844, "loss": 0.0415, "step": 125380 }, { "epoch": 0.81, "learning_rate": 0.00017860549771842748, "loss": 0.0509, "step": 125390 }, { "epoch": 0.81, "learning_rate": 0.00017859581636407053, "loss": 0.0459, "step": 125400 }, { "epoch": 0.81, "learning_rate": 0.00017858613500971361, "loss": 0.0464, "step": 125410 }, { "epoch": 0.81, "learning_rate": 0.0001785764536553567, "loss": 0.0423, "step": 125420 }, { "epoch": 0.81, "learning_rate": 0.00017856677230099977, "loss": 0.0398, "step": 125430 }, { "epoch": 0.81, "learning_rate": 0.0001785570909466428, "loss": 0.0365, "step": 125440 }, { "epoch": 0.81, "learning_rate": 0.00017854740959228588, "loss": 0.0468, "step": 125450 }, { "epoch": 0.81, "learning_rate": 0.00017853772823792893, "loss": 0.0423, "step": 125460 }, { "epoch": 0.81, "learning_rate": 0.000178528046883572, "loss": 0.0511, "step": 125470 }, { "epoch": 0.81, "learning_rate": 0.0001785183655292151, "loss": 0.0347, "step": 125480 }, { "epoch": 0.81, "learning_rate": 0.00017850868417485817, "loss": 0.0416, "step": 125490 }, { "epoch": 0.81, "learning_rate": 0.00017849900282050122, "loss": 0.0417, "step": 125500 }, { "epoch": 0.81, "learning_rate": 0.00017848932146614428, "loss": 0.0377, "step": 125510 }, { "epoch": 0.81, "learning_rate": 0.00017847964011178736, "loss": 0.0468, "step": 125520 }, { "epoch": 0.81, "learning_rate": 0.0001784699587574304, "loss": 0.0344, "step": 125530 }, { "epoch": 0.81, "learning_rate": 0.0001784602774030735, "loss": 0.0398, "step": 125540 }, { "epoch": 0.81, "learning_rate": 0.00017845059604871657, "loss": 0.0382, "step": 125550 }, { "epoch": 0.81, "learning_rate": 0.00017844091469435965, "loss": 0.0548, "step": 125560 }, { "epoch": 0.81, "learning_rate": 0.0001784312333400027, "loss": 0.0423, "step": 125570 }, { "epoch": 0.81, "learning_rate": 0.00017842155198564575, "loss": 0.0403, "step": 125580 }, { "epoch": 0.81, "learning_rate": 0.00017841187063128883, "loss": 0.0381, "step": 125590 }, { "epoch": 0.81, "learning_rate": 0.0001784021892769319, "loss": 0.0379, "step": 125600 }, { "epoch": 0.81, "learning_rate": 0.00017839250792257497, "loss": 0.0523, "step": 125610 }, { "epoch": 0.81, "learning_rate": 0.00017838282656821805, "loss": 0.0426, "step": 125620 }, { "epoch": 0.81, "learning_rate": 0.00017837314521386113, "loss": 0.0366, "step": 125630 }, { "epoch": 0.81, "learning_rate": 0.00017836346385950418, "loss": 0.0448, "step": 125640 }, { "epoch": 0.81, "learning_rate": 0.00017835378250514723, "loss": 0.0405, "step": 125650 }, { "epoch": 0.81, "learning_rate": 0.00017834410115079028, "loss": 0.0473, "step": 125660 }, { "epoch": 0.81, "learning_rate": 0.00017833441979643336, "loss": 0.0437, "step": 125670 }, { "epoch": 0.81, "learning_rate": 0.00017832473844207644, "loss": 0.042, "step": 125680 }, { "epoch": 0.81, "learning_rate": 0.00017831505708771952, "loss": 0.0476, "step": 125690 }, { "epoch": 0.81, "learning_rate": 0.00017830537573336258, "loss": 0.0426, "step": 125700 }, { "epoch": 0.81, "learning_rate": 0.00017829569437900566, "loss": 0.0395, "step": 125710 }, { "epoch": 0.81, "learning_rate": 0.0001782860130246487, "loss": 0.0485, "step": 125720 }, { "epoch": 0.81, "learning_rate": 0.00017827633167029176, "loss": 0.0394, "step": 125730 }, { "epoch": 0.81, "learning_rate": 0.00017826665031593484, "loss": 0.0453, "step": 125740 }, { "epoch": 0.81, "learning_rate": 0.00017825696896157792, "loss": 0.0397, "step": 125750 }, { "epoch": 0.81, "learning_rate": 0.000178247287607221, "loss": 0.0425, "step": 125760 }, { "epoch": 0.81, "learning_rate": 0.00017823760625286405, "loss": 0.0426, "step": 125770 }, { "epoch": 0.81, "learning_rate": 0.00017822792489850713, "loss": 0.0425, "step": 125780 }, { "epoch": 0.81, "learning_rate": 0.00017821824354415019, "loss": 0.0471, "step": 125790 }, { "epoch": 0.81, "learning_rate": 0.00017820856218979324, "loss": 0.0445, "step": 125800 }, { "epoch": 0.81, "learning_rate": 0.00017819888083543632, "loss": 0.0416, "step": 125810 }, { "epoch": 0.81, "learning_rate": 0.0001781891994810794, "loss": 0.0448, "step": 125820 }, { "epoch": 0.81, "learning_rate": 0.00017817951812672248, "loss": 0.0356, "step": 125830 }, { "epoch": 0.81, "learning_rate": 0.00017816983677236553, "loss": 0.0406, "step": 125840 }, { "epoch": 0.81, "learning_rate": 0.0001781601554180086, "loss": 0.0399, "step": 125850 }, { "epoch": 0.81, "learning_rate": 0.00017815047406365164, "loss": 0.0423, "step": 125860 }, { "epoch": 0.81, "learning_rate": 0.00017814079270929472, "loss": 0.0316, "step": 125870 }, { "epoch": 0.81, "learning_rate": 0.0001781311113549378, "loss": 0.0393, "step": 125880 }, { "epoch": 0.81, "learning_rate": 0.00017812143000058088, "loss": 0.0367, "step": 125890 }, { "epoch": 0.81, "learning_rate": 0.00017811174864622393, "loss": 0.0407, "step": 125900 }, { "epoch": 0.81, "learning_rate": 0.000178102067291867, "loss": 0.0402, "step": 125910 }, { "epoch": 0.81, "learning_rate": 0.0001780923859375101, "loss": 0.0401, "step": 125920 }, { "epoch": 0.81, "learning_rate": 0.0001780827045831531, "loss": 0.0376, "step": 125930 }, { "epoch": 0.81, "learning_rate": 0.0001780730232287962, "loss": 0.0445, "step": 125940 }, { "epoch": 0.81, "learning_rate": 0.00017806334187443927, "loss": 0.0395, "step": 125950 }, { "epoch": 0.81, "learning_rate": 0.00017805366052008235, "loss": 0.0363, "step": 125960 }, { "epoch": 0.81, "learning_rate": 0.0001780439791657254, "loss": 0.0429, "step": 125970 }, { "epoch": 0.81, "learning_rate": 0.00017803429781136849, "loss": 0.0444, "step": 125980 }, { "epoch": 0.81, "learning_rate": 0.00017802461645701156, "loss": 0.0455, "step": 125990 }, { "epoch": 0.81, "learning_rate": 0.0001780149351026546, "loss": 0.0433, "step": 126000 }, { "epoch": 0.81, "eval_cer": 0.9197939215907807, "eval_loss": 0.029015522450208664, "eval_runtime": 119.846, "eval_samples_per_second": 16.688, "eval_steps_per_second": 4.172, "step": 126000 }, { "epoch": 0.81, "learning_rate": 0.00017800525374829767, "loss": 0.041, "step": 126010 }, { "epoch": 0.81, "learning_rate": 0.00017799557239394075, "loss": 0.0422, "step": 126020 }, { "epoch": 0.81, "learning_rate": 0.00017798589103958383, "loss": 0.0416, "step": 126030 }, { "epoch": 0.81, "learning_rate": 0.00017797620968522688, "loss": 0.0384, "step": 126040 }, { "epoch": 0.81, "learning_rate": 0.00017796652833086996, "loss": 0.0471, "step": 126050 }, { "epoch": 0.81, "learning_rate": 0.00017795684697651304, "loss": 0.0389, "step": 126060 }, { "epoch": 0.81, "learning_rate": 0.00017794716562215607, "loss": 0.0447, "step": 126070 }, { "epoch": 0.81, "learning_rate": 0.00017793748426779915, "loss": 0.0411, "step": 126080 }, { "epoch": 0.81, "learning_rate": 0.00017792780291344223, "loss": 0.0413, "step": 126090 }, { "epoch": 0.81, "learning_rate": 0.00017791812155908528, "loss": 0.0375, "step": 126100 }, { "epoch": 0.81, "learning_rate": 0.00017790844020472836, "loss": 0.0353, "step": 126110 }, { "epoch": 0.81, "learning_rate": 0.00017789875885037144, "loss": 0.039, "step": 126120 }, { "epoch": 0.81, "learning_rate": 0.00017788907749601452, "loss": 0.0429, "step": 126130 }, { "epoch": 0.81, "learning_rate": 0.00017787939614165755, "loss": 0.0418, "step": 126140 }, { "epoch": 0.81, "learning_rate": 0.00017786971478730062, "loss": 0.0367, "step": 126150 }, { "epoch": 0.81, "learning_rate": 0.0001778600334329437, "loss": 0.0382, "step": 126160 }, { "epoch": 0.81, "learning_rate": 0.00017785035207858676, "loss": 0.041, "step": 126170 }, { "epoch": 0.81, "learning_rate": 0.00017784067072422984, "loss": 0.0396, "step": 126180 }, { "epoch": 0.81, "learning_rate": 0.00017783098936987292, "loss": 0.0366, "step": 126190 }, { "epoch": 0.81, "learning_rate": 0.000177821308015516, "loss": 0.0409, "step": 126200 }, { "epoch": 0.81, "learning_rate": 0.00017781162666115902, "loss": 0.0422, "step": 126210 }, { "epoch": 0.81, "learning_rate": 0.0001778019453068021, "loss": 0.045, "step": 126220 }, { "epoch": 0.81, "learning_rate": 0.00017779226395244518, "loss": 0.0449, "step": 126230 }, { "epoch": 0.81, "learning_rate": 0.00017778258259808823, "loss": 0.0432, "step": 126240 }, { "epoch": 0.81, "learning_rate": 0.00017777290124373131, "loss": 0.0409, "step": 126250 }, { "epoch": 0.81, "learning_rate": 0.0001777632198893744, "loss": 0.0451, "step": 126260 }, { "epoch": 0.81, "learning_rate": 0.00017775353853501745, "loss": 0.0413, "step": 126270 }, { "epoch": 0.82, "learning_rate": 0.0001777438571806605, "loss": 0.041, "step": 126280 }, { "epoch": 0.82, "learning_rate": 0.00017773417582630358, "loss": 0.0451, "step": 126290 }, { "epoch": 0.82, "learning_rate": 0.00017772449447194663, "loss": 0.0415, "step": 126300 }, { "epoch": 0.82, "learning_rate": 0.0001777148131175897, "loss": 0.0458, "step": 126310 }, { "epoch": 0.82, "learning_rate": 0.0001777051317632328, "loss": 0.038, "step": 126320 }, { "epoch": 0.82, "learning_rate": 0.00017769545040887587, "loss": 0.0371, "step": 126330 }, { "epoch": 0.82, "learning_rate": 0.00017768576905451892, "loss": 0.0388, "step": 126340 }, { "epoch": 0.82, "learning_rate": 0.00017767608770016198, "loss": 0.0419, "step": 126350 }, { "epoch": 0.82, "learning_rate": 0.00017766640634580506, "loss": 0.0479, "step": 126360 }, { "epoch": 0.82, "learning_rate": 0.0001776567249914481, "loss": 0.0361, "step": 126370 }, { "epoch": 0.82, "learning_rate": 0.0001776470436370912, "loss": 0.0462, "step": 126380 }, { "epoch": 0.82, "learning_rate": 0.00017763736228273427, "loss": 0.0452, "step": 126390 }, { "epoch": 0.82, "learning_rate": 0.00017762768092837735, "loss": 0.0508, "step": 126400 }, { "epoch": 0.82, "learning_rate": 0.0001776179995740204, "loss": 0.0408, "step": 126410 }, { "epoch": 0.82, "learning_rate": 0.00017760831821966345, "loss": 0.0406, "step": 126420 }, { "epoch": 0.82, "learning_rate": 0.00017759863686530653, "loss": 0.039, "step": 126430 }, { "epoch": 0.82, "learning_rate": 0.00017758895551094959, "loss": 0.0394, "step": 126440 }, { "epoch": 0.82, "learning_rate": 0.00017757927415659267, "loss": 0.0464, "step": 126450 }, { "epoch": 0.82, "learning_rate": 0.00017756959280223575, "loss": 0.0538, "step": 126460 }, { "epoch": 0.82, "learning_rate": 0.0001775599114478788, "loss": 0.039, "step": 126470 }, { "epoch": 0.82, "learning_rate": 0.00017755023009352188, "loss": 0.0411, "step": 126480 }, { "epoch": 0.82, "learning_rate": 0.00017754054873916493, "loss": 0.0392, "step": 126490 }, { "epoch": 0.82, "learning_rate": 0.00017753086738480798, "loss": 0.04, "step": 126500 }, { "epoch": 0.82, "learning_rate": 0.00017752118603045106, "loss": 0.0443, "step": 126510 }, { "epoch": 0.82, "learning_rate": 0.00017751150467609414, "loss": 0.0478, "step": 126520 }, { "epoch": 0.82, "learning_rate": 0.00017750182332173722, "loss": 0.044, "step": 126530 }, { "epoch": 0.82, "learning_rate": 0.00017749214196738028, "loss": 0.0419, "step": 126540 }, { "epoch": 0.82, "learning_rate": 0.00017748246061302336, "loss": 0.0403, "step": 126550 }, { "epoch": 0.82, "learning_rate": 0.0001774727792586664, "loss": 0.0347, "step": 126560 }, { "epoch": 0.82, "learning_rate": 0.00017746309790430946, "loss": 0.0388, "step": 126570 }, { "epoch": 0.82, "learning_rate": 0.00017745341654995254, "loss": 0.0421, "step": 126580 }, { "epoch": 0.82, "learning_rate": 0.00017744373519559562, "loss": 0.0411, "step": 126590 }, { "epoch": 0.82, "learning_rate": 0.0001774340538412387, "loss": 0.0369, "step": 126600 }, { "epoch": 0.82, "learning_rate": 0.00017742437248688175, "loss": 0.0381, "step": 126610 }, { "epoch": 0.82, "learning_rate": 0.00017741469113252483, "loss": 0.0385, "step": 126620 }, { "epoch": 0.82, "learning_rate": 0.00017740500977816789, "loss": 0.0419, "step": 126630 }, { "epoch": 0.82, "learning_rate": 0.00017739532842381094, "loss": 0.0411, "step": 126640 }, { "epoch": 0.82, "learning_rate": 0.00017738564706945402, "loss": 0.0495, "step": 126650 }, { "epoch": 0.82, "learning_rate": 0.0001773759657150971, "loss": 0.0458, "step": 126660 }, { "epoch": 0.82, "learning_rate": 0.00017736628436074015, "loss": 0.0382, "step": 126670 }, { "epoch": 0.82, "learning_rate": 0.00017735660300638323, "loss": 0.0472, "step": 126680 }, { "epoch": 0.82, "learning_rate": 0.0001773469216520263, "loss": 0.037, "step": 126690 }, { "epoch": 0.82, "learning_rate": 0.00017733724029766934, "loss": 0.0417, "step": 126700 }, { "epoch": 0.82, "learning_rate": 0.00017732755894331242, "loss": 0.0442, "step": 126710 }, { "epoch": 0.82, "learning_rate": 0.0001773178775889555, "loss": 0.0461, "step": 126720 }, { "epoch": 0.82, "learning_rate": 0.00017730819623459858, "loss": 0.043, "step": 126730 }, { "epoch": 0.82, "learning_rate": 0.00017729851488024163, "loss": 0.0416, "step": 126740 }, { "epoch": 0.82, "learning_rate": 0.0001772888335258847, "loss": 0.0514, "step": 126750 }, { "epoch": 0.82, "learning_rate": 0.0001772791521715278, "loss": 0.0514, "step": 126760 }, { "epoch": 0.82, "learning_rate": 0.0001772694708171708, "loss": 0.0449, "step": 126770 }, { "epoch": 0.82, "learning_rate": 0.0001772597894628139, "loss": 0.0397, "step": 126780 }, { "epoch": 0.82, "learning_rate": 0.00017725010810845697, "loss": 0.046, "step": 126790 }, { "epoch": 0.82, "learning_rate": 0.00017724042675410005, "loss": 0.0405, "step": 126800 }, { "epoch": 0.82, "learning_rate": 0.0001772307453997431, "loss": 0.0456, "step": 126810 }, { "epoch": 0.82, "learning_rate": 0.00017722106404538618, "loss": 0.0519, "step": 126820 }, { "epoch": 0.82, "learning_rate": 0.00017721138269102926, "loss": 0.0399, "step": 126830 }, { "epoch": 0.82, "learning_rate": 0.0001772017013366723, "loss": 0.0401, "step": 126840 }, { "epoch": 0.82, "learning_rate": 0.00017719201998231537, "loss": 0.0455, "step": 126850 }, { "epoch": 0.82, "learning_rate": 0.00017718233862795845, "loss": 0.0411, "step": 126860 }, { "epoch": 0.82, "learning_rate": 0.0001771726572736015, "loss": 0.0432, "step": 126870 }, { "epoch": 0.82, "learning_rate": 0.00017716297591924458, "loss": 0.0412, "step": 126880 }, { "epoch": 0.82, "learning_rate": 0.00017715329456488766, "loss": 0.0459, "step": 126890 }, { "epoch": 0.82, "learning_rate": 0.00017714361321053074, "loss": 0.0392, "step": 126900 }, { "epoch": 0.82, "learning_rate": 0.00017713393185617377, "loss": 0.0407, "step": 126910 }, { "epoch": 0.82, "learning_rate": 0.00017712425050181685, "loss": 0.0444, "step": 126920 }, { "epoch": 0.82, "learning_rate": 0.00017711456914745993, "loss": 0.0394, "step": 126930 }, { "epoch": 0.82, "learning_rate": 0.00017710488779310298, "loss": 0.0364, "step": 126940 }, { "epoch": 0.82, "learning_rate": 0.00017709520643874606, "loss": 0.0368, "step": 126950 }, { "epoch": 0.82, "learning_rate": 0.00017708552508438914, "loss": 0.0365, "step": 126960 }, { "epoch": 0.82, "learning_rate": 0.00017707584373003222, "loss": 0.0384, "step": 126970 }, { "epoch": 0.82, "learning_rate": 0.00017706616237567524, "loss": 0.0408, "step": 126980 }, { "epoch": 0.82, "learning_rate": 0.00017705648102131832, "loss": 0.0367, "step": 126990 }, { "epoch": 0.82, "learning_rate": 0.0001770467996669614, "loss": 0.0386, "step": 127000 }, { "epoch": 0.82, "eval_cer": 0.9199466726923512, "eval_loss": 0.028268195688724518, "eval_runtime": 120.0387, "eval_samples_per_second": 16.661, "eval_steps_per_second": 4.165, "step": 127000 }, { "epoch": 0.82, "learning_rate": 0.00017703711831260446, "loss": 0.0422, "step": 127010 }, { "epoch": 0.82, "learning_rate": 0.00017702743695824754, "loss": 0.041, "step": 127020 }, { "epoch": 0.82, "learning_rate": 0.00017701775560389062, "loss": 0.0395, "step": 127030 }, { "epoch": 0.82, "learning_rate": 0.00017700807424953367, "loss": 0.0428, "step": 127040 }, { "epoch": 0.82, "learning_rate": 0.00017699839289517672, "loss": 0.0419, "step": 127050 }, { "epoch": 0.82, "learning_rate": 0.0001769887115408198, "loss": 0.045, "step": 127060 }, { "epoch": 0.82, "learning_rate": 0.00017697903018646285, "loss": 0.0441, "step": 127070 }, { "epoch": 0.82, "learning_rate": 0.00017696934883210593, "loss": 0.039, "step": 127080 }, { "epoch": 0.82, "learning_rate": 0.00017695966747774901, "loss": 0.0419, "step": 127090 }, { "epoch": 0.82, "learning_rate": 0.0001769499861233921, "loss": 0.0339, "step": 127100 }, { "epoch": 0.82, "learning_rate": 0.00017694030476903515, "loss": 0.0528, "step": 127110 }, { "epoch": 0.82, "learning_rate": 0.0001769306234146782, "loss": 0.0467, "step": 127120 }, { "epoch": 0.82, "learning_rate": 0.00017692094206032128, "loss": 0.0422, "step": 127130 }, { "epoch": 0.82, "learning_rate": 0.00017691126070596433, "loss": 0.0408, "step": 127140 }, { "epoch": 0.82, "learning_rate": 0.0001769015793516074, "loss": 0.0477, "step": 127150 }, { "epoch": 0.82, "learning_rate": 0.0001768918979972505, "loss": 0.0406, "step": 127160 }, { "epoch": 0.82, "learning_rate": 0.00017688221664289357, "loss": 0.0406, "step": 127170 }, { "epoch": 0.82, "learning_rate": 0.00017687253528853662, "loss": 0.0431, "step": 127180 }, { "epoch": 0.82, "learning_rate": 0.00017686285393417968, "loss": 0.0433, "step": 127190 }, { "epoch": 0.82, "learning_rate": 0.00017685317257982276, "loss": 0.0435, "step": 127200 }, { "epoch": 0.82, "learning_rate": 0.0001768434912254658, "loss": 0.0459, "step": 127210 }, { "epoch": 0.82, "learning_rate": 0.0001768338098711089, "loss": 0.0479, "step": 127220 }, { "epoch": 0.82, "learning_rate": 0.00017682412851675197, "loss": 0.045, "step": 127230 }, { "epoch": 0.82, "learning_rate": 0.00017681444716239502, "loss": 0.0353, "step": 127240 }, { "epoch": 0.82, "learning_rate": 0.0001768047658080381, "loss": 0.051, "step": 127250 }, { "epoch": 0.82, "learning_rate": 0.00017679508445368115, "loss": 0.0416, "step": 127260 }, { "epoch": 0.82, "learning_rate": 0.0001767854030993242, "loss": 0.0445, "step": 127270 }, { "epoch": 0.82, "learning_rate": 0.00017677572174496729, "loss": 0.0381, "step": 127280 }, { "epoch": 0.82, "learning_rate": 0.00017676604039061037, "loss": 0.0484, "step": 127290 }, { "epoch": 0.82, "learning_rate": 0.00017675635903625345, "loss": 0.0425, "step": 127300 }, { "epoch": 0.82, "learning_rate": 0.0001767466776818965, "loss": 0.0469, "step": 127310 }, { "epoch": 0.82, "learning_rate": 0.00017673699632753958, "loss": 0.0387, "step": 127320 }, { "epoch": 0.82, "learning_rate": 0.00017672731497318263, "loss": 0.0447, "step": 127330 }, { "epoch": 0.82, "learning_rate": 0.00017671763361882568, "loss": 0.0422, "step": 127340 }, { "epoch": 0.82, "learning_rate": 0.00017670795226446876, "loss": 0.0605, "step": 127350 }, { "epoch": 0.82, "learning_rate": 0.00017669827091011184, "loss": 0.0427, "step": 127360 }, { "epoch": 0.82, "learning_rate": 0.00017668858955575492, "loss": 0.0439, "step": 127370 }, { "epoch": 0.82, "learning_rate": 0.00017667890820139798, "loss": 0.0366, "step": 127380 }, { "epoch": 0.82, "learning_rate": 0.00017666922684704106, "loss": 0.0442, "step": 127390 }, { "epoch": 0.82, "learning_rate": 0.0001766595454926841, "loss": 0.0502, "step": 127400 }, { "epoch": 0.82, "learning_rate": 0.00017664986413832716, "loss": 0.0392, "step": 127410 }, { "epoch": 0.82, "learning_rate": 0.00017664018278397024, "loss": 0.0474, "step": 127420 }, { "epoch": 0.82, "learning_rate": 0.00017663050142961332, "loss": 0.0513, "step": 127430 }, { "epoch": 0.82, "learning_rate": 0.00017662082007525637, "loss": 0.0382, "step": 127440 }, { "epoch": 0.82, "learning_rate": 0.00017661113872089945, "loss": 0.0405, "step": 127450 }, { "epoch": 0.82, "learning_rate": 0.0001766014573665425, "loss": 0.0391, "step": 127460 }, { "epoch": 0.82, "learning_rate": 0.00017659177601218556, "loss": 0.0434, "step": 127470 }, { "epoch": 0.82, "learning_rate": 0.00017658209465782864, "loss": 0.0446, "step": 127480 }, { "epoch": 0.82, "learning_rate": 0.00017657241330347172, "loss": 0.0356, "step": 127490 }, { "epoch": 0.82, "learning_rate": 0.0001765627319491148, "loss": 0.0395, "step": 127500 }, { "epoch": 0.82, "learning_rate": 0.00017655305059475785, "loss": 0.0421, "step": 127510 }, { "epoch": 0.82, "learning_rate": 0.00017654336924040093, "loss": 0.0395, "step": 127520 }, { "epoch": 0.82, "learning_rate": 0.00017653368788604398, "loss": 0.0436, "step": 127530 }, { "epoch": 0.82, "learning_rate": 0.00017652400653168704, "loss": 0.0451, "step": 127540 }, { "epoch": 0.82, "learning_rate": 0.00017651432517733012, "loss": 0.0421, "step": 127550 }, { "epoch": 0.82, "learning_rate": 0.0001765046438229732, "loss": 0.0394, "step": 127560 }, { "epoch": 0.82, "learning_rate": 0.00017649496246861627, "loss": 0.0394, "step": 127570 }, { "epoch": 0.82, "learning_rate": 0.00017648528111425933, "loss": 0.0413, "step": 127580 }, { "epoch": 0.82, "learning_rate": 0.0001764755997599024, "loss": 0.0377, "step": 127590 }, { "epoch": 0.82, "learning_rate": 0.00017646591840554546, "loss": 0.048, "step": 127600 }, { "epoch": 0.82, "learning_rate": 0.0001764562370511885, "loss": 0.0425, "step": 127610 }, { "epoch": 0.82, "learning_rate": 0.0001764465556968316, "loss": 0.0428, "step": 127620 }, { "epoch": 0.82, "learning_rate": 0.00017643687434247467, "loss": 0.0404, "step": 127630 }, { "epoch": 0.82, "learning_rate": 0.00017642719298811772, "loss": 0.0465, "step": 127640 }, { "epoch": 0.82, "learning_rate": 0.0001764175116337608, "loss": 0.0435, "step": 127650 }, { "epoch": 0.82, "learning_rate": 0.00017640783027940388, "loss": 0.0424, "step": 127660 }, { "epoch": 0.82, "learning_rate": 0.0001763981489250469, "loss": 0.0423, "step": 127670 }, { "epoch": 0.82, "learning_rate": 0.00017638846757069, "loss": 0.0483, "step": 127680 }, { "epoch": 0.82, "learning_rate": 0.00017637878621633307, "loss": 0.0465, "step": 127690 }, { "epoch": 0.82, "learning_rate": 0.00017636910486197615, "loss": 0.0513, "step": 127700 }, { "epoch": 0.82, "learning_rate": 0.0001763594235076192, "loss": 0.0442, "step": 127710 }, { "epoch": 0.82, "learning_rate": 0.00017634974215326228, "loss": 0.0404, "step": 127720 }, { "epoch": 0.82, "learning_rate": 0.00017634006079890536, "loss": 0.0453, "step": 127730 }, { "epoch": 0.82, "learning_rate": 0.0001763303794445484, "loss": 0.0441, "step": 127740 }, { "epoch": 0.82, "learning_rate": 0.00017632069809019147, "loss": 0.0381, "step": 127750 }, { "epoch": 0.82, "learning_rate": 0.00017631101673583455, "loss": 0.0426, "step": 127760 }, { "epoch": 0.82, "learning_rate": 0.00017630133538147763, "loss": 0.0375, "step": 127770 }, { "epoch": 0.82, "learning_rate": 0.00017629165402712068, "loss": 0.0441, "step": 127780 }, { "epoch": 0.82, "learning_rate": 0.00017628197267276376, "loss": 0.0416, "step": 127790 }, { "epoch": 0.82, "learning_rate": 0.00017627229131840684, "loss": 0.0388, "step": 127800 }, { "epoch": 0.82, "learning_rate": 0.00017626260996404986, "loss": 0.0484, "step": 127810 }, { "epoch": 0.82, "learning_rate": 0.00017625292860969294, "loss": 0.048, "step": 127820 }, { "epoch": 0.83, "learning_rate": 0.00017624324725533602, "loss": 0.0383, "step": 127830 }, { "epoch": 0.83, "learning_rate": 0.00017623356590097908, "loss": 0.0385, "step": 127840 }, { "epoch": 0.83, "learning_rate": 0.00017622388454662216, "loss": 0.042, "step": 127850 }, { "epoch": 0.83, "learning_rate": 0.00017621420319226524, "loss": 0.0385, "step": 127860 }, { "epoch": 0.83, "learning_rate": 0.00017620452183790832, "loss": 0.0397, "step": 127870 }, { "epoch": 0.83, "learning_rate": 0.00017619484048355134, "loss": 0.0395, "step": 127880 }, { "epoch": 0.83, "learning_rate": 0.00017618515912919442, "loss": 0.0447, "step": 127890 }, { "epoch": 0.83, "learning_rate": 0.0001761754777748375, "loss": 0.0465, "step": 127900 }, { "epoch": 0.83, "learning_rate": 0.00017616579642048055, "loss": 0.0433, "step": 127910 }, { "epoch": 0.83, "learning_rate": 0.00017615611506612363, "loss": 0.0416, "step": 127920 }, { "epoch": 0.83, "learning_rate": 0.0001761464337117667, "loss": 0.0389, "step": 127930 }, { "epoch": 0.83, "learning_rate": 0.0001761367523574098, "loss": 0.038, "step": 127940 }, { "epoch": 0.83, "learning_rate": 0.00017612707100305282, "loss": 0.0432, "step": 127950 }, { "epoch": 0.83, "learning_rate": 0.0001761173896486959, "loss": 0.0416, "step": 127960 }, { "epoch": 0.83, "learning_rate": 0.00017610770829433898, "loss": 0.0366, "step": 127970 }, { "epoch": 0.83, "learning_rate": 0.00017609802693998203, "loss": 0.0428, "step": 127980 }, { "epoch": 0.83, "learning_rate": 0.0001760883455856251, "loss": 0.0395, "step": 127990 }, { "epoch": 0.83, "learning_rate": 0.0001760786642312682, "loss": 0.0407, "step": 128000 }, { "epoch": 0.83, "eval_cer": 0.9198951530900463, "eval_loss": 0.028159523382782936, "eval_runtime": 120.0077, "eval_samples_per_second": 16.666, "eval_steps_per_second": 4.166, "step": 128000 }, { "epoch": 0.83, "learning_rate": 0.00017606898287691127, "loss": 0.0419, "step": 128010 }, { "epoch": 0.83, "learning_rate": 0.0001760593015225543, "loss": 0.0419, "step": 128020 }, { "epoch": 0.83, "learning_rate": 0.00017604962016819738, "loss": 0.0392, "step": 128030 }, { "epoch": 0.83, "learning_rate": 0.00017603993881384043, "loss": 0.0534, "step": 128040 }, { "epoch": 0.83, "learning_rate": 0.0001760302574594835, "loss": 0.0363, "step": 128050 }, { "epoch": 0.83, "learning_rate": 0.0001760205761051266, "loss": 0.0479, "step": 128060 }, { "epoch": 0.83, "learning_rate": 0.00017601089475076967, "loss": 0.041, "step": 128070 }, { "epoch": 0.83, "learning_rate": 0.00017600121339641272, "loss": 0.0438, "step": 128080 }, { "epoch": 0.83, "learning_rate": 0.00017599153204205577, "loss": 0.0371, "step": 128090 }, { "epoch": 0.83, "learning_rate": 0.00017598185068769885, "loss": 0.0415, "step": 128100 }, { "epoch": 0.83, "learning_rate": 0.0001759721693333419, "loss": 0.0406, "step": 128110 }, { "epoch": 0.83, "learning_rate": 0.00017596248797898499, "loss": 0.0466, "step": 128120 }, { "epoch": 0.83, "learning_rate": 0.00017595280662462807, "loss": 0.0355, "step": 128130 }, { "epoch": 0.83, "learning_rate": 0.00017594312527027115, "loss": 0.0436, "step": 128140 }, { "epoch": 0.83, "learning_rate": 0.0001759334439159142, "loss": 0.0417, "step": 128150 }, { "epoch": 0.83, "learning_rate": 0.00017592376256155725, "loss": 0.039, "step": 128160 }, { "epoch": 0.83, "learning_rate": 0.00017591408120720033, "loss": 0.0443, "step": 128170 }, { "epoch": 0.83, "learning_rate": 0.00017590439985284338, "loss": 0.0416, "step": 128180 }, { "epoch": 0.83, "learning_rate": 0.00017589471849848646, "loss": 0.041, "step": 128190 }, { "epoch": 0.83, "learning_rate": 0.00017588503714412954, "loss": 0.0408, "step": 128200 }, { "epoch": 0.83, "learning_rate": 0.00017587535578977262, "loss": 0.0445, "step": 128210 }, { "epoch": 0.83, "learning_rate": 0.00017586567443541568, "loss": 0.0421, "step": 128220 }, { "epoch": 0.83, "learning_rate": 0.00017585599308105873, "loss": 0.0461, "step": 128230 }, { "epoch": 0.83, "learning_rate": 0.00017584631172670178, "loss": 0.0395, "step": 128240 }, { "epoch": 0.83, "learning_rate": 0.00017583663037234486, "loss": 0.0454, "step": 128250 }, { "epoch": 0.83, "learning_rate": 0.00017582694901798794, "loss": 0.0414, "step": 128260 }, { "epoch": 0.83, "learning_rate": 0.00017581726766363102, "loss": 0.0423, "step": 128270 }, { "epoch": 0.83, "learning_rate": 0.00017580758630927407, "loss": 0.0423, "step": 128280 }, { "epoch": 0.83, "learning_rate": 0.00017579790495491715, "loss": 0.0431, "step": 128290 }, { "epoch": 0.83, "learning_rate": 0.0001757882236005602, "loss": 0.0347, "step": 128300 }, { "epoch": 0.83, "learning_rate": 0.00017577854224620326, "loss": 0.0474, "step": 128310 }, { "epoch": 0.83, "learning_rate": 0.00017576886089184634, "loss": 0.0453, "step": 128320 }, { "epoch": 0.83, "learning_rate": 0.00017575917953748942, "loss": 0.0374, "step": 128330 }, { "epoch": 0.83, "learning_rate": 0.0001757494981831325, "loss": 0.0409, "step": 128340 }, { "epoch": 0.83, "learning_rate": 0.00017573981682877555, "loss": 0.038, "step": 128350 }, { "epoch": 0.83, "learning_rate": 0.00017573013547441863, "loss": 0.0439, "step": 128360 }, { "epoch": 0.83, "learning_rate": 0.00017572045412006168, "loss": 0.04, "step": 128370 }, { "epoch": 0.83, "learning_rate": 0.00017571077276570473, "loss": 0.0437, "step": 128380 }, { "epoch": 0.83, "learning_rate": 0.00017570109141134781, "loss": 0.045, "step": 128390 }, { "epoch": 0.83, "learning_rate": 0.0001756914100569909, "loss": 0.0391, "step": 128400 }, { "epoch": 0.83, "learning_rate": 0.00017568172870263397, "loss": 0.0347, "step": 128410 }, { "epoch": 0.83, "learning_rate": 0.00017567204734827703, "loss": 0.0365, "step": 128420 }, { "epoch": 0.83, "learning_rate": 0.0001756623659939201, "loss": 0.0465, "step": 128430 }, { "epoch": 0.83, "learning_rate": 0.00017565268463956316, "loss": 0.0418, "step": 128440 }, { "epoch": 0.83, "learning_rate": 0.0001756430032852062, "loss": 0.0368, "step": 128450 }, { "epoch": 0.83, "learning_rate": 0.0001756333219308493, "loss": 0.0473, "step": 128460 }, { "epoch": 0.83, "learning_rate": 0.00017562364057649237, "loss": 0.0415, "step": 128470 }, { "epoch": 0.83, "learning_rate": 0.00017561395922213542, "loss": 0.048, "step": 128480 }, { "epoch": 0.83, "learning_rate": 0.0001756042778677785, "loss": 0.0483, "step": 128490 }, { "epoch": 0.83, "learning_rate": 0.00017559459651342158, "loss": 0.0351, "step": 128500 }, { "epoch": 0.83, "learning_rate": 0.0001755849151590646, "loss": 0.0359, "step": 128510 }, { "epoch": 0.83, "learning_rate": 0.0001755752338047077, "loss": 0.0387, "step": 128520 }, { "epoch": 0.83, "learning_rate": 0.00017556555245035077, "loss": 0.0398, "step": 128530 }, { "epoch": 0.83, "learning_rate": 0.00017555587109599385, "loss": 0.0434, "step": 128540 }, { "epoch": 0.83, "learning_rate": 0.0001755461897416369, "loss": 0.0389, "step": 128550 }, { "epoch": 0.83, "learning_rate": 0.00017553650838727998, "loss": 0.04, "step": 128560 }, { "epoch": 0.83, "learning_rate": 0.00017552682703292306, "loss": 0.0417, "step": 128570 }, { "epoch": 0.83, "learning_rate": 0.0001755171456785661, "loss": 0.045, "step": 128580 }, { "epoch": 0.83, "learning_rate": 0.00017550746432420917, "loss": 0.0525, "step": 128590 }, { "epoch": 0.83, "learning_rate": 0.00017549778296985225, "loss": 0.0429, "step": 128600 }, { "epoch": 0.83, "learning_rate": 0.00017548810161549533, "loss": 0.0382, "step": 128610 }, { "epoch": 0.83, "learning_rate": 0.00017547842026113838, "loss": 0.0427, "step": 128620 }, { "epoch": 0.83, "learning_rate": 0.00017546873890678146, "loss": 0.0413, "step": 128630 }, { "epoch": 0.83, "learning_rate": 0.00017545905755242454, "loss": 0.0482, "step": 128640 }, { "epoch": 0.83, "learning_rate": 0.00017544937619806756, "loss": 0.0372, "step": 128650 }, { "epoch": 0.83, "learning_rate": 0.00017543969484371064, "loss": 0.0432, "step": 128660 }, { "epoch": 0.83, "learning_rate": 0.00017543001348935372, "loss": 0.0434, "step": 128670 }, { "epoch": 0.83, "learning_rate": 0.00017542033213499678, "loss": 0.0446, "step": 128680 }, { "epoch": 0.83, "learning_rate": 0.00017541065078063986, "loss": 0.0437, "step": 128690 }, { "epoch": 0.83, "learning_rate": 0.00017540096942628294, "loss": 0.0425, "step": 128700 }, { "epoch": 0.83, "learning_rate": 0.00017539128807192602, "loss": 0.0402, "step": 128710 }, { "epoch": 0.83, "learning_rate": 0.00017538160671756904, "loss": 0.0434, "step": 128720 }, { "epoch": 0.83, "learning_rate": 0.00017537192536321212, "loss": 0.0432, "step": 128730 }, { "epoch": 0.83, "learning_rate": 0.0001753622440088552, "loss": 0.0391, "step": 128740 }, { "epoch": 0.83, "learning_rate": 0.00017535256265449825, "loss": 0.0513, "step": 128750 }, { "epoch": 0.83, "learning_rate": 0.00017534288130014133, "loss": 0.0407, "step": 128760 }, { "epoch": 0.83, "learning_rate": 0.0001753331999457844, "loss": 0.0399, "step": 128770 }, { "epoch": 0.83, "learning_rate": 0.0001753235185914275, "loss": 0.0423, "step": 128780 }, { "epoch": 0.83, "learning_rate": 0.00017531383723707052, "loss": 0.04, "step": 128790 }, { "epoch": 0.83, "learning_rate": 0.0001753041558827136, "loss": 0.0329, "step": 128800 }, { "epoch": 0.83, "learning_rate": 0.00017529447452835668, "loss": 0.0418, "step": 128810 }, { "epoch": 0.83, "learning_rate": 0.00017528479317399973, "loss": 0.0436, "step": 128820 }, { "epoch": 0.83, "learning_rate": 0.0001752751118196428, "loss": 0.0481, "step": 128830 }, { "epoch": 0.83, "learning_rate": 0.0001752654304652859, "loss": 0.0432, "step": 128840 }, { "epoch": 0.83, "learning_rate": 0.00017525574911092894, "loss": 0.039, "step": 128850 }, { "epoch": 0.83, "learning_rate": 0.000175246067756572, "loss": 0.0367, "step": 128860 }, { "epoch": 0.83, "learning_rate": 0.00017523638640221508, "loss": 0.045, "step": 128870 }, { "epoch": 0.83, "learning_rate": 0.00017522670504785813, "loss": 0.0413, "step": 128880 }, { "epoch": 0.83, "learning_rate": 0.0001752170236935012, "loss": 0.0378, "step": 128890 }, { "epoch": 0.83, "learning_rate": 0.0001752073423391443, "loss": 0.0395, "step": 128900 }, { "epoch": 0.83, "learning_rate": 0.00017519766098478737, "loss": 0.0403, "step": 128910 }, { "epoch": 0.83, "learning_rate": 0.00017518797963043042, "loss": 0.0482, "step": 128920 }, { "epoch": 0.83, "learning_rate": 0.00017517829827607347, "loss": 0.0403, "step": 128930 }, { "epoch": 0.83, "learning_rate": 0.00017516861692171655, "loss": 0.0473, "step": 128940 }, { "epoch": 0.83, "learning_rate": 0.0001751589355673596, "loss": 0.04, "step": 128950 }, { "epoch": 0.83, "learning_rate": 0.00017514925421300269, "loss": 0.0416, "step": 128960 }, { "epoch": 0.83, "learning_rate": 0.00017513957285864577, "loss": 0.0386, "step": 128970 }, { "epoch": 0.83, "learning_rate": 0.00017512989150428884, "loss": 0.0403, "step": 128980 }, { "epoch": 0.83, "learning_rate": 0.0001751202101499319, "loss": 0.0432, "step": 128990 }, { "epoch": 0.83, "learning_rate": 0.00017511052879557495, "loss": 0.0466, "step": 129000 }, { "epoch": 0.83, "eval_cer": 0.9198589989831657, "eval_loss": 0.02755168452858925, "eval_runtime": 119.9933, "eval_samples_per_second": 16.668, "eval_steps_per_second": 4.167, "step": 129000 }, { "epoch": 0.83, "learning_rate": 0.00017510084744121803, "loss": 0.0418, "step": 129010 }, { "epoch": 0.83, "learning_rate": 0.00017509116608686108, "loss": 0.0393, "step": 129020 }, { "epoch": 0.83, "learning_rate": 0.00017508148473250416, "loss": 0.0434, "step": 129030 }, { "epoch": 0.83, "learning_rate": 0.00017507180337814724, "loss": 0.0441, "step": 129040 }, { "epoch": 0.83, "learning_rate": 0.0001750621220237903, "loss": 0.0422, "step": 129050 }, { "epoch": 0.83, "learning_rate": 0.00017505244066943337, "loss": 0.0391, "step": 129060 }, { "epoch": 0.83, "learning_rate": 0.00017504275931507643, "loss": 0.0462, "step": 129070 }, { "epoch": 0.83, "learning_rate": 0.00017503307796071948, "loss": 0.0385, "step": 129080 }, { "epoch": 0.83, "learning_rate": 0.00017502339660636256, "loss": 0.0378, "step": 129090 }, { "epoch": 0.83, "learning_rate": 0.00017501371525200564, "loss": 0.0351, "step": 129100 }, { "epoch": 0.83, "learning_rate": 0.00017500403389764872, "loss": 0.0418, "step": 129110 }, { "epoch": 0.83, "learning_rate": 0.00017499435254329177, "loss": 0.0412, "step": 129120 }, { "epoch": 0.83, "learning_rate": 0.00017498467118893485, "loss": 0.0423, "step": 129130 }, { "epoch": 0.83, "learning_rate": 0.0001749749898345779, "loss": 0.0368, "step": 129140 }, { "epoch": 0.83, "learning_rate": 0.00017496530848022096, "loss": 0.0378, "step": 129150 }, { "epoch": 0.83, "learning_rate": 0.00017495562712586404, "loss": 0.0469, "step": 129160 }, { "epoch": 0.83, "learning_rate": 0.00017494594577150712, "loss": 0.0397, "step": 129170 }, { "epoch": 0.83, "learning_rate": 0.0001749362644171502, "loss": 0.0386, "step": 129180 }, { "epoch": 0.83, "learning_rate": 0.00017492658306279325, "loss": 0.0468, "step": 129190 }, { "epoch": 0.83, "learning_rate": 0.00017491690170843633, "loss": 0.0411, "step": 129200 }, { "epoch": 0.83, "learning_rate": 0.00017490722035407938, "loss": 0.045, "step": 129210 }, { "epoch": 0.83, "learning_rate": 0.00017489753899972243, "loss": 0.039, "step": 129220 }, { "epoch": 0.83, "learning_rate": 0.00017488785764536551, "loss": 0.0414, "step": 129230 }, { "epoch": 0.83, "learning_rate": 0.0001748781762910086, "loss": 0.0433, "step": 129240 }, { "epoch": 0.83, "learning_rate": 0.00017486849493665165, "loss": 0.0534, "step": 129250 }, { "epoch": 0.83, "learning_rate": 0.00017485881358229473, "loss": 0.0487, "step": 129260 }, { "epoch": 0.83, "learning_rate": 0.0001748491322279378, "loss": 0.0456, "step": 129270 }, { "epoch": 0.83, "learning_rate": 0.00017483945087358083, "loss": 0.0432, "step": 129280 }, { "epoch": 0.83, "learning_rate": 0.0001748297695192239, "loss": 0.0385, "step": 129290 }, { "epoch": 0.83, "learning_rate": 0.000174820088164867, "loss": 0.0461, "step": 129300 }, { "epoch": 0.83, "learning_rate": 0.00017481040681051007, "loss": 0.041, "step": 129310 }, { "epoch": 0.83, "learning_rate": 0.00017480072545615312, "loss": 0.0494, "step": 129320 }, { "epoch": 0.83, "learning_rate": 0.0001747910441017962, "loss": 0.0425, "step": 129330 }, { "epoch": 0.83, "learning_rate": 0.00017478136274743928, "loss": 0.0438, "step": 129340 }, { "epoch": 0.83, "learning_rate": 0.0001747716813930823, "loss": 0.0415, "step": 129350 }, { "epoch": 0.83, "learning_rate": 0.0001747620000387254, "loss": 0.039, "step": 129360 }, { "epoch": 0.83, "learning_rate": 0.00017475231868436847, "loss": 0.0415, "step": 129370 }, { "epoch": 0.84, "learning_rate": 0.00017474263733001155, "loss": 0.0437, "step": 129380 }, { "epoch": 0.84, "learning_rate": 0.0001747329559756546, "loss": 0.0453, "step": 129390 }, { "epoch": 0.84, "learning_rate": 0.00017472327462129768, "loss": 0.044, "step": 129400 }, { "epoch": 0.84, "learning_rate": 0.00017471359326694076, "loss": 0.0434, "step": 129410 }, { "epoch": 0.84, "learning_rate": 0.0001747039119125838, "loss": 0.0458, "step": 129420 }, { "epoch": 0.84, "learning_rate": 0.00017469423055822687, "loss": 0.0415, "step": 129430 }, { "epoch": 0.84, "learning_rate": 0.00017468454920386995, "loss": 0.0378, "step": 129440 }, { "epoch": 0.84, "learning_rate": 0.000174674867849513, "loss": 0.0408, "step": 129450 }, { "epoch": 0.84, "learning_rate": 0.00017466518649515608, "loss": 0.0467, "step": 129460 }, { "epoch": 0.84, "learning_rate": 0.00017465550514079916, "loss": 0.038, "step": 129470 }, { "epoch": 0.84, "learning_rate": 0.00017464582378644224, "loss": 0.0437, "step": 129480 }, { "epoch": 0.84, "learning_rate": 0.00017463614243208526, "loss": 0.042, "step": 129490 }, { "epoch": 0.84, "learning_rate": 0.00017462646107772834, "loss": 0.0351, "step": 129500 }, { "epoch": 0.84, "learning_rate": 0.00017461677972337142, "loss": 0.0441, "step": 129510 }, { "epoch": 0.84, "learning_rate": 0.00017460709836901448, "loss": 0.0413, "step": 129520 }, { "epoch": 0.84, "learning_rate": 0.00017459741701465756, "loss": 0.0441, "step": 129530 }, { "epoch": 0.84, "learning_rate": 0.00017458773566030064, "loss": 0.0414, "step": 129540 }, { "epoch": 0.84, "learning_rate": 0.00017457805430594372, "loss": 0.0451, "step": 129550 }, { "epoch": 0.84, "learning_rate": 0.00017456837295158674, "loss": 0.0456, "step": 129560 }, { "epoch": 0.84, "learning_rate": 0.00017455869159722982, "loss": 0.0504, "step": 129570 }, { "epoch": 0.84, "learning_rate": 0.0001745490102428729, "loss": 0.0426, "step": 129580 }, { "epoch": 0.84, "learning_rate": 0.00017453932888851595, "loss": 0.0428, "step": 129590 }, { "epoch": 0.84, "learning_rate": 0.00017452964753415903, "loss": 0.0394, "step": 129600 }, { "epoch": 0.84, "learning_rate": 0.0001745199661798021, "loss": 0.0355, "step": 129610 }, { "epoch": 0.84, "learning_rate": 0.0001745102848254452, "loss": 0.0436, "step": 129620 }, { "epoch": 0.84, "learning_rate": 0.00017450060347108822, "loss": 0.0405, "step": 129630 }, { "epoch": 0.84, "learning_rate": 0.0001744909221167313, "loss": 0.0402, "step": 129640 }, { "epoch": 0.84, "learning_rate": 0.00017448124076237435, "loss": 0.0441, "step": 129650 }, { "epoch": 0.84, "learning_rate": 0.00017447155940801743, "loss": 0.0404, "step": 129660 }, { "epoch": 0.84, "learning_rate": 0.0001744618780536605, "loss": 0.0424, "step": 129670 }, { "epoch": 0.84, "learning_rate": 0.0001744521966993036, "loss": 0.0457, "step": 129680 }, { "epoch": 0.84, "learning_rate": 0.00017444251534494664, "loss": 0.0409, "step": 129690 }, { "epoch": 0.84, "learning_rate": 0.0001744328339905897, "loss": 0.0508, "step": 129700 }, { "epoch": 0.84, "learning_rate": 0.00017442315263623278, "loss": 0.0407, "step": 129710 }, { "epoch": 0.84, "learning_rate": 0.00017441347128187583, "loss": 0.0384, "step": 129720 }, { "epoch": 0.84, "learning_rate": 0.0001744037899275189, "loss": 0.0422, "step": 129730 }, { "epoch": 0.84, "learning_rate": 0.000174394108573162, "loss": 0.0466, "step": 129740 }, { "epoch": 0.84, "learning_rate": 0.00017438442721880507, "loss": 0.0439, "step": 129750 }, { "epoch": 0.84, "learning_rate": 0.00017437474586444812, "loss": 0.0451, "step": 129760 }, { "epoch": 0.84, "learning_rate": 0.00017436506451009117, "loss": 0.0388, "step": 129770 }, { "epoch": 0.84, "learning_rate": 0.00017435538315573425, "loss": 0.0399, "step": 129780 }, { "epoch": 0.84, "learning_rate": 0.0001743457018013773, "loss": 0.0484, "step": 129790 }, { "epoch": 0.84, "learning_rate": 0.00017433602044702038, "loss": 0.0386, "step": 129800 }, { "epoch": 0.84, "learning_rate": 0.00017432633909266346, "loss": 0.0395, "step": 129810 }, { "epoch": 0.84, "learning_rate": 0.00017431665773830654, "loss": 0.0396, "step": 129820 }, { "epoch": 0.84, "learning_rate": 0.0001743069763839496, "loss": 0.0438, "step": 129830 }, { "epoch": 0.84, "learning_rate": 0.00017429729502959265, "loss": 0.0347, "step": 129840 }, { "epoch": 0.84, "learning_rate": 0.0001742876136752357, "loss": 0.0432, "step": 129850 }, { "epoch": 0.84, "learning_rate": 0.00017427793232087878, "loss": 0.0423, "step": 129860 }, { "epoch": 0.84, "learning_rate": 0.00017426825096652186, "loss": 0.0407, "step": 129870 }, { "epoch": 0.84, "learning_rate": 0.00017425856961216494, "loss": 0.04, "step": 129880 }, { "epoch": 0.84, "learning_rate": 0.000174248888257808, "loss": 0.0359, "step": 129890 }, { "epoch": 0.84, "learning_rate": 0.00017423920690345107, "loss": 0.0375, "step": 129900 }, { "epoch": 0.84, "learning_rate": 0.00017422952554909413, "loss": 0.042, "step": 129910 }, { "epoch": 0.84, "learning_rate": 0.00017421984419473718, "loss": 0.0393, "step": 129920 }, { "epoch": 0.84, "learning_rate": 0.00017421016284038026, "loss": 0.0406, "step": 129930 }, { "epoch": 0.84, "learning_rate": 0.00017420048148602334, "loss": 0.0397, "step": 129940 }, { "epoch": 0.84, "learning_rate": 0.00017419080013166642, "loss": 0.0428, "step": 129950 }, { "epoch": 0.84, "learning_rate": 0.00017418111877730947, "loss": 0.038, "step": 129960 }, { "epoch": 0.84, "learning_rate": 0.00017417143742295255, "loss": 0.0456, "step": 129970 }, { "epoch": 0.84, "learning_rate": 0.0001741617560685956, "loss": 0.0417, "step": 129980 }, { "epoch": 0.84, "learning_rate": 0.00017415207471423866, "loss": 0.0365, "step": 129990 }, { "epoch": 0.84, "learning_rate": 0.00017414239335988174, "loss": 0.048, "step": 130000 }, { "epoch": 0.84, "eval_cer": 0.9200705005084171, "eval_loss": 0.027759570628404617, "eval_runtime": 119.9767, "eval_samples_per_second": 16.67, "eval_steps_per_second": 4.167, "step": 130000 }, { "epoch": 0.84, "learning_rate": 0.00017413271200552482, "loss": 0.0449, "step": 130010 }, { "epoch": 0.84, "learning_rate": 0.0001741230306511679, "loss": 0.0449, "step": 130020 }, { "epoch": 0.84, "learning_rate": 0.00017411334929681095, "loss": 0.0391, "step": 130030 }, { "epoch": 0.84, "learning_rate": 0.00017410366794245403, "loss": 0.0437, "step": 130040 }, { "epoch": 0.84, "learning_rate": 0.00017409398658809705, "loss": 0.0405, "step": 130050 }, { "epoch": 0.84, "learning_rate": 0.00017408430523374013, "loss": 0.0438, "step": 130060 }, { "epoch": 0.84, "learning_rate": 0.00017407462387938321, "loss": 0.0419, "step": 130070 }, { "epoch": 0.84, "learning_rate": 0.0001740649425250263, "loss": 0.0374, "step": 130080 }, { "epoch": 0.84, "learning_rate": 0.00017405526117066935, "loss": 0.0395, "step": 130090 }, { "epoch": 0.84, "learning_rate": 0.00017404557981631243, "loss": 0.039, "step": 130100 }, { "epoch": 0.84, "learning_rate": 0.0001740358984619555, "loss": 0.0373, "step": 130110 }, { "epoch": 0.84, "learning_rate": 0.00017402621710759853, "loss": 0.0426, "step": 130120 }, { "epoch": 0.84, "learning_rate": 0.0001740165357532416, "loss": 0.0419, "step": 130130 }, { "epoch": 0.84, "learning_rate": 0.0001740068543988847, "loss": 0.0461, "step": 130140 }, { "epoch": 0.84, "learning_rate": 0.00017399717304452777, "loss": 0.0405, "step": 130150 }, { "epoch": 0.84, "learning_rate": 0.00017398749169017082, "loss": 0.0387, "step": 130160 }, { "epoch": 0.84, "learning_rate": 0.0001739778103358139, "loss": 0.038, "step": 130170 }, { "epoch": 0.84, "learning_rate": 0.00017396812898145698, "loss": 0.0424, "step": 130180 }, { "epoch": 0.84, "learning_rate": 0.0001739584476271, "loss": 0.0409, "step": 130190 }, { "epoch": 0.84, "learning_rate": 0.0001739487662727431, "loss": 0.0448, "step": 130200 }, { "epoch": 0.84, "learning_rate": 0.00017393908491838617, "loss": 0.0453, "step": 130210 }, { "epoch": 0.84, "learning_rate": 0.00017392940356402925, "loss": 0.0398, "step": 130220 }, { "epoch": 0.84, "learning_rate": 0.0001739197222096723, "loss": 0.0396, "step": 130230 }, { "epoch": 0.84, "learning_rate": 0.00017391004085531538, "loss": 0.0413, "step": 130240 }, { "epoch": 0.84, "learning_rate": 0.00017390035950095846, "loss": 0.0361, "step": 130250 }, { "epoch": 0.84, "learning_rate": 0.00017389067814660149, "loss": 0.0472, "step": 130260 }, { "epoch": 0.84, "learning_rate": 0.00017388099679224457, "loss": 0.0438, "step": 130270 }, { "epoch": 0.84, "learning_rate": 0.00017387131543788765, "loss": 0.0371, "step": 130280 }, { "epoch": 0.84, "learning_rate": 0.0001738616340835307, "loss": 0.0377, "step": 130290 }, { "epoch": 0.84, "learning_rate": 0.00017385195272917378, "loss": 0.0426, "step": 130300 }, { "epoch": 0.84, "learning_rate": 0.00017384227137481686, "loss": 0.0405, "step": 130310 }, { "epoch": 0.84, "learning_rate": 0.00017383259002045994, "loss": 0.0428, "step": 130320 }, { "epoch": 0.84, "learning_rate": 0.00017382290866610296, "loss": 0.0509, "step": 130330 }, { "epoch": 0.84, "learning_rate": 0.00017381322731174604, "loss": 0.0366, "step": 130340 }, { "epoch": 0.84, "learning_rate": 0.00017380354595738912, "loss": 0.0408, "step": 130350 }, { "epoch": 0.84, "learning_rate": 0.00017379386460303218, "loss": 0.0382, "step": 130360 }, { "epoch": 0.84, "learning_rate": 0.00017378418324867526, "loss": 0.0406, "step": 130370 }, { "epoch": 0.84, "learning_rate": 0.00017377450189431834, "loss": 0.0385, "step": 130380 }, { "epoch": 0.84, "learning_rate": 0.00017376482053996141, "loss": 0.0459, "step": 130390 }, { "epoch": 0.84, "learning_rate": 0.00017375513918560444, "loss": 0.0398, "step": 130400 }, { "epoch": 0.84, "learning_rate": 0.00017374545783124752, "loss": 0.0427, "step": 130410 }, { "epoch": 0.84, "learning_rate": 0.0001737357764768906, "loss": 0.0541, "step": 130420 }, { "epoch": 0.84, "learning_rate": 0.00017372609512253365, "loss": 0.0397, "step": 130430 }, { "epoch": 0.84, "learning_rate": 0.00017371641376817673, "loss": 0.051, "step": 130440 }, { "epoch": 0.84, "learning_rate": 0.0001737067324138198, "loss": 0.0392, "step": 130450 }, { "epoch": 0.84, "learning_rate": 0.00017369705105946287, "loss": 0.0375, "step": 130460 }, { "epoch": 0.84, "learning_rate": 0.00017368736970510592, "loss": 0.0455, "step": 130470 }, { "epoch": 0.84, "learning_rate": 0.000173677688350749, "loss": 0.0429, "step": 130480 }, { "epoch": 0.84, "learning_rate": 0.00017366800699639205, "loss": 0.0397, "step": 130490 }, { "epoch": 0.84, "learning_rate": 0.00017365832564203513, "loss": 0.0416, "step": 130500 }, { "epoch": 0.84, "learning_rate": 0.0001736486442876782, "loss": 0.0454, "step": 130510 }, { "epoch": 0.84, "learning_rate": 0.0001736389629333213, "loss": 0.0412, "step": 130520 }, { "epoch": 0.84, "learning_rate": 0.00017362928157896434, "loss": 0.0391, "step": 130530 }, { "epoch": 0.84, "learning_rate": 0.0001736196002246074, "loss": 0.0382, "step": 130540 }, { "epoch": 0.84, "learning_rate": 0.00017360991887025047, "loss": 0.047, "step": 130550 }, { "epoch": 0.84, "learning_rate": 0.00017360023751589353, "loss": 0.0474, "step": 130560 }, { "epoch": 0.84, "learning_rate": 0.0001735905561615366, "loss": 0.0391, "step": 130570 }, { "epoch": 0.84, "learning_rate": 0.0001735808748071797, "loss": 0.0408, "step": 130580 }, { "epoch": 0.84, "learning_rate": 0.00017357119345282277, "loss": 0.0402, "step": 130590 }, { "epoch": 0.84, "learning_rate": 0.00017356151209846582, "loss": 0.0432, "step": 130600 }, { "epoch": 0.84, "learning_rate": 0.00017355183074410887, "loss": 0.0434, "step": 130610 }, { "epoch": 0.84, "learning_rate": 0.00017354214938975195, "loss": 0.0424, "step": 130620 }, { "epoch": 0.84, "learning_rate": 0.000173532468035395, "loss": 0.0418, "step": 130630 }, { "epoch": 0.84, "learning_rate": 0.00017352278668103808, "loss": 0.0479, "step": 130640 }, { "epoch": 0.84, "learning_rate": 0.00017351310532668116, "loss": 0.0399, "step": 130650 }, { "epoch": 0.84, "learning_rate": 0.00017350342397232422, "loss": 0.0488, "step": 130660 }, { "epoch": 0.84, "learning_rate": 0.0001734937426179673, "loss": 0.0459, "step": 130670 }, { "epoch": 0.84, "learning_rate": 0.00017348406126361035, "loss": 0.0429, "step": 130680 }, { "epoch": 0.84, "learning_rate": 0.0001734743799092534, "loss": 0.0503, "step": 130690 }, { "epoch": 0.84, "learning_rate": 0.00017346469855489648, "loss": 0.0488, "step": 130700 }, { "epoch": 0.84, "learning_rate": 0.00017345501720053956, "loss": 0.042, "step": 130710 }, { "epoch": 0.84, "learning_rate": 0.00017344533584618264, "loss": 0.0478, "step": 130720 }, { "epoch": 0.84, "learning_rate": 0.0001734356544918257, "loss": 0.0448, "step": 130730 }, { "epoch": 0.84, "learning_rate": 0.00017342597313746877, "loss": 0.0401, "step": 130740 }, { "epoch": 0.84, "learning_rate": 0.00017341629178311183, "loss": 0.0374, "step": 130750 }, { "epoch": 0.84, "learning_rate": 0.00017340661042875488, "loss": 0.0432, "step": 130760 }, { "epoch": 0.84, "learning_rate": 0.00017339692907439796, "loss": 0.0473, "step": 130770 }, { "epoch": 0.84, "learning_rate": 0.00017338724772004104, "loss": 0.0414, "step": 130780 }, { "epoch": 0.84, "learning_rate": 0.00017337756636568412, "loss": 0.0475, "step": 130790 }, { "epoch": 0.84, "learning_rate": 0.00017336788501132717, "loss": 0.0431, "step": 130800 }, { "epoch": 0.84, "learning_rate": 0.00017335820365697025, "loss": 0.0412, "step": 130810 }, { "epoch": 0.84, "learning_rate": 0.0001733485223026133, "loss": 0.043, "step": 130820 }, { "epoch": 0.84, "learning_rate": 0.00017333884094825636, "loss": 0.0398, "step": 130830 }, { "epoch": 0.84, "learning_rate": 0.00017332915959389944, "loss": 0.0377, "step": 130840 }, { "epoch": 0.84, "learning_rate": 0.00017331947823954252, "loss": 0.0456, "step": 130850 }, { "epoch": 0.84, "learning_rate": 0.00017330979688518557, "loss": 0.0503, "step": 130860 }, { "epoch": 0.84, "learning_rate": 0.00017330011553082865, "loss": 0.0369, "step": 130870 }, { "epoch": 0.84, "learning_rate": 0.00017329043417647173, "loss": 0.0378, "step": 130880 }, { "epoch": 0.84, "learning_rate": 0.00017328075282211475, "loss": 0.0399, "step": 130890 }, { "epoch": 0.84, "learning_rate": 0.00017327107146775783, "loss": 0.0456, "step": 130900 }, { "epoch": 0.84, "learning_rate": 0.00017326139011340091, "loss": 0.045, "step": 130910 }, { "epoch": 0.84, "learning_rate": 0.000173251708759044, "loss": 0.0337, "step": 130920 }, { "epoch": 0.85, "learning_rate": 0.00017324202740468705, "loss": 0.0427, "step": 130930 }, { "epoch": 0.85, "learning_rate": 0.00017323234605033013, "loss": 0.0418, "step": 130940 }, { "epoch": 0.85, "learning_rate": 0.0001732226646959732, "loss": 0.0379, "step": 130950 }, { "epoch": 0.85, "learning_rate": 0.00017321298334161623, "loss": 0.0463, "step": 130960 }, { "epoch": 0.85, "learning_rate": 0.0001732033019872593, "loss": 0.0456, "step": 130970 }, { "epoch": 0.85, "learning_rate": 0.0001731936206329024, "loss": 0.0439, "step": 130980 }, { "epoch": 0.85, "learning_rate": 0.00017318393927854547, "loss": 0.0475, "step": 130990 }, { "epoch": 0.85, "learning_rate": 0.00017317425792418852, "loss": 0.046, "step": 131000 }, { "epoch": 0.85, "eval_cer": 0.9198933453847022, "eval_loss": 0.027897853404283524, "eval_runtime": 120.109, "eval_samples_per_second": 16.652, "eval_steps_per_second": 4.163, "step": 131000 }, { "epoch": 0.85, "learning_rate": 0.0001731645765698316, "loss": 0.041, "step": 131010 }, { "epoch": 0.85, "learning_rate": 0.00017315489521547468, "loss": 0.0381, "step": 131020 }, { "epoch": 0.85, "learning_rate": 0.0001731452138611177, "loss": 0.0421, "step": 131030 }, { "epoch": 0.85, "learning_rate": 0.0001731355325067608, "loss": 0.0418, "step": 131040 }, { "epoch": 0.85, "learning_rate": 0.00017312585115240387, "loss": 0.039, "step": 131050 }, { "epoch": 0.85, "learning_rate": 0.00017311616979804692, "loss": 0.0444, "step": 131060 }, { "epoch": 0.85, "learning_rate": 0.00017310648844369, "loss": 0.0419, "step": 131070 }, { "epoch": 0.85, "learning_rate": 0.00017309680708933308, "loss": 0.0396, "step": 131080 }, { "epoch": 0.85, "learning_rate": 0.00017308712573497616, "loss": 0.0399, "step": 131090 }, { "epoch": 0.85, "learning_rate": 0.00017307744438061919, "loss": 0.0428, "step": 131100 }, { "epoch": 0.85, "learning_rate": 0.00017306776302626227, "loss": 0.0487, "step": 131110 }, { "epoch": 0.85, "learning_rate": 0.00017305808167190535, "loss": 0.042, "step": 131120 }, { "epoch": 0.85, "learning_rate": 0.0001730484003175484, "loss": 0.0399, "step": 131130 }, { "epoch": 0.85, "learning_rate": 0.00017303871896319148, "loss": 0.0366, "step": 131140 }, { "epoch": 0.85, "learning_rate": 0.00017302903760883456, "loss": 0.0481, "step": 131150 }, { "epoch": 0.85, "learning_rate": 0.00017301935625447764, "loss": 0.0384, "step": 131160 }, { "epoch": 0.85, "learning_rate": 0.00017300967490012066, "loss": 0.0386, "step": 131170 }, { "epoch": 0.85, "learning_rate": 0.00017299999354576374, "loss": 0.0432, "step": 131180 }, { "epoch": 0.85, "learning_rate": 0.00017299031219140682, "loss": 0.0446, "step": 131190 }, { "epoch": 0.85, "learning_rate": 0.00017298063083704988, "loss": 0.04, "step": 131200 }, { "epoch": 0.85, "learning_rate": 0.00017297094948269295, "loss": 0.0359, "step": 131210 }, { "epoch": 0.85, "learning_rate": 0.00017296126812833603, "loss": 0.0455, "step": 131220 }, { "epoch": 0.85, "learning_rate": 0.0001729515867739791, "loss": 0.0344, "step": 131230 }, { "epoch": 0.85, "learning_rate": 0.00017294190541962214, "loss": 0.0465, "step": 131240 }, { "epoch": 0.85, "learning_rate": 0.00017293222406526522, "loss": 0.0467, "step": 131250 }, { "epoch": 0.85, "learning_rate": 0.00017292254271090827, "loss": 0.0398, "step": 131260 }, { "epoch": 0.85, "learning_rate": 0.00017291286135655135, "loss": 0.0333, "step": 131270 }, { "epoch": 0.85, "learning_rate": 0.00017290318000219443, "loss": 0.0384, "step": 131280 }, { "epoch": 0.85, "learning_rate": 0.0001728934986478375, "loss": 0.0361, "step": 131290 }, { "epoch": 0.85, "learning_rate": 0.00017288381729348056, "loss": 0.0386, "step": 131300 }, { "epoch": 0.85, "learning_rate": 0.00017287413593912362, "loss": 0.0397, "step": 131310 }, { "epoch": 0.85, "learning_rate": 0.0001728644545847667, "loss": 0.0443, "step": 131320 }, { "epoch": 0.85, "learning_rate": 0.00017285477323040975, "loss": 0.0434, "step": 131330 }, { "epoch": 0.85, "learning_rate": 0.00017284509187605283, "loss": 0.0414, "step": 131340 }, { "epoch": 0.85, "learning_rate": 0.0001728354105216959, "loss": 0.046, "step": 131350 }, { "epoch": 0.85, "learning_rate": 0.000172825729167339, "loss": 0.0412, "step": 131360 }, { "epoch": 0.85, "learning_rate": 0.00017281604781298204, "loss": 0.0448, "step": 131370 }, { "epoch": 0.85, "learning_rate": 0.0001728063664586251, "loss": 0.0472, "step": 131380 }, { "epoch": 0.85, "learning_rate": 0.00017279668510426817, "loss": 0.045, "step": 131390 }, { "epoch": 0.85, "learning_rate": 0.00017278700374991123, "loss": 0.0403, "step": 131400 }, { "epoch": 0.85, "learning_rate": 0.0001727773223955543, "loss": 0.045, "step": 131410 }, { "epoch": 0.85, "learning_rate": 0.0001727676410411974, "loss": 0.0426, "step": 131420 }, { "epoch": 0.85, "learning_rate": 0.00017275795968684044, "loss": 0.044, "step": 131430 }, { "epoch": 0.85, "learning_rate": 0.00017274827833248352, "loss": 0.0365, "step": 131440 }, { "epoch": 0.85, "learning_rate": 0.00017273859697812657, "loss": 0.0409, "step": 131450 }, { "epoch": 0.85, "learning_rate": 0.00017272891562376962, "loss": 0.0441, "step": 131460 }, { "epoch": 0.85, "learning_rate": 0.0001727192342694127, "loss": 0.0408, "step": 131470 }, { "epoch": 0.85, "learning_rate": 0.00017270955291505578, "loss": 0.038, "step": 131480 }, { "epoch": 0.85, "learning_rate": 0.00017269987156069886, "loss": 0.0431, "step": 131490 }, { "epoch": 0.85, "learning_rate": 0.00017269019020634192, "loss": 0.0373, "step": 131500 }, { "epoch": 0.85, "learning_rate": 0.000172680508851985, "loss": 0.0389, "step": 131510 }, { "epoch": 0.85, "learning_rate": 0.00017267082749762805, "loss": 0.0445, "step": 131520 }, { "epoch": 0.85, "learning_rate": 0.0001726611461432711, "loss": 0.0447, "step": 131530 }, { "epoch": 0.85, "learning_rate": 0.00017265146478891418, "loss": 0.0466, "step": 131540 }, { "epoch": 0.85, "learning_rate": 0.00017264178343455726, "loss": 0.0427, "step": 131550 }, { "epoch": 0.85, "learning_rate": 0.00017263210208020034, "loss": 0.0388, "step": 131560 }, { "epoch": 0.85, "learning_rate": 0.0001726224207258434, "loss": 0.0371, "step": 131570 }, { "epoch": 0.85, "learning_rate": 0.00017261273937148647, "loss": 0.0322, "step": 131580 }, { "epoch": 0.85, "learning_rate": 0.00017260305801712953, "loss": 0.0352, "step": 131590 }, { "epoch": 0.85, "learning_rate": 0.00017259337666277258, "loss": 0.0396, "step": 131600 }, { "epoch": 0.85, "learning_rate": 0.00017258369530841566, "loss": 0.0444, "step": 131610 }, { "epoch": 0.85, "learning_rate": 0.00017257401395405874, "loss": 0.0396, "step": 131620 }, { "epoch": 0.85, "learning_rate": 0.0001725643325997018, "loss": 0.0417, "step": 131630 }, { "epoch": 0.85, "learning_rate": 0.00017255465124534487, "loss": 0.0406, "step": 131640 }, { "epoch": 0.85, "learning_rate": 0.00017254496989098795, "loss": 0.0377, "step": 131650 }, { "epoch": 0.85, "learning_rate": 0.00017253528853663098, "loss": 0.0472, "step": 131660 }, { "epoch": 0.85, "learning_rate": 0.00017252560718227406, "loss": 0.04, "step": 131670 }, { "epoch": 0.85, "learning_rate": 0.00017251592582791714, "loss": 0.0448, "step": 131680 }, { "epoch": 0.85, "learning_rate": 0.00017250624447356022, "loss": 0.0369, "step": 131690 }, { "epoch": 0.85, "learning_rate": 0.00017249656311920327, "loss": 0.0446, "step": 131700 }, { "epoch": 0.85, "learning_rate": 0.00017248688176484635, "loss": 0.0417, "step": 131710 }, { "epoch": 0.85, "learning_rate": 0.00017247720041048943, "loss": 0.0469, "step": 131720 }, { "epoch": 0.85, "learning_rate": 0.00017246751905613245, "loss": 0.0384, "step": 131730 }, { "epoch": 0.85, "learning_rate": 0.00017245783770177553, "loss": 0.041, "step": 131740 }, { "epoch": 0.85, "learning_rate": 0.0001724481563474186, "loss": 0.0448, "step": 131750 }, { "epoch": 0.85, "learning_rate": 0.0001724384749930617, "loss": 0.0387, "step": 131760 }, { "epoch": 0.85, "learning_rate": 0.00017242879363870475, "loss": 0.0449, "step": 131770 }, { "epoch": 0.85, "learning_rate": 0.00017241911228434783, "loss": 0.0413, "step": 131780 }, { "epoch": 0.85, "learning_rate": 0.0001724094309299909, "loss": 0.038, "step": 131790 }, { "epoch": 0.85, "learning_rate": 0.00017239974957563393, "loss": 0.0404, "step": 131800 }, { "epoch": 0.85, "learning_rate": 0.000172390068221277, "loss": 0.0361, "step": 131810 }, { "epoch": 0.85, "learning_rate": 0.0001723803868669201, "loss": 0.0392, "step": 131820 }, { "epoch": 0.85, "learning_rate": 0.00017237070551256314, "loss": 0.0426, "step": 131830 }, { "epoch": 0.85, "learning_rate": 0.00017236102415820622, "loss": 0.0393, "step": 131840 }, { "epoch": 0.85, "learning_rate": 0.0001723513428038493, "loss": 0.0512, "step": 131850 }, { "epoch": 0.85, "learning_rate": 0.00017234166144949238, "loss": 0.0415, "step": 131860 }, { "epoch": 0.85, "learning_rate": 0.0001723319800951354, "loss": 0.0415, "step": 131870 }, { "epoch": 0.85, "learning_rate": 0.0001723222987407785, "loss": 0.0451, "step": 131880 }, { "epoch": 0.85, "learning_rate": 0.00017231261738642157, "loss": 0.0403, "step": 131890 }, { "epoch": 0.85, "learning_rate": 0.00017230293603206462, "loss": 0.0385, "step": 131900 }, { "epoch": 0.85, "learning_rate": 0.0001722932546777077, "loss": 0.0434, "step": 131910 }, { "epoch": 0.85, "learning_rate": 0.00017228357332335078, "loss": 0.0441, "step": 131920 }, { "epoch": 0.85, "learning_rate": 0.00017227389196899386, "loss": 0.0385, "step": 131930 }, { "epoch": 0.85, "learning_rate": 0.00017226421061463689, "loss": 0.0405, "step": 131940 }, { "epoch": 0.85, "learning_rate": 0.00017225452926027997, "loss": 0.0367, "step": 131950 }, { "epoch": 0.85, "learning_rate": 0.00017224484790592304, "loss": 0.0424, "step": 131960 }, { "epoch": 0.85, "learning_rate": 0.0001722351665515661, "loss": 0.0378, "step": 131970 }, { "epoch": 0.85, "learning_rate": 0.00017222548519720918, "loss": 0.0361, "step": 131980 }, { "epoch": 0.85, "learning_rate": 0.00017221580384285226, "loss": 0.036, "step": 131990 }, { "epoch": 0.85, "learning_rate": 0.00017220612248849534, "loss": 0.0431, "step": 132000 }, { "epoch": 0.85, "eval_cer": 0.9199023839114224, "eval_loss": 0.02698080614209175, "eval_runtime": 119.8592, "eval_samples_per_second": 16.686, "eval_steps_per_second": 4.172, "step": 132000 }, { "epoch": 0.85, "learning_rate": 0.00017219644113413836, "loss": 0.0361, "step": 132010 }, { "epoch": 0.85, "learning_rate": 0.00017218675977978144, "loss": 0.042, "step": 132020 }, { "epoch": 0.85, "learning_rate": 0.0001721770784254245, "loss": 0.0419, "step": 132030 }, { "epoch": 0.85, "learning_rate": 0.00017216739707106757, "loss": 0.0405, "step": 132040 }, { "epoch": 0.85, "learning_rate": 0.00017215771571671065, "loss": 0.0392, "step": 132050 }, { "epoch": 0.85, "learning_rate": 0.00017214803436235373, "loss": 0.0426, "step": 132060 }, { "epoch": 0.85, "learning_rate": 0.0001721383530079968, "loss": 0.0427, "step": 132070 }, { "epoch": 0.85, "learning_rate": 0.00017212867165363984, "loss": 0.0444, "step": 132080 }, { "epoch": 0.85, "learning_rate": 0.00017211899029928292, "loss": 0.035, "step": 132090 }, { "epoch": 0.85, "learning_rate": 0.00017210930894492597, "loss": 0.0454, "step": 132100 }, { "epoch": 0.85, "learning_rate": 0.00017209962759056905, "loss": 0.046, "step": 132110 }, { "epoch": 0.85, "learning_rate": 0.00017208994623621213, "loss": 0.0384, "step": 132120 }, { "epoch": 0.85, "learning_rate": 0.0001720802648818552, "loss": 0.0372, "step": 132130 }, { "epoch": 0.85, "learning_rate": 0.00017207058352749826, "loss": 0.0381, "step": 132140 }, { "epoch": 0.85, "learning_rate": 0.00017206090217314132, "loss": 0.0474, "step": 132150 }, { "epoch": 0.85, "learning_rate": 0.0001720512208187844, "loss": 0.0437, "step": 132160 }, { "epoch": 0.85, "learning_rate": 0.00017204153946442745, "loss": 0.0409, "step": 132170 }, { "epoch": 0.85, "learning_rate": 0.00017203185811007053, "loss": 0.0388, "step": 132180 }, { "epoch": 0.85, "learning_rate": 0.0001720221767557136, "loss": 0.0507, "step": 132190 }, { "epoch": 0.85, "learning_rate": 0.0001720124954013567, "loss": 0.0459, "step": 132200 }, { "epoch": 0.85, "learning_rate": 0.00017200281404699974, "loss": 0.0471, "step": 132210 }, { "epoch": 0.85, "learning_rate": 0.0001719931326926428, "loss": 0.0393, "step": 132220 }, { "epoch": 0.85, "learning_rate": 0.00017198345133828585, "loss": 0.0377, "step": 132230 }, { "epoch": 0.85, "learning_rate": 0.00017197376998392893, "loss": 0.0418, "step": 132240 }, { "epoch": 0.85, "learning_rate": 0.000171964088629572, "loss": 0.0477, "step": 132250 }, { "epoch": 0.85, "learning_rate": 0.00017195440727521509, "loss": 0.0373, "step": 132260 }, { "epoch": 0.85, "learning_rate": 0.00017194472592085814, "loss": 0.0484, "step": 132270 }, { "epoch": 0.85, "learning_rate": 0.00017193504456650122, "loss": 0.0436, "step": 132280 }, { "epoch": 0.85, "learning_rate": 0.00017192536321214427, "loss": 0.0416, "step": 132290 }, { "epoch": 0.85, "learning_rate": 0.00017191568185778732, "loss": 0.0406, "step": 132300 }, { "epoch": 0.85, "learning_rate": 0.0001719060005034304, "loss": 0.0418, "step": 132310 }, { "epoch": 0.85, "learning_rate": 0.00017189631914907348, "loss": 0.0391, "step": 132320 }, { "epoch": 0.85, "learning_rate": 0.00017188663779471656, "loss": 0.0356, "step": 132330 }, { "epoch": 0.85, "learning_rate": 0.00017187695644035962, "loss": 0.0388, "step": 132340 }, { "epoch": 0.85, "learning_rate": 0.0001718672750860027, "loss": 0.0425, "step": 132350 }, { "epoch": 0.85, "learning_rate": 0.00017185759373164575, "loss": 0.0365, "step": 132360 }, { "epoch": 0.85, "learning_rate": 0.0001718479123772888, "loss": 0.0433, "step": 132370 }, { "epoch": 0.85, "learning_rate": 0.00017183823102293188, "loss": 0.0383, "step": 132380 }, { "epoch": 0.85, "learning_rate": 0.00017182854966857496, "loss": 0.0511, "step": 132390 }, { "epoch": 0.85, "learning_rate": 0.00017181886831421804, "loss": 0.041, "step": 132400 }, { "epoch": 0.85, "learning_rate": 0.0001718091869598611, "loss": 0.0422, "step": 132410 }, { "epoch": 0.85, "learning_rate": 0.00017179950560550417, "loss": 0.04, "step": 132420 }, { "epoch": 0.85, "learning_rate": 0.0001717898242511472, "loss": 0.0455, "step": 132430 }, { "epoch": 0.85, "learning_rate": 0.00017178014289679028, "loss": 0.0431, "step": 132440 }, { "epoch": 0.85, "learning_rate": 0.00017177046154243336, "loss": 0.0329, "step": 132450 }, { "epoch": 0.85, "learning_rate": 0.00017176078018807644, "loss": 0.0386, "step": 132460 }, { "epoch": 0.85, "learning_rate": 0.0001717510988337195, "loss": 0.0463, "step": 132470 }, { "epoch": 0.86, "learning_rate": 0.00017174141747936257, "loss": 0.0368, "step": 132480 }, { "epoch": 0.86, "learning_rate": 0.00017173173612500565, "loss": 0.0441, "step": 132490 }, { "epoch": 0.86, "learning_rate": 0.00017172205477064868, "loss": 0.0394, "step": 132500 }, { "epoch": 0.86, "learning_rate": 0.00017171237341629176, "loss": 0.0432, "step": 132510 }, { "epoch": 0.86, "learning_rate": 0.00017170269206193484, "loss": 0.041, "step": 132520 }, { "epoch": 0.86, "learning_rate": 0.00017169301070757792, "loss": 0.0408, "step": 132530 }, { "epoch": 0.86, "learning_rate": 0.00017168332935322097, "loss": 0.0397, "step": 132540 }, { "epoch": 0.86, "learning_rate": 0.00017167364799886405, "loss": 0.0359, "step": 132550 }, { "epoch": 0.86, "learning_rate": 0.00017166396664450713, "loss": 0.0451, "step": 132560 }, { "epoch": 0.86, "learning_rate": 0.00017165428529015015, "loss": 0.0445, "step": 132570 }, { "epoch": 0.86, "learning_rate": 0.00017164460393579323, "loss": 0.0427, "step": 132580 }, { "epoch": 0.86, "learning_rate": 0.0001716349225814363, "loss": 0.0343, "step": 132590 }, { "epoch": 0.86, "learning_rate": 0.0001716252412270794, "loss": 0.0397, "step": 132600 }, { "epoch": 0.86, "learning_rate": 0.00017161555987272245, "loss": 0.0436, "step": 132610 }, { "epoch": 0.86, "learning_rate": 0.00017160587851836553, "loss": 0.0376, "step": 132620 }, { "epoch": 0.86, "learning_rate": 0.0001715961971640086, "loss": 0.0425, "step": 132630 }, { "epoch": 0.86, "learning_rate": 0.00017158651580965163, "loss": 0.0398, "step": 132640 }, { "epoch": 0.86, "learning_rate": 0.0001715768344552947, "loss": 0.0443, "step": 132650 }, { "epoch": 0.86, "learning_rate": 0.0001715671531009378, "loss": 0.0422, "step": 132660 }, { "epoch": 0.86, "learning_rate": 0.00017155747174658084, "loss": 0.0425, "step": 132670 }, { "epoch": 0.86, "learning_rate": 0.00017154779039222392, "loss": 0.0397, "step": 132680 }, { "epoch": 0.86, "learning_rate": 0.000171538109037867, "loss": 0.0432, "step": 132690 }, { "epoch": 0.86, "learning_rate": 0.00017152842768351008, "loss": 0.0389, "step": 132700 }, { "epoch": 0.86, "learning_rate": 0.0001715187463291531, "loss": 0.0529, "step": 132710 }, { "epoch": 0.86, "learning_rate": 0.0001715090649747962, "loss": 0.0457, "step": 132720 }, { "epoch": 0.86, "learning_rate": 0.00017149938362043927, "loss": 0.0406, "step": 132730 }, { "epoch": 0.86, "learning_rate": 0.00017148970226608232, "loss": 0.0377, "step": 132740 }, { "epoch": 0.86, "learning_rate": 0.0001714800209117254, "loss": 0.0367, "step": 132750 }, { "epoch": 0.86, "learning_rate": 0.00017147033955736848, "loss": 0.0487, "step": 132760 }, { "epoch": 0.86, "learning_rate": 0.00017146065820301156, "loss": 0.0432, "step": 132770 }, { "epoch": 0.86, "learning_rate": 0.00017145097684865458, "loss": 0.0406, "step": 132780 }, { "epoch": 0.86, "learning_rate": 0.00017144129549429766, "loss": 0.0527, "step": 132790 }, { "epoch": 0.86, "learning_rate": 0.00017143161413994074, "loss": 0.0396, "step": 132800 }, { "epoch": 0.86, "learning_rate": 0.0001714219327855838, "loss": 0.0399, "step": 132810 }, { "epoch": 0.86, "learning_rate": 0.00017141225143122688, "loss": 0.0404, "step": 132820 }, { "epoch": 0.86, "learning_rate": 0.00017140257007686996, "loss": 0.0392, "step": 132830 }, { "epoch": 0.86, "learning_rate": 0.000171392888722513, "loss": 0.0549, "step": 132840 }, { "epoch": 0.86, "learning_rate": 0.00017138320736815606, "loss": 0.0434, "step": 132850 }, { "epoch": 0.86, "learning_rate": 0.00017137352601379914, "loss": 0.0435, "step": 132860 }, { "epoch": 0.86, "learning_rate": 0.0001713638446594422, "loss": 0.0373, "step": 132870 }, { "epoch": 0.86, "learning_rate": 0.00017135416330508527, "loss": 0.0454, "step": 132880 }, { "epoch": 0.86, "learning_rate": 0.00017134448195072835, "loss": 0.0418, "step": 132890 }, { "epoch": 0.86, "learning_rate": 0.00017133480059637143, "loss": 0.0436, "step": 132900 }, { "epoch": 0.86, "learning_rate": 0.0001713251192420145, "loss": 0.0432, "step": 132910 }, { "epoch": 0.86, "learning_rate": 0.00017131543788765754, "loss": 0.0438, "step": 132920 }, { "epoch": 0.86, "learning_rate": 0.00017130575653330062, "loss": 0.0447, "step": 132930 }, { "epoch": 0.86, "learning_rate": 0.00017129607517894367, "loss": 0.0453, "step": 132940 }, { "epoch": 0.86, "learning_rate": 0.00017128639382458675, "loss": 0.043, "step": 132950 }, { "epoch": 0.86, "learning_rate": 0.00017127671247022983, "loss": 0.0468, "step": 132960 }, { "epoch": 0.86, "learning_rate": 0.0001712670311158729, "loss": 0.0397, "step": 132970 }, { "epoch": 0.86, "learning_rate": 0.00017125734976151596, "loss": 0.0438, "step": 132980 }, { "epoch": 0.86, "learning_rate": 0.00017124766840715902, "loss": 0.0447, "step": 132990 }, { "epoch": 0.86, "learning_rate": 0.0001712379870528021, "loss": 0.047, "step": 133000 }, { "epoch": 0.86, "eval_cer": 0.9198843068579822, "eval_loss": 0.02717752754688263, "eval_runtime": 119.8783, "eval_samples_per_second": 16.684, "eval_steps_per_second": 4.171, "step": 133000 }, { "epoch": 0.86, "learning_rate": 0.00017122830569844515, "loss": 0.0351, "step": 133010 }, { "epoch": 0.86, "learning_rate": 0.00017121862434408823, "loss": 0.0372, "step": 133020 }, { "epoch": 0.86, "learning_rate": 0.0001712089429897313, "loss": 0.0383, "step": 133030 }, { "epoch": 0.86, "learning_rate": 0.00017119926163537436, "loss": 0.0396, "step": 133040 }, { "epoch": 0.86, "learning_rate": 0.00017118958028101744, "loss": 0.0387, "step": 133050 }, { "epoch": 0.86, "learning_rate": 0.0001711798989266605, "loss": 0.0369, "step": 133060 }, { "epoch": 0.86, "learning_rate": 0.00017117021757230355, "loss": 0.037, "step": 133070 }, { "epoch": 0.86, "learning_rate": 0.00017116053621794663, "loss": 0.0409, "step": 133080 }, { "epoch": 0.86, "learning_rate": 0.0001711508548635897, "loss": 0.0414, "step": 133090 }, { "epoch": 0.86, "learning_rate": 0.00017114117350923279, "loss": 0.04, "step": 133100 }, { "epoch": 0.86, "learning_rate": 0.00017113149215487584, "loss": 0.0406, "step": 133110 }, { "epoch": 0.86, "learning_rate": 0.00017112181080051892, "loss": 0.1446, "step": 133120 }, { "epoch": 0.86, "learning_rate": 0.00017111212944616197, "loss": 0.0545, "step": 133130 }, { "epoch": 0.86, "learning_rate": 0.00017110244809180502, "loss": 0.078, "step": 133140 }, { "epoch": 0.86, "learning_rate": 0.0001710927667374481, "loss": 0.0487, "step": 133150 }, { "epoch": 0.86, "learning_rate": 0.00017108308538309118, "loss": 0.0443, "step": 133160 }, { "epoch": 0.86, "learning_rate": 0.00017107340402873426, "loss": 0.037, "step": 133170 }, { "epoch": 0.86, "learning_rate": 0.00017106372267437732, "loss": 0.0493, "step": 133180 }, { "epoch": 0.86, "learning_rate": 0.0001710540413200204, "loss": 0.039, "step": 133190 }, { "epoch": 0.86, "learning_rate": 0.00017104435996566345, "loss": 0.038, "step": 133200 }, { "epoch": 0.86, "learning_rate": 0.0001710346786113065, "loss": 0.0395, "step": 133210 }, { "epoch": 0.86, "learning_rate": 0.00017102499725694958, "loss": 0.0388, "step": 133220 }, { "epoch": 0.86, "learning_rate": 0.00017101531590259266, "loss": 0.0379, "step": 133230 }, { "epoch": 0.86, "learning_rate": 0.0001710056345482357, "loss": 0.0393, "step": 133240 }, { "epoch": 0.86, "learning_rate": 0.0001709959531938788, "loss": 0.0392, "step": 133250 }, { "epoch": 0.86, "learning_rate": 0.00017098627183952187, "loss": 0.045, "step": 133260 }, { "epoch": 0.86, "learning_rate": 0.0001709765904851649, "loss": 0.0366, "step": 133270 }, { "epoch": 0.86, "learning_rate": 0.00017096690913080798, "loss": 0.0471, "step": 133280 }, { "epoch": 0.86, "learning_rate": 0.00017095722777645106, "loss": 0.0408, "step": 133290 }, { "epoch": 0.86, "learning_rate": 0.00017094754642209414, "loss": 0.0447, "step": 133300 }, { "epoch": 0.86, "learning_rate": 0.0001709378650677372, "loss": 0.0412, "step": 133310 }, { "epoch": 0.86, "learning_rate": 0.00017092818371338027, "loss": 0.0457, "step": 133320 }, { "epoch": 0.86, "learning_rate": 0.00017091850235902335, "loss": 0.0424, "step": 133330 }, { "epoch": 0.86, "learning_rate": 0.00017090882100466638, "loss": 0.0463, "step": 133340 }, { "epoch": 0.86, "learning_rate": 0.00017089913965030946, "loss": 0.0443, "step": 133350 }, { "epoch": 0.86, "learning_rate": 0.00017088945829595254, "loss": 0.0365, "step": 133360 }, { "epoch": 0.86, "learning_rate": 0.00017087977694159561, "loss": 0.0391, "step": 133370 }, { "epoch": 0.86, "learning_rate": 0.00017087009558723867, "loss": 0.0374, "step": 133380 }, { "epoch": 0.86, "learning_rate": 0.00017086041423288175, "loss": 0.0414, "step": 133390 }, { "epoch": 0.86, "learning_rate": 0.00017085073287852483, "loss": 0.0419, "step": 133400 }, { "epoch": 0.86, "learning_rate": 0.00017084105152416785, "loss": 0.0355, "step": 133410 }, { "epoch": 0.86, "learning_rate": 0.00017083137016981093, "loss": 0.0361, "step": 133420 }, { "epoch": 0.86, "learning_rate": 0.000170821688815454, "loss": 0.0384, "step": 133430 }, { "epoch": 0.86, "learning_rate": 0.00017081200746109707, "loss": 0.0385, "step": 133440 }, { "epoch": 0.86, "learning_rate": 0.00017080232610674014, "loss": 0.0405, "step": 133450 }, { "epoch": 0.86, "learning_rate": 0.00017079264475238322, "loss": 0.0434, "step": 133460 }, { "epoch": 0.86, "learning_rate": 0.0001707829633980263, "loss": 0.0365, "step": 133470 }, { "epoch": 0.86, "learning_rate": 0.00017077328204366933, "loss": 0.0375, "step": 133480 }, { "epoch": 0.86, "learning_rate": 0.0001707636006893124, "loss": 0.0396, "step": 133490 }, { "epoch": 0.86, "learning_rate": 0.0001707539193349555, "loss": 0.0408, "step": 133500 }, { "epoch": 0.86, "learning_rate": 0.00017074423798059854, "loss": 0.047, "step": 133510 }, { "epoch": 0.86, "learning_rate": 0.00017073455662624162, "loss": 0.0408, "step": 133520 }, { "epoch": 0.86, "learning_rate": 0.0001707248752718847, "loss": 0.043, "step": 133530 }, { "epoch": 0.86, "learning_rate": 0.00017071519391752778, "loss": 0.0476, "step": 133540 }, { "epoch": 0.86, "learning_rate": 0.0001707055125631708, "loss": 0.0363, "step": 133550 }, { "epoch": 0.86, "learning_rate": 0.0001706958312088139, "loss": 0.0408, "step": 133560 }, { "epoch": 0.86, "learning_rate": 0.00017068614985445697, "loss": 0.0416, "step": 133570 }, { "epoch": 0.86, "learning_rate": 0.00017067646850010002, "loss": 0.0413, "step": 133580 }, { "epoch": 0.86, "learning_rate": 0.0001706667871457431, "loss": 0.0367, "step": 133590 }, { "epoch": 0.86, "learning_rate": 0.00017065710579138618, "loss": 0.0411, "step": 133600 }, { "epoch": 0.86, "learning_rate": 0.00017064742443702923, "loss": 0.0382, "step": 133610 }, { "epoch": 0.86, "learning_rate": 0.00017063774308267228, "loss": 0.0362, "step": 133620 }, { "epoch": 0.86, "learning_rate": 0.00017062806172831536, "loss": 0.0383, "step": 133630 }, { "epoch": 0.86, "learning_rate": 0.00017061838037395842, "loss": 0.0432, "step": 133640 }, { "epoch": 0.86, "learning_rate": 0.0001706086990196015, "loss": 0.0375, "step": 133650 }, { "epoch": 0.86, "learning_rate": 0.00017059901766524458, "loss": 0.0391, "step": 133660 }, { "epoch": 0.86, "learning_rate": 0.00017058933631088766, "loss": 0.0377, "step": 133670 }, { "epoch": 0.86, "learning_rate": 0.0001705796549565307, "loss": 0.0357, "step": 133680 }, { "epoch": 0.86, "learning_rate": 0.00017056997360217376, "loss": 0.0409, "step": 133690 }, { "epoch": 0.86, "learning_rate": 0.00017056029224781684, "loss": 0.0393, "step": 133700 }, { "epoch": 0.86, "learning_rate": 0.0001705506108934599, "loss": 0.0381, "step": 133710 }, { "epoch": 0.86, "learning_rate": 0.00017054092953910297, "loss": 0.0379, "step": 133720 }, { "epoch": 0.86, "learning_rate": 0.00017053124818474605, "loss": 0.0422, "step": 133730 }, { "epoch": 0.86, "learning_rate": 0.00017052156683038913, "loss": 0.0411, "step": 133740 }, { "epoch": 0.86, "learning_rate": 0.00017051188547603219, "loss": 0.0365, "step": 133750 }, { "epoch": 0.86, "learning_rate": 0.00017050220412167524, "loss": 0.0412, "step": 133760 }, { "epoch": 0.86, "learning_rate": 0.00017049252276731832, "loss": 0.0414, "step": 133770 }, { "epoch": 0.86, "learning_rate": 0.00017048284141296137, "loss": 0.0434, "step": 133780 }, { "epoch": 0.86, "learning_rate": 0.00017047316005860445, "loss": 0.0455, "step": 133790 }, { "epoch": 0.86, "learning_rate": 0.00017046347870424753, "loss": 0.034, "step": 133800 }, { "epoch": 0.86, "learning_rate": 0.0001704537973498906, "loss": 0.0409, "step": 133810 }, { "epoch": 0.86, "learning_rate": 0.00017044411599553366, "loss": 0.0428, "step": 133820 }, { "epoch": 0.86, "learning_rate": 0.00017043443464117672, "loss": 0.0428, "step": 133830 }, { "epoch": 0.86, "learning_rate": 0.00017042475328681977, "loss": 0.0463, "step": 133840 }, { "epoch": 0.86, "learning_rate": 0.00017041507193246285, "loss": 0.0384, "step": 133850 }, { "epoch": 0.86, "learning_rate": 0.00017040539057810593, "loss": 0.042, "step": 133860 }, { "epoch": 0.86, "learning_rate": 0.000170395709223749, "loss": 0.0408, "step": 133870 }, { "epoch": 0.86, "learning_rate": 0.00017038602786939206, "loss": 0.0368, "step": 133880 }, { "epoch": 0.86, "learning_rate": 0.00017037634651503514, "loss": 0.0407, "step": 133890 }, { "epoch": 0.86, "learning_rate": 0.0001703666651606782, "loss": 0.0359, "step": 133900 }, { "epoch": 0.86, "learning_rate": 0.00017035698380632125, "loss": 0.0419, "step": 133910 }, { "epoch": 0.86, "learning_rate": 0.00017034730245196433, "loss": 0.0419, "step": 133920 }, { "epoch": 0.86, "learning_rate": 0.0001703376210976074, "loss": 0.0448, "step": 133930 }, { "epoch": 0.86, "learning_rate": 0.00017032793974325049, "loss": 0.0417, "step": 133940 }, { "epoch": 0.86, "learning_rate": 0.00017031825838889354, "loss": 0.044, "step": 133950 }, { "epoch": 0.86, "learning_rate": 0.00017030857703453662, "loss": 0.0404, "step": 133960 }, { "epoch": 0.86, "learning_rate": 0.00017029889568017967, "loss": 0.0329, "step": 133970 }, { "epoch": 0.86, "learning_rate": 0.00017028921432582272, "loss": 0.0381, "step": 133980 }, { "epoch": 0.86, "learning_rate": 0.0001702795329714658, "loss": 0.0415, "step": 133990 }, { "epoch": 0.86, "learning_rate": 0.00017026985161710888, "loss": 0.0466, "step": 134000 }, { "epoch": 0.86, "eval_cer": 0.9199240763755507, "eval_loss": 0.026646053418517113, "eval_runtime": 120.1342, "eval_samples_per_second": 16.648, "eval_steps_per_second": 4.162, "step": 134000 }, { "epoch": 0.86, "learning_rate": 0.00017026017026275196, "loss": 0.0371, "step": 134010 }, { "epoch": 0.86, "learning_rate": 0.00017025048890839502, "loss": 0.039, "step": 134020 }, { "epoch": 0.87, "learning_rate": 0.0001702408075540381, "loss": 0.0381, "step": 134030 }, { "epoch": 0.87, "learning_rate": 0.00017023112619968112, "loss": 0.0404, "step": 134040 }, { "epoch": 0.87, "learning_rate": 0.0001702214448453242, "loss": 0.0522, "step": 134050 }, { "epoch": 0.87, "learning_rate": 0.00017021176349096728, "loss": 0.0418, "step": 134060 }, { "epoch": 0.87, "learning_rate": 0.00017020208213661036, "loss": 0.0389, "step": 134070 }, { "epoch": 0.87, "learning_rate": 0.0001701924007822534, "loss": 0.0409, "step": 134080 }, { "epoch": 0.87, "learning_rate": 0.0001701827194278965, "loss": 0.0446, "step": 134090 }, { "epoch": 0.87, "learning_rate": 0.00017017303807353957, "loss": 0.045, "step": 134100 }, { "epoch": 0.87, "learning_rate": 0.0001701633567191826, "loss": 0.0425, "step": 134110 }, { "epoch": 0.87, "learning_rate": 0.00017015367536482568, "loss": 0.0339, "step": 134120 }, { "epoch": 0.87, "learning_rate": 0.00017014399401046876, "loss": 0.0416, "step": 134130 }, { "epoch": 0.87, "learning_rate": 0.00017013431265611184, "loss": 0.0425, "step": 134140 }, { "epoch": 0.87, "learning_rate": 0.0001701246313017549, "loss": 0.0425, "step": 134150 }, { "epoch": 0.87, "learning_rate": 0.00017011494994739797, "loss": 0.0432, "step": 134160 }, { "epoch": 0.87, "learning_rate": 0.00017010526859304105, "loss": 0.0396, "step": 134170 }, { "epoch": 0.87, "learning_rate": 0.00017009558723868408, "loss": 0.039, "step": 134180 }, { "epoch": 0.87, "learning_rate": 0.00017008590588432716, "loss": 0.0431, "step": 134190 }, { "epoch": 0.87, "learning_rate": 0.00017007622452997023, "loss": 0.0357, "step": 134200 }, { "epoch": 0.87, "learning_rate": 0.00017006654317561331, "loss": 0.0366, "step": 134210 }, { "epoch": 0.87, "learning_rate": 0.00017005686182125637, "loss": 0.038, "step": 134220 }, { "epoch": 0.87, "learning_rate": 0.00017004718046689945, "loss": 0.0457, "step": 134230 }, { "epoch": 0.87, "learning_rate": 0.00017003749911254253, "loss": 0.0403, "step": 134240 }, { "epoch": 0.87, "learning_rate": 0.00017002781775818555, "loss": 0.0379, "step": 134250 }, { "epoch": 0.87, "learning_rate": 0.00017001813640382863, "loss": 0.0442, "step": 134260 }, { "epoch": 0.87, "learning_rate": 0.0001700084550494717, "loss": 0.0371, "step": 134270 }, { "epoch": 0.87, "learning_rate": 0.00016999877369511476, "loss": 0.0424, "step": 134280 }, { "epoch": 0.87, "learning_rate": 0.00016998909234075784, "loss": 0.0412, "step": 134290 }, { "epoch": 0.87, "learning_rate": 0.00016997941098640092, "loss": 0.0436, "step": 134300 }, { "epoch": 0.87, "learning_rate": 0.00016996972963204395, "loss": 0.0408, "step": 134310 }, { "epoch": 0.87, "learning_rate": 0.00016996004827768703, "loss": 0.0509, "step": 134320 }, { "epoch": 0.87, "learning_rate": 0.0001699503669233301, "loss": 0.0418, "step": 134330 }, { "epoch": 0.87, "learning_rate": 0.0001699406855689732, "loss": 0.038, "step": 134340 }, { "epoch": 0.87, "learning_rate": 0.00016993100421461624, "loss": 0.0437, "step": 134350 }, { "epoch": 0.87, "learning_rate": 0.00016992132286025932, "loss": 0.0393, "step": 134360 }, { "epoch": 0.87, "learning_rate": 0.0001699116415059024, "loss": 0.0333, "step": 134370 }, { "epoch": 0.87, "learning_rate": 0.00016990196015154543, "loss": 0.0374, "step": 134380 }, { "epoch": 0.87, "learning_rate": 0.0001698922787971885, "loss": 0.046, "step": 134390 }, { "epoch": 0.87, "learning_rate": 0.0001698825974428316, "loss": 0.0392, "step": 134400 }, { "epoch": 0.87, "learning_rate": 0.00016987291608847467, "loss": 0.0361, "step": 134410 }, { "epoch": 0.87, "learning_rate": 0.00016986323473411772, "loss": 0.0423, "step": 134420 }, { "epoch": 0.87, "learning_rate": 0.0001698535533797608, "loss": 0.0464, "step": 134430 }, { "epoch": 0.87, "learning_rate": 0.00016984387202540388, "loss": 0.0369, "step": 134440 }, { "epoch": 0.87, "learning_rate": 0.0001698341906710469, "loss": 0.0428, "step": 134450 }, { "epoch": 0.87, "learning_rate": 0.00016982450931668998, "loss": 0.0373, "step": 134460 }, { "epoch": 0.87, "learning_rate": 0.00016981482796233306, "loss": 0.038, "step": 134470 }, { "epoch": 0.87, "learning_rate": 0.00016980514660797612, "loss": 0.0328, "step": 134480 }, { "epoch": 0.87, "learning_rate": 0.0001697954652536192, "loss": 0.047, "step": 134490 }, { "epoch": 0.87, "learning_rate": 0.00016978578389926228, "loss": 0.0428, "step": 134500 }, { "epoch": 0.87, "learning_rate": 0.00016977610254490536, "loss": 0.0401, "step": 134510 }, { "epoch": 0.87, "learning_rate": 0.00016976642119054838, "loss": 0.0473, "step": 134520 }, { "epoch": 0.87, "learning_rate": 0.00016975673983619146, "loss": 0.044, "step": 134530 }, { "epoch": 0.87, "learning_rate": 0.00016974705848183454, "loss": 0.0341, "step": 134540 }, { "epoch": 0.87, "learning_rate": 0.0001697373771274776, "loss": 0.0358, "step": 134550 }, { "epoch": 0.87, "learning_rate": 0.00016972769577312067, "loss": 0.0365, "step": 134560 }, { "epoch": 0.87, "learning_rate": 0.00016971801441876375, "loss": 0.0399, "step": 134570 }, { "epoch": 0.87, "learning_rate": 0.00016970833306440683, "loss": 0.0428, "step": 134580 }, { "epoch": 0.87, "learning_rate": 0.00016969865171004986, "loss": 0.0414, "step": 134590 }, { "epoch": 0.87, "learning_rate": 0.00016968897035569294, "loss": 0.0375, "step": 134600 }, { "epoch": 0.87, "learning_rate": 0.00016967928900133602, "loss": 0.0377, "step": 134610 }, { "epoch": 0.87, "learning_rate": 0.00016966960764697907, "loss": 0.0373, "step": 134620 }, { "epoch": 0.87, "learning_rate": 0.00016965992629262215, "loss": 0.0388, "step": 134630 }, { "epoch": 0.87, "learning_rate": 0.00016965024493826523, "loss": 0.0411, "step": 134640 }, { "epoch": 0.87, "learning_rate": 0.00016964056358390828, "loss": 0.0461, "step": 134650 }, { "epoch": 0.87, "learning_rate": 0.00016963088222955134, "loss": 0.0369, "step": 134660 }, { "epoch": 0.87, "learning_rate": 0.00016962120087519442, "loss": 0.0424, "step": 134670 }, { "epoch": 0.87, "learning_rate": 0.00016961151952083747, "loss": 0.0382, "step": 134680 }, { "epoch": 0.87, "learning_rate": 0.00016960183816648055, "loss": 0.0345, "step": 134690 }, { "epoch": 0.87, "learning_rate": 0.00016959215681212363, "loss": 0.0433, "step": 134700 }, { "epoch": 0.87, "learning_rate": 0.0001695824754577667, "loss": 0.0421, "step": 134710 }, { "epoch": 0.87, "learning_rate": 0.00016957279410340976, "loss": 0.0404, "step": 134720 }, { "epoch": 0.87, "learning_rate": 0.0001695631127490528, "loss": 0.0358, "step": 134730 }, { "epoch": 0.87, "learning_rate": 0.0001695534313946959, "loss": 0.0367, "step": 134740 }, { "epoch": 0.87, "learning_rate": 0.00016954375004033895, "loss": 0.0408, "step": 134750 }, { "epoch": 0.87, "learning_rate": 0.00016953406868598203, "loss": 0.0453, "step": 134760 }, { "epoch": 0.87, "learning_rate": 0.0001695243873316251, "loss": 0.0402, "step": 134770 }, { "epoch": 0.87, "learning_rate": 0.00016951470597726819, "loss": 0.0435, "step": 134780 }, { "epoch": 0.87, "learning_rate": 0.00016950502462291124, "loss": 0.0356, "step": 134790 }, { "epoch": 0.87, "learning_rate": 0.0001694953432685543, "loss": 0.0415, "step": 134800 }, { "epoch": 0.87, "learning_rate": 0.00016948566191419737, "loss": 0.0404, "step": 134810 }, { "epoch": 0.87, "learning_rate": 0.00016947598055984042, "loss": 0.0393, "step": 134820 }, { "epoch": 0.87, "learning_rate": 0.0001694662992054835, "loss": 0.0359, "step": 134830 }, { "epoch": 0.87, "learning_rate": 0.00016945661785112658, "loss": 0.0406, "step": 134840 }, { "epoch": 0.87, "learning_rate": 0.00016944693649676964, "loss": 0.0467, "step": 134850 }, { "epoch": 0.87, "learning_rate": 0.00016943725514241272, "loss": 0.0435, "step": 134860 }, { "epoch": 0.87, "learning_rate": 0.00016942757378805577, "loss": 0.0401, "step": 134870 }, { "epoch": 0.87, "learning_rate": 0.00016941789243369882, "loss": 0.0374, "step": 134880 }, { "epoch": 0.87, "learning_rate": 0.0001694082110793419, "loss": 0.0395, "step": 134890 }, { "epoch": 0.87, "learning_rate": 0.00016939852972498498, "loss": 0.0451, "step": 134900 }, { "epoch": 0.87, "learning_rate": 0.00016938884837062806, "loss": 0.0427, "step": 134910 }, { "epoch": 0.87, "learning_rate": 0.0001693791670162711, "loss": 0.0402, "step": 134920 }, { "epoch": 0.87, "learning_rate": 0.0001693694856619142, "loss": 0.0424, "step": 134930 }, { "epoch": 0.87, "learning_rate": 0.00016935980430755724, "loss": 0.0395, "step": 134940 }, { "epoch": 0.87, "learning_rate": 0.0001693501229532003, "loss": 0.0439, "step": 134950 }, { "epoch": 0.87, "learning_rate": 0.00016934044159884338, "loss": 0.0378, "step": 134960 }, { "epoch": 0.87, "learning_rate": 0.00016933076024448646, "loss": 0.0408, "step": 134970 }, { "epoch": 0.87, "learning_rate": 0.00016932107889012954, "loss": 0.0354, "step": 134980 }, { "epoch": 0.87, "learning_rate": 0.0001693113975357726, "loss": 0.0418, "step": 134990 }, { "epoch": 0.87, "learning_rate": 0.00016930171618141567, "loss": 0.04, "step": 135000 }, { "epoch": 0.87, "eval_cer": 0.919934922607615, "eval_loss": 0.02674305997788906, "eval_runtime": 119.9587, "eval_samples_per_second": 16.672, "eval_steps_per_second": 4.168, "step": 135000 }, { "epoch": 0.87, "learning_rate": 0.00016929203482705872, "loss": 0.0434, "step": 135010 }, { "epoch": 0.87, "learning_rate": 0.00016928235347270177, "loss": 0.0429, "step": 135020 }, { "epoch": 0.87, "learning_rate": 0.00016927267211834485, "loss": 0.0424, "step": 135030 }, { "epoch": 0.87, "learning_rate": 0.00016926299076398793, "loss": 0.0404, "step": 135040 }, { "epoch": 0.87, "learning_rate": 0.000169253309409631, "loss": 0.0408, "step": 135050 }, { "epoch": 0.87, "learning_rate": 0.00016924362805527407, "loss": 0.0387, "step": 135060 }, { "epoch": 0.87, "learning_rate": 0.00016923394670091715, "loss": 0.0466, "step": 135070 }, { "epoch": 0.87, "learning_rate": 0.00016922426534656017, "loss": 0.037, "step": 135080 }, { "epoch": 0.87, "learning_rate": 0.00016921458399220325, "loss": 0.0455, "step": 135090 }, { "epoch": 0.87, "learning_rate": 0.00016920490263784633, "loss": 0.0435, "step": 135100 }, { "epoch": 0.87, "learning_rate": 0.0001691952212834894, "loss": 0.0403, "step": 135110 }, { "epoch": 0.87, "learning_rate": 0.00016918553992913246, "loss": 0.0375, "step": 135120 }, { "epoch": 0.87, "learning_rate": 0.00016917585857477554, "loss": 0.0445, "step": 135130 }, { "epoch": 0.87, "learning_rate": 0.00016916617722041862, "loss": 0.0394, "step": 135140 }, { "epoch": 0.87, "learning_rate": 0.00016915649586606165, "loss": 0.0423, "step": 135150 }, { "epoch": 0.87, "learning_rate": 0.00016914681451170473, "loss": 0.0373, "step": 135160 }, { "epoch": 0.87, "learning_rate": 0.0001691371331573478, "loss": 0.0416, "step": 135170 }, { "epoch": 0.87, "learning_rate": 0.0001691274518029909, "loss": 0.0405, "step": 135180 }, { "epoch": 0.87, "learning_rate": 0.00016911777044863394, "loss": 0.0412, "step": 135190 }, { "epoch": 0.87, "learning_rate": 0.00016910808909427702, "loss": 0.0438, "step": 135200 }, { "epoch": 0.87, "learning_rate": 0.0001690984077399201, "loss": 0.0394, "step": 135210 }, { "epoch": 0.87, "learning_rate": 0.00016908872638556313, "loss": 0.0426, "step": 135220 }, { "epoch": 0.87, "learning_rate": 0.0001690790450312062, "loss": 0.0414, "step": 135230 }, { "epoch": 0.87, "learning_rate": 0.00016906936367684929, "loss": 0.0448, "step": 135240 }, { "epoch": 0.87, "learning_rate": 0.00016905968232249234, "loss": 0.0435, "step": 135250 }, { "epoch": 0.87, "learning_rate": 0.00016905000096813542, "loss": 0.0448, "step": 135260 }, { "epoch": 0.87, "learning_rate": 0.0001690403196137785, "loss": 0.0443, "step": 135270 }, { "epoch": 0.87, "learning_rate": 0.00016903063825942158, "loss": 0.0423, "step": 135280 }, { "epoch": 0.87, "learning_rate": 0.0001690209569050646, "loss": 0.0403, "step": 135290 }, { "epoch": 0.87, "learning_rate": 0.00016901127555070768, "loss": 0.0384, "step": 135300 }, { "epoch": 0.87, "learning_rate": 0.00016900159419635076, "loss": 0.0372, "step": 135310 }, { "epoch": 0.87, "learning_rate": 0.00016899191284199382, "loss": 0.0363, "step": 135320 }, { "epoch": 0.87, "learning_rate": 0.0001689822314876369, "loss": 0.0454, "step": 135330 }, { "epoch": 0.87, "learning_rate": 0.00016897255013327998, "loss": 0.0395, "step": 135340 }, { "epoch": 0.87, "learning_rate": 0.00016896286877892306, "loss": 0.0387, "step": 135350 }, { "epoch": 0.87, "learning_rate": 0.00016895318742456608, "loss": 0.0383, "step": 135360 }, { "epoch": 0.87, "learning_rate": 0.00016894350607020916, "loss": 0.0397, "step": 135370 }, { "epoch": 0.87, "learning_rate": 0.00016893382471585224, "loss": 0.0421, "step": 135380 }, { "epoch": 0.87, "learning_rate": 0.0001689241433614953, "loss": 0.0384, "step": 135390 }, { "epoch": 0.87, "learning_rate": 0.00016891446200713837, "loss": 0.0462, "step": 135400 }, { "epoch": 0.87, "learning_rate": 0.00016890478065278145, "loss": 0.0388, "step": 135410 }, { "epoch": 0.87, "learning_rate": 0.0001688950992984245, "loss": 0.0444, "step": 135420 }, { "epoch": 0.87, "learning_rate": 0.00016888541794406756, "loss": 0.0394, "step": 135430 }, { "epoch": 0.87, "learning_rate": 0.00016887573658971064, "loss": 0.0386, "step": 135440 }, { "epoch": 0.87, "learning_rate": 0.0001688660552353537, "loss": 0.0482, "step": 135450 }, { "epoch": 0.87, "learning_rate": 0.00016885637388099677, "loss": 0.0459, "step": 135460 }, { "epoch": 0.87, "learning_rate": 0.00016884669252663985, "loss": 0.0397, "step": 135470 }, { "epoch": 0.87, "learning_rate": 0.00016883701117228293, "loss": 0.0385, "step": 135480 }, { "epoch": 0.87, "learning_rate": 0.00016882732981792598, "loss": 0.0449, "step": 135490 }, { "epoch": 0.87, "learning_rate": 0.00016881764846356904, "loss": 0.0396, "step": 135500 }, { "epoch": 0.87, "learning_rate": 0.00016880796710921212, "loss": 0.046, "step": 135510 }, { "epoch": 0.87, "learning_rate": 0.00016879828575485517, "loss": 0.0439, "step": 135520 }, { "epoch": 0.87, "learning_rate": 0.00016878860440049825, "loss": 0.0361, "step": 135530 }, { "epoch": 0.87, "learning_rate": 0.00016877892304614133, "loss": 0.0482, "step": 135540 }, { "epoch": 0.87, "learning_rate": 0.0001687692416917844, "loss": 0.0468, "step": 135550 }, { "epoch": 0.87, "learning_rate": 0.00016875956033742746, "loss": 0.0435, "step": 135560 }, { "epoch": 0.87, "learning_rate": 0.0001687498789830705, "loss": 0.0401, "step": 135570 }, { "epoch": 0.88, "learning_rate": 0.0001687401976287136, "loss": 0.0443, "step": 135580 }, { "epoch": 0.88, "learning_rate": 0.00016873051627435665, "loss": 0.0393, "step": 135590 }, { "epoch": 0.88, "learning_rate": 0.00016872083491999973, "loss": 0.0389, "step": 135600 }, { "epoch": 0.88, "learning_rate": 0.0001687111535656428, "loss": 0.0399, "step": 135610 }, { "epoch": 0.88, "learning_rate": 0.00016870147221128586, "loss": 0.0436, "step": 135620 }, { "epoch": 0.88, "learning_rate": 0.00016869179085692894, "loss": 0.04, "step": 135630 }, { "epoch": 0.88, "learning_rate": 0.000168682109502572, "loss": 0.0352, "step": 135640 }, { "epoch": 0.88, "learning_rate": 0.00016867242814821504, "loss": 0.0458, "step": 135650 }, { "epoch": 0.88, "learning_rate": 0.00016866274679385812, "loss": 0.0359, "step": 135660 }, { "epoch": 0.88, "learning_rate": 0.0001686530654395012, "loss": 0.039, "step": 135670 }, { "epoch": 0.88, "learning_rate": 0.00016864338408514428, "loss": 0.0426, "step": 135680 }, { "epoch": 0.88, "learning_rate": 0.00016863370273078733, "loss": 0.0511, "step": 135690 }, { "epoch": 0.88, "learning_rate": 0.00016862402137643041, "loss": 0.0388, "step": 135700 }, { "epoch": 0.88, "learning_rate": 0.00016861434002207347, "loss": 0.0405, "step": 135710 }, { "epoch": 0.88, "learning_rate": 0.00016860465866771652, "loss": 0.0406, "step": 135720 }, { "epoch": 0.88, "learning_rate": 0.0001685949773133596, "loss": 0.038, "step": 135730 }, { "epoch": 0.88, "learning_rate": 0.00016858529595900268, "loss": 0.0448, "step": 135740 }, { "epoch": 0.88, "learning_rate": 0.00016857561460464576, "loss": 0.0395, "step": 135750 }, { "epoch": 0.88, "learning_rate": 0.0001685659332502888, "loss": 0.0424, "step": 135760 }, { "epoch": 0.88, "learning_rate": 0.0001685562518959319, "loss": 0.0407, "step": 135770 }, { "epoch": 0.88, "learning_rate": 0.00016854657054157494, "loss": 0.0392, "step": 135780 }, { "epoch": 0.88, "learning_rate": 0.000168536889187218, "loss": 0.0398, "step": 135790 }, { "epoch": 0.88, "learning_rate": 0.00016852720783286108, "loss": 0.0382, "step": 135800 }, { "epoch": 0.88, "learning_rate": 0.00016851752647850416, "loss": 0.039, "step": 135810 }, { "epoch": 0.88, "learning_rate": 0.0001685078451241472, "loss": 0.0412, "step": 135820 }, { "epoch": 0.88, "learning_rate": 0.0001684981637697903, "loss": 0.0371, "step": 135830 }, { "epoch": 0.88, "learning_rate": 0.00016848848241543337, "loss": 0.0331, "step": 135840 }, { "epoch": 0.88, "learning_rate": 0.0001684788010610764, "loss": 0.0376, "step": 135850 }, { "epoch": 0.88, "learning_rate": 0.00016846911970671947, "loss": 0.0447, "step": 135860 }, { "epoch": 0.88, "learning_rate": 0.00016845943835236255, "loss": 0.0497, "step": 135870 }, { "epoch": 0.88, "learning_rate": 0.00016844975699800563, "loss": 0.0442, "step": 135880 }, { "epoch": 0.88, "learning_rate": 0.0001684400756436487, "loss": 0.0432, "step": 135890 }, { "epoch": 0.88, "learning_rate": 0.00016843039428929177, "loss": 0.04, "step": 135900 }, { "epoch": 0.88, "learning_rate": 0.00016842071293493485, "loss": 0.0409, "step": 135910 }, { "epoch": 0.88, "learning_rate": 0.00016841103158057787, "loss": 0.0418, "step": 135920 }, { "epoch": 0.88, "learning_rate": 0.00016840135022622095, "loss": 0.0456, "step": 135930 }, { "epoch": 0.88, "learning_rate": 0.00016839166887186403, "loss": 0.0404, "step": 135940 }, { "epoch": 0.88, "learning_rate": 0.0001683819875175071, "loss": 0.0373, "step": 135950 }, { "epoch": 0.88, "learning_rate": 0.00016837230616315016, "loss": 0.0403, "step": 135960 }, { "epoch": 0.88, "learning_rate": 0.00016836262480879324, "loss": 0.0405, "step": 135970 }, { "epoch": 0.88, "learning_rate": 0.00016835294345443632, "loss": 0.0383, "step": 135980 }, { "epoch": 0.88, "learning_rate": 0.00016834326210007935, "loss": 0.044, "step": 135990 }, { "epoch": 0.88, "learning_rate": 0.00016833358074572243, "loss": 0.038, "step": 136000 }, { "epoch": 0.88, "eval_cer": 0.9199123262908147, "eval_loss": 0.027130674570798874, "eval_runtime": 119.9831, "eval_samples_per_second": 16.669, "eval_steps_per_second": 4.167, "step": 136000 }, { "epoch": 0.88, "learning_rate": 0.0001683238993913655, "loss": 0.0399, "step": 136010 }, { "epoch": 0.88, "learning_rate": 0.00016831421803700856, "loss": 0.0379, "step": 136020 }, { "epoch": 0.88, "learning_rate": 0.00016830453668265164, "loss": 0.0385, "step": 136030 }, { "epoch": 0.88, "learning_rate": 0.00016829485532829472, "loss": 0.0377, "step": 136040 }, { "epoch": 0.88, "learning_rate": 0.0001682851739739378, "loss": 0.0445, "step": 136050 }, { "epoch": 0.88, "learning_rate": 0.00016827549261958083, "loss": 0.0462, "step": 136060 }, { "epoch": 0.88, "learning_rate": 0.0001682658112652239, "loss": 0.0374, "step": 136070 }, { "epoch": 0.88, "learning_rate": 0.00016825612991086699, "loss": 0.0408, "step": 136080 }, { "epoch": 0.88, "learning_rate": 0.00016824644855651004, "loss": 0.0418, "step": 136090 }, { "epoch": 0.88, "learning_rate": 0.00016823676720215312, "loss": 0.0412, "step": 136100 }, { "epoch": 0.88, "learning_rate": 0.0001682270858477962, "loss": 0.043, "step": 136110 }, { "epoch": 0.88, "learning_rate": 0.00016821740449343928, "loss": 0.0484, "step": 136120 }, { "epoch": 0.88, "learning_rate": 0.0001682077231390823, "loss": 0.0367, "step": 136130 }, { "epoch": 0.88, "learning_rate": 0.00016819804178472538, "loss": 0.043, "step": 136140 }, { "epoch": 0.88, "learning_rate": 0.00016818836043036846, "loss": 0.0397, "step": 136150 }, { "epoch": 0.88, "learning_rate": 0.00016817867907601152, "loss": 0.0389, "step": 136160 }, { "epoch": 0.88, "learning_rate": 0.0001681689977216546, "loss": 0.0409, "step": 136170 }, { "epoch": 0.88, "learning_rate": 0.00016815931636729768, "loss": 0.0402, "step": 136180 }, { "epoch": 0.88, "learning_rate": 0.00016814963501294076, "loss": 0.044, "step": 136190 }, { "epoch": 0.88, "learning_rate": 0.00016813995365858378, "loss": 0.0404, "step": 136200 }, { "epoch": 0.88, "learning_rate": 0.00016813027230422686, "loss": 0.0429, "step": 136210 }, { "epoch": 0.88, "learning_rate": 0.0001681205909498699, "loss": 0.0429, "step": 136220 }, { "epoch": 0.88, "learning_rate": 0.000168110909595513, "loss": 0.0448, "step": 136230 }, { "epoch": 0.88, "learning_rate": 0.00016810122824115607, "loss": 0.0433, "step": 136240 }, { "epoch": 0.88, "learning_rate": 0.00016809154688679915, "loss": 0.0375, "step": 136250 }, { "epoch": 0.88, "learning_rate": 0.0001680818655324422, "loss": 0.0381, "step": 136260 }, { "epoch": 0.88, "learning_rate": 0.00016807218417808526, "loss": 0.0346, "step": 136270 }, { "epoch": 0.88, "learning_rate": 0.00016806250282372834, "loss": 0.0438, "step": 136280 }, { "epoch": 0.88, "learning_rate": 0.0001680528214693714, "loss": 0.039, "step": 136290 }, { "epoch": 0.88, "learning_rate": 0.00016804314011501447, "loss": 0.0401, "step": 136300 }, { "epoch": 0.88, "learning_rate": 0.00016803345876065755, "loss": 0.0415, "step": 136310 }, { "epoch": 0.88, "learning_rate": 0.00016802377740630063, "loss": 0.0429, "step": 136320 }, { "epoch": 0.88, "learning_rate": 0.00016801409605194368, "loss": 0.0389, "step": 136330 }, { "epoch": 0.88, "learning_rate": 0.00016800441469758674, "loss": 0.0394, "step": 136340 }, { "epoch": 0.88, "learning_rate": 0.00016799473334322982, "loss": 0.0397, "step": 136350 }, { "epoch": 0.88, "learning_rate": 0.00016798505198887287, "loss": 0.0424, "step": 136360 }, { "epoch": 0.88, "learning_rate": 0.00016797537063451595, "loss": 0.0353, "step": 136370 }, { "epoch": 0.88, "learning_rate": 0.00016796568928015903, "loss": 0.0415, "step": 136380 }, { "epoch": 0.88, "learning_rate": 0.0001679560079258021, "loss": 0.0382, "step": 136390 }, { "epoch": 0.88, "learning_rate": 0.00016794632657144516, "loss": 0.0379, "step": 136400 }, { "epoch": 0.88, "learning_rate": 0.0001679366452170882, "loss": 0.0424, "step": 136410 }, { "epoch": 0.88, "learning_rate": 0.00016792696386273127, "loss": 0.0384, "step": 136420 }, { "epoch": 0.88, "learning_rate": 0.00016791728250837434, "loss": 0.0411, "step": 136430 }, { "epoch": 0.88, "learning_rate": 0.00016790760115401742, "loss": 0.0404, "step": 136440 }, { "epoch": 0.88, "learning_rate": 0.0001678979197996605, "loss": 0.0388, "step": 136450 }, { "epoch": 0.88, "learning_rate": 0.00016788823844530356, "loss": 0.0438, "step": 136460 }, { "epoch": 0.88, "learning_rate": 0.00016787855709094664, "loss": 0.0406, "step": 136470 }, { "epoch": 0.88, "learning_rate": 0.0001678688757365897, "loss": 0.0392, "step": 136480 }, { "epoch": 0.88, "learning_rate": 0.00016785919438223274, "loss": 0.0435, "step": 136490 }, { "epoch": 0.88, "learning_rate": 0.00016784951302787582, "loss": 0.0392, "step": 136500 }, { "epoch": 0.88, "learning_rate": 0.0001678398316735189, "loss": 0.0373, "step": 136510 }, { "epoch": 0.88, "learning_rate": 0.00016783015031916198, "loss": 0.0363, "step": 136520 }, { "epoch": 0.88, "learning_rate": 0.00016782046896480503, "loss": 0.037, "step": 136530 }, { "epoch": 0.88, "learning_rate": 0.00016781078761044811, "loss": 0.0377, "step": 136540 }, { "epoch": 0.88, "learning_rate": 0.00016780110625609117, "loss": 0.0524, "step": 136550 }, { "epoch": 0.88, "learning_rate": 0.00016779142490173422, "loss": 0.0329, "step": 136560 }, { "epoch": 0.88, "learning_rate": 0.0001677817435473773, "loss": 0.0415, "step": 136570 }, { "epoch": 0.88, "learning_rate": 0.00016777206219302038, "loss": 0.0436, "step": 136580 }, { "epoch": 0.88, "learning_rate": 0.00016776238083866346, "loss": 0.0403, "step": 136590 }, { "epoch": 0.88, "learning_rate": 0.0001677526994843065, "loss": 0.0435, "step": 136600 }, { "epoch": 0.88, "learning_rate": 0.0001677430181299496, "loss": 0.0451, "step": 136610 }, { "epoch": 0.88, "learning_rate": 0.00016773333677559262, "loss": 0.0425, "step": 136620 }, { "epoch": 0.88, "learning_rate": 0.0001677236554212357, "loss": 0.0485, "step": 136630 }, { "epoch": 0.88, "learning_rate": 0.00016771397406687878, "loss": 0.0437, "step": 136640 }, { "epoch": 0.88, "learning_rate": 0.00016770429271252186, "loss": 0.0404, "step": 136650 }, { "epoch": 0.88, "learning_rate": 0.0001676946113581649, "loss": 0.0405, "step": 136660 }, { "epoch": 0.88, "learning_rate": 0.000167684930003808, "loss": 0.0383, "step": 136670 }, { "epoch": 0.88, "learning_rate": 0.00016767524864945107, "loss": 0.0454, "step": 136680 }, { "epoch": 0.88, "learning_rate": 0.0001676655672950941, "loss": 0.0427, "step": 136690 }, { "epoch": 0.88, "learning_rate": 0.00016765588594073717, "loss": 0.036, "step": 136700 }, { "epoch": 0.88, "learning_rate": 0.00016764620458638025, "loss": 0.04, "step": 136710 }, { "epoch": 0.88, "learning_rate": 0.00016763652323202333, "loss": 0.0407, "step": 136720 }, { "epoch": 0.88, "learning_rate": 0.00016762684187766639, "loss": 0.0351, "step": 136730 }, { "epoch": 0.88, "learning_rate": 0.00016761716052330947, "loss": 0.0424, "step": 136740 }, { "epoch": 0.88, "learning_rate": 0.00016760747916895255, "loss": 0.0412, "step": 136750 }, { "epoch": 0.88, "learning_rate": 0.00016759779781459557, "loss": 0.0379, "step": 136760 }, { "epoch": 0.88, "learning_rate": 0.00016758811646023865, "loss": 0.0352, "step": 136770 }, { "epoch": 0.88, "learning_rate": 0.00016757843510588173, "loss": 0.0389, "step": 136780 }, { "epoch": 0.88, "learning_rate": 0.0001675687537515248, "loss": 0.0429, "step": 136790 }, { "epoch": 0.88, "learning_rate": 0.00016755907239716786, "loss": 0.0388, "step": 136800 }, { "epoch": 0.88, "learning_rate": 0.00016754939104281094, "loss": 0.0428, "step": 136810 }, { "epoch": 0.88, "learning_rate": 0.00016753970968845402, "loss": 0.0347, "step": 136820 }, { "epoch": 0.88, "learning_rate": 0.00016753002833409705, "loss": 0.0418, "step": 136830 }, { "epoch": 0.88, "learning_rate": 0.00016752034697974013, "loss": 0.0407, "step": 136840 }, { "epoch": 0.88, "learning_rate": 0.0001675106656253832, "loss": 0.0488, "step": 136850 }, { "epoch": 0.88, "learning_rate": 0.00016750098427102626, "loss": 0.0409, "step": 136860 }, { "epoch": 0.88, "learning_rate": 0.00016749130291666934, "loss": 0.0492, "step": 136870 }, { "epoch": 0.88, "learning_rate": 0.00016748162156231242, "loss": 0.0358, "step": 136880 }, { "epoch": 0.88, "learning_rate": 0.0001674719402079555, "loss": 0.0415, "step": 136890 }, { "epoch": 0.88, "learning_rate": 0.00016746225885359853, "loss": 0.045, "step": 136900 }, { "epoch": 0.88, "learning_rate": 0.0001674525774992416, "loss": 0.0388, "step": 136910 }, { "epoch": 0.88, "learning_rate": 0.00016744289614488469, "loss": 0.0451, "step": 136920 }, { "epoch": 0.88, "learning_rate": 0.00016743321479052774, "loss": 0.0385, "step": 136930 }, { "epoch": 0.88, "learning_rate": 0.00016742353343617082, "loss": 0.0412, "step": 136940 }, { "epoch": 0.88, "learning_rate": 0.0001674138520818139, "loss": 0.0449, "step": 136950 }, { "epoch": 0.88, "learning_rate": 0.00016740417072745698, "loss": 0.036, "step": 136960 }, { "epoch": 0.88, "learning_rate": 0.0001673944893731, "loss": 0.042, "step": 136970 }, { "epoch": 0.88, "learning_rate": 0.00016738480801874308, "loss": 0.0446, "step": 136980 }, { "epoch": 0.88, "learning_rate": 0.00016737512666438616, "loss": 0.0458, "step": 136990 }, { "epoch": 0.88, "learning_rate": 0.00016736544531002922, "loss": 0.0382, "step": 137000 }, { "epoch": 0.88, "eval_cer": 0.9199159417015027, "eval_loss": 0.0271102674305439, "eval_runtime": 119.9795, "eval_samples_per_second": 16.67, "eval_steps_per_second": 4.167, "step": 137000 }, { "epoch": 0.88, "learning_rate": 0.0001673557639556723, "loss": 0.0446, "step": 137010 }, { "epoch": 0.88, "learning_rate": 0.00016734608260131538, "loss": 0.0432, "step": 137020 }, { "epoch": 0.88, "learning_rate": 0.00016733640124695843, "loss": 0.0405, "step": 137030 }, { "epoch": 0.88, "learning_rate": 0.00016732671989260148, "loss": 0.0381, "step": 137040 }, { "epoch": 0.88, "learning_rate": 0.00016731703853824456, "loss": 0.0382, "step": 137050 }, { "epoch": 0.88, "learning_rate": 0.0001673073571838876, "loss": 0.0377, "step": 137060 }, { "epoch": 0.88, "learning_rate": 0.0001672976758295307, "loss": 0.0429, "step": 137070 }, { "epoch": 0.88, "learning_rate": 0.00016728799447517377, "loss": 0.0386, "step": 137080 }, { "epoch": 0.88, "learning_rate": 0.00016727831312081685, "loss": 0.0366, "step": 137090 }, { "epoch": 0.88, "learning_rate": 0.0001672686317664599, "loss": 0.0383, "step": 137100 }, { "epoch": 0.88, "learning_rate": 0.00016725895041210296, "loss": 0.0412, "step": 137110 }, { "epoch": 0.89, "learning_rate": 0.00016724926905774604, "loss": 0.0381, "step": 137120 }, { "epoch": 0.89, "learning_rate": 0.0001672395877033891, "loss": 0.0364, "step": 137130 }, { "epoch": 0.89, "learning_rate": 0.00016722990634903217, "loss": 0.0416, "step": 137140 }, { "epoch": 0.89, "learning_rate": 0.00016722022499467525, "loss": 0.0404, "step": 137150 }, { "epoch": 0.89, "learning_rate": 0.00016721054364031833, "loss": 0.0445, "step": 137160 }, { "epoch": 0.89, "learning_rate": 0.00016720086228596138, "loss": 0.0388, "step": 137170 }, { "epoch": 0.89, "learning_rate": 0.00016719118093160443, "loss": 0.0425, "step": 137180 }, { "epoch": 0.89, "learning_rate": 0.00016718149957724751, "loss": 0.0415, "step": 137190 }, { "epoch": 0.89, "learning_rate": 0.00016717181822289057, "loss": 0.0363, "step": 137200 }, { "epoch": 0.89, "learning_rate": 0.00016716213686853365, "loss": 0.0437, "step": 137210 }, { "epoch": 0.89, "learning_rate": 0.00016715245551417673, "loss": 0.0371, "step": 137220 }, { "epoch": 0.89, "learning_rate": 0.00016714277415981978, "loss": 0.039, "step": 137230 }, { "epoch": 0.89, "learning_rate": 0.00016713309280546286, "loss": 0.0382, "step": 137240 }, { "epoch": 0.89, "learning_rate": 0.0001671234114511059, "loss": 0.0392, "step": 137250 }, { "epoch": 0.89, "learning_rate": 0.00016711373009674896, "loss": 0.0437, "step": 137260 }, { "epoch": 0.89, "learning_rate": 0.00016710404874239204, "loss": 0.0413, "step": 137270 }, { "epoch": 0.89, "learning_rate": 0.00016709436738803512, "loss": 0.039, "step": 137280 }, { "epoch": 0.89, "learning_rate": 0.0001670846860336782, "loss": 0.0386, "step": 137290 }, { "epoch": 0.89, "learning_rate": 0.00016707500467932126, "loss": 0.0472, "step": 137300 }, { "epoch": 0.89, "learning_rate": 0.00016706532332496434, "loss": 0.0437, "step": 137310 }, { "epoch": 0.89, "learning_rate": 0.0001670556419706074, "loss": 0.0389, "step": 137320 }, { "epoch": 0.89, "learning_rate": 0.00016704596061625044, "loss": 0.0415, "step": 137330 }, { "epoch": 0.89, "learning_rate": 0.00016703627926189352, "loss": 0.043, "step": 137340 }, { "epoch": 0.89, "learning_rate": 0.0001670265979075366, "loss": 0.0405, "step": 137350 }, { "epoch": 0.89, "learning_rate": 0.00016701691655317968, "loss": 0.0385, "step": 137360 }, { "epoch": 0.89, "learning_rate": 0.00016700723519882273, "loss": 0.0466, "step": 137370 }, { "epoch": 0.89, "learning_rate": 0.00016699755384446581, "loss": 0.0359, "step": 137380 }, { "epoch": 0.89, "learning_rate": 0.00016698787249010887, "loss": 0.0421, "step": 137390 }, { "epoch": 0.89, "learning_rate": 0.00016697819113575192, "loss": 0.0451, "step": 137400 }, { "epoch": 0.89, "learning_rate": 0.000166968509781395, "loss": 0.0391, "step": 137410 }, { "epoch": 0.89, "learning_rate": 0.00016695882842703808, "loss": 0.0415, "step": 137420 }, { "epoch": 0.89, "learning_rate": 0.00016694914707268113, "loss": 0.0432, "step": 137430 }, { "epoch": 0.89, "learning_rate": 0.0001669394657183242, "loss": 0.038, "step": 137440 }, { "epoch": 0.89, "learning_rate": 0.0001669297843639673, "loss": 0.0393, "step": 137450 }, { "epoch": 0.89, "learning_rate": 0.00016692010300961032, "loss": 0.0416, "step": 137460 }, { "epoch": 0.89, "learning_rate": 0.0001669104216552534, "loss": 0.0454, "step": 137470 }, { "epoch": 0.89, "learning_rate": 0.00016690074030089648, "loss": 0.0421, "step": 137480 }, { "epoch": 0.89, "learning_rate": 0.00016689105894653956, "loss": 0.0342, "step": 137490 }, { "epoch": 0.89, "learning_rate": 0.0001668813775921826, "loss": 0.0387, "step": 137500 }, { "epoch": 0.89, "learning_rate": 0.0001668716962378257, "loss": 0.0391, "step": 137510 }, { "epoch": 0.89, "learning_rate": 0.00016686201488346877, "loss": 0.0366, "step": 137520 }, { "epoch": 0.89, "learning_rate": 0.0001668523335291118, "loss": 0.0351, "step": 137530 }, { "epoch": 0.89, "learning_rate": 0.00016684265217475487, "loss": 0.0409, "step": 137540 }, { "epoch": 0.89, "learning_rate": 0.00016683297082039795, "loss": 0.0387, "step": 137550 }, { "epoch": 0.89, "learning_rate": 0.00016682328946604103, "loss": 0.0415, "step": 137560 }, { "epoch": 0.89, "learning_rate": 0.00016681360811168409, "loss": 0.0354, "step": 137570 }, { "epoch": 0.89, "learning_rate": 0.00016680392675732717, "loss": 0.0381, "step": 137580 }, { "epoch": 0.89, "learning_rate": 0.00016679424540297025, "loss": 0.0429, "step": 137590 }, { "epoch": 0.89, "learning_rate": 0.00016678456404861327, "loss": 0.037, "step": 137600 }, { "epoch": 0.89, "learning_rate": 0.00016677488269425635, "loss": 0.0387, "step": 137610 }, { "epoch": 0.89, "learning_rate": 0.00016676520133989943, "loss": 0.0383, "step": 137620 }, { "epoch": 0.89, "learning_rate": 0.00016675551998554248, "loss": 0.0394, "step": 137630 }, { "epoch": 0.89, "learning_rate": 0.00016674583863118556, "loss": 0.0399, "step": 137640 }, { "epoch": 0.89, "learning_rate": 0.00016673615727682864, "loss": 0.043, "step": 137650 }, { "epoch": 0.89, "learning_rate": 0.00016672647592247172, "loss": 0.035, "step": 137660 }, { "epoch": 0.89, "learning_rate": 0.00016671679456811475, "loss": 0.0404, "step": 137670 }, { "epoch": 0.89, "learning_rate": 0.00016670711321375783, "loss": 0.0455, "step": 137680 }, { "epoch": 0.89, "learning_rate": 0.0001666974318594009, "loss": 0.036, "step": 137690 }, { "epoch": 0.89, "learning_rate": 0.00016668775050504396, "loss": 0.0459, "step": 137700 }, { "epoch": 0.89, "learning_rate": 0.00016667806915068704, "loss": 0.0404, "step": 137710 }, { "epoch": 0.89, "learning_rate": 0.00016666838779633012, "loss": 0.0348, "step": 137720 }, { "epoch": 0.89, "learning_rate": 0.0001666587064419732, "loss": 0.0387, "step": 137730 }, { "epoch": 0.89, "learning_rate": 0.00016664902508761623, "loss": 0.0346, "step": 137740 }, { "epoch": 0.89, "learning_rate": 0.0001666393437332593, "loss": 0.0396, "step": 137750 }, { "epoch": 0.89, "learning_rate": 0.00016662966237890239, "loss": 0.0461, "step": 137760 }, { "epoch": 0.89, "learning_rate": 0.00016661998102454544, "loss": 0.0379, "step": 137770 }, { "epoch": 0.89, "learning_rate": 0.00016661029967018852, "loss": 0.0368, "step": 137780 }, { "epoch": 0.89, "learning_rate": 0.0001666006183158316, "loss": 0.0383, "step": 137790 }, { "epoch": 0.89, "learning_rate": 0.00016659093696147465, "loss": 0.0353, "step": 137800 }, { "epoch": 0.89, "learning_rate": 0.0001665812556071177, "loss": 0.0411, "step": 137810 }, { "epoch": 0.89, "learning_rate": 0.00016657157425276078, "loss": 0.0394, "step": 137820 }, { "epoch": 0.89, "learning_rate": 0.00016656189289840384, "loss": 0.0347, "step": 137830 }, { "epoch": 0.89, "learning_rate": 0.00016655221154404692, "loss": 0.039, "step": 137840 }, { "epoch": 0.89, "learning_rate": 0.00016654253018969, "loss": 0.0401, "step": 137850 }, { "epoch": 0.89, "learning_rate": 0.00016653284883533307, "loss": 0.0426, "step": 137860 }, { "epoch": 0.89, "learning_rate": 0.00016652316748097613, "loss": 0.0383, "step": 137870 }, { "epoch": 0.89, "learning_rate": 0.00016651348612661918, "loss": 0.0395, "step": 137880 }, { "epoch": 0.89, "learning_rate": 0.00016650380477226226, "loss": 0.0435, "step": 137890 }, { "epoch": 0.89, "learning_rate": 0.0001664941234179053, "loss": 0.0399, "step": 137900 }, { "epoch": 0.89, "learning_rate": 0.0001664844420635484, "loss": 0.0382, "step": 137910 }, { "epoch": 0.89, "learning_rate": 0.00016647476070919147, "loss": 0.0431, "step": 137920 }, { "epoch": 0.89, "learning_rate": 0.00016646507935483455, "loss": 0.0431, "step": 137930 }, { "epoch": 0.89, "learning_rate": 0.0001664553980004776, "loss": 0.0458, "step": 137940 }, { "epoch": 0.89, "learning_rate": 0.00016644571664612066, "loss": 0.0355, "step": 137950 }, { "epoch": 0.89, "learning_rate": 0.00016643603529176374, "loss": 0.0413, "step": 137960 }, { "epoch": 0.89, "learning_rate": 0.0001664263539374068, "loss": 0.0501, "step": 137970 }, { "epoch": 0.89, "learning_rate": 0.00016641667258304987, "loss": 0.0418, "step": 137980 }, { "epoch": 0.89, "learning_rate": 0.00016640699122869295, "loss": 0.038, "step": 137990 }, { "epoch": 0.89, "learning_rate": 0.00016639730987433603, "loss": 0.0422, "step": 138000 }, { "epoch": 0.89, "eval_cer": 0.9199258840808948, "eval_loss": 0.026540521532297134, "eval_runtime": 119.7003, "eval_samples_per_second": 16.708, "eval_steps_per_second": 4.177, "step": 138000 }, { "epoch": 0.89, "learning_rate": 0.00016638762851997908, "loss": 0.0394, "step": 138010 }, { "epoch": 0.89, "learning_rate": 0.00016637794716562213, "loss": 0.0431, "step": 138020 }, { "epoch": 0.89, "learning_rate": 0.0001663682658112652, "loss": 0.0419, "step": 138030 }, { "epoch": 0.89, "learning_rate": 0.00016635858445690827, "loss": 0.0418, "step": 138040 }, { "epoch": 0.89, "learning_rate": 0.00016634890310255135, "loss": 0.0443, "step": 138050 }, { "epoch": 0.89, "learning_rate": 0.00016633922174819443, "loss": 0.0432, "step": 138060 }, { "epoch": 0.89, "learning_rate": 0.00016632954039383748, "loss": 0.0379, "step": 138070 }, { "epoch": 0.89, "learning_rate": 0.00016631985903948056, "loss": 0.0426, "step": 138080 }, { "epoch": 0.89, "learning_rate": 0.0001663101776851236, "loss": 0.0437, "step": 138090 }, { "epoch": 0.89, "learning_rate": 0.00016630049633076666, "loss": 0.0422, "step": 138100 }, { "epoch": 0.89, "learning_rate": 0.00016629081497640974, "loss": 0.0465, "step": 138110 }, { "epoch": 0.89, "learning_rate": 0.00016628113362205282, "loss": 0.0387, "step": 138120 }, { "epoch": 0.89, "learning_rate": 0.0001662714522676959, "loss": 0.0374, "step": 138130 }, { "epoch": 0.89, "learning_rate": 0.00016626177091333896, "loss": 0.0405, "step": 138140 }, { "epoch": 0.89, "learning_rate": 0.00016625208955898204, "loss": 0.0429, "step": 138150 }, { "epoch": 0.89, "learning_rate": 0.0001662424082046251, "loss": 0.0401, "step": 138160 }, { "epoch": 0.89, "learning_rate": 0.00016623272685026814, "loss": 0.04, "step": 138170 }, { "epoch": 0.89, "learning_rate": 0.00016622304549591122, "loss": 0.042, "step": 138180 }, { "epoch": 0.89, "learning_rate": 0.0001662133641415543, "loss": 0.0473, "step": 138190 }, { "epoch": 0.89, "learning_rate": 0.00016620368278719738, "loss": 0.0393, "step": 138200 }, { "epoch": 0.89, "learning_rate": 0.00016619400143284043, "loss": 0.0462, "step": 138210 }, { "epoch": 0.89, "learning_rate": 0.0001661843200784835, "loss": 0.0405, "step": 138220 }, { "epoch": 0.89, "learning_rate": 0.00016617463872412654, "loss": 0.0426, "step": 138230 }, { "epoch": 0.89, "learning_rate": 0.00016616495736976962, "loss": 0.0348, "step": 138240 }, { "epoch": 0.89, "learning_rate": 0.0001661552760154127, "loss": 0.0437, "step": 138250 }, { "epoch": 0.89, "learning_rate": 0.00016614559466105578, "loss": 0.044, "step": 138260 }, { "epoch": 0.89, "learning_rate": 0.00016613591330669883, "loss": 0.0377, "step": 138270 }, { "epoch": 0.89, "learning_rate": 0.0001661262319523419, "loss": 0.0375, "step": 138280 }, { "epoch": 0.89, "learning_rate": 0.000166116550597985, "loss": 0.0355, "step": 138290 }, { "epoch": 0.89, "learning_rate": 0.00016610686924362802, "loss": 0.05, "step": 138300 }, { "epoch": 0.89, "learning_rate": 0.0001660971878892711, "loss": 0.0409, "step": 138310 }, { "epoch": 0.89, "learning_rate": 0.00016608750653491418, "loss": 0.0388, "step": 138320 }, { "epoch": 0.89, "learning_rate": 0.00016607782518055726, "loss": 0.0354, "step": 138330 }, { "epoch": 0.89, "learning_rate": 0.0001660681438262003, "loss": 0.0403, "step": 138340 }, { "epoch": 0.89, "learning_rate": 0.0001660584624718434, "loss": 0.0403, "step": 138350 }, { "epoch": 0.89, "learning_rate": 0.00016604878111748647, "loss": 0.0448, "step": 138360 }, { "epoch": 0.89, "learning_rate": 0.0001660390997631295, "loss": 0.0425, "step": 138370 }, { "epoch": 0.89, "learning_rate": 0.00016602941840877257, "loss": 0.0419, "step": 138380 }, { "epoch": 0.89, "learning_rate": 0.00016601973705441565, "loss": 0.0388, "step": 138390 }, { "epoch": 0.89, "learning_rate": 0.00016601005570005873, "loss": 0.0378, "step": 138400 }, { "epoch": 0.89, "learning_rate": 0.00016600037434570179, "loss": 0.0437, "step": 138410 }, { "epoch": 0.89, "learning_rate": 0.00016599069299134487, "loss": 0.0417, "step": 138420 }, { "epoch": 0.89, "learning_rate": 0.00016598101163698795, "loss": 0.038, "step": 138430 }, { "epoch": 0.89, "learning_rate": 0.00016597133028263097, "loss": 0.035, "step": 138440 }, { "epoch": 0.89, "learning_rate": 0.00016596164892827405, "loss": 0.0518, "step": 138450 }, { "epoch": 0.89, "learning_rate": 0.00016595196757391713, "loss": 0.0446, "step": 138460 }, { "epoch": 0.89, "learning_rate": 0.00016594228621956018, "loss": 0.0471, "step": 138470 }, { "epoch": 0.89, "learning_rate": 0.00016593260486520326, "loss": 0.0398, "step": 138480 }, { "epoch": 0.89, "learning_rate": 0.00016592292351084634, "loss": 0.0455, "step": 138490 }, { "epoch": 0.89, "learning_rate": 0.00016591324215648942, "loss": 0.0391, "step": 138500 }, { "epoch": 0.89, "learning_rate": 0.00016590356080213245, "loss": 0.0357, "step": 138510 }, { "epoch": 0.89, "learning_rate": 0.00016589387944777553, "loss": 0.0417, "step": 138520 }, { "epoch": 0.89, "learning_rate": 0.0001658841980934186, "loss": 0.036, "step": 138530 }, { "epoch": 0.89, "learning_rate": 0.00016587451673906166, "loss": 0.0357, "step": 138540 }, { "epoch": 0.89, "learning_rate": 0.00016586483538470474, "loss": 0.0478, "step": 138550 }, { "epoch": 0.89, "learning_rate": 0.00016585515403034782, "loss": 0.0355, "step": 138560 }, { "epoch": 0.89, "learning_rate": 0.0001658454726759909, "loss": 0.0449, "step": 138570 }, { "epoch": 0.89, "learning_rate": 0.00016583579132163393, "loss": 0.0395, "step": 138580 }, { "epoch": 0.89, "learning_rate": 0.000165826109967277, "loss": 0.0418, "step": 138590 }, { "epoch": 0.89, "learning_rate": 0.00016581642861292008, "loss": 0.0424, "step": 138600 }, { "epoch": 0.89, "learning_rate": 0.00016580674725856314, "loss": 0.0367, "step": 138610 }, { "epoch": 0.89, "learning_rate": 0.00016579706590420622, "loss": 0.039, "step": 138620 }, { "epoch": 0.89, "learning_rate": 0.0001657873845498493, "loss": 0.0468, "step": 138630 }, { "epoch": 0.89, "learning_rate": 0.00016577770319549235, "loss": 0.0457, "step": 138640 }, { "epoch": 0.89, "learning_rate": 0.0001657680218411354, "loss": 0.0355, "step": 138650 }, { "epoch": 0.89, "learning_rate": 0.00016575834048677848, "loss": 0.04, "step": 138660 }, { "epoch": 0.9, "learning_rate": 0.00016574865913242153, "loss": 0.0446, "step": 138670 }, { "epoch": 0.9, "learning_rate": 0.00016573897777806461, "loss": 0.0436, "step": 138680 }, { "epoch": 0.9, "learning_rate": 0.0001657292964237077, "loss": 0.0391, "step": 138690 }, { "epoch": 0.9, "learning_rate": 0.00016571961506935077, "loss": 0.0417, "step": 138700 }, { "epoch": 0.9, "learning_rate": 0.00016570993371499383, "loss": 0.0373, "step": 138710 }, { "epoch": 0.9, "learning_rate": 0.00016570025236063688, "loss": 0.0413, "step": 138720 }, { "epoch": 0.9, "learning_rate": 0.00016569057100627996, "loss": 0.0427, "step": 138730 }, { "epoch": 0.9, "learning_rate": 0.000165680889651923, "loss": 0.0366, "step": 138740 }, { "epoch": 0.9, "learning_rate": 0.0001656712082975661, "loss": 0.0426, "step": 138750 }, { "epoch": 0.9, "learning_rate": 0.00016566152694320917, "loss": 0.0421, "step": 138760 }, { "epoch": 0.9, "learning_rate": 0.00016565184558885225, "loss": 0.0366, "step": 138770 }, { "epoch": 0.9, "learning_rate": 0.0001656421642344953, "loss": 0.0351, "step": 138780 }, { "epoch": 0.9, "learning_rate": 0.00016563248288013836, "loss": 0.0438, "step": 138790 }, { "epoch": 0.9, "learning_rate": 0.00016562280152578144, "loss": 0.0406, "step": 138800 }, { "epoch": 0.9, "learning_rate": 0.0001656131201714245, "loss": 0.0408, "step": 138810 }, { "epoch": 0.9, "learning_rate": 0.00016560343881706757, "loss": 0.0423, "step": 138820 }, { "epoch": 0.9, "learning_rate": 0.00016559375746271065, "loss": 0.0376, "step": 138830 }, { "epoch": 0.9, "learning_rate": 0.0001655840761083537, "loss": 0.0486, "step": 138840 }, { "epoch": 0.9, "learning_rate": 0.00016557439475399678, "loss": 0.0391, "step": 138850 }, { "epoch": 0.9, "learning_rate": 0.00016556471339963983, "loss": 0.0406, "step": 138860 }, { "epoch": 0.9, "learning_rate": 0.0001655550320452829, "loss": 0.0512, "step": 138870 }, { "epoch": 0.9, "learning_rate": 0.00016554535069092597, "loss": 0.0444, "step": 138880 }, { "epoch": 0.9, "learning_rate": 0.00016553566933656905, "loss": 0.0407, "step": 138890 }, { "epoch": 0.9, "learning_rate": 0.00016552598798221213, "loss": 0.0394, "step": 138900 }, { "epoch": 0.9, "learning_rate": 0.00016551630662785518, "loss": 0.038, "step": 138910 }, { "epoch": 0.9, "learning_rate": 0.00016550662527349826, "loss": 0.0522, "step": 138920 }, { "epoch": 0.9, "learning_rate": 0.0001654969439191413, "loss": 0.0376, "step": 138930 }, { "epoch": 0.9, "learning_rate": 0.00016548726256478436, "loss": 0.0389, "step": 138940 }, { "epoch": 0.9, "learning_rate": 0.00016547758121042744, "loss": 0.0415, "step": 138950 }, { "epoch": 0.9, "learning_rate": 0.00016546789985607052, "loss": 0.0414, "step": 138960 }, { "epoch": 0.9, "learning_rate": 0.0001654582185017136, "loss": 0.0423, "step": 138970 }, { "epoch": 0.9, "learning_rate": 0.00016544853714735666, "loss": 0.0422, "step": 138980 }, { "epoch": 0.9, "learning_rate": 0.00016543885579299974, "loss": 0.0373, "step": 138990 }, { "epoch": 0.9, "learning_rate": 0.0001654291744386428, "loss": 0.0464, "step": 139000 }, { "epoch": 0.9, "eval_cer": 0.9199593266297593, "eval_loss": 0.026463398709893227, "eval_runtime": 120.0017, "eval_samples_per_second": 16.666, "eval_steps_per_second": 4.167, "step": 139000 }, { "epoch": 0.9, "learning_rate": 0.00016541949308428584, "loss": 0.0513, "step": 139010 }, { "epoch": 0.9, "learning_rate": 0.00016540981172992892, "loss": 0.0376, "step": 139020 }, { "epoch": 0.9, "learning_rate": 0.000165400130375572, "loss": 0.0459, "step": 139030 }, { "epoch": 0.9, "learning_rate": 0.00016539044902121505, "loss": 0.0433, "step": 139040 }, { "epoch": 0.9, "learning_rate": 0.00016538076766685813, "loss": 0.0399, "step": 139050 }, { "epoch": 0.9, "learning_rate": 0.0001653710863125012, "loss": 0.0367, "step": 139060 }, { "epoch": 0.9, "learning_rate": 0.00016536140495814424, "loss": 0.0391, "step": 139070 }, { "epoch": 0.9, "learning_rate": 0.00016535172360378732, "loss": 0.0349, "step": 139080 }, { "epoch": 0.9, "learning_rate": 0.0001653420422494304, "loss": 0.0395, "step": 139090 }, { "epoch": 0.9, "learning_rate": 0.00016533236089507348, "loss": 0.0373, "step": 139100 }, { "epoch": 0.9, "learning_rate": 0.00016532267954071653, "loss": 0.0402, "step": 139110 }, { "epoch": 0.9, "learning_rate": 0.0001653129981863596, "loss": 0.0334, "step": 139120 }, { "epoch": 0.9, "learning_rate": 0.0001653033168320027, "loss": 0.0364, "step": 139130 }, { "epoch": 0.9, "learning_rate": 0.00016529363547764572, "loss": 0.0368, "step": 139140 }, { "epoch": 0.9, "learning_rate": 0.0001652839541232888, "loss": 0.038, "step": 139150 }, { "epoch": 0.9, "learning_rate": 0.00016527427276893188, "loss": 0.0306, "step": 139160 }, { "epoch": 0.9, "learning_rate": 0.00016526459141457496, "loss": 0.0424, "step": 139170 }, { "epoch": 0.9, "learning_rate": 0.000165254910060218, "loss": 0.0373, "step": 139180 }, { "epoch": 0.9, "learning_rate": 0.0001652452287058611, "loss": 0.0351, "step": 139190 }, { "epoch": 0.9, "learning_rate": 0.00016523554735150417, "loss": 0.0427, "step": 139200 }, { "epoch": 0.9, "learning_rate": 0.0001652258659971472, "loss": 0.0519, "step": 139210 }, { "epoch": 0.9, "learning_rate": 0.00016521618464279027, "loss": 0.0424, "step": 139220 }, { "epoch": 0.9, "learning_rate": 0.00016520650328843335, "loss": 0.0409, "step": 139230 }, { "epoch": 0.9, "learning_rate": 0.0001651968219340764, "loss": 0.0391, "step": 139240 }, { "epoch": 0.9, "learning_rate": 0.00016518714057971949, "loss": 0.0387, "step": 139250 }, { "epoch": 0.9, "learning_rate": 0.00016517745922536256, "loss": 0.0444, "step": 139260 }, { "epoch": 0.9, "learning_rate": 0.00016516777787100564, "loss": 0.0406, "step": 139270 }, { "epoch": 0.9, "learning_rate": 0.00016515809651664867, "loss": 0.0344, "step": 139280 }, { "epoch": 0.9, "learning_rate": 0.00016514841516229175, "loss": 0.0364, "step": 139290 }, { "epoch": 0.9, "learning_rate": 0.00016513873380793483, "loss": 0.0383, "step": 139300 }, { "epoch": 0.9, "learning_rate": 0.00016512905245357788, "loss": 0.0383, "step": 139310 }, { "epoch": 0.9, "learning_rate": 0.00016511937109922096, "loss": 0.0351, "step": 139320 }, { "epoch": 0.9, "learning_rate": 0.00016510968974486404, "loss": 0.0406, "step": 139330 }, { "epoch": 0.9, "learning_rate": 0.00016510000839050712, "loss": 0.0403, "step": 139340 }, { "epoch": 0.9, "learning_rate": 0.00016509032703615015, "loss": 0.0403, "step": 139350 }, { "epoch": 0.9, "learning_rate": 0.00016508064568179323, "loss": 0.0374, "step": 139360 }, { "epoch": 0.9, "learning_rate": 0.0001650709643274363, "loss": 0.0383, "step": 139370 }, { "epoch": 0.9, "learning_rate": 0.00016506128297307936, "loss": 0.0354, "step": 139380 }, { "epoch": 0.9, "learning_rate": 0.00016505160161872244, "loss": 0.041, "step": 139390 }, { "epoch": 0.9, "learning_rate": 0.00016504192026436552, "loss": 0.0387, "step": 139400 }, { "epoch": 0.9, "learning_rate": 0.00016503223891000857, "loss": 0.0319, "step": 139410 }, { "epoch": 0.9, "learning_rate": 0.00016502255755565162, "loss": 0.0434, "step": 139420 }, { "epoch": 0.9, "learning_rate": 0.0001650128762012947, "loss": 0.0382, "step": 139430 }, { "epoch": 0.9, "learning_rate": 0.00016500319484693776, "loss": 0.0405, "step": 139440 }, { "epoch": 0.9, "learning_rate": 0.00016499351349258084, "loss": 0.0354, "step": 139450 }, { "epoch": 0.9, "learning_rate": 0.00016498383213822392, "loss": 0.0454, "step": 139460 }, { "epoch": 0.9, "learning_rate": 0.000164974150783867, "loss": 0.0429, "step": 139470 }, { "epoch": 0.9, "learning_rate": 0.00016496446942951005, "loss": 0.0434, "step": 139480 }, { "epoch": 0.9, "learning_rate": 0.0001649547880751531, "loss": 0.0389, "step": 139490 }, { "epoch": 0.9, "learning_rate": 0.00016494510672079618, "loss": 0.0436, "step": 139500 }, { "epoch": 0.9, "learning_rate": 0.00016493542536643923, "loss": 0.0375, "step": 139510 }, { "epoch": 0.9, "learning_rate": 0.00016492574401208231, "loss": 0.0385, "step": 139520 }, { "epoch": 0.9, "learning_rate": 0.0001649160626577254, "loss": 0.0492, "step": 139530 }, { "epoch": 0.9, "learning_rate": 0.00016490638130336847, "loss": 0.0357, "step": 139540 }, { "epoch": 0.9, "learning_rate": 0.00016489669994901153, "loss": 0.0365, "step": 139550 }, { "epoch": 0.9, "learning_rate": 0.00016488701859465458, "loss": 0.0448, "step": 139560 }, { "epoch": 0.9, "learning_rate": 0.00016487733724029766, "loss": 0.0379, "step": 139570 }, { "epoch": 0.9, "learning_rate": 0.0001648676558859407, "loss": 0.036, "step": 139580 }, { "epoch": 0.9, "learning_rate": 0.0001648579745315838, "loss": 0.0388, "step": 139590 }, { "epoch": 0.9, "learning_rate": 0.00016484829317722687, "loss": 0.0486, "step": 139600 }, { "epoch": 0.9, "learning_rate": 0.00016483861182286992, "loss": 0.0347, "step": 139610 }, { "epoch": 0.9, "learning_rate": 0.000164828930468513, "loss": 0.0335, "step": 139620 }, { "epoch": 0.9, "learning_rate": 0.00016481924911415606, "loss": 0.041, "step": 139630 }, { "epoch": 0.9, "learning_rate": 0.0001648095677597991, "loss": 0.0334, "step": 139640 }, { "epoch": 0.9, "learning_rate": 0.0001647998864054422, "loss": 0.0494, "step": 139650 }, { "epoch": 0.9, "learning_rate": 0.00016479020505108527, "loss": 0.0455, "step": 139660 }, { "epoch": 0.9, "learning_rate": 0.00016478052369672835, "loss": 0.034, "step": 139670 }, { "epoch": 0.9, "learning_rate": 0.0001647708423423714, "loss": 0.0378, "step": 139680 }, { "epoch": 0.9, "learning_rate": 0.00016476116098801448, "loss": 0.0422, "step": 139690 }, { "epoch": 0.9, "learning_rate": 0.00016475147963365753, "loss": 0.0385, "step": 139700 }, { "epoch": 0.9, "learning_rate": 0.00016474179827930059, "loss": 0.0412, "step": 139710 }, { "epoch": 0.9, "learning_rate": 0.00016473211692494367, "loss": 0.0365, "step": 139720 }, { "epoch": 0.9, "learning_rate": 0.00016472243557058675, "loss": 0.034, "step": 139730 }, { "epoch": 0.9, "learning_rate": 0.00016471275421622983, "loss": 0.0368, "step": 139740 }, { "epoch": 0.9, "learning_rate": 0.00016470307286187288, "loss": 0.0343, "step": 139750 }, { "epoch": 0.9, "learning_rate": 0.00016469339150751596, "loss": 0.0388, "step": 139760 }, { "epoch": 0.9, "learning_rate": 0.000164683710153159, "loss": 0.0499, "step": 139770 }, { "epoch": 0.9, "learning_rate": 0.00016467402879880206, "loss": 0.0396, "step": 139780 }, { "epoch": 0.9, "learning_rate": 0.00016466434744444514, "loss": 0.0423, "step": 139790 }, { "epoch": 0.9, "learning_rate": 0.00016465466609008822, "loss": 0.0412, "step": 139800 }, { "epoch": 0.9, "learning_rate": 0.00016464498473573128, "loss": 0.0418, "step": 139810 }, { "epoch": 0.9, "learning_rate": 0.00016463530338137436, "loss": 0.04, "step": 139820 }, { "epoch": 0.9, "learning_rate": 0.00016462562202701744, "loss": 0.0367, "step": 139830 }, { "epoch": 0.9, "learning_rate": 0.00016461594067266046, "loss": 0.042, "step": 139840 }, { "epoch": 0.9, "learning_rate": 0.00016460625931830354, "loss": 0.0402, "step": 139850 }, { "epoch": 0.9, "learning_rate": 0.00016459657796394662, "loss": 0.0433, "step": 139860 }, { "epoch": 0.9, "learning_rate": 0.0001645868966095897, "loss": 0.0346, "step": 139870 }, { "epoch": 0.9, "learning_rate": 0.00016457721525523275, "loss": 0.0394, "step": 139880 }, { "epoch": 0.9, "learning_rate": 0.00016456753390087583, "loss": 0.0377, "step": 139890 }, { "epoch": 0.9, "learning_rate": 0.0001645578525465189, "loss": 0.0339, "step": 139900 }, { "epoch": 0.9, "learning_rate": 0.00016454817119216194, "loss": 0.0372, "step": 139910 }, { "epoch": 0.9, "learning_rate": 0.00016453848983780502, "loss": 0.0351, "step": 139920 }, { "epoch": 0.9, "learning_rate": 0.0001645288084834481, "loss": 0.0408, "step": 139930 }, { "epoch": 0.9, "learning_rate": 0.00016451912712909118, "loss": 0.041, "step": 139940 }, { "epoch": 0.9, "learning_rate": 0.00016450944577473423, "loss": 0.0504, "step": 139950 }, { "epoch": 0.9, "learning_rate": 0.0001644997644203773, "loss": 0.0447, "step": 139960 }, { "epoch": 0.9, "learning_rate": 0.0001644900830660204, "loss": 0.0451, "step": 139970 }, { "epoch": 0.9, "learning_rate": 0.00016448040171166342, "loss": 0.0405, "step": 139980 }, { "epoch": 0.9, "learning_rate": 0.0001644707203573065, "loss": 0.0367, "step": 139990 }, { "epoch": 0.9, "learning_rate": 0.00016446103900294958, "loss": 0.0372, "step": 140000 }, { "epoch": 0.9, "eval_cer": 0.9199656535984635, "eval_loss": 0.027039654552936554, "eval_runtime": 119.7354, "eval_samples_per_second": 16.703, "eval_steps_per_second": 4.176, "step": 140000 }, { "epoch": 0.9, "learning_rate": 0.00016445135764859263, "loss": 0.0391, "step": 140010 }, { "epoch": 0.9, "learning_rate": 0.0001644416762942357, "loss": 0.0405, "step": 140020 }, { "epoch": 0.9, "learning_rate": 0.0001644319949398788, "loss": 0.0441, "step": 140030 }, { "epoch": 0.9, "learning_rate": 0.00016442231358552187, "loss": 0.0399, "step": 140040 }, { "epoch": 0.9, "learning_rate": 0.0001644126322311649, "loss": 0.0372, "step": 140050 }, { "epoch": 0.9, "learning_rate": 0.00016440295087680797, "loss": 0.0386, "step": 140060 }, { "epoch": 0.9, "learning_rate": 0.00016439326952245105, "loss": 0.0398, "step": 140070 }, { "epoch": 0.9, "learning_rate": 0.0001643835881680941, "loss": 0.0358, "step": 140080 }, { "epoch": 0.9, "learning_rate": 0.00016437390681373718, "loss": 0.0388, "step": 140090 }, { "epoch": 0.9, "learning_rate": 0.00016436422545938026, "loss": 0.0381, "step": 140100 }, { "epoch": 0.9, "learning_rate": 0.00016435454410502334, "loss": 0.0417, "step": 140110 }, { "epoch": 0.9, "learning_rate": 0.00016434486275066637, "loss": 0.0428, "step": 140120 }, { "epoch": 0.9, "learning_rate": 0.00016433518139630945, "loss": 0.0348, "step": 140130 }, { "epoch": 0.9, "learning_rate": 0.00016432550004195253, "loss": 0.0335, "step": 140140 }, { "epoch": 0.9, "learning_rate": 0.00016431581868759558, "loss": 0.0435, "step": 140150 }, { "epoch": 0.9, "learning_rate": 0.00016430613733323866, "loss": 0.0394, "step": 140160 }, { "epoch": 0.9, "learning_rate": 0.00016429645597888174, "loss": 0.0455, "step": 140170 }, { "epoch": 0.9, "learning_rate": 0.00016428677462452482, "loss": 0.0372, "step": 140180 }, { "epoch": 0.9, "learning_rate": 0.00016427709327016785, "loss": 0.0365, "step": 140190 }, { "epoch": 0.9, "learning_rate": 0.00016426741191581093, "loss": 0.039, "step": 140200 }, { "epoch": 0.9, "learning_rate": 0.00016425773056145398, "loss": 0.041, "step": 140210 }, { "epoch": 0.91, "learning_rate": 0.00016424804920709706, "loss": 0.0348, "step": 140220 }, { "epoch": 0.91, "learning_rate": 0.00016423836785274014, "loss": 0.0384, "step": 140230 }, { "epoch": 0.91, "learning_rate": 0.00016422868649838322, "loss": 0.0394, "step": 140240 }, { "epoch": 0.91, "learning_rate": 0.00016421900514402627, "loss": 0.0394, "step": 140250 }, { "epoch": 0.91, "learning_rate": 0.00016420932378966932, "loss": 0.042, "step": 140260 }, { "epoch": 0.91, "learning_rate": 0.0001641996424353124, "loss": 0.0399, "step": 140270 }, { "epoch": 0.91, "learning_rate": 0.00016418996108095546, "loss": 0.0433, "step": 140280 }, { "epoch": 0.91, "learning_rate": 0.00016418027972659854, "loss": 0.0421, "step": 140290 }, { "epoch": 0.91, "learning_rate": 0.00016417059837224162, "loss": 0.0371, "step": 140300 }, { "epoch": 0.91, "learning_rate": 0.0001641609170178847, "loss": 0.0382, "step": 140310 }, { "epoch": 0.91, "learning_rate": 0.00016415123566352775, "loss": 0.0345, "step": 140320 }, { "epoch": 0.91, "learning_rate": 0.0001641415543091708, "loss": 0.0381, "step": 140330 }, { "epoch": 0.91, "learning_rate": 0.00016413187295481388, "loss": 0.0347, "step": 140340 }, { "epoch": 0.91, "learning_rate": 0.00016412219160045693, "loss": 0.0356, "step": 140350 }, { "epoch": 0.91, "learning_rate": 0.00016411251024610001, "loss": 0.0433, "step": 140360 }, { "epoch": 0.91, "learning_rate": 0.0001641028288917431, "loss": 0.0404, "step": 140370 }, { "epoch": 0.91, "learning_rate": 0.00016409314753738617, "loss": 0.0403, "step": 140380 }, { "epoch": 0.91, "learning_rate": 0.00016408346618302923, "loss": 0.0419, "step": 140390 }, { "epoch": 0.91, "learning_rate": 0.00016407378482867228, "loss": 0.0398, "step": 140400 }, { "epoch": 0.91, "learning_rate": 0.00016406410347431533, "loss": 0.0423, "step": 140410 }, { "epoch": 0.91, "learning_rate": 0.0001640544221199584, "loss": 0.0393, "step": 140420 }, { "epoch": 0.91, "learning_rate": 0.0001640447407656015, "loss": 0.0383, "step": 140430 }, { "epoch": 0.91, "learning_rate": 0.00016403505941124457, "loss": 0.0364, "step": 140440 }, { "epoch": 0.91, "learning_rate": 0.00016402537805688762, "loss": 0.0392, "step": 140450 }, { "epoch": 0.91, "learning_rate": 0.0001640156967025307, "loss": 0.0403, "step": 140460 }, { "epoch": 0.91, "learning_rate": 0.00016400601534817376, "loss": 0.0404, "step": 140470 }, { "epoch": 0.91, "learning_rate": 0.0001639963339938168, "loss": 0.038, "step": 140480 }, { "epoch": 0.91, "learning_rate": 0.0001639866526394599, "loss": 0.0427, "step": 140490 }, { "epoch": 0.91, "learning_rate": 0.00016397697128510297, "loss": 0.0407, "step": 140500 }, { "epoch": 0.91, "learning_rate": 0.00016396728993074605, "loss": 0.0416, "step": 140510 }, { "epoch": 0.91, "learning_rate": 0.0001639576085763891, "loss": 0.0385, "step": 140520 }, { "epoch": 0.91, "learning_rate": 0.00016394792722203218, "loss": 0.0392, "step": 140530 }, { "epoch": 0.91, "learning_rate": 0.00016393824586767523, "loss": 0.0389, "step": 140540 }, { "epoch": 0.91, "learning_rate": 0.00016392856451331829, "loss": 0.0402, "step": 140550 }, { "epoch": 0.91, "learning_rate": 0.00016391888315896137, "loss": 0.0401, "step": 140560 }, { "epoch": 0.91, "learning_rate": 0.00016390920180460445, "loss": 0.0355, "step": 140570 }, { "epoch": 0.91, "learning_rate": 0.00016389952045024753, "loss": 0.0398, "step": 140580 }, { "epoch": 0.91, "learning_rate": 0.00016388983909589058, "loss": 0.0339, "step": 140590 }, { "epoch": 0.91, "learning_rate": 0.00016388015774153366, "loss": 0.0413, "step": 140600 }, { "epoch": 0.91, "learning_rate": 0.00016387047638717668, "loss": 0.0455, "step": 140610 }, { "epoch": 0.91, "learning_rate": 0.00016386079503281976, "loss": 0.0361, "step": 140620 }, { "epoch": 0.91, "learning_rate": 0.00016385111367846284, "loss": 0.046, "step": 140630 }, { "epoch": 0.91, "learning_rate": 0.00016384143232410592, "loss": 0.0408, "step": 140640 }, { "epoch": 0.91, "learning_rate": 0.00016383175096974898, "loss": 0.0424, "step": 140650 }, { "epoch": 0.91, "learning_rate": 0.00016382206961539206, "loss": 0.0339, "step": 140660 }, { "epoch": 0.91, "learning_rate": 0.00016381238826103514, "loss": 0.0346, "step": 140670 }, { "epoch": 0.91, "learning_rate": 0.00016380270690667816, "loss": 0.0387, "step": 140680 }, { "epoch": 0.91, "learning_rate": 0.00016379302555232124, "loss": 0.0429, "step": 140690 }, { "epoch": 0.91, "learning_rate": 0.00016378334419796432, "loss": 0.0408, "step": 140700 }, { "epoch": 0.91, "learning_rate": 0.0001637736628436074, "loss": 0.0425, "step": 140710 }, { "epoch": 0.91, "learning_rate": 0.00016376398148925045, "loss": 0.0438, "step": 140720 }, { "epoch": 0.91, "learning_rate": 0.00016375430013489353, "loss": 0.0411, "step": 140730 }, { "epoch": 0.91, "learning_rate": 0.0001637446187805366, "loss": 0.038, "step": 140740 }, { "epoch": 0.91, "learning_rate": 0.00016373493742617964, "loss": 0.044, "step": 140750 }, { "epoch": 0.91, "learning_rate": 0.00016372525607182272, "loss": 0.0361, "step": 140760 }, { "epoch": 0.91, "learning_rate": 0.0001637155747174658, "loss": 0.0422, "step": 140770 }, { "epoch": 0.91, "learning_rate": 0.00016370589336310888, "loss": 0.039, "step": 140780 }, { "epoch": 0.91, "learning_rate": 0.00016369621200875193, "loss": 0.0425, "step": 140790 }, { "epoch": 0.91, "learning_rate": 0.000163686530654395, "loss": 0.0383, "step": 140800 }, { "epoch": 0.91, "learning_rate": 0.0001636768493000381, "loss": 0.0391, "step": 140810 }, { "epoch": 0.91, "learning_rate": 0.00016366716794568112, "loss": 0.0358, "step": 140820 }, { "epoch": 0.91, "learning_rate": 0.0001636574865913242, "loss": 0.0391, "step": 140830 }, { "epoch": 0.91, "learning_rate": 0.00016364780523696727, "loss": 0.0474, "step": 140840 }, { "epoch": 0.91, "learning_rate": 0.00016363812388261033, "loss": 0.0406, "step": 140850 }, { "epoch": 0.91, "learning_rate": 0.0001636284425282534, "loss": 0.0379, "step": 140860 }, { "epoch": 0.91, "learning_rate": 0.0001636187611738965, "loss": 0.0398, "step": 140870 }, { "epoch": 0.91, "learning_rate": 0.00016360907981953957, "loss": 0.0345, "step": 140880 }, { "epoch": 0.91, "learning_rate": 0.0001635993984651826, "loss": 0.0348, "step": 140890 }, { "epoch": 0.91, "learning_rate": 0.00016358971711082567, "loss": 0.0368, "step": 140900 }, { "epoch": 0.91, "learning_rate": 0.00016358003575646875, "loss": 0.0464, "step": 140910 }, { "epoch": 0.91, "learning_rate": 0.0001635703544021118, "loss": 0.0372, "step": 140920 }, { "epoch": 0.91, "learning_rate": 0.00016356067304775488, "loss": 0.0369, "step": 140930 }, { "epoch": 0.91, "learning_rate": 0.00016355099169339796, "loss": 0.0455, "step": 140940 }, { "epoch": 0.91, "learning_rate": 0.00016354131033904104, "loss": 0.0395, "step": 140950 }, { "epoch": 0.91, "learning_rate": 0.00016353162898468407, "loss": 0.0417, "step": 140960 }, { "epoch": 0.91, "learning_rate": 0.00016352194763032715, "loss": 0.0537, "step": 140970 }, { "epoch": 0.91, "learning_rate": 0.00016351226627597023, "loss": 0.039, "step": 140980 }, { "epoch": 0.91, "learning_rate": 0.00016350258492161328, "loss": 0.0389, "step": 140990 }, { "epoch": 0.91, "learning_rate": 0.00016349290356725636, "loss": 0.0381, "step": 141000 }, { "epoch": 0.91, "eval_cer": 0.9199078070274546, "eval_loss": 0.026563717052340508, "eval_runtime": 120.0005, "eval_samples_per_second": 16.667, "eval_steps_per_second": 4.167, "step": 141000 }, { "epoch": 0.91, "learning_rate": 0.00016348322221289944, "loss": 0.0438, "step": 141010 }, { "epoch": 0.91, "learning_rate": 0.0001634735408585425, "loss": 0.038, "step": 141020 }, { "epoch": 0.91, "learning_rate": 0.00016346385950418555, "loss": 0.0431, "step": 141030 }, { "epoch": 0.91, "learning_rate": 0.00016345417814982863, "loss": 0.0427, "step": 141040 }, { "epoch": 0.91, "learning_rate": 0.00016344449679547168, "loss": 0.0396, "step": 141050 }, { "epoch": 0.91, "learning_rate": 0.00016343481544111476, "loss": 0.0437, "step": 141060 }, { "epoch": 0.91, "learning_rate": 0.00016342513408675784, "loss": 0.0415, "step": 141070 }, { "epoch": 0.91, "learning_rate": 0.00016341545273240092, "loss": 0.0381, "step": 141080 }, { "epoch": 0.91, "learning_rate": 0.00016340577137804397, "loss": 0.0416, "step": 141090 }, { "epoch": 0.91, "learning_rate": 0.00016339609002368702, "loss": 0.0392, "step": 141100 }, { "epoch": 0.91, "learning_rate": 0.0001633864086693301, "loss": 0.045, "step": 141110 }, { "epoch": 0.91, "learning_rate": 0.00016337672731497316, "loss": 0.0398, "step": 141120 }, { "epoch": 0.91, "learning_rate": 0.00016336704596061624, "loss": 0.037, "step": 141130 }, { "epoch": 0.91, "learning_rate": 0.00016335736460625932, "loss": 0.0347, "step": 141140 }, { "epoch": 0.91, "learning_rate": 0.0001633476832519024, "loss": 0.0374, "step": 141150 }, { "epoch": 0.91, "learning_rate": 0.00016333800189754545, "loss": 0.0415, "step": 141160 }, { "epoch": 0.91, "learning_rate": 0.0001633283205431885, "loss": 0.0399, "step": 141170 }, { "epoch": 0.91, "learning_rate": 0.00016331863918883158, "loss": 0.0461, "step": 141180 }, { "epoch": 0.91, "learning_rate": 0.00016330895783447463, "loss": 0.0406, "step": 141190 }, { "epoch": 0.91, "learning_rate": 0.0001632992764801177, "loss": 0.0341, "step": 141200 }, { "epoch": 0.91, "learning_rate": 0.0001632895951257608, "loss": 0.0394, "step": 141210 }, { "epoch": 0.91, "learning_rate": 0.00016327991377140385, "loss": 0.0418, "step": 141220 }, { "epoch": 0.91, "learning_rate": 0.0001632702324170469, "loss": 0.0387, "step": 141230 }, { "epoch": 0.91, "learning_rate": 0.00016326055106268998, "loss": 0.0372, "step": 141240 }, { "epoch": 0.91, "learning_rate": 0.00016325086970833303, "loss": 0.0377, "step": 141250 }, { "epoch": 0.91, "learning_rate": 0.0001632411883539761, "loss": 0.0427, "step": 141260 }, { "epoch": 0.91, "learning_rate": 0.0001632315069996192, "loss": 0.0427, "step": 141270 }, { "epoch": 0.91, "learning_rate": 0.00016322182564526227, "loss": 0.0416, "step": 141280 }, { "epoch": 0.91, "learning_rate": 0.00016321214429090532, "loss": 0.0356, "step": 141290 }, { "epoch": 0.91, "learning_rate": 0.00016320246293654838, "loss": 0.0369, "step": 141300 }, { "epoch": 0.91, "learning_rate": 0.00016319278158219146, "loss": 0.0396, "step": 141310 }, { "epoch": 0.91, "learning_rate": 0.0001631831002278345, "loss": 0.0404, "step": 141320 }, { "epoch": 0.91, "learning_rate": 0.0001631734188734776, "loss": 0.0374, "step": 141330 }, { "epoch": 0.91, "learning_rate": 0.00016316373751912067, "loss": 0.0425, "step": 141340 }, { "epoch": 0.91, "learning_rate": 0.00016315405616476375, "loss": 0.034, "step": 141350 }, { "epoch": 0.91, "learning_rate": 0.0001631443748104068, "loss": 0.0394, "step": 141360 }, { "epoch": 0.91, "learning_rate": 0.00016313469345604985, "loss": 0.0387, "step": 141370 }, { "epoch": 0.91, "learning_rate": 0.00016312501210169293, "loss": 0.0419, "step": 141380 }, { "epoch": 0.91, "learning_rate": 0.00016311533074733599, "loss": 0.0367, "step": 141390 }, { "epoch": 0.91, "learning_rate": 0.00016310564939297907, "loss": 0.0332, "step": 141400 }, { "epoch": 0.91, "learning_rate": 0.00016309596803862215, "loss": 0.0353, "step": 141410 }, { "epoch": 0.91, "learning_rate": 0.0001630862866842652, "loss": 0.0333, "step": 141420 }, { "epoch": 0.91, "learning_rate": 0.00016307660532990828, "loss": 0.0349, "step": 141430 }, { "epoch": 0.91, "learning_rate": 0.00016306692397555133, "loss": 0.0367, "step": 141440 }, { "epoch": 0.91, "learning_rate": 0.00016305724262119438, "loss": 0.0377, "step": 141450 }, { "epoch": 0.91, "learning_rate": 0.00016304756126683746, "loss": 0.0355, "step": 141460 }, { "epoch": 0.91, "learning_rate": 0.00016303787991248054, "loss": 0.0399, "step": 141470 }, { "epoch": 0.91, "learning_rate": 0.00016302819855812362, "loss": 0.0387, "step": 141480 }, { "epoch": 0.91, "learning_rate": 0.00016301851720376668, "loss": 0.038, "step": 141490 }, { "epoch": 0.91, "learning_rate": 0.00016300883584940975, "loss": 0.0348, "step": 141500 }, { "epoch": 0.91, "learning_rate": 0.0001629991544950528, "loss": 0.0396, "step": 141510 }, { "epoch": 0.91, "learning_rate": 0.00016298947314069586, "loss": 0.0415, "step": 141520 }, { "epoch": 0.91, "learning_rate": 0.00016297979178633894, "loss": 0.0394, "step": 141530 }, { "epoch": 0.91, "learning_rate": 0.00016297011043198202, "loss": 0.0399, "step": 141540 }, { "epoch": 0.91, "learning_rate": 0.0001629604290776251, "loss": 0.0307, "step": 141550 }, { "epoch": 0.91, "learning_rate": 0.00016295074772326815, "loss": 0.0358, "step": 141560 }, { "epoch": 0.91, "learning_rate": 0.00016294106636891123, "loss": 0.038, "step": 141570 }, { "epoch": 0.91, "learning_rate": 0.00016293138501455428, "loss": 0.0418, "step": 141580 }, { "epoch": 0.91, "learning_rate": 0.00016292170366019734, "loss": 0.0385, "step": 141590 }, { "epoch": 0.91, "learning_rate": 0.00016291202230584042, "loss": 0.0441, "step": 141600 }, { "epoch": 0.91, "learning_rate": 0.0001629023409514835, "loss": 0.0434, "step": 141610 }, { "epoch": 0.91, "learning_rate": 0.00016289265959712655, "loss": 0.0445, "step": 141620 }, { "epoch": 0.91, "learning_rate": 0.00016288297824276963, "loss": 0.0381, "step": 141630 }, { "epoch": 0.91, "learning_rate": 0.0001628732968884127, "loss": 0.0397, "step": 141640 }, { "epoch": 0.91, "learning_rate": 0.00016286361553405573, "loss": 0.0336, "step": 141650 }, { "epoch": 0.91, "learning_rate": 0.00016285393417969881, "loss": 0.0452, "step": 141660 }, { "epoch": 0.91, "learning_rate": 0.0001628442528253419, "loss": 0.0362, "step": 141670 }, { "epoch": 0.91, "learning_rate": 0.00016283457147098497, "loss": 0.0425, "step": 141680 }, { "epoch": 0.91, "learning_rate": 0.00016282489011662803, "loss": 0.0343, "step": 141690 }, { "epoch": 0.91, "learning_rate": 0.0001628152087622711, "loss": 0.0384, "step": 141700 }, { "epoch": 0.91, "learning_rate": 0.0001628055274079142, "loss": 0.0467, "step": 141710 }, { "epoch": 0.91, "learning_rate": 0.0001627958460535572, "loss": 0.0356, "step": 141720 }, { "epoch": 0.91, "learning_rate": 0.0001627861646992003, "loss": 0.0431, "step": 141730 }, { "epoch": 0.91, "learning_rate": 0.00016277648334484337, "loss": 0.0349, "step": 141740 }, { "epoch": 0.91, "learning_rate": 0.00016276680199048645, "loss": 0.0369, "step": 141750 }, { "epoch": 0.91, "learning_rate": 0.0001627571206361295, "loss": 0.0384, "step": 141760 }, { "epoch": 0.92, "learning_rate": 0.00016274743928177258, "loss": 0.0401, "step": 141770 }, { "epoch": 0.92, "learning_rate": 0.00016273775792741566, "loss": 0.0354, "step": 141780 }, { "epoch": 0.92, "learning_rate": 0.0001627280765730587, "loss": 0.0329, "step": 141790 }, { "epoch": 0.92, "learning_rate": 0.00016271839521870177, "loss": 0.0382, "step": 141800 }, { "epoch": 0.92, "learning_rate": 0.00016270871386434485, "loss": 0.0361, "step": 141810 }, { "epoch": 0.92, "learning_rate": 0.0001626990325099879, "loss": 0.0496, "step": 141820 }, { "epoch": 0.92, "learning_rate": 0.00016268935115563098, "loss": 0.0359, "step": 141830 }, { "epoch": 0.92, "learning_rate": 0.00016267966980127406, "loss": 0.0396, "step": 141840 }, { "epoch": 0.92, "learning_rate": 0.00016266998844691714, "loss": 0.0405, "step": 141850 }, { "epoch": 0.92, "learning_rate": 0.00016266030709256017, "loss": 0.0394, "step": 141860 }, { "epoch": 0.92, "learning_rate": 0.00016265062573820325, "loss": 0.0364, "step": 141870 }, { "epoch": 0.92, "learning_rate": 0.00016264094438384633, "loss": 0.0407, "step": 141880 }, { "epoch": 0.92, "learning_rate": 0.00016263126302948938, "loss": 0.0397, "step": 141890 }, { "epoch": 0.92, "learning_rate": 0.00016262158167513246, "loss": 0.0388, "step": 141900 }, { "epoch": 0.92, "learning_rate": 0.00016261190032077554, "loss": 0.0343, "step": 141910 }, { "epoch": 0.92, "learning_rate": 0.00016260221896641862, "loss": 0.0391, "step": 141920 }, { "epoch": 0.92, "learning_rate": 0.00016259253761206164, "loss": 0.0351, "step": 141930 }, { "epoch": 0.92, "learning_rate": 0.00016258285625770472, "loss": 0.0348, "step": 141940 }, { "epoch": 0.92, "learning_rate": 0.0001625731749033478, "loss": 0.0346, "step": 141950 }, { "epoch": 0.92, "learning_rate": 0.00016256349354899086, "loss": 0.0347, "step": 141960 }, { "epoch": 0.92, "learning_rate": 0.00016255381219463394, "loss": 0.0423, "step": 141970 }, { "epoch": 0.92, "learning_rate": 0.00016254413084027702, "loss": 0.0419, "step": 141980 }, { "epoch": 0.92, "learning_rate": 0.00016253444948592007, "loss": 0.0436, "step": 141990 }, { "epoch": 0.92, "learning_rate": 0.00016252476813156312, "loss": 0.0359, "step": 142000 }, { "epoch": 0.92, "eval_cer": 0.9198490566037736, "eval_loss": 0.02665277197957039, "eval_runtime": 119.7024, "eval_samples_per_second": 16.708, "eval_steps_per_second": 4.177, "step": 142000 }, { "epoch": 0.92, "learning_rate": 0.0001625150867772062, "loss": 0.0376, "step": 142010 }, { "epoch": 0.92, "learning_rate": 0.00016250540542284925, "loss": 0.0415, "step": 142020 }, { "epoch": 0.92, "learning_rate": 0.00016249572406849233, "loss": 0.0412, "step": 142030 }, { "epoch": 0.92, "learning_rate": 0.0001624860427141354, "loss": 0.0476, "step": 142040 }, { "epoch": 0.92, "learning_rate": 0.0001624763613597785, "loss": 0.0404, "step": 142050 }, { "epoch": 0.92, "learning_rate": 0.00016246668000542155, "loss": 0.0462, "step": 142060 }, { "epoch": 0.92, "learning_rate": 0.0001624569986510646, "loss": 0.0399, "step": 142070 }, { "epoch": 0.92, "learning_rate": 0.00016244731729670768, "loss": 0.0426, "step": 142080 }, { "epoch": 0.92, "learning_rate": 0.00016243763594235073, "loss": 0.0353, "step": 142090 }, { "epoch": 0.92, "learning_rate": 0.0001624279545879938, "loss": 0.0417, "step": 142100 }, { "epoch": 0.92, "learning_rate": 0.0001624182732336369, "loss": 0.0419, "step": 142110 }, { "epoch": 0.92, "learning_rate": 0.00016240859187927997, "loss": 0.0377, "step": 142120 }, { "epoch": 0.92, "learning_rate": 0.00016239891052492302, "loss": 0.037, "step": 142130 }, { "epoch": 0.92, "learning_rate": 0.00016238922917056608, "loss": 0.041, "step": 142140 }, { "epoch": 0.92, "learning_rate": 0.00016237954781620916, "loss": 0.0401, "step": 142150 }, { "epoch": 0.92, "learning_rate": 0.0001623698664618522, "loss": 0.0425, "step": 142160 }, { "epoch": 0.92, "learning_rate": 0.0001623601851074953, "loss": 0.0383, "step": 142170 }, { "epoch": 0.92, "learning_rate": 0.00016235050375313837, "loss": 0.0438, "step": 142180 }, { "epoch": 0.92, "learning_rate": 0.00016234082239878142, "loss": 0.038, "step": 142190 }, { "epoch": 0.92, "learning_rate": 0.0001623311410444245, "loss": 0.0413, "step": 142200 }, { "epoch": 0.92, "learning_rate": 0.00016232145969006755, "loss": 0.0314, "step": 142210 }, { "epoch": 0.92, "learning_rate": 0.0001623117783357106, "loss": 0.0441, "step": 142220 }, { "epoch": 0.92, "learning_rate": 0.00016230209698135369, "loss": 0.0409, "step": 142230 }, { "epoch": 0.92, "learning_rate": 0.00016229241562699677, "loss": 0.0369, "step": 142240 }, { "epoch": 0.92, "learning_rate": 0.00016228273427263984, "loss": 0.0365, "step": 142250 }, { "epoch": 0.92, "learning_rate": 0.0001622730529182829, "loss": 0.0419, "step": 142260 }, { "epoch": 0.92, "learning_rate": 0.00016226337156392598, "loss": 0.0382, "step": 142270 }, { "epoch": 0.92, "learning_rate": 0.00016225369020956903, "loss": 0.0383, "step": 142280 }, { "epoch": 0.92, "learning_rate": 0.00016224400885521208, "loss": 0.042, "step": 142290 }, { "epoch": 0.92, "learning_rate": 0.00016223432750085516, "loss": 0.0407, "step": 142300 }, { "epoch": 0.92, "learning_rate": 0.00016222464614649824, "loss": 0.0428, "step": 142310 }, { "epoch": 0.92, "learning_rate": 0.00016221496479214132, "loss": 0.0449, "step": 142320 }, { "epoch": 0.92, "learning_rate": 0.00016220528343778437, "loss": 0.0442, "step": 142330 }, { "epoch": 0.92, "learning_rate": 0.00016219560208342745, "loss": 0.0321, "step": 142340 }, { "epoch": 0.92, "learning_rate": 0.0001621859207290705, "loss": 0.0393, "step": 142350 }, { "epoch": 0.92, "learning_rate": 0.00016217623937471356, "loss": 0.0392, "step": 142360 }, { "epoch": 0.92, "learning_rate": 0.00016216655802035664, "loss": 0.0379, "step": 142370 }, { "epoch": 0.92, "learning_rate": 0.00016215687666599972, "loss": 0.04, "step": 142380 }, { "epoch": 0.92, "learning_rate": 0.0001621471953116428, "loss": 0.0429, "step": 142390 }, { "epoch": 0.92, "learning_rate": 0.00016213751395728585, "loss": 0.0362, "step": 142400 }, { "epoch": 0.92, "learning_rate": 0.00016212783260292893, "loss": 0.0364, "step": 142410 }, { "epoch": 0.92, "learning_rate": 0.00016211815124857196, "loss": 0.0349, "step": 142420 }, { "epoch": 0.92, "learning_rate": 0.00016210846989421504, "loss": 0.0455, "step": 142430 }, { "epoch": 0.92, "learning_rate": 0.00016209878853985812, "loss": 0.0393, "step": 142440 }, { "epoch": 0.92, "learning_rate": 0.0001620891071855012, "loss": 0.0398, "step": 142450 }, { "epoch": 0.92, "learning_rate": 0.00016207942583114425, "loss": 0.0397, "step": 142460 }, { "epoch": 0.92, "learning_rate": 0.00016206974447678733, "loss": 0.0444, "step": 142470 }, { "epoch": 0.92, "learning_rate": 0.0001620600631224304, "loss": 0.036, "step": 142480 }, { "epoch": 0.92, "learning_rate": 0.00016205038176807343, "loss": 0.0432, "step": 142490 }, { "epoch": 0.92, "learning_rate": 0.00016204070041371651, "loss": 0.0408, "step": 142500 }, { "epoch": 0.92, "learning_rate": 0.0001620310190593596, "loss": 0.0394, "step": 142510 }, { "epoch": 0.92, "learning_rate": 0.00016202133770500267, "loss": 0.0405, "step": 142520 }, { "epoch": 0.92, "learning_rate": 0.00016201165635064573, "loss": 0.0427, "step": 142530 }, { "epoch": 0.92, "learning_rate": 0.0001620019749962888, "loss": 0.0431, "step": 142540 }, { "epoch": 0.92, "learning_rate": 0.00016199229364193189, "loss": 0.046, "step": 142550 }, { "epoch": 0.92, "learning_rate": 0.0001619826122875749, "loss": 0.0399, "step": 142560 }, { "epoch": 0.92, "learning_rate": 0.000161972930933218, "loss": 0.0423, "step": 142570 }, { "epoch": 0.92, "learning_rate": 0.00016196324957886107, "loss": 0.0438, "step": 142580 }, { "epoch": 0.92, "learning_rate": 0.00016195356822450415, "loss": 0.0382, "step": 142590 }, { "epoch": 0.92, "learning_rate": 0.0001619438868701472, "loss": 0.0414, "step": 142600 }, { "epoch": 0.92, "learning_rate": 0.00016193420551579028, "loss": 0.0441, "step": 142610 }, { "epoch": 0.92, "learning_rate": 0.00016192452416143336, "loss": 0.0392, "step": 142620 }, { "epoch": 0.92, "learning_rate": 0.0001619148428070764, "loss": 0.0503, "step": 142630 }, { "epoch": 0.92, "learning_rate": 0.00016190516145271947, "loss": 0.0441, "step": 142640 }, { "epoch": 0.92, "learning_rate": 0.00016189548009836255, "loss": 0.0426, "step": 142650 }, { "epoch": 0.92, "learning_rate": 0.0001618857987440056, "loss": 0.0556, "step": 142660 }, { "epoch": 0.92, "learning_rate": 0.00016187611738964868, "loss": 0.043, "step": 142670 }, { "epoch": 0.92, "learning_rate": 0.00016186643603529176, "loss": 0.0408, "step": 142680 }, { "epoch": 0.92, "learning_rate": 0.00016185675468093484, "loss": 0.0395, "step": 142690 }, { "epoch": 0.92, "learning_rate": 0.00016184707332657787, "loss": 0.0377, "step": 142700 }, { "epoch": 0.92, "learning_rate": 0.00016183739197222095, "loss": 0.0443, "step": 142710 }, { "epoch": 0.92, "learning_rate": 0.00016182771061786403, "loss": 0.0464, "step": 142720 }, { "epoch": 0.92, "learning_rate": 0.00016181802926350708, "loss": 0.0402, "step": 142730 }, { "epoch": 0.92, "learning_rate": 0.00016180834790915016, "loss": 0.0448, "step": 142740 }, { "epoch": 0.92, "learning_rate": 0.00016179866655479324, "loss": 0.0362, "step": 142750 }, { "epoch": 0.92, "learning_rate": 0.00016178898520043632, "loss": 0.0369, "step": 142760 }, { "epoch": 0.92, "learning_rate": 0.00016177930384607934, "loss": 0.0371, "step": 142770 }, { "epoch": 0.92, "learning_rate": 0.00016176962249172242, "loss": 0.0391, "step": 142780 }, { "epoch": 0.92, "learning_rate": 0.0001617599411373655, "loss": 0.0348, "step": 142790 }, { "epoch": 0.92, "learning_rate": 0.00016175025978300856, "loss": 0.0362, "step": 142800 }, { "epoch": 0.92, "learning_rate": 0.00016174057842865164, "loss": 0.0419, "step": 142810 }, { "epoch": 0.92, "learning_rate": 0.00016173089707429472, "loss": 0.0346, "step": 142820 }, { "epoch": 0.92, "learning_rate": 0.00016172121571993777, "loss": 0.0406, "step": 142830 }, { "epoch": 0.92, "learning_rate": 0.00016171153436558082, "loss": 0.041, "step": 142840 }, { "epoch": 0.92, "learning_rate": 0.0001617018530112239, "loss": 0.036, "step": 142850 }, { "epoch": 0.92, "learning_rate": 0.00016169217165686695, "loss": 0.0447, "step": 142860 }, { "epoch": 0.92, "learning_rate": 0.00016168249030251003, "loss": 0.0337, "step": 142870 }, { "epoch": 0.92, "learning_rate": 0.0001616728089481531, "loss": 0.0296, "step": 142880 }, { "epoch": 0.92, "learning_rate": 0.0001616631275937962, "loss": 0.0374, "step": 142890 }, { "epoch": 0.92, "learning_rate": 0.00016165344623943925, "loss": 0.0399, "step": 142900 }, { "epoch": 0.92, "learning_rate": 0.0001616437648850823, "loss": 0.0385, "step": 142910 }, { "epoch": 0.92, "learning_rate": 0.00016163408353072538, "loss": 0.0396, "step": 142920 }, { "epoch": 0.92, "learning_rate": 0.00016162440217636843, "loss": 0.0379, "step": 142930 }, { "epoch": 0.92, "learning_rate": 0.0001616147208220115, "loss": 0.0378, "step": 142940 }, { "epoch": 0.92, "learning_rate": 0.0001616050394676546, "loss": 0.035, "step": 142950 }, { "epoch": 0.92, "learning_rate": 0.00016159535811329767, "loss": 0.0365, "step": 142960 }, { "epoch": 0.92, "learning_rate": 0.00016158567675894072, "loss": 0.0483, "step": 142970 }, { "epoch": 0.92, "learning_rate": 0.00016157599540458378, "loss": 0.0472, "step": 142980 }, { "epoch": 0.92, "learning_rate": 0.00016156631405022685, "loss": 0.0386, "step": 142990 }, { "epoch": 0.92, "learning_rate": 0.0001615566326958699, "loss": 0.0368, "step": 143000 }, { "epoch": 0.92, "eval_cer": 0.9198716529205739, "eval_loss": 0.027006572112441063, "eval_runtime": 120.0134, "eval_samples_per_second": 16.665, "eval_steps_per_second": 4.166, "step": 143000 }, { "epoch": 0.92, "learning_rate": 0.000161546951341513, "loss": 0.0397, "step": 143010 }, { "epoch": 0.92, "learning_rate": 0.00016153726998715607, "loss": 0.0348, "step": 143020 }, { "epoch": 0.92, "learning_rate": 0.00016152758863279912, "loss": 0.0433, "step": 143030 }, { "epoch": 0.92, "learning_rate": 0.0001615179072784422, "loss": 0.0365, "step": 143040 }, { "epoch": 0.92, "learning_rate": 0.00016150822592408525, "loss": 0.0396, "step": 143050 }, { "epoch": 0.92, "learning_rate": 0.0001614985445697283, "loss": 0.0414, "step": 143060 }, { "epoch": 0.92, "learning_rate": 0.00016148886321537138, "loss": 0.0454, "step": 143070 }, { "epoch": 0.92, "learning_rate": 0.00016147918186101446, "loss": 0.0419, "step": 143080 }, { "epoch": 0.92, "learning_rate": 0.00016146950050665754, "loss": 0.0407, "step": 143090 }, { "epoch": 0.92, "learning_rate": 0.0001614598191523006, "loss": 0.0374, "step": 143100 }, { "epoch": 0.92, "learning_rate": 0.00016145013779794368, "loss": 0.0508, "step": 143110 }, { "epoch": 0.92, "learning_rate": 0.00016144045644358673, "loss": 0.0552, "step": 143120 }, { "epoch": 0.92, "learning_rate": 0.00016143077508922978, "loss": 0.04, "step": 143130 }, { "epoch": 0.92, "learning_rate": 0.00016142109373487286, "loss": 0.0369, "step": 143140 }, { "epoch": 0.92, "learning_rate": 0.00016141141238051594, "loss": 0.0418, "step": 143150 }, { "epoch": 0.92, "learning_rate": 0.00016140173102615902, "loss": 0.0399, "step": 143160 }, { "epoch": 0.92, "learning_rate": 0.00016139204967180207, "loss": 0.0367, "step": 143170 }, { "epoch": 0.92, "learning_rate": 0.00016138236831744515, "loss": 0.0384, "step": 143180 }, { "epoch": 0.92, "learning_rate": 0.0001613726869630882, "loss": 0.0348, "step": 143190 }, { "epoch": 0.92, "learning_rate": 0.00016136300560873126, "loss": 0.0413, "step": 143200 }, { "epoch": 0.92, "learning_rate": 0.00016135332425437434, "loss": 0.0456, "step": 143210 }, { "epoch": 0.92, "learning_rate": 0.00016134364290001742, "loss": 0.0381, "step": 143220 }, { "epoch": 0.92, "learning_rate": 0.00016133396154566047, "loss": 0.0351, "step": 143230 }, { "epoch": 0.92, "learning_rate": 0.00016132428019130355, "loss": 0.0382, "step": 143240 }, { "epoch": 0.92, "learning_rate": 0.00016131459883694663, "loss": 0.0405, "step": 143250 }, { "epoch": 0.92, "learning_rate": 0.00016130491748258966, "loss": 0.0371, "step": 143260 }, { "epoch": 0.92, "learning_rate": 0.00016129523612823274, "loss": 0.0342, "step": 143270 }, { "epoch": 0.92, "learning_rate": 0.00016128555477387582, "loss": 0.042, "step": 143280 }, { "epoch": 0.92, "learning_rate": 0.0001612758734195189, "loss": 0.0431, "step": 143290 }, { "epoch": 0.92, "learning_rate": 0.00016126619206516195, "loss": 0.0401, "step": 143300 }, { "epoch": 0.92, "learning_rate": 0.00016125651071080503, "loss": 0.0442, "step": 143310 }, { "epoch": 0.93, "learning_rate": 0.0001612468293564481, "loss": 0.0428, "step": 143320 }, { "epoch": 0.93, "learning_rate": 0.00016123714800209113, "loss": 0.0359, "step": 143330 }, { "epoch": 0.93, "learning_rate": 0.00016122746664773421, "loss": 0.0344, "step": 143340 }, { "epoch": 0.93, "learning_rate": 0.0001612177852933773, "loss": 0.0512, "step": 143350 }, { "epoch": 0.93, "learning_rate": 0.00016120810393902037, "loss": 0.0353, "step": 143360 }, { "epoch": 0.93, "learning_rate": 0.00016119842258466343, "loss": 0.0436, "step": 143370 }, { "epoch": 0.93, "learning_rate": 0.0001611887412303065, "loss": 0.0404, "step": 143380 }, { "epoch": 0.93, "learning_rate": 0.00016117905987594959, "loss": 0.0407, "step": 143390 }, { "epoch": 0.93, "learning_rate": 0.0001611693785215926, "loss": 0.0398, "step": 143400 }, { "epoch": 0.93, "learning_rate": 0.0001611596971672357, "loss": 0.0436, "step": 143410 }, { "epoch": 0.93, "learning_rate": 0.00016115001581287877, "loss": 0.037, "step": 143420 }, { "epoch": 0.93, "learning_rate": 0.00016114033445852182, "loss": 0.0399, "step": 143430 }, { "epoch": 0.93, "learning_rate": 0.0001611306531041649, "loss": 0.0351, "step": 143440 }, { "epoch": 0.93, "learning_rate": 0.00016112097174980798, "loss": 0.0434, "step": 143450 }, { "epoch": 0.93, "learning_rate": 0.00016111129039545106, "loss": 0.037, "step": 143460 }, { "epoch": 0.93, "learning_rate": 0.0001611016090410941, "loss": 0.0389, "step": 143470 }, { "epoch": 0.93, "learning_rate": 0.00016109192768673717, "loss": 0.0377, "step": 143480 }, { "epoch": 0.93, "learning_rate": 0.00016108224633238025, "loss": 0.0402, "step": 143490 }, { "epoch": 0.93, "learning_rate": 0.0001610725649780233, "loss": 0.0384, "step": 143500 }, { "epoch": 0.93, "learning_rate": 0.00016106288362366638, "loss": 0.0392, "step": 143510 }, { "epoch": 0.93, "learning_rate": 0.00016105320226930946, "loss": 0.0375, "step": 143520 }, { "epoch": 0.93, "learning_rate": 0.00016104352091495254, "loss": 0.0389, "step": 143530 }, { "epoch": 0.93, "learning_rate": 0.00016103383956059557, "loss": 0.043, "step": 143540 }, { "epoch": 0.93, "learning_rate": 0.00016102415820623865, "loss": 0.0403, "step": 143550 }, { "epoch": 0.93, "learning_rate": 0.00016101447685188173, "loss": 0.0367, "step": 143560 }, { "epoch": 0.93, "learning_rate": 0.00016100479549752478, "loss": 0.0363, "step": 143570 }, { "epoch": 0.93, "learning_rate": 0.00016099511414316786, "loss": 0.0425, "step": 143580 }, { "epoch": 0.93, "learning_rate": 0.00016098543278881094, "loss": 0.0399, "step": 143590 }, { "epoch": 0.93, "learning_rate": 0.000160975751434454, "loss": 0.0478, "step": 143600 }, { "epoch": 0.93, "learning_rate": 0.00016096607008009704, "loss": 0.0388, "step": 143610 }, { "epoch": 0.93, "learning_rate": 0.00016095638872574012, "loss": 0.0382, "step": 143620 }, { "epoch": 0.93, "learning_rate": 0.00016094670737138318, "loss": 0.042, "step": 143630 }, { "epoch": 0.93, "learning_rate": 0.00016093702601702626, "loss": 0.0418, "step": 143640 }, { "epoch": 0.93, "learning_rate": 0.00016092734466266934, "loss": 0.0413, "step": 143650 }, { "epoch": 0.93, "learning_rate": 0.00016091766330831241, "loss": 0.0444, "step": 143660 }, { "epoch": 0.93, "learning_rate": 0.00016090798195395547, "loss": 0.039, "step": 143670 }, { "epoch": 0.93, "learning_rate": 0.00016089830059959852, "loss": 0.0518, "step": 143680 }, { "epoch": 0.93, "learning_rate": 0.0001608886192452416, "loss": 0.0332, "step": 143690 }, { "epoch": 0.93, "learning_rate": 0.00016087893789088465, "loss": 0.0358, "step": 143700 }, { "epoch": 0.93, "learning_rate": 0.00016086925653652773, "loss": 0.0397, "step": 143710 }, { "epoch": 0.93, "learning_rate": 0.0001608595751821708, "loss": 0.0398, "step": 143720 }, { "epoch": 0.93, "learning_rate": 0.0001608498938278139, "loss": 0.0357, "step": 143730 }, { "epoch": 0.93, "learning_rate": 0.00016084021247345694, "loss": 0.0418, "step": 143740 }, { "epoch": 0.93, "learning_rate": 0.0001608305311191, "loss": 0.0383, "step": 143750 }, { "epoch": 0.93, "learning_rate": 0.00016082084976474308, "loss": 0.0452, "step": 143760 }, { "epoch": 0.93, "learning_rate": 0.00016081116841038613, "loss": 0.0369, "step": 143770 }, { "epoch": 0.93, "learning_rate": 0.0001608014870560292, "loss": 0.037, "step": 143780 }, { "epoch": 0.93, "learning_rate": 0.0001607918057016723, "loss": 0.0373, "step": 143790 }, { "epoch": 0.93, "learning_rate": 0.00016078212434731534, "loss": 0.0418, "step": 143800 }, { "epoch": 0.93, "learning_rate": 0.00016077244299295842, "loss": 0.0365, "step": 143810 }, { "epoch": 0.93, "learning_rate": 0.00016076276163860147, "loss": 0.035, "step": 143820 }, { "epoch": 0.93, "learning_rate": 0.00016075308028424453, "loss": 0.0432, "step": 143830 }, { "epoch": 0.93, "learning_rate": 0.0001607433989298876, "loss": 0.0406, "step": 143840 }, { "epoch": 0.93, "learning_rate": 0.0001607337175755307, "loss": 0.0457, "step": 143850 }, { "epoch": 0.93, "learning_rate": 0.00016072403622117377, "loss": 0.0332, "step": 143860 }, { "epoch": 0.93, "learning_rate": 0.00016071435486681682, "loss": 0.0391, "step": 143870 }, { "epoch": 0.93, "learning_rate": 0.0001607046735124599, "loss": 0.0382, "step": 143880 }, { "epoch": 0.93, "learning_rate": 0.00016069499215810295, "loss": 0.0327, "step": 143890 }, { "epoch": 0.93, "learning_rate": 0.000160685310803746, "loss": 0.0404, "step": 143900 }, { "epoch": 0.93, "learning_rate": 0.00016067562944938908, "loss": 0.0359, "step": 143910 }, { "epoch": 0.93, "learning_rate": 0.00016066594809503216, "loss": 0.0426, "step": 143920 }, { "epoch": 0.93, "learning_rate": 0.00016065626674067524, "loss": 0.0376, "step": 143930 }, { "epoch": 0.93, "learning_rate": 0.0001606465853863183, "loss": 0.0376, "step": 143940 }, { "epoch": 0.93, "learning_rate": 0.00016063690403196138, "loss": 0.0394, "step": 143950 }, { "epoch": 0.93, "learning_rate": 0.00016062722267760443, "loss": 0.0343, "step": 143960 }, { "epoch": 0.93, "learning_rate": 0.00016061754132324748, "loss": 0.0381, "step": 143970 }, { "epoch": 0.93, "learning_rate": 0.00016060785996889056, "loss": 0.0397, "step": 143980 }, { "epoch": 0.93, "learning_rate": 0.00016059817861453364, "loss": 0.0359, "step": 143990 }, { "epoch": 0.93, "learning_rate": 0.0001605884972601767, "loss": 0.0365, "step": 144000 }, { "epoch": 0.93, "eval_cer": 0.9198861145633261, "eval_loss": 0.02664892189204693, "eval_runtime": 119.7778, "eval_samples_per_second": 16.698, "eval_steps_per_second": 4.174, "step": 144000 }, { "epoch": 0.93, "learning_rate": 0.00016057881590581977, "loss": 0.0456, "step": 144010 }, { "epoch": 0.93, "learning_rate": 0.00016056913455146285, "loss": 0.0338, "step": 144020 }, { "epoch": 0.93, "learning_rate": 0.00016055945319710588, "loss": 0.0327, "step": 144030 }, { "epoch": 0.93, "learning_rate": 0.00016054977184274896, "loss": 0.0383, "step": 144040 }, { "epoch": 0.93, "learning_rate": 0.00016054009048839204, "loss": 0.0402, "step": 144050 }, { "epoch": 0.93, "learning_rate": 0.00016053040913403512, "loss": 0.0422, "step": 144060 }, { "epoch": 0.93, "learning_rate": 0.00016052072777967817, "loss": 0.036, "step": 144070 }, { "epoch": 0.93, "learning_rate": 0.00016051104642532125, "loss": 0.0485, "step": 144080 }, { "epoch": 0.93, "learning_rate": 0.00016050136507096433, "loss": 0.0416, "step": 144090 }, { "epoch": 0.93, "learning_rate": 0.00016049168371660736, "loss": 0.0364, "step": 144100 }, { "epoch": 0.93, "learning_rate": 0.00016048200236225044, "loss": 0.0387, "step": 144110 }, { "epoch": 0.93, "learning_rate": 0.00016047232100789352, "loss": 0.0454, "step": 144120 }, { "epoch": 0.93, "learning_rate": 0.0001604626396535366, "loss": 0.0461, "step": 144130 }, { "epoch": 0.93, "learning_rate": 0.00016045295829917965, "loss": 0.0389, "step": 144140 }, { "epoch": 0.93, "learning_rate": 0.00016044327694482273, "loss": 0.0452, "step": 144150 }, { "epoch": 0.93, "learning_rate": 0.0001604335955904658, "loss": 0.0482, "step": 144160 }, { "epoch": 0.93, "learning_rate": 0.00016042391423610883, "loss": 0.0384, "step": 144170 }, { "epoch": 0.93, "learning_rate": 0.00016041423288175191, "loss": 0.0374, "step": 144180 }, { "epoch": 0.93, "learning_rate": 0.000160404551527395, "loss": 0.0389, "step": 144190 }, { "epoch": 0.93, "learning_rate": 0.00016039487017303805, "loss": 0.0372, "step": 144200 }, { "epoch": 0.93, "learning_rate": 0.00016038518881868113, "loss": 0.0467, "step": 144210 }, { "epoch": 0.93, "learning_rate": 0.0001603755074643242, "loss": 0.0448, "step": 144220 }, { "epoch": 0.93, "learning_rate": 0.00016036582610996729, "loss": 0.0406, "step": 144230 }, { "epoch": 0.93, "learning_rate": 0.0001603561447556103, "loss": 0.0429, "step": 144240 }, { "epoch": 0.93, "learning_rate": 0.0001603464634012534, "loss": 0.0404, "step": 144250 }, { "epoch": 0.93, "learning_rate": 0.00016033678204689647, "loss": 0.0413, "step": 144260 }, { "epoch": 0.93, "learning_rate": 0.00016032710069253952, "loss": 0.0374, "step": 144270 }, { "epoch": 0.93, "learning_rate": 0.0001603174193381826, "loss": 0.0447, "step": 144280 }, { "epoch": 0.93, "learning_rate": 0.00016030773798382568, "loss": 0.0401, "step": 144290 }, { "epoch": 0.93, "learning_rate": 0.00016029805662946876, "loss": 0.0418, "step": 144300 }, { "epoch": 0.93, "learning_rate": 0.0001602883752751118, "loss": 0.0365, "step": 144310 }, { "epoch": 0.93, "learning_rate": 0.00016027869392075487, "loss": 0.0383, "step": 144320 }, { "epoch": 0.93, "learning_rate": 0.00016026901256639795, "loss": 0.0408, "step": 144330 }, { "epoch": 0.93, "learning_rate": 0.000160259331212041, "loss": 0.0386, "step": 144340 }, { "epoch": 0.93, "learning_rate": 0.00016024964985768408, "loss": 0.0379, "step": 144350 }, { "epoch": 0.93, "learning_rate": 0.00016023996850332716, "loss": 0.0382, "step": 144360 }, { "epoch": 0.93, "learning_rate": 0.00016023028714897024, "loss": 0.0415, "step": 144370 }, { "epoch": 0.93, "learning_rate": 0.00016022060579461327, "loss": 0.05, "step": 144380 }, { "epoch": 0.93, "learning_rate": 0.00016021092444025635, "loss": 0.0368, "step": 144390 }, { "epoch": 0.93, "learning_rate": 0.0001602012430858994, "loss": 0.0354, "step": 144400 }, { "epoch": 0.93, "learning_rate": 0.00016019156173154248, "loss": 0.0369, "step": 144410 }, { "epoch": 0.93, "learning_rate": 0.00016018188037718556, "loss": 0.0413, "step": 144420 }, { "epoch": 0.93, "learning_rate": 0.00016017219902282864, "loss": 0.0375, "step": 144430 }, { "epoch": 0.93, "learning_rate": 0.0001601625176684717, "loss": 0.0405, "step": 144440 }, { "epoch": 0.93, "learning_rate": 0.00016015283631411474, "loss": 0.0321, "step": 144450 }, { "epoch": 0.93, "learning_rate": 0.00016014315495975782, "loss": 0.0429, "step": 144460 }, { "epoch": 0.93, "learning_rate": 0.00016013347360540088, "loss": 0.0383, "step": 144470 }, { "epoch": 0.93, "learning_rate": 0.00016012379225104395, "loss": 0.0328, "step": 144480 }, { "epoch": 0.93, "learning_rate": 0.00016011411089668703, "loss": 0.0393, "step": 144490 }, { "epoch": 0.93, "learning_rate": 0.00016010442954233011, "loss": 0.0366, "step": 144500 }, { "epoch": 0.93, "learning_rate": 0.00016009474818797317, "loss": 0.0413, "step": 144510 }, { "epoch": 0.93, "learning_rate": 0.00016008506683361622, "loss": 0.038, "step": 144520 }, { "epoch": 0.93, "learning_rate": 0.0001600753854792593, "loss": 0.0349, "step": 144530 }, { "epoch": 0.93, "learning_rate": 0.00016006570412490235, "loss": 0.0393, "step": 144540 }, { "epoch": 0.93, "learning_rate": 0.00016005602277054543, "loss": 0.0369, "step": 144550 }, { "epoch": 0.93, "learning_rate": 0.0001600463414161885, "loss": 0.0377, "step": 144560 }, { "epoch": 0.93, "learning_rate": 0.0001600366600618316, "loss": 0.0384, "step": 144570 }, { "epoch": 0.93, "learning_rate": 0.00016002697870747464, "loss": 0.0426, "step": 144580 }, { "epoch": 0.93, "learning_rate": 0.0001600172973531177, "loss": 0.0352, "step": 144590 }, { "epoch": 0.93, "learning_rate": 0.00016000761599876075, "loss": 0.0377, "step": 144600 }, { "epoch": 0.93, "learning_rate": 0.00015999793464440383, "loss": 0.0369, "step": 144610 }, { "epoch": 0.93, "learning_rate": 0.0001599882532900469, "loss": 0.0399, "step": 144620 }, { "epoch": 0.93, "learning_rate": 0.00015997857193569, "loss": 0.0386, "step": 144630 }, { "epoch": 0.93, "learning_rate": 0.00015996889058133304, "loss": 0.0369, "step": 144640 }, { "epoch": 0.93, "learning_rate": 0.00015995920922697612, "loss": 0.0404, "step": 144650 }, { "epoch": 0.93, "learning_rate": 0.00015994952787261917, "loss": 0.038, "step": 144660 }, { "epoch": 0.93, "learning_rate": 0.00015993984651826223, "loss": 0.0346, "step": 144670 }, { "epoch": 0.93, "learning_rate": 0.0001599301651639053, "loss": 0.0327, "step": 144680 }, { "epoch": 0.93, "learning_rate": 0.0001599204838095484, "loss": 0.0373, "step": 144690 }, { "epoch": 0.93, "learning_rate": 0.00015991080245519147, "loss": 0.0465, "step": 144700 }, { "epoch": 0.93, "learning_rate": 0.00015990112110083452, "loss": 0.0408, "step": 144710 }, { "epoch": 0.93, "learning_rate": 0.0001598914397464776, "loss": 0.0397, "step": 144720 }, { "epoch": 0.93, "learning_rate": 0.00015988175839212065, "loss": 0.0466, "step": 144730 }, { "epoch": 0.93, "learning_rate": 0.0001598720770377637, "loss": 0.043, "step": 144740 }, { "epoch": 0.93, "learning_rate": 0.00015986239568340678, "loss": 0.0415, "step": 144750 }, { "epoch": 0.93, "learning_rate": 0.00015985271432904986, "loss": 0.0388, "step": 144760 }, { "epoch": 0.93, "learning_rate": 0.00015984303297469294, "loss": 0.0413, "step": 144770 }, { "epoch": 0.93, "learning_rate": 0.000159833351620336, "loss": 0.0421, "step": 144780 }, { "epoch": 0.93, "learning_rate": 0.00015982367026597908, "loss": 0.0424, "step": 144790 }, { "epoch": 0.93, "learning_rate": 0.0001598139889116221, "loss": 0.0413, "step": 144800 }, { "epoch": 0.93, "learning_rate": 0.00015980430755726518, "loss": 0.0379, "step": 144810 }, { "epoch": 0.93, "learning_rate": 0.00015979462620290826, "loss": 0.0367, "step": 144820 }, { "epoch": 0.93, "learning_rate": 0.00015978494484855134, "loss": 0.0352, "step": 144830 }, { "epoch": 0.93, "learning_rate": 0.0001597752634941944, "loss": 0.0395, "step": 144840 }, { "epoch": 0.93, "learning_rate": 0.00015976558213983747, "loss": 0.0342, "step": 144850 }, { "epoch": 0.93, "learning_rate": 0.00015975590078548055, "loss": 0.0347, "step": 144860 }, { "epoch": 0.94, "learning_rate": 0.00015974621943112358, "loss": 0.0358, "step": 144870 }, { "epoch": 0.94, "learning_rate": 0.00015973653807676666, "loss": 0.0407, "step": 144880 }, { "epoch": 0.94, "learning_rate": 0.00015972685672240974, "loss": 0.0399, "step": 144890 }, { "epoch": 0.94, "learning_rate": 0.00015971717536805282, "loss": 0.0343, "step": 144900 }, { "epoch": 0.94, "learning_rate": 0.00015970749401369587, "loss": 0.042, "step": 144910 }, { "epoch": 0.94, "learning_rate": 0.00015969781265933895, "loss": 0.0352, "step": 144920 }, { "epoch": 0.94, "learning_rate": 0.00015968813130498203, "loss": 0.0401, "step": 144930 }, { "epoch": 0.94, "learning_rate": 0.00015967844995062506, "loss": 0.0418, "step": 144940 }, { "epoch": 0.94, "learning_rate": 0.00015966876859626814, "loss": 0.0414, "step": 144950 }, { "epoch": 0.94, "learning_rate": 0.00015965908724191122, "loss": 0.0352, "step": 144960 }, { "epoch": 0.94, "learning_rate": 0.0001596494058875543, "loss": 0.0465, "step": 144970 }, { "epoch": 0.94, "learning_rate": 0.00015963972453319735, "loss": 0.0421, "step": 144980 }, { "epoch": 0.94, "learning_rate": 0.00015963004317884043, "loss": 0.0422, "step": 144990 }, { "epoch": 0.94, "learning_rate": 0.0001596203618244835, "loss": 0.0413, "step": 145000 }, { "epoch": 0.94, "eval_cer": 0.9198535758671337, "eval_loss": 0.02679886296391487, "eval_runtime": 119.8861, "eval_samples_per_second": 16.682, "eval_steps_per_second": 4.171, "step": 145000 }, { "epoch": 0.94, "learning_rate": 0.00015961068047012653, "loss": 0.0407, "step": 145010 }, { "epoch": 0.94, "learning_rate": 0.0001596009991157696, "loss": 0.0393, "step": 145020 }, { "epoch": 0.94, "learning_rate": 0.0001595913177614127, "loss": 0.0387, "step": 145030 }, { "epoch": 0.94, "learning_rate": 0.00015958163640705575, "loss": 0.0418, "step": 145040 }, { "epoch": 0.94, "learning_rate": 0.00015957195505269883, "loss": 0.041, "step": 145050 }, { "epoch": 0.94, "learning_rate": 0.0001595622736983419, "loss": 0.0368, "step": 145060 }, { "epoch": 0.94, "learning_rate": 0.00015955259234398499, "loss": 0.0405, "step": 145070 }, { "epoch": 0.94, "learning_rate": 0.000159542910989628, "loss": 0.0362, "step": 145080 }, { "epoch": 0.94, "learning_rate": 0.0001595332296352711, "loss": 0.0396, "step": 145090 }, { "epoch": 0.94, "learning_rate": 0.00015952354828091417, "loss": 0.0383, "step": 145100 }, { "epoch": 0.94, "learning_rate": 0.00015951386692655722, "loss": 0.0351, "step": 145110 }, { "epoch": 0.94, "learning_rate": 0.0001595041855722003, "loss": 0.0343, "step": 145120 }, { "epoch": 0.94, "learning_rate": 0.00015949450421784338, "loss": 0.0421, "step": 145130 }, { "epoch": 0.94, "learning_rate": 0.00015948482286348646, "loss": 0.043, "step": 145140 }, { "epoch": 0.94, "learning_rate": 0.0001594751415091295, "loss": 0.033, "step": 145150 }, { "epoch": 0.94, "learning_rate": 0.00015946546015477257, "loss": 0.038, "step": 145160 }, { "epoch": 0.94, "learning_rate": 0.00015945577880041565, "loss": 0.0382, "step": 145170 }, { "epoch": 0.94, "learning_rate": 0.0001594460974460587, "loss": 0.0414, "step": 145180 }, { "epoch": 0.94, "learning_rate": 0.00015943641609170178, "loss": 0.0449, "step": 145190 }, { "epoch": 0.94, "learning_rate": 0.00015942673473734486, "loss": 0.0379, "step": 145200 }, { "epoch": 0.94, "learning_rate": 0.0001594170533829879, "loss": 0.0391, "step": 145210 }, { "epoch": 0.94, "learning_rate": 0.00015940737202863097, "loss": 0.0336, "step": 145220 }, { "epoch": 0.94, "learning_rate": 0.00015939769067427404, "loss": 0.0317, "step": 145230 }, { "epoch": 0.94, "learning_rate": 0.0001593880093199171, "loss": 0.0349, "step": 145240 }, { "epoch": 0.94, "learning_rate": 0.00015937832796556018, "loss": 0.0364, "step": 145250 }, { "epoch": 0.94, "learning_rate": 0.00015936864661120326, "loss": 0.0384, "step": 145260 }, { "epoch": 0.94, "learning_rate": 0.00015935896525684634, "loss": 0.0359, "step": 145270 }, { "epoch": 0.94, "learning_rate": 0.0001593492839024894, "loss": 0.0425, "step": 145280 }, { "epoch": 0.94, "learning_rate": 0.00015933960254813244, "loss": 0.0476, "step": 145290 }, { "epoch": 0.94, "learning_rate": 0.00015932992119377552, "loss": 0.0374, "step": 145300 }, { "epoch": 0.94, "learning_rate": 0.00015932023983941857, "loss": 0.0411, "step": 145310 }, { "epoch": 0.94, "learning_rate": 0.00015931055848506165, "loss": 0.0386, "step": 145320 }, { "epoch": 0.94, "learning_rate": 0.00015930087713070473, "loss": 0.0375, "step": 145330 }, { "epoch": 0.94, "learning_rate": 0.00015929119577634781, "loss": 0.0384, "step": 145340 }, { "epoch": 0.94, "learning_rate": 0.00015928151442199087, "loss": 0.041, "step": 145350 }, { "epoch": 0.94, "learning_rate": 0.00015927183306763392, "loss": 0.0447, "step": 145360 }, { "epoch": 0.94, "learning_rate": 0.000159262151713277, "loss": 0.0409, "step": 145370 }, { "epoch": 0.94, "learning_rate": 0.00015925247035892005, "loss": 0.0366, "step": 145380 }, { "epoch": 0.94, "learning_rate": 0.00015924278900456313, "loss": 0.0384, "step": 145390 }, { "epoch": 0.94, "learning_rate": 0.0001592331076502062, "loss": 0.0381, "step": 145400 }, { "epoch": 0.94, "learning_rate": 0.00015922342629584926, "loss": 0.0377, "step": 145410 }, { "epoch": 0.94, "learning_rate": 0.00015921374494149234, "loss": 0.0352, "step": 145420 }, { "epoch": 0.94, "learning_rate": 0.0001592040635871354, "loss": 0.0367, "step": 145430 }, { "epoch": 0.94, "learning_rate": 0.00015919438223277845, "loss": 0.0393, "step": 145440 }, { "epoch": 0.94, "learning_rate": 0.00015918470087842153, "loss": 0.0354, "step": 145450 }, { "epoch": 0.94, "learning_rate": 0.0001591750195240646, "loss": 0.0369, "step": 145460 }, { "epoch": 0.94, "learning_rate": 0.0001591653381697077, "loss": 0.0401, "step": 145470 }, { "epoch": 0.94, "learning_rate": 0.00015915565681535074, "loss": 0.0376, "step": 145480 }, { "epoch": 0.94, "learning_rate": 0.00015914597546099382, "loss": 0.0355, "step": 145490 }, { "epoch": 0.94, "learning_rate": 0.00015913629410663687, "loss": 0.0373, "step": 145500 }, { "epoch": 0.94, "learning_rate": 0.00015912661275227993, "loss": 0.0349, "step": 145510 }, { "epoch": 0.94, "learning_rate": 0.000159116931397923, "loss": 0.0382, "step": 145520 }, { "epoch": 0.94, "learning_rate": 0.00015910725004356609, "loss": 0.0364, "step": 145530 }, { "epoch": 0.94, "learning_rate": 0.00015909756868920917, "loss": 0.0359, "step": 145540 }, { "epoch": 0.94, "learning_rate": 0.00015908788733485222, "loss": 0.0415, "step": 145550 }, { "epoch": 0.94, "learning_rate": 0.0001590782059804953, "loss": 0.0415, "step": 145560 }, { "epoch": 0.94, "learning_rate": 0.00015906852462613835, "loss": 0.0291, "step": 145570 }, { "epoch": 0.94, "learning_rate": 0.0001590588432717814, "loss": 0.0379, "step": 145580 }, { "epoch": 0.94, "learning_rate": 0.00015904916191742448, "loss": 0.0338, "step": 145590 }, { "epoch": 0.94, "learning_rate": 0.00015903948056306756, "loss": 0.0324, "step": 145600 }, { "epoch": 0.94, "learning_rate": 0.00015902979920871062, "loss": 0.0384, "step": 145610 }, { "epoch": 0.94, "learning_rate": 0.0001590201178543537, "loss": 0.0398, "step": 145620 }, { "epoch": 0.94, "learning_rate": 0.00015901043649999678, "loss": 0.0419, "step": 145630 }, { "epoch": 0.94, "learning_rate": 0.0001590007551456398, "loss": 0.0406, "step": 145640 }, { "epoch": 0.94, "learning_rate": 0.00015899107379128288, "loss": 0.041, "step": 145650 }, { "epoch": 0.94, "learning_rate": 0.00015898139243692596, "loss": 0.0367, "step": 145660 }, { "epoch": 0.94, "learning_rate": 0.00015897171108256904, "loss": 0.0377, "step": 145670 }, { "epoch": 0.94, "learning_rate": 0.0001589620297282121, "loss": 0.0447, "step": 145680 }, { "epoch": 0.94, "learning_rate": 0.00015895234837385517, "loss": 0.0413, "step": 145690 }, { "epoch": 0.94, "learning_rate": 0.00015894266701949825, "loss": 0.0413, "step": 145700 }, { "epoch": 0.94, "learning_rate": 0.00015893298566514128, "loss": 0.0453, "step": 145710 }, { "epoch": 0.94, "learning_rate": 0.00015892330431078436, "loss": 0.0473, "step": 145720 }, { "epoch": 0.94, "learning_rate": 0.00015891362295642744, "loss": 0.0369, "step": 145730 }, { "epoch": 0.94, "learning_rate": 0.00015890394160207052, "loss": 0.0355, "step": 145740 }, { "epoch": 0.94, "learning_rate": 0.00015889426024771357, "loss": 0.0379, "step": 145750 }, { "epoch": 0.94, "learning_rate": 0.00015888457889335665, "loss": 0.0473, "step": 145760 }, { "epoch": 0.94, "learning_rate": 0.00015887489753899973, "loss": 0.0393, "step": 145770 }, { "epoch": 0.94, "learning_rate": 0.00015886521618464276, "loss": 0.0392, "step": 145780 }, { "epoch": 0.94, "learning_rate": 0.00015885553483028584, "loss": 0.0349, "step": 145790 }, { "epoch": 0.94, "learning_rate": 0.00015884585347592892, "loss": 0.0354, "step": 145800 }, { "epoch": 0.94, "learning_rate": 0.00015883617212157197, "loss": 0.0375, "step": 145810 }, { "epoch": 0.94, "learning_rate": 0.00015882649076721505, "loss": 0.043, "step": 145820 }, { "epoch": 0.94, "learning_rate": 0.00015881680941285813, "loss": 0.0466, "step": 145830 }, { "epoch": 0.94, "learning_rate": 0.0001588071280585012, "loss": 0.0368, "step": 145840 }, { "epoch": 0.94, "learning_rate": 0.00015879744670414423, "loss": 0.04, "step": 145850 }, { "epoch": 0.94, "learning_rate": 0.0001587877653497873, "loss": 0.0357, "step": 145860 }, { "epoch": 0.94, "learning_rate": 0.0001587780839954304, "loss": 0.0341, "step": 145870 }, { "epoch": 0.94, "learning_rate": 0.00015876840264107345, "loss": 0.036, "step": 145880 }, { "epoch": 0.94, "learning_rate": 0.00015875872128671653, "loss": 0.0398, "step": 145890 }, { "epoch": 0.94, "learning_rate": 0.0001587490399323596, "loss": 0.0409, "step": 145900 }, { "epoch": 0.94, "learning_rate": 0.00015873935857800268, "loss": 0.0395, "step": 145910 }, { "epoch": 0.94, "learning_rate": 0.0001587296772236457, "loss": 0.0399, "step": 145920 }, { "epoch": 0.94, "learning_rate": 0.0001587199958692888, "loss": 0.0368, "step": 145930 }, { "epoch": 0.94, "learning_rate": 0.00015871031451493187, "loss": 0.0389, "step": 145940 }, { "epoch": 0.94, "learning_rate": 0.00015870063316057492, "loss": 0.0423, "step": 145950 }, { "epoch": 0.94, "learning_rate": 0.000158690951806218, "loss": 0.0374, "step": 145960 }, { "epoch": 0.94, "learning_rate": 0.00015868127045186108, "loss": 0.04, "step": 145970 }, { "epoch": 0.94, "learning_rate": 0.00015867158909750413, "loss": 0.0471, "step": 145980 }, { "epoch": 0.94, "learning_rate": 0.0001586619077431472, "loss": 0.0362, "step": 145990 }, { "epoch": 0.94, "learning_rate": 0.00015865222638879027, "loss": 0.0383, "step": 146000 }, { "epoch": 0.94, "eval_cer": 0.9198969607953904, "eval_loss": 0.02613520435988903, "eval_runtime": 119.9802, "eval_samples_per_second": 16.669, "eval_steps_per_second": 4.167, "step": 146000 }, { "epoch": 0.94, "learning_rate": 0.00015864254503443332, "loss": 0.041, "step": 146010 }, { "epoch": 0.94, "learning_rate": 0.0001586328636800764, "loss": 0.0376, "step": 146020 }, { "epoch": 0.94, "learning_rate": 0.00015862318232571948, "loss": 0.0348, "step": 146030 }, { "epoch": 0.94, "learning_rate": 0.00015861350097136256, "loss": 0.0335, "step": 146040 }, { "epoch": 0.94, "learning_rate": 0.0001586038196170056, "loss": 0.0393, "step": 146050 }, { "epoch": 0.94, "learning_rate": 0.00015859413826264866, "loss": 0.0391, "step": 146060 }, { "epoch": 0.94, "learning_rate": 0.00015858445690829174, "loss": 0.0396, "step": 146070 }, { "epoch": 0.94, "learning_rate": 0.0001585747755539348, "loss": 0.0368, "step": 146080 }, { "epoch": 0.94, "learning_rate": 0.00015856509419957788, "loss": 0.0364, "step": 146090 }, { "epoch": 0.94, "learning_rate": 0.00015855541284522096, "loss": 0.044, "step": 146100 }, { "epoch": 0.94, "learning_rate": 0.00015854573149086404, "loss": 0.0406, "step": 146110 }, { "epoch": 0.94, "learning_rate": 0.0001585360501365071, "loss": 0.0359, "step": 146120 }, { "epoch": 0.94, "learning_rate": 0.00015852636878215014, "loss": 0.0351, "step": 146130 }, { "epoch": 0.94, "learning_rate": 0.00015851668742779322, "loss": 0.0391, "step": 146140 }, { "epoch": 0.94, "learning_rate": 0.00015850700607343627, "loss": 0.0406, "step": 146150 }, { "epoch": 0.94, "learning_rate": 0.00015849732471907935, "loss": 0.0369, "step": 146160 }, { "epoch": 0.94, "learning_rate": 0.00015848764336472243, "loss": 0.0386, "step": 146170 }, { "epoch": 0.94, "learning_rate": 0.0001584779620103655, "loss": 0.0453, "step": 146180 }, { "epoch": 0.94, "learning_rate": 0.00015846828065600857, "loss": 0.0349, "step": 146190 }, { "epoch": 0.94, "learning_rate": 0.00015845859930165162, "loss": 0.0346, "step": 146200 }, { "epoch": 0.94, "learning_rate": 0.00015844891794729467, "loss": 0.0395, "step": 146210 }, { "epoch": 0.94, "learning_rate": 0.00015843923659293775, "loss": 0.0397, "step": 146220 }, { "epoch": 0.94, "learning_rate": 0.00015842955523858083, "loss": 0.0361, "step": 146230 }, { "epoch": 0.94, "learning_rate": 0.0001584198738842239, "loss": 0.0286, "step": 146240 }, { "epoch": 0.94, "learning_rate": 0.00015841019252986696, "loss": 0.0442, "step": 146250 }, { "epoch": 0.94, "learning_rate": 0.00015840051117551004, "loss": 0.0383, "step": 146260 }, { "epoch": 0.94, "learning_rate": 0.0001583908298211531, "loss": 0.0431, "step": 146270 }, { "epoch": 0.94, "learning_rate": 0.00015838114846679615, "loss": 0.0406, "step": 146280 }, { "epoch": 0.94, "learning_rate": 0.00015837146711243923, "loss": 0.0365, "step": 146290 }, { "epoch": 0.94, "learning_rate": 0.0001583617857580823, "loss": 0.0392, "step": 146300 }, { "epoch": 0.94, "learning_rate": 0.0001583521044037254, "loss": 0.0317, "step": 146310 }, { "epoch": 0.94, "learning_rate": 0.00015834242304936844, "loss": 0.0324, "step": 146320 }, { "epoch": 0.94, "learning_rate": 0.00015833274169501152, "loss": 0.0369, "step": 146330 }, { "epoch": 0.94, "learning_rate": 0.00015832306034065457, "loss": 0.0403, "step": 146340 }, { "epoch": 0.94, "learning_rate": 0.00015831337898629763, "loss": 0.0366, "step": 146350 }, { "epoch": 0.94, "learning_rate": 0.0001583036976319407, "loss": 0.0383, "step": 146360 }, { "epoch": 0.94, "learning_rate": 0.00015829401627758379, "loss": 0.0375, "step": 146370 }, { "epoch": 0.94, "learning_rate": 0.00015828433492322684, "loss": 0.0404, "step": 146380 }, { "epoch": 0.94, "learning_rate": 0.00015827465356886992, "loss": 0.0429, "step": 146390 }, { "epoch": 0.94, "learning_rate": 0.000158264972214513, "loss": 0.0402, "step": 146400 }, { "epoch": 0.94, "learning_rate": 0.00015825529086015602, "loss": 0.042, "step": 146410 }, { "epoch": 0.95, "learning_rate": 0.0001582456095057991, "loss": 0.0362, "step": 146420 }, { "epoch": 0.95, "learning_rate": 0.00015823592815144218, "loss": 0.0387, "step": 146430 }, { "epoch": 0.95, "learning_rate": 0.00015822624679708526, "loss": 0.0411, "step": 146440 }, { "epoch": 0.95, "learning_rate": 0.00015821656544272832, "loss": 0.037, "step": 146450 }, { "epoch": 0.95, "learning_rate": 0.0001582068840883714, "loss": 0.0368, "step": 146460 }, { "epoch": 0.95, "learning_rate": 0.00015819720273401448, "loss": 0.0441, "step": 146470 }, { "epoch": 0.95, "learning_rate": 0.0001581875213796575, "loss": 0.0442, "step": 146480 }, { "epoch": 0.95, "learning_rate": 0.00015817784002530058, "loss": 0.0322, "step": 146490 }, { "epoch": 0.95, "learning_rate": 0.00015816815867094366, "loss": 0.043, "step": 146500 }, { "epoch": 0.95, "learning_rate": 0.00015815847731658674, "loss": 0.0403, "step": 146510 }, { "epoch": 0.95, "learning_rate": 0.0001581487959622298, "loss": 0.0372, "step": 146520 }, { "epoch": 0.95, "learning_rate": 0.00015813911460787287, "loss": 0.0388, "step": 146530 }, { "epoch": 0.95, "learning_rate": 0.00015812943325351595, "loss": 0.0347, "step": 146540 }, { "epoch": 0.95, "learning_rate": 0.00015811975189915898, "loss": 0.0416, "step": 146550 }, { "epoch": 0.95, "learning_rate": 0.00015811007054480206, "loss": 0.0401, "step": 146560 }, { "epoch": 0.95, "learning_rate": 0.00015810038919044514, "loss": 0.0455, "step": 146570 }, { "epoch": 0.95, "learning_rate": 0.00015809070783608822, "loss": 0.039, "step": 146580 }, { "epoch": 0.95, "learning_rate": 0.00015808102648173127, "loss": 0.0338, "step": 146590 }, { "epoch": 0.95, "learning_rate": 0.00015807134512737435, "loss": 0.0471, "step": 146600 }, { "epoch": 0.95, "learning_rate": 0.00015806166377301743, "loss": 0.0389, "step": 146610 }, { "epoch": 0.95, "learning_rate": 0.00015805198241866046, "loss": 0.0392, "step": 146620 }, { "epoch": 0.95, "learning_rate": 0.00015804230106430354, "loss": 0.0443, "step": 146630 }, { "epoch": 0.95, "learning_rate": 0.00015803261970994661, "loss": 0.0392, "step": 146640 }, { "epoch": 0.95, "learning_rate": 0.00015802293835558967, "loss": 0.0382, "step": 146650 }, { "epoch": 0.95, "learning_rate": 0.00015801325700123275, "loss": 0.0401, "step": 146660 }, { "epoch": 0.95, "learning_rate": 0.00015800357564687583, "loss": 0.0349, "step": 146670 }, { "epoch": 0.95, "learning_rate": 0.0001579938942925189, "loss": 0.0388, "step": 146680 }, { "epoch": 0.95, "learning_rate": 0.00015798421293816193, "loss": 0.0414, "step": 146690 }, { "epoch": 0.95, "learning_rate": 0.000157974531583805, "loss": 0.0492, "step": 146700 }, { "epoch": 0.95, "learning_rate": 0.0001579648502294481, "loss": 0.0387, "step": 146710 }, { "epoch": 0.95, "learning_rate": 0.00015795516887509114, "loss": 0.0467, "step": 146720 }, { "epoch": 0.95, "learning_rate": 0.00015794548752073422, "loss": 0.0401, "step": 146730 }, { "epoch": 0.95, "learning_rate": 0.0001579358061663773, "loss": 0.0355, "step": 146740 }, { "epoch": 0.95, "learning_rate": 0.00015792612481202038, "loss": 0.0366, "step": 146750 }, { "epoch": 0.95, "learning_rate": 0.0001579164434576634, "loss": 0.0392, "step": 146760 }, { "epoch": 0.95, "learning_rate": 0.0001579067621033065, "loss": 0.0408, "step": 146770 }, { "epoch": 0.95, "learning_rate": 0.00015789708074894957, "loss": 0.0366, "step": 146780 }, { "epoch": 0.95, "learning_rate": 0.00015788739939459262, "loss": 0.0358, "step": 146790 }, { "epoch": 0.95, "learning_rate": 0.0001578777180402357, "loss": 0.0363, "step": 146800 }, { "epoch": 0.95, "learning_rate": 0.00015786803668587878, "loss": 0.0333, "step": 146810 }, { "epoch": 0.95, "learning_rate": 0.00015785835533152183, "loss": 0.0363, "step": 146820 }, { "epoch": 0.95, "learning_rate": 0.0001578486739771649, "loss": 0.0398, "step": 146830 }, { "epoch": 0.95, "learning_rate": 0.00015783899262280797, "loss": 0.038, "step": 146840 }, { "epoch": 0.95, "learning_rate": 0.00015782931126845102, "loss": 0.0333, "step": 146850 }, { "epoch": 0.95, "learning_rate": 0.0001578196299140941, "loss": 0.0333, "step": 146860 }, { "epoch": 0.95, "learning_rate": 0.00015780994855973718, "loss": 0.0365, "step": 146870 }, { "epoch": 0.95, "learning_rate": 0.00015780026720538026, "loss": 0.0361, "step": 146880 }, { "epoch": 0.95, "learning_rate": 0.0001577905858510233, "loss": 0.0383, "step": 146890 }, { "epoch": 0.95, "learning_rate": 0.00015778090449666636, "loss": 0.0372, "step": 146900 }, { "epoch": 0.95, "learning_rate": 0.00015777122314230944, "loss": 0.0324, "step": 146910 }, { "epoch": 0.95, "learning_rate": 0.0001577615417879525, "loss": 0.0429, "step": 146920 }, { "epoch": 0.95, "learning_rate": 0.00015775186043359558, "loss": 0.0356, "step": 146930 }, { "epoch": 0.95, "learning_rate": 0.00015774217907923866, "loss": 0.0363, "step": 146940 }, { "epoch": 0.95, "learning_rate": 0.00015773249772488174, "loss": 0.0379, "step": 146950 }, { "epoch": 0.95, "learning_rate": 0.0001577228163705248, "loss": 0.0389, "step": 146960 }, { "epoch": 0.95, "learning_rate": 0.00015771313501616784, "loss": 0.0429, "step": 146970 }, { "epoch": 0.95, "learning_rate": 0.00015770345366181092, "loss": 0.0318, "step": 146980 }, { "epoch": 0.95, "learning_rate": 0.00015769377230745397, "loss": 0.0457, "step": 146990 }, { "epoch": 0.95, "learning_rate": 0.00015768409095309705, "loss": 0.0396, "step": 147000 }, { "epoch": 0.95, "eval_cer": 0.9198553835724776, "eval_loss": 0.025865597650408745, "eval_runtime": 120.0422, "eval_samples_per_second": 16.661, "eval_steps_per_second": 4.165, "step": 147000 }, { "epoch": 0.95, "learning_rate": 0.00015767440959874013, "loss": 0.039, "step": 147010 }, { "epoch": 0.95, "learning_rate": 0.00015766472824438319, "loss": 0.0467, "step": 147020 }, { "epoch": 0.95, "learning_rate": 0.00015765504689002627, "loss": 0.0376, "step": 147030 }, { "epoch": 0.95, "learning_rate": 0.00015764536553566932, "loss": 0.0404, "step": 147040 }, { "epoch": 0.95, "learning_rate": 0.00015763568418131237, "loss": 0.0419, "step": 147050 }, { "epoch": 0.95, "learning_rate": 0.00015762600282695545, "loss": 0.0366, "step": 147060 }, { "epoch": 0.95, "learning_rate": 0.00015761632147259853, "loss": 0.037, "step": 147070 }, { "epoch": 0.95, "learning_rate": 0.0001576066401182416, "loss": 0.0452, "step": 147080 }, { "epoch": 0.95, "learning_rate": 0.00015759695876388466, "loss": 0.0361, "step": 147090 }, { "epoch": 0.95, "learning_rate": 0.00015758727740952774, "loss": 0.0392, "step": 147100 }, { "epoch": 0.95, "learning_rate": 0.0001575775960551708, "loss": 0.0371, "step": 147110 }, { "epoch": 0.95, "learning_rate": 0.00015756791470081385, "loss": 0.0378, "step": 147120 }, { "epoch": 0.95, "learning_rate": 0.00015755823334645693, "loss": 0.0407, "step": 147130 }, { "epoch": 0.95, "learning_rate": 0.0001575485519921, "loss": 0.04, "step": 147140 }, { "epoch": 0.95, "learning_rate": 0.0001575388706377431, "loss": 0.0348, "step": 147150 }, { "epoch": 0.95, "learning_rate": 0.00015752918928338614, "loss": 0.0355, "step": 147160 }, { "epoch": 0.95, "learning_rate": 0.00015751950792902922, "loss": 0.0426, "step": 147170 }, { "epoch": 0.95, "learning_rate": 0.00015750982657467227, "loss": 0.0363, "step": 147180 }, { "epoch": 0.95, "learning_rate": 0.00015750014522031533, "loss": 0.0321, "step": 147190 }, { "epoch": 0.95, "learning_rate": 0.0001574904638659584, "loss": 0.0404, "step": 147200 }, { "epoch": 0.95, "learning_rate": 0.00015748078251160149, "loss": 0.0329, "step": 147210 }, { "epoch": 0.95, "learning_rate": 0.00015747110115724454, "loss": 0.0416, "step": 147220 }, { "epoch": 0.95, "learning_rate": 0.00015746141980288762, "loss": 0.0439, "step": 147230 }, { "epoch": 0.95, "learning_rate": 0.0001574517384485307, "loss": 0.0414, "step": 147240 }, { "epoch": 0.95, "learning_rate": 0.00015744205709417372, "loss": 0.0377, "step": 147250 }, { "epoch": 0.95, "learning_rate": 0.0001574323757398168, "loss": 0.0352, "step": 147260 }, { "epoch": 0.95, "learning_rate": 0.00015742269438545988, "loss": 0.0427, "step": 147270 }, { "epoch": 0.95, "learning_rate": 0.00015741301303110296, "loss": 0.0401, "step": 147280 }, { "epoch": 0.95, "learning_rate": 0.00015740333167674602, "loss": 0.0338, "step": 147290 }, { "epoch": 0.95, "learning_rate": 0.0001573936503223891, "loss": 0.0407, "step": 147300 }, { "epoch": 0.95, "learning_rate": 0.00015738396896803217, "loss": 0.0347, "step": 147310 }, { "epoch": 0.95, "learning_rate": 0.0001573742876136752, "loss": 0.0364, "step": 147320 }, { "epoch": 0.95, "learning_rate": 0.00015736460625931828, "loss": 0.0368, "step": 147330 }, { "epoch": 0.95, "learning_rate": 0.00015735492490496136, "loss": 0.0445, "step": 147340 }, { "epoch": 0.95, "learning_rate": 0.00015734524355060444, "loss": 0.0368, "step": 147350 }, { "epoch": 0.95, "learning_rate": 0.0001573355621962475, "loss": 0.0462, "step": 147360 }, { "epoch": 0.95, "learning_rate": 0.00015732588084189057, "loss": 0.034, "step": 147370 }, { "epoch": 0.95, "learning_rate": 0.00015731619948753365, "loss": 0.0407, "step": 147380 }, { "epoch": 0.95, "learning_rate": 0.00015730651813317668, "loss": 0.0435, "step": 147390 }, { "epoch": 0.95, "learning_rate": 0.00015729683677881976, "loss": 0.0399, "step": 147400 }, { "epoch": 0.95, "learning_rate": 0.00015728715542446284, "loss": 0.0434, "step": 147410 }, { "epoch": 0.95, "learning_rate": 0.0001572774740701059, "loss": 0.0405, "step": 147420 }, { "epoch": 0.95, "learning_rate": 0.00015726779271574897, "loss": 0.0344, "step": 147430 }, { "epoch": 0.95, "learning_rate": 0.00015725811136139205, "loss": 0.0375, "step": 147440 }, { "epoch": 0.95, "learning_rate": 0.00015724843000703513, "loss": 0.0411, "step": 147450 }, { "epoch": 0.95, "learning_rate": 0.00015723874865267816, "loss": 0.0405, "step": 147460 }, { "epoch": 0.95, "learning_rate": 0.00015722906729832123, "loss": 0.0383, "step": 147470 }, { "epoch": 0.95, "learning_rate": 0.00015721938594396431, "loss": 0.0426, "step": 147480 }, { "epoch": 0.95, "learning_rate": 0.00015720970458960737, "loss": 0.0409, "step": 147490 }, { "epoch": 0.95, "learning_rate": 0.00015720002323525045, "loss": 0.0351, "step": 147500 }, { "epoch": 0.95, "learning_rate": 0.00015719034188089353, "loss": 0.0371, "step": 147510 }, { "epoch": 0.95, "learning_rate": 0.0001571806605265366, "loss": 0.0358, "step": 147520 }, { "epoch": 0.95, "learning_rate": 0.00015717097917217963, "loss": 0.0425, "step": 147530 }, { "epoch": 0.95, "learning_rate": 0.0001571612978178227, "loss": 0.0398, "step": 147540 }, { "epoch": 0.95, "learning_rate": 0.0001571516164634658, "loss": 0.0401, "step": 147550 }, { "epoch": 0.95, "learning_rate": 0.00015714193510910884, "loss": 0.0388, "step": 147560 }, { "epoch": 0.95, "learning_rate": 0.00015713225375475192, "loss": 0.0383, "step": 147570 }, { "epoch": 0.95, "learning_rate": 0.000157122572400395, "loss": 0.0353, "step": 147580 }, { "epoch": 0.95, "learning_rate": 0.00015711289104603806, "loss": 0.0409, "step": 147590 }, { "epoch": 0.95, "learning_rate": 0.0001571032096916811, "loss": 0.0392, "step": 147600 }, { "epoch": 0.95, "learning_rate": 0.0001570935283373242, "loss": 0.0354, "step": 147610 }, { "epoch": 0.95, "learning_rate": 0.00015708384698296724, "loss": 0.0398, "step": 147620 }, { "epoch": 0.95, "learning_rate": 0.00015707416562861032, "loss": 0.0419, "step": 147630 }, { "epoch": 0.95, "learning_rate": 0.0001570644842742534, "loss": 0.0353, "step": 147640 }, { "epoch": 0.95, "learning_rate": 0.00015705480291989648, "loss": 0.0361, "step": 147650 }, { "epoch": 0.95, "learning_rate": 0.00015704512156553953, "loss": 0.0446, "step": 147660 }, { "epoch": 0.95, "learning_rate": 0.0001570354402111826, "loss": 0.0387, "step": 147670 }, { "epoch": 0.95, "learning_rate": 0.00015702575885682567, "loss": 0.0351, "step": 147680 }, { "epoch": 0.95, "learning_rate": 0.00015701607750246872, "loss": 0.0362, "step": 147690 }, { "epoch": 0.95, "learning_rate": 0.0001570063961481118, "loss": 0.0342, "step": 147700 }, { "epoch": 0.95, "learning_rate": 0.00015699671479375488, "loss": 0.0338, "step": 147710 }, { "epoch": 0.95, "learning_rate": 0.00015698703343939796, "loss": 0.0376, "step": 147720 }, { "epoch": 0.95, "learning_rate": 0.000156977352085041, "loss": 0.0394, "step": 147730 }, { "epoch": 0.95, "learning_rate": 0.00015696767073068406, "loss": 0.0528, "step": 147740 }, { "epoch": 0.95, "learning_rate": 0.00015695798937632714, "loss": 0.0366, "step": 147750 }, { "epoch": 0.95, "learning_rate": 0.0001569483080219702, "loss": 0.0454, "step": 147760 }, { "epoch": 0.95, "learning_rate": 0.00015693862666761328, "loss": 0.0365, "step": 147770 }, { "epoch": 0.95, "learning_rate": 0.00015692894531325636, "loss": 0.037, "step": 147780 }, { "epoch": 0.95, "learning_rate": 0.0001569192639588994, "loss": 0.0395, "step": 147790 }, { "epoch": 0.95, "learning_rate": 0.0001569095826045425, "loss": 0.0449, "step": 147800 }, { "epoch": 0.95, "learning_rate": 0.00015689990125018554, "loss": 0.0407, "step": 147810 }, { "epoch": 0.95, "learning_rate": 0.0001568902198958286, "loss": 0.0404, "step": 147820 }, { "epoch": 0.95, "learning_rate": 0.00015688053854147167, "loss": 0.0328, "step": 147830 }, { "epoch": 0.95, "learning_rate": 0.00015687085718711475, "loss": 0.0334, "step": 147840 }, { "epoch": 0.95, "learning_rate": 0.00015686117583275783, "loss": 0.0456, "step": 147850 }, { "epoch": 0.95, "learning_rate": 0.00015685149447840089, "loss": 0.0355, "step": 147860 }, { "epoch": 0.95, "learning_rate": 0.00015684181312404397, "loss": 0.042, "step": 147870 }, { "epoch": 0.95, "learning_rate": 0.00015683213176968702, "loss": 0.0478, "step": 147880 }, { "epoch": 0.95, "learning_rate": 0.00015682245041533007, "loss": 0.033, "step": 147890 }, { "epoch": 0.95, "learning_rate": 0.00015681276906097315, "loss": 0.0397, "step": 147900 }, { "epoch": 0.95, "learning_rate": 0.00015680308770661623, "loss": 0.0367, "step": 147910 }, { "epoch": 0.95, "learning_rate": 0.0001567934063522593, "loss": 0.0378, "step": 147920 }, { "epoch": 0.95, "learning_rate": 0.00015678372499790236, "loss": 0.0358, "step": 147930 }, { "epoch": 0.95, "learning_rate": 0.00015677404364354544, "loss": 0.0418, "step": 147940 }, { "epoch": 0.95, "learning_rate": 0.0001567643622891885, "loss": 0.0383, "step": 147950 }, { "epoch": 0.95, "learning_rate": 0.00015675468093483155, "loss": 0.0366, "step": 147960 }, { "epoch": 0.96, "learning_rate": 0.00015674499958047463, "loss": 0.0429, "step": 147970 }, { "epoch": 0.96, "learning_rate": 0.0001567353182261177, "loss": 0.0343, "step": 147980 }, { "epoch": 0.96, "learning_rate": 0.00015672563687176076, "loss": 0.0539, "step": 147990 }, { "epoch": 0.96, "learning_rate": 0.00015671595551740384, "loss": 0.0405, "step": 148000 }, { "epoch": 0.96, "eval_cer": 0.9198861145633261, "eval_loss": 0.025960681959986687, "eval_runtime": 119.8751, "eval_samples_per_second": 16.684, "eval_steps_per_second": 4.171, "step": 148000 }, { "epoch": 0.96, "learning_rate": 0.00015670627416304692, "loss": 0.0314, "step": 148010 }, { "epoch": 0.96, "learning_rate": 0.00015669659280868995, "loss": 0.0357, "step": 148020 }, { "epoch": 0.96, "learning_rate": 0.00015668691145433303, "loss": 0.0404, "step": 148030 }, { "epoch": 0.96, "learning_rate": 0.0001566772300999761, "loss": 0.0365, "step": 148040 }, { "epoch": 0.96, "learning_rate": 0.00015666754874561919, "loss": 0.0374, "step": 148050 }, { "epoch": 0.96, "learning_rate": 0.00015665786739126224, "loss": 0.0398, "step": 148060 }, { "epoch": 0.96, "learning_rate": 0.00015664818603690532, "loss": 0.0456, "step": 148070 }, { "epoch": 0.96, "learning_rate": 0.00015663850468254837, "loss": 0.0348, "step": 148080 }, { "epoch": 0.96, "learning_rate": 0.00015662882332819142, "loss": 0.0376, "step": 148090 }, { "epoch": 0.96, "learning_rate": 0.0001566191419738345, "loss": 0.0396, "step": 148100 }, { "epoch": 0.96, "learning_rate": 0.00015660946061947758, "loss": 0.0393, "step": 148110 }, { "epoch": 0.96, "learning_rate": 0.00015659977926512066, "loss": 0.0374, "step": 148120 }, { "epoch": 0.96, "learning_rate": 0.00015659009791076372, "loss": 0.0426, "step": 148130 }, { "epoch": 0.96, "learning_rate": 0.0001565804165564068, "loss": 0.0351, "step": 148140 }, { "epoch": 0.96, "learning_rate": 0.00015657073520204985, "loss": 0.0364, "step": 148150 }, { "epoch": 0.96, "learning_rate": 0.0001565610538476929, "loss": 0.0413, "step": 148160 }, { "epoch": 0.96, "learning_rate": 0.00015655137249333598, "loss": 0.0344, "step": 148170 }, { "epoch": 0.96, "learning_rate": 0.00015654169113897906, "loss": 0.035, "step": 148180 }, { "epoch": 0.96, "learning_rate": 0.0001565320097846221, "loss": 0.0417, "step": 148190 }, { "epoch": 0.96, "learning_rate": 0.0001565223284302652, "loss": 0.0349, "step": 148200 }, { "epoch": 0.96, "learning_rate": 0.00015651264707590827, "loss": 0.0405, "step": 148210 }, { "epoch": 0.96, "learning_rate": 0.0001565029657215513, "loss": 0.0426, "step": 148220 }, { "epoch": 0.96, "learning_rate": 0.00015649328436719438, "loss": 0.0364, "step": 148230 }, { "epoch": 0.96, "learning_rate": 0.00015648360301283746, "loss": 0.0356, "step": 148240 }, { "epoch": 0.96, "learning_rate": 0.00015647392165848054, "loss": 0.0353, "step": 148250 }, { "epoch": 0.96, "learning_rate": 0.0001564642403041236, "loss": 0.043, "step": 148260 }, { "epoch": 0.96, "learning_rate": 0.00015645455894976667, "loss": 0.0402, "step": 148270 }, { "epoch": 0.96, "learning_rate": 0.00015644487759540975, "loss": 0.039, "step": 148280 }, { "epoch": 0.96, "learning_rate": 0.00015643519624105277, "loss": 0.0365, "step": 148290 }, { "epoch": 0.96, "learning_rate": 0.00015642551488669585, "loss": 0.0373, "step": 148300 }, { "epoch": 0.96, "learning_rate": 0.00015641583353233893, "loss": 0.0321, "step": 148310 }, { "epoch": 0.96, "learning_rate": 0.00015640615217798201, "loss": 0.0353, "step": 148320 }, { "epoch": 0.96, "learning_rate": 0.00015639647082362507, "loss": 0.039, "step": 148330 }, { "epoch": 0.96, "learning_rate": 0.00015638678946926815, "loss": 0.0429, "step": 148340 }, { "epoch": 0.96, "learning_rate": 0.00015637710811491123, "loss": 0.035, "step": 148350 }, { "epoch": 0.96, "learning_rate": 0.00015636742676055425, "loss": 0.0575, "step": 148360 }, { "epoch": 0.96, "learning_rate": 0.00015635774540619733, "loss": 0.0481, "step": 148370 }, { "epoch": 0.96, "learning_rate": 0.0001563480640518404, "loss": 0.0352, "step": 148380 }, { "epoch": 0.96, "learning_rate": 0.00015633838269748346, "loss": 0.0369, "step": 148390 }, { "epoch": 0.96, "learning_rate": 0.00015632870134312654, "loss": 0.0325, "step": 148400 }, { "epoch": 0.96, "learning_rate": 0.00015631901998876962, "loss": 0.0458, "step": 148410 }, { "epoch": 0.96, "learning_rate": 0.0001563093386344127, "loss": 0.0425, "step": 148420 }, { "epoch": 0.96, "learning_rate": 0.00015629965728005573, "loss": 0.0332, "step": 148430 }, { "epoch": 0.96, "learning_rate": 0.0001562899759256988, "loss": 0.0323, "step": 148440 }, { "epoch": 0.96, "learning_rate": 0.0001562802945713419, "loss": 0.037, "step": 148450 }, { "epoch": 0.96, "learning_rate": 0.00015627061321698494, "loss": 0.0469, "step": 148460 }, { "epoch": 0.96, "learning_rate": 0.00015626093186262802, "loss": 0.0368, "step": 148470 }, { "epoch": 0.96, "learning_rate": 0.0001562512505082711, "loss": 0.0444, "step": 148480 }, { "epoch": 0.96, "learning_rate": 0.00015624156915391418, "loss": 0.0321, "step": 148490 }, { "epoch": 0.96, "learning_rate": 0.0001562318877995572, "loss": 0.0499, "step": 148500 }, { "epoch": 0.96, "learning_rate": 0.00015622220644520029, "loss": 0.034, "step": 148510 }, { "epoch": 0.96, "learning_rate": 0.00015621252509084337, "loss": 0.0405, "step": 148520 }, { "epoch": 0.96, "learning_rate": 0.00015620284373648642, "loss": 0.0407, "step": 148530 }, { "epoch": 0.96, "learning_rate": 0.0001561931623821295, "loss": 0.0486, "step": 148540 }, { "epoch": 0.96, "learning_rate": 0.00015618348102777258, "loss": 0.0434, "step": 148550 }, { "epoch": 0.96, "learning_rate": 0.00015617379967341566, "loss": 0.0437, "step": 148560 }, { "epoch": 0.96, "learning_rate": 0.00015616411831905868, "loss": 0.0441, "step": 148570 }, { "epoch": 0.96, "learning_rate": 0.00015615443696470176, "loss": 0.0385, "step": 148580 }, { "epoch": 0.96, "learning_rate": 0.00015614475561034482, "loss": 0.0391, "step": 148590 }, { "epoch": 0.96, "learning_rate": 0.0001561350742559879, "loss": 0.0329, "step": 148600 }, { "epoch": 0.96, "learning_rate": 0.00015612539290163098, "loss": 0.0372, "step": 148610 }, { "epoch": 0.96, "learning_rate": 0.00015611571154727406, "loss": 0.0355, "step": 148620 }, { "epoch": 0.96, "learning_rate": 0.0001561060301929171, "loss": 0.0409, "step": 148630 }, { "epoch": 0.96, "learning_rate": 0.00015609634883856016, "loss": 0.0362, "step": 148640 }, { "epoch": 0.96, "learning_rate": 0.00015608666748420324, "loss": 0.0393, "step": 148650 }, { "epoch": 0.96, "learning_rate": 0.0001560769861298463, "loss": 0.0352, "step": 148660 }, { "epoch": 0.96, "learning_rate": 0.00015606730477548937, "loss": 0.0405, "step": 148670 }, { "epoch": 0.96, "learning_rate": 0.00015605762342113245, "loss": 0.0377, "step": 148680 }, { "epoch": 0.96, "learning_rate": 0.00015604794206677553, "loss": 0.033, "step": 148690 }, { "epoch": 0.96, "learning_rate": 0.00015603826071241859, "loss": 0.0434, "step": 148700 }, { "epoch": 0.96, "learning_rate": 0.00015602857935806164, "loss": 0.0443, "step": 148710 }, { "epoch": 0.96, "learning_rate": 0.00015601889800370472, "loss": 0.0396, "step": 148720 }, { "epoch": 0.96, "learning_rate": 0.00015600921664934777, "loss": 0.0386, "step": 148730 }, { "epoch": 0.96, "learning_rate": 0.00015599953529499085, "loss": 0.0479, "step": 148740 }, { "epoch": 0.96, "learning_rate": 0.00015598985394063393, "loss": 0.041, "step": 148750 }, { "epoch": 0.96, "learning_rate": 0.000155980172586277, "loss": 0.0386, "step": 148760 }, { "epoch": 0.96, "learning_rate": 0.00015597049123192006, "loss": 0.0392, "step": 148770 }, { "epoch": 0.96, "learning_rate": 0.00015596080987756312, "loss": 0.036, "step": 148780 }, { "epoch": 0.96, "learning_rate": 0.00015595112852320617, "loss": 0.036, "step": 148790 }, { "epoch": 0.96, "learning_rate": 0.00015594144716884925, "loss": 0.0355, "step": 148800 }, { "epoch": 0.96, "learning_rate": 0.00015593176581449233, "loss": 0.0431, "step": 148810 }, { "epoch": 0.96, "learning_rate": 0.0001559220844601354, "loss": 0.0388, "step": 148820 }, { "epoch": 0.96, "learning_rate": 0.00015591240310577846, "loss": 0.0365, "step": 148830 }, { "epoch": 0.96, "learning_rate": 0.00015590272175142154, "loss": 0.0385, "step": 148840 }, { "epoch": 0.96, "learning_rate": 0.0001558930403970646, "loss": 0.0406, "step": 148850 }, { "epoch": 0.96, "learning_rate": 0.00015588335904270765, "loss": 0.0348, "step": 148860 }, { "epoch": 0.96, "learning_rate": 0.00015587367768835073, "loss": 0.043, "step": 148870 }, { "epoch": 0.96, "learning_rate": 0.0001558639963339938, "loss": 0.0362, "step": 148880 }, { "epoch": 0.96, "learning_rate": 0.00015585431497963688, "loss": 0.0394, "step": 148890 }, { "epoch": 0.96, "learning_rate": 0.00015584463362527994, "loss": 0.0374, "step": 148900 }, { "epoch": 0.96, "learning_rate": 0.00015583495227092302, "loss": 0.0467, "step": 148910 }, { "epoch": 0.96, "learning_rate": 0.00015582527091656607, "loss": 0.045, "step": 148920 }, { "epoch": 0.96, "learning_rate": 0.00015581558956220912, "loss": 0.0465, "step": 148930 }, { "epoch": 0.96, "learning_rate": 0.0001558059082078522, "loss": 0.0378, "step": 148940 }, { "epoch": 0.96, "learning_rate": 0.00015579622685349528, "loss": 0.0413, "step": 148950 }, { "epoch": 0.96, "learning_rate": 0.00015578654549913836, "loss": 0.0397, "step": 148960 }, { "epoch": 0.96, "learning_rate": 0.00015577686414478141, "loss": 0.0363, "step": 148970 }, { "epoch": 0.96, "learning_rate": 0.0001557671827904245, "loss": 0.0481, "step": 148980 }, { "epoch": 0.96, "learning_rate": 0.00015575750143606752, "loss": 0.0466, "step": 148990 }, { "epoch": 0.96, "learning_rate": 0.0001557478200817106, "loss": 0.0433, "step": 149000 }, { "epoch": 0.96, "eval_cer": 0.919936730312959, "eval_loss": 0.025839416310191154, "eval_runtime": 119.7309, "eval_samples_per_second": 16.704, "eval_steps_per_second": 4.176, "step": 149000 }, { "epoch": 0.96, "learning_rate": 0.00015573813872735368, "loss": 0.0354, "step": 149010 }, { "epoch": 0.96, "learning_rate": 0.00015572845737299676, "loss": 0.0353, "step": 149020 }, { "epoch": 0.96, "learning_rate": 0.0001557187760186398, "loss": 0.0358, "step": 149030 }, { "epoch": 0.96, "learning_rate": 0.0001557090946642829, "loss": 0.0546, "step": 149040 }, { "epoch": 0.96, "learning_rate": 0.00015569941330992597, "loss": 0.0436, "step": 149050 }, { "epoch": 0.96, "learning_rate": 0.000155689731955569, "loss": 0.0369, "step": 149060 }, { "epoch": 0.96, "learning_rate": 0.00015568005060121208, "loss": 0.041, "step": 149070 }, { "epoch": 0.96, "learning_rate": 0.00015567036924685516, "loss": 0.0374, "step": 149080 }, { "epoch": 0.96, "learning_rate": 0.00015566068789249824, "loss": 0.0366, "step": 149090 }, { "epoch": 0.96, "learning_rate": 0.0001556510065381413, "loss": 0.0358, "step": 149100 }, { "epoch": 0.96, "learning_rate": 0.00015564132518378437, "loss": 0.0375, "step": 149110 }, { "epoch": 0.96, "learning_rate": 0.00015563164382942745, "loss": 0.0347, "step": 149120 }, { "epoch": 0.96, "learning_rate": 0.00015562196247507047, "loss": 0.0363, "step": 149130 }, { "epoch": 0.96, "learning_rate": 0.00015561228112071355, "loss": 0.0462, "step": 149140 }, { "epoch": 0.96, "learning_rate": 0.00015560259976635663, "loss": 0.0369, "step": 149150 }, { "epoch": 0.96, "learning_rate": 0.00015559291841199971, "loss": 0.0406, "step": 149160 }, { "epoch": 0.96, "learning_rate": 0.00015558323705764277, "loss": 0.038, "step": 149170 }, { "epoch": 0.96, "learning_rate": 0.00015557355570328585, "loss": 0.0402, "step": 149180 }, { "epoch": 0.96, "learning_rate": 0.00015556387434892893, "loss": 0.0338, "step": 149190 }, { "epoch": 0.96, "learning_rate": 0.00015555419299457195, "loss": 0.0384, "step": 149200 }, { "epoch": 0.96, "learning_rate": 0.00015554451164021503, "loss": 0.0304, "step": 149210 }, { "epoch": 0.96, "learning_rate": 0.0001555348302858581, "loss": 0.0439, "step": 149220 }, { "epoch": 0.96, "learning_rate": 0.00015552514893150116, "loss": 0.0399, "step": 149230 }, { "epoch": 0.96, "learning_rate": 0.00015551546757714424, "loss": 0.0373, "step": 149240 }, { "epoch": 0.96, "learning_rate": 0.00015550578622278732, "loss": 0.0377, "step": 149250 }, { "epoch": 0.96, "learning_rate": 0.0001554961048684304, "loss": 0.0347, "step": 149260 }, { "epoch": 0.96, "learning_rate": 0.00015548642351407343, "loss": 0.0401, "step": 149270 }, { "epoch": 0.96, "learning_rate": 0.0001554767421597165, "loss": 0.0441, "step": 149280 }, { "epoch": 0.96, "learning_rate": 0.0001554670608053596, "loss": 0.0388, "step": 149290 }, { "epoch": 0.96, "learning_rate": 0.00015545737945100264, "loss": 0.0423, "step": 149300 }, { "epoch": 0.96, "learning_rate": 0.00015544769809664572, "loss": 0.0311, "step": 149310 }, { "epoch": 0.96, "learning_rate": 0.0001554380167422888, "loss": 0.041, "step": 149320 }, { "epoch": 0.96, "learning_rate": 0.00015542833538793188, "loss": 0.0385, "step": 149330 }, { "epoch": 0.96, "learning_rate": 0.0001554186540335749, "loss": 0.041, "step": 149340 }, { "epoch": 0.96, "learning_rate": 0.00015540897267921799, "loss": 0.0342, "step": 149350 }, { "epoch": 0.96, "learning_rate": 0.00015539929132486107, "loss": 0.0377, "step": 149360 }, { "epoch": 0.96, "learning_rate": 0.00015538960997050412, "loss": 0.0317, "step": 149370 }, { "epoch": 0.96, "learning_rate": 0.0001553799286161472, "loss": 0.0338, "step": 149380 }, { "epoch": 0.96, "learning_rate": 0.00015537024726179028, "loss": 0.0346, "step": 149390 }, { "epoch": 0.96, "learning_rate": 0.00015536056590743333, "loss": 0.0428, "step": 149400 }, { "epoch": 0.96, "learning_rate": 0.00015535088455307638, "loss": 0.0354, "step": 149410 }, { "epoch": 0.96, "learning_rate": 0.00015534120319871946, "loss": 0.0383, "step": 149420 }, { "epoch": 0.96, "learning_rate": 0.00015533152184436252, "loss": 0.0398, "step": 149430 }, { "epoch": 0.96, "learning_rate": 0.0001553218404900056, "loss": 0.0369, "step": 149440 }, { "epoch": 0.96, "learning_rate": 0.00015531215913564868, "loss": 0.037, "step": 149450 }, { "epoch": 0.96, "learning_rate": 0.00015530247778129176, "loss": 0.0386, "step": 149460 }, { "epoch": 0.96, "learning_rate": 0.0001552927964269348, "loss": 0.046, "step": 149470 }, { "epoch": 0.96, "learning_rate": 0.00015528311507257786, "loss": 0.0466, "step": 149480 }, { "epoch": 0.96, "learning_rate": 0.00015527343371822094, "loss": 0.0371, "step": 149490 }, { "epoch": 0.96, "learning_rate": 0.000155263752363864, "loss": 0.0417, "step": 149500 }, { "epoch": 0.96, "learning_rate": 0.00015525407100950707, "loss": 0.041, "step": 149510 }, { "epoch": 0.97, "learning_rate": 0.00015524438965515015, "loss": 0.0344, "step": 149520 }, { "epoch": 0.97, "learning_rate": 0.00015523470830079323, "loss": 0.0368, "step": 149530 }, { "epoch": 0.97, "learning_rate": 0.00015522502694643629, "loss": 0.0313, "step": 149540 }, { "epoch": 0.97, "learning_rate": 0.00015521534559207934, "loss": 0.0371, "step": 149550 }, { "epoch": 0.97, "learning_rate": 0.00015520566423772242, "loss": 0.0368, "step": 149560 }, { "epoch": 0.97, "learning_rate": 0.00015519598288336547, "loss": 0.0354, "step": 149570 }, { "epoch": 0.97, "learning_rate": 0.00015518630152900855, "loss": 0.0394, "step": 149580 }, { "epoch": 0.97, "learning_rate": 0.00015517662017465163, "loss": 0.0357, "step": 149590 }, { "epoch": 0.97, "learning_rate": 0.00015516693882029468, "loss": 0.0407, "step": 149600 }, { "epoch": 0.97, "learning_rate": 0.00015515725746593776, "loss": 0.0464, "step": 149610 }, { "epoch": 0.97, "learning_rate": 0.00015514757611158082, "loss": 0.035, "step": 149620 }, { "epoch": 0.97, "learning_rate": 0.00015513789475722387, "loss": 0.0482, "step": 149630 }, { "epoch": 0.97, "learning_rate": 0.00015512821340286695, "loss": 0.033, "step": 149640 }, { "epoch": 0.97, "learning_rate": 0.00015511853204851003, "loss": 0.0421, "step": 149650 }, { "epoch": 0.97, "learning_rate": 0.0001551088506941531, "loss": 0.038, "step": 149660 }, { "epoch": 0.97, "learning_rate": 0.00015509916933979616, "loss": 0.0417, "step": 149670 }, { "epoch": 0.97, "learning_rate": 0.00015508948798543924, "loss": 0.0415, "step": 149680 }, { "epoch": 0.97, "learning_rate": 0.0001550798066310823, "loss": 0.0405, "step": 149690 }, { "epoch": 0.97, "learning_rate": 0.00015507012527672534, "loss": 0.034, "step": 149700 }, { "epoch": 0.97, "learning_rate": 0.00015506044392236842, "loss": 0.0386, "step": 149710 }, { "epoch": 0.97, "learning_rate": 0.0001550507625680115, "loss": 0.0444, "step": 149720 }, { "epoch": 0.97, "learning_rate": 0.00015504108121365458, "loss": 0.0398, "step": 149730 }, { "epoch": 0.97, "learning_rate": 0.00015503139985929764, "loss": 0.0349, "step": 149740 }, { "epoch": 0.97, "learning_rate": 0.00015502171850494072, "loss": 0.039, "step": 149750 }, { "epoch": 0.97, "learning_rate": 0.00015501203715058377, "loss": 0.0375, "step": 149760 }, { "epoch": 0.97, "learning_rate": 0.00015500235579622682, "loss": 0.0343, "step": 149770 }, { "epoch": 0.97, "learning_rate": 0.0001549926744418699, "loss": 0.0359, "step": 149780 }, { "epoch": 0.97, "learning_rate": 0.00015498299308751298, "loss": 0.0394, "step": 149790 }, { "epoch": 0.97, "learning_rate": 0.00015497331173315603, "loss": 0.0368, "step": 149800 }, { "epoch": 0.97, "learning_rate": 0.00015496363037879911, "loss": 0.0341, "step": 149810 }, { "epoch": 0.97, "learning_rate": 0.0001549539490244422, "loss": 0.0437, "step": 149820 }, { "epoch": 0.97, "learning_rate": 0.00015494426767008522, "loss": 0.0452, "step": 149830 }, { "epoch": 0.97, "learning_rate": 0.0001549345863157283, "loss": 0.0433, "step": 149840 }, { "epoch": 0.97, "learning_rate": 0.00015492490496137138, "loss": 0.0389, "step": 149850 }, { "epoch": 0.97, "learning_rate": 0.00015491522360701446, "loss": 0.0413, "step": 149860 }, { "epoch": 0.97, "learning_rate": 0.0001549055422526575, "loss": 0.0334, "step": 149870 }, { "epoch": 0.97, "learning_rate": 0.0001548958608983006, "loss": 0.0389, "step": 149880 }, { "epoch": 0.97, "learning_rate": 0.00015488617954394367, "loss": 0.0406, "step": 149890 }, { "epoch": 0.97, "learning_rate": 0.0001548764981895867, "loss": 0.0366, "step": 149900 }, { "epoch": 0.97, "learning_rate": 0.00015486681683522978, "loss": 0.0344, "step": 149910 }, { "epoch": 0.97, "learning_rate": 0.00015485713548087286, "loss": 0.0366, "step": 149920 }, { "epoch": 0.97, "learning_rate": 0.00015484745412651594, "loss": 0.0378, "step": 149930 }, { "epoch": 0.97, "learning_rate": 0.000154837772772159, "loss": 0.0365, "step": 149940 }, { "epoch": 0.97, "learning_rate": 0.00015482809141780207, "loss": 0.0363, "step": 149950 }, { "epoch": 0.97, "learning_rate": 0.00015481841006344515, "loss": 0.0402, "step": 149960 }, { "epoch": 0.97, "learning_rate": 0.00015480872870908817, "loss": 0.042, "step": 149970 }, { "epoch": 0.97, "learning_rate": 0.00015479904735473125, "loss": 0.0349, "step": 149980 }, { "epoch": 0.97, "learning_rate": 0.00015478936600037433, "loss": 0.0389, "step": 149990 }, { "epoch": 0.97, "learning_rate": 0.00015477968464601739, "loss": 0.0378, "step": 150000 }, { "epoch": 0.97, "eval_cer": 0.9199909614732799, "eval_loss": 0.026005547493696213, "eval_runtime": 119.8926, "eval_samples_per_second": 16.682, "eval_steps_per_second": 4.17, "step": 150000 }, { "epoch": 0.97, "learning_rate": 0.00015477000329166047, "loss": 0.0436, "step": 150010 }, { "epoch": 0.97, "learning_rate": 0.00015476032193730355, "loss": 0.0347, "step": 150020 }, { "epoch": 0.97, "learning_rate": 0.00015475064058294663, "loss": 0.0352, "step": 150030 }, { "epoch": 0.97, "learning_rate": 0.00015474095922858965, "loss": 0.0415, "step": 150040 }, { "epoch": 0.97, "learning_rate": 0.00015473127787423273, "loss": 0.0391, "step": 150050 }, { "epoch": 0.97, "learning_rate": 0.0001547215965198758, "loss": 0.0401, "step": 150060 }, { "epoch": 0.97, "learning_rate": 0.00015471191516551886, "loss": 0.0407, "step": 150070 }, { "epoch": 0.97, "learning_rate": 0.00015470223381116194, "loss": 0.043, "step": 150080 }, { "epoch": 0.97, "learning_rate": 0.00015469255245680502, "loss": 0.0432, "step": 150090 }, { "epoch": 0.97, "learning_rate": 0.0001546828711024481, "loss": 0.0341, "step": 150100 }, { "epoch": 0.97, "learning_rate": 0.00015467318974809113, "loss": 0.0436, "step": 150110 }, { "epoch": 0.97, "learning_rate": 0.0001546635083937342, "loss": 0.0445, "step": 150120 }, { "epoch": 0.97, "learning_rate": 0.0001546538270393773, "loss": 0.0388, "step": 150130 }, { "epoch": 0.97, "learning_rate": 0.00015464414568502034, "loss": 0.0377, "step": 150140 }, { "epoch": 0.97, "learning_rate": 0.00015463446433066342, "loss": 0.04, "step": 150150 }, { "epoch": 0.97, "learning_rate": 0.0001546247829763065, "loss": 0.0361, "step": 150160 }, { "epoch": 0.97, "learning_rate": 0.00015461510162194955, "loss": 0.0368, "step": 150170 }, { "epoch": 0.97, "learning_rate": 0.0001546054202675926, "loss": 0.0377, "step": 150180 }, { "epoch": 0.97, "learning_rate": 0.00015459573891323569, "loss": 0.0352, "step": 150190 }, { "epoch": 0.97, "learning_rate": 0.00015458605755887874, "loss": 0.036, "step": 150200 }, { "epoch": 0.97, "learning_rate": 0.00015457637620452182, "loss": 0.0325, "step": 150210 }, { "epoch": 0.97, "learning_rate": 0.0001545666948501649, "loss": 0.0414, "step": 150220 }, { "epoch": 0.97, "learning_rate": 0.00015455701349580798, "loss": 0.038, "step": 150230 }, { "epoch": 0.97, "learning_rate": 0.00015454733214145103, "loss": 0.033, "step": 150240 }, { "epoch": 0.97, "learning_rate": 0.00015453765078709408, "loss": 0.0421, "step": 150250 }, { "epoch": 0.97, "learning_rate": 0.00015452796943273716, "loss": 0.038, "step": 150260 }, { "epoch": 0.97, "learning_rate": 0.00015451828807838022, "loss": 0.0437, "step": 150270 }, { "epoch": 0.97, "learning_rate": 0.0001545086067240233, "loss": 0.0367, "step": 150280 }, { "epoch": 0.97, "learning_rate": 0.00015449892536966638, "loss": 0.0424, "step": 150290 }, { "epoch": 0.97, "learning_rate": 0.00015448924401530945, "loss": 0.0457, "step": 150300 }, { "epoch": 0.97, "learning_rate": 0.0001544795626609525, "loss": 0.0434, "step": 150310 }, { "epoch": 0.97, "learning_rate": 0.00015446988130659556, "loss": 0.0466, "step": 150320 }, { "epoch": 0.97, "learning_rate": 0.00015446019995223864, "loss": 0.0428, "step": 150330 }, { "epoch": 0.97, "learning_rate": 0.0001544505185978817, "loss": 0.0432, "step": 150340 }, { "epoch": 0.97, "learning_rate": 0.00015444083724352477, "loss": 0.0357, "step": 150350 }, { "epoch": 0.97, "learning_rate": 0.00015443115588916785, "loss": 0.0372, "step": 150360 }, { "epoch": 0.97, "learning_rate": 0.0001544214745348109, "loss": 0.0378, "step": 150370 }, { "epoch": 0.97, "learning_rate": 0.00015441179318045398, "loss": 0.0415, "step": 150380 }, { "epoch": 0.97, "learning_rate": 0.00015440211182609704, "loss": 0.0408, "step": 150390 }, { "epoch": 0.97, "learning_rate": 0.0001543924304717401, "loss": 0.0393, "step": 150400 }, { "epoch": 0.97, "learning_rate": 0.00015438274911738317, "loss": 0.0369, "step": 150410 }, { "epoch": 0.97, "learning_rate": 0.00015437306776302625, "loss": 0.0344, "step": 150420 }, { "epoch": 0.97, "learning_rate": 0.00015436338640866933, "loss": 0.0345, "step": 150430 }, { "epoch": 0.97, "learning_rate": 0.00015435370505431238, "loss": 0.0417, "step": 150440 }, { "epoch": 0.97, "learning_rate": 0.00015434402369995546, "loss": 0.0411, "step": 150450 }, { "epoch": 0.97, "learning_rate": 0.00015433434234559851, "loss": 0.0398, "step": 150460 }, { "epoch": 0.97, "learning_rate": 0.00015432466099124157, "loss": 0.0409, "step": 150470 }, { "epoch": 0.97, "learning_rate": 0.00015431497963688465, "loss": 0.0346, "step": 150480 }, { "epoch": 0.97, "learning_rate": 0.00015430529828252773, "loss": 0.0396, "step": 150490 }, { "epoch": 0.97, "learning_rate": 0.0001542956169281708, "loss": 0.0427, "step": 150500 }, { "epoch": 0.97, "learning_rate": 0.00015428593557381386, "loss": 0.0326, "step": 150510 }, { "epoch": 0.97, "learning_rate": 0.00015427625421945694, "loss": 0.0383, "step": 150520 }, { "epoch": 0.97, "learning_rate": 0.0001542665728651, "loss": 0.0364, "step": 150530 }, { "epoch": 0.97, "learning_rate": 0.00015425689151074304, "loss": 0.0401, "step": 150540 }, { "epoch": 0.97, "learning_rate": 0.00015424721015638612, "loss": 0.0398, "step": 150550 }, { "epoch": 0.97, "learning_rate": 0.0001542375288020292, "loss": 0.0379, "step": 150560 }, { "epoch": 0.97, "learning_rate": 0.00015422784744767226, "loss": 0.0352, "step": 150570 }, { "epoch": 0.97, "learning_rate": 0.00015421816609331534, "loss": 0.0399, "step": 150580 }, { "epoch": 0.97, "learning_rate": 0.00015420848473895842, "loss": 0.0377, "step": 150590 }, { "epoch": 0.97, "learning_rate": 0.00015419880338460144, "loss": 0.0406, "step": 150600 }, { "epoch": 0.97, "learning_rate": 0.00015418912203024452, "loss": 0.042, "step": 150610 }, { "epoch": 0.97, "learning_rate": 0.0001541794406758876, "loss": 0.0388, "step": 150620 }, { "epoch": 0.97, "learning_rate": 0.00015416975932153068, "loss": 0.04, "step": 150630 }, { "epoch": 0.97, "learning_rate": 0.00015416007796717373, "loss": 0.0429, "step": 150640 }, { "epoch": 0.97, "learning_rate": 0.00015415039661281681, "loss": 0.045, "step": 150650 }, { "epoch": 0.97, "learning_rate": 0.0001541407152584599, "loss": 0.0354, "step": 150660 }, { "epoch": 0.97, "learning_rate": 0.00015413103390410292, "loss": 0.0438, "step": 150670 }, { "epoch": 0.97, "learning_rate": 0.000154121352549746, "loss": 0.0426, "step": 150680 }, { "epoch": 0.97, "learning_rate": 0.00015411167119538908, "loss": 0.0376, "step": 150690 }, { "epoch": 0.97, "learning_rate": 0.00015410198984103216, "loss": 0.0329, "step": 150700 }, { "epoch": 0.97, "learning_rate": 0.0001540923084866752, "loss": 0.0392, "step": 150710 }, { "epoch": 0.97, "learning_rate": 0.0001540826271323183, "loss": 0.032, "step": 150720 }, { "epoch": 0.97, "learning_rate": 0.00015407294577796137, "loss": 0.0432, "step": 150730 }, { "epoch": 0.97, "learning_rate": 0.0001540632644236044, "loss": 0.0302, "step": 150740 }, { "epoch": 0.97, "learning_rate": 0.00015405358306924748, "loss": 0.0356, "step": 150750 }, { "epoch": 0.97, "learning_rate": 0.00015404390171489056, "loss": 0.0354, "step": 150760 }, { "epoch": 0.97, "learning_rate": 0.0001540342203605336, "loss": 0.0416, "step": 150770 }, { "epoch": 0.97, "learning_rate": 0.0001540245390061767, "loss": 0.0379, "step": 150780 }, { "epoch": 0.97, "learning_rate": 0.00015401485765181977, "loss": 0.033, "step": 150790 }, { "epoch": 0.97, "learning_rate": 0.00015400517629746285, "loss": 0.0387, "step": 150800 }, { "epoch": 0.97, "learning_rate": 0.00015399549494310587, "loss": 0.0393, "step": 150810 }, { "epoch": 0.97, "learning_rate": 0.00015398581358874895, "loss": 0.0394, "step": 150820 }, { "epoch": 0.97, "learning_rate": 0.00015397613223439203, "loss": 0.0351, "step": 150830 }, { "epoch": 0.97, "learning_rate": 0.00015396645088003509, "loss": 0.045, "step": 150840 }, { "epoch": 0.97, "learning_rate": 0.00015395676952567817, "loss": 0.0394, "step": 150850 }, { "epoch": 0.97, "learning_rate": 0.00015394708817132125, "loss": 0.0393, "step": 150860 }, { "epoch": 0.97, "learning_rate": 0.00015393740681696433, "loss": 0.0394, "step": 150870 }, { "epoch": 0.97, "learning_rate": 0.00015392772546260735, "loss": 0.0395, "step": 150880 }, { "epoch": 0.97, "learning_rate": 0.00015391804410825043, "loss": 0.0433, "step": 150890 }, { "epoch": 0.97, "learning_rate": 0.0001539083627538935, "loss": 0.0362, "step": 150900 }, { "epoch": 0.97, "learning_rate": 0.00015389868139953656, "loss": 0.0386, "step": 150910 }, { "epoch": 0.97, "learning_rate": 0.00015388900004517964, "loss": 0.039, "step": 150920 }, { "epoch": 0.97, "learning_rate": 0.00015387931869082272, "loss": 0.0314, "step": 150930 }, { "epoch": 0.97, "learning_rate": 0.0001538696373364658, "loss": 0.033, "step": 150940 }, { "epoch": 0.97, "learning_rate": 0.00015385995598210883, "loss": 0.0386, "step": 150950 }, { "epoch": 0.97, "learning_rate": 0.0001538502746277519, "loss": 0.0352, "step": 150960 }, { "epoch": 0.97, "learning_rate": 0.000153840593273395, "loss": 0.0347, "step": 150970 }, { "epoch": 0.97, "learning_rate": 0.00015383091191903804, "loss": 0.035, "step": 150980 }, { "epoch": 0.97, "learning_rate": 0.00015382123056468112, "loss": 0.0362, "step": 150990 }, { "epoch": 0.97, "learning_rate": 0.0001538115492103242, "loss": 0.0337, "step": 151000 }, { "epoch": 0.97, "eval_cer": 0.9198951530900463, "eval_loss": 0.025833461433649063, "eval_runtime": 120.3543, "eval_samples_per_second": 16.618, "eval_steps_per_second": 4.154, "step": 151000 }, { "epoch": 0.97, "learning_rate": 0.00015380186785596725, "loss": 0.0423, "step": 151010 }, { "epoch": 0.97, "learning_rate": 0.0001537921865016103, "loss": 0.0407, "step": 151020 }, { "epoch": 0.97, "learning_rate": 0.00015378250514725339, "loss": 0.0353, "step": 151030 }, { "epoch": 0.97, "learning_rate": 0.00015377282379289644, "loss": 0.0353, "step": 151040 }, { "epoch": 0.97, "learning_rate": 0.00015376314243853952, "loss": 0.0464, "step": 151050 }, { "epoch": 0.97, "learning_rate": 0.0001537534610841826, "loss": 0.0385, "step": 151060 }, { "epoch": 0.98, "learning_rate": 0.00015374377972982568, "loss": 0.036, "step": 151070 }, { "epoch": 0.98, "learning_rate": 0.00015373409837546873, "loss": 0.0344, "step": 151080 }, { "epoch": 0.98, "learning_rate": 0.00015372441702111178, "loss": 0.0379, "step": 151090 }, { "epoch": 0.98, "learning_rate": 0.00015371473566675486, "loss": 0.0339, "step": 151100 }, { "epoch": 0.98, "learning_rate": 0.00015370505431239792, "loss": 0.0375, "step": 151110 }, { "epoch": 0.98, "learning_rate": 0.000153695372958041, "loss": 0.0401, "step": 151120 }, { "epoch": 0.98, "learning_rate": 0.00015368569160368407, "loss": 0.0346, "step": 151130 }, { "epoch": 0.98, "learning_rate": 0.00015367601024932715, "loss": 0.0402, "step": 151140 }, { "epoch": 0.98, "learning_rate": 0.0001536663288949702, "loss": 0.0422, "step": 151150 }, { "epoch": 0.98, "learning_rate": 0.00015365664754061326, "loss": 0.0387, "step": 151160 }, { "epoch": 0.98, "learning_rate": 0.00015364696618625634, "loss": 0.0474, "step": 151170 }, { "epoch": 0.98, "learning_rate": 0.0001536372848318994, "loss": 0.0351, "step": 151180 }, { "epoch": 0.98, "learning_rate": 0.00015362760347754247, "loss": 0.0356, "step": 151190 }, { "epoch": 0.98, "learning_rate": 0.00015361792212318555, "loss": 0.042, "step": 151200 }, { "epoch": 0.98, "learning_rate": 0.0001536082407688286, "loss": 0.0383, "step": 151210 }, { "epoch": 0.98, "learning_rate": 0.00015359855941447168, "loss": 0.0397, "step": 151220 }, { "epoch": 0.98, "learning_rate": 0.00015358887806011474, "loss": 0.037, "step": 151230 }, { "epoch": 0.98, "learning_rate": 0.0001535791967057578, "loss": 0.0312, "step": 151240 }, { "epoch": 0.98, "learning_rate": 0.00015356951535140087, "loss": 0.0376, "step": 151250 }, { "epoch": 0.98, "learning_rate": 0.00015355983399704395, "loss": 0.0395, "step": 151260 }, { "epoch": 0.98, "learning_rate": 0.00015355015264268703, "loss": 0.0402, "step": 151270 }, { "epoch": 0.98, "learning_rate": 0.00015354047128833008, "loss": 0.0424, "step": 151280 }, { "epoch": 0.98, "learning_rate": 0.00015353078993397316, "loss": 0.0395, "step": 151290 }, { "epoch": 0.98, "learning_rate": 0.00015352110857961621, "loss": 0.0395, "step": 151300 }, { "epoch": 0.98, "learning_rate": 0.00015351142722525927, "loss": 0.0432, "step": 151310 }, { "epoch": 0.98, "learning_rate": 0.00015350174587090235, "loss": 0.0384, "step": 151320 }, { "epoch": 0.98, "learning_rate": 0.00015349206451654543, "loss": 0.0428, "step": 151330 }, { "epoch": 0.98, "learning_rate": 0.0001534823831621885, "loss": 0.0403, "step": 151340 }, { "epoch": 0.98, "learning_rate": 0.00015347270180783156, "loss": 0.0393, "step": 151350 }, { "epoch": 0.98, "learning_rate": 0.00015346302045347464, "loss": 0.0385, "step": 151360 }, { "epoch": 0.98, "learning_rate": 0.0001534533390991177, "loss": 0.0333, "step": 151370 }, { "epoch": 0.98, "learning_rate": 0.00015344365774476074, "loss": 0.0347, "step": 151380 }, { "epoch": 0.98, "learning_rate": 0.00015343397639040382, "loss": 0.0429, "step": 151390 }, { "epoch": 0.98, "learning_rate": 0.0001534242950360469, "loss": 0.0475, "step": 151400 }, { "epoch": 0.98, "learning_rate": 0.00015341461368168996, "loss": 0.0348, "step": 151410 }, { "epoch": 0.98, "learning_rate": 0.00015340493232733304, "loss": 0.0377, "step": 151420 }, { "epoch": 0.98, "learning_rate": 0.00015339525097297612, "loss": 0.0467, "step": 151430 }, { "epoch": 0.98, "learning_rate": 0.00015338556961861914, "loss": 0.0356, "step": 151440 }, { "epoch": 0.98, "learning_rate": 0.00015337588826426222, "loss": 0.0373, "step": 151450 }, { "epoch": 0.98, "learning_rate": 0.0001533662069099053, "loss": 0.0411, "step": 151460 }, { "epoch": 0.98, "learning_rate": 0.00015335652555554838, "loss": 0.0396, "step": 151470 }, { "epoch": 0.98, "learning_rate": 0.00015334684420119143, "loss": 0.0345, "step": 151480 }, { "epoch": 0.98, "learning_rate": 0.0001533371628468345, "loss": 0.0408, "step": 151490 }, { "epoch": 0.98, "learning_rate": 0.0001533274814924776, "loss": 0.0344, "step": 151500 }, { "epoch": 0.98, "learning_rate": 0.00015331780013812062, "loss": 0.0414, "step": 151510 }, { "epoch": 0.98, "learning_rate": 0.0001533081187837637, "loss": 0.046, "step": 151520 }, { "epoch": 0.98, "learning_rate": 0.00015329843742940678, "loss": 0.042, "step": 151530 }, { "epoch": 0.98, "learning_rate": 0.00015328875607504986, "loss": 0.0338, "step": 151540 }, { "epoch": 0.98, "learning_rate": 0.0001532790747206929, "loss": 0.0429, "step": 151550 }, { "epoch": 0.98, "learning_rate": 0.000153269393366336, "loss": 0.0354, "step": 151560 }, { "epoch": 0.98, "learning_rate": 0.00015325971201197907, "loss": 0.0374, "step": 151570 }, { "epoch": 0.98, "learning_rate": 0.0001532500306576221, "loss": 0.0329, "step": 151580 }, { "epoch": 0.98, "learning_rate": 0.00015324034930326518, "loss": 0.0368, "step": 151590 }, { "epoch": 0.98, "learning_rate": 0.00015323066794890826, "loss": 0.0449, "step": 151600 }, { "epoch": 0.98, "learning_rate": 0.0001532209865945513, "loss": 0.0379, "step": 151610 }, { "epoch": 0.98, "learning_rate": 0.0001532113052401944, "loss": 0.0411, "step": 151620 }, { "epoch": 0.98, "learning_rate": 0.00015320162388583747, "loss": 0.0426, "step": 151630 }, { "epoch": 0.98, "learning_rate": 0.00015319194253148055, "loss": 0.0384, "step": 151640 }, { "epoch": 0.98, "learning_rate": 0.00015318226117712357, "loss": 0.0365, "step": 151650 }, { "epoch": 0.98, "learning_rate": 0.00015317257982276665, "loss": 0.0421, "step": 151660 }, { "epoch": 0.98, "learning_rate": 0.00015316289846840973, "loss": 0.0323, "step": 151670 }, { "epoch": 0.98, "learning_rate": 0.00015315321711405279, "loss": 0.0327, "step": 151680 }, { "epoch": 0.98, "learning_rate": 0.00015314353575969587, "loss": 0.0418, "step": 151690 }, { "epoch": 0.98, "learning_rate": 0.00015313385440533895, "loss": 0.0391, "step": 151700 }, { "epoch": 0.98, "learning_rate": 0.00015312417305098202, "loss": 0.0359, "step": 151710 }, { "epoch": 0.98, "learning_rate": 0.00015311449169662505, "loss": 0.0394, "step": 151720 }, { "epoch": 0.98, "learning_rate": 0.00015310481034226813, "loss": 0.0345, "step": 151730 }, { "epoch": 0.98, "learning_rate": 0.0001530951289879112, "loss": 0.0375, "step": 151740 }, { "epoch": 0.98, "learning_rate": 0.00015308544763355426, "loss": 0.0342, "step": 151750 }, { "epoch": 0.98, "learning_rate": 0.00015307576627919734, "loss": 0.0361, "step": 151760 }, { "epoch": 0.98, "learning_rate": 0.00015306608492484042, "loss": 0.0358, "step": 151770 }, { "epoch": 0.98, "learning_rate": 0.00015305640357048348, "loss": 0.0432, "step": 151780 }, { "epoch": 0.98, "learning_rate": 0.00015304672221612653, "loss": 0.0399, "step": 151790 }, { "epoch": 0.98, "learning_rate": 0.0001530370408617696, "loss": 0.0458, "step": 151800 }, { "epoch": 0.98, "learning_rate": 0.00015302735950741266, "loss": 0.0404, "step": 151810 }, { "epoch": 0.98, "learning_rate": 0.00015301767815305574, "loss": 0.0408, "step": 151820 }, { "epoch": 0.98, "learning_rate": 0.00015300799679869882, "loss": 0.0471, "step": 151830 }, { "epoch": 0.98, "learning_rate": 0.0001529983154443419, "loss": 0.0351, "step": 151840 }, { "epoch": 0.98, "learning_rate": 0.00015298863408998495, "loss": 0.0425, "step": 151850 }, { "epoch": 0.98, "learning_rate": 0.000152978952735628, "loss": 0.0376, "step": 151860 }, { "epoch": 0.98, "learning_rate": 0.00015296927138127108, "loss": 0.0421, "step": 151870 }, { "epoch": 0.98, "learning_rate": 0.00015295959002691414, "loss": 0.0405, "step": 151880 }, { "epoch": 0.98, "learning_rate": 0.00015294990867255722, "loss": 0.0349, "step": 151890 }, { "epoch": 0.98, "learning_rate": 0.0001529402273182003, "loss": 0.0374, "step": 151900 }, { "epoch": 0.98, "learning_rate": 0.00015293054596384338, "loss": 0.0418, "step": 151910 }, { "epoch": 0.98, "learning_rate": 0.00015292086460948643, "loss": 0.035, "step": 151920 }, { "epoch": 0.98, "learning_rate": 0.00015291118325512948, "loss": 0.0379, "step": 151930 }, { "epoch": 0.98, "learning_rate": 0.00015290150190077256, "loss": 0.0386, "step": 151940 }, { "epoch": 0.98, "learning_rate": 0.00015289182054641561, "loss": 0.042, "step": 151950 }, { "epoch": 0.98, "learning_rate": 0.0001528821391920587, "loss": 0.0353, "step": 151960 }, { "epoch": 0.98, "learning_rate": 0.00015287245783770177, "loss": 0.0349, "step": 151970 }, { "epoch": 0.98, "learning_rate": 0.00015286277648334483, "loss": 0.0355, "step": 151980 }, { "epoch": 0.98, "learning_rate": 0.0001528530951289879, "loss": 0.0446, "step": 151990 }, { "epoch": 0.98, "learning_rate": 0.00015284341377463096, "loss": 0.0456, "step": 152000 }, { "epoch": 0.98, "eval_cer": 0.9199484803976952, "eval_loss": 0.02544480562210083, "eval_runtime": 119.9384, "eval_samples_per_second": 16.675, "eval_steps_per_second": 4.169, "step": 152000 }, { "epoch": 0.98, "learning_rate": 0.000152833732420274, "loss": 0.0438, "step": 152010 }, { "epoch": 0.98, "learning_rate": 0.0001528240510659171, "loss": 0.0327, "step": 152020 }, { "epoch": 0.98, "learning_rate": 0.00015281436971156017, "loss": 0.0362, "step": 152030 }, { "epoch": 0.98, "learning_rate": 0.00015280468835720325, "loss": 0.0365, "step": 152040 }, { "epoch": 0.98, "learning_rate": 0.0001527950070028463, "loss": 0.0399, "step": 152050 }, { "epoch": 0.98, "learning_rate": 0.00015278532564848938, "loss": 0.0367, "step": 152060 }, { "epoch": 0.98, "learning_rate": 0.00015277564429413244, "loss": 0.0398, "step": 152070 }, { "epoch": 0.98, "learning_rate": 0.0001527659629397755, "loss": 0.0375, "step": 152080 }, { "epoch": 0.98, "learning_rate": 0.00015275628158541857, "loss": 0.047, "step": 152090 }, { "epoch": 0.98, "learning_rate": 0.00015274660023106165, "loss": 0.0465, "step": 152100 }, { "epoch": 0.98, "learning_rate": 0.00015273691887670473, "loss": 0.0347, "step": 152110 }, { "epoch": 0.98, "learning_rate": 0.00015272723752234778, "loss": 0.0374, "step": 152120 }, { "epoch": 0.98, "learning_rate": 0.00015271755616799086, "loss": 0.0392, "step": 152130 }, { "epoch": 0.98, "learning_rate": 0.00015270787481363391, "loss": 0.0377, "step": 152140 }, { "epoch": 0.98, "learning_rate": 0.00015269819345927697, "loss": 0.0395, "step": 152150 }, { "epoch": 0.98, "learning_rate": 0.00015268851210492005, "loss": 0.0397, "step": 152160 }, { "epoch": 0.98, "learning_rate": 0.00015267883075056313, "loss": 0.0378, "step": 152170 }, { "epoch": 0.98, "learning_rate": 0.00015266914939620618, "loss": 0.0427, "step": 152180 }, { "epoch": 0.98, "learning_rate": 0.00015265946804184926, "loss": 0.042, "step": 152190 }, { "epoch": 0.98, "learning_rate": 0.00015264978668749234, "loss": 0.0388, "step": 152200 }, { "epoch": 0.98, "learning_rate": 0.00015264010533313536, "loss": 0.0386, "step": 152210 }, { "epoch": 0.98, "learning_rate": 0.00015263042397877844, "loss": 0.0355, "step": 152220 }, { "epoch": 0.98, "learning_rate": 0.00015262074262442152, "loss": 0.0366, "step": 152230 }, { "epoch": 0.98, "learning_rate": 0.0001526110612700646, "loss": 0.036, "step": 152240 }, { "epoch": 0.98, "learning_rate": 0.00015260137991570766, "loss": 0.0445, "step": 152250 }, { "epoch": 0.98, "learning_rate": 0.00015259169856135074, "loss": 0.043, "step": 152260 }, { "epoch": 0.98, "learning_rate": 0.00015258201720699382, "loss": 0.037, "step": 152270 }, { "epoch": 0.98, "learning_rate": 0.00015257233585263684, "loss": 0.0329, "step": 152280 }, { "epoch": 0.98, "learning_rate": 0.00015256265449827992, "loss": 0.0393, "step": 152290 }, { "epoch": 0.98, "learning_rate": 0.000152552973143923, "loss": 0.0466, "step": 152300 }, { "epoch": 0.98, "learning_rate": 0.00015254329178956608, "loss": 0.0437, "step": 152310 }, { "epoch": 0.98, "learning_rate": 0.00015253361043520913, "loss": 0.0381, "step": 152320 }, { "epoch": 0.98, "learning_rate": 0.0001525239290808522, "loss": 0.0343, "step": 152330 }, { "epoch": 0.98, "learning_rate": 0.0001525142477264953, "loss": 0.0322, "step": 152340 }, { "epoch": 0.98, "learning_rate": 0.00015250456637213832, "loss": 0.0397, "step": 152350 }, { "epoch": 0.98, "learning_rate": 0.0001524948850177814, "loss": 0.0374, "step": 152360 }, { "epoch": 0.98, "learning_rate": 0.00015248520366342448, "loss": 0.0413, "step": 152370 }, { "epoch": 0.98, "learning_rate": 0.00015247552230906753, "loss": 0.0384, "step": 152380 }, { "epoch": 0.98, "learning_rate": 0.0001524658409547106, "loss": 0.0362, "step": 152390 }, { "epoch": 0.98, "learning_rate": 0.0001524561596003537, "loss": 0.0385, "step": 152400 }, { "epoch": 0.98, "learning_rate": 0.00015244647824599677, "loss": 0.0374, "step": 152410 }, { "epoch": 0.98, "learning_rate": 0.0001524367968916398, "loss": 0.035, "step": 152420 }, { "epoch": 0.98, "learning_rate": 0.00015242711553728288, "loss": 0.0402, "step": 152430 }, { "epoch": 0.98, "learning_rate": 0.00015241743418292596, "loss": 0.0361, "step": 152440 }, { "epoch": 0.98, "learning_rate": 0.000152407752828569, "loss": 0.0423, "step": 152450 }, { "epoch": 0.98, "learning_rate": 0.0001523980714742121, "loss": 0.0298, "step": 152460 }, { "epoch": 0.98, "learning_rate": 0.00015238839011985517, "loss": 0.0347, "step": 152470 }, { "epoch": 0.98, "learning_rate": 0.00015237870876549825, "loss": 0.0326, "step": 152480 }, { "epoch": 0.98, "learning_rate": 0.00015236902741114127, "loss": 0.0358, "step": 152490 }, { "epoch": 0.98, "learning_rate": 0.00015235934605678435, "loss": 0.0341, "step": 152500 }, { "epoch": 0.98, "learning_rate": 0.00015234966470242743, "loss": 0.0368, "step": 152510 }, { "epoch": 0.98, "learning_rate": 0.00015233998334807049, "loss": 0.044, "step": 152520 }, { "epoch": 0.98, "learning_rate": 0.00015233030199371356, "loss": 0.0375, "step": 152530 }, { "epoch": 0.98, "learning_rate": 0.00015232062063935664, "loss": 0.0377, "step": 152540 }, { "epoch": 0.98, "learning_rate": 0.00015231093928499972, "loss": 0.0351, "step": 152550 }, { "epoch": 0.98, "learning_rate": 0.00015230125793064275, "loss": 0.0376, "step": 152560 }, { "epoch": 0.98, "learning_rate": 0.00015229157657628583, "loss": 0.042, "step": 152570 }, { "epoch": 0.98, "learning_rate": 0.00015228189522192888, "loss": 0.0349, "step": 152580 }, { "epoch": 0.98, "learning_rate": 0.00015227221386757196, "loss": 0.0361, "step": 152590 }, { "epoch": 0.98, "learning_rate": 0.00015226253251321504, "loss": 0.036, "step": 152600 }, { "epoch": 0.98, "learning_rate": 0.00015225285115885812, "loss": 0.0379, "step": 152610 }, { "epoch": 0.99, "learning_rate": 0.00015224316980450117, "loss": 0.0378, "step": 152620 }, { "epoch": 0.99, "learning_rate": 0.00015223348845014423, "loss": 0.0365, "step": 152630 }, { "epoch": 0.99, "learning_rate": 0.0001522238070957873, "loss": 0.0394, "step": 152640 }, { "epoch": 0.99, "learning_rate": 0.00015221412574143036, "loss": 0.0395, "step": 152650 }, { "epoch": 0.99, "learning_rate": 0.00015220444438707344, "loss": 0.0418, "step": 152660 }, { "epoch": 0.99, "learning_rate": 0.00015219476303271652, "loss": 0.0337, "step": 152670 }, { "epoch": 0.99, "learning_rate": 0.0001521850816783596, "loss": 0.0369, "step": 152680 }, { "epoch": 0.99, "learning_rate": 0.00015217540032400265, "loss": 0.0408, "step": 152690 }, { "epoch": 0.99, "learning_rate": 0.0001521657189696457, "loss": 0.0408, "step": 152700 }, { "epoch": 0.99, "learning_rate": 0.00015215603761528878, "loss": 0.0344, "step": 152710 }, { "epoch": 0.99, "learning_rate": 0.00015214635626093184, "loss": 0.0346, "step": 152720 }, { "epoch": 0.99, "learning_rate": 0.00015213667490657492, "loss": 0.0329, "step": 152730 }, { "epoch": 0.99, "learning_rate": 0.000152126993552218, "loss": 0.0378, "step": 152740 }, { "epoch": 0.99, "learning_rate": 0.00015211731219786108, "loss": 0.0363, "step": 152750 }, { "epoch": 0.99, "learning_rate": 0.00015210763084350413, "loss": 0.0375, "step": 152760 }, { "epoch": 0.99, "learning_rate": 0.00015209794948914718, "loss": 0.044, "step": 152770 }, { "epoch": 0.99, "learning_rate": 0.00015208826813479023, "loss": 0.0331, "step": 152780 }, { "epoch": 0.99, "learning_rate": 0.00015207858678043331, "loss": 0.0323, "step": 152790 }, { "epoch": 0.99, "learning_rate": 0.0001520689054260764, "loss": 0.032, "step": 152800 }, { "epoch": 0.99, "learning_rate": 0.00015205922407171947, "loss": 0.0359, "step": 152810 }, { "epoch": 0.99, "learning_rate": 0.00015204954271736253, "loss": 0.0333, "step": 152820 }, { "epoch": 0.99, "learning_rate": 0.0001520398613630056, "loss": 0.0323, "step": 152830 }, { "epoch": 0.99, "learning_rate": 0.00015203018000864866, "loss": 0.0334, "step": 152840 }, { "epoch": 0.99, "learning_rate": 0.0001520204986542917, "loss": 0.0327, "step": 152850 }, { "epoch": 0.99, "learning_rate": 0.0001520108172999348, "loss": 0.0384, "step": 152860 }, { "epoch": 0.99, "learning_rate": 0.00015200113594557787, "loss": 0.035, "step": 152870 }, { "epoch": 0.99, "learning_rate": 0.00015199145459122095, "loss": 0.0447, "step": 152880 }, { "epoch": 0.99, "learning_rate": 0.000151981773236864, "loss": 0.0348, "step": 152890 }, { "epoch": 0.99, "learning_rate": 0.00015197209188250708, "loss": 0.0357, "step": 152900 }, { "epoch": 0.99, "learning_rate": 0.00015196241052815014, "loss": 0.0307, "step": 152910 }, { "epoch": 0.99, "learning_rate": 0.0001519527291737932, "loss": 0.0346, "step": 152920 }, { "epoch": 0.99, "learning_rate": 0.00015194304781943627, "loss": 0.0355, "step": 152930 }, { "epoch": 0.99, "learning_rate": 0.00015193336646507935, "loss": 0.0384, "step": 152940 }, { "epoch": 0.99, "learning_rate": 0.00015192368511072243, "loss": 0.0392, "step": 152950 }, { "epoch": 0.99, "learning_rate": 0.00015191400375636548, "loss": 0.0386, "step": 152960 }, { "epoch": 0.99, "learning_rate": 0.00015190432240200856, "loss": 0.0352, "step": 152970 }, { "epoch": 0.99, "learning_rate": 0.00015189464104765159, "loss": 0.0438, "step": 152980 }, { "epoch": 0.99, "learning_rate": 0.00015188495969329467, "loss": 0.0362, "step": 152990 }, { "epoch": 0.99, "learning_rate": 0.00015187527833893775, "loss": 0.0355, "step": 153000 }, { "epoch": 0.99, "eval_cer": 0.9198879222686702, "eval_loss": 0.02557929791510105, "eval_runtime": 119.8042, "eval_samples_per_second": 16.694, "eval_steps_per_second": 4.173, "step": 153000 }, { "epoch": 0.99, "learning_rate": 0.00015186559698458083, "loss": 0.0425, "step": 153010 }, { "epoch": 0.99, "learning_rate": 0.00015185591563022388, "loss": 0.0391, "step": 153020 }, { "epoch": 0.99, "learning_rate": 0.00015184623427586696, "loss": 0.0404, "step": 153030 }, { "epoch": 0.99, "learning_rate": 0.00015183655292151004, "loss": 0.031, "step": 153040 }, { "epoch": 0.99, "learning_rate": 0.00015182687156715306, "loss": 0.0379, "step": 153050 }, { "epoch": 0.99, "learning_rate": 0.00015181719021279614, "loss": 0.0362, "step": 153060 }, { "epoch": 0.99, "learning_rate": 0.00015180750885843922, "loss": 0.0426, "step": 153070 }, { "epoch": 0.99, "learning_rate": 0.0001517978275040823, "loss": 0.0393, "step": 153080 }, { "epoch": 0.99, "learning_rate": 0.00015178814614972536, "loss": 0.0409, "step": 153090 }, { "epoch": 0.99, "learning_rate": 0.00015177846479536844, "loss": 0.0344, "step": 153100 }, { "epoch": 0.99, "learning_rate": 0.00015176878344101152, "loss": 0.0465, "step": 153110 }, { "epoch": 0.99, "learning_rate": 0.00015175910208665454, "loss": 0.0384, "step": 153120 }, { "epoch": 0.99, "learning_rate": 0.00015174942073229762, "loss": 0.0392, "step": 153130 }, { "epoch": 0.99, "learning_rate": 0.0001517397393779407, "loss": 0.0411, "step": 153140 }, { "epoch": 0.99, "learning_rate": 0.00015173005802358378, "loss": 0.0366, "step": 153150 }, { "epoch": 0.99, "learning_rate": 0.00015172037666922683, "loss": 0.0387, "step": 153160 }, { "epoch": 0.99, "learning_rate": 0.0001517106953148699, "loss": 0.0325, "step": 153170 }, { "epoch": 0.99, "learning_rate": 0.000151701013960513, "loss": 0.0402, "step": 153180 }, { "epoch": 0.99, "learning_rate": 0.00015169133260615602, "loss": 0.0407, "step": 153190 }, { "epoch": 0.99, "learning_rate": 0.0001516816512517991, "loss": 0.038, "step": 153200 }, { "epoch": 0.99, "learning_rate": 0.00015167196989744218, "loss": 0.0362, "step": 153210 }, { "epoch": 0.99, "learning_rate": 0.00015166228854308523, "loss": 0.037, "step": 153220 }, { "epoch": 0.99, "learning_rate": 0.0001516526071887283, "loss": 0.0366, "step": 153230 }, { "epoch": 0.99, "learning_rate": 0.0001516429258343714, "loss": 0.0345, "step": 153240 }, { "epoch": 0.99, "learning_rate": 0.00015163324448001447, "loss": 0.038, "step": 153250 }, { "epoch": 0.99, "learning_rate": 0.0001516235631256575, "loss": 0.0396, "step": 153260 }, { "epoch": 0.99, "learning_rate": 0.00015161388177130058, "loss": 0.0327, "step": 153270 }, { "epoch": 0.99, "learning_rate": 0.00015160420041694365, "loss": 0.0447, "step": 153280 }, { "epoch": 0.99, "learning_rate": 0.0001515945190625867, "loss": 0.0414, "step": 153290 }, { "epoch": 0.99, "learning_rate": 0.0001515848377082298, "loss": 0.0441, "step": 153300 }, { "epoch": 0.99, "learning_rate": 0.00015157515635387287, "loss": 0.0344, "step": 153310 }, { "epoch": 0.99, "learning_rate": 0.00015156547499951595, "loss": 0.0416, "step": 153320 }, { "epoch": 0.99, "learning_rate": 0.00015155579364515897, "loss": 0.0354, "step": 153330 }, { "epoch": 0.99, "learning_rate": 0.00015154611229080205, "loss": 0.0427, "step": 153340 }, { "epoch": 0.99, "learning_rate": 0.00015153643093644513, "loss": 0.0309, "step": 153350 }, { "epoch": 0.99, "learning_rate": 0.00015152674958208818, "loss": 0.041, "step": 153360 }, { "epoch": 0.99, "learning_rate": 0.00015151706822773126, "loss": 0.0345, "step": 153370 }, { "epoch": 0.99, "learning_rate": 0.00015150738687337434, "loss": 0.0355, "step": 153380 }, { "epoch": 0.99, "learning_rate": 0.0001514977055190174, "loss": 0.0341, "step": 153390 }, { "epoch": 0.99, "learning_rate": 0.00015148802416466045, "loss": 0.039, "step": 153400 }, { "epoch": 0.99, "learning_rate": 0.00015147834281030353, "loss": 0.047, "step": 153410 }, { "epoch": 0.99, "learning_rate": 0.00015146866145594658, "loss": 0.0374, "step": 153420 }, { "epoch": 0.99, "learning_rate": 0.00015145898010158966, "loss": 0.0427, "step": 153430 }, { "epoch": 0.99, "learning_rate": 0.00015144929874723274, "loss": 0.0364, "step": 153440 }, { "epoch": 0.99, "learning_rate": 0.00015143961739287582, "loss": 0.0384, "step": 153450 }, { "epoch": 0.99, "learning_rate": 0.00015142993603851887, "loss": 0.0386, "step": 153460 }, { "epoch": 0.99, "learning_rate": 0.00015142025468416193, "loss": 0.0394, "step": 153470 }, { "epoch": 0.99, "learning_rate": 0.000151410573329805, "loss": 0.0375, "step": 153480 }, { "epoch": 0.99, "learning_rate": 0.00015140089197544806, "loss": 0.0416, "step": 153490 }, { "epoch": 0.99, "learning_rate": 0.00015139121062109114, "loss": 0.0318, "step": 153500 }, { "epoch": 0.99, "learning_rate": 0.00015138152926673422, "loss": 0.0408, "step": 153510 }, { "epoch": 0.99, "learning_rate": 0.0001513718479123773, "loss": 0.0471, "step": 153520 }, { "epoch": 0.99, "learning_rate": 0.00015136216655802035, "loss": 0.0348, "step": 153530 }, { "epoch": 0.99, "learning_rate": 0.0001513524852036634, "loss": 0.0393, "step": 153540 }, { "epoch": 0.99, "learning_rate": 0.00015134280384930648, "loss": 0.0378, "step": 153550 }, { "epoch": 0.99, "learning_rate": 0.00015133312249494954, "loss": 0.0372, "step": 153560 }, { "epoch": 0.99, "learning_rate": 0.00015132344114059262, "loss": 0.0371, "step": 153570 }, { "epoch": 0.99, "learning_rate": 0.0001513137597862357, "loss": 0.0406, "step": 153580 }, { "epoch": 0.99, "learning_rate": 0.00015130407843187875, "loss": 0.0392, "step": 153590 }, { "epoch": 0.99, "learning_rate": 0.00015129439707752183, "loss": 0.0424, "step": 153600 }, { "epoch": 0.99, "learning_rate": 0.00015128471572316488, "loss": 0.0356, "step": 153610 }, { "epoch": 0.99, "learning_rate": 0.00015127503436880793, "loss": 0.0429, "step": 153620 }, { "epoch": 0.99, "learning_rate": 0.00015126535301445101, "loss": 0.0395, "step": 153630 }, { "epoch": 0.99, "learning_rate": 0.0001512556716600941, "loss": 0.042, "step": 153640 }, { "epoch": 0.99, "learning_rate": 0.00015124599030573717, "loss": 0.0423, "step": 153650 }, { "epoch": 0.99, "learning_rate": 0.00015123630895138023, "loss": 0.0376, "step": 153660 }, { "epoch": 0.99, "learning_rate": 0.0001512266275970233, "loss": 0.0343, "step": 153670 }, { "epoch": 0.99, "learning_rate": 0.00015121694624266636, "loss": 0.0331, "step": 153680 }, { "epoch": 0.99, "learning_rate": 0.0001512072648883094, "loss": 0.0353, "step": 153690 }, { "epoch": 0.99, "learning_rate": 0.0001511975835339525, "loss": 0.0396, "step": 153700 }, { "epoch": 0.99, "learning_rate": 0.00015118790217959557, "loss": 0.0331, "step": 153710 }, { "epoch": 0.99, "learning_rate": 0.00015117822082523865, "loss": 0.0341, "step": 153720 }, { "epoch": 0.99, "learning_rate": 0.0001511685394708817, "loss": 0.0409, "step": 153730 }, { "epoch": 0.99, "learning_rate": 0.00015115885811652478, "loss": 0.0355, "step": 153740 }, { "epoch": 0.99, "learning_rate": 0.00015114917676216784, "loss": 0.0358, "step": 153750 }, { "epoch": 0.99, "learning_rate": 0.0001511394954078109, "loss": 0.0354, "step": 153760 }, { "epoch": 0.99, "learning_rate": 0.00015112981405345397, "loss": 0.0332, "step": 153770 }, { "epoch": 0.99, "learning_rate": 0.00015112013269909705, "loss": 0.0489, "step": 153780 }, { "epoch": 0.99, "learning_rate": 0.0001511104513447401, "loss": 0.0394, "step": 153790 }, { "epoch": 0.99, "learning_rate": 0.00015110076999038318, "loss": 0.0351, "step": 153800 }, { "epoch": 0.99, "learning_rate": 0.00015109108863602626, "loss": 0.0384, "step": 153810 }, { "epoch": 0.99, "learning_rate": 0.00015108140728166929, "loss": 0.0358, "step": 153820 }, { "epoch": 0.99, "learning_rate": 0.00015107172592731237, "loss": 0.043, "step": 153830 }, { "epoch": 0.99, "learning_rate": 0.00015106204457295545, "loss": 0.04, "step": 153840 }, { "epoch": 0.99, "learning_rate": 0.00015105236321859853, "loss": 0.0359, "step": 153850 }, { "epoch": 0.99, "learning_rate": 0.00015104268186424158, "loss": 0.0402, "step": 153860 }, { "epoch": 0.99, "learning_rate": 0.00015103300050988466, "loss": 0.0373, "step": 153870 }, { "epoch": 0.99, "learning_rate": 0.00015102331915552774, "loss": 0.0422, "step": 153880 }, { "epoch": 0.99, "learning_rate": 0.00015101363780117076, "loss": 0.0354, "step": 153890 }, { "epoch": 0.99, "learning_rate": 0.00015100395644681384, "loss": 0.0377, "step": 153900 }, { "epoch": 0.99, "learning_rate": 0.00015099427509245692, "loss": 0.0322, "step": 153910 }, { "epoch": 0.99, "learning_rate": 0.0001509845937381, "loss": 0.0385, "step": 153920 }, { "epoch": 0.99, "learning_rate": 0.00015097491238374306, "loss": 0.0392, "step": 153930 }, { "epoch": 0.99, "learning_rate": 0.00015096523102938614, "loss": 0.0372, "step": 153940 }, { "epoch": 0.99, "learning_rate": 0.00015095554967502921, "loss": 0.0447, "step": 153950 }, { "epoch": 0.99, "learning_rate": 0.00015094586832067224, "loss": 0.0374, "step": 153960 }, { "epoch": 0.99, "learning_rate": 0.00015093618696631532, "loss": 0.039, "step": 153970 }, { "epoch": 0.99, "learning_rate": 0.0001509265056119584, "loss": 0.0325, "step": 153980 }, { "epoch": 0.99, "learning_rate": 0.00015091682425760145, "loss": 0.0432, "step": 153990 }, { "epoch": 0.99, "learning_rate": 0.00015090714290324453, "loss": 0.0396, "step": 154000 }, { "epoch": 0.99, "eval_cer": 0.9199123262908147, "eval_loss": 0.025343097746372223, "eval_runtime": 119.9926, "eval_samples_per_second": 16.668, "eval_steps_per_second": 4.167, "step": 154000 }, { "epoch": 0.99, "learning_rate": 0.0001508974615488876, "loss": 0.0374, "step": 154010 }, { "epoch": 0.99, "learning_rate": 0.0001508877801945307, "loss": 0.04, "step": 154020 }, { "epoch": 0.99, "learning_rate": 0.00015087809884017372, "loss": 0.0331, "step": 154030 }, { "epoch": 0.99, "learning_rate": 0.0001508684174858168, "loss": 0.038, "step": 154040 }, { "epoch": 0.99, "learning_rate": 0.00015085873613145988, "loss": 0.0362, "step": 154050 }, { "epoch": 0.99, "learning_rate": 0.00015084905477710293, "loss": 0.0374, "step": 154060 }, { "epoch": 0.99, "learning_rate": 0.000150839373422746, "loss": 0.0358, "step": 154070 }, { "epoch": 0.99, "learning_rate": 0.0001508296920683891, "loss": 0.0405, "step": 154080 }, { "epoch": 0.99, "learning_rate": 0.00015082001071403217, "loss": 0.0442, "step": 154090 }, { "epoch": 0.99, "learning_rate": 0.0001508103293596752, "loss": 0.0371, "step": 154100 }, { "epoch": 0.99, "learning_rate": 0.00015080064800531827, "loss": 0.036, "step": 154110 }, { "epoch": 0.99, "learning_rate": 0.00015079096665096135, "loss": 0.0368, "step": 154120 }, { "epoch": 0.99, "learning_rate": 0.0001507812852966044, "loss": 0.043, "step": 154130 }, { "epoch": 0.99, "learning_rate": 0.0001507716039422475, "loss": 0.0322, "step": 154140 }, { "epoch": 0.99, "learning_rate": 0.00015076192258789057, "loss": 0.0413, "step": 154150 }, { "epoch": 0.99, "learning_rate": 0.00015075224123353362, "loss": 0.033, "step": 154160 }, { "epoch": 1.0, "learning_rate": 0.00015074255987917667, "loss": 0.0385, "step": 154170 }, { "epoch": 1.0, "learning_rate": 0.00015073287852481975, "loss": 0.0334, "step": 154180 }, { "epoch": 1.0, "learning_rate": 0.0001507231971704628, "loss": 0.0389, "step": 154190 }, { "epoch": 1.0, "learning_rate": 0.00015071351581610588, "loss": 0.0385, "step": 154200 }, { "epoch": 1.0, "learning_rate": 0.00015070383446174896, "loss": 0.0392, "step": 154210 }, { "epoch": 1.0, "learning_rate": 0.00015069415310739204, "loss": 0.0396, "step": 154220 }, { "epoch": 1.0, "learning_rate": 0.0001506844717530351, "loss": 0.0373, "step": 154230 }, { "epoch": 1.0, "learning_rate": 0.00015067479039867815, "loss": 0.0387, "step": 154240 }, { "epoch": 1.0, "learning_rate": 0.00015066510904432123, "loss": 0.0381, "step": 154250 }, { "epoch": 1.0, "learning_rate": 0.00015065542768996428, "loss": 0.0338, "step": 154260 }, { "epoch": 1.0, "learning_rate": 0.00015064574633560736, "loss": 0.0395, "step": 154270 }, { "epoch": 1.0, "learning_rate": 0.00015063606498125044, "loss": 0.0399, "step": 154280 }, { "epoch": 1.0, "learning_rate": 0.00015062638362689352, "loss": 0.036, "step": 154290 }, { "epoch": 1.0, "learning_rate": 0.00015061670227253657, "loss": 0.0389, "step": 154300 }, { "epoch": 1.0, "learning_rate": 0.00015060702091817963, "loss": 0.0396, "step": 154310 }, { "epoch": 1.0, "learning_rate": 0.0001505973395638227, "loss": 0.0352, "step": 154320 }, { "epoch": 1.0, "learning_rate": 0.00015058765820946576, "loss": 0.0362, "step": 154330 }, { "epoch": 1.0, "learning_rate": 0.00015057797685510884, "loss": 0.0448, "step": 154340 }, { "epoch": 1.0, "learning_rate": 0.00015056829550075192, "loss": 0.0416, "step": 154350 }, { "epoch": 1.0, "learning_rate": 0.00015055861414639497, "loss": 0.0471, "step": 154360 }, { "epoch": 1.0, "learning_rate": 0.00015054893279203805, "loss": 0.0417, "step": 154370 }, { "epoch": 1.0, "learning_rate": 0.0001505392514376811, "loss": 0.0401, "step": 154380 }, { "epoch": 1.0, "learning_rate": 0.00015052957008332416, "loss": 0.0378, "step": 154390 }, { "epoch": 1.0, "learning_rate": 0.00015051988872896724, "loss": 0.036, "step": 154400 }, { "epoch": 1.0, "learning_rate": 0.00015051020737461032, "loss": 0.0337, "step": 154410 }, { "epoch": 1.0, "learning_rate": 0.0001505005260202534, "loss": 0.0341, "step": 154420 }, { "epoch": 1.0, "learning_rate": 0.00015049084466589645, "loss": 0.0363, "step": 154430 }, { "epoch": 1.0, "learning_rate": 0.00015048116331153953, "loss": 0.0313, "step": 154440 }, { "epoch": 1.0, "learning_rate": 0.00015047148195718258, "loss": 0.042, "step": 154450 }, { "epoch": 1.0, "learning_rate": 0.00015046180060282563, "loss": 0.0382, "step": 154460 }, { "epoch": 1.0, "learning_rate": 0.0001504521192484687, "loss": 0.0356, "step": 154470 }, { "epoch": 1.0, "learning_rate": 0.0001504424378941118, "loss": 0.0415, "step": 154480 }, { "epoch": 1.0, "learning_rate": 0.00015043275653975487, "loss": 0.0381, "step": 154490 }, { "epoch": 1.0, "learning_rate": 0.00015042307518539793, "loss": 0.0363, "step": 154500 }, { "epoch": 1.0, "learning_rate": 0.000150413393831041, "loss": 0.0416, "step": 154510 }, { "epoch": 1.0, "learning_rate": 0.00015040371247668406, "loss": 0.0367, "step": 154520 }, { "epoch": 1.0, "learning_rate": 0.0001503940311223271, "loss": 0.0426, "step": 154530 }, { "epoch": 1.0, "learning_rate": 0.0001503843497679702, "loss": 0.041, "step": 154540 }, { "epoch": 1.0, "learning_rate": 0.00015037466841361327, "loss": 0.0385, "step": 154550 }, { "epoch": 1.0, "learning_rate": 0.00015036498705925632, "loss": 0.0358, "step": 154560 }, { "epoch": 1.0, "learning_rate": 0.0001503553057048994, "loss": 0.0352, "step": 154570 }, { "epoch": 1.0, "learning_rate": 0.00015034562435054248, "loss": 0.0429, "step": 154580 }, { "epoch": 1.0, "learning_rate": 0.0001503359429961855, "loss": 0.0408, "step": 154590 }, { "epoch": 1.0, "learning_rate": 0.0001503262616418286, "loss": 0.042, "step": 154600 }, { "epoch": 1.0, "learning_rate": 0.00015031658028747167, "loss": 0.0409, "step": 154610 }, { "epoch": 1.0, "learning_rate": 0.00015030689893311475, "loss": 0.0341, "step": 154620 }, { "epoch": 1.0, "learning_rate": 0.0001502972175787578, "loss": 0.0332, "step": 154630 }, { "epoch": 1.0, "learning_rate": 0.00015028753622440088, "loss": 0.0356, "step": 154640 }, { "epoch": 1.0, "learning_rate": 0.00015027785487004396, "loss": 0.0365, "step": 154650 }, { "epoch": 1.0, "learning_rate": 0.00015026817351568699, "loss": 0.0426, "step": 154660 }, { "epoch": 1.0, "learning_rate": 0.00015025849216133007, "loss": 0.0361, "step": 154670 }, { "epoch": 1.0, "learning_rate": 0.00015024881080697315, "loss": 0.0363, "step": 154680 }, { "epoch": 1.0, "learning_rate": 0.00015023912945261623, "loss": 0.0419, "step": 154690 }, { "epoch": 1.0, "learning_rate": 0.00015022944809825928, "loss": 0.0399, "step": 154700 }, { "epoch": 1.0, "learning_rate": 0.00015021976674390236, "loss": 0.0393, "step": 154710 }, { "epoch": 1.0, "learning_rate": 0.00015021008538954544, "loss": 0.0381, "step": 154720 }, { "epoch": 1.0, "learning_rate": 0.00015020040403518846, "loss": 0.0335, "step": 154730 }, { "epoch": 1.0, "learning_rate": 0.00015019072268083154, "loss": 0.0371, "step": 154740 }, { "epoch": 1.0, "learning_rate": 0.00015018104132647462, "loss": 0.0339, "step": 154750 }, { "epoch": 1.0, "learning_rate": 0.00015017135997211768, "loss": 0.0367, "step": 154760 }, { "epoch": 1.0, "learning_rate": 0.00015016167861776075, "loss": 0.0408, "step": 154770 }, { "epoch": 1.0, "learning_rate": 0.00015015199726340383, "loss": 0.0344, "step": 154780 }, { "epoch": 1.0, "learning_rate": 0.00015014231590904691, "loss": 0.0433, "step": 154790 }, { "epoch": 1.0, "learning_rate": 0.00015013263455468994, "loss": 0.0355, "step": 154800 }, { "epoch": 1.0, "learning_rate": 0.00015012295320033302, "loss": 0.0365, "step": 154810 }, { "epoch": 1.0, "learning_rate": 0.0001501132718459761, "loss": 0.04, "step": 154820 }, { "epoch": 1.0, "learning_rate": 0.00015010359049161915, "loss": 0.0355, "step": 154830 }, { "epoch": 1.0, "learning_rate": 0.00015009390913726223, "loss": 0.0343, "step": 154840 }, { "epoch": 1.0, "learning_rate": 0.0001500842277829053, "loss": 0.0336, "step": 154850 }, { "epoch": 1.0, "learning_rate": 0.0001500745464285484, "loss": 0.0324, "step": 154860 }, { "epoch": 1.0, "learning_rate": 0.00015006486507419142, "loss": 0.0381, "step": 154870 }, { "epoch": 1.0, "learning_rate": 0.0001500551837198345, "loss": 0.0397, "step": 154880 }, { "epoch": 1.0, "learning_rate": 0.00015004550236547758, "loss": 0.0435, "step": 154890 }, { "epoch": 1.0, "learning_rate": 0.00015003582101112063, "loss": 0.0382, "step": 154900 }, { "epoch": 1.0, "learning_rate": 0.0001500261396567637, "loss": 0.0305, "step": 154910 }, { "epoch": 1.0, "learning_rate": 0.0001500164583024068, "loss": 0.0357, "step": 154920 }, { "epoch": 1.0, "learning_rate": 0.00015000677694804987, "loss": 0.0422, "step": 154930 }, { "epoch": 1.0, "learning_rate": 0.00014999709559369292, "loss": 0.0439, "step": 154940 }, { "epoch": 1.0, "learning_rate": 0.00014998741423933597, "loss": 0.0317, "step": 154950 }, { "epoch": 1.0, "learning_rate": 0.00014997773288497903, "loss": 0.0317, "step": 154960 }, { "epoch": 1.0, "learning_rate": 0.0001499680515306221, "loss": 0.0352, "step": 154970 }, { "epoch": 1.0, "learning_rate": 0.0001499583701762652, "loss": 0.0339, "step": 154980 }, { "epoch": 1.0, "learning_rate": 0.00014994868882190824, "loss": 0.0411, "step": 154990 }, { "epoch": 1.0, "learning_rate": 0.00014993900746755132, "loss": 0.0353, "step": 155000 }, { "epoch": 1.0, "eval_cer": 0.9199014800587504, "eval_loss": 0.025568395853042603, "eval_runtime": 120.4271, "eval_samples_per_second": 16.608, "eval_steps_per_second": 4.152, "step": 155000 }, { "epoch": 1.0, "learning_rate": 0.0001499293261131944, "loss": 0.0359, "step": 155010 }, { "epoch": 1.0, "learning_rate": 0.00014991964475883745, "loss": 0.0331, "step": 155020 }, { "epoch": 1.0, "learning_rate": 0.0001499099634044805, "loss": 0.0358, "step": 155030 }, { "epoch": 1.0, "learning_rate": 0.00014990028205012358, "loss": 0.0383, "step": 155040 }, { "epoch": 1.0, "learning_rate": 0.00014989060069576666, "loss": 0.0365, "step": 155050 }, { "epoch": 1.0, "learning_rate": 0.00014988091934140972, "loss": 0.0406, "step": 155060 }, { "epoch": 1.0, "learning_rate": 0.0001498712379870528, "loss": 0.0346, "step": 155070 }, { "epoch": 1.0, "learning_rate": 0.00014986155663269585, "loss": 0.0334, "step": 155080 }, { "epoch": 1.0, "learning_rate": 0.00014985187527833893, "loss": 0.0312, "step": 155090 }, { "epoch": 1.0, "learning_rate": 0.00014984219392398198, "loss": 0.032, "step": 155100 }, { "epoch": 1.0, "learning_rate": 0.00014983251256962506, "loss": 0.0362, "step": 155110 }, { "epoch": 1.0, "learning_rate": 0.00014982283121526814, "loss": 0.0304, "step": 155120 }, { "epoch": 1.0, "learning_rate": 0.0001498131498609112, "loss": 0.0371, "step": 155130 }, { "epoch": 1.0, "learning_rate": 0.00014980346850655427, "loss": 0.0348, "step": 155140 }, { "epoch": 1.0, "learning_rate": 0.00014979378715219733, "loss": 0.0327, "step": 155150 }, { "epoch": 1.0, "learning_rate": 0.00014978410579784038, "loss": 0.0399, "step": 155160 }, { "epoch": 1.0, "learning_rate": 0.00014977442444348346, "loss": 0.0378, "step": 155170 }, { "epoch": 1.0, "learning_rate": 0.00014976474308912654, "loss": 0.0295, "step": 155180 }, { "epoch": 1.0, "learning_rate": 0.00014975506173476962, "loss": 0.0385, "step": 155190 }, { "epoch": 1.0, "learning_rate": 0.00014974538038041267, "loss": 0.0422, "step": 155200 }, { "epoch": 1.0, "learning_rate": 0.00014973569902605575, "loss": 0.0397, "step": 155210 }, { "epoch": 1.0, "learning_rate": 0.0001497260176716988, "loss": 0.0359, "step": 155220 }, { "epoch": 1.0, "learning_rate": 0.00014971633631734186, "loss": 0.0306, "step": 155230 }, { "epoch": 1.0, "learning_rate": 0.00014970665496298494, "loss": 0.0316, "step": 155240 }, { "epoch": 1.0, "learning_rate": 0.00014969697360862802, "loss": 0.033, "step": 155250 }, { "epoch": 1.0, "learning_rate": 0.0001496872922542711, "loss": 0.0382, "step": 155260 }, { "epoch": 1.0, "learning_rate": 0.00014967761089991415, "loss": 0.037, "step": 155270 }, { "epoch": 1.0, "learning_rate": 0.0001496679295455572, "loss": 0.0362, "step": 155280 }, { "epoch": 1.0, "learning_rate": 0.00014965824819120028, "loss": 0.0328, "step": 155290 }, { "epoch": 1.0, "learning_rate": 0.00014964856683684333, "loss": 0.033, "step": 155300 }, { "epoch": 1.0, "learning_rate": 0.0001496388854824864, "loss": 0.0299, "step": 155310 }, { "epoch": 1.0, "learning_rate": 0.0001496292041281295, "loss": 0.0343, "step": 155320 }, { "epoch": 1.0, "learning_rate": 0.00014961952277377257, "loss": 0.0366, "step": 155330 }, { "epoch": 1.0, "learning_rate": 0.00014960984141941563, "loss": 0.0294, "step": 155340 }, { "epoch": 1.0, "learning_rate": 0.00014960016006505868, "loss": 0.0366, "step": 155350 }, { "epoch": 1.0, "learning_rate": 0.00014959047871070176, "loss": 0.0372, "step": 155360 }, { "epoch": 1.0, "learning_rate": 0.0001495807973563448, "loss": 0.0404, "step": 155370 }, { "epoch": 1.0, "learning_rate": 0.0001495711160019879, "loss": 0.0347, "step": 155380 }, { "epoch": 1.0, "learning_rate": 0.00014956143464763097, "loss": 0.03, "step": 155390 }, { "epoch": 1.0, "learning_rate": 0.00014955175329327402, "loss": 0.0377, "step": 155400 }, { "epoch": 1.0, "learning_rate": 0.0001495420719389171, "loss": 0.0361, "step": 155410 }, { "epoch": 1.0, "learning_rate": 0.00014953239058456016, "loss": 0.0376, "step": 155420 }, { "epoch": 1.0, "learning_rate": 0.00014952270923020324, "loss": 0.0357, "step": 155430 }, { "epoch": 1.0, "learning_rate": 0.0001495130278758463, "loss": 0.0308, "step": 155440 }, { "epoch": 1.0, "learning_rate": 0.00014950334652148937, "loss": 0.0361, "step": 155450 }, { "epoch": 1.0, "learning_rate": 0.00014949366516713245, "loss": 0.0324, "step": 155460 }, { "epoch": 1.0, "learning_rate": 0.0001494839838127755, "loss": 0.0311, "step": 155470 }, { "epoch": 1.0, "learning_rate": 0.00014947430245841855, "loss": 0.0321, "step": 155480 }, { "epoch": 1.0, "learning_rate": 0.00014946462110406163, "loss": 0.0379, "step": 155490 }, { "epoch": 1.0, "learning_rate": 0.0001494549397497047, "loss": 0.0357, "step": 155500 }, { "epoch": 1.0, "learning_rate": 0.00014944525839534777, "loss": 0.0372, "step": 155510 }, { "epoch": 1.0, "learning_rate": 0.00014943557704099084, "loss": 0.0326, "step": 155520 }, { "epoch": 1.0, "learning_rate": 0.00014942589568663392, "loss": 0.0331, "step": 155530 }, { "epoch": 1.0, "learning_rate": 0.00014941621433227698, "loss": 0.0372, "step": 155540 }, { "epoch": 1.0, "learning_rate": 0.00014940653297792003, "loss": 0.0385, "step": 155550 }, { "epoch": 1.0, "learning_rate": 0.0001493968516235631, "loss": 0.0402, "step": 155560 }, { "epoch": 1.0, "learning_rate": 0.0001493871702692062, "loss": 0.0312, "step": 155570 }, { "epoch": 1.0, "learning_rate": 0.00014937748891484924, "loss": 0.0371, "step": 155580 }, { "epoch": 1.0, "learning_rate": 0.00014936780756049232, "loss": 0.0378, "step": 155590 }, { "epoch": 1.0, "learning_rate": 0.00014935812620613537, "loss": 0.0329, "step": 155600 }, { "epoch": 1.0, "learning_rate": 0.00014934844485177845, "loss": 0.0319, "step": 155610 }, { "epoch": 1.0, "learning_rate": 0.0001493387634974215, "loss": 0.0376, "step": 155620 }, { "epoch": 1.0, "learning_rate": 0.0001493290821430646, "loss": 0.0347, "step": 155630 }, { "epoch": 1.0, "learning_rate": 0.00014931940078870767, "loss": 0.0371, "step": 155640 }, { "epoch": 1.0, "learning_rate": 0.00014930971943435072, "loss": 0.0413, "step": 155650 }, { "epoch": 1.0, "learning_rate": 0.0001493000380799938, "loss": 0.0333, "step": 155660 }, { "epoch": 1.0, "learning_rate": 0.00014929035672563685, "loss": 0.0375, "step": 155670 }, { "epoch": 1.0, "learning_rate": 0.00014928067537127993, "loss": 0.0377, "step": 155680 }, { "epoch": 1.0, "learning_rate": 0.00014927099401692298, "loss": 0.0347, "step": 155690 }, { "epoch": 1.0, "learning_rate": 0.00014926131266256606, "loss": 0.0315, "step": 155700 }, { "epoch": 1.0, "learning_rate": 0.00014925163130820914, "loss": 0.0374, "step": 155710 }, { "epoch": 1.01, "learning_rate": 0.0001492419499538522, "loss": 0.0337, "step": 155720 }, { "epoch": 1.01, "learning_rate": 0.00014923226859949528, "loss": 0.0357, "step": 155730 }, { "epoch": 1.01, "learning_rate": 0.00014922258724513833, "loss": 0.036, "step": 155740 }, { "epoch": 1.01, "learning_rate": 0.0001492129058907814, "loss": 0.042, "step": 155750 }, { "epoch": 1.01, "learning_rate": 0.00014920322453642446, "loss": 0.0397, "step": 155760 }, { "epoch": 1.01, "learning_rate": 0.00014919354318206754, "loss": 0.0328, "step": 155770 }, { "epoch": 1.01, "learning_rate": 0.00014918386182771062, "loss": 0.0395, "step": 155780 }, { "epoch": 1.01, "learning_rate": 0.00014917418047335367, "loss": 0.0388, "step": 155790 }, { "epoch": 1.01, "learning_rate": 0.00014916449911899673, "loss": 0.0373, "step": 155800 }, { "epoch": 1.01, "learning_rate": 0.0001491548177646398, "loss": 0.0382, "step": 155810 }, { "epoch": 1.01, "learning_rate": 0.00014914513641028289, "loss": 0.0438, "step": 155820 }, { "epoch": 1.01, "learning_rate": 0.00014913545505592594, "loss": 0.0337, "step": 155830 }, { "epoch": 1.01, "learning_rate": 0.00014912577370156902, "loss": 0.0339, "step": 155840 }, { "epoch": 1.01, "learning_rate": 0.0001491160923472121, "loss": 0.0367, "step": 155850 }, { "epoch": 1.01, "learning_rate": 0.00014910641099285515, "loss": 0.0343, "step": 155860 }, { "epoch": 1.01, "learning_rate": 0.0001490967296384982, "loss": 0.032, "step": 155870 }, { "epoch": 1.01, "learning_rate": 0.00014908704828414128, "loss": 0.0319, "step": 155880 }, { "epoch": 1.01, "learning_rate": 0.00014907736692978436, "loss": 0.0325, "step": 155890 }, { "epoch": 1.01, "learning_rate": 0.00014906768557542742, "loss": 0.0347, "step": 155900 }, { "epoch": 1.01, "learning_rate": 0.0001490580042210705, "loss": 0.0386, "step": 155910 }, { "epoch": 1.01, "learning_rate": 0.00014904832286671355, "loss": 0.0361, "step": 155920 }, { "epoch": 1.01, "learning_rate": 0.00014903864151235663, "loss": 0.0312, "step": 155930 }, { "epoch": 1.01, "learning_rate": 0.00014902896015799968, "loss": 0.0369, "step": 155940 }, { "epoch": 1.01, "learning_rate": 0.00014901927880364276, "loss": 0.0361, "step": 155950 }, { "epoch": 1.01, "learning_rate": 0.00014900959744928584, "loss": 0.035, "step": 155960 }, { "epoch": 1.01, "learning_rate": 0.0001489999160949289, "loss": 0.0373, "step": 155970 }, { "epoch": 1.01, "learning_rate": 0.00014899023474057197, "loss": 0.035, "step": 155980 }, { "epoch": 1.01, "learning_rate": 0.00014898055338621503, "loss": 0.0393, "step": 155990 }, { "epoch": 1.01, "learning_rate": 0.00014897087203185808, "loss": 0.036, "step": 156000 }, { "epoch": 1.01, "eval_cer": 0.9199502881030392, "eval_loss": 0.02528407983481884, "eval_runtime": 120.345, "eval_samples_per_second": 16.619, "eval_steps_per_second": 4.155, "step": 156000 }, { "epoch": 1.01, "learning_rate": 0.00014896119067750116, "loss": 0.033, "step": 156010 }, { "epoch": 1.01, "learning_rate": 0.00014895150932314424, "loss": 0.0362, "step": 156020 }, { "epoch": 1.01, "learning_rate": 0.00014894182796878732, "loss": 0.0361, "step": 156030 }, { "epoch": 1.01, "learning_rate": 0.00014893214661443037, "loss": 0.0355, "step": 156040 }, { "epoch": 1.01, "learning_rate": 0.00014892246526007345, "loss": 0.0323, "step": 156050 }, { "epoch": 1.01, "learning_rate": 0.0001489127839057165, "loss": 0.0364, "step": 156060 }, { "epoch": 1.01, "learning_rate": 0.00014890310255135956, "loss": 0.0345, "step": 156070 }, { "epoch": 1.01, "learning_rate": 0.00014889342119700264, "loss": 0.0359, "step": 156080 }, { "epoch": 1.01, "learning_rate": 0.00014888373984264572, "loss": 0.033, "step": 156090 }, { "epoch": 1.01, "learning_rate": 0.0001488740584882888, "loss": 0.0332, "step": 156100 }, { "epoch": 1.01, "learning_rate": 0.00014886437713393185, "loss": 0.035, "step": 156110 }, { "epoch": 1.01, "learning_rate": 0.0001488546957795749, "loss": 0.0328, "step": 156120 }, { "epoch": 1.01, "learning_rate": 0.00014884501442521798, "loss": 0.0366, "step": 156130 }, { "epoch": 1.01, "learning_rate": 0.00014883533307086103, "loss": 0.0341, "step": 156140 }, { "epoch": 1.01, "learning_rate": 0.0001488256517165041, "loss": 0.0368, "step": 156150 }, { "epoch": 1.01, "learning_rate": 0.0001488159703621472, "loss": 0.0365, "step": 156160 }, { "epoch": 1.01, "learning_rate": 0.00014880628900779025, "loss": 0.0314, "step": 156170 }, { "epoch": 1.01, "learning_rate": 0.00014879660765343333, "loss": 0.0368, "step": 156180 }, { "epoch": 1.01, "learning_rate": 0.00014878692629907638, "loss": 0.0358, "step": 156190 }, { "epoch": 1.01, "learning_rate": 0.00014877724494471946, "loss": 0.0384, "step": 156200 }, { "epoch": 1.01, "learning_rate": 0.0001487675635903625, "loss": 0.0436, "step": 156210 }, { "epoch": 1.01, "learning_rate": 0.0001487578822360056, "loss": 0.0323, "step": 156220 }, { "epoch": 1.01, "learning_rate": 0.00014874820088164867, "loss": 0.0325, "step": 156230 }, { "epoch": 1.01, "learning_rate": 0.00014873851952729172, "loss": 0.0322, "step": 156240 }, { "epoch": 1.01, "learning_rate": 0.0001487288381729348, "loss": 0.0321, "step": 156250 }, { "epoch": 1.01, "learning_rate": 0.00014871915681857785, "loss": 0.0336, "step": 156260 }, { "epoch": 1.01, "learning_rate": 0.00014870947546422093, "loss": 0.0343, "step": 156270 }, { "epoch": 1.01, "learning_rate": 0.000148699794109864, "loss": 0.0333, "step": 156280 }, { "epoch": 1.01, "learning_rate": 0.00014869011275550707, "loss": 0.035, "step": 156290 }, { "epoch": 1.01, "learning_rate": 0.00014868043140115015, "loss": 0.0302, "step": 156300 }, { "epoch": 1.01, "learning_rate": 0.0001486707500467932, "loss": 0.0346, "step": 156310 }, { "epoch": 1.01, "learning_rate": 0.00014866106869243625, "loss": 0.0356, "step": 156320 }, { "epoch": 1.01, "learning_rate": 0.00014865138733807933, "loss": 0.035, "step": 156330 }, { "epoch": 1.01, "learning_rate": 0.0001486417059837224, "loss": 0.0325, "step": 156340 }, { "epoch": 1.01, "learning_rate": 0.00014863202462936546, "loss": 0.0368, "step": 156350 }, { "epoch": 1.01, "learning_rate": 0.00014862234327500854, "loss": 0.0388, "step": 156360 }, { "epoch": 1.01, "learning_rate": 0.0001486126619206516, "loss": 0.0395, "step": 156370 }, { "epoch": 1.01, "learning_rate": 0.00014860298056629468, "loss": 0.0352, "step": 156380 }, { "epoch": 1.01, "learning_rate": 0.00014859329921193773, "loss": 0.0396, "step": 156390 }, { "epoch": 1.01, "learning_rate": 0.0001485836178575808, "loss": 0.0346, "step": 156400 }, { "epoch": 1.01, "learning_rate": 0.0001485739365032239, "loss": 0.0322, "step": 156410 }, { "epoch": 1.01, "learning_rate": 0.00014856425514886694, "loss": 0.0353, "step": 156420 }, { "epoch": 1.01, "learning_rate": 0.00014855457379451002, "loss": 0.0328, "step": 156430 }, { "epoch": 1.01, "learning_rate": 0.00014854489244015307, "loss": 0.0312, "step": 156440 }, { "epoch": 1.01, "learning_rate": 0.00014853521108579615, "loss": 0.0401, "step": 156450 }, { "epoch": 1.01, "learning_rate": 0.0001485255297314392, "loss": 0.0396, "step": 156460 }, { "epoch": 1.01, "learning_rate": 0.0001485158483770823, "loss": 0.0359, "step": 156470 }, { "epoch": 1.01, "learning_rate": 0.00014850616702272537, "loss": 0.0315, "step": 156480 }, { "epoch": 1.01, "learning_rate": 0.00014849648566836842, "loss": 0.036, "step": 156490 }, { "epoch": 1.01, "learning_rate": 0.0001484868043140115, "loss": 0.0372, "step": 156500 }, { "epoch": 1.01, "learning_rate": 0.00014847712295965455, "loss": 0.0349, "step": 156510 }, { "epoch": 1.01, "learning_rate": 0.00014846744160529763, "loss": 0.0319, "step": 156520 }, { "epoch": 1.01, "learning_rate": 0.00014845776025094068, "loss": 0.0339, "step": 156530 }, { "epoch": 1.01, "learning_rate": 0.00014844807889658376, "loss": 0.0304, "step": 156540 }, { "epoch": 1.01, "learning_rate": 0.00014843839754222684, "loss": 0.0333, "step": 156550 }, { "epoch": 1.01, "learning_rate": 0.0001484287161878699, "loss": 0.0395, "step": 156560 }, { "epoch": 1.01, "learning_rate": 0.00014841903483351295, "loss": 0.0306, "step": 156570 }, { "epoch": 1.01, "learning_rate": 0.00014840935347915603, "loss": 0.0392, "step": 156580 }, { "epoch": 1.01, "learning_rate": 0.0001483996721247991, "loss": 0.0362, "step": 156590 }, { "epoch": 1.01, "learning_rate": 0.00014838999077044216, "loss": 0.0354, "step": 156600 }, { "epoch": 1.01, "learning_rate": 0.00014838030941608524, "loss": 0.0394, "step": 156610 }, { "epoch": 1.01, "learning_rate": 0.00014837062806172832, "loss": 0.0384, "step": 156620 }, { "epoch": 1.01, "learning_rate": 0.00014836094670737137, "loss": 0.0371, "step": 156630 }, { "epoch": 1.01, "learning_rate": 0.00014835126535301443, "loss": 0.0361, "step": 156640 }, { "epoch": 1.01, "learning_rate": 0.0001483415839986575, "loss": 0.038, "step": 156650 }, { "epoch": 1.01, "learning_rate": 0.00014833190264430056, "loss": 0.0401, "step": 156660 }, { "epoch": 1.01, "learning_rate": 0.00014832222128994364, "loss": 0.0358, "step": 156670 }, { "epoch": 1.01, "learning_rate": 0.00014831253993558672, "loss": 0.0357, "step": 156680 }, { "epoch": 1.01, "learning_rate": 0.00014830285858122977, "loss": 0.0317, "step": 156690 }, { "epoch": 1.01, "learning_rate": 0.00014829317722687285, "loss": 0.0383, "step": 156700 }, { "epoch": 1.01, "learning_rate": 0.0001482834958725159, "loss": 0.0296, "step": 156710 }, { "epoch": 1.01, "learning_rate": 0.00014827381451815898, "loss": 0.0369, "step": 156720 }, { "epoch": 1.01, "learning_rate": 0.00014826413316380204, "loss": 0.041, "step": 156730 }, { "epoch": 1.01, "learning_rate": 0.00014825445180944512, "loss": 0.0367, "step": 156740 }, { "epoch": 1.01, "learning_rate": 0.0001482447704550882, "loss": 0.0366, "step": 156750 }, { "epoch": 1.01, "learning_rate": 0.00014823508910073125, "loss": 0.0356, "step": 156760 }, { "epoch": 1.01, "learning_rate": 0.0001482254077463743, "loss": 0.0386, "step": 156770 }, { "epoch": 1.01, "learning_rate": 0.00014821572639201738, "loss": 0.0351, "step": 156780 }, { "epoch": 1.01, "learning_rate": 0.00014820604503766046, "loss": 0.0379, "step": 156790 }, { "epoch": 1.01, "learning_rate": 0.0001481963636833035, "loss": 0.0347, "step": 156800 }, { "epoch": 1.01, "learning_rate": 0.0001481866823289466, "loss": 0.036, "step": 156810 }, { "epoch": 1.01, "learning_rate": 0.00014817700097458967, "loss": 0.0326, "step": 156820 }, { "epoch": 1.01, "learning_rate": 0.00014816731962023273, "loss": 0.0337, "step": 156830 }, { "epoch": 1.01, "learning_rate": 0.00014815763826587578, "loss": 0.039, "step": 156840 }, { "epoch": 1.01, "learning_rate": 0.00014814795691151886, "loss": 0.0376, "step": 156850 }, { "epoch": 1.01, "learning_rate": 0.00014813827555716194, "loss": 0.0338, "step": 156860 }, { "epoch": 1.01, "learning_rate": 0.000148128594202805, "loss": 0.0343, "step": 156870 }, { "epoch": 1.01, "learning_rate": 0.00014811891284844807, "loss": 0.0305, "step": 156880 }, { "epoch": 1.01, "learning_rate": 0.00014810923149409112, "loss": 0.0355, "step": 156890 }, { "epoch": 1.01, "learning_rate": 0.0001480995501397342, "loss": 0.0377, "step": 156900 }, { "epoch": 1.01, "learning_rate": 0.00014808986878537726, "loss": 0.0286, "step": 156910 }, { "epoch": 1.01, "learning_rate": 0.00014808018743102034, "loss": 0.042, "step": 156920 }, { "epoch": 1.01, "learning_rate": 0.00014807050607666341, "loss": 0.0347, "step": 156930 }, { "epoch": 1.01, "learning_rate": 0.00014806082472230647, "loss": 0.0358, "step": 156940 }, { "epoch": 1.01, "learning_rate": 0.00014805114336794955, "loss": 0.0417, "step": 156950 }, { "epoch": 1.01, "learning_rate": 0.0001480414620135926, "loss": 0.0336, "step": 156960 }, { "epoch": 1.01, "learning_rate": 0.00014803178065923568, "loss": 0.0333, "step": 156970 }, { "epoch": 1.01, "learning_rate": 0.00014802209930487873, "loss": 0.032, "step": 156980 }, { "epoch": 1.01, "learning_rate": 0.0001480124179505218, "loss": 0.0318, "step": 156990 }, { "epoch": 1.01, "learning_rate": 0.0001480027365961649, "loss": 0.0345, "step": 157000 }, { "epoch": 1.01, "eval_cer": 0.9199014800587504, "eval_loss": 0.025441249832510948, "eval_runtime": 120.9546, "eval_samples_per_second": 16.535, "eval_steps_per_second": 4.134, "step": 157000 }, { "epoch": 1.01, "learning_rate": 0.00014799305524180794, "loss": 0.0367, "step": 157010 }, { "epoch": 1.01, "learning_rate": 0.00014798337388745102, "loss": 0.0335, "step": 157020 }, { "epoch": 1.01, "learning_rate": 0.00014797369253309408, "loss": 0.0405, "step": 157030 }, { "epoch": 1.01, "learning_rate": 0.00014796401117873716, "loss": 0.0323, "step": 157040 }, { "epoch": 1.01, "learning_rate": 0.0001479543298243802, "loss": 0.0383, "step": 157050 }, { "epoch": 1.01, "learning_rate": 0.0001479446484700233, "loss": 0.0342, "step": 157060 }, { "epoch": 1.01, "learning_rate": 0.00014793496711566637, "loss": 0.0357, "step": 157070 }, { "epoch": 1.01, "learning_rate": 0.00014792528576130942, "loss": 0.0357, "step": 157080 }, { "epoch": 1.01, "learning_rate": 0.00014791560440695247, "loss": 0.0307, "step": 157090 }, { "epoch": 1.01, "learning_rate": 0.00014790592305259555, "loss": 0.0318, "step": 157100 }, { "epoch": 1.01, "learning_rate": 0.00014789624169823863, "loss": 0.031, "step": 157110 }, { "epoch": 1.01, "learning_rate": 0.0001478865603438817, "loss": 0.0341, "step": 157120 }, { "epoch": 1.01, "learning_rate": 0.00014787687898952477, "loss": 0.0392, "step": 157130 }, { "epoch": 1.01, "learning_rate": 0.00014786719763516785, "loss": 0.0325, "step": 157140 }, { "epoch": 1.01, "learning_rate": 0.0001478575162808109, "loss": 0.0384, "step": 157150 }, { "epoch": 1.01, "learning_rate": 0.00014784783492645395, "loss": 0.0354, "step": 157160 }, { "epoch": 1.01, "learning_rate": 0.00014783815357209703, "loss": 0.0405, "step": 157170 }, { "epoch": 1.01, "learning_rate": 0.0001478284722177401, "loss": 0.0436, "step": 157180 }, { "epoch": 1.01, "learning_rate": 0.00014781879086338316, "loss": 0.0335, "step": 157190 }, { "epoch": 1.01, "learning_rate": 0.00014780910950902624, "loss": 0.0316, "step": 157200 }, { "epoch": 1.01, "learning_rate": 0.0001477994281546693, "loss": 0.037, "step": 157210 }, { "epoch": 1.01, "learning_rate": 0.00014778974680031238, "loss": 0.0349, "step": 157220 }, { "epoch": 1.01, "learning_rate": 0.00014778006544595543, "loss": 0.0392, "step": 157230 }, { "epoch": 1.01, "learning_rate": 0.0001477703840915985, "loss": 0.0352, "step": 157240 }, { "epoch": 1.01, "learning_rate": 0.0001477607027372416, "loss": 0.0312, "step": 157250 }, { "epoch": 1.01, "learning_rate": 0.00014775102138288464, "loss": 0.0348, "step": 157260 }, { "epoch": 1.02, "learning_rate": 0.00014774134002852772, "loss": 0.0364, "step": 157270 }, { "epoch": 1.02, "learning_rate": 0.00014773165867417077, "loss": 0.0375, "step": 157280 }, { "epoch": 1.02, "learning_rate": 0.00014772197731981383, "loss": 0.0359, "step": 157290 }, { "epoch": 1.02, "learning_rate": 0.0001477122959654569, "loss": 0.0311, "step": 157300 }, { "epoch": 1.02, "learning_rate": 0.00014770261461109999, "loss": 0.0327, "step": 157310 }, { "epoch": 1.02, "learning_rate": 0.00014769293325674307, "loss": 0.0332, "step": 157320 }, { "epoch": 1.02, "learning_rate": 0.00014768325190238612, "loss": 0.0377, "step": 157330 }, { "epoch": 1.02, "learning_rate": 0.0001476735705480292, "loss": 0.0333, "step": 157340 }, { "epoch": 1.02, "learning_rate": 0.00014766388919367225, "loss": 0.0331, "step": 157350 }, { "epoch": 1.02, "learning_rate": 0.0001476542078393153, "loss": 0.036, "step": 157360 }, { "epoch": 1.02, "learning_rate": 0.00014764452648495838, "loss": 0.0385, "step": 157370 }, { "epoch": 1.02, "learning_rate": 0.00014763484513060146, "loss": 0.038, "step": 157380 }, { "epoch": 1.02, "learning_rate": 0.00014762516377624454, "loss": 0.0374, "step": 157390 }, { "epoch": 1.02, "learning_rate": 0.0001476154824218876, "loss": 0.0381, "step": 157400 }, { "epoch": 1.02, "learning_rate": 0.00014760580106753065, "loss": 0.0536, "step": 157410 }, { "epoch": 1.02, "learning_rate": 0.00014759611971317373, "loss": 0.0396, "step": 157420 }, { "epoch": 1.02, "learning_rate": 0.00014758643835881678, "loss": 0.0348, "step": 157430 }, { "epoch": 1.02, "learning_rate": 0.00014757675700445986, "loss": 0.0341, "step": 157440 }, { "epoch": 1.02, "learning_rate": 0.00014756707565010294, "loss": 0.0369, "step": 157450 }, { "epoch": 1.02, "learning_rate": 0.000147557394295746, "loss": 0.0337, "step": 157460 }, { "epoch": 1.02, "learning_rate": 0.00014754771294138907, "loss": 0.0334, "step": 157470 }, { "epoch": 1.02, "learning_rate": 0.00014753803158703213, "loss": 0.0362, "step": 157480 }, { "epoch": 1.02, "learning_rate": 0.0001475283502326752, "loss": 0.0397, "step": 157490 }, { "epoch": 1.02, "learning_rate": 0.00014751866887831826, "loss": 0.0341, "step": 157500 }, { "epoch": 1.02, "learning_rate": 0.00014750898752396134, "loss": 0.0409, "step": 157510 }, { "epoch": 1.02, "learning_rate": 0.00014749930616960442, "loss": 0.0348, "step": 157520 }, { "epoch": 1.02, "learning_rate": 0.00014748962481524747, "loss": 0.0352, "step": 157530 }, { "epoch": 1.02, "learning_rate": 0.00014747994346089055, "loss": 0.0374, "step": 157540 }, { "epoch": 1.02, "learning_rate": 0.0001474702621065336, "loss": 0.0375, "step": 157550 }, { "epoch": 1.02, "learning_rate": 0.00014746058075217668, "loss": 0.035, "step": 157560 }, { "epoch": 1.02, "learning_rate": 0.00014745089939781974, "loss": 0.0407, "step": 157570 }, { "epoch": 1.02, "learning_rate": 0.00014744121804346282, "loss": 0.0288, "step": 157580 }, { "epoch": 1.02, "learning_rate": 0.0001474315366891059, "loss": 0.034, "step": 157590 }, { "epoch": 1.02, "learning_rate": 0.00014742185533474895, "loss": 0.0344, "step": 157600 }, { "epoch": 1.02, "learning_rate": 0.000147412173980392, "loss": 0.0349, "step": 157610 }, { "epoch": 1.02, "learning_rate": 0.00014740249262603508, "loss": 0.0337, "step": 157620 }, { "epoch": 1.02, "learning_rate": 0.00014739281127167816, "loss": 0.0397, "step": 157630 }, { "epoch": 1.02, "learning_rate": 0.0001473831299173212, "loss": 0.0383, "step": 157640 }, { "epoch": 1.02, "learning_rate": 0.0001473734485629643, "loss": 0.0478, "step": 157650 }, { "epoch": 1.02, "learning_rate": 0.00014736376720860735, "loss": 0.0402, "step": 157660 }, { "epoch": 1.02, "learning_rate": 0.00014735408585425043, "loss": 0.0348, "step": 157670 }, { "epoch": 1.02, "learning_rate": 0.00014734440449989348, "loss": 0.036, "step": 157680 }, { "epoch": 1.02, "learning_rate": 0.00014733472314553656, "loss": 0.0552, "step": 157690 }, { "epoch": 1.02, "learning_rate": 0.00014732504179117964, "loss": 0.0389, "step": 157700 }, { "epoch": 1.02, "learning_rate": 0.0001473153604368227, "loss": 0.0348, "step": 157710 }, { "epoch": 1.02, "learning_rate": 0.00014730567908246577, "loss": 0.0346, "step": 157720 }, { "epoch": 1.02, "learning_rate": 0.00014729599772810882, "loss": 0.0395, "step": 157730 }, { "epoch": 1.02, "learning_rate": 0.0001472863163737519, "loss": 0.0343, "step": 157740 }, { "epoch": 1.02, "learning_rate": 0.00014727663501939495, "loss": 0.0356, "step": 157750 }, { "epoch": 1.02, "learning_rate": 0.00014726695366503803, "loss": 0.0357, "step": 157760 }, { "epoch": 1.02, "learning_rate": 0.00014725727231068111, "loss": 0.0362, "step": 157770 }, { "epoch": 1.02, "learning_rate": 0.00014724759095632417, "loss": 0.0354, "step": 157780 }, { "epoch": 1.02, "learning_rate": 0.00014723790960196725, "loss": 0.0387, "step": 157790 }, { "epoch": 1.02, "learning_rate": 0.0001472282282476103, "loss": 0.0343, "step": 157800 }, { "epoch": 1.02, "learning_rate": 0.00014721854689325338, "loss": 0.0421, "step": 157810 }, { "epoch": 1.02, "learning_rate": 0.00014720886553889643, "loss": 0.033, "step": 157820 }, { "epoch": 1.02, "learning_rate": 0.0001471991841845395, "loss": 0.0351, "step": 157830 }, { "epoch": 1.02, "learning_rate": 0.0001471895028301826, "loss": 0.0346, "step": 157840 }, { "epoch": 1.02, "learning_rate": 0.00014717982147582564, "loss": 0.0371, "step": 157850 }, { "epoch": 1.02, "learning_rate": 0.0001471701401214687, "loss": 0.0404, "step": 157860 }, { "epoch": 1.02, "learning_rate": 0.00014716045876711178, "loss": 0.0418, "step": 157870 }, { "epoch": 1.02, "learning_rate": 0.00014715077741275486, "loss": 0.0329, "step": 157880 }, { "epoch": 1.02, "learning_rate": 0.0001471410960583979, "loss": 0.0296, "step": 157890 }, { "epoch": 1.02, "learning_rate": 0.000147131414704041, "loss": 0.0375, "step": 157900 }, { "epoch": 1.02, "learning_rate": 0.00014712173334968407, "loss": 0.0395, "step": 157910 }, { "epoch": 1.02, "learning_rate": 0.00014711205199532712, "loss": 0.0379, "step": 157920 }, { "epoch": 1.02, "learning_rate": 0.00014710237064097017, "loss": 0.0392, "step": 157930 }, { "epoch": 1.02, "learning_rate": 0.00014709268928661325, "loss": 0.0361, "step": 157940 }, { "epoch": 1.02, "learning_rate": 0.00014708300793225633, "loss": 0.0304, "step": 157950 }, { "epoch": 1.02, "learning_rate": 0.0001470733265778994, "loss": 0.0374, "step": 157960 }, { "epoch": 1.02, "learning_rate": 0.00014706364522354247, "loss": 0.0299, "step": 157970 }, { "epoch": 1.02, "learning_rate": 0.00014705396386918552, "loss": 0.0366, "step": 157980 }, { "epoch": 1.02, "learning_rate": 0.0001470442825148286, "loss": 0.0374, "step": 157990 }, { "epoch": 1.02, "learning_rate": 0.00014703460116047165, "loss": 0.0321, "step": 158000 }, { "epoch": 1.02, "eval_cer": 0.9197731329793244, "eval_loss": 0.024751625955104828, "eval_runtime": 120.2028, "eval_samples_per_second": 16.639, "eval_steps_per_second": 4.16, "step": 158000 }, { "epoch": 1.02, "learning_rate": 0.00014702491980611473, "loss": 0.0361, "step": 158010 }, { "epoch": 1.02, "learning_rate": 0.0001470152384517578, "loss": 0.0356, "step": 158020 }, { "epoch": 1.02, "learning_rate": 0.00014700555709740086, "loss": 0.0295, "step": 158030 }, { "epoch": 1.02, "learning_rate": 0.00014699587574304394, "loss": 0.0346, "step": 158040 }, { "epoch": 1.02, "learning_rate": 0.000146986194388687, "loss": 0.0434, "step": 158050 }, { "epoch": 1.02, "learning_rate": 0.00014697651303433005, "loss": 0.0352, "step": 158060 }, { "epoch": 1.02, "learning_rate": 0.00014696683167997313, "loss": 0.0357, "step": 158070 }, { "epoch": 1.02, "learning_rate": 0.0001469571503256162, "loss": 0.0381, "step": 158080 }, { "epoch": 1.02, "learning_rate": 0.0001469474689712593, "loss": 0.034, "step": 158090 }, { "epoch": 1.02, "learning_rate": 0.00014693778761690234, "loss": 0.0342, "step": 158100 }, { "epoch": 1.02, "learning_rate": 0.00014692810626254542, "loss": 0.0356, "step": 158110 }, { "epoch": 1.02, "learning_rate": 0.00014691842490818847, "loss": 0.0314, "step": 158120 }, { "epoch": 1.02, "learning_rate": 0.00014690874355383153, "loss": 0.0339, "step": 158130 }, { "epoch": 1.02, "learning_rate": 0.0001468990621994746, "loss": 0.0346, "step": 158140 }, { "epoch": 1.02, "learning_rate": 0.00014688938084511769, "loss": 0.0309, "step": 158150 }, { "epoch": 1.02, "learning_rate": 0.00014687969949076077, "loss": 0.0368, "step": 158160 }, { "epoch": 1.02, "learning_rate": 0.00014687001813640382, "loss": 0.0425, "step": 158170 }, { "epoch": 1.02, "learning_rate": 0.00014686033678204687, "loss": 0.0353, "step": 158180 }, { "epoch": 1.02, "learning_rate": 0.00014685065542768995, "loss": 0.0363, "step": 158190 }, { "epoch": 1.02, "learning_rate": 0.000146840974073333, "loss": 0.0373, "step": 158200 }, { "epoch": 1.02, "learning_rate": 0.00014683129271897608, "loss": 0.0338, "step": 158210 }, { "epoch": 1.02, "learning_rate": 0.00014682161136461916, "loss": 0.0429, "step": 158220 }, { "epoch": 1.02, "learning_rate": 0.00014681193001026224, "loss": 0.037, "step": 158230 }, { "epoch": 1.02, "learning_rate": 0.0001468022486559053, "loss": 0.0435, "step": 158240 }, { "epoch": 1.02, "learning_rate": 0.00014679256730154835, "loss": 0.0355, "step": 158250 }, { "epoch": 1.02, "learning_rate": 0.00014678288594719143, "loss": 0.036, "step": 158260 }, { "epoch": 1.02, "learning_rate": 0.00014677320459283448, "loss": 0.0391, "step": 158270 }, { "epoch": 1.02, "learning_rate": 0.00014676352323847756, "loss": 0.0373, "step": 158280 }, { "epoch": 1.02, "learning_rate": 0.00014675384188412064, "loss": 0.0349, "step": 158290 }, { "epoch": 1.02, "learning_rate": 0.0001467441605297637, "loss": 0.0356, "step": 158300 }, { "epoch": 1.02, "learning_rate": 0.00014673447917540677, "loss": 0.0343, "step": 158310 }, { "epoch": 1.02, "learning_rate": 0.00014672479782104983, "loss": 0.036, "step": 158320 }, { "epoch": 1.02, "learning_rate": 0.0001467151164666929, "loss": 0.0341, "step": 158330 }, { "epoch": 1.02, "learning_rate": 0.00014670543511233596, "loss": 0.0362, "step": 158340 }, { "epoch": 1.02, "learning_rate": 0.00014669575375797904, "loss": 0.0381, "step": 158350 }, { "epoch": 1.02, "learning_rate": 0.00014668607240362212, "loss": 0.0357, "step": 158360 }, { "epoch": 1.02, "learning_rate": 0.00014667639104926517, "loss": 0.0327, "step": 158370 }, { "epoch": 1.02, "learning_rate": 0.00014666670969490822, "loss": 0.0295, "step": 158380 }, { "epoch": 1.02, "learning_rate": 0.0001466570283405513, "loss": 0.0291, "step": 158390 }, { "epoch": 1.02, "learning_rate": 0.00014664734698619438, "loss": 0.0299, "step": 158400 }, { "epoch": 1.02, "learning_rate": 0.00014663766563183744, "loss": 0.036, "step": 158410 }, { "epoch": 1.02, "learning_rate": 0.00014662798427748051, "loss": 0.0321, "step": 158420 }, { "epoch": 1.02, "learning_rate": 0.0001466183029231236, "loss": 0.034, "step": 158430 }, { "epoch": 1.02, "learning_rate": 0.00014660862156876665, "loss": 0.037, "step": 158440 }, { "epoch": 1.02, "learning_rate": 0.0001465989402144097, "loss": 0.0341, "step": 158450 }, { "epoch": 1.02, "learning_rate": 0.00014658925886005278, "loss": 0.0363, "step": 158460 }, { "epoch": 1.02, "learning_rate": 0.00014657957750569586, "loss": 0.0301, "step": 158470 }, { "epoch": 1.02, "learning_rate": 0.0001465698961513389, "loss": 0.0314, "step": 158480 }, { "epoch": 1.02, "learning_rate": 0.000146560214796982, "loss": 0.0385, "step": 158490 }, { "epoch": 1.02, "learning_rate": 0.00014655053344262504, "loss": 0.0327, "step": 158500 }, { "epoch": 1.02, "learning_rate": 0.00014654085208826812, "loss": 0.0315, "step": 158510 }, { "epoch": 1.02, "learning_rate": 0.00014653117073391118, "loss": 0.0366, "step": 158520 }, { "epoch": 1.02, "learning_rate": 0.00014652148937955426, "loss": 0.0393, "step": 158530 }, { "epoch": 1.02, "learning_rate": 0.00014651180802519734, "loss": 0.0343, "step": 158540 }, { "epoch": 1.02, "learning_rate": 0.0001465021266708404, "loss": 0.0405, "step": 158550 }, { "epoch": 1.02, "learning_rate": 0.00014649244531648347, "loss": 0.0339, "step": 158560 }, { "epoch": 1.02, "learning_rate": 0.00014648276396212652, "loss": 0.0384, "step": 158570 }, { "epoch": 1.02, "learning_rate": 0.0001464730826077696, "loss": 0.0349, "step": 158580 }, { "epoch": 1.02, "learning_rate": 0.00014646340125341265, "loss": 0.0347, "step": 158590 }, { "epoch": 1.02, "learning_rate": 0.00014645371989905573, "loss": 0.031, "step": 158600 }, { "epoch": 1.02, "learning_rate": 0.00014644403854469881, "loss": 0.0358, "step": 158610 }, { "epoch": 1.02, "learning_rate": 0.00014643435719034187, "loss": 0.0345, "step": 158620 }, { "epoch": 1.02, "learning_rate": 0.00014642467583598495, "loss": 0.0372, "step": 158630 }, { "epoch": 1.02, "learning_rate": 0.000146414994481628, "loss": 0.0318, "step": 158640 }, { "epoch": 1.02, "learning_rate": 0.00014640531312727108, "loss": 0.0342, "step": 158650 }, { "epoch": 1.02, "learning_rate": 0.00014639563177291413, "loss": 0.0302, "step": 158660 }, { "epoch": 1.02, "learning_rate": 0.0001463859504185572, "loss": 0.0361, "step": 158670 }, { "epoch": 1.02, "learning_rate": 0.0001463762690642003, "loss": 0.0402, "step": 158680 }, { "epoch": 1.02, "learning_rate": 0.00014636658770984334, "loss": 0.0353, "step": 158690 }, { "epoch": 1.02, "learning_rate": 0.0001463569063554864, "loss": 0.036, "step": 158700 }, { "epoch": 1.02, "learning_rate": 0.00014634722500112948, "loss": 0.0341, "step": 158710 }, { "epoch": 1.02, "learning_rate": 0.00014633754364677256, "loss": 0.0326, "step": 158720 }, { "epoch": 1.02, "learning_rate": 0.0001463278622924156, "loss": 0.0314, "step": 158730 }, { "epoch": 1.02, "learning_rate": 0.0001463181809380587, "loss": 0.0318, "step": 158740 }, { "epoch": 1.02, "learning_rate": 0.00014630849958370174, "loss": 0.0323, "step": 158750 }, { "epoch": 1.02, "learning_rate": 0.00014629881822934482, "loss": 0.0323, "step": 158760 }, { "epoch": 1.02, "learning_rate": 0.00014628913687498787, "loss": 0.0395, "step": 158770 }, { "epoch": 1.02, "learning_rate": 0.00014627945552063095, "loss": 0.0349, "step": 158780 }, { "epoch": 1.02, "learning_rate": 0.00014626977416627403, "loss": 0.0402, "step": 158790 }, { "epoch": 1.02, "learning_rate": 0.00014626009281191709, "loss": 0.0395, "step": 158800 }, { "epoch": 1.02, "learning_rate": 0.00014625041145756017, "loss": 0.0315, "step": 158810 }, { "epoch": 1.03, "learning_rate": 0.00014624073010320322, "loss": 0.0346, "step": 158820 }, { "epoch": 1.03, "learning_rate": 0.0001462310487488463, "loss": 0.0308, "step": 158830 }, { "epoch": 1.03, "learning_rate": 0.00014622136739448935, "loss": 0.0347, "step": 158840 }, { "epoch": 1.03, "learning_rate": 0.00014621168604013243, "loss": 0.0408, "step": 158850 }, { "epoch": 1.03, "learning_rate": 0.0001462020046857755, "loss": 0.0373, "step": 158860 }, { "epoch": 1.03, "learning_rate": 0.00014619232333141856, "loss": 0.0296, "step": 158870 }, { "epoch": 1.03, "learning_rate": 0.00014618264197706164, "loss": 0.0361, "step": 158880 }, { "epoch": 1.03, "learning_rate": 0.0001461729606227047, "loss": 0.0293, "step": 158890 }, { "epoch": 1.03, "learning_rate": 0.00014616327926834775, "loss": 0.0312, "step": 158900 }, { "epoch": 1.03, "learning_rate": 0.00014615359791399083, "loss": 0.032, "step": 158910 }, { "epoch": 1.03, "learning_rate": 0.0001461439165596339, "loss": 0.0288, "step": 158920 }, { "epoch": 1.03, "learning_rate": 0.000146134235205277, "loss": 0.0335, "step": 158930 }, { "epoch": 1.03, "learning_rate": 0.00014612455385092004, "loss": 0.0346, "step": 158940 }, { "epoch": 1.03, "learning_rate": 0.0001461148724965631, "loss": 0.031, "step": 158950 }, { "epoch": 1.03, "learning_rate": 0.00014610519114220617, "loss": 0.0355, "step": 158960 }, { "epoch": 1.03, "learning_rate": 0.00014609550978784923, "loss": 0.0364, "step": 158970 }, { "epoch": 1.03, "learning_rate": 0.0001460858284334923, "loss": 0.0331, "step": 158980 }, { "epoch": 1.03, "learning_rate": 0.00014607614707913539, "loss": 0.0347, "step": 158990 }, { "epoch": 1.03, "learning_rate": 0.00014606646572477847, "loss": 0.0366, "step": 159000 }, { "epoch": 1.03, "eval_cer": 0.9199665574511354, "eval_loss": 0.02524988353252411, "eval_runtime": 120.5727, "eval_samples_per_second": 16.587, "eval_steps_per_second": 4.147, "step": 159000 }, { "epoch": 1.03, "learning_rate": 0.00014605678437042152, "loss": 0.0339, "step": 159010 }, { "epoch": 1.03, "learning_rate": 0.00014604710301606457, "loss": 0.0347, "step": 159020 }, { "epoch": 1.03, "learning_rate": 0.00014603742166170765, "loss": 0.0381, "step": 159030 }, { "epoch": 1.03, "learning_rate": 0.0001460277403073507, "loss": 0.0335, "step": 159040 }, { "epoch": 1.03, "learning_rate": 0.00014601805895299378, "loss": 0.0321, "step": 159050 }, { "epoch": 1.03, "learning_rate": 0.00014600837759863686, "loss": 0.0295, "step": 159060 }, { "epoch": 1.03, "learning_rate": 0.00014599869624427992, "loss": 0.0345, "step": 159070 }, { "epoch": 1.03, "learning_rate": 0.000145989014889923, "loss": 0.0364, "step": 159080 }, { "epoch": 1.03, "learning_rate": 0.00014597933353556605, "loss": 0.0325, "step": 159090 }, { "epoch": 1.03, "learning_rate": 0.00014596965218120913, "loss": 0.0388, "step": 159100 }, { "epoch": 1.03, "learning_rate": 0.00014595997082685218, "loss": 0.0381, "step": 159110 }, { "epoch": 1.03, "learning_rate": 0.00014595028947249526, "loss": 0.0344, "step": 159120 }, { "epoch": 1.03, "learning_rate": 0.00014594060811813834, "loss": 0.0367, "step": 159130 }, { "epoch": 1.03, "learning_rate": 0.0001459309267637814, "loss": 0.037, "step": 159140 }, { "epoch": 1.03, "learning_rate": 0.00014592124540942445, "loss": 0.0363, "step": 159150 }, { "epoch": 1.03, "learning_rate": 0.00014591156405506753, "loss": 0.0301, "step": 159160 }, { "epoch": 1.03, "learning_rate": 0.0001459018827007106, "loss": 0.0356, "step": 159170 }, { "epoch": 1.03, "learning_rate": 0.00014589220134635366, "loss": 0.034, "step": 159180 }, { "epoch": 1.03, "learning_rate": 0.00014588251999199674, "loss": 0.0345, "step": 159190 }, { "epoch": 1.03, "learning_rate": 0.00014587283863763982, "loss": 0.0394, "step": 159200 }, { "epoch": 1.03, "learning_rate": 0.00014586315728328287, "loss": 0.0334, "step": 159210 }, { "epoch": 1.03, "learning_rate": 0.00014585347592892592, "loss": 0.0372, "step": 159220 }, { "epoch": 1.03, "learning_rate": 0.000145843794574569, "loss": 0.0323, "step": 159230 }, { "epoch": 1.03, "learning_rate": 0.00014583411322021208, "loss": 0.0393, "step": 159240 }, { "epoch": 1.03, "learning_rate": 0.00014582443186585513, "loss": 0.0356, "step": 159250 }, { "epoch": 1.03, "learning_rate": 0.00014581475051149821, "loss": 0.0378, "step": 159260 }, { "epoch": 1.03, "learning_rate": 0.00014580506915714127, "loss": 0.0331, "step": 159270 }, { "epoch": 1.03, "learning_rate": 0.00014579538780278435, "loss": 0.036, "step": 159280 }, { "epoch": 1.03, "learning_rate": 0.0001457857064484274, "loss": 0.0357, "step": 159290 }, { "epoch": 1.03, "learning_rate": 0.00014577602509407048, "loss": 0.0329, "step": 159300 }, { "epoch": 1.03, "learning_rate": 0.00014576634373971356, "loss": 0.0352, "step": 159310 }, { "epoch": 1.03, "learning_rate": 0.0001457566623853566, "loss": 0.0405, "step": 159320 }, { "epoch": 1.03, "learning_rate": 0.0001457469810309997, "loss": 0.0313, "step": 159330 }, { "epoch": 1.03, "learning_rate": 0.00014573729967664274, "loss": 0.0378, "step": 159340 }, { "epoch": 1.03, "learning_rate": 0.00014572761832228582, "loss": 0.0355, "step": 159350 }, { "epoch": 1.03, "learning_rate": 0.00014571793696792888, "loss": 0.0334, "step": 159360 }, { "epoch": 1.03, "learning_rate": 0.00014570825561357196, "loss": 0.0325, "step": 159370 }, { "epoch": 1.03, "learning_rate": 0.00014569857425921504, "loss": 0.0342, "step": 159380 }, { "epoch": 1.03, "learning_rate": 0.0001456888929048581, "loss": 0.037, "step": 159390 }, { "epoch": 1.03, "learning_rate": 0.00014567921155050117, "loss": 0.0397, "step": 159400 }, { "epoch": 1.03, "learning_rate": 0.00014566953019614422, "loss": 0.0342, "step": 159410 }, { "epoch": 1.03, "learning_rate": 0.0001456598488417873, "loss": 0.0357, "step": 159420 }, { "epoch": 1.03, "learning_rate": 0.00014565016748743035, "loss": 0.0393, "step": 159430 }, { "epoch": 1.03, "learning_rate": 0.00014564048613307343, "loss": 0.0369, "step": 159440 }, { "epoch": 1.03, "learning_rate": 0.00014563080477871651, "loss": 0.0304, "step": 159450 }, { "epoch": 1.03, "learning_rate": 0.00014562112342435957, "loss": 0.0335, "step": 159460 }, { "epoch": 1.03, "learning_rate": 0.00014561144207000262, "loss": 0.0335, "step": 159470 }, { "epoch": 1.03, "learning_rate": 0.0001456017607156457, "loss": 0.0314, "step": 159480 }, { "epoch": 1.03, "learning_rate": 0.00014559207936128878, "loss": 0.0323, "step": 159490 }, { "epoch": 1.03, "learning_rate": 0.00014558239800693183, "loss": 0.0375, "step": 159500 }, { "epoch": 1.03, "learning_rate": 0.0001455727166525749, "loss": 0.0348, "step": 159510 }, { "epoch": 1.03, "learning_rate": 0.000145563035298218, "loss": 0.0321, "step": 159520 }, { "epoch": 1.03, "learning_rate": 0.00014555335394386104, "loss": 0.0324, "step": 159530 }, { "epoch": 1.03, "learning_rate": 0.0001455436725895041, "loss": 0.0322, "step": 159540 }, { "epoch": 1.03, "learning_rate": 0.00014553399123514718, "loss": 0.035, "step": 159550 }, { "epoch": 1.03, "learning_rate": 0.00014552430988079026, "loss": 0.0357, "step": 159560 }, { "epoch": 1.03, "learning_rate": 0.0001455146285264333, "loss": 0.0331, "step": 159570 }, { "epoch": 1.03, "learning_rate": 0.0001455049471720764, "loss": 0.0306, "step": 159580 }, { "epoch": 1.03, "learning_rate": 0.00014549526581771944, "loss": 0.0381, "step": 159590 }, { "epoch": 1.03, "learning_rate": 0.00014548558446336252, "loss": 0.0341, "step": 159600 }, { "epoch": 1.03, "learning_rate": 0.00014547590310900557, "loss": 0.0332, "step": 159610 }, { "epoch": 1.03, "learning_rate": 0.00014546622175464865, "loss": 0.0371, "step": 159620 }, { "epoch": 1.03, "learning_rate": 0.00014545654040029173, "loss": 0.0332, "step": 159630 }, { "epoch": 1.03, "learning_rate": 0.00014544685904593479, "loss": 0.0366, "step": 159640 }, { "epoch": 1.03, "learning_rate": 0.00014543717769157787, "loss": 0.0324, "step": 159650 }, { "epoch": 1.03, "learning_rate": 0.00014542749633722092, "loss": 0.032, "step": 159660 }, { "epoch": 1.03, "learning_rate": 0.00014541781498286397, "loss": 0.0333, "step": 159670 }, { "epoch": 1.03, "learning_rate": 0.00014540813362850705, "loss": 0.0271, "step": 159680 }, { "epoch": 1.03, "learning_rate": 0.00014539845227415013, "loss": 0.0347, "step": 159690 }, { "epoch": 1.03, "learning_rate": 0.0001453887709197932, "loss": 0.0344, "step": 159700 }, { "epoch": 1.03, "learning_rate": 0.00014537908956543626, "loss": 0.0391, "step": 159710 }, { "epoch": 1.03, "learning_rate": 0.00014536940821107934, "loss": 0.0395, "step": 159720 }, { "epoch": 1.03, "learning_rate": 0.0001453597268567224, "loss": 0.0417, "step": 159730 }, { "epoch": 1.03, "learning_rate": 0.00014535004550236545, "loss": 0.0404, "step": 159740 }, { "epoch": 1.03, "learning_rate": 0.00014534036414800853, "loss": 0.0372, "step": 159750 }, { "epoch": 1.03, "learning_rate": 0.0001453306827936516, "loss": 0.0339, "step": 159760 }, { "epoch": 1.03, "learning_rate": 0.0001453210014392947, "loss": 0.0315, "step": 159770 }, { "epoch": 1.03, "learning_rate": 0.00014531132008493774, "loss": 0.032, "step": 159780 }, { "epoch": 1.03, "learning_rate": 0.0001453016387305808, "loss": 0.0365, "step": 159790 }, { "epoch": 1.03, "learning_rate": 0.00014529195737622387, "loss": 0.0362, "step": 159800 }, { "epoch": 1.03, "learning_rate": 0.00014528227602186693, "loss": 0.0282, "step": 159810 }, { "epoch": 1.03, "learning_rate": 0.00014527259466751, "loss": 0.0361, "step": 159820 }, { "epoch": 1.03, "learning_rate": 0.00014526291331315309, "loss": 0.0395, "step": 159830 }, { "epoch": 1.03, "learning_rate": 0.00014525323195879614, "loss": 0.0347, "step": 159840 }, { "epoch": 1.03, "learning_rate": 0.00014524355060443922, "loss": 0.031, "step": 159850 }, { "epoch": 1.03, "learning_rate": 0.00014523386925008227, "loss": 0.0333, "step": 159860 }, { "epoch": 1.03, "learning_rate": 0.00014522418789572535, "loss": 0.035, "step": 159870 }, { "epoch": 1.03, "learning_rate": 0.0001452145065413684, "loss": 0.0326, "step": 159880 }, { "epoch": 1.03, "learning_rate": 0.00014520482518701148, "loss": 0.0392, "step": 159890 }, { "epoch": 1.03, "learning_rate": 0.00014519514383265456, "loss": 0.0313, "step": 159900 }, { "epoch": 1.03, "learning_rate": 0.00014518546247829761, "loss": 0.0378, "step": 159910 }, { "epoch": 1.03, "learning_rate": 0.0001451757811239407, "loss": 0.032, "step": 159920 }, { "epoch": 1.03, "learning_rate": 0.00014516609976958375, "loss": 0.0359, "step": 159930 }, { "epoch": 1.03, "learning_rate": 0.00014515641841522683, "loss": 0.0361, "step": 159940 }, { "epoch": 1.03, "learning_rate": 0.00014514673706086988, "loss": 0.0343, "step": 159950 }, { "epoch": 1.03, "learning_rate": 0.00014513705570651296, "loss": 0.0442, "step": 159960 }, { "epoch": 1.03, "learning_rate": 0.00014512737435215604, "loss": 0.0358, "step": 159970 }, { "epoch": 1.03, "learning_rate": 0.0001451176929977991, "loss": 0.0376, "step": 159980 }, { "epoch": 1.03, "learning_rate": 0.00014510801164344214, "loss": 0.0335, "step": 159990 }, { "epoch": 1.03, "learning_rate": 0.00014509833028908522, "loss": 0.0298, "step": 160000 }, { "epoch": 1.03, "eval_cer": 0.919810190938877, "eval_loss": 0.025443054735660553, "eval_runtime": 120.5621, "eval_samples_per_second": 16.589, "eval_steps_per_second": 4.147, "step": 160000 }, { "epoch": 1.03, "learning_rate": 0.0001450886489347283, "loss": 0.0344, "step": 160010 }, { "epoch": 1.03, "learning_rate": 0.00014507896758037136, "loss": 0.0417, "step": 160020 }, { "epoch": 1.03, "learning_rate": 0.00014506928622601444, "loss": 0.0344, "step": 160030 }, { "epoch": 1.03, "learning_rate": 0.00014505960487165752, "loss": 0.0317, "step": 160040 }, { "epoch": 1.03, "learning_rate": 0.00014504992351730057, "loss": 0.0311, "step": 160050 }, { "epoch": 1.03, "learning_rate": 0.00014504024216294362, "loss": 0.0316, "step": 160060 }, { "epoch": 1.03, "learning_rate": 0.0001450305608085867, "loss": 0.0382, "step": 160070 }, { "epoch": 1.03, "learning_rate": 0.00014502087945422978, "loss": 0.0411, "step": 160080 }, { "epoch": 1.03, "learning_rate": 0.00014501119809987283, "loss": 0.0304, "step": 160090 }, { "epoch": 1.03, "learning_rate": 0.00014500151674551591, "loss": 0.0428, "step": 160100 }, { "epoch": 1.03, "learning_rate": 0.00014499183539115897, "loss": 0.0383, "step": 160110 }, { "epoch": 1.03, "learning_rate": 0.00014498215403680205, "loss": 0.0345, "step": 160120 }, { "epoch": 1.03, "learning_rate": 0.0001449724726824451, "loss": 0.0293, "step": 160130 }, { "epoch": 1.03, "learning_rate": 0.00014496279132808818, "loss": 0.0343, "step": 160140 }, { "epoch": 1.03, "learning_rate": 0.00014495310997373126, "loss": 0.0378, "step": 160150 }, { "epoch": 1.03, "learning_rate": 0.0001449434286193743, "loss": 0.0283, "step": 160160 }, { "epoch": 1.03, "learning_rate": 0.0001449337472650174, "loss": 0.0307, "step": 160170 }, { "epoch": 1.03, "learning_rate": 0.00014492406591066044, "loss": 0.0331, "step": 160180 }, { "epoch": 1.03, "learning_rate": 0.0001449143845563035, "loss": 0.0333, "step": 160190 }, { "epoch": 1.03, "learning_rate": 0.00014490470320194658, "loss": 0.0395, "step": 160200 }, { "epoch": 1.03, "learning_rate": 0.00014489502184758966, "loss": 0.037, "step": 160210 }, { "epoch": 1.03, "learning_rate": 0.00014488534049323274, "loss": 0.0434, "step": 160220 }, { "epoch": 1.03, "learning_rate": 0.0001448756591388758, "loss": 0.0345, "step": 160230 }, { "epoch": 1.03, "learning_rate": 0.00014486597778451887, "loss": 0.0339, "step": 160240 }, { "epoch": 1.03, "learning_rate": 0.00014485629643016192, "loss": 0.0328, "step": 160250 }, { "epoch": 1.03, "learning_rate": 0.00014484661507580497, "loss": 0.0346, "step": 160260 }, { "epoch": 1.03, "learning_rate": 0.00014483693372144805, "loss": 0.0313, "step": 160270 }, { "epoch": 1.03, "learning_rate": 0.00014482725236709113, "loss": 0.0323, "step": 160280 }, { "epoch": 1.03, "learning_rate": 0.0001448175710127342, "loss": 0.0375, "step": 160290 }, { "epoch": 1.03, "learning_rate": 0.00014480788965837727, "loss": 0.0313, "step": 160300 }, { "epoch": 1.03, "learning_rate": 0.00014479820830402032, "loss": 0.0317, "step": 160310 }, { "epoch": 1.03, "learning_rate": 0.0001447885269496634, "loss": 0.039, "step": 160320 }, { "epoch": 1.03, "learning_rate": 0.00014477884559530645, "loss": 0.0325, "step": 160330 }, { "epoch": 1.03, "learning_rate": 0.00014476916424094953, "loss": 0.0372, "step": 160340 }, { "epoch": 1.03, "learning_rate": 0.0001447594828865926, "loss": 0.0346, "step": 160350 }, { "epoch": 1.03, "learning_rate": 0.00014474980153223566, "loss": 0.0328, "step": 160360 }, { "epoch": 1.04, "learning_rate": 0.00014474012017787874, "loss": 0.0338, "step": 160370 }, { "epoch": 1.04, "learning_rate": 0.0001447304388235218, "loss": 0.0317, "step": 160380 }, { "epoch": 1.04, "learning_rate": 0.00014472075746916488, "loss": 0.0336, "step": 160390 }, { "epoch": 1.04, "learning_rate": 0.00014471107611480793, "loss": 0.0315, "step": 160400 }, { "epoch": 1.04, "learning_rate": 0.000144701394760451, "loss": 0.0377, "step": 160410 }, { "epoch": 1.04, "learning_rate": 0.0001446917134060941, "loss": 0.0368, "step": 160420 }, { "epoch": 1.04, "learning_rate": 0.00014468203205173714, "loss": 0.0324, "step": 160430 }, { "epoch": 1.04, "learning_rate": 0.00014467235069738022, "loss": 0.0344, "step": 160440 }, { "epoch": 1.04, "learning_rate": 0.00014466266934302327, "loss": 0.0316, "step": 160450 }, { "epoch": 1.04, "learning_rate": 0.00014465298798866635, "loss": 0.0374, "step": 160460 }, { "epoch": 1.04, "learning_rate": 0.0001446433066343094, "loss": 0.0327, "step": 160470 }, { "epoch": 1.04, "learning_rate": 0.00014463362527995249, "loss": 0.0414, "step": 160480 }, { "epoch": 1.04, "learning_rate": 0.00014462394392559557, "loss": 0.0388, "step": 160490 }, { "epoch": 1.04, "learning_rate": 0.00014461426257123862, "loss": 0.0398, "step": 160500 }, { "epoch": 1.04, "learning_rate": 0.00014460458121688167, "loss": 0.0383, "step": 160510 }, { "epoch": 1.04, "learning_rate": 0.00014459489986252475, "loss": 0.0366, "step": 160520 }, { "epoch": 1.04, "learning_rate": 0.00014458521850816783, "loss": 0.0397, "step": 160530 }, { "epoch": 1.04, "learning_rate": 0.00014457553715381088, "loss": 0.0353, "step": 160540 }, { "epoch": 1.04, "learning_rate": 0.00014456585579945396, "loss": 0.0341, "step": 160550 }, { "epoch": 1.04, "learning_rate": 0.00014455617444509702, "loss": 0.0397, "step": 160560 }, { "epoch": 1.04, "learning_rate": 0.0001445464930907401, "loss": 0.0377, "step": 160570 }, { "epoch": 1.04, "learning_rate": 0.00014453681173638315, "loss": 0.035, "step": 160580 }, { "epoch": 1.04, "learning_rate": 0.00014452713038202623, "loss": 0.0321, "step": 160590 }, { "epoch": 1.04, "learning_rate": 0.0001445174490276693, "loss": 0.0322, "step": 160600 }, { "epoch": 1.04, "learning_rate": 0.00014450776767331236, "loss": 0.0348, "step": 160610 }, { "epoch": 1.04, "learning_rate": 0.00014449808631895544, "loss": 0.0304, "step": 160620 }, { "epoch": 1.04, "learning_rate": 0.0001444884049645985, "loss": 0.037, "step": 160630 }, { "epoch": 1.04, "learning_rate": 0.00014447872361024157, "loss": 0.0389, "step": 160640 }, { "epoch": 1.04, "learning_rate": 0.00014446904225588463, "loss": 0.0355, "step": 160650 }, { "epoch": 1.04, "learning_rate": 0.0001444593609015277, "loss": 0.0343, "step": 160660 }, { "epoch": 1.04, "learning_rate": 0.00014444967954717078, "loss": 0.032, "step": 160670 }, { "epoch": 1.04, "learning_rate": 0.00014443999819281384, "loss": 0.0322, "step": 160680 }, { "epoch": 1.04, "learning_rate": 0.00014443031683845692, "loss": 0.0308, "step": 160690 }, { "epoch": 1.04, "learning_rate": 0.00014442063548409997, "loss": 0.0357, "step": 160700 }, { "epoch": 1.04, "learning_rate": 0.00014441095412974305, "loss": 0.0352, "step": 160710 }, { "epoch": 1.04, "learning_rate": 0.0001444012727753861, "loss": 0.035, "step": 160720 }, { "epoch": 1.04, "learning_rate": 0.00014439159142102918, "loss": 0.0333, "step": 160730 }, { "epoch": 1.04, "learning_rate": 0.00014438191006667226, "loss": 0.04, "step": 160740 }, { "epoch": 1.04, "learning_rate": 0.00014437222871231531, "loss": 0.035, "step": 160750 }, { "epoch": 1.04, "learning_rate": 0.00014436254735795837, "loss": 0.0377, "step": 160760 }, { "epoch": 1.04, "learning_rate": 0.00014435286600360145, "loss": 0.034, "step": 160770 }, { "epoch": 1.04, "learning_rate": 0.00014434318464924453, "loss": 0.0359, "step": 160780 }, { "epoch": 1.04, "learning_rate": 0.00014433350329488758, "loss": 0.0313, "step": 160790 }, { "epoch": 1.04, "learning_rate": 0.00014432382194053066, "loss": 0.0316, "step": 160800 }, { "epoch": 1.04, "learning_rate": 0.00014431414058617374, "loss": 0.0324, "step": 160810 }, { "epoch": 1.04, "learning_rate": 0.0001443044592318168, "loss": 0.0376, "step": 160820 }, { "epoch": 1.04, "learning_rate": 0.00014429477787745984, "loss": 0.0303, "step": 160830 }, { "epoch": 1.04, "learning_rate": 0.00014428509652310292, "loss": 0.0359, "step": 160840 }, { "epoch": 1.04, "learning_rate": 0.000144275415168746, "loss": 0.0341, "step": 160850 }, { "epoch": 1.04, "learning_rate": 0.00014426573381438906, "loss": 0.0338, "step": 160860 }, { "epoch": 1.04, "learning_rate": 0.00014425605246003214, "loss": 0.0329, "step": 160870 }, { "epoch": 1.04, "learning_rate": 0.0001442463711056752, "loss": 0.0329, "step": 160880 }, { "epoch": 1.04, "learning_rate": 0.00014423668975131827, "loss": 0.0366, "step": 160890 }, { "epoch": 1.04, "learning_rate": 0.00014422700839696132, "loss": 0.0303, "step": 160900 }, { "epoch": 1.04, "learning_rate": 0.0001442173270426044, "loss": 0.0371, "step": 160910 }, { "epoch": 1.04, "learning_rate": 0.00014420764568824748, "loss": 0.0332, "step": 160920 }, { "epoch": 1.04, "learning_rate": 0.00014419796433389053, "loss": 0.0335, "step": 160930 }, { "epoch": 1.04, "learning_rate": 0.00014418828297953361, "loss": 0.0317, "step": 160940 }, { "epoch": 1.04, "learning_rate": 0.00014417860162517667, "loss": 0.0398, "step": 160950 }, { "epoch": 1.04, "learning_rate": 0.00014416892027081972, "loss": 0.0311, "step": 160960 }, { "epoch": 1.04, "learning_rate": 0.0001441592389164628, "loss": 0.035, "step": 160970 }, { "epoch": 1.04, "learning_rate": 0.00014414955756210588, "loss": 0.0365, "step": 160980 }, { "epoch": 1.04, "learning_rate": 0.00014413987620774896, "loss": 0.034, "step": 160990 }, { "epoch": 1.04, "learning_rate": 0.000144130194853392, "loss": 0.0316, "step": 161000 }, { "epoch": 1.04, "eval_cer": 0.9198617105411818, "eval_loss": 0.025041013956069946, "eval_runtime": 120.0341, "eval_samples_per_second": 16.662, "eval_steps_per_second": 4.165, "step": 161000 }, { "epoch": 1.04, "learning_rate": 0.0001441205134990351, "loss": 0.032, "step": 161010 }, { "epoch": 1.04, "learning_rate": 0.00014411083214467814, "loss": 0.0337, "step": 161020 }, { "epoch": 1.04, "learning_rate": 0.0001441011507903212, "loss": 0.037, "step": 161030 }, { "epoch": 1.04, "learning_rate": 0.00014409146943596428, "loss": 0.0404, "step": 161040 }, { "epoch": 1.04, "learning_rate": 0.00014408178808160736, "loss": 0.0339, "step": 161050 }, { "epoch": 1.04, "learning_rate": 0.00014407210672725044, "loss": 0.0345, "step": 161060 }, { "epoch": 1.04, "learning_rate": 0.0001440624253728935, "loss": 0.0313, "step": 161070 }, { "epoch": 1.04, "learning_rate": 0.00014405274401853654, "loss": 0.0331, "step": 161080 }, { "epoch": 1.04, "learning_rate": 0.00014404306266417962, "loss": 0.0405, "step": 161090 }, { "epoch": 1.04, "learning_rate": 0.00014403338130982267, "loss": 0.0336, "step": 161100 }, { "epoch": 1.04, "learning_rate": 0.00014402369995546575, "loss": 0.0392, "step": 161110 }, { "epoch": 1.04, "learning_rate": 0.00014401401860110883, "loss": 0.0355, "step": 161120 }, { "epoch": 1.04, "learning_rate": 0.0001440043372467519, "loss": 0.0292, "step": 161130 }, { "epoch": 1.04, "learning_rate": 0.00014399465589239497, "loss": 0.0356, "step": 161140 }, { "epoch": 1.04, "learning_rate": 0.00014398497453803802, "loss": 0.0335, "step": 161150 }, { "epoch": 1.04, "learning_rate": 0.0001439752931836811, "loss": 0.0311, "step": 161160 }, { "epoch": 1.04, "learning_rate": 0.00014396561182932415, "loss": 0.0333, "step": 161170 }, { "epoch": 1.04, "learning_rate": 0.00014395593047496723, "loss": 0.0313, "step": 161180 }, { "epoch": 1.04, "learning_rate": 0.0001439462491206103, "loss": 0.0322, "step": 161190 }, { "epoch": 1.04, "learning_rate": 0.00014393656776625336, "loss": 0.0306, "step": 161200 }, { "epoch": 1.04, "learning_rate": 0.00014392688641189644, "loss": 0.0392, "step": 161210 }, { "epoch": 1.04, "learning_rate": 0.0001439172050575395, "loss": 0.0408, "step": 161220 }, { "epoch": 1.04, "learning_rate": 0.00014390752370318258, "loss": 0.0371, "step": 161230 }, { "epoch": 1.04, "learning_rate": 0.00014389784234882563, "loss": 0.0369, "step": 161240 }, { "epoch": 1.04, "learning_rate": 0.0001438881609944687, "loss": 0.032, "step": 161250 }, { "epoch": 1.04, "learning_rate": 0.0001438784796401118, "loss": 0.0369, "step": 161260 }, { "epoch": 1.04, "learning_rate": 0.00014386879828575484, "loss": 0.0318, "step": 161270 }, { "epoch": 1.04, "learning_rate": 0.0001438591169313979, "loss": 0.0352, "step": 161280 }, { "epoch": 1.04, "learning_rate": 0.00014384943557704097, "loss": 0.0365, "step": 161290 }, { "epoch": 1.04, "learning_rate": 0.00014383975422268405, "loss": 0.0364, "step": 161300 }, { "epoch": 1.04, "learning_rate": 0.0001438300728683271, "loss": 0.0351, "step": 161310 }, { "epoch": 1.04, "learning_rate": 0.00014382039151397019, "loss": 0.0339, "step": 161320 }, { "epoch": 1.04, "learning_rate": 0.00014381071015961326, "loss": 0.0363, "step": 161330 }, { "epoch": 1.04, "learning_rate": 0.00014380102880525632, "loss": 0.0315, "step": 161340 }, { "epoch": 1.04, "learning_rate": 0.00014379134745089937, "loss": 0.0338, "step": 161350 }, { "epoch": 1.04, "learning_rate": 0.00014378166609654245, "loss": 0.0319, "step": 161360 }, { "epoch": 1.04, "learning_rate": 0.00014377198474218553, "loss": 0.0321, "step": 161370 }, { "epoch": 1.04, "learning_rate": 0.00014376230338782858, "loss": 0.0412, "step": 161380 }, { "epoch": 1.04, "learning_rate": 0.00014375262203347166, "loss": 0.03, "step": 161390 }, { "epoch": 1.04, "learning_rate": 0.00014374294067911472, "loss": 0.0345, "step": 161400 }, { "epoch": 1.04, "learning_rate": 0.0001437332593247578, "loss": 0.0305, "step": 161410 }, { "epoch": 1.04, "learning_rate": 0.00014372357797040085, "loss": 0.0329, "step": 161420 }, { "epoch": 1.04, "learning_rate": 0.00014371389661604393, "loss": 0.0335, "step": 161430 }, { "epoch": 1.04, "learning_rate": 0.000143704215261687, "loss": 0.0335, "step": 161440 }, { "epoch": 1.04, "learning_rate": 0.00014369453390733006, "loss": 0.0368, "step": 161450 }, { "epoch": 1.04, "learning_rate": 0.00014368485255297314, "loss": 0.039, "step": 161460 }, { "epoch": 1.04, "learning_rate": 0.0001436751711986162, "loss": 0.0306, "step": 161470 }, { "epoch": 1.04, "learning_rate": 0.00014366548984425927, "loss": 0.0313, "step": 161480 }, { "epoch": 1.04, "learning_rate": 0.00014365580848990232, "loss": 0.0342, "step": 161490 }, { "epoch": 1.04, "learning_rate": 0.0001436461271355454, "loss": 0.039, "step": 161500 }, { "epoch": 1.04, "learning_rate": 0.00014363644578118848, "loss": 0.0386, "step": 161510 }, { "epoch": 1.04, "learning_rate": 0.00014362676442683154, "loss": 0.0367, "step": 161520 }, { "epoch": 1.04, "learning_rate": 0.00014361708307247462, "loss": 0.0331, "step": 161530 }, { "epoch": 1.04, "learning_rate": 0.00014360740171811767, "loss": 0.0407, "step": 161540 }, { "epoch": 1.04, "learning_rate": 0.00014359772036376075, "loss": 0.0338, "step": 161550 }, { "epoch": 1.04, "learning_rate": 0.0001435880390094038, "loss": 0.0295, "step": 161560 }, { "epoch": 1.04, "learning_rate": 0.00014357835765504688, "loss": 0.0356, "step": 161570 }, { "epoch": 1.04, "learning_rate": 0.00014356867630068996, "loss": 0.0387, "step": 161580 }, { "epoch": 1.04, "learning_rate": 0.00014355899494633301, "loss": 0.0398, "step": 161590 }, { "epoch": 1.04, "learning_rate": 0.00014354931359197607, "loss": 0.032, "step": 161600 }, { "epoch": 1.04, "learning_rate": 0.00014353963223761915, "loss": 0.0315, "step": 161610 }, { "epoch": 1.04, "learning_rate": 0.00014352995088326223, "loss": 0.0406, "step": 161620 }, { "epoch": 1.04, "learning_rate": 0.00014352026952890528, "loss": 0.036, "step": 161630 }, { "epoch": 1.04, "learning_rate": 0.00014351058817454836, "loss": 0.0315, "step": 161640 }, { "epoch": 1.04, "learning_rate": 0.0001435009068201914, "loss": 0.0396, "step": 161650 }, { "epoch": 1.04, "learning_rate": 0.0001434912254658345, "loss": 0.0302, "step": 161660 }, { "epoch": 1.04, "learning_rate": 0.00014348154411147754, "loss": 0.0387, "step": 161670 }, { "epoch": 1.04, "learning_rate": 0.00014347186275712062, "loss": 0.0354, "step": 161680 }, { "epoch": 1.04, "learning_rate": 0.0001434621814027637, "loss": 0.0361, "step": 161690 }, { "epoch": 1.04, "learning_rate": 0.00014345250004840676, "loss": 0.0345, "step": 161700 }, { "epoch": 1.04, "learning_rate": 0.00014344281869404984, "loss": 0.0311, "step": 161710 }, { "epoch": 1.04, "learning_rate": 0.0001434331373396929, "loss": 0.0361, "step": 161720 }, { "epoch": 1.04, "learning_rate": 0.00014342345598533597, "loss": 0.0336, "step": 161730 }, { "epoch": 1.04, "learning_rate": 0.00014341377463097902, "loss": 0.04, "step": 161740 }, { "epoch": 1.04, "learning_rate": 0.0001434040932766221, "loss": 0.0311, "step": 161750 }, { "epoch": 1.04, "learning_rate": 0.00014339441192226518, "loss": 0.0383, "step": 161760 }, { "epoch": 1.04, "learning_rate": 0.00014338473056790823, "loss": 0.0318, "step": 161770 }, { "epoch": 1.04, "learning_rate": 0.0001433750492135513, "loss": 0.032, "step": 161780 }, { "epoch": 1.04, "learning_rate": 0.00014336536785919437, "loss": 0.0308, "step": 161790 }, { "epoch": 1.04, "learning_rate": 0.00014335568650483742, "loss": 0.039, "step": 161800 }, { "epoch": 1.04, "learning_rate": 0.0001433460051504805, "loss": 0.0333, "step": 161810 }, { "epoch": 1.04, "learning_rate": 0.00014333632379612358, "loss": 0.0322, "step": 161820 }, { "epoch": 1.04, "learning_rate": 0.00014332664244176666, "loss": 0.0376, "step": 161830 }, { "epoch": 1.04, "learning_rate": 0.0001433169610874097, "loss": 0.0414, "step": 161840 }, { "epoch": 1.04, "learning_rate": 0.00014330727973305276, "loss": 0.0359, "step": 161850 }, { "epoch": 1.04, "learning_rate": 0.00014329759837869584, "loss": 0.0372, "step": 161860 }, { "epoch": 1.04, "learning_rate": 0.0001432879170243389, "loss": 0.0341, "step": 161870 }, { "epoch": 1.04, "learning_rate": 0.00014327823566998198, "loss": 0.0334, "step": 161880 }, { "epoch": 1.04, "learning_rate": 0.00014326855431562506, "loss": 0.0335, "step": 161890 }, { "epoch": 1.04, "learning_rate": 0.00014325887296126814, "loss": 0.039, "step": 161900 }, { "epoch": 1.05, "learning_rate": 0.0001432491916069112, "loss": 0.0415, "step": 161910 }, { "epoch": 1.05, "learning_rate": 0.00014323951025255424, "loss": 0.0348, "step": 161920 }, { "epoch": 1.05, "learning_rate": 0.00014322982889819732, "loss": 0.0309, "step": 161930 }, { "epoch": 1.05, "learning_rate": 0.00014322014754384037, "loss": 0.0333, "step": 161940 }, { "epoch": 1.05, "learning_rate": 0.00014321046618948345, "loss": 0.0359, "step": 161950 }, { "epoch": 1.05, "learning_rate": 0.00014320078483512653, "loss": 0.0324, "step": 161960 }, { "epoch": 1.05, "learning_rate": 0.00014319110348076959, "loss": 0.0322, "step": 161970 }, { "epoch": 1.05, "learning_rate": 0.00014318142212641267, "loss": 0.0318, "step": 161980 }, { "epoch": 1.05, "learning_rate": 0.00014317174077205572, "loss": 0.0386, "step": 161990 }, { "epoch": 1.05, "learning_rate": 0.0001431620594176988, "loss": 0.0322, "step": 162000 }, { "epoch": 1.05, "eval_cer": 0.9199168455541746, "eval_loss": 0.024344589561223984, "eval_runtime": 120.0857, "eval_samples_per_second": 16.655, "eval_steps_per_second": 4.164, "step": 162000 }, { "epoch": 1.05, "learning_rate": 0.00014315237806334185, "loss": 0.0327, "step": 162010 }, { "epoch": 1.05, "learning_rate": 0.00014314269670898493, "loss": 0.0367, "step": 162020 }, { "epoch": 1.05, "learning_rate": 0.000143133015354628, "loss": 0.0369, "step": 162030 }, { "epoch": 1.05, "learning_rate": 0.00014312333400027106, "loss": 0.036, "step": 162040 }, { "epoch": 1.05, "learning_rate": 0.00014311365264591412, "loss": 0.0399, "step": 162050 }, { "epoch": 1.05, "learning_rate": 0.0001431039712915572, "loss": 0.0353, "step": 162060 }, { "epoch": 1.05, "learning_rate": 0.00014309428993720028, "loss": 0.0294, "step": 162070 }, { "epoch": 1.05, "learning_rate": 0.00014308460858284333, "loss": 0.0263, "step": 162080 }, { "epoch": 1.05, "learning_rate": 0.0001430749272284864, "loss": 0.0408, "step": 162090 }, { "epoch": 1.05, "learning_rate": 0.0001430652458741295, "loss": 0.0361, "step": 162100 }, { "epoch": 1.05, "learning_rate": 0.00014305556451977254, "loss": 0.0347, "step": 162110 }, { "epoch": 1.05, "learning_rate": 0.0001430458831654156, "loss": 0.0343, "step": 162120 }, { "epoch": 1.05, "learning_rate": 0.00014303620181105867, "loss": 0.0348, "step": 162130 }, { "epoch": 1.05, "learning_rate": 0.00014302652045670175, "loss": 0.0362, "step": 162140 }, { "epoch": 1.05, "learning_rate": 0.0001430168391023448, "loss": 0.0299, "step": 162150 }, { "epoch": 1.05, "learning_rate": 0.00014300715774798788, "loss": 0.0363, "step": 162160 }, { "epoch": 1.05, "learning_rate": 0.00014299747639363094, "loss": 0.0392, "step": 162170 }, { "epoch": 1.05, "learning_rate": 0.00014298779503927402, "loss": 0.0379, "step": 162180 }, { "epoch": 1.05, "learning_rate": 0.00014297811368491707, "loss": 0.0364, "step": 162190 }, { "epoch": 1.05, "learning_rate": 0.00014296843233056015, "loss": 0.0308, "step": 162200 }, { "epoch": 1.05, "learning_rate": 0.00014295875097620323, "loss": 0.0347, "step": 162210 }, { "epoch": 1.05, "learning_rate": 0.00014294906962184628, "loss": 0.0368, "step": 162220 }, { "epoch": 1.05, "learning_rate": 0.00014293938826748936, "loss": 0.0323, "step": 162230 }, { "epoch": 1.05, "learning_rate": 0.00014292970691313241, "loss": 0.0317, "step": 162240 }, { "epoch": 1.05, "learning_rate": 0.0001429200255587755, "loss": 0.0316, "step": 162250 }, { "epoch": 1.05, "learning_rate": 0.00014291034420441855, "loss": 0.0337, "step": 162260 }, { "epoch": 1.05, "learning_rate": 0.00014290066285006163, "loss": 0.0423, "step": 162270 }, { "epoch": 1.05, "learning_rate": 0.0001428909814957047, "loss": 0.0366, "step": 162280 }, { "epoch": 1.05, "learning_rate": 0.00014288130014134776, "loss": 0.0375, "step": 162290 }, { "epoch": 1.05, "learning_rate": 0.00014287161878699084, "loss": 0.032, "step": 162300 }, { "epoch": 1.05, "learning_rate": 0.0001428619374326339, "loss": 0.0325, "step": 162310 }, { "epoch": 1.05, "learning_rate": 0.00014285225607827697, "loss": 0.0379, "step": 162320 }, { "epoch": 1.05, "learning_rate": 0.00014284257472392002, "loss": 0.0308, "step": 162330 }, { "epoch": 1.05, "learning_rate": 0.0001428328933695631, "loss": 0.0324, "step": 162340 }, { "epoch": 1.05, "learning_rate": 0.00014282321201520618, "loss": 0.0318, "step": 162350 }, { "epoch": 1.05, "learning_rate": 0.00014281353066084924, "loss": 0.0311, "step": 162360 }, { "epoch": 1.05, "learning_rate": 0.0001428038493064923, "loss": 0.033, "step": 162370 }, { "epoch": 1.05, "learning_rate": 0.00014279416795213537, "loss": 0.0333, "step": 162380 }, { "epoch": 1.05, "learning_rate": 0.00014278448659777845, "loss": 0.0345, "step": 162390 }, { "epoch": 1.05, "learning_rate": 0.0001427748052434215, "loss": 0.0315, "step": 162400 }, { "epoch": 1.05, "learning_rate": 0.00014276512388906458, "loss": 0.0312, "step": 162410 }, { "epoch": 1.05, "learning_rate": 0.00014275544253470766, "loss": 0.0424, "step": 162420 }, { "epoch": 1.05, "learning_rate": 0.00014274576118035071, "loss": 0.0336, "step": 162430 }, { "epoch": 1.05, "learning_rate": 0.00014273607982599377, "loss": 0.0317, "step": 162440 }, { "epoch": 1.05, "learning_rate": 0.00014272639847163685, "loss": 0.0346, "step": 162450 }, { "epoch": 1.05, "learning_rate": 0.00014271671711727993, "loss": 0.0334, "step": 162460 }, { "epoch": 1.05, "learning_rate": 0.00014270703576292298, "loss": 0.0361, "step": 162470 }, { "epoch": 1.05, "learning_rate": 0.00014269735440856606, "loss": 0.0355, "step": 162480 }, { "epoch": 1.05, "learning_rate": 0.0001426876730542091, "loss": 0.0408, "step": 162490 }, { "epoch": 1.05, "learning_rate": 0.0001426779916998522, "loss": 0.0304, "step": 162500 }, { "epoch": 1.05, "learning_rate": 0.00014266831034549524, "loss": 0.0343, "step": 162510 }, { "epoch": 1.05, "learning_rate": 0.00014265862899113832, "loss": 0.0369, "step": 162520 }, { "epoch": 1.05, "learning_rate": 0.0001426489476367814, "loss": 0.0385, "step": 162530 }, { "epoch": 1.05, "learning_rate": 0.00014263926628242446, "loss": 0.033, "step": 162540 }, { "epoch": 1.05, "learning_rate": 0.00014262958492806754, "loss": 0.0393, "step": 162550 }, { "epoch": 1.05, "learning_rate": 0.0001426199035737106, "loss": 0.0363, "step": 162560 }, { "epoch": 1.05, "learning_rate": 0.00014261022221935364, "loss": 0.035, "step": 162570 }, { "epoch": 1.05, "learning_rate": 0.00014260054086499672, "loss": 0.0509, "step": 162580 }, { "epoch": 1.05, "learning_rate": 0.0001425908595106398, "loss": 0.0344, "step": 162590 }, { "epoch": 1.05, "learning_rate": 0.00014258117815628288, "loss": 0.0312, "step": 162600 }, { "epoch": 1.05, "learning_rate": 0.00014257149680192593, "loss": 0.0307, "step": 162610 }, { "epoch": 1.05, "learning_rate": 0.000142561815447569, "loss": 0.0284, "step": 162620 }, { "epoch": 1.05, "learning_rate": 0.00014255213409321207, "loss": 0.0342, "step": 162630 }, { "epoch": 1.05, "learning_rate": 0.00014254245273885512, "loss": 0.0325, "step": 162640 }, { "epoch": 1.05, "learning_rate": 0.0001425327713844982, "loss": 0.0302, "step": 162650 }, { "epoch": 1.05, "learning_rate": 0.00014252309003014128, "loss": 0.0359, "step": 162660 }, { "epoch": 1.05, "learning_rate": 0.00014251340867578436, "loss": 0.0333, "step": 162670 }, { "epoch": 1.05, "learning_rate": 0.0001425037273214274, "loss": 0.0471, "step": 162680 }, { "epoch": 1.05, "learning_rate": 0.00014249404596707046, "loss": 0.0311, "step": 162690 }, { "epoch": 1.05, "learning_rate": 0.00014248436461271354, "loss": 0.0329, "step": 162700 }, { "epoch": 1.05, "learning_rate": 0.0001424746832583566, "loss": 0.0355, "step": 162710 }, { "epoch": 1.05, "learning_rate": 0.00014246500190399968, "loss": 0.0337, "step": 162720 }, { "epoch": 1.05, "learning_rate": 0.00014245532054964276, "loss": 0.0348, "step": 162730 }, { "epoch": 1.05, "learning_rate": 0.0001424456391952858, "loss": 0.029, "step": 162740 }, { "epoch": 1.05, "learning_rate": 0.0001424359578409289, "loss": 0.0304, "step": 162750 }, { "epoch": 1.05, "learning_rate": 0.00014242627648657194, "loss": 0.0341, "step": 162760 }, { "epoch": 1.05, "learning_rate": 0.00014241659513221502, "loss": 0.0323, "step": 162770 }, { "epoch": 1.05, "learning_rate": 0.00014240691377785807, "loss": 0.0365, "step": 162780 }, { "epoch": 1.05, "learning_rate": 0.00014239723242350115, "loss": 0.0326, "step": 162790 }, { "epoch": 1.05, "learning_rate": 0.00014238755106914423, "loss": 0.0305, "step": 162800 }, { "epoch": 1.05, "learning_rate": 0.00014237786971478729, "loss": 0.0324, "step": 162810 }, { "epoch": 1.05, "learning_rate": 0.00014236818836043036, "loss": 0.0358, "step": 162820 }, { "epoch": 1.05, "learning_rate": 0.00014235850700607342, "loss": 0.0343, "step": 162830 }, { "epoch": 1.05, "learning_rate": 0.0001423488256517165, "loss": 0.0265, "step": 162840 }, { "epoch": 1.05, "learning_rate": 0.00014233914429735955, "loss": 0.0336, "step": 162850 }, { "epoch": 1.05, "learning_rate": 0.00014232946294300263, "loss": 0.0346, "step": 162860 }, { "epoch": 1.05, "learning_rate": 0.0001423197815886457, "loss": 0.0414, "step": 162870 }, { "epoch": 1.05, "learning_rate": 0.00014231010023428876, "loss": 0.0293, "step": 162880 }, { "epoch": 1.05, "learning_rate": 0.00014230041887993182, "loss": 0.0371, "step": 162890 }, { "epoch": 1.05, "learning_rate": 0.0001422907375255749, "loss": 0.0407, "step": 162900 }, { "epoch": 1.05, "learning_rate": 0.00014228105617121797, "loss": 0.0293, "step": 162910 }, { "epoch": 1.05, "learning_rate": 0.00014227137481686103, "loss": 0.0388, "step": 162920 }, { "epoch": 1.05, "learning_rate": 0.0001422616934625041, "loss": 0.0318, "step": 162930 }, { "epoch": 1.05, "learning_rate": 0.00014225201210814716, "loss": 0.035, "step": 162940 }, { "epoch": 1.05, "learning_rate": 0.00014224233075379024, "loss": 0.0376, "step": 162950 }, { "epoch": 1.05, "learning_rate": 0.0001422326493994333, "loss": 0.0311, "step": 162960 }, { "epoch": 1.05, "learning_rate": 0.00014222296804507637, "loss": 0.0312, "step": 162970 }, { "epoch": 1.05, "learning_rate": 0.00014221328669071945, "loss": 0.0327, "step": 162980 }, { "epoch": 1.05, "learning_rate": 0.0001422036053363625, "loss": 0.0341, "step": 162990 }, { "epoch": 1.05, "learning_rate": 0.00014219392398200558, "loss": 0.0313, "step": 163000 }, { "epoch": 1.05, "eval_cer": 0.9198481527511015, "eval_loss": 0.024626342579722404, "eval_runtime": 120.1691, "eval_samples_per_second": 16.643, "eval_steps_per_second": 4.161, "step": 163000 }, { "epoch": 1.05, "learning_rate": 0.00014218424262764864, "loss": 0.0356, "step": 163010 }, { "epoch": 1.05, "learning_rate": 0.00014217456127329172, "loss": 0.0372, "step": 163020 }, { "epoch": 1.05, "learning_rate": 0.00014216487991893477, "loss": 0.0331, "step": 163030 }, { "epoch": 1.05, "learning_rate": 0.00014215519856457785, "loss": 0.0353, "step": 163040 }, { "epoch": 1.05, "learning_rate": 0.00014214551721022093, "loss": 0.0386, "step": 163050 }, { "epoch": 1.05, "learning_rate": 0.00014213583585586398, "loss": 0.0388, "step": 163060 }, { "epoch": 1.05, "learning_rate": 0.00014212615450150706, "loss": 0.0356, "step": 163070 }, { "epoch": 1.05, "learning_rate": 0.00014211647314715011, "loss": 0.0364, "step": 163080 }, { "epoch": 1.05, "learning_rate": 0.0001421067917927932, "loss": 0.0326, "step": 163090 }, { "epoch": 1.05, "learning_rate": 0.00014209711043843625, "loss": 0.0318, "step": 163100 }, { "epoch": 1.05, "learning_rate": 0.00014208742908407933, "loss": 0.0384, "step": 163110 }, { "epoch": 1.05, "learning_rate": 0.0001420777477297224, "loss": 0.0364, "step": 163120 }, { "epoch": 1.05, "learning_rate": 0.00014206806637536546, "loss": 0.0329, "step": 163130 }, { "epoch": 1.05, "learning_rate": 0.0001420583850210085, "loss": 0.0339, "step": 163140 }, { "epoch": 1.05, "learning_rate": 0.0001420487036666516, "loss": 0.0342, "step": 163150 }, { "epoch": 1.05, "learning_rate": 0.00014203902231229467, "loss": 0.0323, "step": 163160 }, { "epoch": 1.05, "learning_rate": 0.00014202934095793772, "loss": 0.0323, "step": 163170 }, { "epoch": 1.05, "learning_rate": 0.0001420196596035808, "loss": 0.0344, "step": 163180 }, { "epoch": 1.05, "learning_rate": 0.00014200997824922388, "loss": 0.0347, "step": 163190 }, { "epoch": 1.05, "learning_rate": 0.00014200029689486694, "loss": 0.034, "step": 163200 }, { "epoch": 1.05, "learning_rate": 0.00014199061554051, "loss": 0.0452, "step": 163210 }, { "epoch": 1.05, "learning_rate": 0.00014198093418615307, "loss": 0.0346, "step": 163220 }, { "epoch": 1.05, "learning_rate": 0.00014197125283179615, "loss": 0.0352, "step": 163230 }, { "epoch": 1.05, "learning_rate": 0.0001419615714774392, "loss": 0.0304, "step": 163240 }, { "epoch": 1.05, "learning_rate": 0.00014195189012308228, "loss": 0.031, "step": 163250 }, { "epoch": 1.05, "learning_rate": 0.00014194220876872533, "loss": 0.0404, "step": 163260 }, { "epoch": 1.05, "learning_rate": 0.0001419325274143684, "loss": 0.0284, "step": 163270 }, { "epoch": 1.05, "learning_rate": 0.00014192284606001147, "loss": 0.0363, "step": 163280 }, { "epoch": 1.05, "learning_rate": 0.00014191316470565455, "loss": 0.0363, "step": 163290 }, { "epoch": 1.05, "learning_rate": 0.00014190348335129763, "loss": 0.0344, "step": 163300 }, { "epoch": 1.05, "learning_rate": 0.00014189380199694068, "loss": 0.0342, "step": 163310 }, { "epoch": 1.05, "learning_rate": 0.00014188412064258376, "loss": 0.0358, "step": 163320 }, { "epoch": 1.05, "learning_rate": 0.0001418744392882268, "loss": 0.0325, "step": 163330 }, { "epoch": 1.05, "learning_rate": 0.00014186475793386986, "loss": 0.0344, "step": 163340 }, { "epoch": 1.05, "learning_rate": 0.00014185507657951294, "loss": 0.0332, "step": 163350 }, { "epoch": 1.05, "learning_rate": 0.00014184539522515602, "loss": 0.0382, "step": 163360 }, { "epoch": 1.05, "learning_rate": 0.0001418357138707991, "loss": 0.0396, "step": 163370 }, { "epoch": 1.05, "learning_rate": 0.00014182603251644216, "loss": 0.0318, "step": 163380 }, { "epoch": 1.05, "learning_rate": 0.00014181635116208524, "loss": 0.0374, "step": 163390 }, { "epoch": 1.05, "learning_rate": 0.0001418066698077283, "loss": 0.0368, "step": 163400 }, { "epoch": 1.05, "learning_rate": 0.00014179698845337134, "loss": 0.0345, "step": 163410 }, { "epoch": 1.05, "learning_rate": 0.00014178730709901442, "loss": 0.0346, "step": 163420 }, { "epoch": 1.05, "learning_rate": 0.0001417776257446575, "loss": 0.0435, "step": 163430 }, { "epoch": 1.05, "learning_rate": 0.00014176794439030058, "loss": 0.04, "step": 163440 }, { "epoch": 1.05, "learning_rate": 0.00014175826303594363, "loss": 0.0386, "step": 163450 }, { "epoch": 1.06, "learning_rate": 0.00014174858168158669, "loss": 0.0358, "step": 163460 }, { "epoch": 1.06, "learning_rate": 0.00014173890032722977, "loss": 0.0389, "step": 163470 }, { "epoch": 1.06, "learning_rate": 0.00014172921897287282, "loss": 0.0333, "step": 163480 }, { "epoch": 1.06, "learning_rate": 0.0001417195376185159, "loss": 0.0359, "step": 163490 }, { "epoch": 1.06, "learning_rate": 0.00014170985626415898, "loss": 0.0337, "step": 163500 }, { "epoch": 1.06, "learning_rate": 0.00014170017490980206, "loss": 0.0352, "step": 163510 }, { "epoch": 1.06, "learning_rate": 0.0001416904935554451, "loss": 0.0351, "step": 163520 }, { "epoch": 1.06, "learning_rate": 0.00014168081220108816, "loss": 0.0414, "step": 163530 }, { "epoch": 1.06, "learning_rate": 0.00014167113084673124, "loss": 0.0364, "step": 163540 }, { "epoch": 1.06, "learning_rate": 0.0001416614494923743, "loss": 0.0345, "step": 163550 }, { "epoch": 1.06, "learning_rate": 0.00014165176813801738, "loss": 0.0322, "step": 163560 }, { "epoch": 1.06, "learning_rate": 0.00014164208678366045, "loss": 0.0313, "step": 163570 }, { "epoch": 1.06, "learning_rate": 0.0001416324054293035, "loss": 0.0355, "step": 163580 }, { "epoch": 1.06, "learning_rate": 0.0001416227240749466, "loss": 0.03, "step": 163590 }, { "epoch": 1.06, "learning_rate": 0.00014161304272058964, "loss": 0.0314, "step": 163600 }, { "epoch": 1.06, "learning_rate": 0.00014160336136623272, "loss": 0.0329, "step": 163610 }, { "epoch": 1.06, "learning_rate": 0.00014159368001187577, "loss": 0.0351, "step": 163620 }, { "epoch": 1.06, "learning_rate": 0.00014158399865751885, "loss": 0.0338, "step": 163630 }, { "epoch": 1.06, "learning_rate": 0.00014157431730316193, "loss": 0.0323, "step": 163640 }, { "epoch": 1.06, "learning_rate": 0.00014156463594880498, "loss": 0.0297, "step": 163650 }, { "epoch": 1.06, "learning_rate": 0.00014155495459444804, "loss": 0.0349, "step": 163660 }, { "epoch": 1.06, "learning_rate": 0.00014154527324009112, "loss": 0.0335, "step": 163670 }, { "epoch": 1.06, "learning_rate": 0.0001415355918857342, "loss": 0.0342, "step": 163680 }, { "epoch": 1.06, "learning_rate": 0.00014152591053137725, "loss": 0.0343, "step": 163690 }, { "epoch": 1.06, "learning_rate": 0.00014151622917702033, "loss": 0.0293, "step": 163700 }, { "epoch": 1.06, "learning_rate": 0.0001415065478226634, "loss": 0.036, "step": 163710 }, { "epoch": 1.06, "learning_rate": 0.00014149686646830646, "loss": 0.0393, "step": 163720 }, { "epoch": 1.06, "learning_rate": 0.00014148718511394951, "loss": 0.0341, "step": 163730 }, { "epoch": 1.06, "learning_rate": 0.0001414775037595926, "loss": 0.0314, "step": 163740 }, { "epoch": 1.06, "learning_rate": 0.00014146782240523567, "loss": 0.038, "step": 163750 }, { "epoch": 1.06, "learning_rate": 0.00014145814105087873, "loss": 0.0321, "step": 163760 }, { "epoch": 1.06, "learning_rate": 0.0001414484596965218, "loss": 0.0301, "step": 163770 }, { "epoch": 1.06, "learning_rate": 0.00014143877834216486, "loss": 0.0351, "step": 163780 }, { "epoch": 1.06, "learning_rate": 0.00014142909698780794, "loss": 0.0356, "step": 163790 }, { "epoch": 1.06, "learning_rate": 0.000141419415633451, "loss": 0.0372, "step": 163800 }, { "epoch": 1.06, "learning_rate": 0.00014140973427909407, "loss": 0.0401, "step": 163810 }, { "epoch": 1.06, "learning_rate": 0.00014140005292473715, "loss": 0.0363, "step": 163820 }, { "epoch": 1.06, "learning_rate": 0.0001413903715703802, "loss": 0.0398, "step": 163830 }, { "epoch": 1.06, "learning_rate": 0.00014138069021602328, "loss": 0.0307, "step": 163840 }, { "epoch": 1.06, "learning_rate": 0.00014137100886166634, "loss": 0.0351, "step": 163850 }, { "epoch": 1.06, "learning_rate": 0.0001413613275073094, "loss": 0.0325, "step": 163860 }, { "epoch": 1.06, "learning_rate": 0.00014135164615295247, "loss": 0.0356, "step": 163870 }, { "epoch": 1.06, "learning_rate": 0.00014134196479859555, "loss": 0.032, "step": 163880 }, { "epoch": 1.06, "learning_rate": 0.00014133228344423863, "loss": 0.0332, "step": 163890 }, { "epoch": 1.06, "learning_rate": 0.00014132260208988168, "loss": 0.0274, "step": 163900 }, { "epoch": 1.06, "learning_rate": 0.00014131292073552476, "loss": 0.0346, "step": 163910 }, { "epoch": 1.06, "learning_rate": 0.00014130323938116781, "loss": 0.0489, "step": 163920 }, { "epoch": 1.06, "learning_rate": 0.00014129355802681087, "loss": 0.0384, "step": 163930 }, { "epoch": 1.06, "learning_rate": 0.00014128387667245395, "loss": 0.0361, "step": 163940 }, { "epoch": 1.06, "learning_rate": 0.00014127419531809703, "loss": 0.0387, "step": 163950 }, { "epoch": 1.06, "learning_rate": 0.0001412645139637401, "loss": 0.0358, "step": 163960 }, { "epoch": 1.06, "learning_rate": 0.00014125483260938316, "loss": 0.035, "step": 163970 }, { "epoch": 1.06, "learning_rate": 0.0001412451512550262, "loss": 0.0431, "step": 163980 }, { "epoch": 1.06, "learning_rate": 0.0001412354699006693, "loss": 0.0316, "step": 163990 }, { "epoch": 1.06, "learning_rate": 0.00014122578854631234, "loss": 0.0329, "step": 164000 }, { "epoch": 1.06, "eval_cer": 0.9199502881030392, "eval_loss": 0.024694031104445457, "eval_runtime": 120.2156, "eval_samples_per_second": 16.637, "eval_steps_per_second": 4.159, "step": 164000 }, { "epoch": 1.06, "learning_rate": 0.00014121610719195542, "loss": 0.0348, "step": 164010 }, { "epoch": 1.06, "learning_rate": 0.0001412064258375985, "loss": 0.0334, "step": 164020 }, { "epoch": 1.06, "learning_rate": 0.00014119674448324156, "loss": 0.0377, "step": 164030 }, { "epoch": 1.06, "learning_rate": 0.00014118706312888464, "loss": 0.033, "step": 164040 }, { "epoch": 1.06, "learning_rate": 0.0001411773817745277, "loss": 0.0391, "step": 164050 }, { "epoch": 1.06, "learning_rate": 0.00014116770042017077, "loss": 0.0366, "step": 164060 }, { "epoch": 1.06, "learning_rate": 0.00014115801906581382, "loss": 0.0321, "step": 164070 }, { "epoch": 1.06, "learning_rate": 0.0001411483377114569, "loss": 0.0377, "step": 164080 }, { "epoch": 1.06, "learning_rate": 0.00014113865635709998, "loss": 0.034, "step": 164090 }, { "epoch": 1.06, "learning_rate": 0.00014112897500274303, "loss": 0.0352, "step": 164100 }, { "epoch": 1.06, "learning_rate": 0.0001411192936483861, "loss": 0.0418, "step": 164110 }, { "epoch": 1.06, "learning_rate": 0.00014110961229402917, "loss": 0.032, "step": 164120 }, { "epoch": 1.06, "learning_rate": 0.00014109993093967225, "loss": 0.0336, "step": 164130 }, { "epoch": 1.06, "learning_rate": 0.0001410902495853153, "loss": 0.0342, "step": 164140 }, { "epoch": 1.06, "learning_rate": 0.00014108056823095838, "loss": 0.0324, "step": 164150 }, { "epoch": 1.06, "learning_rate": 0.00014107088687660146, "loss": 0.0336, "step": 164160 }, { "epoch": 1.06, "learning_rate": 0.0001410612055222445, "loss": 0.0289, "step": 164170 }, { "epoch": 1.06, "learning_rate": 0.00014105152416788756, "loss": 0.0342, "step": 164180 }, { "epoch": 1.06, "learning_rate": 0.00014104184281353064, "loss": 0.0363, "step": 164190 }, { "epoch": 1.06, "learning_rate": 0.00014103216145917372, "loss": 0.034, "step": 164200 }, { "epoch": 1.06, "learning_rate": 0.00014102248010481678, "loss": 0.0322, "step": 164210 }, { "epoch": 1.06, "learning_rate": 0.00014101279875045986, "loss": 0.0305, "step": 164220 }, { "epoch": 1.06, "learning_rate": 0.0001410031173961029, "loss": 0.0365, "step": 164230 }, { "epoch": 1.06, "learning_rate": 0.000140993436041746, "loss": 0.0333, "step": 164240 }, { "epoch": 1.06, "learning_rate": 0.00014098375468738904, "loss": 0.0355, "step": 164250 }, { "epoch": 1.06, "learning_rate": 0.00014097407333303212, "loss": 0.0353, "step": 164260 }, { "epoch": 1.06, "learning_rate": 0.0001409643919786752, "loss": 0.034, "step": 164270 }, { "epoch": 1.06, "learning_rate": 0.00014095471062431825, "loss": 0.0327, "step": 164280 }, { "epoch": 1.06, "learning_rate": 0.00014094502926996133, "loss": 0.0326, "step": 164290 }, { "epoch": 1.06, "learning_rate": 0.00014093534791560439, "loss": 0.0334, "step": 164300 }, { "epoch": 1.06, "learning_rate": 0.00014092566656124746, "loss": 0.0351, "step": 164310 }, { "epoch": 1.06, "learning_rate": 0.00014091598520689052, "loss": 0.033, "step": 164320 }, { "epoch": 1.06, "learning_rate": 0.0001409063038525336, "loss": 0.0319, "step": 164330 }, { "epoch": 1.06, "learning_rate": 0.00014089662249817668, "loss": 0.037, "step": 164340 }, { "epoch": 1.06, "learning_rate": 0.00014088694114381973, "loss": 0.0388, "step": 164350 }, { "epoch": 1.06, "learning_rate": 0.0001408772597894628, "loss": 0.0339, "step": 164360 }, { "epoch": 1.06, "learning_rate": 0.00014086757843510586, "loss": 0.0359, "step": 164370 }, { "epoch": 1.06, "learning_rate": 0.00014085789708074894, "loss": 0.0383, "step": 164380 }, { "epoch": 1.06, "learning_rate": 0.000140848215726392, "loss": 0.0361, "step": 164390 }, { "epoch": 1.06, "learning_rate": 0.00014083853437203507, "loss": 0.0302, "step": 164400 }, { "epoch": 1.06, "learning_rate": 0.00014082885301767815, "loss": 0.0361, "step": 164410 }, { "epoch": 1.06, "learning_rate": 0.0001408191716633212, "loss": 0.0295, "step": 164420 }, { "epoch": 1.06, "learning_rate": 0.0001408094903089643, "loss": 0.0359, "step": 164430 }, { "epoch": 1.06, "learning_rate": 0.00014079980895460734, "loss": 0.034, "step": 164440 }, { "epoch": 1.06, "learning_rate": 0.00014079012760025042, "loss": 0.0338, "step": 164450 }, { "epoch": 1.06, "learning_rate": 0.00014078044624589347, "loss": 0.0343, "step": 164460 }, { "epoch": 1.06, "learning_rate": 0.00014077076489153655, "loss": 0.0308, "step": 164470 }, { "epoch": 1.06, "learning_rate": 0.00014076108353717963, "loss": 0.0335, "step": 164480 }, { "epoch": 1.06, "learning_rate": 0.00014075140218282268, "loss": 0.0381, "step": 164490 }, { "epoch": 1.06, "learning_rate": 0.00014074172082846574, "loss": 0.031, "step": 164500 }, { "epoch": 1.06, "learning_rate": 0.00014073203947410882, "loss": 0.0398, "step": 164510 }, { "epoch": 1.06, "learning_rate": 0.0001407223581197519, "loss": 0.027, "step": 164520 }, { "epoch": 1.06, "learning_rate": 0.00014071267676539495, "loss": 0.0364, "step": 164530 }, { "epoch": 1.06, "learning_rate": 0.00014070299541103803, "loss": 0.0309, "step": 164540 }, { "epoch": 1.06, "learning_rate": 0.00014069331405668108, "loss": 0.0321, "step": 164550 }, { "epoch": 1.06, "learning_rate": 0.00014068363270232416, "loss": 0.0377, "step": 164560 }, { "epoch": 1.06, "learning_rate": 0.00014067395134796721, "loss": 0.0385, "step": 164570 }, { "epoch": 1.06, "learning_rate": 0.0001406642699936103, "loss": 0.0328, "step": 164580 }, { "epoch": 1.06, "learning_rate": 0.00014065458863925337, "loss": 0.039, "step": 164590 }, { "epoch": 1.06, "learning_rate": 0.00014064490728489643, "loss": 0.0303, "step": 164600 }, { "epoch": 1.06, "learning_rate": 0.0001406352259305395, "loss": 0.0351, "step": 164610 }, { "epoch": 1.06, "learning_rate": 0.00014062554457618256, "loss": 0.0317, "step": 164620 }, { "epoch": 1.06, "learning_rate": 0.00014061586322182564, "loss": 0.0399, "step": 164630 }, { "epoch": 1.06, "learning_rate": 0.0001406061818674687, "loss": 0.0332, "step": 164640 }, { "epoch": 1.06, "learning_rate": 0.00014059650051311177, "loss": 0.0331, "step": 164650 }, { "epoch": 1.06, "learning_rate": 0.00014058681915875485, "loss": 0.0324, "step": 164660 }, { "epoch": 1.06, "learning_rate": 0.0001405771378043979, "loss": 0.0368, "step": 164670 }, { "epoch": 1.06, "learning_rate": 0.00014056745645004098, "loss": 0.0343, "step": 164680 }, { "epoch": 1.06, "learning_rate": 0.00014055777509568404, "loss": 0.031, "step": 164690 }, { "epoch": 1.06, "learning_rate": 0.0001405480937413271, "loss": 0.0325, "step": 164700 }, { "epoch": 1.06, "learning_rate": 0.00014053841238697017, "loss": 0.032, "step": 164710 }, { "epoch": 1.06, "learning_rate": 0.00014052873103261325, "loss": 0.0392, "step": 164720 }, { "epoch": 1.06, "learning_rate": 0.00014051904967825633, "loss": 0.0345, "step": 164730 }, { "epoch": 1.06, "learning_rate": 0.00014050936832389938, "loss": 0.0394, "step": 164740 }, { "epoch": 1.06, "learning_rate": 0.00014049968696954243, "loss": 0.0337, "step": 164750 }, { "epoch": 1.06, "learning_rate": 0.0001404900056151855, "loss": 0.039, "step": 164760 }, { "epoch": 1.06, "learning_rate": 0.00014048032426082857, "loss": 0.0311, "step": 164770 }, { "epoch": 1.06, "learning_rate": 0.00014047064290647165, "loss": 0.0383, "step": 164780 }, { "epoch": 1.06, "learning_rate": 0.00014046096155211473, "loss": 0.0358, "step": 164790 }, { "epoch": 1.06, "learning_rate": 0.0001404512801977578, "loss": 0.0366, "step": 164800 }, { "epoch": 1.06, "learning_rate": 0.00014044159884340086, "loss": 0.038, "step": 164810 }, { "epoch": 1.06, "learning_rate": 0.0001404319174890439, "loss": 0.0387, "step": 164820 }, { "epoch": 1.06, "learning_rate": 0.000140422236134687, "loss": 0.0398, "step": 164830 }, { "epoch": 1.06, "learning_rate": 0.00014041255478033004, "loss": 0.0356, "step": 164840 }, { "epoch": 1.06, "learning_rate": 0.00014040287342597312, "loss": 0.0333, "step": 164850 }, { "epoch": 1.06, "learning_rate": 0.0001403931920716162, "loss": 0.0345, "step": 164860 }, { "epoch": 1.06, "learning_rate": 0.00014038351071725926, "loss": 0.0332, "step": 164870 }, { "epoch": 1.06, "learning_rate": 0.00014037382936290234, "loss": 0.0325, "step": 164880 }, { "epoch": 1.06, "learning_rate": 0.0001403641480085454, "loss": 0.0351, "step": 164890 }, { "epoch": 1.06, "learning_rate": 0.00014035446665418847, "loss": 0.0366, "step": 164900 }, { "epoch": 1.06, "learning_rate": 0.00014034478529983152, "loss": 0.0342, "step": 164910 }, { "epoch": 1.06, "learning_rate": 0.0001403351039454746, "loss": 0.045, "step": 164920 }, { "epoch": 1.06, "learning_rate": 0.00014032542259111768, "loss": 0.0308, "step": 164930 }, { "epoch": 1.06, "learning_rate": 0.00014031574123676073, "loss": 0.0359, "step": 164940 }, { "epoch": 1.06, "learning_rate": 0.00014030605988240379, "loss": 0.0403, "step": 164950 }, { "epoch": 1.06, "learning_rate": 0.00014029637852804687, "loss": 0.0343, "step": 164960 }, { "epoch": 1.06, "learning_rate": 0.00014028669717368995, "loss": 0.0327, "step": 164970 }, { "epoch": 1.06, "learning_rate": 0.000140277015819333, "loss": 0.0405, "step": 164980 }, { "epoch": 1.06, "learning_rate": 0.00014026733446497608, "loss": 0.038, "step": 164990 }, { "epoch": 1.06, "learning_rate": 0.00014025765311061916, "loss": 0.0393, "step": 165000 }, { "epoch": 1.06, "eval_cer": 0.9198345949610214, "eval_loss": 0.02478347346186638, "eval_runtime": 120.113, "eval_samples_per_second": 16.651, "eval_steps_per_second": 4.163, "step": 165000 }, { "epoch": 1.07, "learning_rate": 0.0001402479717562622, "loss": 0.0324, "step": 165010 }, { "epoch": 1.07, "learning_rate": 0.00014023829040190526, "loss": 0.0342, "step": 165020 }, { "epoch": 1.07, "learning_rate": 0.00014022860904754834, "loss": 0.0368, "step": 165030 }, { "epoch": 1.07, "learning_rate": 0.00014021892769319142, "loss": 0.0332, "step": 165040 }, { "epoch": 1.07, "learning_rate": 0.00014020924633883448, "loss": 0.0415, "step": 165050 }, { "epoch": 1.07, "learning_rate": 0.00014019956498447755, "loss": 0.0358, "step": 165060 }, { "epoch": 1.07, "learning_rate": 0.0001401898836301206, "loss": 0.0396, "step": 165070 }, { "epoch": 1.07, "learning_rate": 0.0001401802022757637, "loss": 0.0321, "step": 165080 }, { "epoch": 1.07, "learning_rate": 0.00014017052092140674, "loss": 0.035, "step": 165090 }, { "epoch": 1.07, "learning_rate": 0.00014016083956704982, "loss": 0.0384, "step": 165100 }, { "epoch": 1.07, "learning_rate": 0.0001401511582126929, "loss": 0.0346, "step": 165110 }, { "epoch": 1.07, "learning_rate": 0.00014014147685833595, "loss": 0.0337, "step": 165120 }, { "epoch": 1.07, "learning_rate": 0.00014013179550397903, "loss": 0.0328, "step": 165130 }, { "epoch": 1.07, "learning_rate": 0.00014012211414962208, "loss": 0.0376, "step": 165140 }, { "epoch": 1.07, "learning_rate": 0.00014011243279526516, "loss": 0.0354, "step": 165150 }, { "epoch": 1.07, "learning_rate": 0.00014010275144090822, "loss": 0.036, "step": 165160 }, { "epoch": 1.07, "learning_rate": 0.0001400930700865513, "loss": 0.0384, "step": 165170 }, { "epoch": 1.07, "learning_rate": 0.00014008338873219438, "loss": 0.0339, "step": 165180 }, { "epoch": 1.07, "learning_rate": 0.00014007370737783743, "loss": 0.0332, "step": 165190 }, { "epoch": 1.07, "learning_rate": 0.0001400640260234805, "loss": 0.0332, "step": 165200 }, { "epoch": 1.07, "learning_rate": 0.00014005434466912356, "loss": 0.0406, "step": 165210 }, { "epoch": 1.07, "learning_rate": 0.00014004466331476664, "loss": 0.0298, "step": 165220 }, { "epoch": 1.07, "learning_rate": 0.0001400349819604097, "loss": 0.0386, "step": 165230 }, { "epoch": 1.07, "learning_rate": 0.00014002530060605277, "loss": 0.0405, "step": 165240 }, { "epoch": 1.07, "learning_rate": 0.00014001561925169585, "loss": 0.0315, "step": 165250 }, { "epoch": 1.07, "learning_rate": 0.0001400059378973389, "loss": 0.0343, "step": 165260 }, { "epoch": 1.07, "learning_rate": 0.00013999625654298196, "loss": 0.0331, "step": 165270 }, { "epoch": 1.07, "learning_rate": 0.00013998657518862504, "loss": 0.0335, "step": 165280 }, { "epoch": 1.07, "learning_rate": 0.00013997689383426812, "loss": 0.0327, "step": 165290 }, { "epoch": 1.07, "learning_rate": 0.00013996721247991117, "loss": 0.0336, "step": 165300 }, { "epoch": 1.07, "learning_rate": 0.00013995753112555425, "loss": 0.0289, "step": 165310 }, { "epoch": 1.07, "learning_rate": 0.00013994784977119733, "loss": 0.0337, "step": 165320 }, { "epoch": 1.07, "learning_rate": 0.00013993816841684038, "loss": 0.0315, "step": 165330 }, { "epoch": 1.07, "learning_rate": 0.00013992848706248344, "loss": 0.0321, "step": 165340 }, { "epoch": 1.07, "learning_rate": 0.00013991880570812652, "loss": 0.032, "step": 165350 }, { "epoch": 1.07, "learning_rate": 0.0001399091243537696, "loss": 0.0321, "step": 165360 }, { "epoch": 1.07, "learning_rate": 0.00013989944299941265, "loss": 0.041, "step": 165370 }, { "epoch": 1.07, "learning_rate": 0.00013988976164505573, "loss": 0.0325, "step": 165380 }, { "epoch": 1.07, "learning_rate": 0.00013988008029069878, "loss": 0.0367, "step": 165390 }, { "epoch": 1.07, "learning_rate": 0.00013987039893634186, "loss": 0.0331, "step": 165400 }, { "epoch": 1.07, "learning_rate": 0.00013986071758198491, "loss": 0.0361, "step": 165410 }, { "epoch": 1.07, "learning_rate": 0.000139851036227628, "loss": 0.0335, "step": 165420 }, { "epoch": 1.07, "learning_rate": 0.00013984135487327107, "loss": 0.0348, "step": 165430 }, { "epoch": 1.07, "learning_rate": 0.00013983167351891413, "loss": 0.0336, "step": 165440 }, { "epoch": 1.07, "learning_rate": 0.0001398219921645572, "loss": 0.0376, "step": 165450 }, { "epoch": 1.07, "learning_rate": 0.00013981231081020026, "loss": 0.0304, "step": 165460 }, { "epoch": 1.07, "learning_rate": 0.0001398026294558433, "loss": 0.0325, "step": 165470 }, { "epoch": 1.07, "learning_rate": 0.0001397929481014864, "loss": 0.0334, "step": 165480 }, { "epoch": 1.07, "learning_rate": 0.00013978326674712947, "loss": 0.0329, "step": 165490 }, { "epoch": 1.07, "learning_rate": 0.00013977358539277255, "loss": 0.0343, "step": 165500 }, { "epoch": 1.07, "learning_rate": 0.0001397639040384156, "loss": 0.0359, "step": 165510 }, { "epoch": 1.07, "learning_rate": 0.00013975422268405868, "loss": 0.0354, "step": 165520 }, { "epoch": 1.07, "learning_rate": 0.00013974454132970174, "loss": 0.0308, "step": 165530 }, { "epoch": 1.07, "learning_rate": 0.0001397348599753448, "loss": 0.0359, "step": 165540 }, { "epoch": 1.07, "learning_rate": 0.00013972517862098787, "loss": 0.0389, "step": 165550 }, { "epoch": 1.07, "learning_rate": 0.00013971549726663095, "loss": 0.0279, "step": 165560 }, { "epoch": 1.07, "learning_rate": 0.00013970581591227403, "loss": 0.0295, "step": 165570 }, { "epoch": 1.07, "learning_rate": 0.00013969613455791708, "loss": 0.0285, "step": 165580 }, { "epoch": 1.07, "learning_rate": 0.00013968645320356013, "loss": 0.0364, "step": 165590 }, { "epoch": 1.07, "learning_rate": 0.0001396767718492032, "loss": 0.0274, "step": 165600 }, { "epoch": 1.07, "learning_rate": 0.00013966709049484627, "loss": 0.0344, "step": 165610 }, { "epoch": 1.07, "learning_rate": 0.00013965740914048935, "loss": 0.0304, "step": 165620 }, { "epoch": 1.07, "learning_rate": 0.00013964772778613243, "loss": 0.0314, "step": 165630 }, { "epoch": 1.07, "learning_rate": 0.00013963804643177548, "loss": 0.0288, "step": 165640 }, { "epoch": 1.07, "learning_rate": 0.00013962836507741856, "loss": 0.0401, "step": 165650 }, { "epoch": 1.07, "learning_rate": 0.0001396186837230616, "loss": 0.0314, "step": 165660 }, { "epoch": 1.07, "learning_rate": 0.0001396090023687047, "loss": 0.0325, "step": 165670 }, { "epoch": 1.07, "learning_rate": 0.00013959932101434774, "loss": 0.031, "step": 165680 }, { "epoch": 1.07, "learning_rate": 0.00013958963965999082, "loss": 0.0371, "step": 165690 }, { "epoch": 1.07, "learning_rate": 0.0001395799583056339, "loss": 0.0367, "step": 165700 }, { "epoch": 1.07, "learning_rate": 0.00013957027695127696, "loss": 0.0376, "step": 165710 }, { "epoch": 1.07, "learning_rate": 0.00013956059559692004, "loss": 0.0356, "step": 165720 }, { "epoch": 1.07, "learning_rate": 0.0001395509142425631, "loss": 0.0329, "step": 165730 }, { "epoch": 1.07, "learning_rate": 0.00013954123288820617, "loss": 0.0365, "step": 165740 }, { "epoch": 1.07, "learning_rate": 0.00013953155153384922, "loss": 0.0436, "step": 165750 }, { "epoch": 1.07, "learning_rate": 0.0001395218701794923, "loss": 0.0292, "step": 165760 }, { "epoch": 1.07, "learning_rate": 0.00013951218882513538, "loss": 0.0336, "step": 165770 }, { "epoch": 1.07, "learning_rate": 0.00013950250747077843, "loss": 0.0375, "step": 165780 }, { "epoch": 1.07, "learning_rate": 0.00013949282611642149, "loss": 0.0303, "step": 165790 }, { "epoch": 1.07, "learning_rate": 0.00013948314476206456, "loss": 0.0289, "step": 165800 }, { "epoch": 1.07, "learning_rate": 0.00013947346340770764, "loss": 0.0291, "step": 165810 }, { "epoch": 1.07, "learning_rate": 0.0001394637820533507, "loss": 0.0353, "step": 165820 }, { "epoch": 1.07, "learning_rate": 0.00013945410069899378, "loss": 0.0315, "step": 165830 }, { "epoch": 1.07, "learning_rate": 0.00013944441934463683, "loss": 0.0369, "step": 165840 }, { "epoch": 1.07, "learning_rate": 0.0001394347379902799, "loss": 0.0291, "step": 165850 }, { "epoch": 1.07, "learning_rate": 0.00013942505663592296, "loss": 0.0313, "step": 165860 }, { "epoch": 1.07, "learning_rate": 0.00013941537528156604, "loss": 0.0317, "step": 165870 }, { "epoch": 1.07, "learning_rate": 0.00013940569392720912, "loss": 0.0329, "step": 165880 }, { "epoch": 1.07, "learning_rate": 0.00013939601257285217, "loss": 0.0367, "step": 165890 }, { "epoch": 1.07, "learning_rate": 0.00013938633121849525, "loss": 0.0344, "step": 165900 }, { "epoch": 1.07, "learning_rate": 0.0001393766498641383, "loss": 0.0281, "step": 165910 }, { "epoch": 1.07, "learning_rate": 0.0001393669685097814, "loss": 0.0348, "step": 165920 }, { "epoch": 1.07, "learning_rate": 0.00013935728715542444, "loss": 0.0336, "step": 165930 }, { "epoch": 1.07, "learning_rate": 0.00013934760580106752, "loss": 0.0389, "step": 165940 }, { "epoch": 1.07, "learning_rate": 0.0001393379244467106, "loss": 0.032, "step": 165950 }, { "epoch": 1.07, "learning_rate": 0.00013932824309235365, "loss": 0.0386, "step": 165960 }, { "epoch": 1.07, "learning_rate": 0.00013931856173799673, "loss": 0.0385, "step": 165970 }, { "epoch": 1.07, "learning_rate": 0.00013930888038363978, "loss": 0.0404, "step": 165980 }, { "epoch": 1.07, "learning_rate": 0.00013929919902928286, "loss": 0.0343, "step": 165990 }, { "epoch": 1.07, "learning_rate": 0.00013928951767492592, "loss": 0.0352, "step": 166000 }, { "epoch": 1.07, "eval_cer": 0.9198219410236131, "eval_loss": 0.02429656684398651, "eval_runtime": 120.1547, "eval_samples_per_second": 16.645, "eval_steps_per_second": 4.161, "step": 166000 }, { "epoch": 1.07, "learning_rate": 0.000139279836320569, "loss": 0.0322, "step": 166010 }, { "epoch": 1.07, "learning_rate": 0.00013927015496621208, "loss": 0.0341, "step": 166020 }, { "epoch": 1.07, "learning_rate": 0.00013926047361185513, "loss": 0.0379, "step": 166030 }, { "epoch": 1.07, "learning_rate": 0.00013925079225749818, "loss": 0.0401, "step": 166040 }, { "epoch": 1.07, "learning_rate": 0.00013924111090314126, "loss": 0.0321, "step": 166050 }, { "epoch": 1.07, "learning_rate": 0.00013923142954878434, "loss": 0.0371, "step": 166060 }, { "epoch": 1.07, "learning_rate": 0.0001392217481944274, "loss": 0.0357, "step": 166070 }, { "epoch": 1.07, "learning_rate": 0.00013921206684007047, "loss": 0.033, "step": 166080 }, { "epoch": 1.07, "learning_rate": 0.00013920238548571355, "loss": 0.0354, "step": 166090 }, { "epoch": 1.07, "learning_rate": 0.0001391927041313566, "loss": 0.0375, "step": 166100 }, { "epoch": 1.07, "learning_rate": 0.00013918302277699966, "loss": 0.0396, "step": 166110 }, { "epoch": 1.07, "learning_rate": 0.00013917334142264274, "loss": 0.034, "step": 166120 }, { "epoch": 1.07, "learning_rate": 0.00013916366006828582, "loss": 0.0356, "step": 166130 }, { "epoch": 1.07, "learning_rate": 0.00013915397871392887, "loss": 0.0329, "step": 166140 }, { "epoch": 1.07, "learning_rate": 0.00013914429735957195, "loss": 0.0275, "step": 166150 }, { "epoch": 1.07, "learning_rate": 0.000139134616005215, "loss": 0.0356, "step": 166160 }, { "epoch": 1.07, "learning_rate": 0.00013912493465085808, "loss": 0.0338, "step": 166170 }, { "epoch": 1.07, "learning_rate": 0.00013911525329650114, "loss": 0.0357, "step": 166180 }, { "epoch": 1.07, "learning_rate": 0.00013910557194214422, "loss": 0.0349, "step": 166190 }, { "epoch": 1.07, "learning_rate": 0.0001390958905877873, "loss": 0.0367, "step": 166200 }, { "epoch": 1.07, "learning_rate": 0.00013908620923343035, "loss": 0.0328, "step": 166210 }, { "epoch": 1.07, "learning_rate": 0.00013907652787907343, "loss": 0.0365, "step": 166220 }, { "epoch": 1.07, "learning_rate": 0.00013906684652471648, "loss": 0.0293, "step": 166230 }, { "epoch": 1.07, "learning_rate": 0.00013905716517035953, "loss": 0.0368, "step": 166240 }, { "epoch": 1.07, "learning_rate": 0.0001390474838160026, "loss": 0.0335, "step": 166250 }, { "epoch": 1.07, "learning_rate": 0.0001390378024616457, "loss": 0.032, "step": 166260 }, { "epoch": 1.07, "learning_rate": 0.00013902812110728877, "loss": 0.0345, "step": 166270 }, { "epoch": 1.07, "learning_rate": 0.00013901843975293183, "loss": 0.0338, "step": 166280 }, { "epoch": 1.07, "learning_rate": 0.0001390087583985749, "loss": 0.0291, "step": 166290 }, { "epoch": 1.07, "learning_rate": 0.00013899907704421796, "loss": 0.0352, "step": 166300 }, { "epoch": 1.07, "learning_rate": 0.000138989395689861, "loss": 0.0365, "step": 166310 }, { "epoch": 1.07, "learning_rate": 0.0001389797143355041, "loss": 0.0347, "step": 166320 }, { "epoch": 1.07, "learning_rate": 0.00013897003298114717, "loss": 0.0336, "step": 166330 }, { "epoch": 1.07, "learning_rate": 0.00013896035162679025, "loss": 0.0377, "step": 166340 }, { "epoch": 1.07, "learning_rate": 0.0001389506702724333, "loss": 0.0384, "step": 166350 }, { "epoch": 1.07, "learning_rate": 0.00013894098891807636, "loss": 0.0386, "step": 166360 }, { "epoch": 1.07, "learning_rate": 0.00013893130756371944, "loss": 0.0346, "step": 166370 }, { "epoch": 1.07, "learning_rate": 0.0001389216262093625, "loss": 0.0347, "step": 166380 }, { "epoch": 1.07, "learning_rate": 0.00013891194485500557, "loss": 0.0365, "step": 166390 }, { "epoch": 1.07, "learning_rate": 0.00013890226350064865, "loss": 0.0283, "step": 166400 }, { "epoch": 1.07, "learning_rate": 0.00013889258214629173, "loss": 0.0324, "step": 166410 }, { "epoch": 1.07, "learning_rate": 0.00013888290079193478, "loss": 0.0336, "step": 166420 }, { "epoch": 1.07, "learning_rate": 0.00013887321943757783, "loss": 0.0355, "step": 166430 }, { "epoch": 1.07, "learning_rate": 0.0001388635380832209, "loss": 0.0321, "step": 166440 }, { "epoch": 1.07, "learning_rate": 0.00013885385672886397, "loss": 0.0325, "step": 166450 }, { "epoch": 1.07, "learning_rate": 0.00013884417537450705, "loss": 0.029, "step": 166460 }, { "epoch": 1.07, "learning_rate": 0.00013883449402015012, "loss": 0.0326, "step": 166470 }, { "epoch": 1.07, "learning_rate": 0.00013882481266579318, "loss": 0.0334, "step": 166480 }, { "epoch": 1.07, "learning_rate": 0.00013881513131143626, "loss": 0.0348, "step": 166490 }, { "epoch": 1.07, "learning_rate": 0.0001388054499570793, "loss": 0.0304, "step": 166500 }, { "epoch": 1.07, "learning_rate": 0.0001387957686027224, "loss": 0.0372, "step": 166510 }, { "epoch": 1.07, "learning_rate": 0.00013878608724836544, "loss": 0.0334, "step": 166520 }, { "epoch": 1.07, "learning_rate": 0.00013877640589400852, "loss": 0.0373, "step": 166530 }, { "epoch": 1.07, "learning_rate": 0.0001387667245396516, "loss": 0.0395, "step": 166540 }, { "epoch": 1.07, "learning_rate": 0.00013875704318529465, "loss": 0.0346, "step": 166550 }, { "epoch": 1.08, "learning_rate": 0.0001387473618309377, "loss": 0.0359, "step": 166560 }, { "epoch": 1.08, "learning_rate": 0.0001387376804765808, "loss": 0.0331, "step": 166570 }, { "epoch": 1.08, "learning_rate": 0.00013872799912222387, "loss": 0.0318, "step": 166580 }, { "epoch": 1.08, "learning_rate": 0.00013871831776786692, "loss": 0.0309, "step": 166590 }, { "epoch": 1.08, "learning_rate": 0.00013870863641351, "loss": 0.0336, "step": 166600 }, { "epoch": 1.08, "learning_rate": 0.00013869895505915308, "loss": 0.0339, "step": 166610 }, { "epoch": 1.08, "learning_rate": 0.00013868927370479613, "loss": 0.0321, "step": 166620 }, { "epoch": 1.08, "learning_rate": 0.00013867959235043918, "loss": 0.0319, "step": 166630 }, { "epoch": 1.08, "learning_rate": 0.00013866991099608226, "loss": 0.0401, "step": 166640 }, { "epoch": 1.08, "learning_rate": 0.00013866022964172534, "loss": 0.0326, "step": 166650 }, { "epoch": 1.08, "learning_rate": 0.0001386505482873684, "loss": 0.0336, "step": 166660 }, { "epoch": 1.08, "learning_rate": 0.00013864086693301148, "loss": 0.0397, "step": 166670 }, { "epoch": 1.08, "learning_rate": 0.00013863118557865453, "loss": 0.0307, "step": 166680 }, { "epoch": 1.08, "learning_rate": 0.0001386215042242976, "loss": 0.0318, "step": 166690 }, { "epoch": 1.08, "learning_rate": 0.00013861182286994066, "loss": 0.0371, "step": 166700 }, { "epoch": 1.08, "learning_rate": 0.00013860214151558374, "loss": 0.0343, "step": 166710 }, { "epoch": 1.08, "learning_rate": 0.00013859246016122682, "loss": 0.0311, "step": 166720 }, { "epoch": 1.08, "learning_rate": 0.00013858277880686987, "loss": 0.0279, "step": 166730 }, { "epoch": 1.08, "learning_rate": 0.00013857309745251295, "loss": 0.0463, "step": 166740 }, { "epoch": 1.08, "learning_rate": 0.000138563416098156, "loss": 0.0292, "step": 166750 }, { "epoch": 1.08, "learning_rate": 0.0001385537347437991, "loss": 0.0314, "step": 166760 }, { "epoch": 1.08, "learning_rate": 0.00013854405338944214, "loss": 0.0345, "step": 166770 }, { "epoch": 1.08, "learning_rate": 0.00013853437203508522, "loss": 0.0459, "step": 166780 }, { "epoch": 1.08, "learning_rate": 0.0001385246906807283, "loss": 0.0378, "step": 166790 }, { "epoch": 1.08, "learning_rate": 0.00013851500932637135, "loss": 0.034, "step": 166800 }, { "epoch": 1.08, "learning_rate": 0.00013850532797201443, "loss": 0.0325, "step": 166810 }, { "epoch": 1.08, "learning_rate": 0.00013849564661765748, "loss": 0.0303, "step": 166820 }, { "epoch": 1.08, "learning_rate": 0.00013848596526330056, "loss": 0.0329, "step": 166830 }, { "epoch": 1.08, "learning_rate": 0.00013847628390894362, "loss": 0.0344, "step": 166840 }, { "epoch": 1.08, "learning_rate": 0.0001384666025545867, "loss": 0.0326, "step": 166850 }, { "epoch": 1.08, "learning_rate": 0.00013845692120022978, "loss": 0.033, "step": 166860 }, { "epoch": 1.08, "learning_rate": 0.00013844723984587283, "loss": 0.03, "step": 166870 }, { "epoch": 1.08, "learning_rate": 0.00013843755849151588, "loss": 0.0406, "step": 166880 }, { "epoch": 1.08, "learning_rate": 0.00013842787713715896, "loss": 0.0331, "step": 166890 }, { "epoch": 1.08, "learning_rate": 0.00013841819578280204, "loss": 0.0316, "step": 166900 }, { "epoch": 1.08, "learning_rate": 0.0001384085144284451, "loss": 0.0317, "step": 166910 }, { "epoch": 1.08, "learning_rate": 0.00013839883307408817, "loss": 0.0348, "step": 166920 }, { "epoch": 1.08, "learning_rate": 0.00013838915171973123, "loss": 0.0323, "step": 166930 }, { "epoch": 1.08, "learning_rate": 0.0001383794703653743, "loss": 0.0344, "step": 166940 }, { "epoch": 1.08, "learning_rate": 0.00013836978901101736, "loss": 0.0346, "step": 166950 }, { "epoch": 1.08, "learning_rate": 0.00013836010765666044, "loss": 0.0354, "step": 166960 }, { "epoch": 1.08, "learning_rate": 0.00013835042630230352, "loss": 0.0356, "step": 166970 }, { "epoch": 1.08, "learning_rate": 0.00013834074494794657, "loss": 0.0316, "step": 166980 }, { "epoch": 1.08, "learning_rate": 0.00013833106359358965, "loss": 0.0351, "step": 166990 }, { "epoch": 1.08, "learning_rate": 0.0001383213822392327, "loss": 0.0319, "step": 167000 }, { "epoch": 1.08, "eval_cer": 0.919931307196927, "eval_loss": 0.02439761720597744, "eval_runtime": 120.0555, "eval_samples_per_second": 16.659, "eval_steps_per_second": 4.165, "step": 167000 }, { "epoch": 1.08, "learning_rate": 0.00013831170088487578, "loss": 0.0326, "step": 167010 }, { "epoch": 1.08, "learning_rate": 0.00013830201953051884, "loss": 0.0288, "step": 167020 }, { "epoch": 1.08, "learning_rate": 0.00013829233817616192, "loss": 0.035, "step": 167030 }, { "epoch": 1.08, "learning_rate": 0.00013828265682180497, "loss": 0.0323, "step": 167040 }, { "epoch": 1.08, "learning_rate": 0.00013827297546744805, "loss": 0.038, "step": 167050 }, { "epoch": 1.08, "learning_rate": 0.00013826329411309113, "loss": 0.0404, "step": 167060 }, { "epoch": 1.08, "learning_rate": 0.00013825361275873418, "loss": 0.0308, "step": 167070 }, { "epoch": 1.08, "learning_rate": 0.00013824393140437723, "loss": 0.0345, "step": 167080 }, { "epoch": 1.08, "learning_rate": 0.0001382342500500203, "loss": 0.0317, "step": 167090 }, { "epoch": 1.08, "learning_rate": 0.0001382245686956634, "loss": 0.0316, "step": 167100 }, { "epoch": 1.08, "learning_rate": 0.00013821488734130645, "loss": 0.0335, "step": 167110 }, { "epoch": 1.08, "learning_rate": 0.00013820520598694953, "loss": 0.0366, "step": 167120 }, { "epoch": 1.08, "learning_rate": 0.00013819552463259258, "loss": 0.0315, "step": 167130 }, { "epoch": 1.08, "learning_rate": 0.00013818584327823566, "loss": 0.0375, "step": 167140 }, { "epoch": 1.08, "learning_rate": 0.0001381761619238787, "loss": 0.034, "step": 167150 }, { "epoch": 1.08, "learning_rate": 0.0001381664805695218, "loss": 0.0339, "step": 167160 }, { "epoch": 1.08, "learning_rate": 0.00013815679921516487, "loss": 0.0314, "step": 167170 }, { "epoch": 1.08, "learning_rate": 0.00013814711786080792, "loss": 0.0292, "step": 167180 }, { "epoch": 1.08, "learning_rate": 0.000138137436506451, "loss": 0.0315, "step": 167190 }, { "epoch": 1.08, "learning_rate": 0.00013812775515209406, "loss": 0.0322, "step": 167200 }, { "epoch": 1.08, "learning_rate": 0.00013811807379773714, "loss": 0.032, "step": 167210 }, { "epoch": 1.08, "learning_rate": 0.0001381083924433802, "loss": 0.0318, "step": 167220 }, { "epoch": 1.08, "learning_rate": 0.00013809871108902327, "loss": 0.0293, "step": 167230 }, { "epoch": 1.08, "learning_rate": 0.00013808902973466635, "loss": 0.0304, "step": 167240 }, { "epoch": 1.08, "learning_rate": 0.0001380793483803094, "loss": 0.0319, "step": 167250 }, { "epoch": 1.08, "learning_rate": 0.00013806966702595248, "loss": 0.0332, "step": 167260 }, { "epoch": 1.08, "learning_rate": 0.00013805998567159553, "loss": 0.0357, "step": 167270 }, { "epoch": 1.08, "learning_rate": 0.0001380503043172386, "loss": 0.0307, "step": 167280 }, { "epoch": 1.08, "learning_rate": 0.00013804062296288167, "loss": 0.0365, "step": 167290 }, { "epoch": 1.08, "learning_rate": 0.00013803094160852474, "loss": 0.0352, "step": 167300 }, { "epoch": 1.08, "learning_rate": 0.00013802126025416782, "loss": 0.0307, "step": 167310 }, { "epoch": 1.08, "learning_rate": 0.00013801157889981088, "loss": 0.0346, "step": 167320 }, { "epoch": 1.08, "learning_rate": 0.00013800189754545393, "loss": 0.0306, "step": 167330 }, { "epoch": 1.08, "learning_rate": 0.000137992216191097, "loss": 0.0319, "step": 167340 }, { "epoch": 1.08, "learning_rate": 0.0001379825348367401, "loss": 0.0353, "step": 167350 }, { "epoch": 1.08, "learning_rate": 0.00013797285348238314, "loss": 0.0328, "step": 167360 }, { "epoch": 1.08, "learning_rate": 0.00013796317212802622, "loss": 0.0346, "step": 167370 }, { "epoch": 1.08, "learning_rate": 0.0001379534907736693, "loss": 0.0356, "step": 167380 }, { "epoch": 1.08, "learning_rate": 0.00013794380941931235, "loss": 0.0317, "step": 167390 }, { "epoch": 1.08, "learning_rate": 0.0001379341280649554, "loss": 0.0312, "step": 167400 }, { "epoch": 1.08, "learning_rate": 0.0001379244467105985, "loss": 0.0396, "step": 167410 }, { "epoch": 1.08, "learning_rate": 0.00013791476535624157, "loss": 0.0307, "step": 167420 }, { "epoch": 1.08, "learning_rate": 0.00013790508400188462, "loss": 0.0302, "step": 167430 }, { "epoch": 1.08, "learning_rate": 0.0001378954026475277, "loss": 0.0299, "step": 167440 }, { "epoch": 1.08, "learning_rate": 0.00013788572129317075, "loss": 0.033, "step": 167450 }, { "epoch": 1.08, "learning_rate": 0.00013787603993881383, "loss": 0.0326, "step": 167460 }, { "epoch": 1.08, "learning_rate": 0.00013786635858445688, "loss": 0.0327, "step": 167470 }, { "epoch": 1.08, "learning_rate": 0.00013785667723009996, "loss": 0.0368, "step": 167480 }, { "epoch": 1.08, "learning_rate": 0.00013784699587574304, "loss": 0.0379, "step": 167490 }, { "epoch": 1.08, "learning_rate": 0.0001378373145213861, "loss": 0.0345, "step": 167500 }, { "epoch": 1.08, "learning_rate": 0.00013782763316702918, "loss": 0.0305, "step": 167510 }, { "epoch": 1.08, "learning_rate": 0.00013781795181267223, "loss": 0.0362, "step": 167520 }, { "epoch": 1.08, "learning_rate": 0.00013780827045831528, "loss": 0.0323, "step": 167530 }, { "epoch": 1.08, "learning_rate": 0.00013779858910395836, "loss": 0.0342, "step": 167540 }, { "epoch": 1.08, "learning_rate": 0.00013778890774960144, "loss": 0.0372, "step": 167550 }, { "epoch": 1.08, "learning_rate": 0.00013777922639524452, "loss": 0.0299, "step": 167560 }, { "epoch": 1.08, "learning_rate": 0.00013776954504088757, "loss": 0.0297, "step": 167570 }, { "epoch": 1.08, "learning_rate": 0.00013775986368653065, "loss": 0.0283, "step": 167580 }, { "epoch": 1.08, "learning_rate": 0.0001377501823321737, "loss": 0.0304, "step": 167590 }, { "epoch": 1.08, "learning_rate": 0.00013774050097781676, "loss": 0.0383, "step": 167600 }, { "epoch": 1.08, "learning_rate": 0.00013773081962345984, "loss": 0.0338, "step": 167610 }, { "epoch": 1.08, "learning_rate": 0.00013772113826910292, "loss": 0.0399, "step": 167620 }, { "epoch": 1.08, "learning_rate": 0.000137711456914746, "loss": 0.0384, "step": 167630 }, { "epoch": 1.08, "learning_rate": 0.00013770177556038905, "loss": 0.0367, "step": 167640 }, { "epoch": 1.08, "learning_rate": 0.0001376920942060321, "loss": 0.0343, "step": 167650 }, { "epoch": 1.08, "learning_rate": 0.00013768241285167518, "loss": 0.0308, "step": 167660 }, { "epoch": 1.08, "learning_rate": 0.00013767273149731824, "loss": 0.039, "step": 167670 }, { "epoch": 1.08, "learning_rate": 0.00013766305014296132, "loss": 0.0382, "step": 167680 }, { "epoch": 1.08, "learning_rate": 0.0001376533687886044, "loss": 0.0356, "step": 167690 }, { "epoch": 1.08, "learning_rate": 0.00013764368743424748, "loss": 0.0326, "step": 167700 }, { "epoch": 1.08, "learning_rate": 0.00013763400607989053, "loss": 0.041, "step": 167710 }, { "epoch": 1.08, "learning_rate": 0.00013762432472553358, "loss": 0.033, "step": 167720 }, { "epoch": 1.08, "learning_rate": 0.00013761464337117666, "loss": 0.0327, "step": 167730 }, { "epoch": 1.08, "learning_rate": 0.0001376049620168197, "loss": 0.0359, "step": 167740 }, { "epoch": 1.08, "learning_rate": 0.0001375952806624628, "loss": 0.042, "step": 167750 }, { "epoch": 1.08, "learning_rate": 0.00013758559930810587, "loss": 0.0335, "step": 167760 }, { "epoch": 1.08, "learning_rate": 0.00013757591795374893, "loss": 0.0358, "step": 167770 }, { "epoch": 1.08, "learning_rate": 0.000137566236599392, "loss": 0.0351, "step": 167780 }, { "epoch": 1.08, "learning_rate": 0.00013755655524503506, "loss": 0.0363, "step": 167790 }, { "epoch": 1.08, "learning_rate": 0.00013754687389067814, "loss": 0.0387, "step": 167800 }, { "epoch": 1.08, "learning_rate": 0.0001375371925363212, "loss": 0.0339, "step": 167810 }, { "epoch": 1.08, "learning_rate": 0.00013752751118196427, "loss": 0.0275, "step": 167820 }, { "epoch": 1.08, "learning_rate": 0.00013751782982760735, "loss": 0.0378, "step": 167830 }, { "epoch": 1.08, "learning_rate": 0.0001375081484732504, "loss": 0.0299, "step": 167840 }, { "epoch": 1.08, "learning_rate": 0.00013749846711889346, "loss": 0.0303, "step": 167850 }, { "epoch": 1.08, "learning_rate": 0.00013748878576453654, "loss": 0.0329, "step": 167860 }, { "epoch": 1.08, "learning_rate": 0.00013747910441017962, "loss": 0.0376, "step": 167870 }, { "epoch": 1.08, "learning_rate": 0.00013746942305582267, "loss": 0.0287, "step": 167880 }, { "epoch": 1.08, "learning_rate": 0.00013745974170146575, "loss": 0.0306, "step": 167890 }, { "epoch": 1.08, "learning_rate": 0.00013745006034710883, "loss": 0.0363, "step": 167900 }, { "epoch": 1.08, "learning_rate": 0.00013744037899275188, "loss": 0.0311, "step": 167910 }, { "epoch": 1.08, "learning_rate": 0.00013743069763839493, "loss": 0.0343, "step": 167920 }, { "epoch": 1.08, "learning_rate": 0.000137421016284038, "loss": 0.0344, "step": 167930 }, { "epoch": 1.08, "learning_rate": 0.0001374113349296811, "loss": 0.0298, "step": 167940 }, { "epoch": 1.08, "learning_rate": 0.00013740165357532415, "loss": 0.0348, "step": 167950 }, { "epoch": 1.08, "learning_rate": 0.00013739197222096722, "loss": 0.0306, "step": 167960 }, { "epoch": 1.08, "learning_rate": 0.00013738229086661028, "loss": 0.0333, "step": 167970 }, { "epoch": 1.08, "learning_rate": 0.00013737260951225336, "loss": 0.0335, "step": 167980 }, { "epoch": 1.08, "learning_rate": 0.0001373629281578964, "loss": 0.0299, "step": 167990 }, { "epoch": 1.08, "learning_rate": 0.0001373532468035395, "loss": 0.0315, "step": 168000 }, { "epoch": 1.08, "eval_cer": 0.9197975370014687, "eval_loss": 0.025038884952664375, "eval_runtime": 120.1957, "eval_samples_per_second": 16.64, "eval_steps_per_second": 4.16, "step": 168000 }, { "epoch": 1.08, "learning_rate": 0.00013734356544918257, "loss": 0.032, "step": 168010 }, { "epoch": 1.08, "learning_rate": 0.00013733388409482562, "loss": 0.0329, "step": 168020 }, { "epoch": 1.08, "learning_rate": 0.0001373242027404687, "loss": 0.0369, "step": 168030 }, { "epoch": 1.08, "learning_rate": 0.00013731452138611175, "loss": 0.0352, "step": 168040 }, { "epoch": 1.08, "learning_rate": 0.00013730484003175483, "loss": 0.0345, "step": 168050 }, { "epoch": 1.08, "learning_rate": 0.0001372951586773979, "loss": 0.0385, "step": 168060 }, { "epoch": 1.08, "learning_rate": 0.00013728547732304097, "loss": 0.0317, "step": 168070 }, { "epoch": 1.08, "learning_rate": 0.00013727579596868405, "loss": 0.0367, "step": 168080 }, { "epoch": 1.08, "learning_rate": 0.0001372661146143271, "loss": 0.0338, "step": 168090 }, { "epoch": 1.08, "learning_rate": 0.00013725643325997018, "loss": 0.0355, "step": 168100 }, { "epoch": 1.09, "learning_rate": 0.00013724675190561323, "loss": 0.0461, "step": 168110 }, { "epoch": 1.09, "learning_rate": 0.0001372370705512563, "loss": 0.0359, "step": 168120 }, { "epoch": 1.09, "learning_rate": 0.00013722738919689936, "loss": 0.0339, "step": 168130 }, { "epoch": 1.09, "learning_rate": 0.00013721770784254244, "loss": 0.0359, "step": 168140 }, { "epoch": 1.09, "learning_rate": 0.00013720802648818552, "loss": 0.0297, "step": 168150 }, { "epoch": 1.09, "learning_rate": 0.00013719834513382858, "loss": 0.0328, "step": 168160 }, { "epoch": 1.09, "learning_rate": 0.00013718866377947163, "loss": 0.0355, "step": 168170 }, { "epoch": 1.09, "learning_rate": 0.0001371789824251147, "loss": 0.038, "step": 168180 }, { "epoch": 1.09, "learning_rate": 0.0001371693010707578, "loss": 0.0357, "step": 168190 }, { "epoch": 1.09, "learning_rate": 0.00013715961971640084, "loss": 0.0329, "step": 168200 }, { "epoch": 1.09, "learning_rate": 0.00013714993836204392, "loss": 0.033, "step": 168210 }, { "epoch": 1.09, "learning_rate": 0.00013714025700768697, "loss": 0.0375, "step": 168220 }, { "epoch": 1.09, "learning_rate": 0.00013713057565333005, "loss": 0.0318, "step": 168230 }, { "epoch": 1.09, "learning_rate": 0.0001371208942989731, "loss": 0.0323, "step": 168240 }, { "epoch": 1.09, "learning_rate": 0.0001371112129446162, "loss": 0.0343, "step": 168250 }, { "epoch": 1.09, "learning_rate": 0.00013710153159025927, "loss": 0.0303, "step": 168260 }, { "epoch": 1.09, "learning_rate": 0.00013709185023590232, "loss": 0.0356, "step": 168270 }, { "epoch": 1.09, "learning_rate": 0.0001370821688815454, "loss": 0.0318, "step": 168280 }, { "epoch": 1.09, "learning_rate": 0.00013707248752718845, "loss": 0.032, "step": 168290 }, { "epoch": 1.09, "learning_rate": 0.00013706280617283153, "loss": 0.0327, "step": 168300 }, { "epoch": 1.09, "learning_rate": 0.00013705312481847458, "loss": 0.0378, "step": 168310 }, { "epoch": 1.09, "learning_rate": 0.00013704344346411766, "loss": 0.0341, "step": 168320 }, { "epoch": 1.09, "learning_rate": 0.00013703376210976074, "loss": 0.0334, "step": 168330 }, { "epoch": 1.09, "learning_rate": 0.0001370240807554038, "loss": 0.04, "step": 168340 }, { "epoch": 1.09, "learning_rate": 0.00013701439940104688, "loss": 0.0299, "step": 168350 }, { "epoch": 1.09, "learning_rate": 0.00013700471804668993, "loss": 0.0389, "step": 168360 }, { "epoch": 1.09, "learning_rate": 0.00013699503669233298, "loss": 0.0389, "step": 168370 }, { "epoch": 1.09, "learning_rate": 0.00013698535533797606, "loss": 0.032, "step": 168380 }, { "epoch": 1.09, "learning_rate": 0.00013697567398361914, "loss": 0.0352, "step": 168390 }, { "epoch": 1.09, "learning_rate": 0.00013696599262926222, "loss": 0.0341, "step": 168400 }, { "epoch": 1.09, "learning_rate": 0.00013695631127490527, "loss": 0.0362, "step": 168410 }, { "epoch": 1.09, "learning_rate": 0.00013694662992054833, "loss": 0.0329, "step": 168420 }, { "epoch": 1.09, "learning_rate": 0.0001369369485661914, "loss": 0.0342, "step": 168430 }, { "epoch": 1.09, "learning_rate": 0.00013692726721183446, "loss": 0.0281, "step": 168440 }, { "epoch": 1.09, "learning_rate": 0.00013691758585747754, "loss": 0.0325, "step": 168450 }, { "epoch": 1.09, "learning_rate": 0.00013690790450312062, "loss": 0.03, "step": 168460 }, { "epoch": 1.09, "learning_rate": 0.0001368982231487637, "loss": 0.0342, "step": 168470 }, { "epoch": 1.09, "learning_rate": 0.00013688854179440675, "loss": 0.0316, "step": 168480 }, { "epoch": 1.09, "learning_rate": 0.0001368788604400498, "loss": 0.0337, "step": 168490 }, { "epoch": 1.09, "learning_rate": 0.00013686917908569288, "loss": 0.0381, "step": 168500 }, { "epoch": 1.09, "learning_rate": 0.00013685949773133594, "loss": 0.0368, "step": 168510 }, { "epoch": 1.09, "learning_rate": 0.00013684981637697902, "loss": 0.0306, "step": 168520 }, { "epoch": 1.09, "learning_rate": 0.0001368401350226221, "loss": 0.0299, "step": 168530 }, { "epoch": 1.09, "learning_rate": 0.00013683045366826515, "loss": 0.0346, "step": 168540 }, { "epoch": 1.09, "learning_rate": 0.00013682077231390823, "loss": 0.034, "step": 168550 }, { "epoch": 1.09, "learning_rate": 0.00013681109095955128, "loss": 0.0348, "step": 168560 }, { "epoch": 1.09, "learning_rate": 0.00013680140960519436, "loss": 0.0326, "step": 168570 }, { "epoch": 1.09, "learning_rate": 0.0001367917282508374, "loss": 0.0326, "step": 168580 }, { "epoch": 1.09, "learning_rate": 0.0001367820468964805, "loss": 0.0347, "step": 168590 }, { "epoch": 1.09, "learning_rate": 0.00013677236554212357, "loss": 0.0486, "step": 168600 }, { "epoch": 1.09, "learning_rate": 0.00013676268418776663, "loss": 0.0364, "step": 168610 }, { "epoch": 1.09, "learning_rate": 0.0001367530028334097, "loss": 0.0375, "step": 168620 }, { "epoch": 1.09, "learning_rate": 0.00013674332147905276, "loss": 0.0357, "step": 168630 }, { "epoch": 1.09, "learning_rate": 0.00013673364012469584, "loss": 0.0381, "step": 168640 }, { "epoch": 1.09, "learning_rate": 0.0001367239587703389, "loss": 0.0317, "step": 168650 }, { "epoch": 1.09, "learning_rate": 0.00013671427741598197, "loss": 0.0312, "step": 168660 }, { "epoch": 1.09, "learning_rate": 0.00013670459606162505, "loss": 0.0335, "step": 168670 }, { "epoch": 1.09, "learning_rate": 0.0001366949147072681, "loss": 0.0325, "step": 168680 }, { "epoch": 1.09, "learning_rate": 0.00013668523335291116, "loss": 0.0338, "step": 168690 }, { "epoch": 1.09, "learning_rate": 0.00013667555199855424, "loss": 0.0318, "step": 168700 }, { "epoch": 1.09, "learning_rate": 0.00013666587064419731, "loss": 0.0339, "step": 168710 }, { "epoch": 1.09, "learning_rate": 0.00013665618928984037, "loss": 0.0305, "step": 168720 }, { "epoch": 1.09, "learning_rate": 0.00013664650793548345, "loss": 0.0352, "step": 168730 }, { "epoch": 1.09, "learning_rate": 0.0001366368265811265, "loss": 0.0374, "step": 168740 }, { "epoch": 1.09, "learning_rate": 0.00013662714522676958, "loss": 0.0331, "step": 168750 }, { "epoch": 1.09, "learning_rate": 0.00013661746387241263, "loss": 0.0339, "step": 168760 }, { "epoch": 1.09, "learning_rate": 0.0001366077825180557, "loss": 0.0344, "step": 168770 }, { "epoch": 1.09, "learning_rate": 0.0001365981011636988, "loss": 0.0322, "step": 168780 }, { "epoch": 1.09, "learning_rate": 0.00013658841980934184, "loss": 0.0329, "step": 168790 }, { "epoch": 1.09, "learning_rate": 0.00013657873845498492, "loss": 0.0415, "step": 168800 }, { "epoch": 1.09, "learning_rate": 0.00013656905710062798, "loss": 0.0363, "step": 168810 }, { "epoch": 1.09, "learning_rate": 0.00013655937574627106, "loss": 0.0359, "step": 168820 }, { "epoch": 1.09, "learning_rate": 0.0001365496943919141, "loss": 0.0304, "step": 168830 }, { "epoch": 1.09, "learning_rate": 0.0001365400130375572, "loss": 0.0377, "step": 168840 }, { "epoch": 1.09, "learning_rate": 0.00013653033168320027, "loss": 0.0289, "step": 168850 }, { "epoch": 1.09, "learning_rate": 0.00013652065032884332, "loss": 0.0347, "step": 168860 }, { "epoch": 1.09, "learning_rate": 0.0001365109689744864, "loss": 0.0384, "step": 168870 }, { "epoch": 1.09, "learning_rate": 0.00013650128762012945, "loss": 0.0294, "step": 168880 }, { "epoch": 1.09, "learning_rate": 0.00013649160626577253, "loss": 0.0401, "step": 168890 }, { "epoch": 1.09, "learning_rate": 0.0001364819249114156, "loss": 0.0321, "step": 168900 }, { "epoch": 1.09, "learning_rate": 0.00013647224355705867, "loss": 0.0386, "step": 168910 }, { "epoch": 1.09, "learning_rate": 0.00013646256220270175, "loss": 0.0304, "step": 168920 }, { "epoch": 1.09, "learning_rate": 0.0001364528808483448, "loss": 0.0364, "step": 168930 }, { "epoch": 1.09, "learning_rate": 0.00013644319949398785, "loss": 0.0349, "step": 168940 }, { "epoch": 1.09, "learning_rate": 0.00013643351813963093, "loss": 0.0346, "step": 168950 }, { "epoch": 1.09, "learning_rate": 0.000136423836785274, "loss": 0.029, "step": 168960 }, { "epoch": 1.09, "learning_rate": 0.00013641415543091706, "loss": 0.0307, "step": 168970 }, { "epoch": 1.09, "learning_rate": 0.00013640447407656014, "loss": 0.031, "step": 168980 }, { "epoch": 1.09, "learning_rate": 0.00013639479272220322, "loss": 0.0345, "step": 168990 }, { "epoch": 1.09, "learning_rate": 0.00013638511136784628, "loss": 0.0345, "step": 169000 }, { "epoch": 1.09, "eval_cer": 0.9198879222686702, "eval_loss": 0.0242831502109766, "eval_runtime": 120.0326, "eval_samples_per_second": 16.662, "eval_steps_per_second": 4.166, "step": 169000 }, { "epoch": 1.09, "learning_rate": 0.00013637543001348933, "loss": 0.0327, "step": 169010 }, { "epoch": 1.09, "learning_rate": 0.0001363657486591324, "loss": 0.0332, "step": 169020 }, { "epoch": 1.09, "learning_rate": 0.0001363560673047755, "loss": 0.0379, "step": 169030 }, { "epoch": 1.09, "learning_rate": 0.00013634638595041854, "loss": 0.0331, "step": 169040 }, { "epoch": 1.09, "learning_rate": 0.00013633670459606162, "loss": 0.0326, "step": 169050 }, { "epoch": 1.09, "learning_rate": 0.00013632702324170467, "loss": 0.0342, "step": 169060 }, { "epoch": 1.09, "learning_rate": 0.00013631734188734775, "loss": 0.035, "step": 169070 }, { "epoch": 1.09, "learning_rate": 0.0001363076605329908, "loss": 0.0402, "step": 169080 }, { "epoch": 1.09, "learning_rate": 0.00013629797917863389, "loss": 0.0369, "step": 169090 }, { "epoch": 1.09, "learning_rate": 0.00013628829782427697, "loss": 0.0314, "step": 169100 }, { "epoch": 1.09, "learning_rate": 0.00013627861646992002, "loss": 0.0357, "step": 169110 }, { "epoch": 1.09, "learning_rate": 0.0001362689351155631, "loss": 0.0285, "step": 169120 }, { "epoch": 1.09, "learning_rate": 0.00013625925376120615, "loss": 0.0357, "step": 169130 }, { "epoch": 1.09, "learning_rate": 0.0001362495724068492, "loss": 0.0357, "step": 169140 }, { "epoch": 1.09, "learning_rate": 0.00013623989105249228, "loss": 0.0314, "step": 169150 }, { "epoch": 1.09, "learning_rate": 0.00013623020969813536, "loss": 0.034, "step": 169160 }, { "epoch": 1.09, "learning_rate": 0.00013622052834377844, "loss": 0.0275, "step": 169170 }, { "epoch": 1.09, "learning_rate": 0.0001362108469894215, "loss": 0.0358, "step": 169180 }, { "epoch": 1.09, "learning_rate": 0.00013620116563506458, "loss": 0.0365, "step": 169190 }, { "epoch": 1.09, "learning_rate": 0.00013619148428070763, "loss": 0.0341, "step": 169200 }, { "epoch": 1.09, "learning_rate": 0.00013618180292635068, "loss": 0.035, "step": 169210 }, { "epoch": 1.09, "learning_rate": 0.00013617212157199376, "loss": 0.032, "step": 169220 }, { "epoch": 1.09, "learning_rate": 0.00013616244021763684, "loss": 0.0356, "step": 169230 }, { "epoch": 1.09, "learning_rate": 0.00013615275886327992, "loss": 0.0314, "step": 169240 }, { "epoch": 1.09, "learning_rate": 0.00013614307750892297, "loss": 0.0359, "step": 169250 }, { "epoch": 1.09, "learning_rate": 0.00013613339615456603, "loss": 0.0381, "step": 169260 }, { "epoch": 1.09, "learning_rate": 0.0001361237148002091, "loss": 0.0356, "step": 169270 }, { "epoch": 1.09, "learning_rate": 0.00013611403344585216, "loss": 0.0323, "step": 169280 }, { "epoch": 1.09, "learning_rate": 0.00013610435209149524, "loss": 0.0299, "step": 169290 }, { "epoch": 1.09, "learning_rate": 0.00013609467073713832, "loss": 0.0361, "step": 169300 }, { "epoch": 1.09, "learning_rate": 0.0001360849893827814, "loss": 0.0311, "step": 169310 }, { "epoch": 1.09, "learning_rate": 0.00013607530802842445, "loss": 0.0301, "step": 169320 }, { "epoch": 1.09, "learning_rate": 0.0001360656266740675, "loss": 0.0369, "step": 169330 }, { "epoch": 1.09, "learning_rate": 0.00013605594531971058, "loss": 0.0322, "step": 169340 }, { "epoch": 1.09, "learning_rate": 0.00013604626396535364, "loss": 0.0368, "step": 169350 }, { "epoch": 1.09, "learning_rate": 0.00013603658261099672, "loss": 0.0384, "step": 169360 }, { "epoch": 1.09, "learning_rate": 0.0001360269012566398, "loss": 0.0302, "step": 169370 }, { "epoch": 1.09, "learning_rate": 0.00013601721990228285, "loss": 0.031, "step": 169380 }, { "epoch": 1.09, "learning_rate": 0.00013600753854792593, "loss": 0.0363, "step": 169390 }, { "epoch": 1.09, "learning_rate": 0.00013599785719356898, "loss": 0.0326, "step": 169400 }, { "epoch": 1.09, "learning_rate": 0.00013598817583921206, "loss": 0.0305, "step": 169410 }, { "epoch": 1.09, "learning_rate": 0.0001359784944848551, "loss": 0.037, "step": 169420 }, { "epoch": 1.09, "learning_rate": 0.0001359688131304982, "loss": 0.0318, "step": 169430 }, { "epoch": 1.09, "learning_rate": 0.00013595913177614127, "loss": 0.0275, "step": 169440 }, { "epoch": 1.09, "learning_rate": 0.00013594945042178433, "loss": 0.0314, "step": 169450 }, { "epoch": 1.09, "learning_rate": 0.00013593976906742738, "loss": 0.033, "step": 169460 }, { "epoch": 1.09, "learning_rate": 0.00013593008771307046, "loss": 0.0343, "step": 169470 }, { "epoch": 1.09, "learning_rate": 0.00013592040635871354, "loss": 0.03, "step": 169480 }, { "epoch": 1.09, "learning_rate": 0.0001359107250043566, "loss": 0.0342, "step": 169490 }, { "epoch": 1.09, "learning_rate": 0.00013590104364999967, "loss": 0.0334, "step": 169500 }, { "epoch": 1.09, "learning_rate": 0.00013589136229564275, "loss": 0.0363, "step": 169510 }, { "epoch": 1.09, "learning_rate": 0.0001358816809412858, "loss": 0.0346, "step": 169520 }, { "epoch": 1.09, "learning_rate": 0.00013587199958692885, "loss": 0.0286, "step": 169530 }, { "epoch": 1.09, "learning_rate": 0.00013586231823257193, "loss": 0.0296, "step": 169540 }, { "epoch": 1.09, "learning_rate": 0.00013585263687821501, "loss": 0.0307, "step": 169550 }, { "epoch": 1.09, "learning_rate": 0.00013584295552385807, "loss": 0.0324, "step": 169560 }, { "epoch": 1.09, "learning_rate": 0.00013583327416950115, "loss": 0.031, "step": 169570 }, { "epoch": 1.09, "learning_rate": 0.0001358235928151442, "loss": 0.0347, "step": 169580 }, { "epoch": 1.09, "learning_rate": 0.00013581391146078728, "loss": 0.037, "step": 169590 }, { "epoch": 1.09, "learning_rate": 0.00013580423010643033, "loss": 0.0319, "step": 169600 }, { "epoch": 1.09, "learning_rate": 0.0001357945487520734, "loss": 0.0367, "step": 169610 }, { "epoch": 1.09, "learning_rate": 0.0001357848673977165, "loss": 0.0363, "step": 169620 }, { "epoch": 1.09, "learning_rate": 0.00013577518604335954, "loss": 0.0409, "step": 169630 }, { "epoch": 1.09, "learning_rate": 0.00013576550468900262, "loss": 0.0356, "step": 169640 }, { "epoch": 1.09, "learning_rate": 0.00013575582333464568, "loss": 0.0358, "step": 169650 }, { "epoch": 1.1, "learning_rate": 0.00013574614198028876, "loss": 0.0378, "step": 169660 }, { "epoch": 1.1, "learning_rate": 0.0001357364606259318, "loss": 0.0391, "step": 169670 }, { "epoch": 1.1, "learning_rate": 0.0001357267792715749, "loss": 0.035, "step": 169680 }, { "epoch": 1.1, "learning_rate": 0.00013571709791721797, "loss": 0.0315, "step": 169690 }, { "epoch": 1.1, "learning_rate": 0.00013570741656286102, "loss": 0.0344, "step": 169700 }, { "epoch": 1.1, "learning_rate": 0.0001356977352085041, "loss": 0.0352, "step": 169710 }, { "epoch": 1.1, "learning_rate": 0.00013568805385414715, "loss": 0.0336, "step": 169720 }, { "epoch": 1.1, "learning_rate": 0.00013567837249979023, "loss": 0.0382, "step": 169730 }, { "epoch": 1.1, "learning_rate": 0.0001356686911454333, "loss": 0.0329, "step": 169740 }, { "epoch": 1.1, "learning_rate": 0.00013565900979107637, "loss": 0.032, "step": 169750 }, { "epoch": 1.1, "learning_rate": 0.00013564932843671945, "loss": 0.0374, "step": 169760 }, { "epoch": 1.1, "learning_rate": 0.0001356396470823625, "loss": 0.0308, "step": 169770 }, { "epoch": 1.1, "learning_rate": 0.00013562996572800555, "loss": 0.0313, "step": 169780 }, { "epoch": 1.1, "learning_rate": 0.00013562028437364863, "loss": 0.0321, "step": 169790 }, { "epoch": 1.1, "learning_rate": 0.0001356106030192917, "loss": 0.0334, "step": 169800 }, { "epoch": 1.1, "learning_rate": 0.00013560092166493476, "loss": 0.0335, "step": 169810 }, { "epoch": 1.1, "learning_rate": 0.00013559124031057784, "loss": 0.0359, "step": 169820 }, { "epoch": 1.1, "learning_rate": 0.0001355815589562209, "loss": 0.0349, "step": 169830 }, { "epoch": 1.1, "learning_rate": 0.00013557187760186398, "loss": 0.0385, "step": 169840 }, { "epoch": 1.1, "learning_rate": 0.00013556219624750703, "loss": 0.0337, "step": 169850 }, { "epoch": 1.1, "learning_rate": 0.0001355525148931501, "loss": 0.0369, "step": 169860 }, { "epoch": 1.1, "learning_rate": 0.0001355428335387932, "loss": 0.034, "step": 169870 }, { "epoch": 1.1, "learning_rate": 0.00013553315218443624, "loss": 0.0321, "step": 169880 }, { "epoch": 1.1, "learning_rate": 0.00013552347083007932, "loss": 0.0295, "step": 169890 }, { "epoch": 1.1, "learning_rate": 0.00013551378947572237, "loss": 0.0397, "step": 169900 }, { "epoch": 1.1, "learning_rate": 0.00013550410812136545, "loss": 0.0299, "step": 169910 }, { "epoch": 1.1, "learning_rate": 0.0001354944267670085, "loss": 0.0391, "step": 169920 }, { "epoch": 1.1, "learning_rate": 0.00013548474541265159, "loss": 0.0381, "step": 169930 }, { "epoch": 1.1, "learning_rate": 0.00013547506405829467, "loss": 0.037, "step": 169940 }, { "epoch": 1.1, "learning_rate": 0.00013546538270393772, "loss": 0.0291, "step": 169950 }, { "epoch": 1.1, "learning_rate": 0.0001354557013495808, "loss": 0.0314, "step": 169960 }, { "epoch": 1.1, "learning_rate": 0.00013544601999522385, "loss": 0.0286, "step": 169970 }, { "epoch": 1.1, "learning_rate": 0.0001354363386408669, "loss": 0.0317, "step": 169980 }, { "epoch": 1.1, "learning_rate": 0.00013542665728650998, "loss": 0.0413, "step": 169990 }, { "epoch": 1.1, "learning_rate": 0.00013541697593215306, "loss": 0.0341, "step": 170000 }, { "epoch": 1.1, "eval_cer": 0.9198942492373743, "eval_loss": 0.024668850004673004, "eval_runtime": 120.0558, "eval_samples_per_second": 16.659, "eval_steps_per_second": 4.165, "step": 170000 }, { "epoch": 1.1, "learning_rate": 0.00013540729457779614, "loss": 0.0414, "step": 170010 }, { "epoch": 1.1, "learning_rate": 0.0001353976132234392, "loss": 0.0341, "step": 170020 }, { "epoch": 1.1, "learning_rate": 0.00013538793186908225, "loss": 0.0359, "step": 170030 }, { "epoch": 1.1, "learning_rate": 0.00013537825051472533, "loss": 0.0384, "step": 170040 }, { "epoch": 1.1, "learning_rate": 0.00013536856916036838, "loss": 0.0321, "step": 170050 }, { "epoch": 1.1, "learning_rate": 0.00013535888780601146, "loss": 0.0336, "step": 170060 }, { "epoch": 1.1, "learning_rate": 0.00013534920645165454, "loss": 0.0315, "step": 170070 }, { "epoch": 1.1, "learning_rate": 0.00013533952509729762, "loss": 0.042, "step": 170080 }, { "epoch": 1.1, "learning_rate": 0.00013532984374294067, "loss": 0.0338, "step": 170090 }, { "epoch": 1.1, "learning_rate": 0.00013532016238858373, "loss": 0.033, "step": 170100 }, { "epoch": 1.1, "learning_rate": 0.0001353104810342268, "loss": 0.0316, "step": 170110 }, { "epoch": 1.1, "learning_rate": 0.00013530079967986986, "loss": 0.0311, "step": 170120 }, { "epoch": 1.1, "learning_rate": 0.00013529111832551294, "loss": 0.0338, "step": 170130 }, { "epoch": 1.1, "learning_rate": 0.00013528143697115602, "loss": 0.0346, "step": 170140 }, { "epoch": 1.1, "learning_rate": 0.00013527175561679907, "loss": 0.0355, "step": 170150 }, { "epoch": 1.1, "learning_rate": 0.00013526207426244215, "loss": 0.0343, "step": 170160 }, { "epoch": 1.1, "learning_rate": 0.0001352523929080852, "loss": 0.0349, "step": 170170 }, { "epoch": 1.1, "learning_rate": 0.00013524271155372828, "loss": 0.0359, "step": 170180 }, { "epoch": 1.1, "learning_rate": 0.00013523303019937134, "loss": 0.032, "step": 170190 }, { "epoch": 1.1, "learning_rate": 0.00013522334884501441, "loss": 0.0331, "step": 170200 }, { "epoch": 1.1, "learning_rate": 0.0001352136674906575, "loss": 0.0293, "step": 170210 }, { "epoch": 1.1, "learning_rate": 0.00013520398613630055, "loss": 0.0307, "step": 170220 }, { "epoch": 1.1, "learning_rate": 0.0001351943047819436, "loss": 0.0314, "step": 170230 }, { "epoch": 1.1, "learning_rate": 0.00013518462342758668, "loss": 0.0328, "step": 170240 }, { "epoch": 1.1, "learning_rate": 0.00013517494207322976, "loss": 0.0348, "step": 170250 }, { "epoch": 1.1, "learning_rate": 0.0001351652607188728, "loss": 0.0382, "step": 170260 }, { "epoch": 1.1, "learning_rate": 0.0001351555793645159, "loss": 0.0326, "step": 170270 }, { "epoch": 1.1, "learning_rate": 0.00013514589801015897, "loss": 0.033, "step": 170280 }, { "epoch": 1.1, "learning_rate": 0.00013513621665580202, "loss": 0.0333, "step": 170290 }, { "epoch": 1.1, "learning_rate": 0.00013512653530144508, "loss": 0.0358, "step": 170300 }, { "epoch": 1.1, "learning_rate": 0.00013511685394708816, "loss": 0.0347, "step": 170310 }, { "epoch": 1.1, "learning_rate": 0.00013510717259273124, "loss": 0.0336, "step": 170320 }, { "epoch": 1.1, "learning_rate": 0.0001350974912383743, "loss": 0.0362, "step": 170330 }, { "epoch": 1.1, "learning_rate": 0.00013508780988401737, "loss": 0.0345, "step": 170340 }, { "epoch": 1.1, "learning_rate": 0.00013507812852966042, "loss": 0.0308, "step": 170350 }, { "epoch": 1.1, "learning_rate": 0.0001350684471753035, "loss": 0.0326, "step": 170360 }, { "epoch": 1.1, "learning_rate": 0.00013505876582094655, "loss": 0.0371, "step": 170370 }, { "epoch": 1.1, "learning_rate": 0.00013504908446658963, "loss": 0.0313, "step": 170380 }, { "epoch": 1.1, "learning_rate": 0.00013503940311223271, "loss": 0.0314, "step": 170390 }, { "epoch": 1.1, "learning_rate": 0.00013502972175787577, "loss": 0.0316, "step": 170400 }, { "epoch": 1.1, "learning_rate": 0.00013502004040351885, "loss": 0.037, "step": 170410 }, { "epoch": 1.1, "learning_rate": 0.0001350103590491619, "loss": 0.0292, "step": 170420 }, { "epoch": 1.1, "learning_rate": 0.00013500067769480498, "loss": 0.0303, "step": 170430 }, { "epoch": 1.1, "learning_rate": 0.00013499099634044803, "loss": 0.0355, "step": 170440 }, { "epoch": 1.1, "learning_rate": 0.0001349813149860911, "loss": 0.0378, "step": 170450 }, { "epoch": 1.1, "learning_rate": 0.0001349716336317342, "loss": 0.0345, "step": 170460 }, { "epoch": 1.1, "learning_rate": 0.00013496195227737724, "loss": 0.0375, "step": 170470 }, { "epoch": 1.1, "learning_rate": 0.00013495227092302032, "loss": 0.0313, "step": 170480 }, { "epoch": 1.1, "learning_rate": 0.00013494258956866338, "loss": 0.0366, "step": 170490 }, { "epoch": 1.1, "learning_rate": 0.00013493290821430643, "loss": 0.0308, "step": 170500 }, { "epoch": 1.1, "learning_rate": 0.0001349232268599495, "loss": 0.0323, "step": 170510 }, { "epoch": 1.1, "learning_rate": 0.0001349135455055926, "loss": 0.0302, "step": 170520 }, { "epoch": 1.1, "learning_rate": 0.00013490386415123567, "loss": 0.032, "step": 170530 }, { "epoch": 1.1, "learning_rate": 0.00013489418279687872, "loss": 0.0295, "step": 170540 }, { "epoch": 1.1, "learning_rate": 0.00013488450144252177, "loss": 0.0364, "step": 170550 }, { "epoch": 1.1, "learning_rate": 0.00013487482008816485, "loss": 0.0349, "step": 170560 }, { "epoch": 1.1, "learning_rate": 0.0001348651387338079, "loss": 0.0355, "step": 170570 }, { "epoch": 1.1, "learning_rate": 0.00013485545737945099, "loss": 0.0314, "step": 170580 }, { "epoch": 1.1, "learning_rate": 0.00013484577602509407, "loss": 0.0389, "step": 170590 }, { "epoch": 1.1, "learning_rate": 0.00013483609467073715, "loss": 0.0395, "step": 170600 }, { "epoch": 1.1, "learning_rate": 0.0001348264133163802, "loss": 0.0268, "step": 170610 }, { "epoch": 1.1, "learning_rate": 0.00013481673196202325, "loss": 0.0331, "step": 170620 }, { "epoch": 1.1, "learning_rate": 0.00013480705060766633, "loss": 0.0328, "step": 170630 }, { "epoch": 1.1, "learning_rate": 0.00013479736925330938, "loss": 0.0256, "step": 170640 }, { "epoch": 1.1, "learning_rate": 0.00013478768789895246, "loss": 0.0354, "step": 170650 }, { "epoch": 1.1, "learning_rate": 0.00013477800654459554, "loss": 0.031, "step": 170660 }, { "epoch": 1.1, "learning_rate": 0.0001347683251902386, "loss": 0.0314, "step": 170670 }, { "epoch": 1.1, "learning_rate": 0.00013475864383588168, "loss": 0.0315, "step": 170680 }, { "epoch": 1.1, "learning_rate": 0.00013474896248152473, "loss": 0.0344, "step": 170690 }, { "epoch": 1.1, "learning_rate": 0.0001347392811271678, "loss": 0.0322, "step": 170700 }, { "epoch": 1.1, "learning_rate": 0.00013472959977281086, "loss": 0.0363, "step": 170710 }, { "epoch": 1.1, "learning_rate": 0.00013471991841845394, "loss": 0.0417, "step": 170720 }, { "epoch": 1.1, "learning_rate": 0.00013471023706409702, "loss": 0.0351, "step": 170730 }, { "epoch": 1.1, "learning_rate": 0.00013470055570974007, "loss": 0.0338, "step": 170740 }, { "epoch": 1.1, "learning_rate": 0.00013469087435538313, "loss": 0.033, "step": 170750 }, { "epoch": 1.1, "learning_rate": 0.0001346811930010262, "loss": 0.0358, "step": 170760 }, { "epoch": 1.1, "learning_rate": 0.00013467151164666929, "loss": 0.0349, "step": 170770 }, { "epoch": 1.1, "learning_rate": 0.00013466183029231234, "loss": 0.0316, "step": 170780 }, { "epoch": 1.1, "learning_rate": 0.00013465214893795542, "loss": 0.0299, "step": 170790 }, { "epoch": 1.1, "learning_rate": 0.0001346424675835985, "loss": 0.0363, "step": 170800 }, { "epoch": 1.1, "learning_rate": 0.00013463278622924155, "loss": 0.0322, "step": 170810 }, { "epoch": 1.1, "learning_rate": 0.0001346231048748846, "loss": 0.0375, "step": 170820 }, { "epoch": 1.1, "learning_rate": 0.00013461342352052768, "loss": 0.0388, "step": 170830 }, { "epoch": 1.1, "learning_rate": 0.00013460374216617076, "loss": 0.0366, "step": 170840 }, { "epoch": 1.1, "learning_rate": 0.00013459406081181382, "loss": 0.0349, "step": 170850 }, { "epoch": 1.1, "learning_rate": 0.0001345843794574569, "loss": 0.0353, "step": 170860 }, { "epoch": 1.1, "learning_rate": 0.00013457469810309995, "loss": 0.0304, "step": 170870 }, { "epoch": 1.1, "learning_rate": 0.00013456501674874303, "loss": 0.0347, "step": 170880 }, { "epoch": 1.1, "learning_rate": 0.00013455533539438608, "loss": 0.0348, "step": 170890 }, { "epoch": 1.1, "learning_rate": 0.00013454565404002916, "loss": 0.035, "step": 170900 }, { "epoch": 1.1, "learning_rate": 0.00013453597268567224, "loss": 0.036, "step": 170910 }, { "epoch": 1.1, "learning_rate": 0.0001345262913313153, "loss": 0.029, "step": 170920 }, { "epoch": 1.1, "learning_rate": 0.00013451660997695837, "loss": 0.0285, "step": 170930 }, { "epoch": 1.1, "learning_rate": 0.00013450692862260143, "loss": 0.0304, "step": 170940 }, { "epoch": 1.1, "learning_rate": 0.0001344972472682445, "loss": 0.0289, "step": 170950 }, { "epoch": 1.1, "learning_rate": 0.00013448756591388756, "loss": 0.0368, "step": 170960 }, { "epoch": 1.1, "learning_rate": 0.00013447788455953064, "loss": 0.0324, "step": 170970 }, { "epoch": 1.1, "learning_rate": 0.00013446820320517372, "loss": 0.0304, "step": 170980 }, { "epoch": 1.1, "learning_rate": 0.00013445852185081677, "loss": 0.0285, "step": 170990 }, { "epoch": 1.1, "learning_rate": 0.00013444884049645985, "loss": 0.0317, "step": 171000 }, { "epoch": 1.1, "eval_cer": 0.9198897299740142, "eval_loss": 0.02412121742963791, "eval_runtime": 120.2503, "eval_samples_per_second": 16.632, "eval_steps_per_second": 4.158, "step": 171000 }, { "epoch": 1.1, "learning_rate": 0.0001344391591421029, "loss": 0.0346, "step": 171010 }, { "epoch": 1.1, "learning_rate": 0.00013442947778774598, "loss": 0.0328, "step": 171020 }, { "epoch": 1.1, "learning_rate": 0.00013441979643338903, "loss": 0.0325, "step": 171030 }, { "epoch": 1.1, "learning_rate": 0.00013441011507903211, "loss": 0.031, "step": 171040 }, { "epoch": 1.1, "learning_rate": 0.0001344004337246752, "loss": 0.0392, "step": 171050 }, { "epoch": 1.1, "learning_rate": 0.00013439075237031825, "loss": 0.037, "step": 171060 }, { "epoch": 1.1, "learning_rate": 0.0001343810710159613, "loss": 0.0339, "step": 171070 }, { "epoch": 1.1, "learning_rate": 0.00013437138966160438, "loss": 0.0384, "step": 171080 }, { "epoch": 1.1, "learning_rate": 0.00013436170830724746, "loss": 0.0305, "step": 171090 }, { "epoch": 1.1, "learning_rate": 0.0001343520269528905, "loss": 0.0352, "step": 171100 }, { "epoch": 1.1, "learning_rate": 0.0001343423455985336, "loss": 0.0357, "step": 171110 }, { "epoch": 1.1, "learning_rate": 0.00013433266424417664, "loss": 0.0385, "step": 171120 }, { "epoch": 1.1, "learning_rate": 0.00013432298288981972, "loss": 0.0313, "step": 171130 }, { "epoch": 1.1, "learning_rate": 0.00013431330153546278, "loss": 0.0324, "step": 171140 }, { "epoch": 1.1, "learning_rate": 0.00013430362018110586, "loss": 0.0349, "step": 171150 }, { "epoch": 1.1, "learning_rate": 0.00013429393882674894, "loss": 0.0312, "step": 171160 }, { "epoch": 1.1, "learning_rate": 0.000134284257472392, "loss": 0.0311, "step": 171170 }, { "epoch": 1.1, "learning_rate": 0.00013427457611803507, "loss": 0.0366, "step": 171180 }, { "epoch": 1.1, "learning_rate": 0.00013426489476367812, "loss": 0.0346, "step": 171190 }, { "epoch": 1.1, "learning_rate": 0.0001342552134093212, "loss": 0.0306, "step": 171200 }, { "epoch": 1.11, "learning_rate": 0.00013424553205496425, "loss": 0.0386, "step": 171210 }, { "epoch": 1.11, "learning_rate": 0.00013423585070060733, "loss": 0.0331, "step": 171220 }, { "epoch": 1.11, "learning_rate": 0.00013422616934625041, "loss": 0.0356, "step": 171230 }, { "epoch": 1.11, "learning_rate": 0.00013421648799189347, "loss": 0.0303, "step": 171240 }, { "epoch": 1.11, "learning_rate": 0.00013420680663753655, "loss": 0.0339, "step": 171250 }, { "epoch": 1.11, "learning_rate": 0.0001341971252831796, "loss": 0.0336, "step": 171260 }, { "epoch": 1.11, "learning_rate": 0.00013418744392882265, "loss": 0.0356, "step": 171270 }, { "epoch": 1.11, "learning_rate": 0.00013417776257446573, "loss": 0.0357, "step": 171280 }, { "epoch": 1.11, "learning_rate": 0.0001341680812201088, "loss": 0.0357, "step": 171290 }, { "epoch": 1.11, "learning_rate": 0.0001341583998657519, "loss": 0.0342, "step": 171300 }, { "epoch": 1.11, "learning_rate": 0.00013414871851139494, "loss": 0.0335, "step": 171310 }, { "epoch": 1.11, "learning_rate": 0.000134139037157038, "loss": 0.0315, "step": 171320 }, { "epoch": 1.11, "learning_rate": 0.00013412935580268108, "loss": 0.0331, "step": 171330 }, { "epoch": 1.11, "learning_rate": 0.00013411967444832413, "loss": 0.0269, "step": 171340 }, { "epoch": 1.11, "learning_rate": 0.0001341099930939672, "loss": 0.0323, "step": 171350 }, { "epoch": 1.11, "learning_rate": 0.0001341003117396103, "loss": 0.0336, "step": 171360 }, { "epoch": 1.11, "learning_rate": 0.00013409063038525337, "loss": 0.0312, "step": 171370 }, { "epoch": 1.11, "learning_rate": 0.00013408094903089642, "loss": 0.0338, "step": 171380 }, { "epoch": 1.11, "learning_rate": 0.00013407126767653947, "loss": 0.0361, "step": 171390 }, { "epoch": 1.11, "learning_rate": 0.00013406158632218255, "loss": 0.0406, "step": 171400 }, { "epoch": 1.11, "learning_rate": 0.0001340519049678256, "loss": 0.0371, "step": 171410 }, { "epoch": 1.11, "learning_rate": 0.00013404222361346869, "loss": 0.0377, "step": 171420 }, { "epoch": 1.11, "learning_rate": 0.00013403254225911177, "loss": 0.0352, "step": 171430 }, { "epoch": 1.11, "learning_rate": 0.00013402286090475482, "loss": 0.0304, "step": 171440 }, { "epoch": 1.11, "learning_rate": 0.0001340131795503979, "loss": 0.0311, "step": 171450 }, { "epoch": 1.11, "learning_rate": 0.00013400349819604095, "loss": 0.0347, "step": 171460 }, { "epoch": 1.11, "learning_rate": 0.00013399381684168403, "loss": 0.0315, "step": 171470 }, { "epoch": 1.11, "learning_rate": 0.00013398413548732708, "loss": 0.0349, "step": 171480 }, { "epoch": 1.11, "learning_rate": 0.00013397445413297016, "loss": 0.0341, "step": 171490 }, { "epoch": 1.11, "learning_rate": 0.00013396477277861324, "loss": 0.0338, "step": 171500 }, { "epoch": 1.11, "learning_rate": 0.0001339550914242563, "loss": 0.0307, "step": 171510 }, { "epoch": 1.11, "learning_rate": 0.00013394541006989935, "loss": 0.0377, "step": 171520 }, { "epoch": 1.11, "learning_rate": 0.00013393572871554243, "loss": 0.0287, "step": 171530 }, { "epoch": 1.11, "learning_rate": 0.0001339260473611855, "loss": 0.0287, "step": 171540 }, { "epoch": 1.11, "learning_rate": 0.00013391636600682856, "loss": 0.0366, "step": 171550 }, { "epoch": 1.11, "learning_rate": 0.00013390668465247164, "loss": 0.0397, "step": 171560 }, { "epoch": 1.11, "learning_rate": 0.00013389700329811472, "loss": 0.0289, "step": 171570 }, { "epoch": 1.11, "learning_rate": 0.00013388732194375777, "loss": 0.0362, "step": 171580 }, { "epoch": 1.11, "learning_rate": 0.00013387764058940083, "loss": 0.0392, "step": 171590 }, { "epoch": 1.11, "learning_rate": 0.0001338679592350439, "loss": 0.0339, "step": 171600 }, { "epoch": 1.11, "learning_rate": 0.00013385827788068699, "loss": 0.0328, "step": 171610 }, { "epoch": 1.11, "learning_rate": 0.00013384859652633004, "loss": 0.0355, "step": 171620 }, { "epoch": 1.11, "learning_rate": 0.00013383891517197312, "loss": 0.0364, "step": 171630 }, { "epoch": 1.11, "learning_rate": 0.00013382923381761617, "loss": 0.0433, "step": 171640 }, { "epoch": 1.11, "learning_rate": 0.00013381955246325925, "loss": 0.0342, "step": 171650 }, { "epoch": 1.11, "learning_rate": 0.0001338098711089023, "loss": 0.0342, "step": 171660 }, { "epoch": 1.11, "learning_rate": 0.00013380018975454538, "loss": 0.0363, "step": 171670 }, { "epoch": 1.11, "learning_rate": 0.00013379050840018846, "loss": 0.0344, "step": 171680 }, { "epoch": 1.11, "learning_rate": 0.00013378082704583151, "loss": 0.0301, "step": 171690 }, { "epoch": 1.11, "learning_rate": 0.0001337711456914746, "loss": 0.0296, "step": 171700 }, { "epoch": 1.11, "learning_rate": 0.00013376146433711765, "loss": 0.0314, "step": 171710 }, { "epoch": 1.11, "learning_rate": 0.00013375178298276073, "loss": 0.0353, "step": 171720 }, { "epoch": 1.11, "learning_rate": 0.00013374210162840378, "loss": 0.0348, "step": 171730 }, { "epoch": 1.11, "learning_rate": 0.00013373242027404686, "loss": 0.0299, "step": 171740 }, { "epoch": 1.11, "learning_rate": 0.00013372273891968994, "loss": 0.0333, "step": 171750 }, { "epoch": 1.11, "learning_rate": 0.000133713057565333, "loss": 0.0342, "step": 171760 }, { "epoch": 1.11, "learning_rate": 0.00013370337621097607, "loss": 0.0338, "step": 171770 }, { "epoch": 1.11, "learning_rate": 0.00013369369485661912, "loss": 0.0338, "step": 171780 }, { "epoch": 1.11, "learning_rate": 0.0001336840135022622, "loss": 0.0324, "step": 171790 }, { "epoch": 1.11, "learning_rate": 0.00013367433214790526, "loss": 0.034, "step": 171800 }, { "epoch": 1.11, "learning_rate": 0.00013366465079354834, "loss": 0.0362, "step": 171810 }, { "epoch": 1.11, "learning_rate": 0.00013365496943919142, "loss": 0.0285, "step": 171820 }, { "epoch": 1.11, "learning_rate": 0.00013364528808483447, "loss": 0.0346, "step": 171830 }, { "epoch": 1.11, "learning_rate": 0.00013363560673047752, "loss": 0.0357, "step": 171840 }, { "epoch": 1.11, "learning_rate": 0.0001336259253761206, "loss": 0.0297, "step": 171850 }, { "epoch": 1.11, "learning_rate": 0.00013361624402176368, "loss": 0.0335, "step": 171860 }, { "epoch": 1.11, "learning_rate": 0.00013360656266740673, "loss": 0.032, "step": 171870 }, { "epoch": 1.11, "learning_rate": 0.00013359688131304981, "loss": 0.0346, "step": 171880 }, { "epoch": 1.11, "learning_rate": 0.0001335871999586929, "loss": 0.0335, "step": 171890 }, { "epoch": 1.11, "learning_rate": 0.00013357751860433595, "loss": 0.0299, "step": 171900 }, { "epoch": 1.11, "learning_rate": 0.000133567837249979, "loss": 0.0322, "step": 171910 }, { "epoch": 1.11, "learning_rate": 0.00013355815589562208, "loss": 0.0313, "step": 171920 }, { "epoch": 1.11, "learning_rate": 0.00013354847454126516, "loss": 0.0348, "step": 171930 }, { "epoch": 1.11, "learning_rate": 0.0001335387931869082, "loss": 0.0306, "step": 171940 }, { "epoch": 1.11, "learning_rate": 0.0001335291118325513, "loss": 0.0323, "step": 171950 }, { "epoch": 1.11, "learning_rate": 0.00013351943047819434, "loss": 0.03, "step": 171960 }, { "epoch": 1.11, "learning_rate": 0.00013350974912383742, "loss": 0.031, "step": 171970 }, { "epoch": 1.11, "learning_rate": 0.00013350006776948048, "loss": 0.0367, "step": 171980 }, { "epoch": 1.11, "learning_rate": 0.00013349038641512356, "loss": 0.0312, "step": 171990 }, { "epoch": 1.11, "learning_rate": 0.00013348070506076664, "loss": 0.0313, "step": 172000 }, { "epoch": 1.11, "eval_cer": 0.9199041916167665, "eval_loss": 0.02452256716787815, "eval_runtime": 120.1075, "eval_samples_per_second": 16.652, "eval_steps_per_second": 4.163, "step": 172000 }, { "epoch": 1.11, "learning_rate": 0.0001334710237064097, "loss": 0.0282, "step": 172010 }, { "epoch": 1.11, "learning_rate": 0.00013346134235205277, "loss": 0.0308, "step": 172020 }, { "epoch": 1.11, "learning_rate": 0.00013345166099769582, "loss": 0.0338, "step": 172030 }, { "epoch": 1.11, "learning_rate": 0.00013344197964333887, "loss": 0.0327, "step": 172040 }, { "epoch": 1.11, "learning_rate": 0.00013343229828898195, "loss": 0.0342, "step": 172050 }, { "epoch": 1.11, "learning_rate": 0.00013342261693462503, "loss": 0.0495, "step": 172060 }, { "epoch": 1.11, "learning_rate": 0.0001334129355802681, "loss": 0.0319, "step": 172070 }, { "epoch": 1.11, "learning_rate": 0.00013340325422591117, "loss": 0.0312, "step": 172080 }, { "epoch": 1.11, "learning_rate": 0.00013339357287155425, "loss": 0.0295, "step": 172090 }, { "epoch": 1.11, "learning_rate": 0.0001333838915171973, "loss": 0.0353, "step": 172100 }, { "epoch": 1.11, "learning_rate": 0.00013337421016284035, "loss": 0.0354, "step": 172110 }, { "epoch": 1.11, "learning_rate": 0.00013336452880848343, "loss": 0.0314, "step": 172120 }, { "epoch": 1.11, "learning_rate": 0.0001333548474541265, "loss": 0.0412, "step": 172130 }, { "epoch": 1.11, "learning_rate": 0.0001333451660997696, "loss": 0.033, "step": 172140 }, { "epoch": 1.11, "learning_rate": 0.00013333548474541264, "loss": 0.0431, "step": 172150 }, { "epoch": 1.11, "learning_rate": 0.0001333258033910557, "loss": 0.0381, "step": 172160 }, { "epoch": 1.11, "learning_rate": 0.00013331612203669878, "loss": 0.0331, "step": 172170 }, { "epoch": 1.11, "learning_rate": 0.00013330644068234183, "loss": 0.0387, "step": 172180 }, { "epoch": 1.11, "learning_rate": 0.0001332967593279849, "loss": 0.0359, "step": 172190 }, { "epoch": 1.11, "learning_rate": 0.000133287077973628, "loss": 0.0362, "step": 172200 }, { "epoch": 1.11, "learning_rate": 0.00013327739661927104, "loss": 0.0367, "step": 172210 }, { "epoch": 1.11, "learning_rate": 0.00013326771526491412, "loss": 0.0325, "step": 172220 }, { "epoch": 1.11, "learning_rate": 0.00013325803391055717, "loss": 0.0374, "step": 172230 }, { "epoch": 1.11, "learning_rate": 0.00013324835255620025, "loss": 0.0324, "step": 172240 }, { "epoch": 1.11, "learning_rate": 0.0001332386712018433, "loss": 0.0292, "step": 172250 }, { "epoch": 1.11, "learning_rate": 0.00013322898984748639, "loss": 0.0342, "step": 172260 }, { "epoch": 1.11, "learning_rate": 0.00013321930849312947, "loss": 0.0329, "step": 172270 }, { "epoch": 1.11, "learning_rate": 0.00013320962713877252, "loss": 0.0325, "step": 172280 }, { "epoch": 1.11, "learning_rate": 0.0001331999457844156, "loss": 0.0319, "step": 172290 }, { "epoch": 1.11, "learning_rate": 0.00013319026443005865, "loss": 0.0326, "step": 172300 }, { "epoch": 1.11, "learning_rate": 0.00013318058307570173, "loss": 0.0386, "step": 172310 }, { "epoch": 1.11, "learning_rate": 0.00013317090172134478, "loss": 0.0399, "step": 172320 }, { "epoch": 1.11, "learning_rate": 0.00013316122036698786, "loss": 0.0324, "step": 172330 }, { "epoch": 1.11, "learning_rate": 0.00013315153901263094, "loss": 0.0357, "step": 172340 }, { "epoch": 1.11, "learning_rate": 0.000133141857658274, "loss": 0.0378, "step": 172350 }, { "epoch": 1.11, "learning_rate": 0.00013313217630391705, "loss": 0.0296, "step": 172360 }, { "epoch": 1.11, "learning_rate": 0.00013312249494956013, "loss": 0.037, "step": 172370 }, { "epoch": 1.11, "learning_rate": 0.0001331128135952032, "loss": 0.0328, "step": 172380 }, { "epoch": 1.11, "learning_rate": 0.00013310313224084626, "loss": 0.035, "step": 172390 }, { "epoch": 1.11, "learning_rate": 0.00013309345088648934, "loss": 0.0327, "step": 172400 }, { "epoch": 1.11, "learning_rate": 0.0001330837695321324, "loss": 0.0289, "step": 172410 }, { "epoch": 1.11, "learning_rate": 0.00013307408817777547, "loss": 0.0346, "step": 172420 }, { "epoch": 1.11, "learning_rate": 0.00013306440682341853, "loss": 0.0353, "step": 172430 }, { "epoch": 1.11, "learning_rate": 0.0001330547254690616, "loss": 0.0338, "step": 172440 }, { "epoch": 1.11, "learning_rate": 0.00013304504411470468, "loss": 0.0339, "step": 172450 }, { "epoch": 1.11, "learning_rate": 0.00013303536276034774, "loss": 0.0337, "step": 172460 }, { "epoch": 1.11, "learning_rate": 0.00013302568140599082, "loss": 0.0366, "step": 172470 }, { "epoch": 1.11, "learning_rate": 0.00013301600005163387, "loss": 0.037, "step": 172480 }, { "epoch": 1.11, "learning_rate": 0.00013300631869727695, "loss": 0.029, "step": 172490 }, { "epoch": 1.11, "learning_rate": 0.00013299663734292, "loss": 0.033, "step": 172500 }, { "epoch": 1.11, "learning_rate": 0.00013298695598856308, "loss": 0.0299, "step": 172510 }, { "epoch": 1.11, "learning_rate": 0.00013297727463420616, "loss": 0.0368, "step": 172520 }, { "epoch": 1.11, "learning_rate": 0.00013296759327984921, "loss": 0.0333, "step": 172530 }, { "epoch": 1.11, "learning_rate": 0.0001329579119254923, "loss": 0.0322, "step": 172540 }, { "epoch": 1.11, "learning_rate": 0.00013294823057113535, "loss": 0.0424, "step": 172550 }, { "epoch": 1.11, "learning_rate": 0.00013293854921677843, "loss": 0.0355, "step": 172560 }, { "epoch": 1.11, "learning_rate": 0.00013292886786242148, "loss": 0.032, "step": 172570 }, { "epoch": 1.11, "learning_rate": 0.00013291918650806456, "loss": 0.0361, "step": 172580 }, { "epoch": 1.11, "learning_rate": 0.00013290950515370764, "loss": 0.0268, "step": 172590 }, { "epoch": 1.11, "learning_rate": 0.0001328998237993507, "loss": 0.0348, "step": 172600 }, { "epoch": 1.11, "learning_rate": 0.00013289014244499374, "loss": 0.0307, "step": 172610 }, { "epoch": 1.11, "learning_rate": 0.00013288046109063682, "loss": 0.0349, "step": 172620 }, { "epoch": 1.11, "learning_rate": 0.0001328707797362799, "loss": 0.0331, "step": 172630 }, { "epoch": 1.11, "learning_rate": 0.00013286109838192296, "loss": 0.0335, "step": 172640 }, { "epoch": 1.11, "learning_rate": 0.00013285141702756604, "loss": 0.0404, "step": 172650 }, { "epoch": 1.11, "learning_rate": 0.00013284173567320912, "loss": 0.037, "step": 172660 }, { "epoch": 1.11, "learning_rate": 0.00013283205431885217, "loss": 0.0353, "step": 172670 }, { "epoch": 1.11, "learning_rate": 0.00013282237296449522, "loss": 0.0416, "step": 172680 }, { "epoch": 1.11, "learning_rate": 0.0001328126916101383, "loss": 0.0286, "step": 172690 }, { "epoch": 1.11, "learning_rate": 0.00013280301025578138, "loss": 0.034, "step": 172700 }, { "epoch": 1.11, "learning_rate": 0.00013279332890142443, "loss": 0.0373, "step": 172710 }, { "epoch": 1.11, "learning_rate": 0.00013278364754706751, "loss": 0.0348, "step": 172720 }, { "epoch": 1.11, "learning_rate": 0.00013277396619271057, "loss": 0.0323, "step": 172730 }, { "epoch": 1.11, "learning_rate": 0.00013276428483835365, "loss": 0.0336, "step": 172740 }, { "epoch": 1.11, "learning_rate": 0.0001327546034839967, "loss": 0.034, "step": 172750 }, { "epoch": 1.12, "learning_rate": 0.00013274492212963978, "loss": 0.0408, "step": 172760 }, { "epoch": 1.12, "learning_rate": 0.00013273524077528286, "loss": 0.0348, "step": 172770 }, { "epoch": 1.12, "learning_rate": 0.0001327255594209259, "loss": 0.0354, "step": 172780 }, { "epoch": 1.12, "learning_rate": 0.000132715878066569, "loss": 0.0308, "step": 172790 }, { "epoch": 1.12, "learning_rate": 0.00013270619671221204, "loss": 0.0386, "step": 172800 }, { "epoch": 1.12, "learning_rate": 0.0001326965153578551, "loss": 0.0378, "step": 172810 }, { "epoch": 1.12, "learning_rate": 0.00013268683400349818, "loss": 0.0343, "step": 172820 }, { "epoch": 1.12, "learning_rate": 0.00013267715264914126, "loss": 0.0326, "step": 172830 }, { "epoch": 1.12, "learning_rate": 0.00013266747129478434, "loss": 0.0382, "step": 172840 }, { "epoch": 1.12, "learning_rate": 0.0001326577899404274, "loss": 0.0342, "step": 172850 }, { "epoch": 1.12, "learning_rate": 0.00013264810858607047, "loss": 0.0324, "step": 172860 }, { "epoch": 1.12, "learning_rate": 0.00013263842723171352, "loss": 0.0348, "step": 172870 }, { "epoch": 1.12, "learning_rate": 0.00013262874587735657, "loss": 0.0317, "step": 172880 }, { "epoch": 1.12, "learning_rate": 0.00013261906452299965, "loss": 0.0353, "step": 172890 }, { "epoch": 1.12, "learning_rate": 0.00013260938316864273, "loss": 0.0375, "step": 172900 }, { "epoch": 1.12, "learning_rate": 0.0001325997018142858, "loss": 0.0394, "step": 172910 }, { "epoch": 1.12, "learning_rate": 0.00013259002045992887, "loss": 0.0354, "step": 172920 }, { "epoch": 1.12, "learning_rate": 0.00013258033910557192, "loss": 0.0395, "step": 172930 }, { "epoch": 1.12, "learning_rate": 0.000132570657751215, "loss": 0.0312, "step": 172940 }, { "epoch": 1.12, "learning_rate": 0.00013256097639685805, "loss": 0.0313, "step": 172950 }, { "epoch": 1.12, "learning_rate": 0.00013255129504250113, "loss": 0.0334, "step": 172960 }, { "epoch": 1.12, "learning_rate": 0.0001325416136881442, "loss": 0.0323, "step": 172970 }, { "epoch": 1.12, "learning_rate": 0.0001325319323337873, "loss": 0.0309, "step": 172980 }, { "epoch": 1.12, "learning_rate": 0.00013252225097943034, "loss": 0.0355, "step": 172990 }, { "epoch": 1.12, "learning_rate": 0.0001325125696250734, "loss": 0.033, "step": 173000 }, { "epoch": 1.12, "eval_cer": 0.9199412495763191, "eval_loss": 0.023672111332416534, "eval_runtime": 120.0714, "eval_samples_per_second": 16.657, "eval_steps_per_second": 4.164, "step": 173000 }, { "epoch": 1.12, "learning_rate": 0.00013250288827071648, "loss": 0.0387, "step": 173010 }, { "epoch": 1.12, "learning_rate": 0.00013249320691635953, "loss": 0.0389, "step": 173020 }, { "epoch": 1.12, "learning_rate": 0.0001324835255620026, "loss": 0.0371, "step": 173030 }, { "epoch": 1.12, "learning_rate": 0.0001324738442076457, "loss": 0.0329, "step": 173040 }, { "epoch": 1.12, "learning_rate": 0.00013246416285328874, "loss": 0.032, "step": 173050 }, { "epoch": 1.12, "learning_rate": 0.00013245448149893182, "loss": 0.0347, "step": 173060 }, { "epoch": 1.12, "learning_rate": 0.00013244480014457487, "loss": 0.0365, "step": 173070 }, { "epoch": 1.12, "learning_rate": 0.00013243511879021795, "loss": 0.0345, "step": 173080 }, { "epoch": 1.12, "learning_rate": 0.000132425437435861, "loss": 0.0355, "step": 173090 }, { "epoch": 1.12, "learning_rate": 0.00013241575608150409, "loss": 0.0356, "step": 173100 }, { "epoch": 1.12, "learning_rate": 0.00013240607472714716, "loss": 0.0398, "step": 173110 }, { "epoch": 1.12, "learning_rate": 0.00013239639337279022, "loss": 0.0319, "step": 173120 }, { "epoch": 1.12, "learning_rate": 0.00013238671201843327, "loss": 0.0371, "step": 173130 }, { "epoch": 1.12, "learning_rate": 0.00013237703066407635, "loss": 0.0308, "step": 173140 }, { "epoch": 1.12, "learning_rate": 0.00013236734930971943, "loss": 0.0365, "step": 173150 }, { "epoch": 1.12, "learning_rate": 0.00013235766795536248, "loss": 0.0377, "step": 173160 }, { "epoch": 1.12, "learning_rate": 0.00013234798660100556, "loss": 0.0335, "step": 173170 }, { "epoch": 1.12, "learning_rate": 0.00013233830524664864, "loss": 0.0315, "step": 173180 }, { "epoch": 1.12, "learning_rate": 0.0001323286238922917, "loss": 0.0314, "step": 173190 }, { "epoch": 1.12, "learning_rate": 0.00013231894253793475, "loss": 0.0288, "step": 173200 }, { "epoch": 1.12, "learning_rate": 0.00013230926118357783, "loss": 0.0351, "step": 173210 }, { "epoch": 1.12, "learning_rate": 0.0001322995798292209, "loss": 0.0331, "step": 173220 }, { "epoch": 1.12, "learning_rate": 0.00013228989847486396, "loss": 0.0327, "step": 173230 }, { "epoch": 1.12, "learning_rate": 0.00013228021712050704, "loss": 0.0307, "step": 173240 }, { "epoch": 1.12, "learning_rate": 0.0001322705357661501, "loss": 0.0275, "step": 173250 }, { "epoch": 1.12, "learning_rate": 0.00013226085441179317, "loss": 0.0314, "step": 173260 }, { "epoch": 1.12, "learning_rate": 0.00013225117305743622, "loss": 0.0328, "step": 173270 }, { "epoch": 1.12, "learning_rate": 0.0001322414917030793, "loss": 0.032, "step": 173280 }, { "epoch": 1.12, "learning_rate": 0.00013223181034872238, "loss": 0.0373, "step": 173290 }, { "epoch": 1.12, "learning_rate": 0.00013222212899436544, "loss": 0.0327, "step": 173300 }, { "epoch": 1.12, "learning_rate": 0.00013221244764000852, "loss": 0.0365, "step": 173310 }, { "epoch": 1.12, "learning_rate": 0.00013220276628565157, "loss": 0.0356, "step": 173320 }, { "epoch": 1.12, "learning_rate": 0.00013219308493129465, "loss": 0.0333, "step": 173330 }, { "epoch": 1.12, "learning_rate": 0.0001321834035769377, "loss": 0.0352, "step": 173340 }, { "epoch": 1.12, "learning_rate": 0.00013217372222258078, "loss": 0.0323, "step": 173350 }, { "epoch": 1.12, "learning_rate": 0.00013216404086822386, "loss": 0.0372, "step": 173360 }, { "epoch": 1.12, "learning_rate": 0.00013215435951386691, "loss": 0.0342, "step": 173370 }, { "epoch": 1.12, "learning_rate": 0.00013214467815951, "loss": 0.0358, "step": 173380 }, { "epoch": 1.12, "learning_rate": 0.00013213499680515305, "loss": 0.0349, "step": 173390 }, { "epoch": 1.12, "learning_rate": 0.00013212531545079613, "loss": 0.0345, "step": 173400 }, { "epoch": 1.12, "learning_rate": 0.00013211563409643918, "loss": 0.0321, "step": 173410 }, { "epoch": 1.12, "learning_rate": 0.00013210595274208226, "loss": 0.0299, "step": 173420 }, { "epoch": 1.12, "learning_rate": 0.00013209627138772534, "loss": 0.0345, "step": 173430 }, { "epoch": 1.12, "learning_rate": 0.0001320865900333684, "loss": 0.0334, "step": 173440 }, { "epoch": 1.12, "learning_rate": 0.00013207690867901144, "loss": 0.0281, "step": 173450 }, { "epoch": 1.12, "learning_rate": 0.00013206722732465452, "loss": 0.0302, "step": 173460 }, { "epoch": 1.12, "learning_rate": 0.0001320575459702976, "loss": 0.0295, "step": 173470 }, { "epoch": 1.12, "learning_rate": 0.00013204786461594066, "loss": 0.0344, "step": 173480 }, { "epoch": 1.12, "learning_rate": 0.00013203818326158374, "loss": 0.0352, "step": 173490 }, { "epoch": 1.12, "learning_rate": 0.00013202850190722682, "loss": 0.0314, "step": 173500 }, { "epoch": 1.12, "learning_rate": 0.00013201882055286987, "loss": 0.0426, "step": 173510 }, { "epoch": 1.12, "learning_rate": 0.00013200913919851292, "loss": 0.033, "step": 173520 }, { "epoch": 1.12, "learning_rate": 0.000131999457844156, "loss": 0.0363, "step": 173530 }, { "epoch": 1.12, "learning_rate": 0.00013198977648979908, "loss": 0.0371, "step": 173540 }, { "epoch": 1.12, "learning_rate": 0.00013198009513544213, "loss": 0.0359, "step": 173550 }, { "epoch": 1.12, "learning_rate": 0.0001319704137810852, "loss": 0.0368, "step": 173560 }, { "epoch": 1.12, "learning_rate": 0.00013196073242672827, "loss": 0.0345, "step": 173570 }, { "epoch": 1.12, "learning_rate": 0.00013195105107237135, "loss": 0.0341, "step": 173580 }, { "epoch": 1.12, "learning_rate": 0.0001319413697180144, "loss": 0.0335, "step": 173590 }, { "epoch": 1.12, "learning_rate": 0.00013193168836365748, "loss": 0.0358, "step": 173600 }, { "epoch": 1.12, "learning_rate": 0.00013192200700930056, "loss": 0.0286, "step": 173610 }, { "epoch": 1.12, "learning_rate": 0.0001319123256549436, "loss": 0.0321, "step": 173620 }, { "epoch": 1.12, "learning_rate": 0.0001319026443005867, "loss": 0.0282, "step": 173630 }, { "epoch": 1.12, "learning_rate": 0.00013189296294622974, "loss": 0.0333, "step": 173640 }, { "epoch": 1.12, "learning_rate": 0.0001318832815918728, "loss": 0.033, "step": 173650 }, { "epoch": 1.12, "learning_rate": 0.00013187360023751588, "loss": 0.032, "step": 173660 }, { "epoch": 1.12, "learning_rate": 0.00013186391888315896, "loss": 0.0301, "step": 173670 }, { "epoch": 1.12, "learning_rate": 0.00013185423752880204, "loss": 0.0303, "step": 173680 }, { "epoch": 1.12, "learning_rate": 0.0001318445561744451, "loss": 0.0378, "step": 173690 }, { "epoch": 1.12, "learning_rate": 0.00013183487482008817, "loss": 0.0328, "step": 173700 }, { "epoch": 1.12, "learning_rate": 0.00013182519346573122, "loss": 0.0338, "step": 173710 }, { "epoch": 1.12, "learning_rate": 0.00013181551211137427, "loss": 0.0294, "step": 173720 }, { "epoch": 1.12, "learning_rate": 0.00013180583075701735, "loss": 0.0325, "step": 173730 }, { "epoch": 1.12, "learning_rate": 0.00013179614940266043, "loss": 0.0297, "step": 173740 }, { "epoch": 1.12, "learning_rate": 0.0001317864680483035, "loss": 0.0367, "step": 173750 }, { "epoch": 1.12, "learning_rate": 0.00013177678669394657, "loss": 0.0339, "step": 173760 }, { "epoch": 1.12, "learning_rate": 0.00013176710533958962, "loss": 0.0341, "step": 173770 }, { "epoch": 1.12, "learning_rate": 0.0001317574239852327, "loss": 0.0347, "step": 173780 }, { "epoch": 1.12, "learning_rate": 0.00013174774263087575, "loss": 0.0312, "step": 173790 }, { "epoch": 1.12, "learning_rate": 0.00013173806127651883, "loss": 0.0367, "step": 173800 }, { "epoch": 1.12, "learning_rate": 0.0001317283799221619, "loss": 0.0366, "step": 173810 }, { "epoch": 1.12, "learning_rate": 0.00013171869856780496, "loss": 0.0316, "step": 173820 }, { "epoch": 1.12, "learning_rate": 0.00013170901721344804, "loss": 0.0329, "step": 173830 }, { "epoch": 1.12, "learning_rate": 0.0001316993358590911, "loss": 0.0327, "step": 173840 }, { "epoch": 1.12, "learning_rate": 0.00013168965450473417, "loss": 0.0364, "step": 173850 }, { "epoch": 1.12, "learning_rate": 0.00013167997315037723, "loss": 0.0363, "step": 173860 }, { "epoch": 1.12, "learning_rate": 0.0001316702917960203, "loss": 0.027, "step": 173870 }, { "epoch": 1.12, "learning_rate": 0.0001316606104416634, "loss": 0.0358, "step": 173880 }, { "epoch": 1.12, "learning_rate": 0.00013165092908730644, "loss": 0.0326, "step": 173890 }, { "epoch": 1.12, "learning_rate": 0.00013164124773294952, "loss": 0.0351, "step": 173900 }, { "epoch": 1.12, "learning_rate": 0.00013163156637859257, "loss": 0.0355, "step": 173910 }, { "epoch": 1.12, "learning_rate": 0.00013162188502423565, "loss": 0.0325, "step": 173920 }, { "epoch": 1.12, "learning_rate": 0.0001316122036698787, "loss": 0.0319, "step": 173930 }, { "epoch": 1.12, "learning_rate": 0.00013160252231552178, "loss": 0.038, "step": 173940 }, { "epoch": 1.12, "learning_rate": 0.00013159284096116486, "loss": 0.0319, "step": 173950 }, { "epoch": 1.12, "learning_rate": 0.00013158315960680792, "loss": 0.0368, "step": 173960 }, { "epoch": 1.12, "learning_rate": 0.00013157347825245097, "loss": 0.036, "step": 173970 }, { "epoch": 1.12, "learning_rate": 0.00013156379689809405, "loss": 0.0406, "step": 173980 }, { "epoch": 1.12, "learning_rate": 0.00013155411554373713, "loss": 0.034, "step": 173990 }, { "epoch": 1.12, "learning_rate": 0.00013154443418938018, "loss": 0.0339, "step": 174000 }, { "epoch": 1.12, "eval_cer": 0.9199159417015027, "eval_loss": 0.0237259678542614, "eval_runtime": 120.3788, "eval_samples_per_second": 16.614, "eval_steps_per_second": 4.154, "step": 174000 }, { "epoch": 1.12, "learning_rate": 0.00013153475283502326, "loss": 0.0352, "step": 174010 }, { "epoch": 1.12, "learning_rate": 0.00013152507148066631, "loss": 0.034, "step": 174020 }, { "epoch": 1.12, "learning_rate": 0.0001315153901263094, "loss": 0.0366, "step": 174030 }, { "epoch": 1.12, "learning_rate": 0.00013150570877195245, "loss": 0.0344, "step": 174040 }, { "epoch": 1.12, "learning_rate": 0.00013149602741759553, "loss": 0.0332, "step": 174050 }, { "epoch": 1.12, "learning_rate": 0.0001314863460632386, "loss": 0.0311, "step": 174060 }, { "epoch": 1.12, "learning_rate": 0.00013147666470888166, "loss": 0.0377, "step": 174070 }, { "epoch": 1.12, "learning_rate": 0.00013146698335452474, "loss": 0.034, "step": 174080 }, { "epoch": 1.12, "learning_rate": 0.0001314573020001678, "loss": 0.0359, "step": 174090 }, { "epoch": 1.12, "learning_rate": 0.00013144762064581087, "loss": 0.0361, "step": 174100 }, { "epoch": 1.12, "learning_rate": 0.00013143793929145392, "loss": 0.0343, "step": 174110 }, { "epoch": 1.12, "learning_rate": 0.000131428257937097, "loss": 0.0348, "step": 174120 }, { "epoch": 1.12, "learning_rate": 0.00013141857658274008, "loss": 0.0363, "step": 174130 }, { "epoch": 1.12, "learning_rate": 0.00013140889522838314, "loss": 0.0383, "step": 174140 }, { "epoch": 1.12, "learning_rate": 0.00013139921387402622, "loss": 0.0319, "step": 174150 }, { "epoch": 1.12, "learning_rate": 0.00013138953251966927, "loss": 0.0326, "step": 174160 }, { "epoch": 1.12, "learning_rate": 0.00013137985116531232, "loss": 0.0366, "step": 174170 }, { "epoch": 1.12, "learning_rate": 0.0001313701698109554, "loss": 0.0302, "step": 174180 }, { "epoch": 1.12, "learning_rate": 0.00013136048845659848, "loss": 0.0372, "step": 174190 }, { "epoch": 1.12, "learning_rate": 0.00013135080710224156, "loss": 0.0339, "step": 174200 }, { "epoch": 1.12, "learning_rate": 0.00013134112574788461, "loss": 0.0316, "step": 174210 }, { "epoch": 1.12, "learning_rate": 0.00013133144439352767, "loss": 0.0332, "step": 174220 }, { "epoch": 1.12, "learning_rate": 0.00013132176303917075, "loss": 0.0353, "step": 174230 }, { "epoch": 1.12, "learning_rate": 0.0001313120816848138, "loss": 0.0442, "step": 174240 }, { "epoch": 1.12, "learning_rate": 0.00013130240033045688, "loss": 0.0302, "step": 174250 }, { "epoch": 1.12, "learning_rate": 0.00013129271897609996, "loss": 0.0368, "step": 174260 }, { "epoch": 1.12, "learning_rate": 0.00013128303762174304, "loss": 0.0331, "step": 174270 }, { "epoch": 1.12, "learning_rate": 0.0001312733562673861, "loss": 0.043, "step": 174280 }, { "epoch": 1.12, "learning_rate": 0.00013126367491302914, "loss": 0.0365, "step": 174290 }, { "epoch": 1.12, "learning_rate": 0.00013125399355867222, "loss": 0.0367, "step": 174300 }, { "epoch": 1.13, "learning_rate": 0.00013124431220431528, "loss": 0.0319, "step": 174310 }, { "epoch": 1.13, "learning_rate": 0.00013123463084995836, "loss": 0.0333, "step": 174320 }, { "epoch": 1.13, "learning_rate": 0.00013122494949560144, "loss": 0.034, "step": 174330 }, { "epoch": 1.13, "learning_rate": 0.0001312152681412445, "loss": 0.0295, "step": 174340 }, { "epoch": 1.13, "learning_rate": 0.00013120558678688757, "loss": 0.0365, "step": 174350 }, { "epoch": 1.13, "learning_rate": 0.00013119590543253062, "loss": 0.0343, "step": 174360 }, { "epoch": 1.13, "learning_rate": 0.0001311862240781737, "loss": 0.0302, "step": 174370 }, { "epoch": 1.13, "learning_rate": 0.00013117654272381675, "loss": 0.0328, "step": 174380 }, { "epoch": 1.13, "learning_rate": 0.00013116686136945983, "loss": 0.0348, "step": 174390 }, { "epoch": 1.13, "learning_rate": 0.0001311571800151029, "loss": 0.0378, "step": 174400 }, { "epoch": 1.13, "learning_rate": 0.00013114749866074597, "loss": 0.0356, "step": 174410 }, { "epoch": 1.13, "learning_rate": 0.00013113781730638902, "loss": 0.0313, "step": 174420 }, { "epoch": 1.13, "learning_rate": 0.0001311281359520321, "loss": 0.0357, "step": 174430 }, { "epoch": 1.13, "learning_rate": 0.00013111845459767518, "loss": 0.0483, "step": 174440 }, { "epoch": 1.13, "learning_rate": 0.00013110877324331823, "loss": 0.0275, "step": 174450 }, { "epoch": 1.13, "learning_rate": 0.0001310990918889613, "loss": 0.0361, "step": 174460 }, { "epoch": 1.13, "learning_rate": 0.0001310894105346044, "loss": 0.0319, "step": 174470 }, { "epoch": 1.13, "learning_rate": 0.00013107972918024744, "loss": 0.0294, "step": 174480 }, { "epoch": 1.13, "learning_rate": 0.0001310700478258905, "loss": 0.0392, "step": 174490 }, { "epoch": 1.13, "learning_rate": 0.00013106036647153358, "loss": 0.0364, "step": 174500 }, { "epoch": 1.13, "learning_rate": 0.00013105068511717666, "loss": 0.0306, "step": 174510 }, { "epoch": 1.13, "learning_rate": 0.0001310410037628197, "loss": 0.0295, "step": 174520 }, { "epoch": 1.13, "learning_rate": 0.0001310313224084628, "loss": 0.0345, "step": 174530 }, { "epoch": 1.13, "learning_rate": 0.00013102164105410584, "loss": 0.0344, "step": 174540 }, { "epoch": 1.13, "learning_rate": 0.00013101195969974892, "loss": 0.0346, "step": 174550 }, { "epoch": 1.13, "learning_rate": 0.00013100227834539197, "loss": 0.0325, "step": 174560 }, { "epoch": 1.13, "learning_rate": 0.00013099259699103505, "loss": 0.0334, "step": 174570 }, { "epoch": 1.13, "learning_rate": 0.00013098291563667813, "loss": 0.0329, "step": 174580 }, { "epoch": 1.13, "learning_rate": 0.00013097323428232119, "loss": 0.0289, "step": 174590 }, { "epoch": 1.13, "learning_rate": 0.00013096355292796426, "loss": 0.0311, "step": 174600 }, { "epoch": 1.13, "learning_rate": 0.00013095387157360732, "loss": 0.0359, "step": 174610 }, { "epoch": 1.13, "learning_rate": 0.0001309441902192504, "loss": 0.037, "step": 174620 }, { "epoch": 1.13, "learning_rate": 0.00013093450886489345, "loss": 0.034, "step": 174630 }, { "epoch": 1.13, "learning_rate": 0.00013092482751053653, "loss": 0.0352, "step": 174640 }, { "epoch": 1.13, "learning_rate": 0.0001309151461561796, "loss": 0.038, "step": 174650 }, { "epoch": 1.13, "learning_rate": 0.00013090546480182266, "loss": 0.0338, "step": 174660 }, { "epoch": 1.13, "learning_rate": 0.00013089578344746574, "loss": 0.0315, "step": 174670 }, { "epoch": 1.13, "learning_rate": 0.0001308861020931088, "loss": 0.0321, "step": 174680 }, { "epoch": 1.13, "learning_rate": 0.00013087642073875187, "loss": 0.035, "step": 174690 }, { "epoch": 1.13, "learning_rate": 0.00013086673938439493, "loss": 0.0314, "step": 174700 }, { "epoch": 1.13, "learning_rate": 0.000130857058030038, "loss": 0.0268, "step": 174710 }, { "epoch": 1.13, "learning_rate": 0.0001308473766756811, "loss": 0.037, "step": 174720 }, { "epoch": 1.13, "learning_rate": 0.00013083769532132414, "loss": 0.0311, "step": 174730 }, { "epoch": 1.13, "learning_rate": 0.0001308280139669672, "loss": 0.0354, "step": 174740 }, { "epoch": 1.13, "learning_rate": 0.00013081833261261027, "loss": 0.0254, "step": 174750 }, { "epoch": 1.13, "learning_rate": 0.00013080865125825335, "loss": 0.0355, "step": 174760 }, { "epoch": 1.13, "learning_rate": 0.0001307989699038964, "loss": 0.0286, "step": 174770 }, { "epoch": 1.13, "learning_rate": 0.00013078928854953948, "loss": 0.0319, "step": 174780 }, { "epoch": 1.13, "learning_rate": 0.00013077960719518256, "loss": 0.0308, "step": 174790 }, { "epoch": 1.13, "learning_rate": 0.00013076992584082562, "loss": 0.0341, "step": 174800 }, { "epoch": 1.13, "learning_rate": 0.00013076024448646867, "loss": 0.0301, "step": 174810 }, { "epoch": 1.13, "learning_rate": 0.00013075056313211175, "loss": 0.0337, "step": 174820 }, { "epoch": 1.13, "learning_rate": 0.00013074088177775483, "loss": 0.0404, "step": 174830 }, { "epoch": 1.13, "learning_rate": 0.00013073120042339788, "loss": 0.0337, "step": 174840 }, { "epoch": 1.13, "learning_rate": 0.00013072151906904096, "loss": 0.043, "step": 174850 }, { "epoch": 1.13, "learning_rate": 0.00013071183771468401, "loss": 0.0414, "step": 174860 }, { "epoch": 1.13, "learning_rate": 0.0001307021563603271, "loss": 0.0317, "step": 174870 }, { "epoch": 1.13, "learning_rate": 0.00013069247500597015, "loss": 0.0357, "step": 174880 }, { "epoch": 1.13, "learning_rate": 0.00013068279365161323, "loss": 0.0308, "step": 174890 }, { "epoch": 1.13, "learning_rate": 0.0001306731122972563, "loss": 0.0335, "step": 174900 }, { "epoch": 1.13, "learning_rate": 0.00013066343094289936, "loss": 0.0325, "step": 174910 }, { "epoch": 1.13, "learning_rate": 0.00013065374958854244, "loss": 0.0371, "step": 174920 }, { "epoch": 1.13, "learning_rate": 0.0001306440682341855, "loss": 0.0341, "step": 174930 }, { "epoch": 1.13, "learning_rate": 0.00013063438687982854, "loss": 0.0352, "step": 174940 }, { "epoch": 1.13, "learning_rate": 0.00013062470552547162, "loss": 0.0365, "step": 174950 }, { "epoch": 1.13, "learning_rate": 0.0001306150241711147, "loss": 0.0393, "step": 174960 }, { "epoch": 1.13, "learning_rate": 0.00013060534281675778, "loss": 0.033, "step": 174970 }, { "epoch": 1.13, "learning_rate": 0.00013059566146240084, "loss": 0.0382, "step": 174980 }, { "epoch": 1.13, "learning_rate": 0.00013058598010804392, "loss": 0.0389, "step": 174990 }, { "epoch": 1.13, "learning_rate": 0.00013057629875368697, "loss": 0.0319, "step": 175000 }, { "epoch": 1.13, "eval_cer": 0.919877979889278, "eval_loss": 0.02397312968969345, "eval_runtime": 120.0597, "eval_samples_per_second": 16.658, "eval_steps_per_second": 4.165, "step": 175000 }, { "epoch": 1.13, "learning_rate": 0.00013056661739933002, "loss": 0.0353, "step": 175010 }, { "epoch": 1.13, "learning_rate": 0.0001305569360449731, "loss": 0.0348, "step": 175020 }, { "epoch": 1.13, "learning_rate": 0.00013054725469061618, "loss": 0.033, "step": 175030 }, { "epoch": 1.13, "learning_rate": 0.00013053757333625926, "loss": 0.0311, "step": 175040 }, { "epoch": 1.13, "learning_rate": 0.0001305278919819023, "loss": 0.0347, "step": 175050 }, { "epoch": 1.13, "learning_rate": 0.00013051821062754537, "loss": 0.0364, "step": 175060 }, { "epoch": 1.13, "learning_rate": 0.00013050852927318845, "loss": 0.0294, "step": 175070 }, { "epoch": 1.13, "learning_rate": 0.0001304988479188315, "loss": 0.0339, "step": 175080 }, { "epoch": 1.13, "learning_rate": 0.00013048916656447458, "loss": 0.0276, "step": 175090 }, { "epoch": 1.13, "learning_rate": 0.00013047948521011766, "loss": 0.03, "step": 175100 }, { "epoch": 1.13, "learning_rate": 0.0001304698038557607, "loss": 0.0315, "step": 175110 }, { "epoch": 1.13, "learning_rate": 0.0001304601225014038, "loss": 0.0339, "step": 175120 }, { "epoch": 1.13, "learning_rate": 0.00013045044114704684, "loss": 0.0343, "step": 175130 }, { "epoch": 1.13, "learning_rate": 0.00013044075979268992, "loss": 0.0279, "step": 175140 }, { "epoch": 1.13, "learning_rate": 0.00013043107843833298, "loss": 0.0371, "step": 175150 }, { "epoch": 1.13, "learning_rate": 0.00013042139708397606, "loss": 0.0344, "step": 175160 }, { "epoch": 1.13, "learning_rate": 0.00013041171572961914, "loss": 0.0362, "step": 175170 }, { "epoch": 1.13, "learning_rate": 0.0001304020343752622, "loss": 0.0308, "step": 175180 }, { "epoch": 1.13, "learning_rate": 0.00013039235302090527, "loss": 0.0371, "step": 175190 }, { "epoch": 1.13, "learning_rate": 0.00013038267166654832, "loss": 0.0369, "step": 175200 }, { "epoch": 1.13, "learning_rate": 0.0001303729903121914, "loss": 0.0312, "step": 175210 }, { "epoch": 1.13, "learning_rate": 0.00013036330895783445, "loss": 0.0325, "step": 175220 }, { "epoch": 1.13, "learning_rate": 0.00013035362760347753, "loss": 0.0351, "step": 175230 }, { "epoch": 1.13, "learning_rate": 0.0001303439462491206, "loss": 0.0323, "step": 175240 }, { "epoch": 1.13, "learning_rate": 0.00013033426489476367, "loss": 0.0375, "step": 175250 }, { "epoch": 1.13, "learning_rate": 0.00013032458354040672, "loss": 0.0378, "step": 175260 }, { "epoch": 1.13, "learning_rate": 0.0001303149021860498, "loss": 0.0388, "step": 175270 }, { "epoch": 1.13, "learning_rate": 0.00013030522083169288, "loss": 0.0283, "step": 175280 }, { "epoch": 1.13, "learning_rate": 0.00013029553947733593, "loss": 0.0351, "step": 175290 }, { "epoch": 1.13, "learning_rate": 0.000130285858122979, "loss": 0.0305, "step": 175300 }, { "epoch": 1.13, "learning_rate": 0.00013027617676862206, "loss": 0.0288, "step": 175310 }, { "epoch": 1.13, "learning_rate": 0.00013026649541426514, "loss": 0.0328, "step": 175320 }, { "epoch": 1.13, "learning_rate": 0.0001302568140599082, "loss": 0.0343, "step": 175330 }, { "epoch": 1.13, "learning_rate": 0.00013024713270555128, "loss": 0.0327, "step": 175340 }, { "epoch": 1.13, "learning_rate": 0.00013023745135119435, "loss": 0.0286, "step": 175350 }, { "epoch": 1.13, "learning_rate": 0.0001302277699968374, "loss": 0.0326, "step": 175360 }, { "epoch": 1.13, "learning_rate": 0.0001302180886424805, "loss": 0.0313, "step": 175370 }, { "epoch": 1.13, "learning_rate": 0.00013020840728812354, "loss": 0.037, "step": 175380 }, { "epoch": 1.13, "learning_rate": 0.00013019872593376662, "loss": 0.0359, "step": 175390 }, { "epoch": 1.13, "learning_rate": 0.00013018904457940967, "loss": 0.0415, "step": 175400 }, { "epoch": 1.13, "learning_rate": 0.00013017936322505275, "loss": 0.0319, "step": 175410 }, { "epoch": 1.13, "learning_rate": 0.00013016968187069583, "loss": 0.0282, "step": 175420 }, { "epoch": 1.13, "learning_rate": 0.00013016000051633888, "loss": 0.0297, "step": 175430 }, { "epoch": 1.13, "learning_rate": 0.00013015031916198196, "loss": 0.036, "step": 175440 }, { "epoch": 1.13, "learning_rate": 0.00013014063780762502, "loss": 0.0337, "step": 175450 }, { "epoch": 1.13, "learning_rate": 0.0001301309564532681, "loss": 0.0391, "step": 175460 }, { "epoch": 1.13, "learning_rate": 0.00013012127509891115, "loss": 0.0305, "step": 175470 }, { "epoch": 1.13, "learning_rate": 0.00013011159374455423, "loss": 0.0329, "step": 175480 }, { "epoch": 1.13, "learning_rate": 0.0001301019123901973, "loss": 0.0361, "step": 175490 }, { "epoch": 1.13, "learning_rate": 0.00013009223103584036, "loss": 0.0313, "step": 175500 }, { "epoch": 1.13, "learning_rate": 0.00013008254968148341, "loss": 0.0354, "step": 175510 }, { "epoch": 1.13, "learning_rate": 0.0001300728683271265, "loss": 0.0278, "step": 175520 }, { "epoch": 1.13, "learning_rate": 0.00013006318697276957, "loss": 0.0384, "step": 175530 }, { "epoch": 1.13, "learning_rate": 0.00013005350561841263, "loss": 0.0324, "step": 175540 }, { "epoch": 1.13, "learning_rate": 0.0001300438242640557, "loss": 0.0398, "step": 175550 }, { "epoch": 1.13, "learning_rate": 0.0001300341429096988, "loss": 0.0349, "step": 175560 }, { "epoch": 1.13, "learning_rate": 0.00013002446155534184, "loss": 0.0332, "step": 175570 }, { "epoch": 1.13, "learning_rate": 0.0001300147802009849, "loss": 0.0267, "step": 175580 }, { "epoch": 1.13, "learning_rate": 0.00013000509884662797, "loss": 0.0336, "step": 175590 }, { "epoch": 1.13, "learning_rate": 0.00012999541749227105, "loss": 0.0286, "step": 175600 }, { "epoch": 1.13, "learning_rate": 0.0001299857361379141, "loss": 0.0293, "step": 175610 }, { "epoch": 1.13, "learning_rate": 0.00012997605478355718, "loss": 0.0324, "step": 175620 }, { "epoch": 1.13, "learning_rate": 0.00012996637342920024, "loss": 0.0304, "step": 175630 }, { "epoch": 1.13, "learning_rate": 0.00012995669207484332, "loss": 0.0337, "step": 175640 }, { "epoch": 1.13, "learning_rate": 0.00012994701072048637, "loss": 0.0302, "step": 175650 }, { "epoch": 1.13, "learning_rate": 0.00012993732936612945, "loss": 0.0301, "step": 175660 }, { "epoch": 1.13, "learning_rate": 0.00012992764801177253, "loss": 0.0327, "step": 175670 }, { "epoch": 1.13, "learning_rate": 0.00012991796665741558, "loss": 0.0408, "step": 175680 }, { "epoch": 1.13, "learning_rate": 0.00012990828530305866, "loss": 0.0317, "step": 175690 }, { "epoch": 1.13, "learning_rate": 0.00012989860394870171, "loss": 0.036, "step": 175700 }, { "epoch": 1.13, "learning_rate": 0.00012988892259434477, "loss": 0.0295, "step": 175710 }, { "epoch": 1.13, "learning_rate": 0.00012987924123998785, "loss": 0.0311, "step": 175720 }, { "epoch": 1.13, "learning_rate": 0.00012986955988563093, "loss": 0.0295, "step": 175730 }, { "epoch": 1.13, "learning_rate": 0.000129859878531274, "loss": 0.0322, "step": 175740 }, { "epoch": 1.13, "learning_rate": 0.00012985019717691706, "loss": 0.0348, "step": 175750 }, { "epoch": 1.13, "learning_rate": 0.00012984051582256014, "loss": 0.0276, "step": 175760 }, { "epoch": 1.13, "learning_rate": 0.0001298308344682032, "loss": 0.0319, "step": 175770 }, { "epoch": 1.13, "learning_rate": 0.00012982115311384624, "loss": 0.0343, "step": 175780 }, { "epoch": 1.13, "learning_rate": 0.00012981147175948932, "loss": 0.0313, "step": 175790 }, { "epoch": 1.13, "learning_rate": 0.0001298017904051324, "loss": 0.0284, "step": 175800 }, { "epoch": 1.13, "learning_rate": 0.00012979210905077548, "loss": 0.0317, "step": 175810 }, { "epoch": 1.13, "learning_rate": 0.00012978242769641854, "loss": 0.0316, "step": 175820 }, { "epoch": 1.13, "learning_rate": 0.0001297727463420616, "loss": 0.0286, "step": 175830 }, { "epoch": 1.13, "learning_rate": 0.00012976306498770467, "loss": 0.0374, "step": 175840 }, { "epoch": 1.13, "learning_rate": 0.00012975338363334772, "loss": 0.0368, "step": 175850 }, { "epoch": 1.14, "learning_rate": 0.0001297437022789908, "loss": 0.0359, "step": 175860 }, { "epoch": 1.14, "learning_rate": 0.00012973402092463388, "loss": 0.0326, "step": 175870 }, { "epoch": 1.14, "learning_rate": 0.00012972433957027696, "loss": 0.0283, "step": 175880 }, { "epoch": 1.14, "learning_rate": 0.00012971465821592, "loss": 0.035, "step": 175890 }, { "epoch": 1.14, "learning_rate": 0.00012970497686156307, "loss": 0.0304, "step": 175900 }, { "epoch": 1.14, "learning_rate": 0.00012969529550720615, "loss": 0.0334, "step": 175910 }, { "epoch": 1.14, "learning_rate": 0.0001296856141528492, "loss": 0.034, "step": 175920 }, { "epoch": 1.14, "learning_rate": 0.00012967593279849228, "loss": 0.0319, "step": 175930 }, { "epoch": 1.14, "learning_rate": 0.00012966625144413536, "loss": 0.0338, "step": 175940 }, { "epoch": 1.14, "learning_rate": 0.0001296565700897784, "loss": 0.0277, "step": 175950 }, { "epoch": 1.14, "learning_rate": 0.0001296468887354215, "loss": 0.0338, "step": 175960 }, { "epoch": 1.14, "learning_rate": 0.00012963720738106454, "loss": 0.0318, "step": 175970 }, { "epoch": 1.14, "learning_rate": 0.00012962752602670762, "loss": 0.0329, "step": 175980 }, { "epoch": 1.14, "learning_rate": 0.00012961784467235068, "loss": 0.0344, "step": 175990 }, { "epoch": 1.14, "learning_rate": 0.00012960816331799376, "loss": 0.0391, "step": 176000 }, { "epoch": 1.14, "eval_cer": 0.919873460625918, "eval_loss": 0.024145476520061493, "eval_runtime": 120.3294, "eval_samples_per_second": 16.621, "eval_steps_per_second": 4.155, "step": 176000 }, { "epoch": 1.14, "learning_rate": 0.00012959848196363684, "loss": 0.0324, "step": 176010 }, { "epoch": 1.14, "learning_rate": 0.0001295888006092799, "loss": 0.0371, "step": 176020 }, { "epoch": 1.14, "learning_rate": 0.00012957911925492294, "loss": 0.0411, "step": 176030 }, { "epoch": 1.14, "learning_rate": 0.00012956943790056602, "loss": 0.0299, "step": 176040 }, { "epoch": 1.14, "learning_rate": 0.0001295597565462091, "loss": 0.0317, "step": 176050 }, { "epoch": 1.14, "learning_rate": 0.00012955007519185215, "loss": 0.0347, "step": 176060 }, { "epoch": 1.14, "learning_rate": 0.00012954039383749523, "loss": 0.0362, "step": 176070 }, { "epoch": 1.14, "learning_rate": 0.0001295307124831383, "loss": 0.0379, "step": 176080 }, { "epoch": 1.14, "learning_rate": 0.00012952103112878136, "loss": 0.0341, "step": 176090 }, { "epoch": 1.14, "learning_rate": 0.00012951134977442442, "loss": 0.0313, "step": 176100 }, { "epoch": 1.14, "learning_rate": 0.0001295016684200675, "loss": 0.0337, "step": 176110 }, { "epoch": 1.14, "learning_rate": 0.00012949198706571058, "loss": 0.0312, "step": 176120 }, { "epoch": 1.14, "learning_rate": 0.00012948230571135363, "loss": 0.0362, "step": 176130 }, { "epoch": 1.14, "learning_rate": 0.0001294726243569967, "loss": 0.033, "step": 176140 }, { "epoch": 1.14, "learning_rate": 0.00012946294300263976, "loss": 0.0342, "step": 176150 }, { "epoch": 1.14, "learning_rate": 0.00012945326164828284, "loss": 0.0309, "step": 176160 }, { "epoch": 1.14, "learning_rate": 0.0001294435802939259, "loss": 0.0338, "step": 176170 }, { "epoch": 1.14, "learning_rate": 0.00012943389893956897, "loss": 0.0345, "step": 176180 }, { "epoch": 1.14, "learning_rate": 0.00012942421758521205, "loss": 0.0318, "step": 176190 }, { "epoch": 1.14, "learning_rate": 0.0001294145362308551, "loss": 0.0362, "step": 176200 }, { "epoch": 1.14, "learning_rate": 0.0001294048548764982, "loss": 0.0335, "step": 176210 }, { "epoch": 1.14, "learning_rate": 0.00012939517352214124, "loss": 0.033, "step": 176220 }, { "epoch": 1.14, "learning_rate": 0.00012938549216778432, "loss": 0.0354, "step": 176230 }, { "epoch": 1.14, "learning_rate": 0.00012937581081342737, "loss": 0.0346, "step": 176240 }, { "epoch": 1.14, "learning_rate": 0.00012936612945907045, "loss": 0.0364, "step": 176250 }, { "epoch": 1.14, "learning_rate": 0.00012935644810471353, "loss": 0.0395, "step": 176260 }, { "epoch": 1.14, "learning_rate": 0.00012934676675035658, "loss": 0.0298, "step": 176270 }, { "epoch": 1.14, "learning_rate": 0.00012933708539599966, "loss": 0.0289, "step": 176280 }, { "epoch": 1.14, "learning_rate": 0.00012932740404164272, "loss": 0.0331, "step": 176290 }, { "epoch": 1.14, "learning_rate": 0.0001293177226872858, "loss": 0.032, "step": 176300 }, { "epoch": 1.14, "learning_rate": 0.00012930804133292885, "loss": 0.0302, "step": 176310 }, { "epoch": 1.14, "learning_rate": 0.00012929835997857193, "loss": 0.0326, "step": 176320 }, { "epoch": 1.14, "learning_rate": 0.000129288678624215, "loss": 0.0304, "step": 176330 }, { "epoch": 1.14, "learning_rate": 0.00012927899726985806, "loss": 0.0303, "step": 176340 }, { "epoch": 1.14, "learning_rate": 0.00012926931591550111, "loss": 0.0376, "step": 176350 }, { "epoch": 1.14, "learning_rate": 0.0001292596345611442, "loss": 0.0304, "step": 176360 }, { "epoch": 1.14, "learning_rate": 0.00012924995320678727, "loss": 0.0346, "step": 176370 }, { "epoch": 1.14, "learning_rate": 0.00012924027185243033, "loss": 0.0335, "step": 176380 }, { "epoch": 1.14, "learning_rate": 0.0001292305904980734, "loss": 0.0311, "step": 176390 }, { "epoch": 1.14, "learning_rate": 0.00012922090914371646, "loss": 0.0318, "step": 176400 }, { "epoch": 1.14, "learning_rate": 0.00012921122778935954, "loss": 0.0396, "step": 176410 }, { "epoch": 1.14, "learning_rate": 0.0001292015464350026, "loss": 0.0323, "step": 176420 }, { "epoch": 1.14, "learning_rate": 0.00012919186508064567, "loss": 0.0321, "step": 176430 }, { "epoch": 1.14, "learning_rate": 0.00012918218372628875, "loss": 0.0309, "step": 176440 }, { "epoch": 1.14, "learning_rate": 0.0001291725023719318, "loss": 0.0313, "step": 176450 }, { "epoch": 1.14, "learning_rate": 0.00012916282101757488, "loss": 0.0326, "step": 176460 }, { "epoch": 1.14, "learning_rate": 0.00012915313966321794, "loss": 0.0359, "step": 176470 }, { "epoch": 1.14, "learning_rate": 0.00012914345830886102, "loss": 0.0332, "step": 176480 }, { "epoch": 1.14, "learning_rate": 0.00012913377695450407, "loss": 0.035, "step": 176490 }, { "epoch": 1.14, "learning_rate": 0.00012912409560014715, "loss": 0.0386, "step": 176500 }, { "epoch": 1.14, "learning_rate": 0.00012911441424579023, "loss": 0.0308, "step": 176510 }, { "epoch": 1.14, "learning_rate": 0.00012910473289143328, "loss": 0.0279, "step": 176520 }, { "epoch": 1.14, "learning_rate": 0.00012909505153707636, "loss": 0.0297, "step": 176530 }, { "epoch": 1.14, "learning_rate": 0.0001290853701827194, "loss": 0.0397, "step": 176540 }, { "epoch": 1.14, "learning_rate": 0.00012907568882836247, "loss": 0.0384, "step": 176550 }, { "epoch": 1.14, "learning_rate": 0.00012906600747400555, "loss": 0.0304, "step": 176560 }, { "epoch": 1.14, "learning_rate": 0.00012905632611964863, "loss": 0.0346, "step": 176570 }, { "epoch": 1.14, "learning_rate": 0.0001290466447652917, "loss": 0.0334, "step": 176580 }, { "epoch": 1.14, "learning_rate": 0.00012903696341093476, "loss": 0.0387, "step": 176590 }, { "epoch": 1.14, "learning_rate": 0.0001290272820565778, "loss": 0.0328, "step": 176600 }, { "epoch": 1.14, "learning_rate": 0.0001290176007022209, "loss": 0.0344, "step": 176610 }, { "epoch": 1.14, "learning_rate": 0.00012900791934786394, "loss": 0.0396, "step": 176620 }, { "epoch": 1.14, "learning_rate": 0.00012899823799350702, "loss": 0.0326, "step": 176630 }, { "epoch": 1.14, "learning_rate": 0.0001289885566391501, "loss": 0.0301, "step": 176640 }, { "epoch": 1.14, "learning_rate": 0.00012897887528479318, "loss": 0.0465, "step": 176650 }, { "epoch": 1.14, "learning_rate": 0.00012896919393043624, "loss": 0.0371, "step": 176660 }, { "epoch": 1.14, "learning_rate": 0.0001289595125760793, "loss": 0.0412, "step": 176670 }, { "epoch": 1.14, "learning_rate": 0.00012894983122172237, "loss": 0.0344, "step": 176680 }, { "epoch": 1.14, "learning_rate": 0.00012894014986736542, "loss": 0.0342, "step": 176690 }, { "epoch": 1.14, "learning_rate": 0.0001289304685130085, "loss": 0.0394, "step": 176700 }, { "epoch": 1.14, "learning_rate": 0.00012892078715865158, "loss": 0.0314, "step": 176710 }, { "epoch": 1.14, "learning_rate": 0.00012891110580429463, "loss": 0.0328, "step": 176720 }, { "epoch": 1.14, "learning_rate": 0.0001289014244499377, "loss": 0.0313, "step": 176730 }, { "epoch": 1.14, "learning_rate": 0.00012889174309558077, "loss": 0.0303, "step": 176740 }, { "epoch": 1.14, "learning_rate": 0.00012888206174122385, "loss": 0.0294, "step": 176750 }, { "epoch": 1.14, "learning_rate": 0.0001288723803868669, "loss": 0.0377, "step": 176760 }, { "epoch": 1.14, "learning_rate": 0.00012886269903250998, "loss": 0.0285, "step": 176770 }, { "epoch": 1.14, "learning_rate": 0.00012885301767815306, "loss": 0.0316, "step": 176780 }, { "epoch": 1.14, "learning_rate": 0.0001288433363237961, "loss": 0.0362, "step": 176790 }, { "epoch": 1.14, "learning_rate": 0.00012883365496943916, "loss": 0.0398, "step": 176800 }, { "epoch": 1.14, "learning_rate": 0.00012882397361508224, "loss": 0.0315, "step": 176810 }, { "epoch": 1.14, "learning_rate": 0.00012881429226072532, "loss": 0.034, "step": 176820 }, { "epoch": 1.14, "learning_rate": 0.00012880461090636838, "loss": 0.035, "step": 176830 }, { "epoch": 1.14, "learning_rate": 0.00012879492955201145, "loss": 0.0297, "step": 176840 }, { "epoch": 1.14, "learning_rate": 0.00012878524819765453, "loss": 0.031, "step": 176850 }, { "epoch": 1.14, "learning_rate": 0.0001287755668432976, "loss": 0.0299, "step": 176860 }, { "epoch": 1.14, "learning_rate": 0.00012876588548894064, "loss": 0.0291, "step": 176870 }, { "epoch": 1.14, "learning_rate": 0.00012875620413458372, "loss": 0.0284, "step": 176880 }, { "epoch": 1.14, "learning_rate": 0.0001287465227802268, "loss": 0.0324, "step": 176890 }, { "epoch": 1.14, "learning_rate": 0.00012873684142586985, "loss": 0.0319, "step": 176900 }, { "epoch": 1.14, "learning_rate": 0.00012872716007151293, "loss": 0.0289, "step": 176910 }, { "epoch": 1.14, "learning_rate": 0.00012871747871715598, "loss": 0.0324, "step": 176920 }, { "epoch": 1.14, "learning_rate": 0.00012870779736279906, "loss": 0.0286, "step": 176930 }, { "epoch": 1.14, "learning_rate": 0.00012869811600844212, "loss": 0.0299, "step": 176940 }, { "epoch": 1.14, "learning_rate": 0.0001286884346540852, "loss": 0.0372, "step": 176950 }, { "epoch": 1.14, "learning_rate": 0.00012867875329972828, "loss": 0.0301, "step": 176960 }, { "epoch": 1.14, "learning_rate": 0.00012866907194537133, "loss": 0.0335, "step": 176970 }, { "epoch": 1.14, "learning_rate": 0.0001286593905910144, "loss": 0.0344, "step": 176980 }, { "epoch": 1.14, "learning_rate": 0.00012864970923665746, "loss": 0.0358, "step": 176990 }, { "epoch": 1.14, "learning_rate": 0.00012864002788230054, "loss": 0.0325, "step": 177000 }, { "epoch": 1.14, "eval_cer": 0.9199520958083832, "eval_loss": 0.023923007771372795, "eval_runtime": 120.1567, "eval_samples_per_second": 16.645, "eval_steps_per_second": 4.161, "step": 177000 }, { "epoch": 1.14, "learning_rate": 0.0001286303465279436, "loss": 0.0333, "step": 177010 }, { "epoch": 1.14, "learning_rate": 0.00012862066517358667, "loss": 0.0348, "step": 177020 }, { "epoch": 1.14, "learning_rate": 0.00012861098381922975, "loss": 0.0363, "step": 177030 }, { "epoch": 1.14, "learning_rate": 0.0001286013024648728, "loss": 0.0368, "step": 177040 }, { "epoch": 1.14, "learning_rate": 0.0001285916211105159, "loss": 0.0334, "step": 177050 }, { "epoch": 1.14, "learning_rate": 0.00012858193975615894, "loss": 0.0297, "step": 177060 }, { "epoch": 1.14, "learning_rate": 0.00012857225840180202, "loss": 0.0342, "step": 177070 }, { "epoch": 1.14, "learning_rate": 0.00012856257704744507, "loss": 0.0317, "step": 177080 }, { "epoch": 1.14, "learning_rate": 0.00012855289569308815, "loss": 0.0352, "step": 177090 }, { "epoch": 1.14, "learning_rate": 0.00012854321433873123, "loss": 0.0324, "step": 177100 }, { "epoch": 1.14, "learning_rate": 0.00012853353298437428, "loss": 0.0362, "step": 177110 }, { "epoch": 1.14, "learning_rate": 0.00012852385163001734, "loss": 0.0274, "step": 177120 }, { "epoch": 1.14, "learning_rate": 0.00012851417027566042, "loss": 0.0321, "step": 177130 }, { "epoch": 1.14, "learning_rate": 0.0001285044889213035, "loss": 0.033, "step": 177140 }, { "epoch": 1.14, "learning_rate": 0.00012849480756694655, "loss": 0.0288, "step": 177150 }, { "epoch": 1.14, "learning_rate": 0.00012848512621258963, "loss": 0.0337, "step": 177160 }, { "epoch": 1.14, "learning_rate": 0.0001284754448582327, "loss": 0.0328, "step": 177170 }, { "epoch": 1.14, "learning_rate": 0.00012846576350387576, "loss": 0.0343, "step": 177180 }, { "epoch": 1.14, "learning_rate": 0.00012845608214951881, "loss": 0.035, "step": 177190 }, { "epoch": 1.14, "learning_rate": 0.0001284464007951619, "loss": 0.036, "step": 177200 }, { "epoch": 1.14, "learning_rate": 0.00012843671944080497, "loss": 0.0407, "step": 177210 }, { "epoch": 1.14, "learning_rate": 0.00012842703808644803, "loss": 0.0376, "step": 177220 }, { "epoch": 1.14, "learning_rate": 0.0001284173567320911, "loss": 0.0297, "step": 177230 }, { "epoch": 1.14, "learning_rate": 0.00012840767537773416, "loss": 0.0311, "step": 177240 }, { "epoch": 1.14, "learning_rate": 0.00012839799402337724, "loss": 0.0329, "step": 177250 }, { "epoch": 1.14, "learning_rate": 0.0001283883126690203, "loss": 0.0411, "step": 177260 }, { "epoch": 1.14, "learning_rate": 0.00012837863131466337, "loss": 0.0309, "step": 177270 }, { "epoch": 1.14, "learning_rate": 0.00012836894996030645, "loss": 0.0346, "step": 177280 }, { "epoch": 1.14, "learning_rate": 0.0001283592686059495, "loss": 0.0346, "step": 177290 }, { "epoch": 1.14, "learning_rate": 0.00012834958725159258, "loss": 0.033, "step": 177300 }, { "epoch": 1.14, "learning_rate": 0.00012833990589723564, "loss": 0.0335, "step": 177310 }, { "epoch": 1.14, "learning_rate": 0.0001283302245428787, "loss": 0.0329, "step": 177320 }, { "epoch": 1.14, "learning_rate": 0.00012832054318852177, "loss": 0.0337, "step": 177330 }, { "epoch": 1.14, "learning_rate": 0.00012831086183416485, "loss": 0.0372, "step": 177340 }, { "epoch": 1.14, "learning_rate": 0.0001283011804798079, "loss": 0.0365, "step": 177350 }, { "epoch": 1.14, "learning_rate": 0.00012829149912545098, "loss": 0.0384, "step": 177360 }, { "epoch": 1.14, "learning_rate": 0.00012828181777109406, "loss": 0.0342, "step": 177370 }, { "epoch": 1.14, "learning_rate": 0.0001282721364167371, "loss": 0.0329, "step": 177380 }, { "epoch": 1.14, "learning_rate": 0.00012826245506238017, "loss": 0.0372, "step": 177390 }, { "epoch": 1.14, "learning_rate": 0.00012825277370802325, "loss": 0.0352, "step": 177400 }, { "epoch": 1.15, "learning_rate": 0.00012824309235366633, "loss": 0.032, "step": 177410 }, { "epoch": 1.15, "learning_rate": 0.00012823341099930938, "loss": 0.0348, "step": 177420 }, { "epoch": 1.15, "learning_rate": 0.00012822372964495246, "loss": 0.0362, "step": 177430 }, { "epoch": 1.15, "learning_rate": 0.0001282140482905955, "loss": 0.037, "step": 177440 }, { "epoch": 1.15, "learning_rate": 0.0001282043669362386, "loss": 0.0324, "step": 177450 }, { "epoch": 1.15, "learning_rate": 0.00012819468558188164, "loss": 0.0394, "step": 177460 }, { "epoch": 1.15, "learning_rate": 0.00012818500422752472, "loss": 0.0372, "step": 177470 }, { "epoch": 1.15, "learning_rate": 0.0001281753228731678, "loss": 0.0323, "step": 177480 }, { "epoch": 1.15, "learning_rate": 0.00012816564151881086, "loss": 0.0381, "step": 177490 }, { "epoch": 1.15, "learning_rate": 0.00012815596016445394, "loss": 0.0325, "step": 177500 }, { "epoch": 1.15, "learning_rate": 0.000128146278810097, "loss": 0.0305, "step": 177510 }, { "epoch": 1.15, "learning_rate": 0.00012813659745574007, "loss": 0.0347, "step": 177520 }, { "epoch": 1.15, "learning_rate": 0.00012812691610138312, "loss": 0.0359, "step": 177530 }, { "epoch": 1.15, "learning_rate": 0.0001281172347470262, "loss": 0.0386, "step": 177540 }, { "epoch": 1.15, "learning_rate": 0.00012810755339266928, "loss": 0.0299, "step": 177550 }, { "epoch": 1.15, "learning_rate": 0.00012809787203831233, "loss": 0.0352, "step": 177560 }, { "epoch": 1.15, "learning_rate": 0.0001280881906839554, "loss": 0.0324, "step": 177570 }, { "epoch": 1.15, "learning_rate": 0.00012807850932959846, "loss": 0.0313, "step": 177580 }, { "epoch": 1.15, "learning_rate": 0.00012806882797524154, "loss": 0.0329, "step": 177590 }, { "epoch": 1.15, "learning_rate": 0.0001280591466208846, "loss": 0.0272, "step": 177600 }, { "epoch": 1.15, "learning_rate": 0.00012804946526652768, "loss": 0.0341, "step": 177610 }, { "epoch": 1.15, "learning_rate": 0.00012803978391217076, "loss": 0.0311, "step": 177620 }, { "epoch": 1.15, "learning_rate": 0.0001280301025578138, "loss": 0.0342, "step": 177630 }, { "epoch": 1.15, "learning_rate": 0.00012802042120345686, "loss": 0.0311, "step": 177640 }, { "epoch": 1.15, "learning_rate": 0.00012801073984909994, "loss": 0.0262, "step": 177650 }, { "epoch": 1.15, "learning_rate": 0.00012800105849474302, "loss": 0.0367, "step": 177660 }, { "epoch": 1.15, "learning_rate": 0.00012799137714038607, "loss": 0.0326, "step": 177670 }, { "epoch": 1.15, "learning_rate": 0.00012798169578602915, "loss": 0.0305, "step": 177680 }, { "epoch": 1.15, "learning_rate": 0.0001279720144316722, "loss": 0.0318, "step": 177690 }, { "epoch": 1.15, "learning_rate": 0.0001279623330773153, "loss": 0.0381, "step": 177700 }, { "epoch": 1.15, "learning_rate": 0.00012795265172295834, "loss": 0.0337, "step": 177710 }, { "epoch": 1.15, "learning_rate": 0.00012794297036860142, "loss": 0.0315, "step": 177720 }, { "epoch": 1.15, "learning_rate": 0.0001279332890142445, "loss": 0.0326, "step": 177730 }, { "epoch": 1.15, "learning_rate": 0.00012792360765988755, "loss": 0.0327, "step": 177740 }, { "epoch": 1.15, "learning_rate": 0.00012791392630553063, "loss": 0.0303, "step": 177750 }, { "epoch": 1.15, "learning_rate": 0.00012790424495117368, "loss": 0.0285, "step": 177760 }, { "epoch": 1.15, "learning_rate": 0.00012789456359681676, "loss": 0.0361, "step": 177770 }, { "epoch": 1.15, "learning_rate": 0.00012788488224245982, "loss": 0.0323, "step": 177780 }, { "epoch": 1.15, "learning_rate": 0.0001278752008881029, "loss": 0.031, "step": 177790 }, { "epoch": 1.15, "learning_rate": 0.00012786551953374598, "loss": 0.033, "step": 177800 }, { "epoch": 1.15, "learning_rate": 0.00012785583817938903, "loss": 0.028, "step": 177810 }, { "epoch": 1.15, "learning_rate": 0.0001278461568250321, "loss": 0.0314, "step": 177820 }, { "epoch": 1.15, "learning_rate": 0.00012783647547067516, "loss": 0.0338, "step": 177830 }, { "epoch": 1.15, "learning_rate": 0.00012782679411631821, "loss": 0.0291, "step": 177840 }, { "epoch": 1.15, "learning_rate": 0.0001278171127619613, "loss": 0.0365, "step": 177850 }, { "epoch": 1.15, "learning_rate": 0.00012780743140760437, "loss": 0.0289, "step": 177860 }, { "epoch": 1.15, "learning_rate": 0.00012779775005324745, "loss": 0.0321, "step": 177870 }, { "epoch": 1.15, "learning_rate": 0.0001277880686988905, "loss": 0.0279, "step": 177880 }, { "epoch": 1.15, "learning_rate": 0.00012777838734453359, "loss": 0.0286, "step": 177890 }, { "epoch": 1.15, "learning_rate": 0.00012776870599017664, "loss": 0.0367, "step": 177900 }, { "epoch": 1.15, "learning_rate": 0.0001277590246358197, "loss": 0.0289, "step": 177910 }, { "epoch": 1.15, "learning_rate": 0.00012774934328146277, "loss": 0.0301, "step": 177920 }, { "epoch": 1.15, "learning_rate": 0.00012773966192710585, "loss": 0.0305, "step": 177930 }, { "epoch": 1.15, "learning_rate": 0.00012772998057274893, "loss": 0.0358, "step": 177940 }, { "epoch": 1.15, "learning_rate": 0.00012772029921839198, "loss": 0.0363, "step": 177950 }, { "epoch": 1.15, "learning_rate": 0.00012771061786403504, "loss": 0.0273, "step": 177960 }, { "epoch": 1.15, "learning_rate": 0.00012770093650967812, "loss": 0.0303, "step": 177970 }, { "epoch": 1.15, "learning_rate": 0.00012769125515532117, "loss": 0.0346, "step": 177980 }, { "epoch": 1.15, "learning_rate": 0.00012768157380096425, "loss": 0.0322, "step": 177990 }, { "epoch": 1.15, "learning_rate": 0.00012767189244660733, "loss": 0.0295, "step": 178000 }, { "epoch": 1.15, "eval_cer": 0.9198888261213423, "eval_loss": 0.02403685823082924, "eval_runtime": 120.1071, "eval_samples_per_second": 16.652, "eval_steps_per_second": 4.163, "step": 178000 }, { "epoch": 1.15, "learning_rate": 0.00012766221109225038, "loss": 0.0355, "step": 178010 }, { "epoch": 1.15, "learning_rate": 0.00012765252973789346, "loss": 0.0298, "step": 178020 }, { "epoch": 1.15, "learning_rate": 0.0001276428483835365, "loss": 0.0328, "step": 178030 }, { "epoch": 1.15, "learning_rate": 0.0001276331670291796, "loss": 0.0325, "step": 178040 }, { "epoch": 1.15, "learning_rate": 0.00012762348567482265, "loss": 0.0347, "step": 178050 }, { "epoch": 1.15, "learning_rate": 0.00012761380432046573, "loss": 0.0248, "step": 178060 }, { "epoch": 1.15, "learning_rate": 0.0001276041229661088, "loss": 0.0347, "step": 178070 }, { "epoch": 1.15, "learning_rate": 0.00012759444161175186, "loss": 0.0365, "step": 178080 }, { "epoch": 1.15, "learning_rate": 0.00012758476025739494, "loss": 0.0323, "step": 178090 }, { "epoch": 1.15, "learning_rate": 0.000127575078903038, "loss": 0.0311, "step": 178100 }, { "epoch": 1.15, "learning_rate": 0.00012756539754868107, "loss": 0.0311, "step": 178110 }, { "epoch": 1.15, "learning_rate": 0.00012755571619432412, "loss": 0.0334, "step": 178120 }, { "epoch": 1.15, "learning_rate": 0.0001275460348399672, "loss": 0.0345, "step": 178130 }, { "epoch": 1.15, "learning_rate": 0.00012753635348561028, "loss": 0.0382, "step": 178140 }, { "epoch": 1.15, "learning_rate": 0.00012752667213125334, "loss": 0.0345, "step": 178150 }, { "epoch": 1.15, "learning_rate": 0.0001275169907768964, "loss": 0.0327, "step": 178160 }, { "epoch": 1.15, "learning_rate": 0.00012750730942253947, "loss": 0.033, "step": 178170 }, { "epoch": 1.15, "learning_rate": 0.00012749762806818255, "loss": 0.0279, "step": 178180 }, { "epoch": 1.15, "learning_rate": 0.0001274879467138256, "loss": 0.0326, "step": 178190 }, { "epoch": 1.15, "learning_rate": 0.00012747826535946868, "loss": 0.0272, "step": 178200 }, { "epoch": 1.15, "learning_rate": 0.00012746858400511173, "loss": 0.0344, "step": 178210 }, { "epoch": 1.15, "learning_rate": 0.0001274589026507548, "loss": 0.0405, "step": 178220 }, { "epoch": 1.15, "learning_rate": 0.00012744922129639787, "loss": 0.0308, "step": 178230 }, { "epoch": 1.15, "learning_rate": 0.00012743953994204095, "loss": 0.0302, "step": 178240 }, { "epoch": 1.15, "learning_rate": 0.00012742985858768402, "loss": 0.0345, "step": 178250 }, { "epoch": 1.15, "learning_rate": 0.00012742017723332708, "loss": 0.0335, "step": 178260 }, { "epoch": 1.15, "learning_rate": 0.00012741049587897016, "loss": 0.0405, "step": 178270 }, { "epoch": 1.15, "learning_rate": 0.0001274008145246132, "loss": 0.0344, "step": 178280 }, { "epoch": 1.15, "learning_rate": 0.0001273911331702563, "loss": 0.0325, "step": 178290 }, { "epoch": 1.15, "learning_rate": 0.00012738145181589934, "loss": 0.0311, "step": 178300 }, { "epoch": 1.15, "learning_rate": 0.00012737177046154242, "loss": 0.035, "step": 178310 }, { "epoch": 1.15, "learning_rate": 0.0001273620891071855, "loss": 0.0317, "step": 178320 }, { "epoch": 1.15, "learning_rate": 0.00012735240775282855, "loss": 0.0364, "step": 178330 }, { "epoch": 1.15, "learning_rate": 0.00012734272639847163, "loss": 0.0356, "step": 178340 }, { "epoch": 1.15, "learning_rate": 0.0001273330450441147, "loss": 0.0357, "step": 178350 }, { "epoch": 1.15, "learning_rate": 0.00012732336368975777, "loss": 0.0339, "step": 178360 }, { "epoch": 1.15, "learning_rate": 0.00012731368233540082, "loss": 0.0346, "step": 178370 }, { "epoch": 1.15, "learning_rate": 0.0001273040009810439, "loss": 0.0333, "step": 178380 }, { "epoch": 1.15, "learning_rate": 0.00012729431962668698, "loss": 0.039, "step": 178390 }, { "epoch": 1.15, "learning_rate": 0.00012728463827233003, "loss": 0.0374, "step": 178400 }, { "epoch": 1.15, "learning_rate": 0.00012727495691797308, "loss": 0.03, "step": 178410 }, { "epoch": 1.15, "learning_rate": 0.00012726527556361616, "loss": 0.0338, "step": 178420 }, { "epoch": 1.15, "learning_rate": 0.00012725559420925924, "loss": 0.0292, "step": 178430 }, { "epoch": 1.15, "learning_rate": 0.0001272459128549023, "loss": 0.0315, "step": 178440 }, { "epoch": 1.15, "learning_rate": 0.00012723623150054538, "loss": 0.0375, "step": 178450 }, { "epoch": 1.15, "learning_rate": 0.00012722655014618846, "loss": 0.0349, "step": 178460 }, { "epoch": 1.15, "learning_rate": 0.0001272168687918315, "loss": 0.0293, "step": 178470 }, { "epoch": 1.15, "learning_rate": 0.00012720718743747456, "loss": 0.0345, "step": 178480 }, { "epoch": 1.15, "learning_rate": 0.00012719750608311764, "loss": 0.03, "step": 178490 }, { "epoch": 1.15, "learning_rate": 0.00012718782472876072, "loss": 0.0304, "step": 178500 }, { "epoch": 1.15, "learning_rate": 0.00012717814337440377, "loss": 0.0341, "step": 178510 }, { "epoch": 1.15, "learning_rate": 0.00012716846202004685, "loss": 0.0319, "step": 178520 }, { "epoch": 1.15, "learning_rate": 0.0001271587806656899, "loss": 0.0356, "step": 178530 }, { "epoch": 1.15, "learning_rate": 0.000127149099311333, "loss": 0.0416, "step": 178540 }, { "epoch": 1.15, "learning_rate": 0.00012713941795697604, "loss": 0.0327, "step": 178550 }, { "epoch": 1.15, "learning_rate": 0.00012712973660261912, "loss": 0.0272, "step": 178560 }, { "epoch": 1.15, "learning_rate": 0.0001271200552482622, "loss": 0.0369, "step": 178570 }, { "epoch": 1.15, "learning_rate": 0.00012711037389390525, "loss": 0.0346, "step": 178580 }, { "epoch": 1.15, "learning_rate": 0.00012710069253954833, "loss": 0.0354, "step": 178590 }, { "epoch": 1.15, "learning_rate": 0.00012709101118519138, "loss": 0.0399, "step": 178600 }, { "epoch": 1.15, "learning_rate": 0.00012708132983083444, "loss": 0.0325, "step": 178610 }, { "epoch": 1.15, "learning_rate": 0.00012707164847647752, "loss": 0.0352, "step": 178620 }, { "epoch": 1.15, "learning_rate": 0.0001270619671221206, "loss": 0.0325, "step": 178630 }, { "epoch": 1.15, "learning_rate": 0.00012705228576776368, "loss": 0.0342, "step": 178640 }, { "epoch": 1.15, "learning_rate": 0.00012704260441340673, "loss": 0.0313, "step": 178650 }, { "epoch": 1.15, "learning_rate": 0.0001270329230590498, "loss": 0.0369, "step": 178660 }, { "epoch": 1.15, "learning_rate": 0.00012702324170469286, "loss": 0.036, "step": 178670 }, { "epoch": 1.15, "learning_rate": 0.00012701356035033591, "loss": 0.0286, "step": 178680 }, { "epoch": 1.15, "learning_rate": 0.000127003878995979, "loss": 0.0347, "step": 178690 }, { "epoch": 1.15, "learning_rate": 0.00012699419764162207, "loss": 0.0338, "step": 178700 }, { "epoch": 1.15, "learning_rate": 0.00012698451628726515, "loss": 0.0352, "step": 178710 }, { "epoch": 1.15, "learning_rate": 0.0001269748349329082, "loss": 0.034, "step": 178720 }, { "epoch": 1.15, "learning_rate": 0.00012696515357855126, "loss": 0.0304, "step": 178730 }, { "epoch": 1.15, "learning_rate": 0.00012695547222419434, "loss": 0.0413, "step": 178740 }, { "epoch": 1.15, "learning_rate": 0.0001269457908698374, "loss": 0.033, "step": 178750 }, { "epoch": 1.15, "learning_rate": 0.00012693610951548047, "loss": 0.0334, "step": 178760 }, { "epoch": 1.15, "learning_rate": 0.00012692642816112355, "loss": 0.034, "step": 178770 }, { "epoch": 1.15, "learning_rate": 0.00012691674680676663, "loss": 0.0293, "step": 178780 }, { "epoch": 1.15, "learning_rate": 0.00012690706545240968, "loss": 0.0312, "step": 178790 }, { "epoch": 1.15, "learning_rate": 0.00012689738409805274, "loss": 0.0288, "step": 178800 }, { "epoch": 1.15, "learning_rate": 0.00012688770274369582, "loss": 0.0327, "step": 178810 }, { "epoch": 1.15, "learning_rate": 0.00012687802138933887, "loss": 0.0316, "step": 178820 }, { "epoch": 1.15, "learning_rate": 0.00012686834003498195, "loss": 0.0347, "step": 178830 }, { "epoch": 1.15, "learning_rate": 0.00012685865868062503, "loss": 0.0337, "step": 178840 }, { "epoch": 1.15, "learning_rate": 0.00012684897732626808, "loss": 0.0276, "step": 178850 }, { "epoch": 1.15, "learning_rate": 0.00012683929597191116, "loss": 0.0339, "step": 178860 }, { "epoch": 1.15, "learning_rate": 0.0001268296146175542, "loss": 0.0312, "step": 178870 }, { "epoch": 1.15, "learning_rate": 0.0001268199332631973, "loss": 0.0261, "step": 178880 }, { "epoch": 1.15, "learning_rate": 0.00012681025190884035, "loss": 0.0316, "step": 178890 }, { "epoch": 1.15, "learning_rate": 0.00012680057055448343, "loss": 0.0291, "step": 178900 }, { "epoch": 1.15, "learning_rate": 0.0001267908892001265, "loss": 0.0307, "step": 178910 }, { "epoch": 1.15, "learning_rate": 0.00012678120784576956, "loss": 0.0325, "step": 178920 }, { "epoch": 1.15, "learning_rate": 0.0001267715264914126, "loss": 0.0375, "step": 178930 }, { "epoch": 1.15, "learning_rate": 0.0001267618451370557, "loss": 0.038, "step": 178940 }, { "epoch": 1.15, "learning_rate": 0.00012675216378269877, "loss": 0.0323, "step": 178950 }, { "epoch": 1.16, "learning_rate": 0.00012674248242834182, "loss": 0.0321, "step": 178960 }, { "epoch": 1.16, "learning_rate": 0.0001267328010739849, "loss": 0.0334, "step": 178970 }, { "epoch": 1.16, "learning_rate": 0.00012672311971962798, "loss": 0.0335, "step": 178980 }, { "epoch": 1.16, "learning_rate": 0.00012671343836527104, "loss": 0.0333, "step": 178990 }, { "epoch": 1.16, "learning_rate": 0.0001267037570109141, "loss": 0.0288, "step": 179000 }, { "epoch": 1.16, "eval_cer": 0.9199475765450231, "eval_loss": 0.023168489336967468, "eval_runtime": 120.4946, "eval_samples_per_second": 16.598, "eval_steps_per_second": 4.15, "step": 179000 }, { "epoch": 1.16, "learning_rate": 0.00012669407565655717, "loss": 0.0343, "step": 179010 }, { "epoch": 1.16, "learning_rate": 0.00012668439430220025, "loss": 0.0291, "step": 179020 }, { "epoch": 1.16, "learning_rate": 0.0001266747129478433, "loss": 0.0318, "step": 179030 }, { "epoch": 1.16, "learning_rate": 0.00012666503159348638, "loss": 0.0302, "step": 179040 }, { "epoch": 1.16, "learning_rate": 0.00012665535023912943, "loss": 0.0339, "step": 179050 }, { "epoch": 1.16, "learning_rate": 0.0001266456688847725, "loss": 0.0305, "step": 179060 }, { "epoch": 1.16, "learning_rate": 0.00012663598753041556, "loss": 0.0303, "step": 179070 }, { "epoch": 1.16, "learning_rate": 0.00012662630617605864, "loss": 0.0334, "step": 179080 }, { "epoch": 1.16, "learning_rate": 0.00012661662482170172, "loss": 0.0333, "step": 179090 }, { "epoch": 1.16, "learning_rate": 0.00012660694346734478, "loss": 0.0271, "step": 179100 }, { "epoch": 1.16, "learning_rate": 0.00012659726211298786, "loss": 0.0307, "step": 179110 }, { "epoch": 1.16, "learning_rate": 0.0001265875807586309, "loss": 0.0302, "step": 179120 }, { "epoch": 1.16, "learning_rate": 0.000126577899404274, "loss": 0.0338, "step": 179130 }, { "epoch": 1.16, "learning_rate": 0.00012656821804991704, "loss": 0.0276, "step": 179140 }, { "epoch": 1.16, "learning_rate": 0.00012655853669556012, "loss": 0.0359, "step": 179150 }, { "epoch": 1.16, "learning_rate": 0.0001265488553412032, "loss": 0.0343, "step": 179160 }, { "epoch": 1.16, "learning_rate": 0.00012653917398684625, "loss": 0.0316, "step": 179170 }, { "epoch": 1.16, "learning_rate": 0.00012652949263248933, "loss": 0.0292, "step": 179180 }, { "epoch": 1.16, "learning_rate": 0.0001265198112781324, "loss": 0.0391, "step": 179190 }, { "epoch": 1.16, "learning_rate": 0.00012651012992377547, "loss": 0.0359, "step": 179200 }, { "epoch": 1.16, "learning_rate": 0.00012650044856941852, "loss": 0.0342, "step": 179210 }, { "epoch": 1.16, "learning_rate": 0.0001264907672150616, "loss": 0.033, "step": 179220 }, { "epoch": 1.16, "learning_rate": 0.00012648108586070468, "loss": 0.0364, "step": 179230 }, { "epoch": 1.16, "learning_rate": 0.00012647140450634773, "loss": 0.0326, "step": 179240 }, { "epoch": 1.16, "learning_rate": 0.00012646172315199078, "loss": 0.0348, "step": 179250 }, { "epoch": 1.16, "learning_rate": 0.00012645204179763386, "loss": 0.0336, "step": 179260 }, { "epoch": 1.16, "learning_rate": 0.00012644236044327694, "loss": 0.036, "step": 179270 }, { "epoch": 1.16, "learning_rate": 0.00012643267908892, "loss": 0.0283, "step": 179280 }, { "epoch": 1.16, "learning_rate": 0.00012642299773456308, "loss": 0.0382, "step": 179290 }, { "epoch": 1.16, "learning_rate": 0.00012641331638020613, "loss": 0.0318, "step": 179300 }, { "epoch": 1.16, "learning_rate": 0.0001264036350258492, "loss": 0.0365, "step": 179310 }, { "epoch": 1.16, "learning_rate": 0.00012639395367149226, "loss": 0.0293, "step": 179320 }, { "epoch": 1.16, "learning_rate": 0.00012638427231713534, "loss": 0.0368, "step": 179330 }, { "epoch": 1.16, "learning_rate": 0.00012637459096277842, "loss": 0.0306, "step": 179340 }, { "epoch": 1.16, "learning_rate": 0.00012636490960842147, "loss": 0.0303, "step": 179350 }, { "epoch": 1.16, "learning_rate": 0.00012635522825406455, "loss": 0.0296, "step": 179360 }, { "epoch": 1.16, "learning_rate": 0.0001263455468997076, "loss": 0.0362, "step": 179370 }, { "epoch": 1.16, "learning_rate": 0.00012633586554535069, "loss": 0.0345, "step": 179380 }, { "epoch": 1.16, "learning_rate": 0.00012632618419099374, "loss": 0.0306, "step": 179390 }, { "epoch": 1.16, "learning_rate": 0.00012631650283663682, "loss": 0.0333, "step": 179400 }, { "epoch": 1.16, "learning_rate": 0.0001263068214822799, "loss": 0.0316, "step": 179410 }, { "epoch": 1.16, "learning_rate": 0.00012629714012792295, "loss": 0.0304, "step": 179420 }, { "epoch": 1.16, "learning_rate": 0.00012628745877356603, "loss": 0.0318, "step": 179430 }, { "epoch": 1.16, "learning_rate": 0.00012627777741920908, "loss": 0.0317, "step": 179440 }, { "epoch": 1.16, "learning_rate": 0.00012626809606485214, "loss": 0.0359, "step": 179450 }, { "epoch": 1.16, "learning_rate": 0.00012625841471049522, "loss": 0.0343, "step": 179460 }, { "epoch": 1.16, "learning_rate": 0.0001262487333561383, "loss": 0.0366, "step": 179470 }, { "epoch": 1.16, "learning_rate": 0.00012623905200178138, "loss": 0.0307, "step": 179480 }, { "epoch": 1.16, "learning_rate": 0.00012622937064742443, "loss": 0.0361, "step": 179490 }, { "epoch": 1.16, "learning_rate": 0.00012621968929306748, "loss": 0.0324, "step": 179500 }, { "epoch": 1.16, "learning_rate": 0.00012621000793871056, "loss": 0.035, "step": 179510 }, { "epoch": 1.16, "learning_rate": 0.0001262003265843536, "loss": 0.0405, "step": 179520 }, { "epoch": 1.16, "learning_rate": 0.0001261906452299967, "loss": 0.0441, "step": 179530 }, { "epoch": 1.16, "learning_rate": 0.00012618096387563977, "loss": 0.0379, "step": 179540 }, { "epoch": 1.16, "learning_rate": 0.00012617128252128285, "loss": 0.031, "step": 179550 }, { "epoch": 1.16, "learning_rate": 0.0001261616011669259, "loss": 0.0281, "step": 179560 }, { "epoch": 1.16, "learning_rate": 0.00012615191981256896, "loss": 0.0274, "step": 179570 }, { "epoch": 1.16, "learning_rate": 0.00012614223845821204, "loss": 0.0312, "step": 179580 }, { "epoch": 1.16, "learning_rate": 0.0001261325571038551, "loss": 0.0372, "step": 179590 }, { "epoch": 1.16, "learning_rate": 0.00012612287574949817, "loss": 0.0311, "step": 179600 }, { "epoch": 1.16, "learning_rate": 0.00012611319439514125, "loss": 0.0317, "step": 179610 }, { "epoch": 1.16, "learning_rate": 0.0001261035130407843, "loss": 0.0286, "step": 179620 }, { "epoch": 1.16, "learning_rate": 0.00012609383168642738, "loss": 0.0376, "step": 179630 }, { "epoch": 1.16, "learning_rate": 0.00012608415033207044, "loss": 0.0339, "step": 179640 }, { "epoch": 1.16, "learning_rate": 0.00012607446897771352, "loss": 0.0324, "step": 179650 }, { "epoch": 1.16, "learning_rate": 0.00012606478762335657, "loss": 0.0346, "step": 179660 }, { "epoch": 1.16, "learning_rate": 0.00012605510626899965, "loss": 0.0366, "step": 179670 }, { "epoch": 1.16, "learning_rate": 0.00012604542491464273, "loss": 0.0291, "step": 179680 }, { "epoch": 1.16, "learning_rate": 0.00012603574356028578, "loss": 0.0303, "step": 179690 }, { "epoch": 1.16, "learning_rate": 0.00012602606220592883, "loss": 0.0351, "step": 179700 }, { "epoch": 1.16, "learning_rate": 0.0001260163808515719, "loss": 0.0298, "step": 179710 }, { "epoch": 1.16, "learning_rate": 0.000126006699497215, "loss": 0.0374, "step": 179720 }, { "epoch": 1.16, "learning_rate": 0.00012599701814285805, "loss": 0.0258, "step": 179730 }, { "epoch": 1.16, "learning_rate": 0.00012598733678850112, "loss": 0.0305, "step": 179740 }, { "epoch": 1.16, "learning_rate": 0.0001259776554341442, "loss": 0.0374, "step": 179750 }, { "epoch": 1.16, "learning_rate": 0.00012596797407978726, "loss": 0.0385, "step": 179760 }, { "epoch": 1.16, "learning_rate": 0.0001259582927254303, "loss": 0.039, "step": 179770 }, { "epoch": 1.16, "learning_rate": 0.0001259486113710734, "loss": 0.0348, "step": 179780 }, { "epoch": 1.16, "learning_rate": 0.00012593893001671647, "loss": 0.0336, "step": 179790 }, { "epoch": 1.16, "learning_rate": 0.00012592924866235952, "loss": 0.0302, "step": 179800 }, { "epoch": 1.16, "learning_rate": 0.0001259195673080026, "loss": 0.0297, "step": 179810 }, { "epoch": 1.16, "learning_rate": 0.00012590988595364565, "loss": 0.0305, "step": 179820 }, { "epoch": 1.16, "learning_rate": 0.00012590020459928873, "loss": 0.0394, "step": 179830 }, { "epoch": 1.16, "learning_rate": 0.0001258905232449318, "loss": 0.0309, "step": 179840 }, { "epoch": 1.16, "learning_rate": 0.00012588084189057487, "loss": 0.0342, "step": 179850 }, { "epoch": 1.16, "learning_rate": 0.00012587116053621795, "loss": 0.0303, "step": 179860 }, { "epoch": 1.16, "learning_rate": 0.000125861479181861, "loss": 0.0337, "step": 179870 }, { "epoch": 1.16, "learning_rate": 0.00012585179782750408, "loss": 0.0285, "step": 179880 }, { "epoch": 1.16, "learning_rate": 0.00012584211647314713, "loss": 0.0342, "step": 179890 }, { "epoch": 1.16, "learning_rate": 0.0001258324351187902, "loss": 0.0282, "step": 179900 }, { "epoch": 1.16, "learning_rate": 0.00012582275376443326, "loss": 0.0333, "step": 179910 }, { "epoch": 1.16, "learning_rate": 0.00012581307241007634, "loss": 0.0336, "step": 179920 }, { "epoch": 1.16, "learning_rate": 0.00012580339105571942, "loss": 0.0346, "step": 179930 }, { "epoch": 1.16, "learning_rate": 0.00012579370970136248, "loss": 0.0358, "step": 179940 }, { "epoch": 1.16, "learning_rate": 0.00012578402834700556, "loss": 0.032, "step": 179950 }, { "epoch": 1.16, "learning_rate": 0.0001257743469926486, "loss": 0.0328, "step": 179960 }, { "epoch": 1.16, "learning_rate": 0.0001257646656382917, "loss": 0.0302, "step": 179970 }, { "epoch": 1.16, "learning_rate": 0.00012575498428393474, "loss": 0.0298, "step": 179980 }, { "epoch": 1.16, "learning_rate": 0.00012574530292957782, "loss": 0.0314, "step": 179990 }, { "epoch": 1.16, "learning_rate": 0.0001257356215752209, "loss": 0.0347, "step": 180000 }, { "epoch": 1.16, "eval_cer": 0.91986984521523, "eval_loss": 0.023445699363946915, "eval_runtime": 120.1491, "eval_samples_per_second": 16.646, "eval_steps_per_second": 4.161, "step": 180000 }, { "epoch": 1.16, "learning_rate": 0.00012572594022086395, "loss": 0.0369, "step": 180010 }, { "epoch": 1.16, "learning_rate": 0.000125716258866507, "loss": 0.0321, "step": 180020 }, { "epoch": 1.16, "learning_rate": 0.0001257065775121501, "loss": 0.0381, "step": 180030 }, { "epoch": 1.16, "learning_rate": 0.00012569689615779317, "loss": 0.0293, "step": 180040 }, { "epoch": 1.16, "learning_rate": 0.00012568721480343622, "loss": 0.0329, "step": 180050 }, { "epoch": 1.16, "learning_rate": 0.0001256775334490793, "loss": 0.0317, "step": 180060 }, { "epoch": 1.16, "learning_rate": 0.00012566785209472238, "loss": 0.0315, "step": 180070 }, { "epoch": 1.16, "learning_rate": 0.00012565817074036543, "loss": 0.0343, "step": 180080 }, { "epoch": 1.16, "learning_rate": 0.00012564848938600848, "loss": 0.0353, "step": 180090 }, { "epoch": 1.16, "learning_rate": 0.00012563880803165156, "loss": 0.0315, "step": 180100 }, { "epoch": 1.16, "learning_rate": 0.00012562912667729464, "loss": 0.0347, "step": 180110 }, { "epoch": 1.16, "learning_rate": 0.0001256194453229377, "loss": 0.0293, "step": 180120 }, { "epoch": 1.16, "learning_rate": 0.00012560976396858078, "loss": 0.0307, "step": 180130 }, { "epoch": 1.16, "learning_rate": 0.00012560008261422383, "loss": 0.0324, "step": 180140 }, { "epoch": 1.16, "learning_rate": 0.0001255904012598669, "loss": 0.036, "step": 180150 }, { "epoch": 1.16, "learning_rate": 0.00012558071990550996, "loss": 0.0346, "step": 180160 }, { "epoch": 1.16, "learning_rate": 0.00012557103855115304, "loss": 0.0372, "step": 180170 }, { "epoch": 1.16, "learning_rate": 0.00012556135719679612, "loss": 0.036, "step": 180180 }, { "epoch": 1.16, "learning_rate": 0.00012555167584243917, "loss": 0.0353, "step": 180190 }, { "epoch": 1.16, "learning_rate": 0.00012554199448808225, "loss": 0.0279, "step": 180200 }, { "epoch": 1.16, "learning_rate": 0.0001255323131337253, "loss": 0.0296, "step": 180210 }, { "epoch": 1.16, "learning_rate": 0.00012552263177936836, "loss": 0.0374, "step": 180220 }, { "epoch": 1.16, "learning_rate": 0.00012551295042501144, "loss": 0.0308, "step": 180230 }, { "epoch": 1.16, "learning_rate": 0.00012550326907065452, "loss": 0.0323, "step": 180240 }, { "epoch": 1.16, "learning_rate": 0.0001254935877162976, "loss": 0.0335, "step": 180250 }, { "epoch": 1.16, "learning_rate": 0.00012548390636194065, "loss": 0.037, "step": 180260 }, { "epoch": 1.16, "learning_rate": 0.00012547422500758373, "loss": 0.0328, "step": 180270 }, { "epoch": 1.16, "learning_rate": 0.00012546454365322678, "loss": 0.0342, "step": 180280 }, { "epoch": 1.16, "learning_rate": 0.00012545486229886984, "loss": 0.0323, "step": 180290 }, { "epoch": 1.16, "learning_rate": 0.00012544518094451292, "loss": 0.0323, "step": 180300 }, { "epoch": 1.16, "learning_rate": 0.000125435499590156, "loss": 0.0295, "step": 180310 }, { "epoch": 1.16, "learning_rate": 0.00012542581823579908, "loss": 0.0319, "step": 180320 }, { "epoch": 1.16, "learning_rate": 0.00012541613688144213, "loss": 0.0383, "step": 180330 }, { "epoch": 1.16, "learning_rate": 0.00012540645552708518, "loss": 0.0332, "step": 180340 }, { "epoch": 1.16, "learning_rate": 0.00012539677417272826, "loss": 0.0291, "step": 180350 }, { "epoch": 1.16, "learning_rate": 0.0001253870928183713, "loss": 0.0367, "step": 180360 }, { "epoch": 1.16, "learning_rate": 0.0001253774114640144, "loss": 0.0302, "step": 180370 }, { "epoch": 1.16, "learning_rate": 0.00012536773010965747, "loss": 0.0335, "step": 180380 }, { "epoch": 1.16, "learning_rate": 0.00012535804875530053, "loss": 0.0343, "step": 180390 }, { "epoch": 1.16, "learning_rate": 0.0001253483674009436, "loss": 0.0345, "step": 180400 }, { "epoch": 1.16, "learning_rate": 0.00012533868604658666, "loss": 0.0305, "step": 180410 }, { "epoch": 1.16, "learning_rate": 0.00012532900469222974, "loss": 0.0329, "step": 180420 }, { "epoch": 1.16, "learning_rate": 0.0001253193233378728, "loss": 0.0403, "step": 180430 }, { "epoch": 1.16, "learning_rate": 0.00012530964198351587, "loss": 0.0335, "step": 180440 }, { "epoch": 1.16, "learning_rate": 0.00012529996062915895, "loss": 0.031, "step": 180450 }, { "epoch": 1.16, "learning_rate": 0.000125290279274802, "loss": 0.032, "step": 180460 }, { "epoch": 1.16, "learning_rate": 0.00012528059792044508, "loss": 0.0373, "step": 180470 }, { "epoch": 1.16, "learning_rate": 0.00012527091656608814, "loss": 0.0295, "step": 180480 }, { "epoch": 1.16, "learning_rate": 0.00012526123521173121, "loss": 0.0334, "step": 180490 }, { "epoch": 1.16, "learning_rate": 0.00012525155385737427, "loss": 0.0334, "step": 180500 }, { "epoch": 1.17, "learning_rate": 0.00012524187250301735, "loss": 0.0289, "step": 180510 }, { "epoch": 1.17, "learning_rate": 0.00012523219114866043, "loss": 0.0369, "step": 180520 }, { "epoch": 1.17, "learning_rate": 0.00012522250979430348, "loss": 0.0345, "step": 180530 }, { "epoch": 1.17, "learning_rate": 0.00012521282843994653, "loss": 0.0291, "step": 180540 }, { "epoch": 1.17, "learning_rate": 0.0001252031470855896, "loss": 0.0367, "step": 180550 }, { "epoch": 1.17, "learning_rate": 0.0001251934657312327, "loss": 0.0335, "step": 180560 }, { "epoch": 1.17, "learning_rate": 0.00012518378437687574, "loss": 0.033, "step": 180570 }, { "epoch": 1.17, "learning_rate": 0.00012517410302251882, "loss": 0.0344, "step": 180580 }, { "epoch": 1.17, "learning_rate": 0.00012516442166816188, "loss": 0.0392, "step": 180590 }, { "epoch": 1.17, "learning_rate": 0.00012515474031380496, "loss": 0.043, "step": 180600 }, { "epoch": 1.17, "learning_rate": 0.000125145058959448, "loss": 0.0286, "step": 180610 }, { "epoch": 1.17, "learning_rate": 0.0001251353776050911, "loss": 0.0332, "step": 180620 }, { "epoch": 1.17, "learning_rate": 0.00012512569625073417, "loss": 0.0282, "step": 180630 }, { "epoch": 1.17, "learning_rate": 0.00012511601489637722, "loss": 0.0336, "step": 180640 }, { "epoch": 1.17, "learning_rate": 0.0001251063335420203, "loss": 0.0359, "step": 180650 }, { "epoch": 1.17, "learning_rate": 0.00012509665218766335, "loss": 0.0342, "step": 180660 }, { "epoch": 1.17, "learning_rate": 0.00012508697083330643, "loss": 0.03, "step": 180670 }, { "epoch": 1.17, "learning_rate": 0.0001250772894789495, "loss": 0.0318, "step": 180680 }, { "epoch": 1.17, "learning_rate": 0.00012506760812459257, "loss": 0.0311, "step": 180690 }, { "epoch": 1.17, "learning_rate": 0.00012505792677023565, "loss": 0.0315, "step": 180700 }, { "epoch": 1.17, "learning_rate": 0.0001250482454158787, "loss": 0.0339, "step": 180710 }, { "epoch": 1.17, "learning_rate": 0.00012503856406152178, "loss": 0.0346, "step": 180720 }, { "epoch": 1.17, "learning_rate": 0.00012502888270716483, "loss": 0.0356, "step": 180730 }, { "epoch": 1.17, "learning_rate": 0.0001250192013528079, "loss": 0.0362, "step": 180740 }, { "epoch": 1.17, "learning_rate": 0.00012500951999845096, "loss": 0.0355, "step": 180750 }, { "epoch": 1.17, "learning_rate": 0.00012499983864409404, "loss": 0.0292, "step": 180760 }, { "epoch": 1.17, "learning_rate": 0.00012499015728973712, "loss": 0.0347, "step": 180770 }, { "epoch": 1.17, "learning_rate": 0.00012498047593538018, "loss": 0.0355, "step": 180780 }, { "epoch": 1.17, "learning_rate": 0.00012497079458102323, "loss": 0.0277, "step": 180790 }, { "epoch": 1.17, "learning_rate": 0.0001249611132266663, "loss": 0.0342, "step": 180800 }, { "epoch": 1.17, "learning_rate": 0.00012495143187230936, "loss": 0.0338, "step": 180810 }, { "epoch": 1.17, "learning_rate": 0.00012494175051795244, "loss": 0.0288, "step": 180820 }, { "epoch": 1.17, "learning_rate": 0.00012493206916359552, "loss": 0.0355, "step": 180830 }, { "epoch": 1.17, "learning_rate": 0.0001249223878092386, "loss": 0.0318, "step": 180840 }, { "epoch": 1.17, "learning_rate": 0.00012491270645488165, "loss": 0.0326, "step": 180850 }, { "epoch": 1.17, "learning_rate": 0.0001249030251005247, "loss": 0.029, "step": 180860 }, { "epoch": 1.17, "learning_rate": 0.00012489334374616779, "loss": 0.0317, "step": 180870 }, { "epoch": 1.17, "learning_rate": 0.00012488366239181084, "loss": 0.0332, "step": 180880 }, { "epoch": 1.17, "learning_rate": 0.00012487398103745392, "loss": 0.0326, "step": 180890 }, { "epoch": 1.17, "learning_rate": 0.000124864299683097, "loss": 0.0311, "step": 180900 }, { "epoch": 1.17, "learning_rate": 0.00012485461832874005, "loss": 0.0429, "step": 180910 }, { "epoch": 1.17, "learning_rate": 0.00012484493697438313, "loss": 0.0318, "step": 180920 }, { "epoch": 1.17, "learning_rate": 0.00012483525562002618, "loss": 0.0345, "step": 180930 }, { "epoch": 1.17, "learning_rate": 0.00012482557426566926, "loss": 0.0316, "step": 180940 }, { "epoch": 1.17, "learning_rate": 0.00012481589291131232, "loss": 0.0304, "step": 180950 }, { "epoch": 1.17, "learning_rate": 0.0001248062115569554, "loss": 0.0357, "step": 180960 }, { "epoch": 1.17, "learning_rate": 0.00012479653020259848, "loss": 0.0336, "step": 180970 }, { "epoch": 1.17, "learning_rate": 0.00012478684884824153, "loss": 0.0355, "step": 180980 }, { "epoch": 1.17, "learning_rate": 0.00012477716749388458, "loss": 0.0291, "step": 180990 }, { "epoch": 1.17, "learning_rate": 0.00012476748613952766, "loss": 0.029, "step": 181000 }, { "epoch": 1.17, "eval_cer": 0.9198345949610214, "eval_loss": 0.02338983491063118, "eval_runtime": 120.1574, "eval_samples_per_second": 16.645, "eval_steps_per_second": 4.161, "step": 181000 }, { "epoch": 1.17, "learning_rate": 0.00012475780478517074, "loss": 0.0365, "step": 181010 }, { "epoch": 1.17, "learning_rate": 0.0001247481234308138, "loss": 0.0356, "step": 181020 }, { "epoch": 1.17, "learning_rate": 0.00012473844207645687, "loss": 0.0287, "step": 181030 }, { "epoch": 1.17, "learning_rate": 0.00012472876072209995, "loss": 0.0354, "step": 181040 }, { "epoch": 1.17, "learning_rate": 0.000124719079367743, "loss": 0.0289, "step": 181050 }, { "epoch": 1.17, "learning_rate": 0.00012470939801338606, "loss": 0.0305, "step": 181060 }, { "epoch": 1.17, "learning_rate": 0.00012469971665902914, "loss": 0.028, "step": 181070 }, { "epoch": 1.17, "learning_rate": 0.00012469003530467222, "loss": 0.0341, "step": 181080 }, { "epoch": 1.17, "learning_rate": 0.00012468035395031527, "loss": 0.028, "step": 181090 }, { "epoch": 1.17, "learning_rate": 0.00012467067259595835, "loss": 0.0359, "step": 181100 }, { "epoch": 1.17, "learning_rate": 0.0001246609912416014, "loss": 0.0402, "step": 181110 }, { "epoch": 1.17, "learning_rate": 0.00012465130988724448, "loss": 0.0369, "step": 181120 }, { "epoch": 1.17, "learning_rate": 0.00012464162853288754, "loss": 0.0368, "step": 181130 }, { "epoch": 1.17, "learning_rate": 0.00012463194717853062, "loss": 0.0335, "step": 181140 }, { "epoch": 1.17, "learning_rate": 0.0001246222658241737, "loss": 0.0302, "step": 181150 }, { "epoch": 1.17, "learning_rate": 0.00012461258446981675, "loss": 0.0292, "step": 181160 }, { "epoch": 1.17, "learning_rate": 0.00012460290311545983, "loss": 0.0304, "step": 181170 }, { "epoch": 1.17, "learning_rate": 0.00012459322176110288, "loss": 0.0323, "step": 181180 }, { "epoch": 1.17, "learning_rate": 0.00012458354040674596, "loss": 0.0336, "step": 181190 }, { "epoch": 1.17, "learning_rate": 0.000124573859052389, "loss": 0.0329, "step": 181200 }, { "epoch": 1.17, "learning_rate": 0.0001245641776980321, "loss": 0.0334, "step": 181210 }, { "epoch": 1.17, "learning_rate": 0.00012455449634367517, "loss": 0.0368, "step": 181220 }, { "epoch": 1.17, "learning_rate": 0.00012454481498931822, "loss": 0.0307, "step": 181230 }, { "epoch": 1.17, "learning_rate": 0.0001245351336349613, "loss": 0.0275, "step": 181240 }, { "epoch": 1.17, "learning_rate": 0.00012452545228060436, "loss": 0.0282, "step": 181250 }, { "epoch": 1.17, "learning_rate": 0.00012451577092624744, "loss": 0.0459, "step": 181260 }, { "epoch": 1.17, "learning_rate": 0.0001245060895718905, "loss": 0.0361, "step": 181270 }, { "epoch": 1.17, "learning_rate": 0.00012449640821753357, "loss": 0.0338, "step": 181280 }, { "epoch": 1.17, "learning_rate": 0.00012448672686317665, "loss": 0.0325, "step": 181290 }, { "epoch": 1.17, "learning_rate": 0.0001244770455088197, "loss": 0.0362, "step": 181300 }, { "epoch": 1.17, "learning_rate": 0.00012446736415446275, "loss": 0.0313, "step": 181310 }, { "epoch": 1.17, "learning_rate": 0.00012445768280010583, "loss": 0.0316, "step": 181320 }, { "epoch": 1.17, "learning_rate": 0.00012444800144574891, "loss": 0.0294, "step": 181330 }, { "epoch": 1.17, "learning_rate": 0.00012443832009139197, "loss": 0.0332, "step": 181340 }, { "epoch": 1.17, "learning_rate": 0.00012442863873703505, "loss": 0.028, "step": 181350 }, { "epoch": 1.17, "learning_rate": 0.00012441895738267813, "loss": 0.0326, "step": 181360 }, { "epoch": 1.17, "learning_rate": 0.00012440927602832118, "loss": 0.0445, "step": 181370 }, { "epoch": 1.17, "learning_rate": 0.00012439959467396423, "loss": 0.0319, "step": 181380 }, { "epoch": 1.17, "learning_rate": 0.0001243899133196073, "loss": 0.0336, "step": 181390 }, { "epoch": 1.17, "learning_rate": 0.0001243802319652504, "loss": 0.0356, "step": 181400 }, { "epoch": 1.17, "learning_rate": 0.00012437055061089344, "loss": 0.0308, "step": 181410 }, { "epoch": 1.17, "learning_rate": 0.00012436086925653652, "loss": 0.0335, "step": 181420 }, { "epoch": 1.17, "learning_rate": 0.00012435118790217958, "loss": 0.0306, "step": 181430 }, { "epoch": 1.17, "learning_rate": 0.00012434150654782266, "loss": 0.0259, "step": 181440 }, { "epoch": 1.17, "learning_rate": 0.0001243318251934657, "loss": 0.0335, "step": 181450 }, { "epoch": 1.17, "learning_rate": 0.0001243221438391088, "loss": 0.0293, "step": 181460 }, { "epoch": 1.17, "learning_rate": 0.00012431246248475187, "loss": 0.0404, "step": 181470 }, { "epoch": 1.17, "learning_rate": 0.00012430278113039492, "loss": 0.0277, "step": 181480 }, { "epoch": 1.17, "learning_rate": 0.000124293099776038, "loss": 0.0286, "step": 181490 }, { "epoch": 1.17, "learning_rate": 0.00012428341842168105, "loss": 0.0431, "step": 181500 }, { "epoch": 1.17, "learning_rate": 0.0001242737370673241, "loss": 0.0359, "step": 181510 }, { "epoch": 1.17, "learning_rate": 0.0001242640557129672, "loss": 0.0404, "step": 181520 }, { "epoch": 1.17, "learning_rate": 0.00012425437435861027, "loss": 0.0326, "step": 181530 }, { "epoch": 1.17, "learning_rate": 0.00012424469300425335, "loss": 0.0338, "step": 181540 }, { "epoch": 1.17, "learning_rate": 0.0001242350116498964, "loss": 0.0398, "step": 181550 }, { "epoch": 1.17, "learning_rate": 0.00012422533029553948, "loss": 0.0346, "step": 181560 }, { "epoch": 1.17, "learning_rate": 0.00012421564894118253, "loss": 0.0343, "step": 181570 }, { "epoch": 1.17, "learning_rate": 0.00012420596758682558, "loss": 0.0318, "step": 181580 }, { "epoch": 1.17, "learning_rate": 0.00012419628623246866, "loss": 0.0314, "step": 181590 }, { "epoch": 1.17, "learning_rate": 0.00012418660487811174, "loss": 0.0319, "step": 181600 }, { "epoch": 1.17, "learning_rate": 0.00012417692352375482, "loss": 0.0342, "step": 181610 }, { "epoch": 1.17, "learning_rate": 0.00012416724216939788, "loss": 0.0326, "step": 181620 }, { "epoch": 1.17, "learning_rate": 0.00012415756081504093, "loss": 0.0354, "step": 181630 }, { "epoch": 1.17, "learning_rate": 0.000124147879460684, "loss": 0.0375, "step": 181640 }, { "epoch": 1.17, "learning_rate": 0.00012413819810632706, "loss": 0.0311, "step": 181650 }, { "epoch": 1.17, "learning_rate": 0.00012412851675197014, "loss": 0.0352, "step": 181660 }, { "epoch": 1.17, "learning_rate": 0.00012411883539761322, "loss": 0.0304, "step": 181670 }, { "epoch": 1.17, "learning_rate": 0.00012410915404325627, "loss": 0.0291, "step": 181680 }, { "epoch": 1.17, "learning_rate": 0.00012409947268889935, "loss": 0.0294, "step": 181690 }, { "epoch": 1.17, "learning_rate": 0.0001240897913345424, "loss": 0.0349, "step": 181700 }, { "epoch": 1.17, "learning_rate": 0.00012408010998018549, "loss": 0.0331, "step": 181710 }, { "epoch": 1.17, "learning_rate": 0.00012407042862582854, "loss": 0.0323, "step": 181720 }, { "epoch": 1.17, "learning_rate": 0.00012406074727147162, "loss": 0.0359, "step": 181730 }, { "epoch": 1.17, "learning_rate": 0.0001240510659171147, "loss": 0.03, "step": 181740 }, { "epoch": 1.17, "learning_rate": 0.00012404138456275775, "loss": 0.0302, "step": 181750 }, { "epoch": 1.17, "learning_rate": 0.00012403170320840083, "loss": 0.0325, "step": 181760 }, { "epoch": 1.17, "learning_rate": 0.00012402202185404388, "loss": 0.0326, "step": 181770 }, { "epoch": 1.17, "learning_rate": 0.00012401234049968696, "loss": 0.0332, "step": 181780 }, { "epoch": 1.17, "learning_rate": 0.00012400265914533002, "loss": 0.0308, "step": 181790 }, { "epoch": 1.17, "learning_rate": 0.0001239929777909731, "loss": 0.0327, "step": 181800 }, { "epoch": 1.17, "learning_rate": 0.00012398329643661618, "loss": 0.0322, "step": 181810 }, { "epoch": 1.17, "learning_rate": 0.00012397361508225923, "loss": 0.032, "step": 181820 }, { "epoch": 1.17, "learning_rate": 0.00012396393372790228, "loss": 0.0289, "step": 181830 }, { "epoch": 1.17, "learning_rate": 0.00012395425237354536, "loss": 0.0296, "step": 181840 }, { "epoch": 1.17, "learning_rate": 0.00012394457101918844, "loss": 0.043, "step": 181850 }, { "epoch": 1.17, "learning_rate": 0.0001239348896648315, "loss": 0.0327, "step": 181860 }, { "epoch": 1.17, "learning_rate": 0.00012392520831047457, "loss": 0.0313, "step": 181870 }, { "epoch": 1.17, "learning_rate": 0.00012391552695611763, "loss": 0.0386, "step": 181880 }, { "epoch": 1.17, "learning_rate": 0.0001239058456017607, "loss": 0.0358, "step": 181890 }, { "epoch": 1.17, "learning_rate": 0.00012389616424740376, "loss": 0.0313, "step": 181900 }, { "epoch": 1.17, "learning_rate": 0.00012388648289304684, "loss": 0.0317, "step": 181910 }, { "epoch": 1.17, "learning_rate": 0.00012387680153868992, "loss": 0.0347, "step": 181920 }, { "epoch": 1.17, "learning_rate": 0.00012386712018433297, "loss": 0.0327, "step": 181930 }, { "epoch": 1.17, "learning_rate": 0.00012385743882997605, "loss": 0.0405, "step": 181940 }, { "epoch": 1.17, "learning_rate": 0.0001238477574756191, "loss": 0.0301, "step": 181950 }, { "epoch": 1.17, "learning_rate": 0.00012383807612126218, "loss": 0.028, "step": 181960 }, { "epoch": 1.17, "learning_rate": 0.00012382839476690524, "loss": 0.0276, "step": 181970 }, { "epoch": 1.17, "learning_rate": 0.00012381871341254831, "loss": 0.0332, "step": 181980 }, { "epoch": 1.17, "learning_rate": 0.0001238090320581914, "loss": 0.0268, "step": 181990 }, { "epoch": 1.17, "learning_rate": 0.00012379935070383445, "loss": 0.0305, "step": 182000 }, { "epoch": 1.17, "eval_cer": 0.9198861145633261, "eval_loss": 0.0231363195925951, "eval_runtime": 120.0639, "eval_samples_per_second": 16.658, "eval_steps_per_second": 4.164, "step": 182000 }, { "epoch": 1.17, "learning_rate": 0.00012378966934947753, "loss": 0.0339, "step": 182010 }, { "epoch": 1.17, "learning_rate": 0.00012377998799512058, "loss": 0.033, "step": 182020 }, { "epoch": 1.17, "learning_rate": 0.00012377030664076366, "loss": 0.0328, "step": 182030 }, { "epoch": 1.17, "learning_rate": 0.0001237606252864067, "loss": 0.0302, "step": 182040 }, { "epoch": 1.17, "learning_rate": 0.0001237509439320498, "loss": 0.0301, "step": 182050 }, { "epoch": 1.18, "learning_rate": 0.00012374126257769287, "loss": 0.033, "step": 182060 }, { "epoch": 1.18, "learning_rate": 0.00012373158122333592, "loss": 0.0315, "step": 182070 }, { "epoch": 1.18, "learning_rate": 0.000123721899868979, "loss": 0.0368, "step": 182080 }, { "epoch": 1.18, "learning_rate": 0.00012371221851462206, "loss": 0.0333, "step": 182090 }, { "epoch": 1.18, "learning_rate": 0.00012370253716026514, "loss": 0.0337, "step": 182100 }, { "epoch": 1.18, "learning_rate": 0.0001236928558059082, "loss": 0.0315, "step": 182110 }, { "epoch": 1.18, "learning_rate": 0.00012368317445155127, "loss": 0.0301, "step": 182120 }, { "epoch": 1.18, "learning_rate": 0.00012367349309719435, "loss": 0.0307, "step": 182130 }, { "epoch": 1.18, "learning_rate": 0.0001236638117428374, "loss": 0.0319, "step": 182140 }, { "epoch": 1.18, "learning_rate": 0.00012365413038848045, "loss": 0.0291, "step": 182150 }, { "epoch": 1.18, "learning_rate": 0.00012364444903412353, "loss": 0.0308, "step": 182160 }, { "epoch": 1.18, "learning_rate": 0.00012363476767976661, "loss": 0.0283, "step": 182170 }, { "epoch": 1.18, "learning_rate": 0.00012362508632540967, "loss": 0.0339, "step": 182180 }, { "epoch": 1.18, "learning_rate": 0.00012361540497105275, "loss": 0.0286, "step": 182190 }, { "epoch": 1.18, "learning_rate": 0.0001236057236166958, "loss": 0.0293, "step": 182200 }, { "epoch": 1.18, "learning_rate": 0.00012359604226233888, "loss": 0.0306, "step": 182210 }, { "epoch": 1.18, "learning_rate": 0.00012358636090798193, "loss": 0.0314, "step": 182220 }, { "epoch": 1.18, "learning_rate": 0.000123576679553625, "loss": 0.0319, "step": 182230 }, { "epoch": 1.18, "learning_rate": 0.0001235669981992681, "loss": 0.0409, "step": 182240 }, { "epoch": 1.18, "learning_rate": 0.00012355731684491114, "loss": 0.0335, "step": 182250 }, { "epoch": 1.18, "learning_rate": 0.00012354763549055422, "loss": 0.0414, "step": 182260 }, { "epoch": 1.18, "learning_rate": 0.00012353795413619728, "loss": 0.0286, "step": 182270 }, { "epoch": 1.18, "learning_rate": 0.00012352827278184036, "loss": 0.0279, "step": 182280 }, { "epoch": 1.18, "learning_rate": 0.0001235185914274834, "loss": 0.0348, "step": 182290 }, { "epoch": 1.18, "learning_rate": 0.0001235089100731265, "loss": 0.0302, "step": 182300 }, { "epoch": 1.18, "learning_rate": 0.00012349922871876957, "loss": 0.0289, "step": 182310 }, { "epoch": 1.18, "learning_rate": 0.00012348954736441262, "loss": 0.0292, "step": 182320 }, { "epoch": 1.18, "learning_rate": 0.0001234798660100557, "loss": 0.0348, "step": 182330 }, { "epoch": 1.18, "learning_rate": 0.00012347018465569875, "loss": 0.034, "step": 182340 }, { "epoch": 1.18, "learning_rate": 0.0001234605033013418, "loss": 0.0262, "step": 182350 }, { "epoch": 1.18, "learning_rate": 0.00012345082194698489, "loss": 0.0263, "step": 182360 }, { "epoch": 1.18, "learning_rate": 0.00012344114059262797, "loss": 0.0368, "step": 182370 }, { "epoch": 1.18, "learning_rate": 0.00012343145923827105, "loss": 0.0377, "step": 182380 }, { "epoch": 1.18, "learning_rate": 0.0001234217778839141, "loss": 0.0289, "step": 182390 }, { "epoch": 1.18, "learning_rate": 0.00012341209652955715, "loss": 0.0343, "step": 182400 }, { "epoch": 1.18, "learning_rate": 0.00012340241517520023, "loss": 0.036, "step": 182410 }, { "epoch": 1.18, "learning_rate": 0.00012339273382084328, "loss": 0.0291, "step": 182420 }, { "epoch": 1.18, "learning_rate": 0.00012338305246648636, "loss": 0.0292, "step": 182430 }, { "epoch": 1.18, "learning_rate": 0.00012337337111212944, "loss": 0.0343, "step": 182440 }, { "epoch": 1.18, "learning_rate": 0.00012336368975777252, "loss": 0.0324, "step": 182450 }, { "epoch": 1.18, "learning_rate": 0.00012335400840341558, "loss": 0.0286, "step": 182460 }, { "epoch": 1.18, "learning_rate": 0.00012334432704905863, "loss": 0.0339, "step": 182470 }, { "epoch": 1.18, "learning_rate": 0.0001233346456947017, "loss": 0.0302, "step": 182480 }, { "epoch": 1.18, "learning_rate": 0.00012332496434034476, "loss": 0.0371, "step": 182490 }, { "epoch": 1.18, "learning_rate": 0.00012331528298598784, "loss": 0.0391, "step": 182500 }, { "epoch": 1.18, "learning_rate": 0.00012330560163163092, "loss": 0.0336, "step": 182510 }, { "epoch": 1.18, "learning_rate": 0.00012329592027727397, "loss": 0.0301, "step": 182520 }, { "epoch": 1.18, "learning_rate": 0.00012328623892291705, "loss": 0.0311, "step": 182530 }, { "epoch": 1.18, "learning_rate": 0.0001232765575685601, "loss": 0.0273, "step": 182540 }, { "epoch": 1.18, "learning_rate": 0.00012326687621420319, "loss": 0.032, "step": 182550 }, { "epoch": 1.18, "learning_rate": 0.00012325719485984624, "loss": 0.0364, "step": 182560 }, { "epoch": 1.18, "learning_rate": 0.00012324751350548932, "loss": 0.032, "step": 182570 }, { "epoch": 1.18, "learning_rate": 0.0001232378321511324, "loss": 0.0307, "step": 182580 }, { "epoch": 1.18, "learning_rate": 0.00012322815079677545, "loss": 0.0315, "step": 182590 }, { "epoch": 1.18, "learning_rate": 0.0001232184694424185, "loss": 0.0304, "step": 182600 }, { "epoch": 1.18, "learning_rate": 0.00012320878808806158, "loss": 0.0328, "step": 182610 }, { "epoch": 1.18, "learning_rate": 0.00012319910673370466, "loss": 0.0389, "step": 182620 }, { "epoch": 1.18, "learning_rate": 0.00012318942537934772, "loss": 0.0304, "step": 182630 }, { "epoch": 1.18, "learning_rate": 0.0001231797440249908, "loss": 0.0317, "step": 182640 }, { "epoch": 1.18, "learning_rate": 0.00012317006267063387, "loss": 0.0329, "step": 182650 }, { "epoch": 1.18, "learning_rate": 0.00012316038131627693, "loss": 0.033, "step": 182660 }, { "epoch": 1.18, "learning_rate": 0.00012315069996191998, "loss": 0.0375, "step": 182670 }, { "epoch": 1.18, "learning_rate": 0.00012314101860756306, "loss": 0.036, "step": 182680 }, { "epoch": 1.18, "learning_rate": 0.00012313133725320614, "loss": 0.0351, "step": 182690 }, { "epoch": 1.18, "learning_rate": 0.0001231216558988492, "loss": 0.0379, "step": 182700 }, { "epoch": 1.18, "learning_rate": 0.00012311197454449227, "loss": 0.0362, "step": 182710 }, { "epoch": 1.18, "learning_rate": 0.00012310229319013533, "loss": 0.0295, "step": 182720 }, { "epoch": 1.18, "learning_rate": 0.0001230926118357784, "loss": 0.031, "step": 182730 }, { "epoch": 1.18, "learning_rate": 0.00012308293048142146, "loss": 0.0327, "step": 182740 }, { "epoch": 1.18, "learning_rate": 0.00012307324912706454, "loss": 0.0357, "step": 182750 }, { "epoch": 1.18, "learning_rate": 0.00012306356777270762, "loss": 0.0357, "step": 182760 }, { "epoch": 1.18, "learning_rate": 0.00012305388641835067, "loss": 0.0283, "step": 182770 }, { "epoch": 1.18, "learning_rate": 0.00012304420506399375, "loss": 0.0405, "step": 182780 }, { "epoch": 1.18, "learning_rate": 0.0001230345237096368, "loss": 0.0323, "step": 182790 }, { "epoch": 1.18, "learning_rate": 0.00012302484235527988, "loss": 0.0311, "step": 182800 }, { "epoch": 1.18, "learning_rate": 0.00012301516100092293, "loss": 0.0302, "step": 182810 }, { "epoch": 1.18, "learning_rate": 0.00012300547964656601, "loss": 0.0381, "step": 182820 }, { "epoch": 1.18, "learning_rate": 0.0001229957982922091, "loss": 0.0282, "step": 182830 }, { "epoch": 1.18, "learning_rate": 0.00012298611693785215, "loss": 0.0353, "step": 182840 }, { "epoch": 1.18, "learning_rate": 0.00012297643558349523, "loss": 0.0373, "step": 182850 }, { "epoch": 1.18, "learning_rate": 0.00012296675422913828, "loss": 0.0317, "step": 182860 }, { "epoch": 1.18, "learning_rate": 0.00012295707287478136, "loss": 0.0343, "step": 182870 }, { "epoch": 1.18, "learning_rate": 0.0001229473915204244, "loss": 0.0267, "step": 182880 }, { "epoch": 1.18, "learning_rate": 0.0001229377101660675, "loss": 0.0396, "step": 182890 }, { "epoch": 1.18, "learning_rate": 0.00012292802881171057, "loss": 0.0345, "step": 182900 }, { "epoch": 1.18, "learning_rate": 0.00012291834745735362, "loss": 0.0337, "step": 182910 }, { "epoch": 1.18, "learning_rate": 0.00012290866610299668, "loss": 0.0292, "step": 182920 }, { "epoch": 1.18, "learning_rate": 0.00012289898474863976, "loss": 0.0362, "step": 182930 }, { "epoch": 1.18, "learning_rate": 0.00012288930339428284, "loss": 0.0334, "step": 182940 }, { "epoch": 1.18, "learning_rate": 0.0001228796220399259, "loss": 0.0372, "step": 182950 }, { "epoch": 1.18, "learning_rate": 0.00012286994068556897, "loss": 0.0303, "step": 182960 }, { "epoch": 1.18, "learning_rate": 0.00012286025933121205, "loss": 0.0385, "step": 182970 }, { "epoch": 1.18, "learning_rate": 0.0001228505779768551, "loss": 0.0367, "step": 182980 }, { "epoch": 1.18, "learning_rate": 0.00012284089662249815, "loss": 0.0338, "step": 182990 }, { "epoch": 1.18, "learning_rate": 0.00012283121526814123, "loss": 0.0454, "step": 183000 }, { "epoch": 1.18, "eval_cer": 0.9199674613038075, "eval_loss": 0.023103881627321243, "eval_runtime": 120.0626, "eval_samples_per_second": 16.658, "eval_steps_per_second": 4.164, "step": 183000 }, { "epoch": 1.18, "learning_rate": 0.00012282153391378431, "loss": 0.0339, "step": 183010 }, { "epoch": 1.18, "learning_rate": 0.00012281185255942737, "loss": 0.0299, "step": 183020 }, { "epoch": 1.18, "learning_rate": 0.00012280217120507045, "loss": 0.0337, "step": 183030 }, { "epoch": 1.18, "learning_rate": 0.0001227924898507135, "loss": 0.0272, "step": 183040 }, { "epoch": 1.18, "learning_rate": 0.00012278280849635658, "loss": 0.0322, "step": 183050 }, { "epoch": 1.18, "learning_rate": 0.00012277312714199963, "loss": 0.0301, "step": 183060 }, { "epoch": 1.18, "learning_rate": 0.0001227634457876427, "loss": 0.0366, "step": 183070 }, { "epoch": 1.18, "learning_rate": 0.0001227537644332858, "loss": 0.0266, "step": 183080 }, { "epoch": 1.18, "learning_rate": 0.00012274408307892884, "loss": 0.0324, "step": 183090 }, { "epoch": 1.18, "learning_rate": 0.00012273440172457192, "loss": 0.0306, "step": 183100 }, { "epoch": 1.18, "learning_rate": 0.00012272472037021498, "loss": 0.0308, "step": 183110 }, { "epoch": 1.18, "learning_rate": 0.00012271503901585803, "loss": 0.0324, "step": 183120 }, { "epoch": 1.18, "learning_rate": 0.0001227053576615011, "loss": 0.0339, "step": 183130 }, { "epoch": 1.18, "learning_rate": 0.0001226956763071442, "loss": 0.0385, "step": 183140 }, { "epoch": 1.18, "learning_rate": 0.00012268599495278727, "loss": 0.0426, "step": 183150 }, { "epoch": 1.18, "learning_rate": 0.00012267631359843032, "loss": 0.0336, "step": 183160 }, { "epoch": 1.18, "learning_rate": 0.0001226666322440734, "loss": 0.0323, "step": 183170 }, { "epoch": 1.18, "learning_rate": 0.00012265695088971645, "loss": 0.0343, "step": 183180 }, { "epoch": 1.18, "learning_rate": 0.0001226472695353595, "loss": 0.0303, "step": 183190 }, { "epoch": 1.18, "learning_rate": 0.00012263758818100259, "loss": 0.0312, "step": 183200 }, { "epoch": 1.18, "learning_rate": 0.00012262790682664567, "loss": 0.0271, "step": 183210 }, { "epoch": 1.18, "learning_rate": 0.00012261822547228875, "loss": 0.0356, "step": 183220 }, { "epoch": 1.18, "learning_rate": 0.0001226085441179318, "loss": 0.0387, "step": 183230 }, { "epoch": 1.18, "learning_rate": 0.00012259886276357485, "loss": 0.0379, "step": 183240 }, { "epoch": 1.18, "learning_rate": 0.00012258918140921793, "loss": 0.0358, "step": 183250 }, { "epoch": 1.18, "learning_rate": 0.00012257950005486098, "loss": 0.0363, "step": 183260 }, { "epoch": 1.18, "learning_rate": 0.00012256981870050406, "loss": 0.0361, "step": 183270 }, { "epoch": 1.18, "learning_rate": 0.00012256013734614714, "loss": 0.0309, "step": 183280 }, { "epoch": 1.18, "learning_rate": 0.0001225504559917902, "loss": 0.0335, "step": 183290 }, { "epoch": 1.18, "learning_rate": 0.00012254077463743328, "loss": 0.0308, "step": 183300 }, { "epoch": 1.18, "learning_rate": 0.00012253109328307633, "loss": 0.0338, "step": 183310 }, { "epoch": 1.18, "learning_rate": 0.0001225214119287194, "loss": 0.0265, "step": 183320 }, { "epoch": 1.18, "learning_rate": 0.00012251173057436246, "loss": 0.0357, "step": 183330 }, { "epoch": 1.18, "learning_rate": 0.00012250204922000554, "loss": 0.0381, "step": 183340 }, { "epoch": 1.18, "learning_rate": 0.00012249236786564862, "loss": 0.0319, "step": 183350 }, { "epoch": 1.18, "learning_rate": 0.00012248268651129167, "loss": 0.0297, "step": 183360 }, { "epoch": 1.18, "learning_rate": 0.00012247300515693475, "loss": 0.0423, "step": 183370 }, { "epoch": 1.18, "learning_rate": 0.0001224633238025778, "loss": 0.0384, "step": 183380 }, { "epoch": 1.18, "learning_rate": 0.00012245364244822089, "loss": 0.0337, "step": 183390 }, { "epoch": 1.18, "learning_rate": 0.00012244396109386394, "loss": 0.0339, "step": 183400 }, { "epoch": 1.18, "learning_rate": 0.00012243427973950702, "loss": 0.0293, "step": 183410 }, { "epoch": 1.18, "learning_rate": 0.0001224245983851501, "loss": 0.0309, "step": 183420 }, { "epoch": 1.18, "learning_rate": 0.00012241491703079315, "loss": 0.0298, "step": 183430 }, { "epoch": 1.18, "learning_rate": 0.0001224052356764362, "loss": 0.0351, "step": 183440 }, { "epoch": 1.18, "learning_rate": 0.00012239555432207928, "loss": 0.0298, "step": 183450 }, { "epoch": 1.18, "learning_rate": 0.00012238587296772236, "loss": 0.033, "step": 183460 }, { "epoch": 1.18, "learning_rate": 0.00012237619161336541, "loss": 0.0331, "step": 183470 }, { "epoch": 1.18, "learning_rate": 0.0001223665102590085, "loss": 0.0304, "step": 183480 }, { "epoch": 1.18, "learning_rate": 0.00012235682890465155, "loss": 0.0333, "step": 183490 }, { "epoch": 1.18, "learning_rate": 0.00012234714755029463, "loss": 0.0327, "step": 183500 }, { "epoch": 1.18, "learning_rate": 0.00012233746619593768, "loss": 0.0296, "step": 183510 }, { "epoch": 1.18, "learning_rate": 0.00012232778484158076, "loss": 0.0332, "step": 183520 }, { "epoch": 1.18, "learning_rate": 0.00012231810348722384, "loss": 0.0311, "step": 183530 }, { "epoch": 1.18, "learning_rate": 0.0001223084221328669, "loss": 0.0398, "step": 183540 }, { "epoch": 1.18, "learning_rate": 0.00012229874077850997, "loss": 0.0344, "step": 183550 }, { "epoch": 1.18, "learning_rate": 0.00012228905942415302, "loss": 0.0286, "step": 183560 }, { "epoch": 1.18, "learning_rate": 0.0001222793780697961, "loss": 0.0281, "step": 183570 }, { "epoch": 1.18, "learning_rate": 0.00012226969671543916, "loss": 0.0354, "step": 183580 }, { "epoch": 1.18, "learning_rate": 0.00012226001536108224, "loss": 0.0329, "step": 183590 }, { "epoch": 1.18, "learning_rate": 0.00012225033400672532, "loss": 0.0283, "step": 183600 }, { "epoch": 1.19, "learning_rate": 0.00012224065265236837, "loss": 0.0296, "step": 183610 }, { "epoch": 1.19, "learning_rate": 0.00012223097129801145, "loss": 0.0281, "step": 183620 }, { "epoch": 1.19, "learning_rate": 0.0001222212899436545, "loss": 0.0326, "step": 183630 }, { "epoch": 1.19, "learning_rate": 0.00012221160858929758, "loss": 0.0309, "step": 183640 }, { "epoch": 1.19, "learning_rate": 0.00012220192723494063, "loss": 0.0353, "step": 183650 }, { "epoch": 1.19, "learning_rate": 0.00012219224588058371, "loss": 0.0343, "step": 183660 }, { "epoch": 1.19, "learning_rate": 0.0001221825645262268, "loss": 0.0331, "step": 183670 }, { "epoch": 1.19, "learning_rate": 0.00012217288317186985, "loss": 0.0338, "step": 183680 }, { "epoch": 1.19, "learning_rate": 0.0001221632018175129, "loss": 0.0388, "step": 183690 }, { "epoch": 1.19, "learning_rate": 0.00012215352046315598, "loss": 0.0338, "step": 183700 }, { "epoch": 1.19, "learning_rate": 0.00012214383910879906, "loss": 0.0331, "step": 183710 }, { "epoch": 1.19, "learning_rate": 0.0001221341577544421, "loss": 0.0309, "step": 183720 }, { "epoch": 1.19, "learning_rate": 0.0001221244764000852, "loss": 0.0346, "step": 183730 }, { "epoch": 1.19, "learning_rate": 0.00012211479504572827, "loss": 0.0321, "step": 183740 }, { "epoch": 1.19, "learning_rate": 0.00012210511369137132, "loss": 0.0265, "step": 183750 }, { "epoch": 1.19, "learning_rate": 0.00012209543233701438, "loss": 0.0331, "step": 183760 }, { "epoch": 1.19, "learning_rate": 0.00012208575098265746, "loss": 0.0342, "step": 183770 }, { "epoch": 1.19, "learning_rate": 0.00012207606962830054, "loss": 0.0261, "step": 183780 }, { "epoch": 1.19, "learning_rate": 0.00012206638827394359, "loss": 0.0333, "step": 183790 }, { "epoch": 1.19, "learning_rate": 0.00012205670691958666, "loss": 0.0359, "step": 183800 }, { "epoch": 1.19, "learning_rate": 0.00012204702556522973, "loss": 0.0364, "step": 183810 }, { "epoch": 1.19, "learning_rate": 0.00012203734421087279, "loss": 0.0352, "step": 183820 }, { "epoch": 1.19, "learning_rate": 0.00012202766285651587, "loss": 0.0357, "step": 183830 }, { "epoch": 1.19, "learning_rate": 0.00012201798150215893, "loss": 0.0314, "step": 183840 }, { "epoch": 1.19, "learning_rate": 0.00012200830014780201, "loss": 0.0386, "step": 183850 }, { "epoch": 1.19, "learning_rate": 0.00012199861879344507, "loss": 0.0325, "step": 183860 }, { "epoch": 1.19, "learning_rate": 0.00012198893743908813, "loss": 0.0376, "step": 183870 }, { "epoch": 1.19, "learning_rate": 0.00012197925608473121, "loss": 0.037, "step": 183880 }, { "epoch": 1.19, "learning_rate": 0.00012196957473037426, "loss": 0.0342, "step": 183890 }, { "epoch": 1.19, "learning_rate": 0.00012195989337601733, "loss": 0.0351, "step": 183900 }, { "epoch": 1.19, "learning_rate": 0.00012195021202166041, "loss": 0.03, "step": 183910 }, { "epoch": 1.19, "learning_rate": 0.00012194053066730348, "loss": 0.029, "step": 183920 }, { "epoch": 1.19, "learning_rate": 0.00012193084931294654, "loss": 0.0296, "step": 183930 }, { "epoch": 1.19, "learning_rate": 0.00012192116795858961, "loss": 0.0317, "step": 183940 }, { "epoch": 1.19, "learning_rate": 0.00012191148660423269, "loss": 0.0399, "step": 183950 }, { "epoch": 1.19, "learning_rate": 0.00012190180524987574, "loss": 0.033, "step": 183960 }, { "epoch": 1.19, "learning_rate": 0.00012189212389551881, "loss": 0.0319, "step": 183970 }, { "epoch": 1.19, "learning_rate": 0.00012188244254116189, "loss": 0.0357, "step": 183980 }, { "epoch": 1.19, "learning_rate": 0.00012187276118680495, "loss": 0.028, "step": 183990 }, { "epoch": 1.19, "learning_rate": 0.00012186307983244801, "loss": 0.0339, "step": 184000 }, { "epoch": 1.19, "eval_cer": 0.9198978646480623, "eval_loss": 0.023351291194558144, "eval_runtime": 120.0133, "eval_samples_per_second": 16.665, "eval_steps_per_second": 4.166, "step": 184000 }, { "epoch": 1.19, "learning_rate": 0.00012185339847809109, "loss": 0.0279, "step": 184010 }, { "epoch": 1.19, "learning_rate": 0.00012184371712373415, "loss": 0.0329, "step": 184020 }, { "epoch": 1.19, "learning_rate": 0.00012183403576937722, "loss": 0.0363, "step": 184030 }, { "epoch": 1.19, "learning_rate": 0.00012182435441502029, "loss": 0.0325, "step": 184040 }, { "epoch": 1.19, "learning_rate": 0.00012181467306066337, "loss": 0.0309, "step": 184050 }, { "epoch": 1.19, "learning_rate": 0.00012180499170630643, "loss": 0.0312, "step": 184060 }, { "epoch": 1.19, "learning_rate": 0.00012179531035194948, "loss": 0.0269, "step": 184070 }, { "epoch": 1.19, "learning_rate": 0.00012178562899759256, "loss": 0.0297, "step": 184080 }, { "epoch": 1.19, "learning_rate": 0.00012177594764323563, "loss": 0.0302, "step": 184090 }, { "epoch": 1.19, "learning_rate": 0.00012176626628887868, "loss": 0.0286, "step": 184100 }, { "epoch": 1.19, "learning_rate": 0.00012175658493452176, "loss": 0.0365, "step": 184110 }, { "epoch": 1.19, "learning_rate": 0.00012174690358016483, "loss": 0.0311, "step": 184120 }, { "epoch": 1.19, "learning_rate": 0.00012173722222580791, "loss": 0.0385, "step": 184130 }, { "epoch": 1.19, "learning_rate": 0.00012172754087145096, "loss": 0.0381, "step": 184140 }, { "epoch": 1.19, "learning_rate": 0.00012171785951709404, "loss": 0.0319, "step": 184150 }, { "epoch": 1.19, "learning_rate": 0.00012170817816273711, "loss": 0.0342, "step": 184160 }, { "epoch": 1.19, "learning_rate": 0.00012169849680838016, "loss": 0.029, "step": 184170 }, { "epoch": 1.19, "learning_rate": 0.00012168881545402324, "loss": 0.0324, "step": 184180 }, { "epoch": 1.19, "learning_rate": 0.0001216791340996663, "loss": 0.0339, "step": 184190 }, { "epoch": 1.19, "learning_rate": 0.00012166945274530939, "loss": 0.0298, "step": 184200 }, { "epoch": 1.19, "learning_rate": 0.00012165977139095244, "loss": 0.0287, "step": 184210 }, { "epoch": 1.19, "learning_rate": 0.0001216500900365955, "loss": 0.0302, "step": 184220 }, { "epoch": 1.19, "learning_rate": 0.00012164040868223858, "loss": 0.0292, "step": 184230 }, { "epoch": 1.19, "learning_rate": 0.00012163072732788164, "loss": 0.03, "step": 184240 }, { "epoch": 1.19, "learning_rate": 0.00012162104597352472, "loss": 0.03, "step": 184250 }, { "epoch": 1.19, "learning_rate": 0.00012161136461916778, "loss": 0.0262, "step": 184260 }, { "epoch": 1.19, "learning_rate": 0.00012160168326481084, "loss": 0.0329, "step": 184270 }, { "epoch": 1.19, "learning_rate": 0.00012159200191045392, "loss": 0.0296, "step": 184280 }, { "epoch": 1.19, "learning_rate": 0.00012158232055609698, "loss": 0.0374, "step": 184290 }, { "epoch": 1.19, "learning_rate": 0.00012157263920174006, "loss": 0.0328, "step": 184300 }, { "epoch": 1.19, "learning_rate": 0.00012156295784738311, "loss": 0.0335, "step": 184310 }, { "epoch": 1.19, "learning_rate": 0.00012155327649302618, "loss": 0.0324, "step": 184320 }, { "epoch": 1.19, "learning_rate": 0.00012154359513866926, "loss": 0.0284, "step": 184330 }, { "epoch": 1.19, "learning_rate": 0.00012153391378431231, "loss": 0.0251, "step": 184340 }, { "epoch": 1.19, "learning_rate": 0.00012152423242995539, "loss": 0.0296, "step": 184350 }, { "epoch": 1.19, "learning_rate": 0.00012151455107559846, "loss": 0.0361, "step": 184360 }, { "epoch": 1.19, "learning_rate": 0.00012150486972124153, "loss": 0.0329, "step": 184370 }, { "epoch": 1.19, "learning_rate": 0.00012149518836688459, "loss": 0.027, "step": 184380 }, { "epoch": 1.19, "learning_rate": 0.00012148550701252766, "loss": 0.0308, "step": 184390 }, { "epoch": 1.19, "learning_rate": 0.00012147582565817074, "loss": 0.0307, "step": 184400 }, { "epoch": 1.19, "learning_rate": 0.00012146614430381379, "loss": 0.0347, "step": 184410 }, { "epoch": 1.19, "learning_rate": 0.00012145646294945686, "loss": 0.0295, "step": 184420 }, { "epoch": 1.19, "learning_rate": 0.00012144678159509994, "loss": 0.0301, "step": 184430 }, { "epoch": 1.19, "learning_rate": 0.000121437100240743, "loss": 0.0375, "step": 184440 }, { "epoch": 1.19, "learning_rate": 0.00012142741888638607, "loss": 0.0302, "step": 184450 }, { "epoch": 1.19, "learning_rate": 0.00012141773753202914, "loss": 0.031, "step": 184460 }, { "epoch": 1.19, "learning_rate": 0.00012140805617767222, "loss": 0.0323, "step": 184470 }, { "epoch": 1.19, "learning_rate": 0.00012139837482331527, "loss": 0.0285, "step": 184480 }, { "epoch": 1.19, "learning_rate": 0.00012138869346895833, "loss": 0.0288, "step": 184490 }, { "epoch": 1.19, "learning_rate": 0.00012137901211460141, "loss": 0.0377, "step": 184500 }, { "epoch": 1.19, "learning_rate": 0.00012136933076024448, "loss": 0.0298, "step": 184510 }, { "epoch": 1.19, "learning_rate": 0.00012135964940588753, "loss": 0.032, "step": 184520 }, { "epoch": 1.19, "learning_rate": 0.00012134996805153061, "loss": 0.034, "step": 184530 }, { "epoch": 1.19, "learning_rate": 0.00012134028669717368, "loss": 0.0333, "step": 184540 }, { "epoch": 1.19, "learning_rate": 0.00012133060534281674, "loss": 0.0372, "step": 184550 }, { "epoch": 1.19, "learning_rate": 0.00012132092398845981, "loss": 0.0302, "step": 184560 }, { "epoch": 1.19, "learning_rate": 0.00012131124263410289, "loss": 0.0315, "step": 184570 }, { "epoch": 1.19, "learning_rate": 0.00012130156127974596, "loss": 0.0408, "step": 184580 }, { "epoch": 1.19, "learning_rate": 0.00012129187992538901, "loss": 0.0363, "step": 184590 }, { "epoch": 1.19, "learning_rate": 0.00012128219857103209, "loss": 0.0328, "step": 184600 }, { "epoch": 1.19, "learning_rate": 0.00012127251721667516, "loss": 0.032, "step": 184610 }, { "epoch": 1.19, "learning_rate": 0.00012126283586231821, "loss": 0.0303, "step": 184620 }, { "epoch": 1.19, "learning_rate": 0.00012125315450796129, "loss": 0.0277, "step": 184630 }, { "epoch": 1.19, "learning_rate": 0.00012124347315360435, "loss": 0.0262, "step": 184640 }, { "epoch": 1.19, "learning_rate": 0.00012123379179924743, "loss": 0.0383, "step": 184650 }, { "epoch": 1.19, "learning_rate": 0.00012122411044489049, "loss": 0.0346, "step": 184660 }, { "epoch": 1.19, "learning_rate": 0.00012121442909053357, "loss": 0.0369, "step": 184670 }, { "epoch": 1.19, "learning_rate": 0.00012120474773617663, "loss": 0.0345, "step": 184680 }, { "epoch": 1.19, "learning_rate": 0.00012119506638181969, "loss": 0.0325, "step": 184690 }, { "epoch": 1.19, "learning_rate": 0.00012118538502746277, "loss": 0.0354, "step": 184700 }, { "epoch": 1.19, "learning_rate": 0.00012117570367310583, "loss": 0.0316, "step": 184710 }, { "epoch": 1.19, "learning_rate": 0.00012116602231874891, "loss": 0.0414, "step": 184720 }, { "epoch": 1.19, "learning_rate": 0.00012115634096439196, "loss": 0.0296, "step": 184730 }, { "epoch": 1.19, "learning_rate": 0.00012114665961003503, "loss": 0.0351, "step": 184740 }, { "epoch": 1.19, "learning_rate": 0.00012113697825567811, "loss": 0.0338, "step": 184750 }, { "epoch": 1.19, "learning_rate": 0.00012112729690132116, "loss": 0.0289, "step": 184760 }, { "epoch": 1.19, "learning_rate": 0.00012111761554696424, "loss": 0.0327, "step": 184770 }, { "epoch": 1.19, "learning_rate": 0.00012110793419260731, "loss": 0.0328, "step": 184780 }, { "epoch": 1.19, "learning_rate": 0.00012109825283825038, "loss": 0.0322, "step": 184790 }, { "epoch": 1.19, "learning_rate": 0.00012108857148389344, "loss": 0.0325, "step": 184800 }, { "epoch": 1.19, "learning_rate": 0.00012107889012953651, "loss": 0.0356, "step": 184810 }, { "epoch": 1.19, "learning_rate": 0.00012106920877517959, "loss": 0.0332, "step": 184820 }, { "epoch": 1.19, "learning_rate": 0.00012105952742082264, "loss": 0.0255, "step": 184830 }, { "epoch": 1.19, "learning_rate": 0.0001210498460664657, "loss": 0.0318, "step": 184840 }, { "epoch": 1.19, "learning_rate": 0.00012104016471210879, "loss": 0.0276, "step": 184850 }, { "epoch": 1.19, "learning_rate": 0.00012103048335775185, "loss": 0.0326, "step": 184860 }, { "epoch": 1.19, "learning_rate": 0.00012102080200339492, "loss": 0.0429, "step": 184870 }, { "epoch": 1.19, "learning_rate": 0.00012101112064903799, "loss": 0.0294, "step": 184880 }, { "epoch": 1.19, "learning_rate": 0.00012100143929468105, "loss": 0.0303, "step": 184890 }, { "epoch": 1.19, "learning_rate": 0.00012099175794032412, "loss": 0.0264, "step": 184900 }, { "epoch": 1.19, "learning_rate": 0.00012098207658596718, "loss": 0.0295, "step": 184910 }, { "epoch": 1.19, "learning_rate": 0.00012097239523161026, "loss": 0.0324, "step": 184920 }, { "epoch": 1.19, "learning_rate": 0.00012096271387725333, "loss": 0.0338, "step": 184930 }, { "epoch": 1.19, "learning_rate": 0.00012095303252289638, "loss": 0.0291, "step": 184940 }, { "epoch": 1.19, "learning_rate": 0.00012094335116853946, "loss": 0.0293, "step": 184950 }, { "epoch": 1.19, "learning_rate": 0.00012093366981418253, "loss": 0.0323, "step": 184960 }, { "epoch": 1.19, "learning_rate": 0.0001209239884598256, "loss": 0.0329, "step": 184970 }, { "epoch": 1.19, "learning_rate": 0.00012091430710546866, "loss": 0.0278, "step": 184980 }, { "epoch": 1.19, "learning_rate": 0.00012090462575111173, "loss": 0.0255, "step": 184990 }, { "epoch": 1.19, "learning_rate": 0.00012089494439675481, "loss": 0.0375, "step": 185000 }, { "epoch": 1.19, "eval_cer": 0.9199150378488307, "eval_loss": 0.022892048582434654, "eval_runtime": 120.0905, "eval_samples_per_second": 16.654, "eval_steps_per_second": 4.164, "step": 185000 }, { "epoch": 1.19, "learning_rate": 0.00012088526304239786, "loss": 0.0303, "step": 185010 }, { "epoch": 1.19, "learning_rate": 0.00012087558168804094, "loss": 0.0331, "step": 185020 }, { "epoch": 1.19, "learning_rate": 0.000120865900333684, "loss": 0.0302, "step": 185030 }, { "epoch": 1.19, "learning_rate": 0.00012085621897932706, "loss": 0.0281, "step": 185040 }, { "epoch": 1.19, "learning_rate": 0.00012084653762497014, "loss": 0.0306, "step": 185050 }, { "epoch": 1.19, "learning_rate": 0.0001208368562706132, "loss": 0.0306, "step": 185060 }, { "epoch": 1.19, "learning_rate": 0.00012082717491625628, "loss": 0.0304, "step": 185070 }, { "epoch": 1.19, "learning_rate": 0.00012081749356189934, "loss": 0.0281, "step": 185080 }, { "epoch": 1.19, "learning_rate": 0.0001208078122075424, "loss": 0.0385, "step": 185090 }, { "epoch": 1.19, "learning_rate": 0.00012079813085318548, "loss": 0.0352, "step": 185100 }, { "epoch": 1.19, "learning_rate": 0.00012078844949882854, "loss": 0.0364, "step": 185110 }, { "epoch": 1.19, "learning_rate": 0.00012077876814447162, "loss": 0.0312, "step": 185120 }, { "epoch": 1.19, "learning_rate": 0.00012076908679011468, "loss": 0.0322, "step": 185130 }, { "epoch": 1.19, "learning_rate": 0.00012075940543575776, "loss": 0.0318, "step": 185140 }, { "epoch": 1.19, "learning_rate": 0.00012074972408140081, "loss": 0.0299, "step": 185150 }, { "epoch": 1.2, "learning_rate": 0.00012074004272704388, "loss": 0.035, "step": 185160 }, { "epoch": 1.2, "learning_rate": 0.00012073036137268696, "loss": 0.0365, "step": 185170 }, { "epoch": 1.2, "learning_rate": 0.00012072068001833001, "loss": 0.0332, "step": 185180 }, { "epoch": 1.2, "learning_rate": 0.00012071099866397308, "loss": 0.035, "step": 185190 }, { "epoch": 1.2, "learning_rate": 0.00012070131730961616, "loss": 0.0333, "step": 185200 }, { "epoch": 1.2, "learning_rate": 0.00012069163595525923, "loss": 0.029, "step": 185210 }, { "epoch": 1.2, "learning_rate": 0.00012068195460090229, "loss": 0.0367, "step": 185220 }, { "epoch": 1.2, "learning_rate": 0.00012067227324654536, "loss": 0.0396, "step": 185230 }, { "epoch": 1.2, "learning_rate": 0.00012066259189218844, "loss": 0.0288, "step": 185240 }, { "epoch": 1.2, "learning_rate": 0.00012065291053783149, "loss": 0.0343, "step": 185250 }, { "epoch": 1.2, "learning_rate": 0.00012064322918347456, "loss": 0.0305, "step": 185260 }, { "epoch": 1.2, "learning_rate": 0.00012063354782911764, "loss": 0.0373, "step": 185270 }, { "epoch": 1.2, "learning_rate": 0.0001206238664747607, "loss": 0.0336, "step": 185280 }, { "epoch": 1.2, "learning_rate": 0.00012061418512040376, "loss": 0.0284, "step": 185290 }, { "epoch": 1.2, "learning_rate": 0.00012060450376604683, "loss": 0.0332, "step": 185300 }, { "epoch": 1.2, "learning_rate": 0.0001205948224116899, "loss": 0.029, "step": 185310 }, { "epoch": 1.2, "learning_rate": 0.00012058514105733297, "loss": 0.0331, "step": 185320 }, { "epoch": 1.2, "learning_rate": 0.00012057545970297603, "loss": 0.0334, "step": 185330 }, { "epoch": 1.2, "learning_rate": 0.00012056577834861911, "loss": 0.0274, "step": 185340 }, { "epoch": 1.2, "learning_rate": 0.00012055609699426218, "loss": 0.0324, "step": 185350 }, { "epoch": 1.2, "learning_rate": 0.00012054641563990523, "loss": 0.0366, "step": 185360 }, { "epoch": 1.2, "learning_rate": 0.00012053673428554831, "loss": 0.0293, "step": 185370 }, { "epoch": 1.2, "learning_rate": 0.00012052705293119138, "loss": 0.0262, "step": 185380 }, { "epoch": 1.2, "learning_rate": 0.00012051737157683443, "loss": 0.03, "step": 185390 }, { "epoch": 1.2, "learning_rate": 0.00012050769022247751, "loss": 0.0319, "step": 185400 }, { "epoch": 1.2, "learning_rate": 0.00012049800886812058, "loss": 0.0299, "step": 185410 }, { "epoch": 1.2, "learning_rate": 0.00012048832751376366, "loss": 0.0361, "step": 185420 }, { "epoch": 1.2, "learning_rate": 0.00012047864615940671, "loss": 0.0258, "step": 185430 }, { "epoch": 1.2, "learning_rate": 0.00012046896480504979, "loss": 0.0378, "step": 185440 }, { "epoch": 1.2, "learning_rate": 0.00012045928345069286, "loss": 0.0317, "step": 185450 }, { "epoch": 1.2, "learning_rate": 0.00012044960209633591, "loss": 0.0286, "step": 185460 }, { "epoch": 1.2, "learning_rate": 0.00012043992074197899, "loss": 0.0272, "step": 185470 }, { "epoch": 1.2, "learning_rate": 0.00012043023938762205, "loss": 0.0341, "step": 185480 }, { "epoch": 1.2, "learning_rate": 0.00012042055803326513, "loss": 0.0302, "step": 185490 }, { "epoch": 1.2, "learning_rate": 0.00012041087667890819, "loss": 0.0305, "step": 185500 }, { "epoch": 1.2, "learning_rate": 0.00012040119532455125, "loss": 0.03, "step": 185510 }, { "epoch": 1.2, "learning_rate": 0.00012039151397019433, "loss": 0.0359, "step": 185520 }, { "epoch": 1.2, "learning_rate": 0.00012038183261583739, "loss": 0.0354, "step": 185530 }, { "epoch": 1.2, "learning_rate": 0.00012037215126148047, "loss": 0.0395, "step": 185540 }, { "epoch": 1.2, "learning_rate": 0.00012036246990712353, "loss": 0.0295, "step": 185550 }, { "epoch": 1.2, "learning_rate": 0.00012035278855276661, "loss": 0.0339, "step": 185560 }, { "epoch": 1.2, "learning_rate": 0.00012034310719840966, "loss": 0.0361, "step": 185570 }, { "epoch": 1.2, "learning_rate": 0.00012033342584405273, "loss": 0.0279, "step": 185580 }, { "epoch": 1.2, "learning_rate": 0.00012032374448969581, "loss": 0.0321, "step": 185590 }, { "epoch": 1.2, "learning_rate": 0.00012031406313533886, "loss": 0.0353, "step": 185600 }, { "epoch": 1.2, "learning_rate": 0.00012030438178098193, "loss": 0.0342, "step": 185610 }, { "epoch": 1.2, "learning_rate": 0.00012029470042662501, "loss": 0.0345, "step": 185620 }, { "epoch": 1.2, "learning_rate": 0.00012028501907226807, "loss": 0.031, "step": 185630 }, { "epoch": 1.2, "learning_rate": 0.00012027533771791114, "loss": 0.0371, "step": 185640 }, { "epoch": 1.2, "learning_rate": 0.00012026565636355421, "loss": 0.0292, "step": 185650 }, { "epoch": 1.2, "learning_rate": 0.00012025597500919729, "loss": 0.033, "step": 185660 }, { "epoch": 1.2, "learning_rate": 0.00012024629365484034, "loss": 0.0355, "step": 185670 }, { "epoch": 1.2, "learning_rate": 0.0001202366123004834, "loss": 0.029, "step": 185680 }, { "epoch": 1.2, "learning_rate": 0.00012022693094612649, "loss": 0.0293, "step": 185690 }, { "epoch": 1.2, "learning_rate": 0.00012021724959176955, "loss": 0.0335, "step": 185700 }, { "epoch": 1.2, "learning_rate": 0.0001202075682374126, "loss": 0.032, "step": 185710 }, { "epoch": 1.2, "learning_rate": 0.00012019788688305568, "loss": 0.029, "step": 185720 }, { "epoch": 1.2, "learning_rate": 0.00012018820552869875, "loss": 0.0324, "step": 185730 }, { "epoch": 1.2, "learning_rate": 0.00012017852417434182, "loss": 0.0353, "step": 185740 }, { "epoch": 1.2, "learning_rate": 0.00012016884281998488, "loss": 0.03, "step": 185750 }, { "epoch": 1.2, "learning_rate": 0.00012015916146562796, "loss": 0.0275, "step": 185760 }, { "epoch": 1.2, "learning_rate": 0.00012014948011127103, "loss": 0.0318, "step": 185770 }, { "epoch": 1.2, "learning_rate": 0.00012013979875691408, "loss": 0.0255, "step": 185780 }, { "epoch": 1.2, "learning_rate": 0.00012013011740255716, "loss": 0.0315, "step": 185790 }, { "epoch": 1.2, "learning_rate": 0.00012012043604820023, "loss": 0.0369, "step": 185800 }, { "epoch": 1.2, "learning_rate": 0.00012011075469384328, "loss": 0.0325, "step": 185810 }, { "epoch": 1.2, "learning_rate": 0.00012010107333948636, "loss": 0.0378, "step": 185820 }, { "epoch": 1.2, "learning_rate": 0.00012009139198512943, "loss": 0.0307, "step": 185830 }, { "epoch": 1.2, "learning_rate": 0.0001200817106307725, "loss": 0.0297, "step": 185840 }, { "epoch": 1.2, "learning_rate": 0.00012007202927641556, "loss": 0.0338, "step": 185850 }, { "epoch": 1.2, "learning_rate": 0.00012006234792205864, "loss": 0.0344, "step": 185860 }, { "epoch": 1.2, "learning_rate": 0.0001200526665677017, "loss": 0.0308, "step": 185870 }, { "epoch": 1.2, "learning_rate": 0.00012004298521334476, "loss": 0.0346, "step": 185880 }, { "epoch": 1.2, "learning_rate": 0.00012003330385898784, "loss": 0.0343, "step": 185890 }, { "epoch": 1.2, "learning_rate": 0.0001200236225046309, "loss": 0.0318, "step": 185900 }, { "epoch": 1.2, "learning_rate": 0.00012001394115027398, "loss": 0.027, "step": 185910 }, { "epoch": 1.2, "learning_rate": 0.00012000425979591704, "loss": 0.0302, "step": 185920 }, { "epoch": 1.2, "learning_rate": 0.0001199945784415601, "loss": 0.0304, "step": 185930 }, { "epoch": 1.2, "learning_rate": 0.00011998489708720318, "loss": 0.0303, "step": 185940 }, { "epoch": 1.2, "learning_rate": 0.00011997521573284624, "loss": 0.0323, "step": 185950 }, { "epoch": 1.2, "learning_rate": 0.00011996553437848932, "loss": 0.0336, "step": 185960 }, { "epoch": 1.2, "learning_rate": 0.00011995585302413238, "loss": 0.0344, "step": 185970 }, { "epoch": 1.2, "learning_rate": 0.00011994617166977545, "loss": 0.0369, "step": 185980 }, { "epoch": 1.2, "learning_rate": 0.00011993649031541851, "loss": 0.0323, "step": 185990 }, { "epoch": 1.2, "learning_rate": 0.00011992680896106158, "loss": 0.0351, "step": 186000 }, { "epoch": 1.2, "eval_cer": 0.9198815952999662, "eval_loss": 0.022712325677275658, "eval_runtime": 120.0277, "eval_samples_per_second": 16.663, "eval_steps_per_second": 4.166, "step": 186000 }, { "epoch": 1.2, "learning_rate": 0.00011991712760670466, "loss": 0.0321, "step": 186010 }, { "epoch": 1.2, "learning_rate": 0.00011990744625234771, "loss": 0.0325, "step": 186020 }, { "epoch": 1.2, "learning_rate": 0.00011989776489799078, "loss": 0.0341, "step": 186030 }, { "epoch": 1.2, "learning_rate": 0.00011988808354363386, "loss": 0.0283, "step": 186040 }, { "epoch": 1.2, "learning_rate": 0.00011987840218927692, "loss": 0.0304, "step": 186050 }, { "epoch": 1.2, "learning_rate": 0.00011986872083491999, "loss": 0.038, "step": 186060 }, { "epoch": 1.2, "learning_rate": 0.00011985903948056306, "loss": 0.0335, "step": 186070 }, { "epoch": 1.2, "learning_rate": 0.00011984935812620612, "loss": 0.0361, "step": 186080 }, { "epoch": 1.2, "learning_rate": 0.00011983967677184919, "loss": 0.0357, "step": 186090 }, { "epoch": 1.2, "learning_rate": 0.00011982999541749226, "loss": 0.03, "step": 186100 }, { "epoch": 1.2, "learning_rate": 0.00011982031406313534, "loss": 0.0304, "step": 186110 }, { "epoch": 1.2, "learning_rate": 0.0001198106327087784, "loss": 0.031, "step": 186120 }, { "epoch": 1.2, "learning_rate": 0.00011980095135442145, "loss": 0.0323, "step": 186130 }, { "epoch": 1.2, "learning_rate": 0.00011979127000006453, "loss": 0.0331, "step": 186140 }, { "epoch": 1.2, "learning_rate": 0.0001197815886457076, "loss": 0.0254, "step": 186150 }, { "epoch": 1.2, "learning_rate": 0.00011977190729135067, "loss": 0.0328, "step": 186160 }, { "epoch": 1.2, "learning_rate": 0.00011976222593699373, "loss": 0.0325, "step": 186170 }, { "epoch": 1.2, "learning_rate": 0.0001197525445826368, "loss": 0.0356, "step": 186180 }, { "epoch": 1.2, "learning_rate": 0.00011974286322827988, "loss": 0.0321, "step": 186190 }, { "epoch": 1.2, "learning_rate": 0.00011973318187392293, "loss": 0.0319, "step": 186200 }, { "epoch": 1.2, "learning_rate": 0.00011972350051956601, "loss": 0.0314, "step": 186210 }, { "epoch": 1.2, "learning_rate": 0.00011971381916520908, "loss": 0.0353, "step": 186220 }, { "epoch": 1.2, "learning_rate": 0.00011970413781085213, "loss": 0.0267, "step": 186230 }, { "epoch": 1.2, "learning_rate": 0.00011969445645649521, "loss": 0.0323, "step": 186240 }, { "epoch": 1.2, "learning_rate": 0.00011968477510213828, "loss": 0.0291, "step": 186250 }, { "epoch": 1.2, "learning_rate": 0.00011967509374778136, "loss": 0.0293, "step": 186260 }, { "epoch": 1.2, "learning_rate": 0.00011966541239342441, "loss": 0.0331, "step": 186270 }, { "epoch": 1.2, "learning_rate": 0.00011965573103906748, "loss": 0.0354, "step": 186280 }, { "epoch": 1.2, "learning_rate": 0.00011964604968471056, "loss": 0.0278, "step": 186290 }, { "epoch": 1.2, "learning_rate": 0.00011963636833035361, "loss": 0.0403, "step": 186300 }, { "epoch": 1.2, "learning_rate": 0.00011962668697599669, "loss": 0.0322, "step": 186310 }, { "epoch": 1.2, "learning_rate": 0.00011961700562163975, "loss": 0.0316, "step": 186320 }, { "epoch": 1.2, "learning_rate": 0.00011960732426728283, "loss": 0.0331, "step": 186330 }, { "epoch": 1.2, "learning_rate": 0.00011959764291292589, "loss": 0.028, "step": 186340 }, { "epoch": 1.2, "learning_rate": 0.00011958796155856895, "loss": 0.0326, "step": 186350 }, { "epoch": 1.2, "learning_rate": 0.00011957828020421203, "loss": 0.0283, "step": 186360 }, { "epoch": 1.2, "learning_rate": 0.00011956859884985509, "loss": 0.0337, "step": 186370 }, { "epoch": 1.2, "learning_rate": 0.00011955891749549815, "loss": 0.0319, "step": 186380 }, { "epoch": 1.2, "learning_rate": 0.00011954923614114123, "loss": 0.0338, "step": 186390 }, { "epoch": 1.2, "learning_rate": 0.0001195395547867843, "loss": 0.0272, "step": 186400 }, { "epoch": 1.2, "learning_rate": 0.00011952987343242736, "loss": 0.0386, "step": 186410 }, { "epoch": 1.2, "learning_rate": 0.00011952019207807043, "loss": 0.0298, "step": 186420 }, { "epoch": 1.2, "learning_rate": 0.00011951051072371351, "loss": 0.0319, "step": 186430 }, { "epoch": 1.2, "learning_rate": 0.00011950082936935656, "loss": 0.0388, "step": 186440 }, { "epoch": 1.2, "learning_rate": 0.00011949114801499963, "loss": 0.0322, "step": 186450 }, { "epoch": 1.2, "learning_rate": 0.00011948146666064271, "loss": 0.0327, "step": 186460 }, { "epoch": 1.2, "learning_rate": 0.00011947178530628577, "loss": 0.0415, "step": 186470 }, { "epoch": 1.2, "learning_rate": 0.00011946210395192883, "loss": 0.0302, "step": 186480 }, { "epoch": 1.2, "learning_rate": 0.00011945242259757191, "loss": 0.0292, "step": 186490 }, { "epoch": 1.2, "learning_rate": 0.00011944274124321497, "loss": 0.0284, "step": 186500 }, { "epoch": 1.2, "learning_rate": 0.00011943305988885804, "loss": 0.031, "step": 186510 }, { "epoch": 1.2, "learning_rate": 0.0001194233785345011, "loss": 0.0364, "step": 186520 }, { "epoch": 1.2, "learning_rate": 0.00011941369718014419, "loss": 0.0361, "step": 186530 }, { "epoch": 1.2, "learning_rate": 0.00011940401582578725, "loss": 0.0367, "step": 186540 }, { "epoch": 1.2, "learning_rate": 0.0001193943344714303, "loss": 0.0315, "step": 186550 }, { "epoch": 1.2, "learning_rate": 0.00011938465311707338, "loss": 0.0348, "step": 186560 }, { "epoch": 1.2, "learning_rate": 0.00011937497176271645, "loss": 0.0352, "step": 186570 }, { "epoch": 1.2, "learning_rate": 0.0001193652904083595, "loss": 0.039, "step": 186580 }, { "epoch": 1.2, "learning_rate": 0.00011935560905400258, "loss": 0.0324, "step": 186590 }, { "epoch": 1.2, "learning_rate": 0.00011934592769964565, "loss": 0.0279, "step": 186600 }, { "epoch": 1.2, "learning_rate": 0.00011933624634528873, "loss": 0.0329, "step": 186610 }, { "epoch": 1.2, "learning_rate": 0.00011932656499093178, "loss": 0.0351, "step": 186620 }, { "epoch": 1.2, "learning_rate": 0.00011931688363657486, "loss": 0.0299, "step": 186630 }, { "epoch": 1.2, "learning_rate": 0.00011930720228221793, "loss": 0.0322, "step": 186640 }, { "epoch": 1.2, "learning_rate": 0.00011929752092786098, "loss": 0.0291, "step": 186650 }, { "epoch": 1.2, "learning_rate": 0.00011928783957350406, "loss": 0.0374, "step": 186660 }, { "epoch": 1.2, "learning_rate": 0.00011927815821914713, "loss": 0.035, "step": 186670 }, { "epoch": 1.2, "learning_rate": 0.0001192684768647902, "loss": 0.0298, "step": 186680 }, { "epoch": 1.2, "learning_rate": 0.00011925879551043326, "loss": 0.0306, "step": 186690 }, { "epoch": 1.21, "learning_rate": 0.00011924911415607633, "loss": 0.0281, "step": 186700 }, { "epoch": 1.21, "learning_rate": 0.0001192394328017194, "loss": 0.0321, "step": 186710 }, { "epoch": 1.21, "learning_rate": 0.00011922975144736246, "loss": 0.0386, "step": 186720 }, { "epoch": 1.21, "learning_rate": 0.00011922007009300554, "loss": 0.0346, "step": 186730 }, { "epoch": 1.21, "learning_rate": 0.0001192103887386486, "loss": 0.0302, "step": 186740 }, { "epoch": 1.21, "learning_rate": 0.00011920070738429168, "loss": 0.0317, "step": 186750 }, { "epoch": 1.21, "learning_rate": 0.00011919102602993474, "loss": 0.0317, "step": 186760 }, { "epoch": 1.21, "learning_rate": 0.0001191813446755778, "loss": 0.0324, "step": 186770 }, { "epoch": 1.21, "learning_rate": 0.00011917166332122088, "loss": 0.0301, "step": 186780 }, { "epoch": 1.21, "learning_rate": 0.00011916198196686393, "loss": 0.0299, "step": 186790 }, { "epoch": 1.21, "learning_rate": 0.000119152300612507, "loss": 0.0299, "step": 186800 }, { "epoch": 1.21, "learning_rate": 0.00011914261925815008, "loss": 0.0371, "step": 186810 }, { "epoch": 1.21, "learning_rate": 0.00011913293790379315, "loss": 0.0305, "step": 186820 }, { "epoch": 1.21, "learning_rate": 0.00011912325654943621, "loss": 0.0269, "step": 186830 }, { "epoch": 1.21, "learning_rate": 0.00011911357519507928, "loss": 0.0346, "step": 186840 }, { "epoch": 1.21, "learning_rate": 0.00011910389384072236, "loss": 0.0322, "step": 186850 }, { "epoch": 1.21, "learning_rate": 0.00011909421248636541, "loss": 0.0298, "step": 186860 }, { "epoch": 1.21, "learning_rate": 0.00011908453113200848, "loss": 0.0289, "step": 186870 }, { "epoch": 1.21, "learning_rate": 0.00011907484977765156, "loss": 0.0306, "step": 186880 }, { "epoch": 1.21, "learning_rate": 0.00011906516842329462, "loss": 0.0387, "step": 186890 }, { "epoch": 1.21, "learning_rate": 0.00011905548706893768, "loss": 0.034, "step": 186900 }, { "epoch": 1.21, "learning_rate": 0.00011904580571458076, "loss": 0.0293, "step": 186910 }, { "epoch": 1.21, "learning_rate": 0.00011903612436022382, "loss": 0.0292, "step": 186920 }, { "epoch": 1.21, "learning_rate": 0.00011902644300586689, "loss": 0.0311, "step": 186930 }, { "epoch": 1.21, "learning_rate": 0.00011901676165150996, "loss": 0.0328, "step": 186940 }, { "epoch": 1.21, "learning_rate": 0.00011900708029715304, "loss": 0.0312, "step": 186950 }, { "epoch": 1.21, "learning_rate": 0.0001189973989427961, "loss": 0.0337, "step": 186960 }, { "epoch": 1.21, "learning_rate": 0.00011898771758843915, "loss": 0.0291, "step": 186970 }, { "epoch": 1.21, "learning_rate": 0.00011897803623408223, "loss": 0.0285, "step": 186980 }, { "epoch": 1.21, "learning_rate": 0.0001189683548797253, "loss": 0.0328, "step": 186990 }, { "epoch": 1.21, "learning_rate": 0.00011895867352536835, "loss": 0.0305, "step": 187000 }, { "epoch": 1.21, "eval_cer": 0.9199005762060785, "eval_loss": 0.022978171706199646, "eval_runtime": 120.5367, "eval_samples_per_second": 16.592, "eval_steps_per_second": 4.148, "step": 187000 }, { "epoch": 1.21, "learning_rate": 0.00011894899217101143, "loss": 0.032, "step": 187010 }, { "epoch": 1.21, "learning_rate": 0.0001189393108166545, "loss": 0.03, "step": 187020 }, { "epoch": 1.21, "learning_rate": 0.00011892962946229758, "loss": 0.0314, "step": 187030 }, { "epoch": 1.21, "learning_rate": 0.00011891994810794063, "loss": 0.032, "step": 187040 }, { "epoch": 1.21, "learning_rate": 0.00011891026675358371, "loss": 0.0337, "step": 187050 }, { "epoch": 1.21, "learning_rate": 0.00011890058539922678, "loss": 0.0295, "step": 187060 }, { "epoch": 1.21, "learning_rate": 0.00011889090404486983, "loss": 0.0301, "step": 187070 }, { "epoch": 1.21, "learning_rate": 0.00011888122269051291, "loss": 0.0365, "step": 187080 }, { "epoch": 1.21, "learning_rate": 0.00011887154133615598, "loss": 0.0293, "step": 187090 }, { "epoch": 1.21, "learning_rate": 0.00011886185998179906, "loss": 0.0329, "step": 187100 }, { "epoch": 1.21, "learning_rate": 0.00011885217862744211, "loss": 0.0341, "step": 187110 }, { "epoch": 1.21, "learning_rate": 0.00011884249727308517, "loss": 0.0353, "step": 187120 }, { "epoch": 1.21, "learning_rate": 0.00011883281591872825, "loss": 0.0413, "step": 187130 }, { "epoch": 1.21, "learning_rate": 0.00011882313456437131, "loss": 0.0292, "step": 187140 }, { "epoch": 1.21, "learning_rate": 0.00011881345321001439, "loss": 0.0378, "step": 187150 }, { "epoch": 1.21, "learning_rate": 0.00011880377185565745, "loss": 0.0304, "step": 187160 }, { "epoch": 1.21, "learning_rate": 0.00011879409050130052, "loss": 0.0306, "step": 187170 }, { "epoch": 1.21, "learning_rate": 0.00011878440914694359, "loss": 0.0327, "step": 187180 }, { "epoch": 1.21, "learning_rate": 0.00011877472779258665, "loss": 0.0355, "step": 187190 }, { "epoch": 1.21, "learning_rate": 0.00011876504643822973, "loss": 0.0312, "step": 187200 }, { "epoch": 1.21, "learning_rate": 0.00011875536508387278, "loss": 0.0302, "step": 187210 }, { "epoch": 1.21, "learning_rate": 0.00011874568372951585, "loss": 0.0293, "step": 187220 }, { "epoch": 1.21, "learning_rate": 0.00011873600237515893, "loss": 0.0271, "step": 187230 }, { "epoch": 1.21, "learning_rate": 0.000118726321020802, "loss": 0.0285, "step": 187240 }, { "epoch": 1.21, "learning_rate": 0.00011871663966644506, "loss": 0.0345, "step": 187250 }, { "epoch": 1.21, "learning_rate": 0.00011870695831208813, "loss": 0.0289, "step": 187260 }, { "epoch": 1.21, "learning_rate": 0.0001186972769577312, "loss": 0.032, "step": 187270 }, { "epoch": 1.21, "learning_rate": 0.00011868759560337426, "loss": 0.0318, "step": 187280 }, { "epoch": 1.21, "learning_rate": 0.00011867791424901733, "loss": 0.0303, "step": 187290 }, { "epoch": 1.21, "learning_rate": 0.00011866823289466041, "loss": 0.0281, "step": 187300 }, { "epoch": 1.21, "learning_rate": 0.00011865855154030347, "loss": 0.0318, "step": 187310 }, { "epoch": 1.21, "learning_rate": 0.00011864887018594653, "loss": 0.0291, "step": 187320 }, { "epoch": 1.21, "learning_rate": 0.0001186391888315896, "loss": 0.0374, "step": 187330 }, { "epoch": 1.21, "learning_rate": 0.00011862950747723267, "loss": 0.0318, "step": 187340 }, { "epoch": 1.21, "learning_rate": 0.00011861982612287574, "loss": 0.0295, "step": 187350 }, { "epoch": 1.21, "learning_rate": 0.0001186101447685188, "loss": 0.0311, "step": 187360 }, { "epoch": 1.21, "learning_rate": 0.00011860046341416187, "loss": 0.0315, "step": 187370 }, { "epoch": 1.21, "learning_rate": 0.00011859078205980495, "loss": 0.0301, "step": 187380 }, { "epoch": 1.21, "learning_rate": 0.000118581100705448, "loss": 0.0306, "step": 187390 }, { "epoch": 1.21, "learning_rate": 0.00011857141935109108, "loss": 0.031, "step": 187400 }, { "epoch": 1.21, "learning_rate": 0.00011856173799673415, "loss": 0.0319, "step": 187410 }, { "epoch": 1.21, "learning_rate": 0.0001185520566423772, "loss": 0.0328, "step": 187420 }, { "epoch": 1.21, "learning_rate": 0.00011854237528802028, "loss": 0.0308, "step": 187430 }, { "epoch": 1.21, "learning_rate": 0.00011853269393366335, "loss": 0.028, "step": 187440 }, { "epoch": 1.21, "learning_rate": 0.00011852301257930643, "loss": 0.0365, "step": 187450 }, { "epoch": 1.21, "learning_rate": 0.00011851333122494948, "loss": 0.0295, "step": 187460 }, { "epoch": 1.21, "learning_rate": 0.00011850364987059255, "loss": 0.0292, "step": 187470 }, { "epoch": 1.21, "learning_rate": 0.00011849396851623563, "loss": 0.0331, "step": 187480 }, { "epoch": 1.21, "learning_rate": 0.00011848428716187868, "loss": 0.0343, "step": 187490 }, { "epoch": 1.21, "learning_rate": 0.00011847460580752176, "loss": 0.0362, "step": 187500 }, { "epoch": 1.21, "learning_rate": 0.00011846492445316483, "loss": 0.0317, "step": 187510 }, { "epoch": 1.21, "learning_rate": 0.0001184552430988079, "loss": 0.036, "step": 187520 }, { "epoch": 1.21, "learning_rate": 0.00011844556174445096, "loss": 0.0354, "step": 187530 }, { "epoch": 1.21, "learning_rate": 0.00011843588039009402, "loss": 0.0262, "step": 187540 }, { "epoch": 1.21, "learning_rate": 0.0001184261990357371, "loss": 0.0395, "step": 187550 }, { "epoch": 1.21, "learning_rate": 0.00011841651768138016, "loss": 0.0259, "step": 187560 }, { "epoch": 1.21, "learning_rate": 0.00011840683632702322, "loss": 0.0347, "step": 187570 }, { "epoch": 1.21, "learning_rate": 0.0001183971549726663, "loss": 0.0322, "step": 187580 }, { "epoch": 1.21, "learning_rate": 0.00011838747361830937, "loss": 0.0336, "step": 187590 }, { "epoch": 1.21, "learning_rate": 0.00011837779226395244, "loss": 0.0297, "step": 187600 }, { "epoch": 1.21, "learning_rate": 0.0001183681109095955, "loss": 0.0346, "step": 187610 }, { "epoch": 1.21, "learning_rate": 0.00011835842955523858, "loss": 0.0322, "step": 187620 }, { "epoch": 1.21, "learning_rate": 0.00011834874820088163, "loss": 0.0362, "step": 187630 }, { "epoch": 1.21, "learning_rate": 0.0001183390668465247, "loss": 0.0392, "step": 187640 }, { "epoch": 1.21, "learning_rate": 0.00011832938549216778, "loss": 0.0327, "step": 187650 }, { "epoch": 1.21, "learning_rate": 0.00011831970413781083, "loss": 0.0291, "step": 187660 }, { "epoch": 1.21, "learning_rate": 0.0001183100227834539, "loss": 0.037, "step": 187670 }, { "epoch": 1.21, "learning_rate": 0.00011830034142909698, "loss": 0.0371, "step": 187680 }, { "epoch": 1.21, "learning_rate": 0.00011829066007474005, "loss": 0.0346, "step": 187690 }, { "epoch": 1.21, "learning_rate": 0.00011828097872038311, "loss": 0.0324, "step": 187700 }, { "epoch": 1.21, "learning_rate": 0.00011827129736602618, "loss": 0.0315, "step": 187710 }, { "epoch": 1.21, "learning_rate": 0.00011826161601166926, "loss": 0.034, "step": 187720 }, { "epoch": 1.21, "learning_rate": 0.00011825193465731231, "loss": 0.0331, "step": 187730 }, { "epoch": 1.21, "learning_rate": 0.00011824225330295538, "loss": 0.032, "step": 187740 }, { "epoch": 1.21, "learning_rate": 0.00011823257194859846, "loss": 0.0246, "step": 187750 }, { "epoch": 1.21, "learning_rate": 0.00011822289059424152, "loss": 0.0339, "step": 187760 }, { "epoch": 1.21, "learning_rate": 0.00011821320923988458, "loss": 0.0356, "step": 187770 }, { "epoch": 1.21, "learning_rate": 0.00011820352788552766, "loss": 0.0318, "step": 187780 }, { "epoch": 1.21, "learning_rate": 0.00011819384653117072, "loss": 0.0319, "step": 187790 }, { "epoch": 1.21, "learning_rate": 0.00011818416517681379, "loss": 0.0333, "step": 187800 }, { "epoch": 1.21, "learning_rate": 0.00011817448382245685, "loss": 0.0373, "step": 187810 }, { "epoch": 1.21, "learning_rate": 0.00011816480246809993, "loss": 0.0285, "step": 187820 }, { "epoch": 1.21, "learning_rate": 0.000118155121113743, "loss": 0.0344, "step": 187830 }, { "epoch": 1.21, "learning_rate": 0.00011814543975938605, "loss": 0.0305, "step": 187840 }, { "epoch": 1.21, "learning_rate": 0.00011813575840502913, "loss": 0.0311, "step": 187850 }, { "epoch": 1.21, "learning_rate": 0.0001181260770506722, "loss": 0.0328, "step": 187860 }, { "epoch": 1.21, "learning_rate": 0.00011811639569631525, "loss": 0.0329, "step": 187870 }, { "epoch": 1.21, "learning_rate": 0.00011810671434195833, "loss": 0.0296, "step": 187880 }, { "epoch": 1.21, "learning_rate": 0.0001180970329876014, "loss": 0.0322, "step": 187890 }, { "epoch": 1.21, "learning_rate": 0.00011808735163324448, "loss": 0.0362, "step": 187900 }, { "epoch": 1.21, "learning_rate": 0.00011807767027888753, "loss": 0.0363, "step": 187910 }, { "epoch": 1.21, "learning_rate": 0.00011806798892453061, "loss": 0.0314, "step": 187920 }, { "epoch": 1.21, "learning_rate": 0.00011805830757017368, "loss": 0.0317, "step": 187930 }, { "epoch": 1.21, "learning_rate": 0.00011804862621581673, "loss": 0.0288, "step": 187940 }, { "epoch": 1.21, "learning_rate": 0.00011803894486145981, "loss": 0.0295, "step": 187950 }, { "epoch": 1.21, "learning_rate": 0.00011802926350710287, "loss": 0.0305, "step": 187960 }, { "epoch": 1.21, "learning_rate": 0.00011801958215274595, "loss": 0.0346, "step": 187970 }, { "epoch": 1.21, "learning_rate": 0.00011800990079838901, "loss": 0.0318, "step": 187980 }, { "epoch": 1.21, "learning_rate": 0.00011800021944403207, "loss": 0.0301, "step": 187990 }, { "epoch": 1.21, "learning_rate": 0.00011799053808967515, "loss": 0.0376, "step": 188000 }, { "epoch": 1.21, "eval_cer": 0.9199258840808948, "eval_loss": 0.022766409441828728, "eval_runtime": 120.0519, "eval_samples_per_second": 16.659, "eval_steps_per_second": 4.165, "step": 188000 }, { "epoch": 1.21, "learning_rate": 0.0001179808567353182, "loss": 0.0315, "step": 188010 }, { "epoch": 1.21, "learning_rate": 0.00011797117538096129, "loss": 0.0358, "step": 188020 }, { "epoch": 1.21, "learning_rate": 0.00011796149402660435, "loss": 0.0336, "step": 188030 }, { "epoch": 1.21, "learning_rate": 0.00011795181267224743, "loss": 0.0348, "step": 188040 }, { "epoch": 1.21, "learning_rate": 0.00011794213131789048, "loss": 0.0289, "step": 188050 }, { "epoch": 1.21, "learning_rate": 0.00011793244996353355, "loss": 0.0286, "step": 188060 }, { "epoch": 1.21, "learning_rate": 0.00011792276860917663, "loss": 0.0313, "step": 188070 }, { "epoch": 1.21, "learning_rate": 0.00011791308725481968, "loss": 0.03, "step": 188080 }, { "epoch": 1.21, "learning_rate": 0.00011790340590046275, "loss": 0.0362, "step": 188090 }, { "epoch": 1.21, "learning_rate": 0.00011789372454610583, "loss": 0.0354, "step": 188100 }, { "epoch": 1.21, "learning_rate": 0.0001178840431917489, "loss": 0.0331, "step": 188110 }, { "epoch": 1.21, "learning_rate": 0.00011787436183739196, "loss": 0.0279, "step": 188120 }, { "epoch": 1.21, "learning_rate": 0.00011786468048303503, "loss": 0.0334, "step": 188130 }, { "epoch": 1.21, "learning_rate": 0.00011785499912867811, "loss": 0.0354, "step": 188140 }, { "epoch": 1.21, "learning_rate": 0.00011784531777432116, "loss": 0.0314, "step": 188150 }, { "epoch": 1.21, "learning_rate": 0.00011783563641996423, "loss": 0.0332, "step": 188160 }, { "epoch": 1.21, "learning_rate": 0.0001178259550656073, "loss": 0.0364, "step": 188170 }, { "epoch": 1.21, "learning_rate": 0.00011781627371125037, "loss": 0.0289, "step": 188180 }, { "epoch": 1.21, "learning_rate": 0.00011780659235689343, "loss": 0.0305, "step": 188190 }, { "epoch": 1.21, "learning_rate": 0.0001177969110025365, "loss": 0.0285, "step": 188200 }, { "epoch": 1.21, "learning_rate": 0.00011778722964817957, "loss": 0.0306, "step": 188210 }, { "epoch": 1.21, "learning_rate": 0.00011777754829382264, "loss": 0.0303, "step": 188220 }, { "epoch": 1.21, "learning_rate": 0.0001177678669394657, "loss": 0.0353, "step": 188230 }, { "epoch": 1.21, "learning_rate": 0.00011775818558510878, "loss": 0.0282, "step": 188240 }, { "epoch": 1.22, "learning_rate": 0.00011774850423075185, "loss": 0.0334, "step": 188250 }, { "epoch": 1.22, "learning_rate": 0.0001177388228763949, "loss": 0.0308, "step": 188260 }, { "epoch": 1.22, "learning_rate": 0.00011772914152203798, "loss": 0.0302, "step": 188270 }, { "epoch": 1.22, "learning_rate": 0.00011771946016768105, "loss": 0.0296, "step": 188280 }, { "epoch": 1.22, "learning_rate": 0.0001177097788133241, "loss": 0.0301, "step": 188290 }, { "epoch": 1.22, "learning_rate": 0.00011770009745896718, "loss": 0.0328, "step": 188300 }, { "epoch": 1.22, "learning_rate": 0.00011769041610461025, "loss": 0.0325, "step": 188310 }, { "epoch": 1.22, "learning_rate": 0.00011768073475025333, "loss": 0.0297, "step": 188320 }, { "epoch": 1.22, "learning_rate": 0.00011767105339589638, "loss": 0.0341, "step": 188330 }, { "epoch": 1.22, "learning_rate": 0.00011766137204153946, "loss": 0.0299, "step": 188340 }, { "epoch": 1.22, "learning_rate": 0.00011765169068718253, "loss": 0.0347, "step": 188350 }, { "epoch": 1.22, "learning_rate": 0.00011764200933282558, "loss": 0.033, "step": 188360 }, { "epoch": 1.22, "learning_rate": 0.00011763232797846866, "loss": 0.0292, "step": 188370 }, { "epoch": 1.22, "learning_rate": 0.00011762264662411172, "loss": 0.0309, "step": 188380 }, { "epoch": 1.22, "learning_rate": 0.0001176129652697548, "loss": 0.0299, "step": 188390 }, { "epoch": 1.22, "learning_rate": 0.00011760328391539786, "loss": 0.0385, "step": 188400 }, { "epoch": 1.22, "learning_rate": 0.00011759360256104092, "loss": 0.0317, "step": 188410 }, { "epoch": 1.22, "learning_rate": 0.000117583921206684, "loss": 0.0332, "step": 188420 }, { "epoch": 1.22, "learning_rate": 0.00011757423985232706, "loss": 0.0263, "step": 188430 }, { "epoch": 1.22, "learning_rate": 0.00011756455849797014, "loss": 0.0341, "step": 188440 }, { "epoch": 1.22, "learning_rate": 0.0001175548771436132, "loss": 0.0313, "step": 188450 }, { "epoch": 1.22, "learning_rate": 0.00011754519578925627, "loss": 0.0258, "step": 188460 }, { "epoch": 1.22, "learning_rate": 0.00011753551443489933, "loss": 0.0297, "step": 188470 }, { "epoch": 1.22, "learning_rate": 0.0001175258330805424, "loss": 0.0309, "step": 188480 }, { "epoch": 1.22, "learning_rate": 0.00011751615172618548, "loss": 0.0284, "step": 188490 }, { "epoch": 1.22, "learning_rate": 0.00011750647037182853, "loss": 0.0296, "step": 188500 }, { "epoch": 1.22, "learning_rate": 0.0001174967890174716, "loss": 0.033, "step": 188510 }, { "epoch": 1.22, "learning_rate": 0.00011748710766311468, "loss": 0.029, "step": 188520 }, { "epoch": 1.22, "learning_rate": 0.00011747742630875775, "loss": 0.0327, "step": 188530 }, { "epoch": 1.22, "learning_rate": 0.00011746774495440081, "loss": 0.031, "step": 188540 }, { "epoch": 1.22, "learning_rate": 0.00011745806360004388, "loss": 0.0331, "step": 188550 }, { "epoch": 1.22, "learning_rate": 0.00011744838224568694, "loss": 0.0315, "step": 188560 }, { "epoch": 1.22, "learning_rate": 0.00011743870089133001, "loss": 0.0288, "step": 188570 }, { "epoch": 1.22, "learning_rate": 0.00011742901953697308, "loss": 0.0347, "step": 188580 }, { "epoch": 1.22, "learning_rate": 0.00011741933818261616, "loss": 0.0345, "step": 188590 }, { "epoch": 1.22, "learning_rate": 0.00011740965682825922, "loss": 0.034, "step": 188600 }, { "epoch": 1.22, "learning_rate": 0.00011739997547390228, "loss": 0.0291, "step": 188610 }, { "epoch": 1.22, "learning_rate": 0.00011739029411954535, "loss": 0.0347, "step": 188620 }, { "epoch": 1.22, "learning_rate": 0.00011738061276518842, "loss": 0.0285, "step": 188630 }, { "epoch": 1.22, "learning_rate": 0.00011737093141083149, "loss": 0.0361, "step": 188640 }, { "epoch": 1.22, "learning_rate": 0.00011736125005647455, "loss": 0.0358, "step": 188650 }, { "epoch": 1.22, "learning_rate": 0.00011735156870211762, "loss": 0.0298, "step": 188660 }, { "epoch": 1.22, "learning_rate": 0.0001173418873477607, "loss": 0.0311, "step": 188670 }, { "epoch": 1.22, "learning_rate": 0.00011733220599340375, "loss": 0.0274, "step": 188680 }, { "epoch": 1.22, "learning_rate": 0.00011732252463904683, "loss": 0.037, "step": 188690 }, { "epoch": 1.22, "learning_rate": 0.0001173128432846899, "loss": 0.0329, "step": 188700 }, { "epoch": 1.22, "learning_rate": 0.00011730316193033295, "loss": 0.0321, "step": 188710 }, { "epoch": 1.22, "learning_rate": 0.00011729348057597603, "loss": 0.0312, "step": 188720 }, { "epoch": 1.22, "learning_rate": 0.0001172837992216191, "loss": 0.0331, "step": 188730 }, { "epoch": 1.22, "learning_rate": 0.00011727411786726218, "loss": 0.0331, "step": 188740 }, { "epoch": 1.22, "learning_rate": 0.00011726443651290523, "loss": 0.037, "step": 188750 }, { "epoch": 1.22, "learning_rate": 0.00011725475515854831, "loss": 0.0368, "step": 188760 }, { "epoch": 1.22, "learning_rate": 0.00011724507380419138, "loss": 0.0305, "step": 188770 }, { "epoch": 1.22, "learning_rate": 0.00011723539244983443, "loss": 0.0361, "step": 188780 }, { "epoch": 1.22, "learning_rate": 0.00011722571109547751, "loss": 0.0255, "step": 188790 }, { "epoch": 1.22, "learning_rate": 0.00011721602974112057, "loss": 0.039, "step": 188800 }, { "epoch": 1.22, "learning_rate": 0.00011720634838676365, "loss": 0.0334, "step": 188810 }, { "epoch": 1.22, "learning_rate": 0.0001171966670324067, "loss": 0.0359, "step": 188820 }, { "epoch": 1.22, "learning_rate": 0.00011718698567804977, "loss": 0.0302, "step": 188830 }, { "epoch": 1.22, "learning_rate": 0.00011717730432369285, "loss": 0.0276, "step": 188840 }, { "epoch": 1.22, "learning_rate": 0.0001171676229693359, "loss": 0.0349, "step": 188850 }, { "epoch": 1.22, "learning_rate": 0.00011715794161497899, "loss": 0.0358, "step": 188860 }, { "epoch": 1.22, "learning_rate": 0.00011714826026062205, "loss": 0.0313, "step": 188870 }, { "epoch": 1.22, "learning_rate": 0.00011713857890626512, "loss": 0.0342, "step": 188880 }, { "epoch": 1.22, "learning_rate": 0.00011712889755190818, "loss": 0.0257, "step": 188890 }, { "epoch": 1.22, "learning_rate": 0.00011711921619755125, "loss": 0.031, "step": 188900 }, { "epoch": 1.22, "learning_rate": 0.00011710953484319433, "loss": 0.031, "step": 188910 }, { "epoch": 1.22, "learning_rate": 0.00011709985348883738, "loss": 0.0251, "step": 188920 }, { "epoch": 1.22, "learning_rate": 0.00011709017213448045, "loss": 0.0294, "step": 188930 }, { "epoch": 1.22, "learning_rate": 0.00011708049078012353, "loss": 0.0326, "step": 188940 }, { "epoch": 1.22, "learning_rate": 0.0001170708094257666, "loss": 0.0333, "step": 188950 }, { "epoch": 1.22, "learning_rate": 0.00011706112807140966, "loss": 0.0319, "step": 188960 }, { "epoch": 1.22, "learning_rate": 0.00011705144671705273, "loss": 0.026, "step": 188970 }, { "epoch": 1.22, "learning_rate": 0.0001170417653626958, "loss": 0.0325, "step": 188980 }, { "epoch": 1.22, "learning_rate": 0.00011703208400833886, "loss": 0.0325, "step": 188990 }, { "epoch": 1.22, "learning_rate": 0.00011702240265398193, "loss": 0.0338, "step": 189000 }, { "epoch": 1.22, "eval_cer": 0.9199575189244154, "eval_loss": 0.02248038910329342, "eval_runtime": 120.1814, "eval_samples_per_second": 16.642, "eval_steps_per_second": 4.16, "step": 189000 }, { "epoch": 1.22, "learning_rate": 0.000117012721299625, "loss": 0.0337, "step": 189010 }, { "epoch": 1.22, "learning_rate": 0.00011700303994526807, "loss": 0.0304, "step": 189020 }, { "epoch": 1.22, "learning_rate": 0.00011699335859091112, "loss": 0.0317, "step": 189030 }, { "epoch": 1.22, "learning_rate": 0.0001169836772365542, "loss": 0.0345, "step": 189040 }, { "epoch": 1.22, "learning_rate": 0.00011697399588219727, "loss": 0.0378, "step": 189050 }, { "epoch": 1.22, "learning_rate": 0.00011696431452784034, "loss": 0.0291, "step": 189060 }, { "epoch": 1.22, "learning_rate": 0.0001169546331734834, "loss": 0.0362, "step": 189070 }, { "epoch": 1.22, "learning_rate": 0.00011694495181912647, "loss": 0.0331, "step": 189080 }, { "epoch": 1.22, "learning_rate": 0.00011693527046476955, "loss": 0.0343, "step": 189090 }, { "epoch": 1.22, "learning_rate": 0.0001169255891104126, "loss": 0.0334, "step": 189100 }, { "epoch": 1.22, "learning_rate": 0.00011691590775605568, "loss": 0.0376, "step": 189110 }, { "epoch": 1.22, "learning_rate": 0.00011690622640169875, "loss": 0.031, "step": 189120 }, { "epoch": 1.22, "learning_rate": 0.0001168965450473418, "loss": 0.0347, "step": 189130 }, { "epoch": 1.22, "learning_rate": 0.00011688686369298488, "loss": 0.0268, "step": 189140 }, { "epoch": 1.22, "learning_rate": 0.00011687718233862795, "loss": 0.0298, "step": 189150 }, { "epoch": 1.22, "learning_rate": 0.00011686750098427103, "loss": 0.0329, "step": 189160 }, { "epoch": 1.22, "learning_rate": 0.00011685781962991408, "loss": 0.0338, "step": 189170 }, { "epoch": 1.22, "learning_rate": 0.00011684813827555715, "loss": 0.0336, "step": 189180 }, { "epoch": 1.22, "learning_rate": 0.00011683845692120023, "loss": 0.0338, "step": 189190 }, { "epoch": 1.22, "learning_rate": 0.00011682877556684328, "loss": 0.0298, "step": 189200 }, { "epoch": 1.22, "learning_rate": 0.00011681909421248636, "loss": 0.0252, "step": 189210 }, { "epoch": 1.22, "learning_rate": 0.00011680941285812942, "loss": 0.0349, "step": 189220 }, { "epoch": 1.22, "learning_rate": 0.0001167997315037725, "loss": 0.0306, "step": 189230 }, { "epoch": 1.22, "learning_rate": 0.00011679005014941556, "loss": 0.0293, "step": 189240 }, { "epoch": 1.22, "learning_rate": 0.00011678036879505862, "loss": 0.029, "step": 189250 }, { "epoch": 1.22, "learning_rate": 0.0001167706874407017, "loss": 0.0261, "step": 189260 }, { "epoch": 1.22, "learning_rate": 0.00011676100608634476, "loss": 0.028, "step": 189270 }, { "epoch": 1.22, "learning_rate": 0.00011675132473198782, "loss": 0.0272, "step": 189280 }, { "epoch": 1.22, "learning_rate": 0.0001167416433776309, "loss": 0.0305, "step": 189290 }, { "epoch": 1.22, "learning_rate": 0.00011673196202327397, "loss": 0.0314, "step": 189300 }, { "epoch": 1.22, "learning_rate": 0.00011672228066891703, "loss": 0.0278, "step": 189310 }, { "epoch": 1.22, "learning_rate": 0.0001167125993145601, "loss": 0.0285, "step": 189320 }, { "epoch": 1.22, "learning_rate": 0.00011670291796020318, "loss": 0.0351, "step": 189330 }, { "epoch": 1.22, "learning_rate": 0.00011669323660584623, "loss": 0.031, "step": 189340 }, { "epoch": 1.22, "learning_rate": 0.0001166835552514893, "loss": 0.0306, "step": 189350 }, { "epoch": 1.22, "learning_rate": 0.00011667387389713238, "loss": 0.029, "step": 189360 }, { "epoch": 1.22, "learning_rate": 0.00011666419254277544, "loss": 0.0303, "step": 189370 }, { "epoch": 1.22, "learning_rate": 0.0001166545111884185, "loss": 0.0286, "step": 189380 }, { "epoch": 1.22, "learning_rate": 0.00011664482983406158, "loss": 0.0327, "step": 189390 }, { "epoch": 1.22, "learning_rate": 0.00011663514847970464, "loss": 0.0302, "step": 189400 }, { "epoch": 1.22, "learning_rate": 0.00011662546712534771, "loss": 0.0346, "step": 189410 }, { "epoch": 1.22, "learning_rate": 0.00011661578577099078, "loss": 0.029, "step": 189420 }, { "epoch": 1.22, "learning_rate": 0.00011660610441663386, "loss": 0.0311, "step": 189430 }, { "epoch": 1.22, "learning_rate": 0.00011659642306227692, "loss": 0.0278, "step": 189440 }, { "epoch": 1.22, "learning_rate": 0.00011658674170791997, "loss": 0.0364, "step": 189450 }, { "epoch": 1.22, "learning_rate": 0.00011657706035356305, "loss": 0.0292, "step": 189460 }, { "epoch": 1.22, "learning_rate": 0.00011656737899920612, "loss": 0.0288, "step": 189470 }, { "epoch": 1.22, "learning_rate": 0.00011655769764484917, "loss": 0.0257, "step": 189480 }, { "epoch": 1.22, "learning_rate": 0.00011654801629049225, "loss": 0.0292, "step": 189490 }, { "epoch": 1.22, "learning_rate": 0.00011653833493613532, "loss": 0.0333, "step": 189500 }, { "epoch": 1.22, "learning_rate": 0.0001165286535817784, "loss": 0.0262, "step": 189510 }, { "epoch": 1.22, "learning_rate": 0.00011651897222742145, "loss": 0.0319, "step": 189520 }, { "epoch": 1.22, "learning_rate": 0.00011650929087306453, "loss": 0.0311, "step": 189530 }, { "epoch": 1.22, "learning_rate": 0.0001164996095187076, "loss": 0.0356, "step": 189540 }, { "epoch": 1.22, "learning_rate": 0.00011648992816435065, "loss": 0.0348, "step": 189550 }, { "epoch": 1.22, "learning_rate": 0.00011648024680999373, "loss": 0.0348, "step": 189560 }, { "epoch": 1.22, "learning_rate": 0.0001164705654556368, "loss": 0.0348, "step": 189570 }, { "epoch": 1.22, "learning_rate": 0.00011646088410127988, "loss": 0.0281, "step": 189580 }, { "epoch": 1.22, "learning_rate": 0.00011645120274692293, "loss": 0.0332, "step": 189590 }, { "epoch": 1.22, "learning_rate": 0.000116441521392566, "loss": 0.0315, "step": 189600 }, { "epoch": 1.22, "learning_rate": 0.00011643184003820908, "loss": 0.0273, "step": 189610 }, { "epoch": 1.22, "learning_rate": 0.00011642215868385213, "loss": 0.0365, "step": 189620 }, { "epoch": 1.22, "learning_rate": 0.00011641247732949521, "loss": 0.037, "step": 189630 }, { "epoch": 1.22, "learning_rate": 0.00011640279597513827, "loss": 0.0307, "step": 189640 }, { "epoch": 1.22, "learning_rate": 0.00011639311462078135, "loss": 0.0256, "step": 189650 }, { "epoch": 1.22, "learning_rate": 0.0001163834332664244, "loss": 0.0275, "step": 189660 }, { "epoch": 1.22, "learning_rate": 0.00011637375191206747, "loss": 0.0319, "step": 189670 }, { "epoch": 1.22, "learning_rate": 0.00011636407055771055, "loss": 0.0325, "step": 189680 }, { "epoch": 1.22, "learning_rate": 0.0001163543892033536, "loss": 0.0401, "step": 189690 }, { "epoch": 1.22, "learning_rate": 0.00011634470784899667, "loss": 0.0311, "step": 189700 }, { "epoch": 1.22, "learning_rate": 0.00011633502649463975, "loss": 0.0332, "step": 189710 }, { "epoch": 1.22, "learning_rate": 0.00011632534514028282, "loss": 0.031, "step": 189720 }, { "epoch": 1.22, "learning_rate": 0.00011631566378592588, "loss": 0.0307, "step": 189730 }, { "epoch": 1.22, "learning_rate": 0.00011630598243156895, "loss": 0.025, "step": 189740 }, { "epoch": 1.22, "learning_rate": 0.00011629630107721203, "loss": 0.0318, "step": 189750 }, { "epoch": 1.22, "learning_rate": 0.00011628661972285508, "loss": 0.0338, "step": 189760 }, { "epoch": 1.22, "learning_rate": 0.00011627693836849815, "loss": 0.0318, "step": 189770 }, { "epoch": 1.22, "learning_rate": 0.00011626725701414123, "loss": 0.0332, "step": 189780 }, { "epoch": 1.22, "learning_rate": 0.0001162575756597843, "loss": 0.0262, "step": 189790 }, { "epoch": 1.23, "learning_rate": 0.00011624789430542735, "loss": 0.032, "step": 189800 }, { "epoch": 1.23, "learning_rate": 0.00011623821295107043, "loss": 0.0337, "step": 189810 }, { "epoch": 1.23, "learning_rate": 0.0001162285315967135, "loss": 0.0263, "step": 189820 }, { "epoch": 1.23, "learning_rate": 0.00011621885024235656, "loss": 0.0325, "step": 189830 }, { "epoch": 1.23, "learning_rate": 0.00011620916888799963, "loss": 0.0377, "step": 189840 }, { "epoch": 1.23, "learning_rate": 0.0001161994875336427, "loss": 0.0291, "step": 189850 }, { "epoch": 1.23, "learning_rate": 0.00011618980617928577, "loss": 0.0298, "step": 189860 }, { "epoch": 1.23, "learning_rate": 0.00011618012482492882, "loss": 0.0301, "step": 189870 }, { "epoch": 1.23, "learning_rate": 0.0001161704434705719, "loss": 0.034, "step": 189880 }, { "epoch": 1.23, "learning_rate": 0.00011616076211621497, "loss": 0.0293, "step": 189890 }, { "epoch": 1.23, "learning_rate": 0.00011615108076185802, "loss": 0.0327, "step": 189900 }, { "epoch": 1.23, "learning_rate": 0.0001161413994075011, "loss": 0.0305, "step": 189910 }, { "epoch": 1.23, "learning_rate": 0.00011613171805314417, "loss": 0.0283, "step": 189920 }, { "epoch": 1.23, "learning_rate": 0.00011612203669878725, "loss": 0.0279, "step": 189930 }, { "epoch": 1.23, "learning_rate": 0.0001161123553444303, "loss": 0.0287, "step": 189940 }, { "epoch": 1.23, "learning_rate": 0.00011610267399007338, "loss": 0.0286, "step": 189950 }, { "epoch": 1.23, "learning_rate": 0.00011609299263571645, "loss": 0.0336, "step": 189960 }, { "epoch": 1.23, "learning_rate": 0.0001160833112813595, "loss": 0.0389, "step": 189970 }, { "epoch": 1.23, "learning_rate": 0.00011607362992700258, "loss": 0.0419, "step": 189980 }, { "epoch": 1.23, "learning_rate": 0.00011606394857264565, "loss": 0.0321, "step": 189990 }, { "epoch": 1.23, "learning_rate": 0.00011605426721828873, "loss": 0.0315, "step": 190000 }, { "epoch": 1.23, "eval_cer": 0.9198580951304938, "eval_loss": 0.02292782999575138, "eval_runtime": 120.2546, "eval_samples_per_second": 16.631, "eval_steps_per_second": 4.158, "step": 190000 }, { "epoch": 1.23, "learning_rate": 0.00011604458586393178, "loss": 0.0329, "step": 190010 }, { "epoch": 1.23, "learning_rate": 0.00011603490450957485, "loss": 0.0348, "step": 190020 }, { "epoch": 1.23, "learning_rate": 0.00011602522315521792, "loss": 0.0299, "step": 190030 }, { "epoch": 1.23, "learning_rate": 0.00011601554180086098, "loss": 0.0266, "step": 190040 }, { "epoch": 1.23, "learning_rate": 0.00011600586044650406, "loss": 0.0321, "step": 190050 }, { "epoch": 1.23, "learning_rate": 0.00011599617909214712, "loss": 0.0321, "step": 190060 }, { "epoch": 1.23, "learning_rate": 0.00011598649773779019, "loss": 0.0311, "step": 190070 }, { "epoch": 1.23, "learning_rate": 0.00011597681638343326, "loss": 0.0321, "step": 190080 }, { "epoch": 1.23, "learning_rate": 0.00011596713502907632, "loss": 0.0325, "step": 190090 }, { "epoch": 1.23, "learning_rate": 0.0001159574536747194, "loss": 0.0327, "step": 190100 }, { "epoch": 1.23, "learning_rate": 0.00011594777232036245, "loss": 0.0339, "step": 190110 }, { "epoch": 1.23, "learning_rate": 0.00011593809096600552, "loss": 0.0298, "step": 190120 }, { "epoch": 1.23, "learning_rate": 0.0001159284096116486, "loss": 0.0303, "step": 190130 }, { "epoch": 1.23, "learning_rate": 0.00011591872825729167, "loss": 0.0373, "step": 190140 }, { "epoch": 1.23, "learning_rate": 0.00011590904690293473, "loss": 0.0275, "step": 190150 }, { "epoch": 1.23, "learning_rate": 0.0001158993655485778, "loss": 0.0303, "step": 190160 }, { "epoch": 1.23, "learning_rate": 0.00011588968419422087, "loss": 0.0295, "step": 190170 }, { "epoch": 1.23, "learning_rate": 0.00011588000283986393, "loss": 0.0323, "step": 190180 }, { "epoch": 1.23, "learning_rate": 0.000115870321485507, "loss": 0.0301, "step": 190190 }, { "epoch": 1.23, "learning_rate": 0.00011586064013115008, "loss": 0.0276, "step": 190200 }, { "epoch": 1.23, "learning_rate": 0.00011585095877679314, "loss": 0.03, "step": 190210 }, { "epoch": 1.23, "learning_rate": 0.0001158412774224362, "loss": 0.0302, "step": 190220 }, { "epoch": 1.23, "learning_rate": 0.00011583159606807928, "loss": 0.0286, "step": 190230 }, { "epoch": 1.23, "learning_rate": 0.00011582191471372234, "loss": 0.0362, "step": 190240 }, { "epoch": 1.23, "learning_rate": 0.00011581223335936541, "loss": 0.0326, "step": 190250 }, { "epoch": 1.23, "learning_rate": 0.00011580255200500848, "loss": 0.0277, "step": 190260 }, { "epoch": 1.23, "learning_rate": 0.00011579287065065154, "loss": 0.0333, "step": 190270 }, { "epoch": 1.23, "learning_rate": 0.00011578318929629462, "loss": 0.0263, "step": 190280 }, { "epoch": 1.23, "learning_rate": 0.00011577350794193767, "loss": 0.0313, "step": 190290 }, { "epoch": 1.23, "learning_rate": 0.00011576382658758075, "loss": 0.0327, "step": 190300 }, { "epoch": 1.23, "learning_rate": 0.00011575414523322382, "loss": 0.0304, "step": 190310 }, { "epoch": 1.23, "learning_rate": 0.00011574446387886687, "loss": 0.0294, "step": 190320 }, { "epoch": 1.23, "learning_rate": 0.00011573478252450995, "loss": 0.0331, "step": 190330 }, { "epoch": 1.23, "learning_rate": 0.00011572510117015302, "loss": 0.0312, "step": 190340 }, { "epoch": 1.23, "learning_rate": 0.0001157154198157961, "loss": 0.0313, "step": 190350 }, { "epoch": 1.23, "learning_rate": 0.00011570573846143915, "loss": 0.0276, "step": 190360 }, { "epoch": 1.23, "learning_rate": 0.00011569605710708222, "loss": 0.036, "step": 190370 }, { "epoch": 1.23, "learning_rate": 0.0001156863757527253, "loss": 0.03, "step": 190380 }, { "epoch": 1.23, "learning_rate": 0.00011567669439836835, "loss": 0.0372, "step": 190390 }, { "epoch": 1.23, "learning_rate": 0.00011566701304401143, "loss": 0.0311, "step": 190400 }, { "epoch": 1.23, "learning_rate": 0.0001156573316896545, "loss": 0.0343, "step": 190410 }, { "epoch": 1.23, "learning_rate": 0.00011564765033529758, "loss": 0.0321, "step": 190420 }, { "epoch": 1.23, "learning_rate": 0.00011563796898094063, "loss": 0.0268, "step": 190430 }, { "epoch": 1.23, "learning_rate": 0.0001156282876265837, "loss": 0.0314, "step": 190440 }, { "epoch": 1.23, "learning_rate": 0.00011561860627222677, "loss": 0.0317, "step": 190450 }, { "epoch": 1.23, "learning_rate": 0.00011560892491786983, "loss": 0.0358, "step": 190460 }, { "epoch": 1.23, "learning_rate": 0.0001155992435635129, "loss": 0.0299, "step": 190470 }, { "epoch": 1.23, "learning_rate": 0.00011558956220915597, "loss": 0.0321, "step": 190480 }, { "epoch": 1.23, "learning_rate": 0.00011557988085479904, "loss": 0.0276, "step": 190490 }, { "epoch": 1.23, "learning_rate": 0.0001155701995004421, "loss": 0.0286, "step": 190500 }, { "epoch": 1.23, "learning_rate": 0.00011556051814608517, "loss": 0.0311, "step": 190510 }, { "epoch": 1.23, "learning_rate": 0.00011555083679172825, "loss": 0.0261, "step": 190520 }, { "epoch": 1.23, "learning_rate": 0.0001155411554373713, "loss": 0.0327, "step": 190530 }, { "epoch": 1.23, "learning_rate": 0.00011553147408301437, "loss": 0.0291, "step": 190540 }, { "epoch": 1.23, "learning_rate": 0.00011552179272865745, "loss": 0.0328, "step": 190550 }, { "epoch": 1.23, "learning_rate": 0.00011551211137430052, "loss": 0.0327, "step": 190560 }, { "epoch": 1.23, "learning_rate": 0.00011550243001994357, "loss": 0.0308, "step": 190570 }, { "epoch": 1.23, "learning_rate": 0.00011549274866558665, "loss": 0.032, "step": 190580 }, { "epoch": 1.23, "learning_rate": 0.00011548306731122972, "loss": 0.0323, "step": 190590 }, { "epoch": 1.23, "learning_rate": 0.00011547338595687278, "loss": 0.0329, "step": 190600 }, { "epoch": 1.23, "learning_rate": 0.00011546370460251585, "loss": 0.0349, "step": 190610 }, { "epoch": 1.23, "learning_rate": 0.00011545402324815893, "loss": 0.0326, "step": 190620 }, { "epoch": 1.23, "learning_rate": 0.000115444341893802, "loss": 0.03, "step": 190630 }, { "epoch": 1.23, "learning_rate": 0.00011543466053944505, "loss": 0.0305, "step": 190640 }, { "epoch": 1.23, "learning_rate": 0.00011542497918508813, "loss": 0.0373, "step": 190650 }, { "epoch": 1.23, "learning_rate": 0.00011541529783073119, "loss": 0.0313, "step": 190660 }, { "epoch": 1.23, "learning_rate": 0.00011540561647637425, "loss": 0.0316, "step": 190670 }, { "epoch": 1.23, "learning_rate": 0.00011539593512201733, "loss": 0.0304, "step": 190680 }, { "epoch": 1.23, "learning_rate": 0.00011538625376766039, "loss": 0.0322, "step": 190690 }, { "epoch": 1.23, "learning_rate": 0.00011537657241330347, "loss": 0.029, "step": 190700 }, { "epoch": 1.23, "learning_rate": 0.00011536689105894652, "loss": 0.0319, "step": 190710 }, { "epoch": 1.23, "learning_rate": 0.0001153572097045896, "loss": 0.0318, "step": 190720 }, { "epoch": 1.23, "learning_rate": 0.00011534752835023267, "loss": 0.0295, "step": 190730 }, { "epoch": 1.23, "learning_rate": 0.00011533784699587572, "loss": 0.0319, "step": 190740 }, { "epoch": 1.23, "learning_rate": 0.0001153281656415188, "loss": 0.0308, "step": 190750 }, { "epoch": 1.23, "learning_rate": 0.00011531848428716187, "loss": 0.0298, "step": 190760 }, { "epoch": 1.23, "learning_rate": 0.00011530880293280495, "loss": 0.0313, "step": 190770 }, { "epoch": 1.23, "learning_rate": 0.000115299121578448, "loss": 0.0338, "step": 190780 }, { "epoch": 1.23, "learning_rate": 0.00011528944022409107, "loss": 0.0387, "step": 190790 }, { "epoch": 1.23, "learning_rate": 0.00011527975886973415, "loss": 0.0272, "step": 190800 }, { "epoch": 1.23, "learning_rate": 0.0001152700775153772, "loss": 0.035, "step": 190810 }, { "epoch": 1.23, "learning_rate": 0.00011526039616102028, "loss": 0.0305, "step": 190820 }, { "epoch": 1.23, "learning_rate": 0.00011525071480666335, "loss": 0.0367, "step": 190830 }, { "epoch": 1.23, "learning_rate": 0.00011524103345230643, "loss": 0.0319, "step": 190840 }, { "epoch": 1.23, "learning_rate": 0.00011523135209794948, "loss": 0.0307, "step": 190850 }, { "epoch": 1.23, "learning_rate": 0.00011522167074359254, "loss": 0.0308, "step": 190860 }, { "epoch": 1.23, "learning_rate": 0.00011521198938923562, "loss": 0.0362, "step": 190870 }, { "epoch": 1.23, "learning_rate": 0.00011520230803487868, "loss": 0.0278, "step": 190880 }, { "epoch": 1.23, "learning_rate": 0.00011519262668052174, "loss": 0.0344, "step": 190890 }, { "epoch": 1.23, "learning_rate": 0.00011518294532616482, "loss": 0.0307, "step": 190900 }, { "epoch": 1.23, "learning_rate": 0.00011517326397180789, "loss": 0.0312, "step": 190910 }, { "epoch": 1.23, "learning_rate": 0.00011516358261745096, "loss": 0.0318, "step": 190920 }, { "epoch": 1.23, "learning_rate": 0.00011515390126309402, "loss": 0.0324, "step": 190930 }, { "epoch": 1.23, "learning_rate": 0.0001151442199087371, "loss": 0.0362, "step": 190940 }, { "epoch": 1.23, "learning_rate": 0.00011513453855438015, "loss": 0.0316, "step": 190950 }, { "epoch": 1.23, "learning_rate": 0.00011512485720002322, "loss": 0.0275, "step": 190960 }, { "epoch": 1.23, "learning_rate": 0.0001151151758456663, "loss": 0.0259, "step": 190970 }, { "epoch": 1.23, "learning_rate": 0.00011510549449130937, "loss": 0.0332, "step": 190980 }, { "epoch": 1.23, "learning_rate": 0.00011509581313695242, "loss": 0.0322, "step": 190990 }, { "epoch": 1.23, "learning_rate": 0.0001150861317825955, "loss": 0.0369, "step": 191000 }, { "epoch": 1.23, "eval_cer": 0.9199421534289911, "eval_loss": 0.022925306111574173, "eval_runtime": 120.1456, "eval_samples_per_second": 16.646, "eval_steps_per_second": 4.162, "step": 191000 }, { "epoch": 1.23, "learning_rate": 0.00011507645042823857, "loss": 0.0278, "step": 191010 }, { "epoch": 1.23, "learning_rate": 0.00011506676907388163, "loss": 0.0316, "step": 191020 }, { "epoch": 1.23, "learning_rate": 0.0001150570877195247, "loss": 0.0279, "step": 191030 }, { "epoch": 1.23, "learning_rate": 0.00011504740636516778, "loss": 0.0319, "step": 191040 }, { "epoch": 1.23, "learning_rate": 0.00011503772501081084, "loss": 0.0293, "step": 191050 }, { "epoch": 1.23, "learning_rate": 0.0001150280436564539, "loss": 0.0337, "step": 191060 }, { "epoch": 1.23, "learning_rate": 0.00011501836230209698, "loss": 0.0307, "step": 191070 }, { "epoch": 1.23, "learning_rate": 0.00011500868094774004, "loss": 0.0276, "step": 191080 }, { "epoch": 1.23, "learning_rate": 0.0001149989995933831, "loss": 0.0281, "step": 191090 }, { "epoch": 1.23, "learning_rate": 0.00011498931823902618, "loss": 0.0303, "step": 191100 }, { "epoch": 1.23, "learning_rate": 0.00011497963688466924, "loss": 0.0333, "step": 191110 }, { "epoch": 1.23, "learning_rate": 0.00011496995553031231, "loss": 0.0311, "step": 191120 }, { "epoch": 1.23, "learning_rate": 0.00011496027417595537, "loss": 0.0264, "step": 191130 }, { "epoch": 1.23, "learning_rate": 0.00011495059282159845, "loss": 0.0343, "step": 191140 }, { "epoch": 1.23, "learning_rate": 0.00011494091146724152, "loss": 0.0326, "step": 191150 }, { "epoch": 1.23, "learning_rate": 0.00011493123011288457, "loss": 0.0276, "step": 191160 }, { "epoch": 1.23, "learning_rate": 0.00011492154875852765, "loss": 0.0376, "step": 191170 }, { "epoch": 1.23, "learning_rate": 0.00011491186740417072, "loss": 0.0362, "step": 191180 }, { "epoch": 1.23, "learning_rate": 0.00011490218604981377, "loss": 0.032, "step": 191190 }, { "epoch": 1.23, "learning_rate": 0.00011489250469545685, "loss": 0.0307, "step": 191200 }, { "epoch": 1.23, "learning_rate": 0.00011488282334109992, "loss": 0.0332, "step": 191210 }, { "epoch": 1.23, "learning_rate": 0.000114873141986743, "loss": 0.042, "step": 191220 }, { "epoch": 1.23, "learning_rate": 0.00011486346063238605, "loss": 0.0345, "step": 191230 }, { "epoch": 1.23, "learning_rate": 0.00011485377927802913, "loss": 0.0305, "step": 191240 }, { "epoch": 1.23, "learning_rate": 0.0001148440979236722, "loss": 0.032, "step": 191250 }, { "epoch": 1.23, "learning_rate": 0.00011483441656931525, "loss": 0.0356, "step": 191260 }, { "epoch": 1.23, "learning_rate": 0.00011482473521495833, "loss": 0.0324, "step": 191270 }, { "epoch": 1.23, "learning_rate": 0.0001148150538606014, "loss": 0.0306, "step": 191280 }, { "epoch": 1.23, "learning_rate": 0.00011480537250624447, "loss": 0.0278, "step": 191290 }, { "epoch": 1.23, "learning_rate": 0.00011479569115188753, "loss": 0.028, "step": 191300 }, { "epoch": 1.23, "learning_rate": 0.0001147860097975306, "loss": 0.0312, "step": 191310 }, { "epoch": 1.23, "learning_rate": 0.00011477632844317367, "loss": 0.0326, "step": 191320 }, { "epoch": 1.23, "learning_rate": 0.00011476664708881673, "loss": 0.0324, "step": 191330 }, { "epoch": 1.23, "learning_rate": 0.0001147569657344598, "loss": 0.0306, "step": 191340 }, { "epoch": 1.24, "learning_rate": 0.00011474728438010287, "loss": 0.0259, "step": 191350 }, { "epoch": 1.24, "learning_rate": 0.00011473760302574594, "loss": 0.025, "step": 191360 }, { "epoch": 1.24, "learning_rate": 0.000114727921671389, "loss": 0.0343, "step": 191370 }, { "epoch": 1.24, "learning_rate": 0.00011471824031703207, "loss": 0.0361, "step": 191380 }, { "epoch": 1.24, "learning_rate": 0.00011470855896267515, "loss": 0.0345, "step": 191390 }, { "epoch": 1.24, "learning_rate": 0.0001146988776083182, "loss": 0.0338, "step": 191400 }, { "epoch": 1.24, "learning_rate": 0.00011468919625396127, "loss": 0.0328, "step": 191410 }, { "epoch": 1.24, "learning_rate": 0.00011467951489960435, "loss": 0.0284, "step": 191420 }, { "epoch": 1.24, "learning_rate": 0.00011466983354524742, "loss": 0.0317, "step": 191430 }, { "epoch": 1.24, "learning_rate": 0.00011466015219089048, "loss": 0.0269, "step": 191440 }, { "epoch": 1.24, "learning_rate": 0.00011465047083653355, "loss": 0.0347, "step": 191450 }, { "epoch": 1.24, "learning_rate": 0.00011464078948217661, "loss": 0.0349, "step": 191460 }, { "epoch": 1.24, "learning_rate": 0.00011463110812781968, "loss": 0.0329, "step": 191470 }, { "epoch": 1.24, "learning_rate": 0.00011462142677346275, "loss": 0.0385, "step": 191480 }, { "epoch": 1.24, "learning_rate": 0.00011461174541910583, "loss": 0.0316, "step": 191490 }, { "epoch": 1.24, "learning_rate": 0.00011460206406474889, "loss": 0.0388, "step": 191500 }, { "epoch": 1.24, "learning_rate": 0.00011459238271039195, "loss": 0.0277, "step": 191510 }, { "epoch": 1.24, "learning_rate": 0.00011458270135603502, "loss": 0.033, "step": 191520 }, { "epoch": 1.24, "learning_rate": 0.00011457302000167809, "loss": 0.0264, "step": 191530 }, { "epoch": 1.24, "learning_rate": 0.00011456333864732116, "loss": 0.0358, "step": 191540 }, { "epoch": 1.24, "learning_rate": 0.00011455365729296422, "loss": 0.0299, "step": 191550 }, { "epoch": 1.24, "learning_rate": 0.00011454397593860729, "loss": 0.0286, "step": 191560 }, { "epoch": 1.24, "learning_rate": 0.00011453429458425037, "loss": 0.0311, "step": 191570 }, { "epoch": 1.24, "learning_rate": 0.00011452461322989342, "loss": 0.0304, "step": 191580 }, { "epoch": 1.24, "learning_rate": 0.0001145149318755365, "loss": 0.0374, "step": 191590 }, { "epoch": 1.24, "learning_rate": 0.00011450525052117957, "loss": 0.0308, "step": 191600 }, { "epoch": 1.24, "learning_rate": 0.00011449556916682262, "loss": 0.0283, "step": 191610 }, { "epoch": 1.24, "learning_rate": 0.0001144858878124657, "loss": 0.0285, "step": 191620 }, { "epoch": 1.24, "learning_rate": 0.00011447620645810877, "loss": 0.0295, "step": 191630 }, { "epoch": 1.24, "learning_rate": 0.00011446652510375185, "loss": 0.0315, "step": 191640 }, { "epoch": 1.24, "learning_rate": 0.0001144568437493949, "loss": 0.0293, "step": 191650 }, { "epoch": 1.24, "learning_rate": 0.00011444716239503797, "loss": 0.0299, "step": 191660 }, { "epoch": 1.24, "learning_rate": 0.00011443748104068105, "loss": 0.0325, "step": 191670 }, { "epoch": 1.24, "learning_rate": 0.0001144277996863241, "loss": 0.0298, "step": 191680 }, { "epoch": 1.24, "learning_rate": 0.00011441811833196718, "loss": 0.0262, "step": 191690 }, { "epoch": 1.24, "learning_rate": 0.00011440843697761024, "loss": 0.0334, "step": 191700 }, { "epoch": 1.24, "learning_rate": 0.00011439875562325332, "loss": 0.0292, "step": 191710 }, { "epoch": 1.24, "learning_rate": 0.00011438907426889638, "loss": 0.0294, "step": 191720 }, { "epoch": 1.24, "learning_rate": 0.00011437939291453944, "loss": 0.0412, "step": 191730 }, { "epoch": 1.24, "learning_rate": 0.00011436971156018252, "loss": 0.0295, "step": 191740 }, { "epoch": 1.24, "learning_rate": 0.00011436003020582558, "loss": 0.0367, "step": 191750 }, { "epoch": 1.24, "learning_rate": 0.00011435034885146864, "loss": 0.0315, "step": 191760 }, { "epoch": 1.24, "learning_rate": 0.00011434066749711172, "loss": 0.0297, "step": 191770 }, { "epoch": 1.24, "learning_rate": 0.00011433098614275479, "loss": 0.032, "step": 191780 }, { "epoch": 1.24, "learning_rate": 0.00011432130478839785, "loss": 0.0304, "step": 191790 }, { "epoch": 1.24, "learning_rate": 0.00011431162343404092, "loss": 0.0297, "step": 191800 }, { "epoch": 1.24, "learning_rate": 0.000114301942079684, "loss": 0.0259, "step": 191810 }, { "epoch": 1.24, "learning_rate": 0.00011429226072532705, "loss": 0.0304, "step": 191820 }, { "epoch": 1.24, "learning_rate": 0.00011428257937097012, "loss": 0.0318, "step": 191830 }, { "epoch": 1.24, "learning_rate": 0.0001142728980166132, "loss": 0.0331, "step": 191840 }, { "epoch": 1.24, "learning_rate": 0.00011426321666225627, "loss": 0.0298, "step": 191850 }, { "epoch": 1.24, "learning_rate": 0.00011425353530789932, "loss": 0.0286, "step": 191860 }, { "epoch": 1.24, "learning_rate": 0.0001142438539535424, "loss": 0.0275, "step": 191870 }, { "epoch": 1.24, "learning_rate": 0.00011423417259918546, "loss": 0.0257, "step": 191880 }, { "epoch": 1.24, "learning_rate": 0.00011422449124482853, "loss": 0.0272, "step": 191890 }, { "epoch": 1.24, "learning_rate": 0.0001142148098904716, "loss": 0.031, "step": 191900 }, { "epoch": 1.24, "learning_rate": 0.00011420512853611468, "loss": 0.0342, "step": 191910 }, { "epoch": 1.24, "learning_rate": 0.00011419544718175774, "loss": 0.0271, "step": 191920 }, { "epoch": 1.24, "learning_rate": 0.0001141857658274008, "loss": 0.033, "step": 191930 }, { "epoch": 1.24, "learning_rate": 0.00011417608447304387, "loss": 0.0278, "step": 191940 }, { "epoch": 1.24, "learning_rate": 0.00011416640311868694, "loss": 0.0374, "step": 191950 }, { "epoch": 1.24, "learning_rate": 0.00011415672176433, "loss": 0.03, "step": 191960 }, { "epoch": 1.24, "learning_rate": 0.00011414704040997307, "loss": 0.031, "step": 191970 }, { "epoch": 1.24, "learning_rate": 0.00011413735905561614, "loss": 0.0376, "step": 191980 }, { "epoch": 1.24, "learning_rate": 0.00011412767770125922, "loss": 0.0343, "step": 191990 }, { "epoch": 1.24, "learning_rate": 0.00011411799634690227, "loss": 0.0288, "step": 192000 }, { "epoch": 1.24, "eval_cer": 0.919876172183934, "eval_loss": 0.022667761892080307, "eval_runtime": 120.1644, "eval_samples_per_second": 16.644, "eval_steps_per_second": 4.161, "step": 192000 }, { "epoch": 1.24, "learning_rate": 0.00011410831499254535, "loss": 0.0354, "step": 192010 }, { "epoch": 1.24, "learning_rate": 0.00011409863363818842, "loss": 0.0436, "step": 192020 }, { "epoch": 1.24, "learning_rate": 0.00011408895228383147, "loss": 0.0312, "step": 192030 }, { "epoch": 1.24, "learning_rate": 0.00011407927092947455, "loss": 0.0304, "step": 192040 }, { "epoch": 1.24, "learning_rate": 0.00011406958957511762, "loss": 0.0317, "step": 192050 }, { "epoch": 1.24, "learning_rate": 0.0001140599082207607, "loss": 0.0326, "step": 192060 }, { "epoch": 1.24, "learning_rate": 0.00011405022686640375, "loss": 0.0348, "step": 192070 }, { "epoch": 1.24, "learning_rate": 0.00011404054551204682, "loss": 0.0379, "step": 192080 }, { "epoch": 1.24, "learning_rate": 0.0001140308641576899, "loss": 0.0286, "step": 192090 }, { "epoch": 1.24, "learning_rate": 0.00011402118280333295, "loss": 0.0367, "step": 192100 }, { "epoch": 1.24, "learning_rate": 0.00011401150144897603, "loss": 0.0296, "step": 192110 }, { "epoch": 1.24, "learning_rate": 0.0001140018200946191, "loss": 0.0297, "step": 192120 }, { "epoch": 1.24, "learning_rate": 0.00011399213874026217, "loss": 0.032, "step": 192130 }, { "epoch": 1.24, "learning_rate": 0.00011398245738590523, "loss": 0.0348, "step": 192140 }, { "epoch": 1.24, "learning_rate": 0.00011397277603154829, "loss": 0.0309, "step": 192150 }, { "epoch": 1.24, "learning_rate": 0.00011396309467719137, "loss": 0.0322, "step": 192160 }, { "epoch": 1.24, "learning_rate": 0.00011395341332283443, "loss": 0.0335, "step": 192170 }, { "epoch": 1.24, "learning_rate": 0.00011394373196847749, "loss": 0.0296, "step": 192180 }, { "epoch": 1.24, "learning_rate": 0.00011393405061412057, "loss": 0.0346, "step": 192190 }, { "epoch": 1.24, "learning_rate": 0.00011392436925976364, "loss": 0.0367, "step": 192200 }, { "epoch": 1.24, "learning_rate": 0.0001139146879054067, "loss": 0.0334, "step": 192210 }, { "epoch": 1.24, "learning_rate": 0.00011390500655104977, "loss": 0.0307, "step": 192220 }, { "epoch": 1.24, "learning_rate": 0.00011389532519669285, "loss": 0.0351, "step": 192230 }, { "epoch": 1.24, "learning_rate": 0.0001138856438423359, "loss": 0.027, "step": 192240 }, { "epoch": 1.24, "learning_rate": 0.00011387596248797897, "loss": 0.0323, "step": 192250 }, { "epoch": 1.24, "learning_rate": 0.00011386628113362205, "loss": 0.0302, "step": 192260 }, { "epoch": 1.24, "learning_rate": 0.00011385659977926511, "loss": 0.0369, "step": 192270 }, { "epoch": 1.24, "learning_rate": 0.00011384691842490817, "loss": 0.0244, "step": 192280 }, { "epoch": 1.24, "learning_rate": 0.00011383723707055125, "loss": 0.0279, "step": 192290 }, { "epoch": 1.24, "learning_rate": 0.00011382755571619431, "loss": 0.0266, "step": 192300 }, { "epoch": 1.24, "learning_rate": 0.00011381787436183738, "loss": 0.0308, "step": 192310 }, { "epoch": 1.24, "learning_rate": 0.00011380819300748045, "loss": 0.0332, "step": 192320 }, { "epoch": 1.24, "learning_rate": 0.00011379851165312353, "loss": 0.0272, "step": 192330 }, { "epoch": 1.24, "learning_rate": 0.00011378883029876659, "loss": 0.0361, "step": 192340 }, { "epoch": 1.24, "learning_rate": 0.00011377914894440964, "loss": 0.0287, "step": 192350 }, { "epoch": 1.24, "learning_rate": 0.00011376946759005272, "loss": 0.0294, "step": 192360 }, { "epoch": 1.24, "learning_rate": 0.00011375978623569579, "loss": 0.0321, "step": 192370 }, { "epoch": 1.24, "learning_rate": 0.00011375010488133884, "loss": 0.0317, "step": 192380 }, { "epoch": 1.24, "learning_rate": 0.00011374042352698192, "loss": 0.0287, "step": 192390 }, { "epoch": 1.24, "learning_rate": 0.00011373074217262499, "loss": 0.0293, "step": 192400 }, { "epoch": 1.24, "learning_rate": 0.00011372106081826807, "loss": 0.0316, "step": 192410 }, { "epoch": 1.24, "learning_rate": 0.00011371137946391112, "loss": 0.032, "step": 192420 }, { "epoch": 1.24, "learning_rate": 0.0001137016981095542, "loss": 0.0333, "step": 192430 }, { "epoch": 1.24, "learning_rate": 0.00011369201675519727, "loss": 0.0299, "step": 192440 }, { "epoch": 1.24, "learning_rate": 0.00011368233540084032, "loss": 0.0334, "step": 192450 }, { "epoch": 1.24, "learning_rate": 0.0001136726540464834, "loss": 0.0298, "step": 192460 }, { "epoch": 1.24, "learning_rate": 0.00011366297269212647, "loss": 0.0319, "step": 192470 }, { "epoch": 1.24, "learning_rate": 0.00011365329133776955, "loss": 0.0365, "step": 192480 }, { "epoch": 1.24, "learning_rate": 0.0001136436099834126, "loss": 0.0322, "step": 192490 }, { "epoch": 1.24, "learning_rate": 0.00011363392862905567, "loss": 0.0355, "step": 192500 }, { "epoch": 1.24, "learning_rate": 0.00011362424727469875, "loss": 0.0326, "step": 192510 }, { "epoch": 1.24, "learning_rate": 0.0001136145659203418, "loss": 0.0352, "step": 192520 }, { "epoch": 1.24, "learning_rate": 0.00011360488456598488, "loss": 0.0347, "step": 192530 }, { "epoch": 1.24, "learning_rate": 0.00011359520321162794, "loss": 0.0297, "step": 192540 }, { "epoch": 1.24, "learning_rate": 0.00011358552185727101, "loss": 0.0284, "step": 192550 }, { "epoch": 1.24, "learning_rate": 0.00011357584050291408, "loss": 0.0282, "step": 192560 }, { "epoch": 1.24, "learning_rate": 0.00011356615914855714, "loss": 0.029, "step": 192570 }, { "epoch": 1.24, "learning_rate": 0.00011355647779420022, "loss": 0.0259, "step": 192580 }, { "epoch": 1.24, "learning_rate": 0.00011354679643984328, "loss": 0.032, "step": 192590 }, { "epoch": 1.24, "learning_rate": 0.00011353711508548634, "loss": 0.0341, "step": 192600 }, { "epoch": 1.24, "learning_rate": 0.00011352743373112942, "loss": 0.0326, "step": 192610 }, { "epoch": 1.24, "learning_rate": 0.00011351775237677249, "loss": 0.0309, "step": 192620 }, { "epoch": 1.24, "learning_rate": 0.00011350807102241555, "loss": 0.0291, "step": 192630 }, { "epoch": 1.24, "learning_rate": 0.00011349838966805862, "loss": 0.0345, "step": 192640 }, { "epoch": 1.24, "learning_rate": 0.00011348870831370169, "loss": 0.0326, "step": 192650 }, { "epoch": 1.24, "learning_rate": 0.00011347902695934475, "loss": 0.0333, "step": 192660 }, { "epoch": 1.24, "learning_rate": 0.00011346934560498782, "loss": 0.03, "step": 192670 }, { "epoch": 1.24, "learning_rate": 0.0001134596642506309, "loss": 0.0273, "step": 192680 }, { "epoch": 1.24, "learning_rate": 0.00011344998289627396, "loss": 0.0274, "step": 192690 }, { "epoch": 1.24, "learning_rate": 0.00011344030154191702, "loss": 0.0288, "step": 192700 }, { "epoch": 1.24, "learning_rate": 0.0001134306201875601, "loss": 0.024, "step": 192710 }, { "epoch": 1.24, "learning_rate": 0.00011342093883320316, "loss": 0.0298, "step": 192720 }, { "epoch": 1.24, "learning_rate": 0.00011341125747884623, "loss": 0.034, "step": 192730 }, { "epoch": 1.24, "learning_rate": 0.0001134015761244893, "loss": 0.029, "step": 192740 }, { "epoch": 1.24, "learning_rate": 0.00011339189477013236, "loss": 0.0326, "step": 192750 }, { "epoch": 1.24, "learning_rate": 0.00011338221341577544, "loss": 0.031, "step": 192760 }, { "epoch": 1.24, "learning_rate": 0.0001133725320614185, "loss": 0.0262, "step": 192770 }, { "epoch": 1.24, "learning_rate": 0.00011336285070706157, "loss": 0.0386, "step": 192780 }, { "epoch": 1.24, "learning_rate": 0.00011335316935270464, "loss": 0.0325, "step": 192790 }, { "epoch": 1.24, "learning_rate": 0.0001133434879983477, "loss": 0.0313, "step": 192800 }, { "epoch": 1.24, "learning_rate": 0.00011333380664399077, "loss": 0.0314, "step": 192810 }, { "epoch": 1.24, "learning_rate": 0.00011332412528963384, "loss": 0.0287, "step": 192820 }, { "epoch": 1.24, "learning_rate": 0.00011331444393527692, "loss": 0.0316, "step": 192830 }, { "epoch": 1.24, "learning_rate": 0.00011330476258091997, "loss": 0.0371, "step": 192840 }, { "epoch": 1.24, "learning_rate": 0.00011329508122656304, "loss": 0.0322, "step": 192850 }, { "epoch": 1.24, "learning_rate": 0.00011328539987220612, "loss": 0.0316, "step": 192860 }, { "epoch": 1.24, "learning_rate": 0.00011327571851784917, "loss": 0.0327, "step": 192870 }, { "epoch": 1.24, "learning_rate": 0.00011326603716349225, "loss": 0.0351, "step": 192880 }, { "epoch": 1.24, "learning_rate": 0.00011325635580913532, "loss": 0.0263, "step": 192890 }, { "epoch": 1.25, "learning_rate": 0.0001132466744547784, "loss": 0.0273, "step": 192900 }, { "epoch": 1.25, "learning_rate": 0.00011323699310042145, "loss": 0.0283, "step": 192910 }, { "epoch": 1.25, "learning_rate": 0.00011322731174606452, "loss": 0.0299, "step": 192920 }, { "epoch": 1.25, "learning_rate": 0.0001132176303917076, "loss": 0.0263, "step": 192930 }, { "epoch": 1.25, "learning_rate": 0.00011320794903735065, "loss": 0.0311, "step": 192940 }, { "epoch": 1.25, "learning_rate": 0.00011319826768299371, "loss": 0.0304, "step": 192950 }, { "epoch": 1.25, "learning_rate": 0.0001131885863286368, "loss": 0.0293, "step": 192960 }, { "epoch": 1.25, "learning_rate": 0.00011317890497427986, "loss": 0.0375, "step": 192970 }, { "epoch": 1.25, "learning_rate": 0.00011316922361992293, "loss": 0.0302, "step": 192980 }, { "epoch": 1.25, "learning_rate": 0.00011315954226556599, "loss": 0.0303, "step": 192990 }, { "epoch": 1.25, "learning_rate": 0.00011314986091120907, "loss": 0.0344, "step": 193000 }, { "epoch": 1.25, "eval_cer": 0.9198716529205739, "eval_loss": 0.022520260885357857, "eval_runtime": 120.1842, "eval_samples_per_second": 16.641, "eval_steps_per_second": 4.16, "step": 193000 }, { "epoch": 1.25, "learning_rate": 0.00011314017955685212, "loss": 0.0279, "step": 193010 }, { "epoch": 1.25, "learning_rate": 0.00011313049820249519, "loss": 0.0348, "step": 193020 }, { "epoch": 1.25, "learning_rate": 0.00011312081684813827, "loss": 0.0312, "step": 193030 }, { "epoch": 1.25, "learning_rate": 0.00011311113549378134, "loss": 0.029, "step": 193040 }, { "epoch": 1.25, "learning_rate": 0.0001131014541394244, "loss": 0.0353, "step": 193050 }, { "epoch": 1.25, "learning_rate": 0.00011309177278506747, "loss": 0.0343, "step": 193060 }, { "epoch": 1.25, "learning_rate": 0.00011308209143071054, "loss": 0.0286, "step": 193070 }, { "epoch": 1.25, "learning_rate": 0.0001130724100763536, "loss": 0.0294, "step": 193080 }, { "epoch": 1.25, "learning_rate": 0.00011306272872199667, "loss": 0.0328, "step": 193090 }, { "epoch": 1.25, "learning_rate": 0.00011305304736763975, "loss": 0.0326, "step": 193100 }, { "epoch": 1.25, "learning_rate": 0.00011304336601328281, "loss": 0.0283, "step": 193110 }, { "epoch": 1.25, "learning_rate": 0.00011303368465892587, "loss": 0.0255, "step": 193120 }, { "epoch": 1.25, "learning_rate": 0.00011302400330456895, "loss": 0.0353, "step": 193130 }, { "epoch": 1.25, "learning_rate": 0.00011301432195021201, "loss": 0.0302, "step": 193140 }, { "epoch": 1.25, "learning_rate": 0.00011300464059585508, "loss": 0.0267, "step": 193150 }, { "epoch": 1.25, "learning_rate": 0.00011299495924149815, "loss": 0.0316, "step": 193160 }, { "epoch": 1.25, "learning_rate": 0.00011298527788714121, "loss": 0.0304, "step": 193170 }, { "epoch": 1.25, "learning_rate": 0.00011297559653278429, "loss": 0.0344, "step": 193180 }, { "epoch": 1.25, "learning_rate": 0.00011296591517842734, "loss": 0.0339, "step": 193190 }, { "epoch": 1.25, "learning_rate": 0.00011295623382407042, "loss": 0.0311, "step": 193200 }, { "epoch": 1.25, "learning_rate": 0.00011294655246971349, "loss": 0.0292, "step": 193210 }, { "epoch": 1.25, "learning_rate": 0.00011293687111535654, "loss": 0.0264, "step": 193220 }, { "epoch": 1.25, "learning_rate": 0.00011292718976099962, "loss": 0.0355, "step": 193230 }, { "epoch": 1.25, "learning_rate": 0.00011291750840664269, "loss": 0.0326, "step": 193240 }, { "epoch": 1.25, "learning_rate": 0.00011290782705228577, "loss": 0.0242, "step": 193250 }, { "epoch": 1.25, "learning_rate": 0.00011289814569792882, "loss": 0.0309, "step": 193260 }, { "epoch": 1.25, "learning_rate": 0.00011288846434357189, "loss": 0.0293, "step": 193270 }, { "epoch": 1.25, "learning_rate": 0.00011287878298921497, "loss": 0.0309, "step": 193280 }, { "epoch": 1.25, "learning_rate": 0.00011286910163485802, "loss": 0.0323, "step": 193290 }, { "epoch": 1.25, "learning_rate": 0.0001128594202805011, "loss": 0.0303, "step": 193300 }, { "epoch": 1.25, "learning_rate": 0.00011284973892614417, "loss": 0.0332, "step": 193310 }, { "epoch": 1.25, "learning_rate": 0.00011284005757178725, "loss": 0.0302, "step": 193320 }, { "epoch": 1.25, "learning_rate": 0.0001128303762174303, "loss": 0.0304, "step": 193330 }, { "epoch": 1.25, "learning_rate": 0.00011282069486307337, "loss": 0.0328, "step": 193340 }, { "epoch": 1.25, "learning_rate": 0.00011281101350871644, "loss": 0.0302, "step": 193350 }, { "epoch": 1.25, "learning_rate": 0.0001128013321543595, "loss": 0.0402, "step": 193360 }, { "epoch": 1.25, "learning_rate": 0.00011279165080000256, "loss": 0.0293, "step": 193370 }, { "epoch": 1.25, "learning_rate": 0.00011278196944564564, "loss": 0.0355, "step": 193380 }, { "epoch": 1.25, "learning_rate": 0.00011277228809128871, "loss": 0.0268, "step": 193390 }, { "epoch": 1.25, "learning_rate": 0.00011276260673693178, "loss": 0.0293, "step": 193400 }, { "epoch": 1.25, "learning_rate": 0.00011275292538257484, "loss": 0.0342, "step": 193410 }, { "epoch": 1.25, "learning_rate": 0.00011274324402821792, "loss": 0.0313, "step": 193420 }, { "epoch": 1.25, "learning_rate": 0.00011273356267386097, "loss": 0.027, "step": 193430 }, { "epoch": 1.25, "learning_rate": 0.00011272388131950404, "loss": 0.0329, "step": 193440 }, { "epoch": 1.25, "learning_rate": 0.00011271419996514712, "loss": 0.035, "step": 193450 }, { "epoch": 1.25, "learning_rate": 0.00011270451861079019, "loss": 0.033, "step": 193460 }, { "epoch": 1.25, "learning_rate": 0.00011269483725643324, "loss": 0.0353, "step": 193470 }, { "epoch": 1.25, "learning_rate": 0.00011268515590207632, "loss": 0.0332, "step": 193480 }, { "epoch": 1.25, "learning_rate": 0.00011267547454771939, "loss": 0.033, "step": 193490 }, { "epoch": 1.25, "learning_rate": 0.00011266579319336245, "loss": 0.031, "step": 193500 }, { "epoch": 1.25, "learning_rate": 0.00011265611183900552, "loss": 0.027, "step": 193510 }, { "epoch": 1.25, "learning_rate": 0.0001126464304846486, "loss": 0.032, "step": 193520 }, { "epoch": 1.25, "learning_rate": 0.00011263674913029166, "loss": 0.0346, "step": 193530 }, { "epoch": 1.25, "learning_rate": 0.00011262706777593472, "loss": 0.0286, "step": 193540 }, { "epoch": 1.25, "learning_rate": 0.0001126173864215778, "loss": 0.0303, "step": 193550 }, { "epoch": 1.25, "learning_rate": 0.00011260770506722086, "loss": 0.03, "step": 193560 }, { "epoch": 1.25, "learning_rate": 0.00011259802371286392, "loss": 0.0273, "step": 193570 }, { "epoch": 1.25, "learning_rate": 0.000112588342358507, "loss": 0.029, "step": 193580 }, { "epoch": 1.25, "learning_rate": 0.00011257866100415006, "loss": 0.031, "step": 193590 }, { "epoch": 1.25, "learning_rate": 0.00011256897964979314, "loss": 0.0335, "step": 193600 }, { "epoch": 1.25, "learning_rate": 0.0001125592982954362, "loss": 0.0356, "step": 193610 }, { "epoch": 1.25, "learning_rate": 0.00011254961694107927, "loss": 0.0305, "step": 193620 }, { "epoch": 1.25, "learning_rate": 0.00011253993558672234, "loss": 0.0284, "step": 193630 }, { "epoch": 1.25, "learning_rate": 0.00011253025423236539, "loss": 0.033, "step": 193640 }, { "epoch": 1.25, "learning_rate": 0.00011252057287800847, "loss": 0.032, "step": 193650 }, { "epoch": 1.25, "learning_rate": 0.00011251089152365154, "loss": 0.0291, "step": 193660 }, { "epoch": 1.25, "learning_rate": 0.00011250121016929462, "loss": 0.0272, "step": 193670 }, { "epoch": 1.25, "learning_rate": 0.00011249152881493767, "loss": 0.0288, "step": 193680 }, { "epoch": 1.25, "learning_rate": 0.00011248184746058074, "loss": 0.0303, "step": 193690 }, { "epoch": 1.25, "learning_rate": 0.00011247216610622382, "loss": 0.029, "step": 193700 }, { "epoch": 1.25, "learning_rate": 0.00011246248475186687, "loss": 0.0263, "step": 193710 }, { "epoch": 1.25, "learning_rate": 0.00011245280339750995, "loss": 0.0328, "step": 193720 }, { "epoch": 1.25, "learning_rate": 0.00011244312204315302, "loss": 0.0314, "step": 193730 }, { "epoch": 1.25, "learning_rate": 0.0001124334406887961, "loss": 0.0381, "step": 193740 }, { "epoch": 1.25, "learning_rate": 0.00011242375933443915, "loss": 0.0297, "step": 193750 }, { "epoch": 1.25, "learning_rate": 0.00011241407798008221, "loss": 0.0281, "step": 193760 }, { "epoch": 1.25, "learning_rate": 0.0001124043966257253, "loss": 0.0252, "step": 193770 }, { "epoch": 1.25, "learning_rate": 0.00011239471527136835, "loss": 0.0303, "step": 193780 }, { "epoch": 1.25, "learning_rate": 0.00011238503391701141, "loss": 0.0322, "step": 193790 }, { "epoch": 1.25, "learning_rate": 0.0001123753525626545, "loss": 0.037, "step": 193800 }, { "epoch": 1.25, "learning_rate": 0.00011236567120829756, "loss": 0.0343, "step": 193810 }, { "epoch": 1.25, "learning_rate": 0.00011235598985394063, "loss": 0.0336, "step": 193820 }, { "epoch": 1.25, "learning_rate": 0.00011234630849958369, "loss": 0.0352, "step": 193830 }, { "epoch": 1.25, "learning_rate": 0.00011233662714522677, "loss": 0.0303, "step": 193840 }, { "epoch": 1.25, "learning_rate": 0.00011232694579086982, "loss": 0.0322, "step": 193850 }, { "epoch": 1.25, "learning_rate": 0.00011231726443651289, "loss": 0.0327, "step": 193860 }, { "epoch": 1.25, "learning_rate": 0.00011230758308215597, "loss": 0.03, "step": 193870 }, { "epoch": 1.25, "learning_rate": 0.00011229790172779904, "loss": 0.0299, "step": 193880 }, { "epoch": 1.25, "learning_rate": 0.00011228822037344209, "loss": 0.0366, "step": 193890 }, { "epoch": 1.25, "learning_rate": 0.00011227853901908517, "loss": 0.0279, "step": 193900 }, { "epoch": 1.25, "learning_rate": 0.00011226885766472824, "loss": 0.0335, "step": 193910 }, { "epoch": 1.25, "learning_rate": 0.0001122591763103713, "loss": 0.0281, "step": 193920 }, { "epoch": 1.25, "learning_rate": 0.00011224949495601437, "loss": 0.0348, "step": 193930 }, { "epoch": 1.25, "learning_rate": 0.00011223981360165745, "loss": 0.0342, "step": 193940 }, { "epoch": 1.25, "learning_rate": 0.00011223013224730051, "loss": 0.0396, "step": 193950 }, { "epoch": 1.25, "learning_rate": 0.00011222045089294357, "loss": 0.0315, "step": 193960 }, { "epoch": 1.25, "learning_rate": 0.00011221076953858665, "loss": 0.0292, "step": 193970 }, { "epoch": 1.25, "learning_rate": 0.00011220108818422971, "loss": 0.0317, "step": 193980 }, { "epoch": 1.25, "learning_rate": 0.00011219140682987277, "loss": 0.0346, "step": 193990 }, { "epoch": 1.25, "learning_rate": 0.00011218172547551585, "loss": 0.0283, "step": 194000 }, { "epoch": 1.25, "eval_cer": 0.91987436447859, "eval_loss": 0.022109534591436386, "eval_runtime": 120.1821, "eval_samples_per_second": 16.641, "eval_steps_per_second": 4.16, "step": 194000 }, { "epoch": 1.25, "learning_rate": 0.00011217204412115891, "loss": 0.0379, "step": 194010 }, { "epoch": 1.25, "learning_rate": 0.00011216236276680199, "loss": 0.0315, "step": 194020 }, { "epoch": 1.25, "learning_rate": 0.00011215268141244504, "loss": 0.0361, "step": 194030 }, { "epoch": 1.25, "learning_rate": 0.00011214300005808812, "loss": 0.0365, "step": 194040 }, { "epoch": 1.25, "learning_rate": 0.00011213331870373119, "loss": 0.0301, "step": 194050 }, { "epoch": 1.25, "learning_rate": 0.00011212363734937424, "loss": 0.0329, "step": 194060 }, { "epoch": 1.25, "learning_rate": 0.00011211395599501732, "loss": 0.0312, "step": 194070 }, { "epoch": 1.25, "learning_rate": 0.00011210427464066039, "loss": 0.0357, "step": 194080 }, { "epoch": 1.25, "learning_rate": 0.00011209459328630347, "loss": 0.0286, "step": 194090 }, { "epoch": 1.25, "learning_rate": 0.00011208491193194652, "loss": 0.0273, "step": 194100 }, { "epoch": 1.25, "learning_rate": 0.00011207523057758959, "loss": 0.0322, "step": 194110 }, { "epoch": 1.25, "learning_rate": 0.00011206554922323267, "loss": 0.028, "step": 194120 }, { "epoch": 1.25, "learning_rate": 0.00011205586786887572, "loss": 0.034, "step": 194130 }, { "epoch": 1.25, "learning_rate": 0.0001120461865145188, "loss": 0.0278, "step": 194140 }, { "epoch": 1.25, "learning_rate": 0.00011203650516016187, "loss": 0.028, "step": 194150 }, { "epoch": 1.25, "learning_rate": 0.00011202682380580493, "loss": 0.0314, "step": 194160 }, { "epoch": 1.25, "learning_rate": 0.000112017142451448, "loss": 0.0344, "step": 194170 }, { "epoch": 1.25, "learning_rate": 0.00011200746109709106, "loss": 0.0321, "step": 194180 }, { "epoch": 1.25, "learning_rate": 0.00011199777974273414, "loss": 0.032, "step": 194190 }, { "epoch": 1.25, "learning_rate": 0.0001119880983883772, "loss": 0.0359, "step": 194200 }, { "epoch": 1.25, "learning_rate": 0.00011197841703402026, "loss": 0.0273, "step": 194210 }, { "epoch": 1.25, "learning_rate": 0.00011196873567966334, "loss": 0.0301, "step": 194220 }, { "epoch": 1.25, "learning_rate": 0.00011195905432530641, "loss": 0.0283, "step": 194230 }, { "epoch": 1.25, "learning_rate": 0.00011194937297094948, "loss": 0.0307, "step": 194240 }, { "epoch": 1.25, "learning_rate": 0.00011193969161659254, "loss": 0.0349, "step": 194250 }, { "epoch": 1.25, "learning_rate": 0.00011193001026223561, "loss": 0.0347, "step": 194260 }, { "epoch": 1.25, "learning_rate": 0.00011192032890787867, "loss": 0.0284, "step": 194270 }, { "epoch": 1.25, "learning_rate": 0.00011191064755352174, "loss": 0.0296, "step": 194280 }, { "epoch": 1.25, "learning_rate": 0.00011190096619916482, "loss": 0.028, "step": 194290 }, { "epoch": 1.25, "learning_rate": 0.00011189128484480789, "loss": 0.0305, "step": 194300 }, { "epoch": 1.25, "learning_rate": 0.00011188160349045094, "loss": 0.0307, "step": 194310 }, { "epoch": 1.25, "learning_rate": 0.00011187192213609402, "loss": 0.0275, "step": 194320 }, { "epoch": 1.25, "learning_rate": 0.00011186224078173709, "loss": 0.0368, "step": 194330 }, { "epoch": 1.25, "learning_rate": 0.00011185255942738015, "loss": 0.0307, "step": 194340 }, { "epoch": 1.25, "learning_rate": 0.00011184287807302322, "loss": 0.0303, "step": 194350 }, { "epoch": 1.25, "learning_rate": 0.00011183319671866628, "loss": 0.0327, "step": 194360 }, { "epoch": 1.25, "learning_rate": 0.00011182351536430936, "loss": 0.0291, "step": 194370 }, { "epoch": 1.25, "learning_rate": 0.00011181383400995242, "loss": 0.034, "step": 194380 }, { "epoch": 1.25, "learning_rate": 0.0001118041526555955, "loss": 0.0298, "step": 194390 }, { "epoch": 1.25, "learning_rate": 0.00011179447130123856, "loss": 0.0391, "step": 194400 }, { "epoch": 1.25, "learning_rate": 0.00011178478994688162, "loss": 0.0288, "step": 194410 }, { "epoch": 1.25, "learning_rate": 0.0001117751085925247, "loss": 0.0326, "step": 194420 }, { "epoch": 1.25, "learning_rate": 0.00011176542723816776, "loss": 0.025, "step": 194430 }, { "epoch": 1.25, "learning_rate": 0.00011175574588381084, "loss": 0.0362, "step": 194440 }, { "epoch": 1.26, "learning_rate": 0.0001117460645294539, "loss": 0.0351, "step": 194450 }, { "epoch": 1.26, "learning_rate": 0.00011173638317509696, "loss": 0.0297, "step": 194460 }, { "epoch": 1.26, "learning_rate": 0.00011172670182074004, "loss": 0.0338, "step": 194470 }, { "epoch": 1.26, "learning_rate": 0.00011171702046638309, "loss": 0.0334, "step": 194480 }, { "epoch": 1.26, "learning_rate": 0.00011170733911202617, "loss": 0.0338, "step": 194490 }, { "epoch": 1.26, "learning_rate": 0.00011169765775766924, "loss": 0.0299, "step": 194500 }, { "epoch": 1.26, "learning_rate": 0.00011168797640331232, "loss": 0.0293, "step": 194510 }, { "epoch": 1.26, "learning_rate": 0.00011167829504895537, "loss": 0.0293, "step": 194520 }, { "epoch": 1.26, "learning_rate": 0.00011166861369459844, "loss": 0.0298, "step": 194530 }, { "epoch": 1.26, "learning_rate": 0.00011165893234024152, "loss": 0.0339, "step": 194540 }, { "epoch": 1.26, "learning_rate": 0.00011164925098588457, "loss": 0.0304, "step": 194550 }, { "epoch": 1.26, "learning_rate": 0.00011163956963152764, "loss": 0.0374, "step": 194560 }, { "epoch": 1.26, "learning_rate": 0.00011162988827717072, "loss": 0.0312, "step": 194570 }, { "epoch": 1.26, "learning_rate": 0.00011162020692281377, "loss": 0.0298, "step": 194580 }, { "epoch": 1.26, "learning_rate": 0.00011161052556845685, "loss": 0.0379, "step": 194590 }, { "epoch": 1.26, "learning_rate": 0.00011160084421409991, "loss": 0.0327, "step": 194600 }, { "epoch": 1.26, "learning_rate": 0.000111591162859743, "loss": 0.0315, "step": 194610 }, { "epoch": 1.26, "learning_rate": 0.00011158148150538605, "loss": 0.0276, "step": 194620 }, { "epoch": 1.26, "learning_rate": 0.00011157180015102911, "loss": 0.0408, "step": 194630 }, { "epoch": 1.26, "learning_rate": 0.00011156211879667219, "loss": 0.0329, "step": 194640 }, { "epoch": 1.26, "learning_rate": 0.00011155243744231525, "loss": 0.0318, "step": 194650 }, { "epoch": 1.26, "learning_rate": 0.00011154275608795831, "loss": 0.0331, "step": 194660 }, { "epoch": 1.26, "learning_rate": 0.00011153307473360139, "loss": 0.0269, "step": 194670 }, { "epoch": 1.26, "learning_rate": 0.00011152339337924446, "loss": 0.0274, "step": 194680 }, { "epoch": 1.26, "learning_rate": 0.00011151371202488752, "loss": 0.0291, "step": 194690 }, { "epoch": 1.26, "learning_rate": 0.00011150403067053059, "loss": 0.0296, "step": 194700 }, { "epoch": 1.26, "learning_rate": 0.00011149434931617367, "loss": 0.039, "step": 194710 }, { "epoch": 1.26, "learning_rate": 0.00011148466796181672, "loss": 0.0339, "step": 194720 }, { "epoch": 1.26, "learning_rate": 0.00011147498660745979, "loss": 0.0263, "step": 194730 }, { "epoch": 1.26, "learning_rate": 0.00011146530525310287, "loss": 0.031, "step": 194740 }, { "epoch": 1.26, "learning_rate": 0.00011145562389874594, "loss": 0.0369, "step": 194750 }, { "epoch": 1.26, "learning_rate": 0.00011144594254438899, "loss": 0.0364, "step": 194760 }, { "epoch": 1.26, "learning_rate": 0.00011143626119003207, "loss": 0.028, "step": 194770 }, { "epoch": 1.26, "learning_rate": 0.00011142657983567513, "loss": 0.0291, "step": 194780 }, { "epoch": 1.26, "learning_rate": 0.0001114168984813182, "loss": 0.0341, "step": 194790 }, { "epoch": 1.26, "learning_rate": 0.00011140721712696127, "loss": 0.0282, "step": 194800 }, { "epoch": 1.26, "learning_rate": 0.00011139753577260435, "loss": 0.0347, "step": 194810 }, { "epoch": 1.26, "learning_rate": 0.00011138785441824741, "loss": 0.032, "step": 194820 }, { "epoch": 1.26, "learning_rate": 0.00011137817306389047, "loss": 0.033, "step": 194830 }, { "epoch": 1.26, "learning_rate": 0.00011136849170953354, "loss": 0.0328, "step": 194840 }, { "epoch": 1.26, "learning_rate": 0.00011135881035517661, "loss": 0.0329, "step": 194850 }, { "epoch": 1.26, "learning_rate": 0.00011134912900081966, "loss": 0.0348, "step": 194860 }, { "epoch": 1.26, "learning_rate": 0.00011133944764646274, "loss": 0.0313, "step": 194870 }, { "epoch": 1.26, "learning_rate": 0.00011132976629210581, "loss": 0.0339, "step": 194880 }, { "epoch": 1.26, "learning_rate": 0.00011132008493774889, "loss": 0.0319, "step": 194890 }, { "epoch": 1.26, "learning_rate": 0.00011131040358339194, "loss": 0.0328, "step": 194900 }, { "epoch": 1.26, "learning_rate": 0.00011130072222903502, "loss": 0.0305, "step": 194910 }, { "epoch": 1.26, "learning_rate": 0.00011129104087467809, "loss": 0.0273, "step": 194920 }, { "epoch": 1.26, "learning_rate": 0.00011128135952032114, "loss": 0.0312, "step": 194930 }, { "epoch": 1.26, "learning_rate": 0.00011127167816596422, "loss": 0.0271, "step": 194940 }, { "epoch": 1.26, "learning_rate": 0.00011126199681160729, "loss": 0.029, "step": 194950 }, { "epoch": 1.26, "learning_rate": 0.00011125231545725037, "loss": 0.0308, "step": 194960 }, { "epoch": 1.26, "learning_rate": 0.00011124263410289342, "loss": 0.0296, "step": 194970 }, { "epoch": 1.26, "learning_rate": 0.00011123295274853649, "loss": 0.0385, "step": 194980 }, { "epoch": 1.26, "learning_rate": 0.00011122327139417957, "loss": 0.0269, "step": 194990 }, { "epoch": 1.26, "learning_rate": 0.00011121359003982262, "loss": 0.0377, "step": 195000 }, { "epoch": 1.26, "eval_cer": 0.9198336911083493, "eval_loss": 0.022459572181105614, "eval_runtime": 120.3875, "eval_samples_per_second": 16.613, "eval_steps_per_second": 4.153, "step": 195000 }, { "epoch": 1.26, "learning_rate": 0.0001112039086854657, "loss": 0.0366, "step": 195010 }, { "epoch": 1.26, "learning_rate": 0.00011119422733110876, "loss": 0.0376, "step": 195020 }, { "epoch": 1.26, "learning_rate": 0.00011118454597675184, "loss": 0.0343, "step": 195030 }, { "epoch": 1.26, "learning_rate": 0.0001111748646223949, "loss": 0.0326, "step": 195040 }, { "epoch": 1.26, "learning_rate": 0.00011116518326803796, "loss": 0.0319, "step": 195050 }, { "epoch": 1.26, "learning_rate": 0.00011115550191368104, "loss": 0.03, "step": 195060 }, { "epoch": 1.26, "learning_rate": 0.0001111458205593241, "loss": 0.0323, "step": 195070 }, { "epoch": 1.26, "learning_rate": 0.00011113613920496716, "loss": 0.0299, "step": 195080 }, { "epoch": 1.26, "learning_rate": 0.00011112645785061024, "loss": 0.0343, "step": 195090 }, { "epoch": 1.26, "learning_rate": 0.00011111677649625331, "loss": 0.0304, "step": 195100 }, { "epoch": 1.26, "learning_rate": 0.00011110709514189637, "loss": 0.0339, "step": 195110 }, { "epoch": 1.26, "learning_rate": 0.00011109741378753944, "loss": 0.0282, "step": 195120 }, { "epoch": 1.26, "learning_rate": 0.00011108773243318252, "loss": 0.0297, "step": 195130 }, { "epoch": 1.26, "learning_rate": 0.00011107805107882557, "loss": 0.0273, "step": 195140 }, { "epoch": 1.26, "learning_rate": 0.00011106836972446864, "loss": 0.0277, "step": 195150 }, { "epoch": 1.26, "learning_rate": 0.00011105868837011172, "loss": 0.0366, "step": 195160 }, { "epoch": 1.26, "learning_rate": 0.00011104900701575478, "loss": 0.0285, "step": 195170 }, { "epoch": 1.26, "learning_rate": 0.00011103932566139784, "loss": 0.0302, "step": 195180 }, { "epoch": 1.26, "learning_rate": 0.00011102964430704092, "loss": 0.0305, "step": 195190 }, { "epoch": 1.26, "learning_rate": 0.00011101996295268398, "loss": 0.0314, "step": 195200 }, { "epoch": 1.26, "learning_rate": 0.00011101028159832705, "loss": 0.029, "step": 195210 }, { "epoch": 1.26, "learning_rate": 0.00011100060024397012, "loss": 0.0316, "step": 195220 }, { "epoch": 1.26, "learning_rate": 0.0001109909188896132, "loss": 0.0316, "step": 195230 }, { "epoch": 1.26, "learning_rate": 0.00011098123753525626, "loss": 0.035, "step": 195240 }, { "epoch": 1.26, "learning_rate": 0.00011097155618089931, "loss": 0.0318, "step": 195250 }, { "epoch": 1.26, "learning_rate": 0.0001109618748265424, "loss": 0.0358, "step": 195260 }, { "epoch": 1.26, "learning_rate": 0.00011095219347218546, "loss": 0.0279, "step": 195270 }, { "epoch": 1.26, "learning_rate": 0.00011094251211782851, "loss": 0.0313, "step": 195280 }, { "epoch": 1.26, "learning_rate": 0.0001109328307634716, "loss": 0.0354, "step": 195290 }, { "epoch": 1.26, "learning_rate": 0.00011092314940911466, "loss": 0.0275, "step": 195300 }, { "epoch": 1.26, "learning_rate": 0.00011091346805475774, "loss": 0.0314, "step": 195310 }, { "epoch": 1.26, "learning_rate": 0.00011090378670040079, "loss": 0.0279, "step": 195320 }, { "epoch": 1.26, "learning_rate": 0.00011089410534604387, "loss": 0.032, "step": 195330 }, { "epoch": 1.26, "learning_rate": 0.00011088442399168694, "loss": 0.0346, "step": 195340 }, { "epoch": 1.26, "learning_rate": 0.00011087474263732999, "loss": 0.0329, "step": 195350 }, { "epoch": 1.26, "learning_rate": 0.00011086506128297307, "loss": 0.0306, "step": 195360 }, { "epoch": 1.26, "learning_rate": 0.00011085537992861614, "loss": 0.0279, "step": 195370 }, { "epoch": 1.26, "learning_rate": 0.00011084569857425922, "loss": 0.0311, "step": 195380 }, { "epoch": 1.26, "learning_rate": 0.00011083601721990227, "loss": 0.0302, "step": 195390 }, { "epoch": 1.26, "learning_rate": 0.00011082633586554534, "loss": 0.0329, "step": 195400 }, { "epoch": 1.26, "learning_rate": 0.00011081665451118842, "loss": 0.0297, "step": 195410 }, { "epoch": 1.26, "learning_rate": 0.00011080697315683147, "loss": 0.0293, "step": 195420 }, { "epoch": 1.26, "learning_rate": 0.00011079729180247455, "loss": 0.0331, "step": 195430 }, { "epoch": 1.26, "learning_rate": 0.00011078761044811761, "loss": 0.0331, "step": 195440 }, { "epoch": 1.26, "learning_rate": 0.00011077792909376068, "loss": 0.0316, "step": 195450 }, { "epoch": 1.26, "learning_rate": 0.00011076824773940375, "loss": 0.0234, "step": 195460 }, { "epoch": 1.26, "learning_rate": 0.00011075856638504681, "loss": 0.0288, "step": 195470 }, { "epoch": 1.26, "learning_rate": 0.00011074888503068989, "loss": 0.0339, "step": 195480 }, { "epoch": 1.26, "learning_rate": 0.00011073920367633295, "loss": 0.0286, "step": 195490 }, { "epoch": 1.26, "learning_rate": 0.00011072952232197601, "loss": 0.0294, "step": 195500 }, { "epoch": 1.26, "learning_rate": 0.00011071984096761909, "loss": 0.0369, "step": 195510 }, { "epoch": 1.26, "learning_rate": 0.00011071015961326216, "loss": 0.0283, "step": 195520 }, { "epoch": 1.26, "learning_rate": 0.00011070047825890522, "loss": 0.034, "step": 195530 }, { "epoch": 1.26, "learning_rate": 0.00011069079690454829, "loss": 0.0275, "step": 195540 }, { "epoch": 1.26, "learning_rate": 0.00011068111555019136, "loss": 0.0297, "step": 195550 }, { "epoch": 1.26, "learning_rate": 0.00011067143419583442, "loss": 0.0318, "step": 195560 }, { "epoch": 1.26, "learning_rate": 0.00011066175284147749, "loss": 0.0291, "step": 195570 }, { "epoch": 1.26, "learning_rate": 0.00011065207148712057, "loss": 0.0289, "step": 195580 }, { "epoch": 1.26, "learning_rate": 0.00011064239013276363, "loss": 0.028, "step": 195590 }, { "epoch": 1.26, "learning_rate": 0.00011063270877840669, "loss": 0.0295, "step": 195600 }, { "epoch": 1.26, "learning_rate": 0.00011062302742404977, "loss": 0.0346, "step": 195610 }, { "epoch": 1.26, "learning_rate": 0.00011061334606969283, "loss": 0.0298, "step": 195620 }, { "epoch": 1.26, "learning_rate": 0.0001106036647153359, "loss": 0.0295, "step": 195630 }, { "epoch": 1.26, "learning_rate": 0.00011059398336097897, "loss": 0.0325, "step": 195640 }, { "epoch": 1.26, "learning_rate": 0.00011058430200662203, "loss": 0.0329, "step": 195650 }, { "epoch": 1.26, "learning_rate": 0.00011057462065226511, "loss": 0.0292, "step": 195660 }, { "epoch": 1.26, "learning_rate": 0.00011056493929790816, "loss": 0.03, "step": 195670 }, { "epoch": 1.26, "learning_rate": 0.00011055525794355124, "loss": 0.0368, "step": 195680 }, { "epoch": 1.26, "learning_rate": 0.00011054557658919431, "loss": 0.0314, "step": 195690 }, { "epoch": 1.26, "learning_rate": 0.00011053589523483736, "loss": 0.0328, "step": 195700 }, { "epoch": 1.26, "learning_rate": 0.00011052621388048044, "loss": 0.0324, "step": 195710 }, { "epoch": 1.26, "learning_rate": 0.00011051653252612351, "loss": 0.0317, "step": 195720 }, { "epoch": 1.26, "learning_rate": 0.00011050685117176659, "loss": 0.0333, "step": 195730 }, { "epoch": 1.26, "learning_rate": 0.00011049716981740964, "loss": 0.0316, "step": 195740 }, { "epoch": 1.26, "learning_rate": 0.00011048748846305271, "loss": 0.0381, "step": 195750 }, { "epoch": 1.26, "learning_rate": 0.00011047780710869579, "loss": 0.0326, "step": 195760 }, { "epoch": 1.26, "learning_rate": 0.00011046812575433884, "loss": 0.032, "step": 195770 }, { "epoch": 1.26, "learning_rate": 0.00011045844439998192, "loss": 0.0328, "step": 195780 }, { "epoch": 1.26, "learning_rate": 0.00011044876304562499, "loss": 0.0338, "step": 195790 }, { "epoch": 1.26, "learning_rate": 0.00011043908169126807, "loss": 0.0349, "step": 195800 }, { "epoch": 1.26, "learning_rate": 0.00011042940033691112, "loss": 0.0285, "step": 195810 }, { "epoch": 1.26, "learning_rate": 0.00011041971898255419, "loss": 0.027, "step": 195820 }, { "epoch": 1.26, "learning_rate": 0.00011041003762819727, "loss": 0.0342, "step": 195830 }, { "epoch": 1.26, "learning_rate": 0.00011040035627384032, "loss": 0.0263, "step": 195840 }, { "epoch": 1.26, "learning_rate": 0.00011039067491948338, "loss": 0.0341, "step": 195850 }, { "epoch": 1.26, "learning_rate": 0.00011038099356512646, "loss": 0.0402, "step": 195860 }, { "epoch": 1.26, "learning_rate": 0.00011037131221076953, "loss": 0.0289, "step": 195870 }, { "epoch": 1.26, "learning_rate": 0.0001103616308564126, "loss": 0.0279, "step": 195880 }, { "epoch": 1.26, "learning_rate": 0.00011035194950205566, "loss": 0.028, "step": 195890 }, { "epoch": 1.26, "learning_rate": 0.00011034226814769874, "loss": 0.0282, "step": 195900 }, { "epoch": 1.26, "learning_rate": 0.0001103325867933418, "loss": 0.0261, "step": 195910 }, { "epoch": 1.26, "learning_rate": 0.00011032290543898486, "loss": 0.0304, "step": 195920 }, { "epoch": 1.26, "learning_rate": 0.00011031322408462794, "loss": 0.0308, "step": 195930 }, { "epoch": 1.26, "learning_rate": 0.00011030354273027101, "loss": 0.0313, "step": 195940 }, { "epoch": 1.26, "learning_rate": 0.00011029386137591406, "loss": 0.037, "step": 195950 }, { "epoch": 1.26, "learning_rate": 0.00011028418002155714, "loss": 0.0287, "step": 195960 }, { "epoch": 1.26, "learning_rate": 0.0001102744986672002, "loss": 0.0373, "step": 195970 }, { "epoch": 1.26, "learning_rate": 0.00011026481731284327, "loss": 0.0303, "step": 195980 }, { "epoch": 1.26, "learning_rate": 0.00011025513595848634, "loss": 0.0312, "step": 195990 }, { "epoch": 1.27, "learning_rate": 0.00011024545460412942, "loss": 0.0395, "step": 196000 }, { "epoch": 1.27, "eval_cer": 0.9198987685007344, "eval_loss": 0.022464269772171974, "eval_runtime": 120.2, "eval_samples_per_second": 16.639, "eval_steps_per_second": 4.16, "step": 196000 }, { "epoch": 1.27, "learning_rate": 0.00011023577324977248, "loss": 0.0302, "step": 196010 }, { "epoch": 1.27, "learning_rate": 0.00011022609189541554, "loss": 0.0254, "step": 196020 }, { "epoch": 1.27, "learning_rate": 0.00011021641054105862, "loss": 0.0367, "step": 196030 }, { "epoch": 1.27, "learning_rate": 0.00011020672918670168, "loss": 0.0304, "step": 196040 }, { "epoch": 1.27, "learning_rate": 0.00011019704783234474, "loss": 0.0324, "step": 196050 }, { "epoch": 1.27, "learning_rate": 0.00011018736647798782, "loss": 0.0333, "step": 196060 }, { "epoch": 1.27, "learning_rate": 0.00011017768512363088, "loss": 0.0355, "step": 196070 }, { "epoch": 1.27, "learning_rate": 0.00011016800376927396, "loss": 0.0341, "step": 196080 }, { "epoch": 1.27, "learning_rate": 0.00011015832241491701, "loss": 0.0261, "step": 196090 }, { "epoch": 1.27, "learning_rate": 0.0001101486410605601, "loss": 0.0288, "step": 196100 }, { "epoch": 1.27, "learning_rate": 0.00011013895970620316, "loss": 0.0319, "step": 196110 }, { "epoch": 1.27, "learning_rate": 0.00011012927835184621, "loss": 0.0264, "step": 196120 }, { "epoch": 1.27, "learning_rate": 0.00011011959699748929, "loss": 0.0246, "step": 196130 }, { "epoch": 1.27, "learning_rate": 0.00011010991564313236, "loss": 0.0307, "step": 196140 }, { "epoch": 1.27, "learning_rate": 0.00011010023428877544, "loss": 0.0316, "step": 196150 }, { "epoch": 1.27, "learning_rate": 0.00011009055293441849, "loss": 0.0281, "step": 196160 }, { "epoch": 1.27, "learning_rate": 0.00011008087158006156, "loss": 0.0329, "step": 196170 }, { "epoch": 1.27, "learning_rate": 0.00011007119022570464, "loss": 0.0336, "step": 196180 }, { "epoch": 1.27, "learning_rate": 0.00011006150887134769, "loss": 0.0285, "step": 196190 }, { "epoch": 1.27, "learning_rate": 0.00011005182751699077, "loss": 0.0302, "step": 196200 }, { "epoch": 1.27, "learning_rate": 0.00011004214616263384, "loss": 0.0343, "step": 196210 }, { "epoch": 1.27, "learning_rate": 0.00011003246480827692, "loss": 0.0327, "step": 196220 }, { "epoch": 1.27, "learning_rate": 0.00011002278345391997, "loss": 0.0278, "step": 196230 }, { "epoch": 1.27, "learning_rate": 0.00011001310209956304, "loss": 0.0264, "step": 196240 }, { "epoch": 1.27, "learning_rate": 0.00011000342074520612, "loss": 0.0335, "step": 196250 }, { "epoch": 1.27, "learning_rate": 0.00010999373939084917, "loss": 0.0311, "step": 196260 }, { "epoch": 1.27, "learning_rate": 0.00010998405803649223, "loss": 0.0284, "step": 196270 }, { "epoch": 1.27, "learning_rate": 0.00010997437668213531, "loss": 0.0341, "step": 196280 }, { "epoch": 1.27, "learning_rate": 0.00010996469532777838, "loss": 0.0324, "step": 196290 }, { "epoch": 1.27, "learning_rate": 0.00010995501397342145, "loss": 0.0272, "step": 196300 }, { "epoch": 1.27, "learning_rate": 0.00010994533261906451, "loss": 0.0281, "step": 196310 }, { "epoch": 1.27, "learning_rate": 0.00010993565126470759, "loss": 0.0296, "step": 196320 }, { "epoch": 1.27, "learning_rate": 0.00010992596991035064, "loss": 0.0267, "step": 196330 }, { "epoch": 1.27, "learning_rate": 0.00010991628855599371, "loss": 0.0254, "step": 196340 }, { "epoch": 1.27, "learning_rate": 0.00010990660720163679, "loss": 0.032, "step": 196350 }, { "epoch": 1.27, "learning_rate": 0.00010989692584727986, "loss": 0.0296, "step": 196360 }, { "epoch": 1.27, "learning_rate": 0.00010988724449292291, "loss": 0.0272, "step": 196370 }, { "epoch": 1.27, "learning_rate": 0.00010987756313856599, "loss": 0.03, "step": 196380 }, { "epoch": 1.27, "learning_rate": 0.00010986788178420906, "loss": 0.0257, "step": 196390 }, { "epoch": 1.27, "learning_rate": 0.00010985820042985212, "loss": 0.0324, "step": 196400 }, { "epoch": 1.27, "learning_rate": 0.00010984851907549519, "loss": 0.0323, "step": 196410 }, { "epoch": 1.27, "learning_rate": 0.00010983883772113827, "loss": 0.0279, "step": 196420 }, { "epoch": 1.27, "learning_rate": 0.00010982915636678133, "loss": 0.0357, "step": 196430 }, { "epoch": 1.27, "learning_rate": 0.00010981947501242439, "loss": 0.0305, "step": 196440 }, { "epoch": 1.27, "learning_rate": 0.00010980979365806747, "loss": 0.0281, "step": 196450 }, { "epoch": 1.27, "learning_rate": 0.00010980011230371053, "loss": 0.0333, "step": 196460 }, { "epoch": 1.27, "learning_rate": 0.00010979043094935359, "loss": 0.0281, "step": 196470 }, { "epoch": 1.27, "learning_rate": 0.00010978074959499667, "loss": 0.0263, "step": 196480 }, { "epoch": 1.27, "learning_rate": 0.00010977106824063973, "loss": 0.0278, "step": 196490 }, { "epoch": 1.27, "learning_rate": 0.00010976138688628281, "loss": 0.0284, "step": 196500 }, { "epoch": 1.27, "learning_rate": 0.00010975170553192586, "loss": 0.0284, "step": 196510 }, { "epoch": 1.27, "learning_rate": 0.00010974202417756894, "loss": 0.0314, "step": 196520 }, { "epoch": 1.27, "learning_rate": 0.00010973234282321201, "loss": 0.0306, "step": 196530 }, { "epoch": 1.27, "learning_rate": 0.00010972266146885506, "loss": 0.026, "step": 196540 }, { "epoch": 1.27, "learning_rate": 0.00010971298011449814, "loss": 0.0262, "step": 196550 }, { "epoch": 1.27, "learning_rate": 0.00010970329876014121, "loss": 0.0296, "step": 196560 }, { "epoch": 1.27, "learning_rate": 0.00010969361740578429, "loss": 0.0374, "step": 196570 }, { "epoch": 1.27, "learning_rate": 0.00010968393605142734, "loss": 0.0263, "step": 196580 }, { "epoch": 1.27, "learning_rate": 0.00010967425469707041, "loss": 0.0328, "step": 196590 }, { "epoch": 1.27, "learning_rate": 0.00010966457334271349, "loss": 0.0335, "step": 196600 }, { "epoch": 1.27, "learning_rate": 0.00010965489198835654, "loss": 0.0354, "step": 196610 }, { "epoch": 1.27, "learning_rate": 0.00010964521063399962, "loss": 0.0292, "step": 196620 }, { "epoch": 1.27, "learning_rate": 0.00010963552927964269, "loss": 0.0404, "step": 196630 }, { "epoch": 1.27, "learning_rate": 0.00010962584792528575, "loss": 0.0311, "step": 196640 }, { "epoch": 1.27, "learning_rate": 0.00010961616657092882, "loss": 0.0334, "step": 196650 }, { "epoch": 1.27, "learning_rate": 0.00010960648521657189, "loss": 0.0289, "step": 196660 }, { "epoch": 1.27, "learning_rate": 0.00010959680386221496, "loss": 0.0363, "step": 196670 }, { "epoch": 1.27, "learning_rate": 0.00010958712250785802, "loss": 0.029, "step": 196680 }, { "epoch": 1.27, "learning_rate": 0.00010957744115350108, "loss": 0.0268, "step": 196690 }, { "epoch": 1.27, "learning_rate": 0.00010956775979914416, "loss": 0.0322, "step": 196700 }, { "epoch": 1.27, "learning_rate": 0.00010955807844478723, "loss": 0.0322, "step": 196710 }, { "epoch": 1.27, "learning_rate": 0.0001095483970904303, "loss": 0.0245, "step": 196720 }, { "epoch": 1.27, "learning_rate": 0.00010953871573607336, "loss": 0.0335, "step": 196730 }, { "epoch": 1.27, "learning_rate": 0.00010952903438171643, "loss": 0.0291, "step": 196740 }, { "epoch": 1.27, "learning_rate": 0.0001095193530273595, "loss": 0.0298, "step": 196750 }, { "epoch": 1.27, "learning_rate": 0.00010950967167300256, "loss": 0.0257, "step": 196760 }, { "epoch": 1.27, "learning_rate": 0.00010949999031864564, "loss": 0.0312, "step": 196770 }, { "epoch": 1.27, "learning_rate": 0.00010949030896428871, "loss": 0.0323, "step": 196780 }, { "epoch": 1.27, "learning_rate": 0.00010948062760993176, "loss": 0.027, "step": 196790 }, { "epoch": 1.27, "learning_rate": 0.00010947094625557484, "loss": 0.034, "step": 196800 }, { "epoch": 1.27, "learning_rate": 0.0001094612649012179, "loss": 0.0299, "step": 196810 }, { "epoch": 1.27, "learning_rate": 0.00010945158354686097, "loss": 0.0258, "step": 196820 }, { "epoch": 1.27, "learning_rate": 0.00010944190219250404, "loss": 0.0292, "step": 196830 }, { "epoch": 1.27, "learning_rate": 0.0001094322208381471, "loss": 0.0276, "step": 196840 }, { "epoch": 1.27, "learning_rate": 0.00010942253948379018, "loss": 0.0303, "step": 196850 }, { "epoch": 1.27, "learning_rate": 0.00010941285812943324, "loss": 0.0371, "step": 196860 }, { "epoch": 1.27, "learning_rate": 0.00010940317677507632, "loss": 0.0298, "step": 196870 }, { "epoch": 1.27, "learning_rate": 0.00010939349542071938, "loss": 0.0339, "step": 196880 }, { "epoch": 1.27, "learning_rate": 0.00010938381406636244, "loss": 0.0312, "step": 196890 }, { "epoch": 1.27, "learning_rate": 0.00010937413271200552, "loss": 0.0336, "step": 196900 }, { "epoch": 1.27, "learning_rate": 0.00010936445135764858, "loss": 0.0261, "step": 196910 }, { "epoch": 1.27, "learning_rate": 0.00010935477000329166, "loss": 0.0277, "step": 196920 }, { "epoch": 1.27, "learning_rate": 0.00010934508864893471, "loss": 0.0331, "step": 196930 }, { "epoch": 1.27, "learning_rate": 0.00010933540729457778, "loss": 0.0302, "step": 196940 }, { "epoch": 1.27, "learning_rate": 0.00010932572594022086, "loss": 0.029, "step": 196950 }, { "epoch": 1.27, "learning_rate": 0.00010931604458586391, "loss": 0.032, "step": 196960 }, { "epoch": 1.27, "learning_rate": 0.00010930636323150699, "loss": 0.0341, "step": 196970 }, { "epoch": 1.27, "learning_rate": 0.00010929668187715006, "loss": 0.0323, "step": 196980 }, { "epoch": 1.27, "learning_rate": 0.00010928700052279314, "loss": 0.0309, "step": 196990 }, { "epoch": 1.27, "learning_rate": 0.00010927731916843619, "loss": 0.0268, "step": 197000 }, { "epoch": 1.27, "eval_cer": 0.919872556773246, "eval_loss": 0.022425523027777672, "eval_runtime": 120.1817, "eval_samples_per_second": 16.641, "eval_steps_per_second": 4.16, "step": 197000 }, { "epoch": 1.27, "learning_rate": 0.00010926763781407926, "loss": 0.0271, "step": 197010 }, { "epoch": 1.27, "learning_rate": 0.00010925795645972234, "loss": 0.0324, "step": 197020 }, { "epoch": 1.27, "learning_rate": 0.00010924827510536539, "loss": 0.0242, "step": 197030 }, { "epoch": 1.27, "learning_rate": 0.00010923859375100846, "loss": 0.028, "step": 197040 }, { "epoch": 1.27, "learning_rate": 0.00010922891239665154, "loss": 0.0284, "step": 197050 }, { "epoch": 1.27, "learning_rate": 0.0001092192310422946, "loss": 0.0314, "step": 197060 }, { "epoch": 1.27, "learning_rate": 0.00010920954968793767, "loss": 0.0307, "step": 197070 }, { "epoch": 1.27, "learning_rate": 0.00010919986833358073, "loss": 0.0383, "step": 197080 }, { "epoch": 1.27, "learning_rate": 0.00010919018697922381, "loss": 0.0278, "step": 197090 }, { "epoch": 1.27, "learning_rate": 0.00010918050562486687, "loss": 0.0288, "step": 197100 }, { "epoch": 1.27, "learning_rate": 0.00010917082427050993, "loss": 0.0321, "step": 197110 }, { "epoch": 1.27, "learning_rate": 0.00010916114291615301, "loss": 0.0314, "step": 197120 }, { "epoch": 1.27, "learning_rate": 0.00010915146156179608, "loss": 0.025, "step": 197130 }, { "epoch": 1.27, "learning_rate": 0.00010914178020743913, "loss": 0.0322, "step": 197140 }, { "epoch": 1.27, "learning_rate": 0.00010913209885308221, "loss": 0.0395, "step": 197150 }, { "epoch": 1.27, "learning_rate": 0.00010912241749872528, "loss": 0.0284, "step": 197160 }, { "epoch": 1.27, "learning_rate": 0.00010911273614436834, "loss": 0.0293, "step": 197170 }, { "epoch": 1.27, "learning_rate": 0.00010910305479001141, "loss": 0.0377, "step": 197180 }, { "epoch": 1.27, "learning_rate": 0.00010909337343565449, "loss": 0.0319, "step": 197190 }, { "epoch": 1.27, "learning_rate": 0.00010908369208129756, "loss": 0.036, "step": 197200 }, { "epoch": 1.27, "learning_rate": 0.00010907401072694061, "loss": 0.0279, "step": 197210 }, { "epoch": 1.27, "learning_rate": 0.00010906432937258369, "loss": 0.0303, "step": 197220 }, { "epoch": 1.27, "learning_rate": 0.00010905464801822676, "loss": 0.0292, "step": 197230 }, { "epoch": 1.27, "learning_rate": 0.00010904496666386981, "loss": 0.0285, "step": 197240 }, { "epoch": 1.27, "learning_rate": 0.00010903528530951289, "loss": 0.0392, "step": 197250 }, { "epoch": 1.27, "learning_rate": 0.00010902560395515595, "loss": 0.0299, "step": 197260 }, { "epoch": 1.27, "learning_rate": 0.00010901592260079903, "loss": 0.0263, "step": 197270 }, { "epoch": 1.27, "learning_rate": 0.00010900624124644209, "loss": 0.0244, "step": 197280 }, { "epoch": 1.27, "learning_rate": 0.00010899655989208517, "loss": 0.0294, "step": 197290 }, { "epoch": 1.27, "learning_rate": 0.00010898687853772823, "loss": 0.0325, "step": 197300 }, { "epoch": 1.27, "learning_rate": 0.00010897719718337129, "loss": 0.0322, "step": 197310 }, { "epoch": 1.27, "learning_rate": 0.00010896751582901437, "loss": 0.0257, "step": 197320 }, { "epoch": 1.27, "learning_rate": 0.00010895783447465743, "loss": 0.0341, "step": 197330 }, { "epoch": 1.27, "learning_rate": 0.00010894815312030051, "loss": 0.0326, "step": 197340 }, { "epoch": 1.27, "learning_rate": 0.00010893847176594356, "loss": 0.0308, "step": 197350 }, { "epoch": 1.27, "learning_rate": 0.00010892879041158663, "loss": 0.0295, "step": 197360 }, { "epoch": 1.27, "learning_rate": 0.00010891910905722971, "loss": 0.0274, "step": 197370 }, { "epoch": 1.27, "learning_rate": 0.00010890942770287276, "loss": 0.0298, "step": 197380 }, { "epoch": 1.27, "learning_rate": 0.00010889974634851584, "loss": 0.0302, "step": 197390 }, { "epoch": 1.27, "learning_rate": 0.00010889006499415891, "loss": 0.0281, "step": 197400 }, { "epoch": 1.27, "learning_rate": 0.00010888038363980199, "loss": 0.0292, "step": 197410 }, { "epoch": 1.27, "learning_rate": 0.00010887070228544504, "loss": 0.0295, "step": 197420 }, { "epoch": 1.27, "learning_rate": 0.00010886102093108811, "loss": 0.0343, "step": 197430 }, { "epoch": 1.27, "learning_rate": 0.00010885133957673119, "loss": 0.0295, "step": 197440 }, { "epoch": 1.27, "learning_rate": 0.00010884165822237424, "loss": 0.0308, "step": 197450 }, { "epoch": 1.27, "learning_rate": 0.0001088319768680173, "loss": 0.0315, "step": 197460 }, { "epoch": 1.27, "learning_rate": 0.00010882229551366039, "loss": 0.0307, "step": 197470 }, { "epoch": 1.27, "learning_rate": 0.00010881261415930345, "loss": 0.0275, "step": 197480 }, { "epoch": 1.27, "learning_rate": 0.00010880293280494652, "loss": 0.0257, "step": 197490 }, { "epoch": 1.27, "learning_rate": 0.00010879325145058958, "loss": 0.0293, "step": 197500 }, { "epoch": 1.27, "learning_rate": 0.00010878357009623266, "loss": 0.0336, "step": 197510 }, { "epoch": 1.27, "learning_rate": 0.00010877388874187572, "loss": 0.0306, "step": 197520 }, { "epoch": 1.27, "learning_rate": 0.00010876420738751878, "loss": 0.0338, "step": 197530 }, { "epoch": 1.27, "learning_rate": 0.00010875452603316186, "loss": 0.0299, "step": 197540 }, { "epoch": 1.28, "learning_rate": 0.00010874484467880493, "loss": 0.0314, "step": 197550 }, { "epoch": 1.28, "learning_rate": 0.00010873516332444798, "loss": 0.027, "step": 197560 }, { "epoch": 1.28, "learning_rate": 0.00010872548197009106, "loss": 0.0338, "step": 197570 }, { "epoch": 1.28, "learning_rate": 0.00010871580061573413, "loss": 0.031, "step": 197580 }, { "epoch": 1.28, "learning_rate": 0.0001087061192613772, "loss": 0.0318, "step": 197590 }, { "epoch": 1.28, "learning_rate": 0.00010869643790702026, "loss": 0.0297, "step": 197600 }, { "epoch": 1.28, "learning_rate": 0.00010868675655266334, "loss": 0.0316, "step": 197610 }, { "epoch": 1.28, "learning_rate": 0.0001086770751983064, "loss": 0.0335, "step": 197620 }, { "epoch": 1.28, "learning_rate": 0.00010866739384394946, "loss": 0.0308, "step": 197630 }, { "epoch": 1.28, "learning_rate": 0.00010865771248959254, "loss": 0.029, "step": 197640 }, { "epoch": 1.28, "learning_rate": 0.0001086480311352356, "loss": 0.0299, "step": 197650 }, { "epoch": 1.28, "learning_rate": 0.00010863834978087866, "loss": 0.0298, "step": 197660 }, { "epoch": 1.28, "learning_rate": 0.00010862866842652174, "loss": 0.0266, "step": 197670 }, { "epoch": 1.28, "learning_rate": 0.0001086189870721648, "loss": 0.0351, "step": 197680 }, { "epoch": 1.28, "learning_rate": 0.00010860930571780788, "loss": 0.0337, "step": 197690 }, { "epoch": 1.28, "learning_rate": 0.00010859962436345094, "loss": 0.0284, "step": 197700 }, { "epoch": 1.28, "learning_rate": 0.00010858994300909402, "loss": 0.0278, "step": 197710 }, { "epoch": 1.28, "learning_rate": 0.00010858026165473708, "loss": 0.0283, "step": 197720 }, { "epoch": 1.28, "learning_rate": 0.00010857058030038014, "loss": 0.0342, "step": 197730 }, { "epoch": 1.28, "learning_rate": 0.00010856089894602322, "loss": 0.0282, "step": 197740 }, { "epoch": 1.28, "learning_rate": 0.00010855121759166628, "loss": 0.0296, "step": 197750 }, { "epoch": 1.28, "learning_rate": 0.00010854153623730936, "loss": 0.0258, "step": 197760 }, { "epoch": 1.28, "learning_rate": 0.00010853185488295241, "loss": 0.0281, "step": 197770 }, { "epoch": 1.28, "learning_rate": 0.00010852217352859548, "loss": 0.0322, "step": 197780 }, { "epoch": 1.28, "learning_rate": 0.00010851249217423856, "loss": 0.0327, "step": 197790 }, { "epoch": 1.28, "learning_rate": 0.00010850281081988161, "loss": 0.0359, "step": 197800 }, { "epoch": 1.28, "learning_rate": 0.00010849312946552469, "loss": 0.0266, "step": 197810 }, { "epoch": 1.28, "learning_rate": 0.00010848344811116776, "loss": 0.0316, "step": 197820 }, { "epoch": 1.28, "learning_rate": 0.00010847376675681084, "loss": 0.0269, "step": 197830 }, { "epoch": 1.28, "learning_rate": 0.00010846408540245389, "loss": 0.0316, "step": 197840 }, { "epoch": 1.28, "learning_rate": 0.00010845440404809696, "loss": 0.0309, "step": 197850 }, { "epoch": 1.28, "learning_rate": 0.00010844472269374004, "loss": 0.0282, "step": 197860 }, { "epoch": 1.28, "learning_rate": 0.00010843504133938309, "loss": 0.0333, "step": 197870 }, { "epoch": 1.28, "learning_rate": 0.00010842535998502616, "loss": 0.028, "step": 197880 }, { "epoch": 1.28, "learning_rate": 0.00010841567863066924, "loss": 0.0287, "step": 197890 }, { "epoch": 1.28, "learning_rate": 0.0001084059972763123, "loss": 0.0336, "step": 197900 }, { "epoch": 1.28, "learning_rate": 0.00010839631592195537, "loss": 0.0306, "step": 197910 }, { "epoch": 1.28, "learning_rate": 0.00010838663456759843, "loss": 0.0245, "step": 197920 }, { "epoch": 1.28, "learning_rate": 0.00010837695321324151, "loss": 0.0295, "step": 197930 }, { "epoch": 1.28, "learning_rate": 0.00010836727185888457, "loss": 0.0267, "step": 197940 }, { "epoch": 1.28, "learning_rate": 0.00010835759050452763, "loss": 0.034, "step": 197950 }, { "epoch": 1.28, "learning_rate": 0.00010834790915017071, "loss": 0.0288, "step": 197960 }, { "epoch": 1.28, "learning_rate": 0.00010833822779581378, "loss": 0.0308, "step": 197970 }, { "epoch": 1.28, "learning_rate": 0.00010832854644145683, "loss": 0.029, "step": 197980 }, { "epoch": 1.28, "learning_rate": 0.00010831886508709991, "loss": 0.0287, "step": 197990 }, { "epoch": 1.28, "learning_rate": 0.00010830918373274298, "loss": 0.032, "step": 198000 }, { "epoch": 1.28, "eval_cer": 0.919873460625918, "eval_loss": 0.022191094234585762, "eval_runtime": 120.0906, "eval_samples_per_second": 16.654, "eval_steps_per_second": 4.164, "step": 198000 }, { "epoch": 1.28, "learning_rate": 0.00010829950237838604, "loss": 0.0277, "step": 198010 }, { "epoch": 1.28, "learning_rate": 0.00010828982102402911, "loss": 0.0295, "step": 198020 }, { "epoch": 1.28, "learning_rate": 0.00010828013966967219, "loss": 0.0316, "step": 198030 }, { "epoch": 1.28, "learning_rate": 0.00010827045831531524, "loss": 0.0327, "step": 198040 }, { "epoch": 1.28, "learning_rate": 0.00010826077696095831, "loss": 0.0337, "step": 198050 }, { "epoch": 1.28, "learning_rate": 0.00010825109560660139, "loss": 0.028, "step": 198060 }, { "epoch": 1.28, "learning_rate": 0.00010824141425224446, "loss": 0.0297, "step": 198070 }, { "epoch": 1.28, "learning_rate": 0.00010823173289788751, "loss": 0.0287, "step": 198080 }, { "epoch": 1.28, "learning_rate": 0.00010822205154353059, "loss": 0.0271, "step": 198090 }, { "epoch": 1.28, "learning_rate": 0.00010821237018917365, "loss": 0.0304, "step": 198100 }, { "epoch": 1.28, "learning_rate": 0.00010820268883481672, "loss": 0.0285, "step": 198110 }, { "epoch": 1.28, "learning_rate": 0.00010819300748045979, "loss": 0.0319, "step": 198120 }, { "epoch": 1.28, "learning_rate": 0.00010818332612610287, "loss": 0.0264, "step": 198130 }, { "epoch": 1.28, "learning_rate": 0.00010817364477174593, "loss": 0.0388, "step": 198140 }, { "epoch": 1.28, "learning_rate": 0.00010816396341738899, "loss": 0.0354, "step": 198150 }, { "epoch": 1.28, "learning_rate": 0.00010815428206303206, "loss": 0.0355, "step": 198160 }, { "epoch": 1.28, "learning_rate": 0.00010814460070867513, "loss": 0.0324, "step": 198170 }, { "epoch": 1.28, "learning_rate": 0.00010813491935431818, "loss": 0.0315, "step": 198180 }, { "epoch": 1.28, "learning_rate": 0.00010812523799996126, "loss": 0.0294, "step": 198190 }, { "epoch": 1.28, "learning_rate": 0.00010811555664560433, "loss": 0.0317, "step": 198200 }, { "epoch": 1.28, "learning_rate": 0.00010810587529124741, "loss": 0.028, "step": 198210 }, { "epoch": 1.28, "learning_rate": 0.00010809619393689046, "loss": 0.0267, "step": 198220 }, { "epoch": 1.28, "learning_rate": 0.00010808651258253354, "loss": 0.0317, "step": 198230 }, { "epoch": 1.28, "learning_rate": 0.00010807683122817661, "loss": 0.0355, "step": 198240 }, { "epoch": 1.28, "learning_rate": 0.00010806714987381966, "loss": 0.0304, "step": 198250 }, { "epoch": 1.28, "learning_rate": 0.00010805746851946274, "loss": 0.0298, "step": 198260 }, { "epoch": 1.28, "learning_rate": 0.00010804778716510581, "loss": 0.0322, "step": 198270 }, { "epoch": 1.28, "learning_rate": 0.00010803810581074889, "loss": 0.0278, "step": 198280 }, { "epoch": 1.28, "learning_rate": 0.00010802842445639194, "loss": 0.0326, "step": 198290 }, { "epoch": 1.28, "learning_rate": 0.000108018743102035, "loss": 0.0332, "step": 198300 }, { "epoch": 1.28, "learning_rate": 0.00010800906174767809, "loss": 0.0291, "step": 198310 }, { "epoch": 1.28, "learning_rate": 0.00010799938039332114, "loss": 0.027, "step": 198320 }, { "epoch": 1.28, "learning_rate": 0.00010798969903896422, "loss": 0.0318, "step": 198330 }, { "epoch": 1.28, "learning_rate": 0.00010798001768460728, "loss": 0.0329, "step": 198340 }, { "epoch": 1.28, "learning_rate": 0.00010797033633025035, "loss": 0.0279, "step": 198350 }, { "epoch": 1.28, "learning_rate": 0.00010796065497589342, "loss": 0.0329, "step": 198360 }, { "epoch": 1.28, "learning_rate": 0.00010795097362153648, "loss": 0.0263, "step": 198370 }, { "epoch": 1.28, "learning_rate": 0.00010794129226717956, "loss": 0.0342, "step": 198380 }, { "epoch": 1.28, "learning_rate": 0.00010793161091282262, "loss": 0.0313, "step": 198390 }, { "epoch": 1.28, "learning_rate": 0.00010792192955846568, "loss": 0.0332, "step": 198400 }, { "epoch": 1.28, "learning_rate": 0.00010791224820410876, "loss": 0.0359, "step": 198410 }, { "epoch": 1.28, "learning_rate": 0.00010790256684975183, "loss": 0.0267, "step": 198420 }, { "epoch": 1.28, "learning_rate": 0.0001078928854953949, "loss": 0.0341, "step": 198430 }, { "epoch": 1.28, "learning_rate": 0.00010788320414103796, "loss": 0.0292, "step": 198440 }, { "epoch": 1.28, "learning_rate": 0.00010787352278668103, "loss": 0.0329, "step": 198450 }, { "epoch": 1.28, "learning_rate": 0.00010786384143232409, "loss": 0.0326, "step": 198460 }, { "epoch": 1.28, "learning_rate": 0.00010785416007796716, "loss": 0.0319, "step": 198470 }, { "epoch": 1.28, "learning_rate": 0.00010784447872361024, "loss": 0.0262, "step": 198480 }, { "epoch": 1.28, "learning_rate": 0.0001078347973692533, "loss": 0.0277, "step": 198490 }, { "epoch": 1.28, "learning_rate": 0.00010782511601489636, "loss": 0.028, "step": 198500 }, { "epoch": 1.28, "learning_rate": 0.00010781543466053944, "loss": 0.0404, "step": 198510 }, { "epoch": 1.28, "learning_rate": 0.0001078057533061825, "loss": 0.0357, "step": 198520 }, { "epoch": 1.28, "learning_rate": 0.00010779607195182557, "loss": 0.0304, "step": 198530 }, { "epoch": 1.28, "learning_rate": 0.00010778639059746864, "loss": 0.0374, "step": 198540 }, { "epoch": 1.28, "learning_rate": 0.0001077767092431117, "loss": 0.0316, "step": 198550 }, { "epoch": 1.28, "learning_rate": 0.00010776702788875478, "loss": 0.038, "step": 198560 }, { "epoch": 1.28, "learning_rate": 0.00010775734653439783, "loss": 0.0295, "step": 198570 }, { "epoch": 1.28, "learning_rate": 0.00010774766518004091, "loss": 0.0325, "step": 198580 }, { "epoch": 1.28, "learning_rate": 0.00010773798382568398, "loss": 0.0309, "step": 198590 }, { "epoch": 1.28, "learning_rate": 0.00010772830247132703, "loss": 0.036, "step": 198600 }, { "epoch": 1.28, "learning_rate": 0.00010771862111697011, "loss": 0.0308, "step": 198610 }, { "epoch": 1.28, "learning_rate": 0.00010770893976261318, "loss": 0.0301, "step": 198620 }, { "epoch": 1.28, "learning_rate": 0.00010769925840825626, "loss": 0.0275, "step": 198630 }, { "epoch": 1.28, "learning_rate": 0.00010768957705389931, "loss": 0.0302, "step": 198640 }, { "epoch": 1.28, "learning_rate": 0.00010767989569954238, "loss": 0.0295, "step": 198650 }, { "epoch": 1.28, "learning_rate": 0.00010767021434518546, "loss": 0.0283, "step": 198660 }, { "epoch": 1.28, "learning_rate": 0.00010766053299082851, "loss": 0.029, "step": 198670 }, { "epoch": 1.28, "learning_rate": 0.00010765085163647159, "loss": 0.0323, "step": 198680 }, { "epoch": 1.28, "learning_rate": 0.00010764117028211466, "loss": 0.029, "step": 198690 }, { "epoch": 1.28, "learning_rate": 0.00010763148892775774, "loss": 0.0326, "step": 198700 }, { "epoch": 1.28, "learning_rate": 0.00010762180757340079, "loss": 0.0287, "step": 198710 }, { "epoch": 1.28, "learning_rate": 0.00010761212621904386, "loss": 0.025, "step": 198720 }, { "epoch": 1.28, "learning_rate": 0.00010760244486468694, "loss": 0.0319, "step": 198730 }, { "epoch": 1.28, "learning_rate": 0.00010759276351032999, "loss": 0.0274, "step": 198740 }, { "epoch": 1.28, "learning_rate": 0.00010758308215597305, "loss": 0.0266, "step": 198750 }, { "epoch": 1.28, "learning_rate": 0.00010757340080161613, "loss": 0.0331, "step": 198760 }, { "epoch": 1.28, "learning_rate": 0.0001075637194472592, "loss": 0.03, "step": 198770 }, { "epoch": 1.28, "learning_rate": 0.00010755403809290227, "loss": 0.0368, "step": 198780 }, { "epoch": 1.28, "learning_rate": 0.00010754435673854533, "loss": 0.0272, "step": 198790 }, { "epoch": 1.28, "learning_rate": 0.00010753467538418841, "loss": 0.0296, "step": 198800 }, { "epoch": 1.28, "learning_rate": 0.00010752499402983147, "loss": 0.033, "step": 198810 }, { "epoch": 1.28, "learning_rate": 0.00010751531267547453, "loss": 0.0282, "step": 198820 }, { "epoch": 1.28, "learning_rate": 0.00010750563132111761, "loss": 0.0303, "step": 198830 }, { "epoch": 1.28, "learning_rate": 0.00010749594996676068, "loss": 0.0276, "step": 198840 }, { "epoch": 1.28, "learning_rate": 0.00010748626861240373, "loss": 0.0277, "step": 198850 }, { "epoch": 1.28, "learning_rate": 0.00010747658725804681, "loss": 0.029, "step": 198860 }, { "epoch": 1.28, "learning_rate": 0.00010746690590368988, "loss": 0.0311, "step": 198870 }, { "epoch": 1.28, "learning_rate": 0.00010745722454933294, "loss": 0.0343, "step": 198880 }, { "epoch": 1.28, "learning_rate": 0.00010744754319497601, "loss": 0.0326, "step": 198890 }, { "epoch": 1.28, "learning_rate": 0.00010743786184061909, "loss": 0.0288, "step": 198900 }, { "epoch": 1.28, "learning_rate": 0.00010742818048626215, "loss": 0.0359, "step": 198910 }, { "epoch": 1.28, "learning_rate": 0.00010741849913190521, "loss": 0.0324, "step": 198920 }, { "epoch": 1.28, "learning_rate": 0.00010740881777754829, "loss": 0.0278, "step": 198930 }, { "epoch": 1.28, "learning_rate": 0.00010739913642319135, "loss": 0.0272, "step": 198940 }, { "epoch": 1.28, "learning_rate": 0.0001073894550688344, "loss": 0.0246, "step": 198950 }, { "epoch": 1.28, "learning_rate": 0.00010737977371447749, "loss": 0.035, "step": 198960 }, { "epoch": 1.28, "learning_rate": 0.00010737009236012055, "loss": 0.0303, "step": 198970 }, { "epoch": 1.28, "learning_rate": 0.00010736041100576363, "loss": 0.0431, "step": 198980 }, { "epoch": 1.28, "learning_rate": 0.00010735072965140668, "loss": 0.0306, "step": 198990 }, { "epoch": 1.28, "learning_rate": 0.00010734104829704976, "loss": 0.0328, "step": 199000 }, { "epoch": 1.28, "eval_cer": 0.9199132301434866, "eval_loss": 0.0220940038561821, "eval_runtime": 120.1709, "eval_samples_per_second": 16.643, "eval_steps_per_second": 4.161, "step": 199000 }, { "epoch": 1.28, "learning_rate": 0.00010733136694269283, "loss": 0.0302, "step": 199010 }, { "epoch": 1.28, "learning_rate": 0.00010732168558833588, "loss": 0.0261, "step": 199020 }, { "epoch": 1.28, "learning_rate": 0.00010731200423397896, "loss": 0.0289, "step": 199030 }, { "epoch": 1.28, "learning_rate": 0.00010730232287962203, "loss": 0.0292, "step": 199040 }, { "epoch": 1.28, "learning_rate": 0.00010729264152526511, "loss": 0.0308, "step": 199050 }, { "epoch": 1.28, "learning_rate": 0.00010728296017090816, "loss": 0.0337, "step": 199060 }, { "epoch": 1.28, "learning_rate": 0.00010727327881655123, "loss": 0.026, "step": 199070 }, { "epoch": 1.28, "learning_rate": 0.00010726359746219431, "loss": 0.0302, "step": 199080 }, { "epoch": 1.28, "learning_rate": 0.00010725391610783736, "loss": 0.0311, "step": 199090 }, { "epoch": 1.29, "learning_rate": 0.00010724423475348044, "loss": 0.0297, "step": 199100 }, { "epoch": 1.29, "learning_rate": 0.0001072345533991235, "loss": 0.0344, "step": 199110 }, { "epoch": 1.29, "learning_rate": 0.00010722487204476659, "loss": 0.0288, "step": 199120 }, { "epoch": 1.29, "learning_rate": 0.00010721519069040964, "loss": 0.035, "step": 199130 }, { "epoch": 1.29, "learning_rate": 0.0001072055093360527, "loss": 0.0294, "step": 199140 }, { "epoch": 1.29, "learning_rate": 0.00010719582798169579, "loss": 0.0269, "step": 199150 }, { "epoch": 1.29, "learning_rate": 0.00010718614662733884, "loss": 0.029, "step": 199160 }, { "epoch": 1.29, "learning_rate": 0.0001071764652729819, "loss": 0.0298, "step": 199170 }, { "epoch": 1.29, "learning_rate": 0.00010716678391862498, "loss": 0.0355, "step": 199180 }, { "epoch": 1.29, "learning_rate": 0.00010715710256426805, "loss": 0.0338, "step": 199190 }, { "epoch": 1.29, "learning_rate": 0.00010714742120991112, "loss": 0.0315, "step": 199200 }, { "epoch": 1.29, "learning_rate": 0.00010713773985555418, "loss": 0.0379, "step": 199210 }, { "epoch": 1.29, "learning_rate": 0.00010712805850119726, "loss": 0.0433, "step": 199220 }, { "epoch": 1.29, "learning_rate": 0.00010711837714684032, "loss": 0.0281, "step": 199230 }, { "epoch": 1.29, "learning_rate": 0.00010710869579248338, "loss": 0.0283, "step": 199240 }, { "epoch": 1.29, "learning_rate": 0.00010709901443812646, "loss": 0.0324, "step": 199250 }, { "epoch": 1.29, "learning_rate": 0.00010708933308376953, "loss": 0.0263, "step": 199260 }, { "epoch": 1.29, "learning_rate": 0.00010707965172941258, "loss": 0.0291, "step": 199270 }, { "epoch": 1.29, "learning_rate": 0.00010706997037505566, "loss": 0.0307, "step": 199280 }, { "epoch": 1.29, "learning_rate": 0.00010706028902069873, "loss": 0.0316, "step": 199290 }, { "epoch": 1.29, "learning_rate": 0.00010705060766634179, "loss": 0.0293, "step": 199300 }, { "epoch": 1.29, "learning_rate": 0.00010704092631198486, "loss": 0.0397, "step": 199310 }, { "epoch": 1.29, "learning_rate": 0.00010703124495762794, "loss": 0.0334, "step": 199320 }, { "epoch": 1.29, "learning_rate": 0.000107021563603271, "loss": 0.0329, "step": 199330 }, { "epoch": 1.29, "learning_rate": 0.00010701188224891406, "loss": 0.0296, "step": 199340 }, { "epoch": 1.29, "learning_rate": 0.00010700220089455714, "loss": 0.0345, "step": 199350 }, { "epoch": 1.29, "learning_rate": 0.0001069925195402002, "loss": 0.0348, "step": 199360 }, { "epoch": 1.29, "learning_rate": 0.00010698283818584326, "loss": 0.0292, "step": 199370 }, { "epoch": 1.29, "learning_rate": 0.00010697315683148634, "loss": 0.0279, "step": 199380 }, { "epoch": 1.29, "learning_rate": 0.0001069634754771294, "loss": 0.0306, "step": 199390 }, { "epoch": 1.29, "learning_rate": 0.00010695379412277248, "loss": 0.0302, "step": 199400 }, { "epoch": 1.29, "learning_rate": 0.00010694411276841553, "loss": 0.0339, "step": 199410 }, { "epoch": 1.29, "learning_rate": 0.00010693443141405861, "loss": 0.0295, "step": 199420 }, { "epoch": 1.29, "learning_rate": 0.00010692475005970168, "loss": 0.0305, "step": 199430 }, { "epoch": 1.29, "learning_rate": 0.00010691506870534473, "loss": 0.0298, "step": 199440 }, { "epoch": 1.29, "learning_rate": 0.00010690538735098781, "loss": 0.0328, "step": 199450 }, { "epoch": 1.29, "learning_rate": 0.00010689570599663088, "loss": 0.0317, "step": 199460 }, { "epoch": 1.29, "learning_rate": 0.00010688602464227396, "loss": 0.0312, "step": 199470 }, { "epoch": 1.29, "learning_rate": 0.00010687634328791701, "loss": 0.032, "step": 199480 }, { "epoch": 1.29, "learning_rate": 0.00010686666193356008, "loss": 0.0293, "step": 199490 }, { "epoch": 1.29, "learning_rate": 0.00010685698057920316, "loss": 0.0383, "step": 199500 }, { "epoch": 1.29, "learning_rate": 0.00010684729922484621, "loss": 0.0341, "step": 199510 }, { "epoch": 1.29, "learning_rate": 0.00010683761787048929, "loss": 0.0316, "step": 199520 }, { "epoch": 1.29, "learning_rate": 0.00010682793651613236, "loss": 0.0372, "step": 199530 }, { "epoch": 1.29, "learning_rate": 0.00010681825516177542, "loss": 0.0263, "step": 199540 }, { "epoch": 1.29, "learning_rate": 0.00010680857380741849, "loss": 0.0378, "step": 199550 }, { "epoch": 1.29, "learning_rate": 0.00010679889245306156, "loss": 0.0277, "step": 199560 }, { "epoch": 1.29, "learning_rate": 0.00010678921109870463, "loss": 0.031, "step": 199570 }, { "epoch": 1.29, "learning_rate": 0.00010677952974434769, "loss": 0.0288, "step": 199580 }, { "epoch": 1.29, "learning_rate": 0.00010676984838999075, "loss": 0.0316, "step": 199590 }, { "epoch": 1.29, "learning_rate": 0.00010676016703563383, "loss": 0.0304, "step": 199600 }, { "epoch": 1.29, "learning_rate": 0.0001067504856812769, "loss": 0.0302, "step": 199610 }, { "epoch": 1.29, "learning_rate": 0.00010674080432691997, "loss": 0.0332, "step": 199620 }, { "epoch": 1.29, "learning_rate": 0.00010673112297256303, "loss": 0.0293, "step": 199630 }, { "epoch": 1.29, "learning_rate": 0.0001067214416182061, "loss": 0.0337, "step": 199640 }, { "epoch": 1.29, "learning_rate": 0.00010671176026384916, "loss": 0.034, "step": 199650 }, { "epoch": 1.29, "learning_rate": 0.00010670207890949223, "loss": 0.0306, "step": 199660 }, { "epoch": 1.29, "learning_rate": 0.00010669239755513531, "loss": 0.0292, "step": 199670 }, { "epoch": 1.29, "learning_rate": 0.00010668271620077838, "loss": 0.0311, "step": 199680 }, { "epoch": 1.29, "learning_rate": 0.00010667303484642143, "loss": 0.0344, "step": 199690 }, { "epoch": 1.29, "learning_rate": 0.00010666335349206451, "loss": 0.0283, "step": 199700 }, { "epoch": 1.29, "learning_rate": 0.00010665367213770758, "loss": 0.0321, "step": 199710 }, { "epoch": 1.29, "learning_rate": 0.00010664399078335064, "loss": 0.0316, "step": 199720 }, { "epoch": 1.29, "learning_rate": 0.00010663430942899371, "loss": 0.0342, "step": 199730 }, { "epoch": 1.29, "learning_rate": 0.00010662462807463677, "loss": 0.0303, "step": 199740 }, { "epoch": 1.29, "learning_rate": 0.00010661494672027985, "loss": 0.0272, "step": 199750 }, { "epoch": 1.29, "learning_rate": 0.00010660526536592291, "loss": 0.0325, "step": 199760 }, { "epoch": 1.29, "learning_rate": 0.00010659558401156599, "loss": 0.0317, "step": 199770 }, { "epoch": 1.29, "learning_rate": 0.00010658590265720905, "loss": 0.0366, "step": 199780 }, { "epoch": 1.29, "learning_rate": 0.0001065762213028521, "loss": 0.0341, "step": 199790 }, { "epoch": 1.29, "learning_rate": 0.00010656653994849519, "loss": 0.0258, "step": 199800 }, { "epoch": 1.29, "learning_rate": 0.00010655685859413825, "loss": 0.0294, "step": 199810 }, { "epoch": 1.29, "learning_rate": 0.00010654717723978133, "loss": 0.0249, "step": 199820 }, { "epoch": 1.29, "learning_rate": 0.00010653749588542438, "loss": 0.0339, "step": 199830 }, { "epoch": 1.29, "learning_rate": 0.00010652781453106745, "loss": 0.0336, "step": 199840 }, { "epoch": 1.29, "learning_rate": 0.00010651813317671053, "loss": 0.0324, "step": 199850 }, { "epoch": 1.29, "learning_rate": 0.00010650845182235358, "loss": 0.0342, "step": 199860 }, { "epoch": 1.29, "learning_rate": 0.00010649877046799666, "loss": 0.0317, "step": 199870 }, { "epoch": 1.29, "learning_rate": 0.00010648908911363973, "loss": 0.0289, "step": 199880 }, { "epoch": 1.29, "learning_rate": 0.00010647940775928281, "loss": 0.0345, "step": 199890 }, { "epoch": 1.29, "learning_rate": 0.00010646972640492586, "loss": 0.0298, "step": 199900 }, { "epoch": 1.29, "learning_rate": 0.00010646004505056893, "loss": 0.0345, "step": 199910 }, { "epoch": 1.29, "learning_rate": 0.00010645036369621201, "loss": 0.0302, "step": 199920 }, { "epoch": 1.29, "learning_rate": 0.00010644068234185506, "loss": 0.0309, "step": 199930 }, { "epoch": 1.29, "learning_rate": 0.00010643100098749813, "loss": 0.0319, "step": 199940 }, { "epoch": 1.29, "learning_rate": 0.0001064213196331412, "loss": 0.0338, "step": 199950 }, { "epoch": 1.29, "learning_rate": 0.00010641163827878427, "loss": 0.031, "step": 199960 }, { "epoch": 1.29, "learning_rate": 0.00010640195692442734, "loss": 0.0279, "step": 199970 }, { "epoch": 1.29, "learning_rate": 0.0001063922755700704, "loss": 0.0289, "step": 199980 }, { "epoch": 1.29, "learning_rate": 0.00010638259421571348, "loss": 0.0311, "step": 199990 }, { "epoch": 1.29, "learning_rate": 0.00010637291286135654, "loss": 0.0278, "step": 200000 }, { "epoch": 1.29, "eval_cer": 0.9198264602869732, "eval_loss": 0.02203773520886898, "eval_runtime": 120.2041, "eval_samples_per_second": 16.638, "eval_steps_per_second": 4.16, "step": 200000 }, { "epoch": 1.29, "learning_rate": 0.0001063632315069996, "loss": 0.0299, "step": 200010 }, { "epoch": 1.29, "learning_rate": 0.00010635355015264268, "loss": 0.0331, "step": 200020 }, { "epoch": 1.29, "learning_rate": 0.00010634386879828575, "loss": 0.0334, "step": 200030 }, { "epoch": 1.29, "learning_rate": 0.0001063341874439288, "loss": 0.0365, "step": 200040 }, { "epoch": 1.29, "learning_rate": 0.00010632450608957188, "loss": 0.0291, "step": 200050 }, { "epoch": 1.29, "learning_rate": 0.00010631482473521495, "loss": 0.0294, "step": 200060 }, { "epoch": 1.29, "learning_rate": 0.00010630514338085801, "loss": 0.0349, "step": 200070 }, { "epoch": 1.29, "learning_rate": 0.00010629546202650108, "loss": 0.0325, "step": 200080 }, { "epoch": 1.29, "learning_rate": 0.00010628578067214416, "loss": 0.0291, "step": 200090 }, { "epoch": 1.29, "learning_rate": 0.00010627609931778723, "loss": 0.034, "step": 200100 }, { "epoch": 1.29, "learning_rate": 0.00010626641796343028, "loss": 0.0294, "step": 200110 }, { "epoch": 1.29, "learning_rate": 0.00010625673660907336, "loss": 0.0351, "step": 200120 }, { "epoch": 1.29, "learning_rate": 0.00010624705525471643, "loss": 0.0309, "step": 200130 }, { "epoch": 1.29, "learning_rate": 0.00010623737390035948, "loss": 0.0313, "step": 200140 }, { "epoch": 1.29, "learning_rate": 0.00010622769254600256, "loss": 0.0281, "step": 200150 }, { "epoch": 1.29, "learning_rate": 0.00010621801119164562, "loss": 0.0307, "step": 200160 }, { "epoch": 1.29, "learning_rate": 0.0001062083298372887, "loss": 0.032, "step": 200170 }, { "epoch": 1.29, "learning_rate": 0.00010619864848293176, "loss": 0.0313, "step": 200180 }, { "epoch": 1.29, "learning_rate": 0.00010618896712857484, "loss": 0.0351, "step": 200190 }, { "epoch": 1.29, "learning_rate": 0.0001061792857742179, "loss": 0.0314, "step": 200200 }, { "epoch": 1.29, "learning_rate": 0.00010616960441986096, "loss": 0.0461, "step": 200210 }, { "epoch": 1.29, "learning_rate": 0.00010615992306550404, "loss": 0.0269, "step": 200220 }, { "epoch": 1.29, "learning_rate": 0.0001061502417111471, "loss": 0.0349, "step": 200230 }, { "epoch": 1.29, "learning_rate": 0.00010614056035679018, "loss": 0.0294, "step": 200240 }, { "epoch": 1.29, "learning_rate": 0.00010613087900243323, "loss": 0.0244, "step": 200250 }, { "epoch": 1.29, "learning_rate": 0.0001061211976480763, "loss": 0.0282, "step": 200260 }, { "epoch": 1.29, "learning_rate": 0.00010611151629371938, "loss": 0.0297, "step": 200270 }, { "epoch": 1.29, "learning_rate": 0.00010610183493936243, "loss": 0.0319, "step": 200280 }, { "epoch": 1.29, "learning_rate": 0.00010609215358500551, "loss": 0.0272, "step": 200290 }, { "epoch": 1.29, "learning_rate": 0.00010608247223064858, "loss": 0.0311, "step": 200300 }, { "epoch": 1.29, "learning_rate": 0.00010607279087629166, "loss": 0.0334, "step": 200310 }, { "epoch": 1.29, "learning_rate": 0.00010606310952193471, "loss": 0.0279, "step": 200320 }, { "epoch": 1.29, "learning_rate": 0.00010605342816757778, "loss": 0.0292, "step": 200330 }, { "epoch": 1.29, "learning_rate": 0.00010604374681322086, "loss": 0.0302, "step": 200340 }, { "epoch": 1.29, "learning_rate": 0.00010603406545886391, "loss": 0.0289, "step": 200350 }, { "epoch": 1.29, "learning_rate": 0.00010602438410450698, "loss": 0.0309, "step": 200360 }, { "epoch": 1.29, "learning_rate": 0.00010601470275015006, "loss": 0.0297, "step": 200370 }, { "epoch": 1.29, "learning_rate": 0.00010600502139579312, "loss": 0.0327, "step": 200380 }, { "epoch": 1.29, "learning_rate": 0.00010599534004143619, "loss": 0.0236, "step": 200390 }, { "epoch": 1.29, "learning_rate": 0.00010598565868707925, "loss": 0.0266, "step": 200400 }, { "epoch": 1.29, "learning_rate": 0.00010597597733272233, "loss": 0.0299, "step": 200410 }, { "epoch": 1.29, "learning_rate": 0.00010596629597836539, "loss": 0.0334, "step": 200420 }, { "epoch": 1.29, "learning_rate": 0.00010595661462400845, "loss": 0.0266, "step": 200430 }, { "epoch": 1.29, "learning_rate": 0.00010594693326965153, "loss": 0.0324, "step": 200440 }, { "epoch": 1.29, "learning_rate": 0.0001059372519152946, "loss": 0.0303, "step": 200450 }, { "epoch": 1.29, "learning_rate": 0.00010592757056093765, "loss": 0.0316, "step": 200460 }, { "epoch": 1.29, "learning_rate": 0.00010591788920658073, "loss": 0.0305, "step": 200470 }, { "epoch": 1.29, "learning_rate": 0.0001059082078522238, "loss": 0.0318, "step": 200480 }, { "epoch": 1.29, "learning_rate": 0.00010589852649786686, "loss": 0.0303, "step": 200490 }, { "epoch": 1.29, "learning_rate": 0.00010588884514350993, "loss": 0.035, "step": 200500 }, { "epoch": 1.29, "learning_rate": 0.00010587916378915301, "loss": 0.031, "step": 200510 }, { "epoch": 1.29, "learning_rate": 0.00010586948243479608, "loss": 0.027, "step": 200520 }, { "epoch": 1.29, "learning_rate": 0.00010585980108043913, "loss": 0.0294, "step": 200530 }, { "epoch": 1.29, "learning_rate": 0.00010585011972608221, "loss": 0.0293, "step": 200540 }, { "epoch": 1.29, "learning_rate": 0.00010584043837172528, "loss": 0.0349, "step": 200550 }, { "epoch": 1.29, "learning_rate": 0.00010583075701736833, "loss": 0.0342, "step": 200560 }, { "epoch": 1.29, "learning_rate": 0.00010582107566301141, "loss": 0.0273, "step": 200570 }, { "epoch": 1.29, "learning_rate": 0.00010581139430865447, "loss": 0.0289, "step": 200580 }, { "epoch": 1.29, "learning_rate": 0.00010580171295429755, "loss": 0.0304, "step": 200590 }, { "epoch": 1.29, "learning_rate": 0.0001057920315999406, "loss": 0.0271, "step": 200600 }, { "epoch": 1.29, "learning_rate": 0.00010578235024558369, "loss": 0.0357, "step": 200610 }, { "epoch": 1.29, "learning_rate": 0.00010577266889122675, "loss": 0.0342, "step": 200620 }, { "epoch": 1.29, "learning_rate": 0.0001057629875368698, "loss": 0.0334, "step": 200630 }, { "epoch": 1.29, "learning_rate": 0.00010575330618251289, "loss": 0.029, "step": 200640 }, { "epoch": 1.3, "learning_rate": 0.00010574362482815595, "loss": 0.0276, "step": 200650 }, { "epoch": 1.3, "learning_rate": 0.00010573394347379903, "loss": 0.0235, "step": 200660 }, { "epoch": 1.3, "learning_rate": 0.00010572426211944208, "loss": 0.0314, "step": 200670 }, { "epoch": 1.3, "learning_rate": 0.00010571458076508515, "loss": 0.0304, "step": 200680 }, { "epoch": 1.3, "learning_rate": 0.00010570489941072823, "loss": 0.0348, "step": 200690 }, { "epoch": 1.3, "learning_rate": 0.00010569521805637128, "loss": 0.0248, "step": 200700 }, { "epoch": 1.3, "learning_rate": 0.00010568553670201436, "loss": 0.0307, "step": 200710 }, { "epoch": 1.3, "learning_rate": 0.00010567585534765743, "loss": 0.0309, "step": 200720 }, { "epoch": 1.3, "learning_rate": 0.0001056661739933005, "loss": 0.0269, "step": 200730 }, { "epoch": 1.3, "learning_rate": 0.00010565649263894356, "loss": 0.0287, "step": 200740 }, { "epoch": 1.3, "learning_rate": 0.00010564681128458663, "loss": 0.0283, "step": 200750 }, { "epoch": 1.3, "learning_rate": 0.00010563712993022971, "loss": 0.0338, "step": 200760 }, { "epoch": 1.3, "learning_rate": 0.00010562744857587276, "loss": 0.0282, "step": 200770 }, { "epoch": 1.3, "learning_rate": 0.00010561776722151583, "loss": 0.0295, "step": 200780 }, { "epoch": 1.3, "learning_rate": 0.0001056080858671589, "loss": 0.0258, "step": 200790 }, { "epoch": 1.3, "learning_rate": 0.00010559840451280197, "loss": 0.0262, "step": 200800 }, { "epoch": 1.3, "learning_rate": 0.00010558872315844504, "loss": 0.0276, "step": 200810 }, { "epoch": 1.3, "learning_rate": 0.0001055790418040881, "loss": 0.0288, "step": 200820 }, { "epoch": 1.3, "learning_rate": 0.00010556936044973117, "loss": 0.035, "step": 200830 }, { "epoch": 1.3, "learning_rate": 0.00010555967909537424, "loss": 0.031, "step": 200840 }, { "epoch": 1.3, "learning_rate": 0.0001055499977410173, "loss": 0.0341, "step": 200850 }, { "epoch": 1.3, "learning_rate": 0.00010554031638666038, "loss": 0.0319, "step": 200860 }, { "epoch": 1.3, "learning_rate": 0.00010553063503230345, "loss": 0.0339, "step": 200870 }, { "epoch": 1.3, "learning_rate": 0.0001055209536779465, "loss": 0.0269, "step": 200880 }, { "epoch": 1.3, "learning_rate": 0.00010551127232358958, "loss": 0.0365, "step": 200890 }, { "epoch": 1.3, "learning_rate": 0.00010550159096923265, "loss": 0.0312, "step": 200900 }, { "epoch": 1.3, "learning_rate": 0.00010549190961487571, "loss": 0.0327, "step": 200910 }, { "epoch": 1.3, "learning_rate": 0.00010548222826051878, "loss": 0.0308, "step": 200920 }, { "epoch": 1.3, "learning_rate": 0.00010547254690616185, "loss": 0.031, "step": 200930 }, { "epoch": 1.3, "learning_rate": 0.00010546286555180493, "loss": 0.0332, "step": 200940 }, { "epoch": 1.3, "learning_rate": 0.00010545318419744798, "loss": 0.0291, "step": 200950 }, { "epoch": 1.3, "learning_rate": 0.00010544350284309106, "loss": 0.0245, "step": 200960 }, { "epoch": 1.3, "learning_rate": 0.00010543382148873413, "loss": 0.0292, "step": 200970 }, { "epoch": 1.3, "learning_rate": 0.00010542414013437718, "loss": 0.0294, "step": 200980 }, { "epoch": 1.3, "learning_rate": 0.00010541445878002026, "loss": 0.0319, "step": 200990 }, { "epoch": 1.3, "learning_rate": 0.00010540477742566332, "loss": 0.029, "step": 201000 }, { "epoch": 1.3, "eval_cer": 0.9199159417015027, "eval_loss": 0.02207825891673565, "eval_runtime": 120.2757, "eval_samples_per_second": 16.628, "eval_steps_per_second": 4.157, "step": 201000 }, { "epoch": 1.3, "learning_rate": 0.0001053950960713064, "loss": 0.0365, "step": 201010 }, { "epoch": 1.3, "learning_rate": 0.00010538541471694946, "loss": 0.0312, "step": 201020 }, { "epoch": 1.3, "learning_rate": 0.00010537573336259252, "loss": 0.0304, "step": 201030 }, { "epoch": 1.3, "learning_rate": 0.0001053660520082356, "loss": 0.0306, "step": 201040 }, { "epoch": 1.3, "learning_rate": 0.00010535637065387866, "loss": 0.0321, "step": 201050 }, { "epoch": 1.3, "learning_rate": 0.00010534668929952173, "loss": 0.0307, "step": 201060 }, { "epoch": 1.3, "learning_rate": 0.0001053370079451648, "loss": 0.031, "step": 201070 }, { "epoch": 1.3, "learning_rate": 0.00010532732659080788, "loss": 0.0326, "step": 201080 }, { "epoch": 1.3, "learning_rate": 0.00010531764523645093, "loss": 0.0332, "step": 201090 }, { "epoch": 1.3, "learning_rate": 0.000105307963882094, "loss": 0.032, "step": 201100 }, { "epoch": 1.3, "learning_rate": 0.00010529828252773708, "loss": 0.0297, "step": 201110 }, { "epoch": 1.3, "learning_rate": 0.00010528860117338013, "loss": 0.0321, "step": 201120 }, { "epoch": 1.3, "learning_rate": 0.0001052789198190232, "loss": 0.0275, "step": 201130 }, { "epoch": 1.3, "learning_rate": 0.00010526923846466628, "loss": 0.0324, "step": 201140 }, { "epoch": 1.3, "learning_rate": 0.00010525955711030934, "loss": 0.0317, "step": 201150 }, { "epoch": 1.3, "learning_rate": 0.00010524987575595241, "loss": 0.0311, "step": 201160 }, { "epoch": 1.3, "learning_rate": 0.00010524019440159548, "loss": 0.0313, "step": 201170 }, { "epoch": 1.3, "learning_rate": 0.00010523051304723856, "loss": 0.0324, "step": 201180 }, { "epoch": 1.3, "learning_rate": 0.00010522083169288161, "loss": 0.0275, "step": 201190 }, { "epoch": 1.3, "learning_rate": 0.00010521115033852468, "loss": 0.0277, "step": 201200 }, { "epoch": 1.3, "learning_rate": 0.00010520146898416776, "loss": 0.0342, "step": 201210 }, { "epoch": 1.3, "learning_rate": 0.00010519178762981082, "loss": 0.0356, "step": 201220 }, { "epoch": 1.3, "learning_rate": 0.00010518210627545387, "loss": 0.0275, "step": 201230 }, { "epoch": 1.3, "learning_rate": 0.00010517242492109695, "loss": 0.0358, "step": 201240 }, { "epoch": 1.3, "learning_rate": 0.00010516274356674002, "loss": 0.0342, "step": 201250 }, { "epoch": 1.3, "learning_rate": 0.00010515306221238309, "loss": 0.0285, "step": 201260 }, { "epoch": 1.3, "learning_rate": 0.00010514338085802615, "loss": 0.0321, "step": 201270 }, { "epoch": 1.3, "learning_rate": 0.00010513369950366923, "loss": 0.0349, "step": 201280 }, { "epoch": 1.3, "learning_rate": 0.0001051240181493123, "loss": 0.0333, "step": 201290 }, { "epoch": 1.3, "learning_rate": 0.00010511433679495535, "loss": 0.0389, "step": 201300 }, { "epoch": 1.3, "learning_rate": 0.00010510465544059843, "loss": 0.029, "step": 201310 }, { "epoch": 1.3, "learning_rate": 0.0001050949740862415, "loss": 0.0231, "step": 201320 }, { "epoch": 1.3, "learning_rate": 0.00010508529273188455, "loss": 0.0262, "step": 201330 }, { "epoch": 1.3, "learning_rate": 0.00010507561137752763, "loss": 0.0328, "step": 201340 }, { "epoch": 1.3, "learning_rate": 0.0001050659300231707, "loss": 0.0298, "step": 201350 }, { "epoch": 1.3, "learning_rate": 0.00010505624866881378, "loss": 0.0342, "step": 201360 }, { "epoch": 1.3, "learning_rate": 0.00010504656731445683, "loss": 0.0334, "step": 201370 }, { "epoch": 1.3, "learning_rate": 0.00010503688596009991, "loss": 0.0281, "step": 201380 }, { "epoch": 1.3, "learning_rate": 0.00010502720460574298, "loss": 0.0283, "step": 201390 }, { "epoch": 1.3, "learning_rate": 0.00010501752325138603, "loss": 0.0315, "step": 201400 }, { "epoch": 1.3, "learning_rate": 0.00010500784189702911, "loss": 0.0245, "step": 201410 }, { "epoch": 1.3, "learning_rate": 0.00010499816054267217, "loss": 0.029, "step": 201420 }, { "epoch": 1.3, "learning_rate": 0.00010498847918831523, "loss": 0.0312, "step": 201430 }, { "epoch": 1.3, "learning_rate": 0.0001049787978339583, "loss": 0.0267, "step": 201440 }, { "epoch": 1.3, "learning_rate": 0.00010496911647960137, "loss": 0.0245, "step": 201450 }, { "epoch": 1.3, "learning_rate": 0.00010495943512524445, "loss": 0.0322, "step": 201460 }, { "epoch": 1.3, "learning_rate": 0.0001049497537708875, "loss": 0.034, "step": 201470 }, { "epoch": 1.3, "learning_rate": 0.00010494007241653058, "loss": 0.0266, "step": 201480 }, { "epoch": 1.3, "learning_rate": 0.00010493039106217365, "loss": 0.0323, "step": 201490 }, { "epoch": 1.3, "learning_rate": 0.0001049207097078167, "loss": 0.035, "step": 201500 }, { "epoch": 1.3, "learning_rate": 0.00010491102835345978, "loss": 0.0343, "step": 201510 }, { "epoch": 1.3, "learning_rate": 0.00010490134699910285, "loss": 0.0351, "step": 201520 }, { "epoch": 1.3, "learning_rate": 0.00010489166564474593, "loss": 0.0339, "step": 201530 }, { "epoch": 1.3, "learning_rate": 0.00010488198429038898, "loss": 0.0292, "step": 201540 }, { "epoch": 1.3, "learning_rate": 0.00010487230293603205, "loss": 0.03, "step": 201550 }, { "epoch": 1.3, "learning_rate": 0.00010486262158167513, "loss": 0.0324, "step": 201560 }, { "epoch": 1.3, "learning_rate": 0.00010485294022731818, "loss": 0.0314, "step": 201570 }, { "epoch": 1.3, "learning_rate": 0.00010484325887296126, "loss": 0.0255, "step": 201580 }, { "epoch": 1.3, "learning_rate": 0.00010483357751860433, "loss": 0.0296, "step": 201590 }, { "epoch": 1.3, "learning_rate": 0.0001048238961642474, "loss": 0.0275, "step": 201600 }, { "epoch": 1.3, "learning_rate": 0.00010481421480989046, "loss": 0.0309, "step": 201610 }, { "epoch": 1.3, "learning_rate": 0.00010480453345553353, "loss": 0.0286, "step": 201620 }, { "epoch": 1.3, "learning_rate": 0.0001047948521011766, "loss": 0.0344, "step": 201630 }, { "epoch": 1.3, "learning_rate": 0.00010478517074681966, "loss": 0.0235, "step": 201640 }, { "epoch": 1.3, "learning_rate": 0.00010477548939246272, "loss": 0.0303, "step": 201650 }, { "epoch": 1.3, "learning_rate": 0.0001047658080381058, "loss": 0.0318, "step": 201660 }, { "epoch": 1.3, "learning_rate": 0.00010475612668374887, "loss": 0.0371, "step": 201670 }, { "epoch": 1.3, "learning_rate": 0.00010474644532939194, "loss": 0.0257, "step": 201680 }, { "epoch": 1.3, "learning_rate": 0.000104736763975035, "loss": 0.0278, "step": 201690 }, { "epoch": 1.3, "learning_rate": 0.00010472708262067808, "loss": 0.0273, "step": 201700 }, { "epoch": 1.3, "learning_rate": 0.00010471740126632114, "loss": 0.0307, "step": 201710 }, { "epoch": 1.3, "learning_rate": 0.0001047077199119642, "loss": 0.0294, "step": 201720 }, { "epoch": 1.3, "learning_rate": 0.00010469803855760728, "loss": 0.0291, "step": 201730 }, { "epoch": 1.3, "learning_rate": 0.00010468835720325035, "loss": 0.0276, "step": 201740 }, { "epoch": 1.3, "learning_rate": 0.0001046786758488934, "loss": 0.0299, "step": 201750 }, { "epoch": 1.3, "learning_rate": 0.00010466899449453648, "loss": 0.0311, "step": 201760 }, { "epoch": 1.3, "learning_rate": 0.00010465931314017955, "loss": 0.0366, "step": 201770 }, { "epoch": 1.3, "learning_rate": 0.00010464963178582261, "loss": 0.0266, "step": 201780 }, { "epoch": 1.3, "learning_rate": 0.00010463995043146568, "loss": 0.0292, "step": 201790 }, { "epoch": 1.3, "learning_rate": 0.00010463026907710876, "loss": 0.0331, "step": 201800 }, { "epoch": 1.3, "learning_rate": 0.00010462058772275182, "loss": 0.0289, "step": 201810 }, { "epoch": 1.3, "learning_rate": 0.00010461090636839488, "loss": 0.0272, "step": 201820 }, { "epoch": 1.3, "learning_rate": 0.00010460122501403796, "loss": 0.0334, "step": 201830 }, { "epoch": 1.3, "learning_rate": 0.00010459154365968102, "loss": 0.0308, "step": 201840 }, { "epoch": 1.3, "learning_rate": 0.00010458186230532408, "loss": 0.0236, "step": 201850 }, { "epoch": 1.3, "learning_rate": 0.00010457218095096716, "loss": 0.0289, "step": 201860 }, { "epoch": 1.3, "learning_rate": 0.00010456249959661022, "loss": 0.0264, "step": 201870 }, { "epoch": 1.3, "learning_rate": 0.0001045528182422533, "loss": 0.026, "step": 201880 }, { "epoch": 1.3, "learning_rate": 0.00010454313688789635, "loss": 0.0375, "step": 201890 }, { "epoch": 1.3, "learning_rate": 0.00010453345553353943, "loss": 0.0372, "step": 201900 }, { "epoch": 1.3, "learning_rate": 0.0001045237741791825, "loss": 0.0309, "step": 201910 }, { "epoch": 1.3, "learning_rate": 0.00010451409282482555, "loss": 0.0264, "step": 201920 }, { "epoch": 1.3, "learning_rate": 0.00010450441147046863, "loss": 0.0307, "step": 201930 }, { "epoch": 1.3, "learning_rate": 0.0001044947301161117, "loss": 0.029, "step": 201940 }, { "epoch": 1.3, "learning_rate": 0.00010448504876175478, "loss": 0.0314, "step": 201950 }, { "epoch": 1.3, "learning_rate": 0.00010447536740739783, "loss": 0.0331, "step": 201960 }, { "epoch": 1.3, "learning_rate": 0.0001044656860530409, "loss": 0.0265, "step": 201970 }, { "epoch": 1.3, "learning_rate": 0.00010445600469868398, "loss": 0.0289, "step": 201980 }, { "epoch": 1.3, "learning_rate": 0.00010444632334432703, "loss": 0.0267, "step": 201990 }, { "epoch": 1.3, "learning_rate": 0.00010443664198997011, "loss": 0.0319, "step": 202000 }, { "epoch": 1.3, "eval_cer": 0.9198861145633261, "eval_loss": 0.02179008163511753, "eval_runtime": 120.2378, "eval_samples_per_second": 16.634, "eval_steps_per_second": 4.158, "step": 202000 }, { "epoch": 1.3, "learning_rate": 0.00010442696063561318, "loss": 0.0331, "step": 202010 }, { "epoch": 1.3, "learning_rate": 0.00010441727928125624, "loss": 0.0294, "step": 202020 }, { "epoch": 1.3, "learning_rate": 0.00010440759792689931, "loss": 0.0315, "step": 202030 }, { "epoch": 1.3, "learning_rate": 0.00010439791657254238, "loss": 0.0305, "step": 202040 }, { "epoch": 1.3, "learning_rate": 0.00010438823521818546, "loss": 0.0318, "step": 202050 }, { "epoch": 1.3, "learning_rate": 0.00010437855386382851, "loss": 0.0247, "step": 202060 }, { "epoch": 1.3, "learning_rate": 0.00010436887250947157, "loss": 0.0336, "step": 202070 }, { "epoch": 1.3, "learning_rate": 0.00010435919115511465, "loss": 0.0297, "step": 202080 }, { "epoch": 1.3, "learning_rate": 0.00010434950980075772, "loss": 0.0308, "step": 202090 }, { "epoch": 1.3, "learning_rate": 0.00010433982844640079, "loss": 0.0277, "step": 202100 }, { "epoch": 1.3, "learning_rate": 0.00010433014709204385, "loss": 0.0285, "step": 202110 }, { "epoch": 1.3, "learning_rate": 0.00010432046573768693, "loss": 0.0324, "step": 202120 }, { "epoch": 1.3, "learning_rate": 0.00010431078438332999, "loss": 0.0258, "step": 202130 }, { "epoch": 1.3, "learning_rate": 0.00010430110302897305, "loss": 0.04, "step": 202140 }, { "epoch": 1.3, "learning_rate": 0.00010429142167461613, "loss": 0.0281, "step": 202150 }, { "epoch": 1.3, "learning_rate": 0.0001042817403202592, "loss": 0.0359, "step": 202160 }, { "epoch": 1.3, "learning_rate": 0.00010427205896590225, "loss": 0.0375, "step": 202170 }, { "epoch": 1.3, "learning_rate": 0.00010426237761154533, "loss": 0.0358, "step": 202180 }, { "epoch": 1.3, "learning_rate": 0.0001042526962571884, "loss": 0.0351, "step": 202190 }, { "epoch": 1.31, "learning_rate": 0.00010424301490283146, "loss": 0.0262, "step": 202200 }, { "epoch": 1.31, "learning_rate": 0.00010423333354847453, "loss": 0.034, "step": 202210 }, { "epoch": 1.31, "learning_rate": 0.00010422365219411761, "loss": 0.0306, "step": 202220 }, { "epoch": 1.31, "learning_rate": 0.00010421397083976067, "loss": 0.0352, "step": 202230 }, { "epoch": 1.31, "learning_rate": 0.00010420428948540373, "loss": 0.03, "step": 202240 }, { "epoch": 1.31, "learning_rate": 0.00010419460813104681, "loss": 0.0331, "step": 202250 }, { "epoch": 1.31, "learning_rate": 0.00010418492677668987, "loss": 0.0396, "step": 202260 }, { "epoch": 1.31, "learning_rate": 0.00010417524542233293, "loss": 0.0328, "step": 202270 }, { "epoch": 1.31, "learning_rate": 0.000104165564067976, "loss": 0.0306, "step": 202280 }, { "epoch": 1.31, "learning_rate": 0.00010415588271361907, "loss": 0.0309, "step": 202290 }, { "epoch": 1.31, "learning_rate": 0.00010414620135926215, "loss": 0.0314, "step": 202300 }, { "epoch": 1.31, "learning_rate": 0.0001041365200049052, "loss": 0.0365, "step": 202310 }, { "epoch": 1.31, "learning_rate": 0.00010412683865054828, "loss": 0.0294, "step": 202320 }, { "epoch": 1.31, "learning_rate": 0.00010411715729619135, "loss": 0.0367, "step": 202330 }, { "epoch": 1.31, "learning_rate": 0.0001041074759418344, "loss": 0.0298, "step": 202340 }, { "epoch": 1.31, "learning_rate": 0.00010409779458747748, "loss": 0.0283, "step": 202350 }, { "epoch": 1.31, "learning_rate": 0.00010408811323312055, "loss": 0.0325, "step": 202360 }, { "epoch": 1.31, "learning_rate": 0.00010407843187876363, "loss": 0.029, "step": 202370 }, { "epoch": 1.31, "learning_rate": 0.00010406875052440668, "loss": 0.0302, "step": 202380 }, { "epoch": 1.31, "learning_rate": 0.00010405906917004975, "loss": 0.0307, "step": 202390 }, { "epoch": 1.31, "learning_rate": 0.00010404938781569283, "loss": 0.0317, "step": 202400 }, { "epoch": 1.31, "learning_rate": 0.00010403970646133588, "loss": 0.0337, "step": 202410 }, { "epoch": 1.31, "learning_rate": 0.00010403002510697896, "loss": 0.0258, "step": 202420 }, { "epoch": 1.31, "learning_rate": 0.00010402034375262203, "loss": 0.0329, "step": 202430 }, { "epoch": 1.31, "learning_rate": 0.00010401066239826509, "loss": 0.0317, "step": 202440 }, { "epoch": 1.31, "learning_rate": 0.00010400098104390816, "loss": 0.0347, "step": 202450 }, { "epoch": 1.31, "learning_rate": 0.00010399129968955123, "loss": 0.0288, "step": 202460 }, { "epoch": 1.31, "learning_rate": 0.0001039816183351943, "loss": 0.0335, "step": 202470 }, { "epoch": 1.31, "learning_rate": 0.00010397193698083736, "loss": 0.0275, "step": 202480 }, { "epoch": 1.31, "learning_rate": 0.00010396225562648042, "loss": 0.0291, "step": 202490 }, { "epoch": 1.31, "learning_rate": 0.0001039525742721235, "loss": 0.0243, "step": 202500 }, { "epoch": 1.31, "learning_rate": 0.00010394289291776657, "loss": 0.0367, "step": 202510 }, { "epoch": 1.31, "learning_rate": 0.00010393321156340964, "loss": 0.0258, "step": 202520 }, { "epoch": 1.31, "learning_rate": 0.0001039235302090527, "loss": 0.0343, "step": 202530 }, { "epoch": 1.31, "learning_rate": 0.00010391384885469577, "loss": 0.0252, "step": 202540 }, { "epoch": 1.31, "learning_rate": 0.00010390416750033884, "loss": 0.0324, "step": 202550 }, { "epoch": 1.31, "learning_rate": 0.0001038944861459819, "loss": 0.0312, "step": 202560 }, { "epoch": 1.31, "learning_rate": 0.00010388480479162498, "loss": 0.0299, "step": 202570 }, { "epoch": 1.31, "learning_rate": 0.00010387512343726805, "loss": 0.0314, "step": 202580 }, { "epoch": 1.31, "learning_rate": 0.0001038654420829111, "loss": 0.0357, "step": 202590 }, { "epoch": 1.31, "learning_rate": 0.00010385576072855418, "loss": 0.026, "step": 202600 }, { "epoch": 1.31, "learning_rate": 0.00010384607937419725, "loss": 0.0304, "step": 202610 }, { "epoch": 1.31, "learning_rate": 0.00010383639801984031, "loss": 0.0304, "step": 202620 }, { "epoch": 1.31, "learning_rate": 0.00010382671666548338, "loss": 0.0293, "step": 202630 }, { "epoch": 1.31, "learning_rate": 0.00010381703531112644, "loss": 0.0338, "step": 202640 }, { "epoch": 1.31, "learning_rate": 0.00010380735395676952, "loss": 0.0284, "step": 202650 }, { "epoch": 1.31, "learning_rate": 0.00010379767260241258, "loss": 0.0257, "step": 202660 }, { "epoch": 1.31, "learning_rate": 0.00010378799124805566, "loss": 0.0302, "step": 202670 }, { "epoch": 1.31, "learning_rate": 0.00010377830989369872, "loss": 0.0281, "step": 202680 }, { "epoch": 1.31, "learning_rate": 0.00010376862853934178, "loss": 0.0253, "step": 202690 }, { "epoch": 1.31, "learning_rate": 0.00010375894718498486, "loss": 0.0339, "step": 202700 }, { "epoch": 1.31, "learning_rate": 0.00010374926583062792, "loss": 0.0348, "step": 202710 }, { "epoch": 1.31, "learning_rate": 0.000103739584476271, "loss": 0.032, "step": 202720 }, { "epoch": 1.31, "learning_rate": 0.00010372990312191405, "loss": 0.0311, "step": 202730 }, { "epoch": 1.31, "learning_rate": 0.00010372022176755712, "loss": 0.031, "step": 202740 }, { "epoch": 1.31, "learning_rate": 0.0001037105404132002, "loss": 0.0345, "step": 202750 }, { "epoch": 1.31, "learning_rate": 0.00010370085905884325, "loss": 0.0333, "step": 202760 }, { "epoch": 1.31, "learning_rate": 0.00010369117770448633, "loss": 0.028, "step": 202770 }, { "epoch": 1.31, "learning_rate": 0.0001036814963501294, "loss": 0.0359, "step": 202780 }, { "epoch": 1.31, "learning_rate": 0.00010367181499577248, "loss": 0.0301, "step": 202790 }, { "epoch": 1.31, "learning_rate": 0.00010366213364141553, "loss": 0.0269, "step": 202800 }, { "epoch": 1.31, "learning_rate": 0.0001036524522870586, "loss": 0.0322, "step": 202810 }, { "epoch": 1.31, "learning_rate": 0.00010364277093270168, "loss": 0.0245, "step": 202820 }, { "epoch": 1.31, "learning_rate": 0.00010363308957834473, "loss": 0.0281, "step": 202830 }, { "epoch": 1.31, "learning_rate": 0.0001036234082239878, "loss": 0.0324, "step": 202840 }, { "epoch": 1.31, "learning_rate": 0.00010361372686963088, "loss": 0.0285, "step": 202850 }, { "epoch": 1.31, "learning_rate": 0.00010360404551527394, "loss": 0.027, "step": 202860 }, { "epoch": 1.31, "learning_rate": 0.00010359436416091701, "loss": 0.0284, "step": 202870 }, { "epoch": 1.31, "learning_rate": 0.00010358468280656008, "loss": 0.0298, "step": 202880 }, { "epoch": 1.31, "learning_rate": 0.00010357500145220315, "loss": 0.0315, "step": 202890 }, { "epoch": 1.31, "learning_rate": 0.00010356532009784621, "loss": 0.0263, "step": 202900 }, { "epoch": 1.31, "learning_rate": 0.00010355563874348927, "loss": 0.0337, "step": 202910 }, { "epoch": 1.31, "learning_rate": 0.00010354595738913235, "loss": 0.0371, "step": 202920 }, { "epoch": 1.31, "learning_rate": 0.00010353627603477542, "loss": 0.0265, "step": 202930 }, { "epoch": 1.31, "learning_rate": 0.00010352659468041847, "loss": 0.0316, "step": 202940 }, { "epoch": 1.31, "learning_rate": 0.00010351691332606155, "loss": 0.0297, "step": 202950 }, { "epoch": 1.31, "learning_rate": 0.00010350723197170462, "loss": 0.0298, "step": 202960 }, { "epoch": 1.31, "learning_rate": 0.00010349755061734768, "loss": 0.0289, "step": 202970 }, { "epoch": 1.31, "learning_rate": 0.00010348786926299075, "loss": 0.0251, "step": 202980 }, { "epoch": 1.31, "learning_rate": 0.00010347818790863383, "loss": 0.0316, "step": 202990 }, { "epoch": 1.31, "learning_rate": 0.0001034685065542769, "loss": 0.0422, "step": 203000 }, { "epoch": 1.31, "eval_cer": 0.9198933453847022, "eval_loss": 0.022010989487171173, "eval_runtime": 120.2296, "eval_samples_per_second": 16.635, "eval_steps_per_second": 4.159, "step": 203000 }, { "epoch": 1.31, "learning_rate": 0.00010345882519991995, "loss": 0.0289, "step": 203010 }, { "epoch": 1.31, "learning_rate": 0.00010344914384556303, "loss": 0.0281, "step": 203020 }, { "epoch": 1.31, "learning_rate": 0.0001034394624912061, "loss": 0.0341, "step": 203030 }, { "epoch": 1.31, "learning_rate": 0.00010342978113684915, "loss": 0.0366, "step": 203040 }, { "epoch": 1.31, "learning_rate": 0.00010342009978249223, "loss": 0.0303, "step": 203050 }, { "epoch": 1.31, "learning_rate": 0.0001034104184281353, "loss": 0.0316, "step": 203060 }, { "epoch": 1.31, "learning_rate": 0.00010340073707377837, "loss": 0.0306, "step": 203070 }, { "epoch": 1.31, "learning_rate": 0.00010339105571942143, "loss": 0.0312, "step": 203080 }, { "epoch": 1.31, "learning_rate": 0.00010338137436506451, "loss": 0.0304, "step": 203090 }, { "epoch": 1.31, "learning_rate": 0.00010337169301070757, "loss": 0.0294, "step": 203100 }, { "epoch": 1.31, "learning_rate": 0.00010336201165635063, "loss": 0.0317, "step": 203110 }, { "epoch": 1.31, "learning_rate": 0.0001033523303019937, "loss": 0.0397, "step": 203120 }, { "epoch": 1.31, "learning_rate": 0.00010334264894763677, "loss": 0.0279, "step": 203130 }, { "epoch": 1.31, "learning_rate": 0.00010333296759327985, "loss": 0.0306, "step": 203140 }, { "epoch": 1.31, "learning_rate": 0.0001033232862389229, "loss": 0.0312, "step": 203150 }, { "epoch": 1.31, "learning_rate": 0.00010331360488456597, "loss": 0.0279, "step": 203160 }, { "epoch": 1.31, "learning_rate": 0.00010330392353020905, "loss": 0.0278, "step": 203170 }, { "epoch": 1.31, "learning_rate": 0.0001032942421758521, "loss": 0.032, "step": 203180 }, { "epoch": 1.31, "learning_rate": 0.00010328456082149518, "loss": 0.0308, "step": 203190 }, { "epoch": 1.31, "learning_rate": 0.00010327487946713825, "loss": 0.0269, "step": 203200 }, { "epoch": 1.31, "learning_rate": 0.00010326519811278133, "loss": 0.024, "step": 203210 }, { "epoch": 1.31, "learning_rate": 0.00010325551675842438, "loss": 0.0278, "step": 203220 }, { "epoch": 1.31, "learning_rate": 0.00010324583540406745, "loss": 0.0312, "step": 203230 }, { "epoch": 1.31, "learning_rate": 0.00010323615404971053, "loss": 0.0347, "step": 203240 }, { "epoch": 1.31, "learning_rate": 0.00010322647269535358, "loss": 0.0272, "step": 203250 }, { "epoch": 1.31, "learning_rate": 0.00010321679134099665, "loss": 0.03, "step": 203260 }, { "epoch": 1.31, "learning_rate": 0.00010320710998663973, "loss": 0.0272, "step": 203270 }, { "epoch": 1.31, "learning_rate": 0.00010319742863228279, "loss": 0.0306, "step": 203280 }, { "epoch": 1.31, "learning_rate": 0.00010318774727792586, "loss": 0.0331, "step": 203290 }, { "epoch": 1.31, "learning_rate": 0.00010317806592356892, "loss": 0.0351, "step": 203300 }, { "epoch": 1.31, "learning_rate": 0.000103168384569212, "loss": 0.0375, "step": 203310 }, { "epoch": 1.31, "learning_rate": 0.00010315870321485506, "loss": 0.0282, "step": 203320 }, { "epoch": 1.31, "learning_rate": 0.00010314902186049812, "loss": 0.0313, "step": 203330 }, { "epoch": 1.31, "learning_rate": 0.0001031393405061412, "loss": 0.0281, "step": 203340 }, { "epoch": 1.31, "learning_rate": 0.00010312965915178427, "loss": 0.0308, "step": 203350 }, { "epoch": 1.31, "learning_rate": 0.00010311997779742732, "loss": 0.0323, "step": 203360 }, { "epoch": 1.31, "learning_rate": 0.0001031102964430704, "loss": 0.029, "step": 203370 }, { "epoch": 1.31, "learning_rate": 0.00010310061508871347, "loss": 0.0341, "step": 203380 }, { "epoch": 1.31, "learning_rate": 0.00010309093373435653, "loss": 0.0331, "step": 203390 }, { "epoch": 1.31, "learning_rate": 0.0001030812523799996, "loss": 0.0402, "step": 203400 }, { "epoch": 1.31, "learning_rate": 0.00010307157102564268, "loss": 0.0295, "step": 203410 }, { "epoch": 1.31, "learning_rate": 0.00010306188967128575, "loss": 0.0314, "step": 203420 }, { "epoch": 1.31, "learning_rate": 0.0001030522083169288, "loss": 0.0339, "step": 203430 }, { "epoch": 1.31, "learning_rate": 0.00010304252696257188, "loss": 0.0412, "step": 203440 }, { "epoch": 1.31, "learning_rate": 0.00010303284560821495, "loss": 0.0338, "step": 203450 }, { "epoch": 1.31, "learning_rate": 0.000103023164253858, "loss": 0.0313, "step": 203460 }, { "epoch": 1.31, "learning_rate": 0.00010301348289950108, "loss": 0.0405, "step": 203470 }, { "epoch": 1.31, "learning_rate": 0.00010300380154514414, "loss": 0.0283, "step": 203480 }, { "epoch": 1.31, "learning_rate": 0.00010299412019078722, "loss": 0.0276, "step": 203490 }, { "epoch": 1.31, "learning_rate": 0.00010298443883643028, "loss": 0.0325, "step": 203500 }, { "epoch": 1.31, "learning_rate": 0.00010297475748207336, "loss": 0.0306, "step": 203510 }, { "epoch": 1.31, "learning_rate": 0.00010296507612771642, "loss": 0.0306, "step": 203520 }, { "epoch": 1.31, "learning_rate": 0.00010295539477335948, "loss": 0.0307, "step": 203530 }, { "epoch": 1.31, "learning_rate": 0.00010294571341900256, "loss": 0.0267, "step": 203540 }, { "epoch": 1.31, "learning_rate": 0.00010293603206464562, "loss": 0.0337, "step": 203550 }, { "epoch": 1.31, "learning_rate": 0.0001029263507102887, "loss": 0.0418, "step": 203560 }, { "epoch": 1.31, "learning_rate": 0.00010291666935593175, "loss": 0.0313, "step": 203570 }, { "epoch": 1.31, "learning_rate": 0.00010290698800157482, "loss": 0.0301, "step": 203580 }, { "epoch": 1.31, "learning_rate": 0.0001028973066472179, "loss": 0.0327, "step": 203590 }, { "epoch": 1.31, "learning_rate": 0.00010288762529286095, "loss": 0.0273, "step": 203600 }, { "epoch": 1.31, "learning_rate": 0.00010287794393850403, "loss": 0.0298, "step": 203610 }, { "epoch": 1.31, "learning_rate": 0.0001028682625841471, "loss": 0.027, "step": 203620 }, { "epoch": 1.31, "learning_rate": 0.00010285858122979017, "loss": 0.0322, "step": 203630 }, { "epoch": 1.31, "learning_rate": 0.00010284889987543323, "loss": 0.0344, "step": 203640 }, { "epoch": 1.31, "learning_rate": 0.0001028392185210763, "loss": 0.0313, "step": 203650 }, { "epoch": 1.31, "learning_rate": 0.00010282953716671938, "loss": 0.029, "step": 203660 }, { "epoch": 1.31, "learning_rate": 0.00010281985581236243, "loss": 0.0294, "step": 203670 }, { "epoch": 1.31, "learning_rate": 0.0001028101744580055, "loss": 0.0293, "step": 203680 }, { "epoch": 1.31, "learning_rate": 0.00010280049310364858, "loss": 0.0287, "step": 203690 }, { "epoch": 1.31, "learning_rate": 0.00010279081174929164, "loss": 0.0327, "step": 203700 }, { "epoch": 1.31, "learning_rate": 0.00010278113039493471, "loss": 0.0345, "step": 203710 }, { "epoch": 1.31, "learning_rate": 0.00010277144904057777, "loss": 0.0303, "step": 203720 }, { "epoch": 1.31, "learning_rate": 0.00010276176768622084, "loss": 0.0257, "step": 203730 }, { "epoch": 1.31, "learning_rate": 0.00010275208633186391, "loss": 0.0256, "step": 203740 }, { "epoch": 1.32, "learning_rate": 0.00010274240497750697, "loss": 0.0309, "step": 203750 }, { "epoch": 1.32, "learning_rate": 0.00010273272362315005, "loss": 0.028, "step": 203760 }, { "epoch": 1.32, "learning_rate": 0.00010272304226879312, "loss": 0.0328, "step": 203770 }, { "epoch": 1.32, "learning_rate": 0.00010271336091443617, "loss": 0.026, "step": 203780 }, { "epoch": 1.32, "learning_rate": 0.00010270367956007925, "loss": 0.0273, "step": 203790 }, { "epoch": 1.32, "learning_rate": 0.00010269399820572232, "loss": 0.0287, "step": 203800 }, { "epoch": 1.32, "learning_rate": 0.00010268431685136538, "loss": 0.0348, "step": 203810 }, { "epoch": 1.32, "learning_rate": 0.00010267463549700845, "loss": 0.031, "step": 203820 }, { "epoch": 1.32, "learning_rate": 0.00010266495414265152, "loss": 0.0268, "step": 203830 }, { "epoch": 1.32, "learning_rate": 0.0001026552727882946, "loss": 0.0338, "step": 203840 }, { "epoch": 1.32, "learning_rate": 0.00010264559143393765, "loss": 0.0338, "step": 203850 }, { "epoch": 1.32, "learning_rate": 0.00010263591007958073, "loss": 0.0264, "step": 203860 }, { "epoch": 1.32, "learning_rate": 0.0001026262287252238, "loss": 0.0265, "step": 203870 }, { "epoch": 1.32, "learning_rate": 0.00010261654737086685, "loss": 0.0276, "step": 203880 }, { "epoch": 1.32, "learning_rate": 0.00010260686601650993, "loss": 0.0279, "step": 203890 }, { "epoch": 1.32, "learning_rate": 0.000102597184662153, "loss": 0.0284, "step": 203900 }, { "epoch": 1.32, "learning_rate": 0.00010258750330779607, "loss": 0.034, "step": 203910 }, { "epoch": 1.32, "learning_rate": 0.00010257782195343913, "loss": 0.0344, "step": 203920 }, { "epoch": 1.32, "learning_rate": 0.00010256814059908219, "loss": 0.0318, "step": 203930 }, { "epoch": 1.32, "learning_rate": 0.00010255845924472527, "loss": 0.028, "step": 203940 }, { "epoch": 1.32, "learning_rate": 0.00010254877789036833, "loss": 0.03, "step": 203950 }, { "epoch": 1.32, "learning_rate": 0.0001025390965360114, "loss": 0.0297, "step": 203960 }, { "epoch": 1.32, "learning_rate": 0.00010252941518165447, "loss": 0.0344, "step": 203970 }, { "epoch": 1.32, "learning_rate": 0.00010251973382729755, "loss": 0.0328, "step": 203980 }, { "epoch": 1.32, "learning_rate": 0.0001025100524729406, "loss": 0.0294, "step": 203990 }, { "epoch": 1.32, "learning_rate": 0.00010250037111858367, "loss": 0.0301, "step": 204000 }, { "epoch": 1.32, "eval_cer": 0.9198237487289572, "eval_loss": 0.02146965079009533, "eval_runtime": 120.4063, "eval_samples_per_second": 16.61, "eval_steps_per_second": 4.153, "step": 204000 }, { "epoch": 1.32, "learning_rate": 0.00010249068976422675, "loss": 0.0301, "step": 204010 }, { "epoch": 1.32, "learning_rate": 0.0001024810084098698, "loss": 0.0315, "step": 204020 }, { "epoch": 1.32, "learning_rate": 0.00010247132705551287, "loss": 0.0307, "step": 204030 }, { "epoch": 1.32, "learning_rate": 0.00010246164570115595, "loss": 0.0366, "step": 204040 }, { "epoch": 1.32, "learning_rate": 0.00010245196434679901, "loss": 0.0315, "step": 204050 }, { "epoch": 1.32, "learning_rate": 0.00010244228299244208, "loss": 0.034, "step": 204060 }, { "epoch": 1.32, "learning_rate": 0.00010243260163808515, "loss": 0.0307, "step": 204070 }, { "epoch": 1.32, "learning_rate": 0.00010242292028372823, "loss": 0.0268, "step": 204080 }, { "epoch": 1.32, "learning_rate": 0.00010241323892937128, "loss": 0.0338, "step": 204090 }, { "epoch": 1.32, "learning_rate": 0.00010240355757501435, "loss": 0.0332, "step": 204100 }, { "epoch": 1.32, "learning_rate": 0.00010239387622065743, "loss": 0.0247, "step": 204110 }, { "epoch": 1.32, "learning_rate": 0.00010238419486630049, "loss": 0.0291, "step": 204120 }, { "epoch": 1.32, "learning_rate": 0.00010237451351194354, "loss": 0.0308, "step": 204130 }, { "epoch": 1.32, "learning_rate": 0.00010236483215758662, "loss": 0.0298, "step": 204140 }, { "epoch": 1.32, "learning_rate": 0.00010235515080322969, "loss": 0.0313, "step": 204150 }, { "epoch": 1.32, "learning_rate": 0.00010234546944887276, "loss": 0.0344, "step": 204160 }, { "epoch": 1.32, "learning_rate": 0.00010233578809451582, "loss": 0.0324, "step": 204170 }, { "epoch": 1.32, "learning_rate": 0.0001023261067401589, "loss": 0.0386, "step": 204180 }, { "epoch": 1.32, "learning_rate": 0.00010231642538580197, "loss": 0.0308, "step": 204190 }, { "epoch": 1.32, "learning_rate": 0.00010230674403144502, "loss": 0.0298, "step": 204200 }, { "epoch": 1.32, "learning_rate": 0.0001022970626770881, "loss": 0.0377, "step": 204210 }, { "epoch": 1.32, "learning_rate": 0.00010228738132273117, "loss": 0.034, "step": 204220 }, { "epoch": 1.32, "learning_rate": 0.00010227769996837422, "loss": 0.03, "step": 204230 }, { "epoch": 1.32, "learning_rate": 0.0001022680186140173, "loss": 0.0297, "step": 204240 }, { "epoch": 1.32, "learning_rate": 0.00010225833725966037, "loss": 0.0363, "step": 204250 }, { "epoch": 1.32, "learning_rate": 0.00010224865590530345, "loss": 0.0292, "step": 204260 }, { "epoch": 1.32, "learning_rate": 0.0001022389745509465, "loss": 0.025, "step": 204270 }, { "epoch": 1.32, "learning_rate": 0.00010222929319658958, "loss": 0.0277, "step": 204280 }, { "epoch": 1.32, "learning_rate": 0.00010221961184223265, "loss": 0.0302, "step": 204290 }, { "epoch": 1.32, "learning_rate": 0.0001022099304878757, "loss": 0.0296, "step": 204300 }, { "epoch": 1.32, "learning_rate": 0.00010220024913351878, "loss": 0.0282, "step": 204310 }, { "epoch": 1.32, "learning_rate": 0.00010219056777916184, "loss": 0.0317, "step": 204320 }, { "epoch": 1.32, "learning_rate": 0.00010218088642480492, "loss": 0.0264, "step": 204330 }, { "epoch": 1.32, "learning_rate": 0.00010217120507044798, "loss": 0.0363, "step": 204340 }, { "epoch": 1.32, "learning_rate": 0.00010216152371609104, "loss": 0.0279, "step": 204350 }, { "epoch": 1.32, "learning_rate": 0.00010215184236173412, "loss": 0.0264, "step": 204360 }, { "epoch": 1.32, "learning_rate": 0.00010214216100737718, "loss": 0.0241, "step": 204370 }, { "epoch": 1.32, "learning_rate": 0.00010213247965302025, "loss": 0.0331, "step": 204380 }, { "epoch": 1.32, "learning_rate": 0.00010212279829866332, "loss": 0.0335, "step": 204390 }, { "epoch": 1.32, "learning_rate": 0.0001021131169443064, "loss": 0.0305, "step": 204400 }, { "epoch": 1.32, "learning_rate": 0.00010210343558994945, "loss": 0.0389, "step": 204410 }, { "epoch": 1.32, "learning_rate": 0.00010209375423559252, "loss": 0.0278, "step": 204420 }, { "epoch": 1.32, "learning_rate": 0.0001020840728812356, "loss": 0.031, "step": 204430 }, { "epoch": 1.32, "learning_rate": 0.00010207439152687865, "loss": 0.034, "step": 204440 }, { "epoch": 1.32, "learning_rate": 0.00010206471017252172, "loss": 0.0324, "step": 204450 }, { "epoch": 1.32, "learning_rate": 0.0001020550288181648, "loss": 0.027, "step": 204460 }, { "epoch": 1.32, "learning_rate": 0.00010204534746380786, "loss": 0.029, "step": 204470 }, { "epoch": 1.32, "learning_rate": 0.00010203566610945093, "loss": 0.0296, "step": 204480 }, { "epoch": 1.32, "learning_rate": 0.000102025984755094, "loss": 0.0254, "step": 204490 }, { "epoch": 1.32, "learning_rate": 0.00010201630340073708, "loss": 0.0319, "step": 204500 }, { "epoch": 1.32, "learning_rate": 0.00010200662204638013, "loss": 0.0239, "step": 204510 }, { "epoch": 1.32, "learning_rate": 0.0001019969406920232, "loss": 0.0307, "step": 204520 }, { "epoch": 1.32, "learning_rate": 0.00010198725933766628, "loss": 0.0271, "step": 204530 }, { "epoch": 1.32, "learning_rate": 0.00010197757798330934, "loss": 0.0345, "step": 204540 }, { "epoch": 1.32, "learning_rate": 0.0001019678966289524, "loss": 0.0346, "step": 204550 }, { "epoch": 1.32, "learning_rate": 0.00010195821527459547, "loss": 0.0348, "step": 204560 }, { "epoch": 1.32, "learning_rate": 0.00010194853392023854, "loss": 0.0278, "step": 204570 }, { "epoch": 1.32, "learning_rate": 0.00010193885256588161, "loss": 0.032, "step": 204580 }, { "epoch": 1.32, "learning_rate": 0.00010192917121152467, "loss": 0.0312, "step": 204590 }, { "epoch": 1.32, "learning_rate": 0.00010191948985716775, "loss": 0.029, "step": 204600 }, { "epoch": 1.32, "learning_rate": 0.00010190980850281082, "loss": 0.0282, "step": 204610 }, { "epoch": 1.32, "learning_rate": 0.00010190012714845387, "loss": 0.0255, "step": 204620 }, { "epoch": 1.32, "learning_rate": 0.00010189044579409695, "loss": 0.0335, "step": 204630 }, { "epoch": 1.32, "learning_rate": 0.00010188076443974002, "loss": 0.0318, "step": 204640 }, { "epoch": 1.32, "learning_rate": 0.00010187108308538307, "loss": 0.0296, "step": 204650 }, { "epoch": 1.32, "learning_rate": 0.00010186140173102615, "loss": 0.0315, "step": 204660 }, { "epoch": 1.32, "learning_rate": 0.00010185172037666922, "loss": 0.0329, "step": 204670 }, { "epoch": 1.32, "learning_rate": 0.0001018420390223123, "loss": 0.0268, "step": 204680 }, { "epoch": 1.32, "learning_rate": 0.00010183235766795535, "loss": 0.0374, "step": 204690 }, { "epoch": 1.32, "learning_rate": 0.00010182267631359843, "loss": 0.032, "step": 204700 }, { "epoch": 1.32, "learning_rate": 0.0001018129949592415, "loss": 0.0347, "step": 204710 }, { "epoch": 1.32, "learning_rate": 0.00010180331360488455, "loss": 0.03, "step": 204720 }, { "epoch": 1.32, "learning_rate": 0.00010179363225052763, "loss": 0.0291, "step": 204730 }, { "epoch": 1.32, "learning_rate": 0.0001017839508961707, "loss": 0.0288, "step": 204740 }, { "epoch": 1.32, "learning_rate": 0.00010177426954181377, "loss": 0.0273, "step": 204750 }, { "epoch": 1.32, "learning_rate": 0.00010176458818745683, "loss": 0.0294, "step": 204760 }, { "epoch": 1.32, "learning_rate": 0.00010175490683309989, "loss": 0.0354, "step": 204770 }, { "epoch": 1.32, "learning_rate": 0.00010174522547874297, "loss": 0.0328, "step": 204780 }, { "epoch": 1.32, "learning_rate": 0.00010173554412438602, "loss": 0.0301, "step": 204790 }, { "epoch": 1.32, "learning_rate": 0.0001017258627700291, "loss": 0.029, "step": 204800 }, { "epoch": 1.32, "learning_rate": 0.00010171618141567217, "loss": 0.0333, "step": 204810 }, { "epoch": 1.32, "learning_rate": 0.00010170650006131524, "loss": 0.028, "step": 204820 }, { "epoch": 1.32, "learning_rate": 0.0001016968187069583, "loss": 0.0321, "step": 204830 }, { "epoch": 1.32, "learning_rate": 0.00010168713735260137, "loss": 0.0351, "step": 204840 }, { "epoch": 1.32, "learning_rate": 0.00010167745599824445, "loss": 0.0329, "step": 204850 }, { "epoch": 1.32, "learning_rate": 0.0001016677746438875, "loss": 0.0263, "step": 204860 }, { "epoch": 1.32, "learning_rate": 0.00010165809328953057, "loss": 0.0336, "step": 204870 }, { "epoch": 1.32, "learning_rate": 0.00010164841193517365, "loss": 0.0262, "step": 204880 }, { "epoch": 1.32, "learning_rate": 0.0001016387305808167, "loss": 0.0304, "step": 204890 }, { "epoch": 1.32, "learning_rate": 0.00010162904922645978, "loss": 0.0338, "step": 204900 }, { "epoch": 1.32, "learning_rate": 0.00010161936787210285, "loss": 0.0259, "step": 204910 }, { "epoch": 1.32, "learning_rate": 0.00010160968651774591, "loss": 0.0281, "step": 204920 }, { "epoch": 1.32, "learning_rate": 0.00010160000516338898, "loss": 0.025, "step": 204930 }, { "epoch": 1.32, "learning_rate": 0.00010159032380903205, "loss": 0.0303, "step": 204940 }, { "epoch": 1.32, "learning_rate": 0.00010158064245467513, "loss": 0.0287, "step": 204950 }, { "epoch": 1.32, "learning_rate": 0.00010157096110031818, "loss": 0.0304, "step": 204960 }, { "epoch": 1.32, "learning_rate": 0.00010156127974596124, "loss": 0.0308, "step": 204970 }, { "epoch": 1.32, "learning_rate": 0.00010155159839160432, "loss": 0.0253, "step": 204980 }, { "epoch": 1.32, "learning_rate": 0.00010154191703724739, "loss": 0.0236, "step": 204990 }, { "epoch": 1.32, "learning_rate": 0.00010153223568289046, "loss": 0.0293, "step": 205000 }, { "epoch": 1.32, "eval_cer": 0.9198472488984295, "eval_loss": 0.021727943792939186, "eval_runtime": 120.2177, "eval_samples_per_second": 16.636, "eval_steps_per_second": 4.159, "step": 205000 }, { "epoch": 1.32, "learning_rate": 0.00010152255432853352, "loss": 0.0271, "step": 205010 }, { "epoch": 1.32, "learning_rate": 0.00010151287297417659, "loss": 0.0265, "step": 205020 }, { "epoch": 1.32, "learning_rate": 0.00010150319161981966, "loss": 0.0303, "step": 205030 }, { "epoch": 1.32, "learning_rate": 0.00010149351026546272, "loss": 0.027, "step": 205040 }, { "epoch": 1.32, "learning_rate": 0.0001014838289111058, "loss": 0.0293, "step": 205050 }, { "epoch": 1.32, "learning_rate": 0.00010147414755674887, "loss": 0.0351, "step": 205060 }, { "epoch": 1.32, "learning_rate": 0.00010146446620239192, "loss": 0.0244, "step": 205070 }, { "epoch": 1.32, "learning_rate": 0.000101454784848035, "loss": 0.0343, "step": 205080 }, { "epoch": 1.32, "learning_rate": 0.00010144510349367807, "loss": 0.028, "step": 205090 }, { "epoch": 1.32, "learning_rate": 0.00010143542213932113, "loss": 0.0276, "step": 205100 }, { "epoch": 1.32, "learning_rate": 0.0001014257407849642, "loss": 0.0294, "step": 205110 }, { "epoch": 1.32, "learning_rate": 0.00010141605943060727, "loss": 0.0325, "step": 205120 }, { "epoch": 1.32, "learning_rate": 0.00010140637807625034, "loss": 0.0301, "step": 205130 }, { "epoch": 1.32, "learning_rate": 0.0001013966967218934, "loss": 0.0309, "step": 205140 }, { "epoch": 1.32, "learning_rate": 0.00010138701536753648, "loss": 0.0337, "step": 205150 }, { "epoch": 1.32, "learning_rate": 0.00010137733401317954, "loss": 0.0316, "step": 205160 }, { "epoch": 1.32, "learning_rate": 0.0001013676526588226, "loss": 0.0289, "step": 205170 }, { "epoch": 1.32, "learning_rate": 0.00010135797130446568, "loss": 0.0301, "step": 205180 }, { "epoch": 1.32, "learning_rate": 0.00010134828995010874, "loss": 0.0284, "step": 205190 }, { "epoch": 1.32, "learning_rate": 0.00010133860859575182, "loss": 0.0298, "step": 205200 }, { "epoch": 1.32, "learning_rate": 0.00010132892724139487, "loss": 0.0285, "step": 205210 }, { "epoch": 1.32, "learning_rate": 0.00010131924588703794, "loss": 0.025, "step": 205220 }, { "epoch": 1.32, "learning_rate": 0.00010130956453268102, "loss": 0.0295, "step": 205230 }, { "epoch": 1.32, "learning_rate": 0.00010129988317832407, "loss": 0.0292, "step": 205240 }, { "epoch": 1.32, "learning_rate": 0.00010129020182396715, "loss": 0.0275, "step": 205250 }, { "epoch": 1.32, "learning_rate": 0.00010128052046961022, "loss": 0.0406, "step": 205260 }, { "epoch": 1.32, "learning_rate": 0.0001012708391152533, "loss": 0.0274, "step": 205270 }, { "epoch": 1.32, "learning_rate": 0.00010126115776089635, "loss": 0.0284, "step": 205280 }, { "epoch": 1.32, "learning_rate": 0.00010125147640653942, "loss": 0.0269, "step": 205290 }, { "epoch": 1.33, "learning_rate": 0.0001012417950521825, "loss": 0.0342, "step": 205300 }, { "epoch": 1.33, "learning_rate": 0.00010123211369782555, "loss": 0.0375, "step": 205310 }, { "epoch": 1.33, "learning_rate": 0.00010122243234346862, "loss": 0.0268, "step": 205320 }, { "epoch": 1.33, "learning_rate": 0.0001012127509891117, "loss": 0.032, "step": 205330 }, { "epoch": 1.33, "learning_rate": 0.00010120306963475476, "loss": 0.0287, "step": 205340 }, { "epoch": 1.33, "learning_rate": 0.00010119338828039783, "loss": 0.0261, "step": 205350 }, { "epoch": 1.33, "learning_rate": 0.0001011837069260409, "loss": 0.0328, "step": 205360 }, { "epoch": 1.33, "learning_rate": 0.00010117402557168398, "loss": 0.0337, "step": 205370 }, { "epoch": 1.33, "learning_rate": 0.00010116434421732703, "loss": 0.0274, "step": 205380 }, { "epoch": 1.33, "learning_rate": 0.0001011546628629701, "loss": 0.0313, "step": 205390 }, { "epoch": 1.33, "learning_rate": 0.00010114498150861317, "loss": 0.0301, "step": 205400 }, { "epoch": 1.33, "learning_rate": 0.00010113530015425624, "loss": 0.0377, "step": 205410 }, { "epoch": 1.33, "learning_rate": 0.00010112561879989929, "loss": 0.0305, "step": 205420 }, { "epoch": 1.33, "learning_rate": 0.00010111593744554237, "loss": 0.026, "step": 205430 }, { "epoch": 1.33, "learning_rate": 0.00010110625609118544, "loss": 0.0296, "step": 205440 }, { "epoch": 1.33, "learning_rate": 0.0001010965747368285, "loss": 0.0318, "step": 205450 }, { "epoch": 1.33, "learning_rate": 0.00010108689338247157, "loss": 0.0328, "step": 205460 }, { "epoch": 1.33, "learning_rate": 0.00010107721202811465, "loss": 0.0317, "step": 205470 }, { "epoch": 1.33, "learning_rate": 0.00010106753067375772, "loss": 0.027, "step": 205480 }, { "epoch": 1.33, "learning_rate": 0.00010105784931940077, "loss": 0.0279, "step": 205490 }, { "epoch": 1.33, "learning_rate": 0.00010104816796504385, "loss": 0.0324, "step": 205500 }, { "epoch": 1.33, "learning_rate": 0.00010103848661068692, "loss": 0.0278, "step": 205510 }, { "epoch": 1.33, "learning_rate": 0.00010102880525632997, "loss": 0.0287, "step": 205520 }, { "epoch": 1.33, "learning_rate": 0.00010101912390197305, "loss": 0.0351, "step": 205530 }, { "epoch": 1.33, "learning_rate": 0.00010100944254761611, "loss": 0.0328, "step": 205540 }, { "epoch": 1.33, "learning_rate": 0.0001009997611932592, "loss": 0.0289, "step": 205550 }, { "epoch": 1.33, "learning_rate": 0.00010099007983890225, "loss": 0.0286, "step": 205560 }, { "epoch": 1.33, "learning_rate": 0.00010098039848454533, "loss": 0.031, "step": 205570 }, { "epoch": 1.33, "learning_rate": 0.0001009707171301884, "loss": 0.0244, "step": 205580 }, { "epoch": 1.33, "learning_rate": 0.00010096103577583145, "loss": 0.0257, "step": 205590 }, { "epoch": 1.33, "learning_rate": 0.00010095135442147453, "loss": 0.0343, "step": 205600 }, { "epoch": 1.33, "learning_rate": 0.00010094167306711759, "loss": 0.0286, "step": 205610 }, { "epoch": 1.33, "learning_rate": 0.00010093199171276067, "loss": 0.0309, "step": 205620 }, { "epoch": 1.33, "learning_rate": 0.00010092231035840372, "loss": 0.0293, "step": 205630 }, { "epoch": 1.33, "learning_rate": 0.00010091262900404679, "loss": 0.0282, "step": 205640 }, { "epoch": 1.33, "learning_rate": 0.00010090294764968987, "loss": 0.0269, "step": 205650 }, { "epoch": 1.33, "learning_rate": 0.00010089326629533292, "loss": 0.0413, "step": 205660 }, { "epoch": 1.33, "learning_rate": 0.000100883584940976, "loss": 0.0273, "step": 205670 }, { "epoch": 1.33, "learning_rate": 0.00010087390358661907, "loss": 0.0259, "step": 205680 }, { "epoch": 1.33, "learning_rate": 0.00010086422223226215, "loss": 0.03, "step": 205690 }, { "epoch": 1.33, "learning_rate": 0.0001008545408779052, "loss": 0.0275, "step": 205700 }, { "epoch": 1.33, "learning_rate": 0.00010084485952354827, "loss": 0.0265, "step": 205710 }, { "epoch": 1.33, "learning_rate": 0.00010083517816919135, "loss": 0.0348, "step": 205720 }, { "epoch": 1.33, "learning_rate": 0.0001008254968148344, "loss": 0.0322, "step": 205730 }, { "epoch": 1.33, "learning_rate": 0.00010081581546047747, "loss": 0.0322, "step": 205740 }, { "epoch": 1.33, "learning_rate": 0.00010080613410612055, "loss": 0.0351, "step": 205750 }, { "epoch": 1.33, "learning_rate": 0.00010079645275176361, "loss": 0.0277, "step": 205760 }, { "epoch": 1.33, "learning_rate": 0.00010078677139740668, "loss": 0.0379, "step": 205770 }, { "epoch": 1.33, "learning_rate": 0.00010077709004304975, "loss": 0.0286, "step": 205780 }, { "epoch": 1.33, "learning_rate": 0.00010076740868869283, "loss": 0.0262, "step": 205790 }, { "epoch": 1.33, "learning_rate": 0.00010075772733433588, "loss": 0.0266, "step": 205800 }, { "epoch": 1.33, "learning_rate": 0.00010074804597997894, "loss": 0.0272, "step": 205810 }, { "epoch": 1.33, "learning_rate": 0.00010073836462562202, "loss": 0.0286, "step": 205820 }, { "epoch": 1.33, "learning_rate": 0.00010072868327126509, "loss": 0.0264, "step": 205830 }, { "epoch": 1.33, "learning_rate": 0.00010071900191690814, "loss": 0.0272, "step": 205840 }, { "epoch": 1.33, "learning_rate": 0.00010070932056255122, "loss": 0.0324, "step": 205850 }, { "epoch": 1.33, "learning_rate": 0.00010069963920819429, "loss": 0.0284, "step": 205860 }, { "epoch": 1.33, "learning_rate": 0.00010068995785383735, "loss": 0.0306, "step": 205870 }, { "epoch": 1.33, "learning_rate": 0.00010068027649948042, "loss": 0.0314, "step": 205880 }, { "epoch": 1.33, "learning_rate": 0.0001006705951451235, "loss": 0.033, "step": 205890 }, { "epoch": 1.33, "learning_rate": 0.00010066091379076657, "loss": 0.0314, "step": 205900 }, { "epoch": 1.33, "learning_rate": 0.00010065123243640962, "loss": 0.0277, "step": 205910 }, { "epoch": 1.33, "learning_rate": 0.0001006415510820527, "loss": 0.0249, "step": 205920 }, { "epoch": 1.33, "learning_rate": 0.00010063186972769577, "loss": 0.0271, "step": 205930 }, { "epoch": 1.33, "learning_rate": 0.00010062218837333882, "loss": 0.028, "step": 205940 }, { "epoch": 1.33, "learning_rate": 0.0001006125070189819, "loss": 0.026, "step": 205950 }, { "epoch": 1.33, "learning_rate": 0.00010060282566462496, "loss": 0.0276, "step": 205960 }, { "epoch": 1.33, "learning_rate": 0.00010059314431026804, "loss": 0.0292, "step": 205970 }, { "epoch": 1.33, "learning_rate": 0.0001005834629559111, "loss": 0.0283, "step": 205980 }, { "epoch": 1.33, "learning_rate": 0.00010057378160155418, "loss": 0.0244, "step": 205990 }, { "epoch": 1.33, "learning_rate": 0.00010056410024719724, "loss": 0.0347, "step": 206000 }, { "epoch": 1.33, "eval_cer": 0.9198969607953904, "eval_loss": 0.021649910137057304, "eval_runtime": 120.1272, "eval_samples_per_second": 16.649, "eval_steps_per_second": 4.162, "step": 206000 }, { "epoch": 1.33, "learning_rate": 0.0001005544188928403, "loss": 0.0304, "step": 206010 }, { "epoch": 1.33, "learning_rate": 0.00010054473753848338, "loss": 0.0347, "step": 206020 }, { "epoch": 1.33, "learning_rate": 0.00010053505618412644, "loss": 0.0286, "step": 206030 }, { "epoch": 1.33, "learning_rate": 0.00010052537482976952, "loss": 0.0311, "step": 206040 }, { "epoch": 1.33, "learning_rate": 0.00010051569347541257, "loss": 0.0348, "step": 206050 }, { "epoch": 1.33, "learning_rate": 0.00010050601212105564, "loss": 0.0289, "step": 206060 }, { "epoch": 1.33, "learning_rate": 0.00010049633076669872, "loss": 0.0292, "step": 206070 }, { "epoch": 1.33, "learning_rate": 0.00010048664941234177, "loss": 0.0307, "step": 206080 }, { "epoch": 1.33, "learning_rate": 0.00010047696805798485, "loss": 0.0242, "step": 206090 }, { "epoch": 1.33, "learning_rate": 0.00010046728670362792, "loss": 0.0299, "step": 206100 }, { "epoch": 1.33, "learning_rate": 0.00010045760534927099, "loss": 0.0295, "step": 206110 }, { "epoch": 1.33, "learning_rate": 0.00010044792399491405, "loss": 0.0302, "step": 206120 }, { "epoch": 1.33, "learning_rate": 0.00010043824264055712, "loss": 0.031, "step": 206130 }, { "epoch": 1.33, "learning_rate": 0.0001004285612862002, "loss": 0.0335, "step": 206140 }, { "epoch": 1.33, "learning_rate": 0.00010041887993184325, "loss": 0.0297, "step": 206150 }, { "epoch": 1.33, "learning_rate": 0.00010040919857748632, "loss": 0.0317, "step": 206160 }, { "epoch": 1.33, "learning_rate": 0.0001003995172231294, "loss": 0.0268, "step": 206170 }, { "epoch": 1.33, "learning_rate": 0.00010038983586877246, "loss": 0.0312, "step": 206180 }, { "epoch": 1.33, "learning_rate": 0.00010038015451441553, "loss": 0.0346, "step": 206190 }, { "epoch": 1.33, "learning_rate": 0.0001003704731600586, "loss": 0.0354, "step": 206200 }, { "epoch": 1.33, "learning_rate": 0.00010036079180570166, "loss": 0.029, "step": 206210 }, { "epoch": 1.33, "learning_rate": 0.00010035111045134473, "loss": 0.0299, "step": 206220 }, { "epoch": 1.33, "learning_rate": 0.0001003414290969878, "loss": 0.027, "step": 206230 }, { "epoch": 1.33, "learning_rate": 0.00010033174774263087, "loss": 0.028, "step": 206240 }, { "epoch": 1.33, "learning_rate": 0.00010032206638827394, "loss": 0.0303, "step": 206250 }, { "epoch": 1.33, "learning_rate": 0.00010031238503391699, "loss": 0.0284, "step": 206260 }, { "epoch": 1.33, "learning_rate": 0.00010030270367956007, "loss": 0.0321, "step": 206270 }, { "epoch": 1.33, "learning_rate": 0.00010029302232520314, "loss": 0.0339, "step": 206280 }, { "epoch": 1.33, "learning_rate": 0.0001002833409708462, "loss": 0.0302, "step": 206290 }, { "epoch": 1.33, "learning_rate": 0.00010027365961648927, "loss": 0.0268, "step": 206300 }, { "epoch": 1.33, "learning_rate": 0.00010026397826213234, "loss": 0.032, "step": 206310 }, { "epoch": 1.33, "learning_rate": 0.00010025429690777542, "loss": 0.0311, "step": 206320 }, { "epoch": 1.33, "learning_rate": 0.00010024461555341847, "loss": 0.0269, "step": 206330 }, { "epoch": 1.33, "learning_rate": 0.00010023493419906155, "loss": 0.0256, "step": 206340 }, { "epoch": 1.33, "learning_rate": 0.00010022525284470462, "loss": 0.0269, "step": 206350 }, { "epoch": 1.33, "learning_rate": 0.00010021557149034767, "loss": 0.0275, "step": 206360 }, { "epoch": 1.33, "learning_rate": 0.00010020589013599075, "loss": 0.0314, "step": 206370 }, { "epoch": 1.33, "learning_rate": 0.00010019620878163381, "loss": 0.0291, "step": 206380 }, { "epoch": 1.33, "learning_rate": 0.0001001865274272769, "loss": 0.0337, "step": 206390 }, { "epoch": 1.33, "learning_rate": 0.00010017684607291995, "loss": 0.0227, "step": 206400 }, { "epoch": 1.33, "learning_rate": 0.00010016716471856301, "loss": 0.0275, "step": 206410 }, { "epoch": 1.33, "learning_rate": 0.00010015748336420609, "loss": 0.0282, "step": 206420 }, { "epoch": 1.33, "learning_rate": 0.00010014780200984915, "loss": 0.0288, "step": 206430 }, { "epoch": 1.33, "learning_rate": 0.00010013812065549223, "loss": 0.0326, "step": 206440 }, { "epoch": 1.33, "learning_rate": 0.00010012843930113529, "loss": 0.025, "step": 206450 }, { "epoch": 1.33, "learning_rate": 0.00010011875794677837, "loss": 0.0293, "step": 206460 }, { "epoch": 1.33, "learning_rate": 0.00010010907659242142, "loss": 0.0325, "step": 206470 }, { "epoch": 1.33, "learning_rate": 0.00010009939523806449, "loss": 0.0315, "step": 206480 }, { "epoch": 1.33, "learning_rate": 0.00010008971388370757, "loss": 0.0299, "step": 206490 }, { "epoch": 1.33, "learning_rate": 0.00010008003252935062, "loss": 0.0272, "step": 206500 }, { "epoch": 1.33, "learning_rate": 0.0001000703511749937, "loss": 0.0368, "step": 206510 }, { "epoch": 1.33, "learning_rate": 0.00010006066982063677, "loss": 0.0309, "step": 206520 }, { "epoch": 1.33, "learning_rate": 0.00010005098846627984, "loss": 0.0308, "step": 206530 }, { "epoch": 1.33, "learning_rate": 0.0001000413071119229, "loss": 0.0284, "step": 206540 }, { "epoch": 1.33, "learning_rate": 0.00010003162575756597, "loss": 0.027, "step": 206550 }, { "epoch": 1.33, "learning_rate": 0.00010002194440320905, "loss": 0.0274, "step": 206560 }, { "epoch": 1.33, "learning_rate": 0.0001000122630488521, "loss": 0.0301, "step": 206570 }, { "epoch": 1.33, "learning_rate": 0.00010000258169449517, "loss": 0.0292, "step": 206580 }, { "epoch": 1.33, "learning_rate": 9.999290034013825e-05, "loss": 0.0307, "step": 206590 }, { "epoch": 1.33, "learning_rate": 9.998321898578131e-05, "loss": 0.0362, "step": 206600 }, { "epoch": 1.33, "learning_rate": 9.997353763142438e-05, "loss": 0.0376, "step": 206610 }, { "epoch": 1.33, "learning_rate": 9.996385627706744e-05, "loss": 0.0274, "step": 206620 }, { "epoch": 1.33, "learning_rate": 9.995417492271051e-05, "loss": 0.0349, "step": 206630 }, { "epoch": 1.33, "learning_rate": 9.994449356835358e-05, "loss": 0.032, "step": 206640 }, { "epoch": 1.33, "learning_rate": 9.993481221399664e-05, "loss": 0.0344, "step": 206650 }, { "epoch": 1.33, "learning_rate": 9.992513085963972e-05, "loss": 0.0297, "step": 206660 }, { "epoch": 1.33, "learning_rate": 9.991544950528279e-05, "loss": 0.0311, "step": 206670 }, { "epoch": 1.33, "learning_rate": 9.990576815092584e-05, "loss": 0.0253, "step": 206680 }, { "epoch": 1.33, "learning_rate": 9.989608679656892e-05, "loss": 0.03, "step": 206690 }, { "epoch": 1.33, "learning_rate": 9.988640544221199e-05, "loss": 0.0267, "step": 206700 }, { "epoch": 1.33, "learning_rate": 9.987672408785505e-05, "loss": 0.0266, "step": 206710 }, { "epoch": 1.33, "learning_rate": 9.986704273349812e-05, "loss": 0.0344, "step": 206720 }, { "epoch": 1.33, "learning_rate": 9.985736137914119e-05, "loss": 0.0292, "step": 206730 }, { "epoch": 1.33, "learning_rate": 9.984768002478427e-05, "loss": 0.0367, "step": 206740 }, { "epoch": 1.33, "learning_rate": 9.983799867042732e-05, "loss": 0.0299, "step": 206750 }, { "epoch": 1.33, "learning_rate": 9.98283173160704e-05, "loss": 0.0319, "step": 206760 }, { "epoch": 1.33, "learning_rate": 9.981863596171347e-05, "loss": 0.0321, "step": 206770 }, { "epoch": 1.33, "learning_rate": 9.980895460735652e-05, "loss": 0.0354, "step": 206780 }, { "epoch": 1.33, "learning_rate": 9.97992732529996e-05, "loss": 0.0303, "step": 206790 }, { "epoch": 1.33, "learning_rate": 9.978959189864266e-05, "loss": 0.0287, "step": 206800 }, { "epoch": 1.33, "learning_rate": 9.977991054428574e-05, "loss": 0.0304, "step": 206810 }, { "epoch": 1.33, "learning_rate": 9.97702291899288e-05, "loss": 0.0278, "step": 206820 }, { "epoch": 1.33, "learning_rate": 9.976054783557186e-05, "loss": 0.0291, "step": 206830 }, { "epoch": 1.33, "learning_rate": 9.975086648121494e-05, "loss": 0.0333, "step": 206840 }, { "epoch": 1.34, "learning_rate": 9.9741185126858e-05, "loss": 0.0327, "step": 206850 }, { "epoch": 1.34, "learning_rate": 9.973150377250108e-05, "loss": 0.0253, "step": 206860 }, { "epoch": 1.34, "learning_rate": 9.972182241814414e-05, "loss": 0.0288, "step": 206870 }, { "epoch": 1.34, "learning_rate": 9.971214106378722e-05, "loss": 0.0275, "step": 206880 }, { "epoch": 1.34, "learning_rate": 9.970245970943027e-05, "loss": 0.0321, "step": 206890 }, { "epoch": 1.34, "learning_rate": 9.969277835507334e-05, "loss": 0.032, "step": 206900 }, { "epoch": 1.34, "learning_rate": 9.968309700071642e-05, "loss": 0.0252, "step": 206910 }, { "epoch": 1.34, "learning_rate": 9.967341564635947e-05, "loss": 0.0317, "step": 206920 }, { "epoch": 1.34, "learning_rate": 9.966373429200254e-05, "loss": 0.0279, "step": 206930 }, { "epoch": 1.34, "learning_rate": 9.965405293764562e-05, "loss": 0.0284, "step": 206940 }, { "epoch": 1.34, "learning_rate": 9.964437158328868e-05, "loss": 0.0292, "step": 206950 }, { "epoch": 1.34, "learning_rate": 9.963469022893175e-05, "loss": 0.0317, "step": 206960 }, { "epoch": 1.34, "learning_rate": 9.962500887457482e-05, "loss": 0.0324, "step": 206970 }, { "epoch": 1.34, "learning_rate": 9.96153275202179e-05, "loss": 0.0344, "step": 206980 }, { "epoch": 1.34, "learning_rate": 9.960564616586095e-05, "loss": 0.0309, "step": 206990 }, { "epoch": 1.34, "learning_rate": 9.959596481150402e-05, "loss": 0.0288, "step": 207000 }, { "epoch": 1.34, "eval_cer": 0.9198942492373743, "eval_loss": 0.02147371508181095, "eval_runtime": 120.1748, "eval_samples_per_second": 16.642, "eval_steps_per_second": 4.161, "step": 207000 }, { "epoch": 1.34, "learning_rate": 9.95862834571471e-05, "loss": 0.029, "step": 207010 }, { "epoch": 1.34, "learning_rate": 9.957660210279016e-05, "loss": 0.0309, "step": 207020 }, { "epoch": 1.34, "learning_rate": 9.956692074843321e-05, "loss": 0.0331, "step": 207030 }, { "epoch": 1.34, "learning_rate": 9.95572393940763e-05, "loss": 0.0278, "step": 207040 }, { "epoch": 1.34, "learning_rate": 9.954755803971936e-05, "loss": 0.026, "step": 207050 }, { "epoch": 1.34, "learning_rate": 9.953787668536243e-05, "loss": 0.0315, "step": 207060 }, { "epoch": 1.34, "learning_rate": 9.95281953310055e-05, "loss": 0.0337, "step": 207070 }, { "epoch": 1.34, "learning_rate": 9.951851397664857e-05, "loss": 0.0323, "step": 207080 }, { "epoch": 1.34, "learning_rate": 9.950883262229164e-05, "loss": 0.027, "step": 207090 }, { "epoch": 1.34, "learning_rate": 9.949915126793469e-05, "loss": 0.0277, "step": 207100 }, { "epoch": 1.34, "learning_rate": 9.948946991357777e-05, "loss": 0.0273, "step": 207110 }, { "epoch": 1.34, "learning_rate": 9.947978855922084e-05, "loss": 0.0259, "step": 207120 }, { "epoch": 1.34, "learning_rate": 9.947010720486389e-05, "loss": 0.0271, "step": 207130 }, { "epoch": 1.34, "learning_rate": 9.946042585050697e-05, "loss": 0.0295, "step": 207140 }, { "epoch": 1.34, "learning_rate": 9.945074449615004e-05, "loss": 0.0336, "step": 207150 }, { "epoch": 1.34, "learning_rate": 9.944106314179312e-05, "loss": 0.0341, "step": 207160 }, { "epoch": 1.34, "learning_rate": 9.943138178743617e-05, "loss": 0.0281, "step": 207170 }, { "epoch": 1.34, "learning_rate": 9.942170043307925e-05, "loss": 0.0332, "step": 207180 }, { "epoch": 1.34, "learning_rate": 9.941201907872232e-05, "loss": 0.0223, "step": 207190 }, { "epoch": 1.34, "learning_rate": 9.940233772436537e-05, "loss": 0.0299, "step": 207200 }, { "epoch": 1.34, "learning_rate": 9.939265637000845e-05, "loss": 0.0281, "step": 207210 }, { "epoch": 1.34, "learning_rate": 9.938297501565151e-05, "loss": 0.0284, "step": 207220 }, { "epoch": 1.34, "learning_rate": 9.93732936612946e-05, "loss": 0.0266, "step": 207230 }, { "epoch": 1.34, "learning_rate": 9.936361230693765e-05, "loss": 0.0319, "step": 207240 }, { "epoch": 1.34, "learning_rate": 9.935393095258071e-05, "loss": 0.028, "step": 207250 }, { "epoch": 1.34, "learning_rate": 9.934424959822379e-05, "loss": 0.0317, "step": 207260 }, { "epoch": 1.34, "learning_rate": 9.933456824386685e-05, "loss": 0.0277, "step": 207270 }, { "epoch": 1.34, "learning_rate": 9.932488688950993e-05, "loss": 0.032, "step": 207280 }, { "epoch": 1.34, "learning_rate": 9.931520553515299e-05, "loss": 0.0267, "step": 207290 }, { "epoch": 1.34, "learning_rate": 9.930552418079607e-05, "loss": 0.0301, "step": 207300 }, { "epoch": 1.34, "learning_rate": 9.929584282643912e-05, "loss": 0.0276, "step": 207310 }, { "epoch": 1.34, "learning_rate": 9.928616147208219e-05, "loss": 0.0289, "step": 207320 }, { "epoch": 1.34, "learning_rate": 9.927648011772527e-05, "loss": 0.0307, "step": 207330 }, { "epoch": 1.34, "learning_rate": 9.926679876336832e-05, "loss": 0.0293, "step": 207340 }, { "epoch": 1.34, "learning_rate": 9.925711740901139e-05, "loss": 0.0309, "step": 207350 }, { "epoch": 1.34, "learning_rate": 9.924743605465447e-05, "loss": 0.031, "step": 207360 }, { "epoch": 1.34, "learning_rate": 9.923775470029753e-05, "loss": 0.0369, "step": 207370 }, { "epoch": 1.34, "learning_rate": 9.92280733459406e-05, "loss": 0.0265, "step": 207380 }, { "epoch": 1.34, "learning_rate": 9.921839199158367e-05, "loss": 0.0294, "step": 207390 }, { "epoch": 1.34, "learning_rate": 9.920871063722675e-05, "loss": 0.0276, "step": 207400 }, { "epoch": 1.34, "learning_rate": 9.91990292828698e-05, "loss": 0.0341, "step": 207410 }, { "epoch": 1.34, "learning_rate": 9.918934792851287e-05, "loss": 0.0261, "step": 207420 }, { "epoch": 1.34, "learning_rate": 9.917966657415595e-05, "loss": 0.0315, "step": 207430 }, { "epoch": 1.34, "learning_rate": 9.916998521979901e-05, "loss": 0.0298, "step": 207440 }, { "epoch": 1.34, "learning_rate": 9.916030386544206e-05, "loss": 0.0258, "step": 207450 }, { "epoch": 1.34, "learning_rate": 9.915062251108514e-05, "loss": 0.0337, "step": 207460 }, { "epoch": 1.34, "learning_rate": 9.914094115672821e-05, "loss": 0.0357, "step": 207470 }, { "epoch": 1.34, "learning_rate": 9.913125980237128e-05, "loss": 0.0292, "step": 207480 }, { "epoch": 1.34, "learning_rate": 9.912157844801434e-05, "loss": 0.0333, "step": 207490 }, { "epoch": 1.34, "learning_rate": 9.911189709365742e-05, "loss": 0.0296, "step": 207500 }, { "epoch": 1.34, "learning_rate": 9.910221573930049e-05, "loss": 0.0293, "step": 207510 }, { "epoch": 1.34, "learning_rate": 9.909253438494354e-05, "loss": 0.0253, "step": 207520 }, { "epoch": 1.34, "learning_rate": 9.908285303058662e-05, "loss": 0.0327, "step": 207530 }, { "epoch": 1.34, "learning_rate": 9.907317167622969e-05, "loss": 0.0347, "step": 207540 }, { "epoch": 1.34, "learning_rate": 9.906349032187274e-05, "loss": 0.0348, "step": 207550 }, { "epoch": 1.34, "learning_rate": 9.905380896751582e-05, "loss": 0.0306, "step": 207560 }, { "epoch": 1.34, "learning_rate": 9.904412761315889e-05, "loss": 0.0316, "step": 207570 }, { "epoch": 1.34, "learning_rate": 9.903444625880197e-05, "loss": 0.0341, "step": 207580 }, { "epoch": 1.34, "learning_rate": 9.902476490444502e-05, "loss": 0.0392, "step": 207590 }, { "epoch": 1.34, "learning_rate": 9.90150835500881e-05, "loss": 0.0362, "step": 207600 }, { "epoch": 1.34, "learning_rate": 9.900540219573117e-05, "loss": 0.028, "step": 207610 }, { "epoch": 1.34, "learning_rate": 9.899572084137422e-05, "loss": 0.0309, "step": 207620 }, { "epoch": 1.34, "learning_rate": 9.89860394870173e-05, "loss": 0.0282, "step": 207630 }, { "epoch": 1.34, "learning_rate": 9.897635813266036e-05, "loss": 0.032, "step": 207640 }, { "epoch": 1.34, "learning_rate": 9.896667677830344e-05, "loss": 0.0362, "step": 207650 }, { "epoch": 1.34, "learning_rate": 9.89569954239465e-05, "loss": 0.0361, "step": 207660 }, { "epoch": 1.34, "learning_rate": 9.894731406958956e-05, "loss": 0.033, "step": 207670 }, { "epoch": 1.34, "learning_rate": 9.893763271523264e-05, "loss": 0.0313, "step": 207680 }, { "epoch": 1.34, "learning_rate": 9.89279513608757e-05, "loss": 0.0338, "step": 207690 }, { "epoch": 1.34, "learning_rate": 9.891827000651877e-05, "loss": 0.0296, "step": 207700 }, { "epoch": 1.34, "learning_rate": 9.890858865216184e-05, "loss": 0.026, "step": 207710 }, { "epoch": 1.34, "learning_rate": 9.889890729780491e-05, "loss": 0.0313, "step": 207720 }, { "epoch": 1.34, "learning_rate": 9.888922594344797e-05, "loss": 0.0295, "step": 207730 }, { "epoch": 1.34, "learning_rate": 9.887954458909104e-05, "loss": 0.0296, "step": 207740 }, { "epoch": 1.34, "learning_rate": 9.886986323473412e-05, "loss": 0.0316, "step": 207750 }, { "epoch": 1.34, "learning_rate": 9.886018188037717e-05, "loss": 0.0263, "step": 207760 }, { "epoch": 1.34, "learning_rate": 9.885050052602024e-05, "loss": 0.0336, "step": 207770 }, { "epoch": 1.34, "learning_rate": 9.884081917166332e-05, "loss": 0.0244, "step": 207780 }, { "epoch": 1.34, "learning_rate": 9.883113781730638e-05, "loss": 0.0278, "step": 207790 }, { "epoch": 1.34, "learning_rate": 9.882145646294945e-05, "loss": 0.0288, "step": 207800 }, { "epoch": 1.34, "learning_rate": 9.881177510859252e-05, "loss": 0.0286, "step": 207810 }, { "epoch": 1.34, "learning_rate": 9.880209375423558e-05, "loss": 0.0285, "step": 207820 }, { "epoch": 1.34, "learning_rate": 9.879241239987865e-05, "loss": 0.0281, "step": 207830 }, { "epoch": 1.34, "learning_rate": 9.878273104552172e-05, "loss": 0.0313, "step": 207840 }, { "epoch": 1.34, "learning_rate": 9.87730496911648e-05, "loss": 0.0306, "step": 207850 }, { "epoch": 1.34, "learning_rate": 9.876336833680786e-05, "loss": 0.0298, "step": 207860 }, { "epoch": 1.34, "learning_rate": 9.875368698245091e-05, "loss": 0.0303, "step": 207870 }, { "epoch": 1.34, "learning_rate": 9.8744005628094e-05, "loss": 0.0314, "step": 207880 }, { "epoch": 1.34, "learning_rate": 9.873432427373706e-05, "loss": 0.0264, "step": 207890 }, { "epoch": 1.34, "learning_rate": 9.872464291938013e-05, "loss": 0.0273, "step": 207900 }, { "epoch": 1.34, "learning_rate": 9.871496156502319e-05, "loss": 0.0271, "step": 207910 }, { "epoch": 1.34, "learning_rate": 9.870528021066626e-05, "loss": 0.0296, "step": 207920 }, { "epoch": 1.34, "learning_rate": 9.869559885630934e-05, "loss": 0.0263, "step": 207930 }, { "epoch": 1.34, "learning_rate": 9.868591750195239e-05, "loss": 0.0297, "step": 207940 }, { "epoch": 1.34, "learning_rate": 9.867623614759547e-05, "loss": 0.033, "step": 207950 }, { "epoch": 1.34, "learning_rate": 9.866655479323854e-05, "loss": 0.0331, "step": 207960 }, { "epoch": 1.34, "learning_rate": 9.865687343888159e-05, "loss": 0.0246, "step": 207970 }, { "epoch": 1.34, "learning_rate": 9.864719208452467e-05, "loss": 0.0303, "step": 207980 }, { "epoch": 1.34, "learning_rate": 9.863751073016774e-05, "loss": 0.0266, "step": 207990 }, { "epoch": 1.34, "learning_rate": 9.862782937581082e-05, "loss": 0.0264, "step": 208000 }, { "epoch": 1.34, "eval_cer": 0.91987888374195, "eval_loss": 0.02161572314798832, "eval_runtime": 120.2015, "eval_samples_per_second": 16.639, "eval_steps_per_second": 4.16, "step": 208000 }, { "epoch": 1.34, "learning_rate": 9.861814802145387e-05, "loss": 0.0352, "step": 208010 }, { "epoch": 1.34, "learning_rate": 9.860846666709694e-05, "loss": 0.0295, "step": 208020 }, { "epoch": 1.34, "learning_rate": 9.859878531274001e-05, "loss": 0.0302, "step": 208030 }, { "epoch": 1.34, "learning_rate": 9.858910395838307e-05, "loss": 0.0315, "step": 208040 }, { "epoch": 1.34, "learning_rate": 9.857942260402615e-05, "loss": 0.0343, "step": 208050 }, { "epoch": 1.34, "learning_rate": 9.856974124966921e-05, "loss": 0.0287, "step": 208060 }, { "epoch": 1.34, "learning_rate": 9.85600598953123e-05, "loss": 0.0283, "step": 208070 }, { "epoch": 1.34, "learning_rate": 9.855037854095535e-05, "loss": 0.0243, "step": 208080 }, { "epoch": 1.34, "learning_rate": 9.854069718659841e-05, "loss": 0.0318, "step": 208090 }, { "epoch": 1.34, "learning_rate": 9.853101583224149e-05, "loss": 0.0308, "step": 208100 }, { "epoch": 1.34, "learning_rate": 9.852133447788454e-05, "loss": 0.0278, "step": 208110 }, { "epoch": 1.34, "learning_rate": 9.851165312352761e-05, "loss": 0.0353, "step": 208120 }, { "epoch": 1.34, "learning_rate": 9.850197176917069e-05, "loss": 0.0323, "step": 208130 }, { "epoch": 1.34, "learning_rate": 9.849229041481376e-05, "loss": 0.0281, "step": 208140 }, { "epoch": 1.34, "learning_rate": 9.848260906045682e-05, "loss": 0.0342, "step": 208150 }, { "epoch": 1.34, "learning_rate": 9.847292770609989e-05, "loss": 0.0262, "step": 208160 }, { "epoch": 1.34, "learning_rate": 9.846324635174297e-05, "loss": 0.0361, "step": 208170 }, { "epoch": 1.34, "learning_rate": 9.845356499738602e-05, "loss": 0.0272, "step": 208180 }, { "epoch": 1.34, "learning_rate": 9.844388364302909e-05, "loss": 0.0292, "step": 208190 }, { "epoch": 1.34, "learning_rate": 9.843420228867217e-05, "loss": 0.0287, "step": 208200 }, { "epoch": 1.34, "learning_rate": 9.842452093431523e-05, "loss": 0.0315, "step": 208210 }, { "epoch": 1.34, "learning_rate": 9.841483957995829e-05, "loss": 0.0259, "step": 208220 }, { "epoch": 1.34, "learning_rate": 9.840515822560137e-05, "loss": 0.0269, "step": 208230 }, { "epoch": 1.34, "learning_rate": 9.839547687124443e-05, "loss": 0.0322, "step": 208240 }, { "epoch": 1.34, "learning_rate": 9.83857955168875e-05, "loss": 0.03, "step": 208250 }, { "epoch": 1.34, "learning_rate": 9.837611416253057e-05, "loss": 0.0272, "step": 208260 }, { "epoch": 1.34, "learning_rate": 9.836643280817365e-05, "loss": 0.0283, "step": 208270 }, { "epoch": 1.34, "learning_rate": 9.835675145381671e-05, "loss": 0.0312, "step": 208280 }, { "epoch": 1.34, "learning_rate": 9.834707009945976e-05, "loss": 0.0278, "step": 208290 }, { "epoch": 1.34, "learning_rate": 9.833738874510284e-05, "loss": 0.0266, "step": 208300 }, { "epoch": 1.34, "learning_rate": 9.832770739074591e-05, "loss": 0.0331, "step": 208310 }, { "epoch": 1.34, "learning_rate": 9.831802603638896e-05, "loss": 0.0324, "step": 208320 }, { "epoch": 1.34, "learning_rate": 9.830834468203204e-05, "loss": 0.034, "step": 208330 }, { "epoch": 1.34, "learning_rate": 9.829866332767511e-05, "loss": 0.0275, "step": 208340 }, { "epoch": 1.34, "learning_rate": 9.828898197331818e-05, "loss": 0.0288, "step": 208350 }, { "epoch": 1.34, "learning_rate": 9.827930061896124e-05, "loss": 0.0321, "step": 208360 }, { "epoch": 1.34, "learning_rate": 9.826961926460432e-05, "loss": 0.0335, "step": 208370 }, { "epoch": 1.34, "learning_rate": 9.825993791024739e-05, "loss": 0.0358, "step": 208380 }, { "epoch": 1.34, "learning_rate": 9.825025655589044e-05, "loss": 0.036, "step": 208390 }, { "epoch": 1.35, "learning_rate": 9.824057520153352e-05, "loss": 0.0321, "step": 208400 }, { "epoch": 1.35, "learning_rate": 9.823089384717659e-05, "loss": 0.0302, "step": 208410 }, { "epoch": 1.35, "learning_rate": 9.822121249281964e-05, "loss": 0.0318, "step": 208420 }, { "epoch": 1.35, "learning_rate": 9.821153113846272e-05, "loss": 0.0323, "step": 208430 }, { "epoch": 1.35, "learning_rate": 9.820184978410578e-05, "loss": 0.0314, "step": 208440 }, { "epoch": 1.35, "learning_rate": 9.819216842974886e-05, "loss": 0.0253, "step": 208450 }, { "epoch": 1.35, "learning_rate": 9.818248707539192e-05, "loss": 0.0295, "step": 208460 }, { "epoch": 1.35, "learning_rate": 9.8172805721035e-05, "loss": 0.0294, "step": 208470 }, { "epoch": 1.35, "learning_rate": 9.816312436667806e-05, "loss": 0.0267, "step": 208480 }, { "epoch": 1.35, "learning_rate": 9.815344301232112e-05, "loss": 0.0254, "step": 208490 }, { "epoch": 1.35, "learning_rate": 9.81437616579642e-05, "loss": 0.0277, "step": 208500 }, { "epoch": 1.35, "learning_rate": 9.813408030360726e-05, "loss": 0.0337, "step": 208510 }, { "epoch": 1.35, "learning_rate": 9.812439894925034e-05, "loss": 0.0299, "step": 208520 }, { "epoch": 1.35, "learning_rate": 9.81147175948934e-05, "loss": 0.0306, "step": 208530 }, { "epoch": 1.35, "learning_rate": 9.810503624053646e-05, "loss": 0.0255, "step": 208540 }, { "epoch": 1.35, "learning_rate": 9.809535488617954e-05, "loss": 0.028, "step": 208550 }, { "epoch": 1.35, "learning_rate": 9.80856735318226e-05, "loss": 0.0291, "step": 208560 }, { "epoch": 1.35, "learning_rate": 9.807599217746567e-05, "loss": 0.028, "step": 208570 }, { "epoch": 1.35, "learning_rate": 9.806631082310874e-05, "loss": 0.0317, "step": 208580 }, { "epoch": 1.35, "learning_rate": 9.805662946875182e-05, "loss": 0.0279, "step": 208590 }, { "epoch": 1.35, "learning_rate": 9.804694811439487e-05, "loss": 0.0303, "step": 208600 }, { "epoch": 1.35, "learning_rate": 9.803726676003794e-05, "loss": 0.0261, "step": 208610 }, { "epoch": 1.35, "learning_rate": 9.802758540568102e-05, "loss": 0.0333, "step": 208620 }, { "epoch": 1.35, "learning_rate": 9.801790405132407e-05, "loss": 0.0331, "step": 208630 }, { "epoch": 1.35, "learning_rate": 9.800822269696714e-05, "loss": 0.0299, "step": 208640 }, { "epoch": 1.35, "learning_rate": 9.799854134261022e-05, "loss": 0.0335, "step": 208650 }, { "epoch": 1.35, "learning_rate": 9.798885998825328e-05, "loss": 0.0337, "step": 208660 }, { "epoch": 1.35, "learning_rate": 9.797917863389635e-05, "loss": 0.0257, "step": 208670 }, { "epoch": 1.35, "learning_rate": 9.796949727953942e-05, "loss": 0.0286, "step": 208680 }, { "epoch": 1.35, "learning_rate": 9.79598159251825e-05, "loss": 0.0272, "step": 208690 }, { "epoch": 1.35, "learning_rate": 9.795013457082555e-05, "loss": 0.0332, "step": 208700 }, { "epoch": 1.35, "learning_rate": 9.794045321646861e-05, "loss": 0.0285, "step": 208710 }, { "epoch": 1.35, "learning_rate": 9.79307718621117e-05, "loss": 0.0244, "step": 208720 }, { "epoch": 1.35, "learning_rate": 9.792109050775476e-05, "loss": 0.028, "step": 208730 }, { "epoch": 1.35, "learning_rate": 9.791140915339781e-05, "loss": 0.0278, "step": 208740 }, { "epoch": 1.35, "learning_rate": 9.790172779904089e-05, "loss": 0.0266, "step": 208750 }, { "epoch": 1.35, "learning_rate": 9.789204644468396e-05, "loss": 0.0282, "step": 208760 }, { "epoch": 1.35, "learning_rate": 9.788236509032703e-05, "loss": 0.0312, "step": 208770 }, { "epoch": 1.35, "learning_rate": 9.787268373597009e-05, "loss": 0.0272, "step": 208780 }, { "epoch": 1.35, "learning_rate": 9.786300238161317e-05, "loss": 0.0323, "step": 208790 }, { "epoch": 1.35, "learning_rate": 9.785332102725624e-05, "loss": 0.0277, "step": 208800 }, { "epoch": 1.35, "learning_rate": 9.784363967289929e-05, "loss": 0.0297, "step": 208810 }, { "epoch": 1.35, "learning_rate": 9.783395831854237e-05, "loss": 0.0275, "step": 208820 }, { "epoch": 1.35, "learning_rate": 9.782427696418544e-05, "loss": 0.028, "step": 208830 }, { "epoch": 1.35, "learning_rate": 9.781459560982849e-05, "loss": 0.026, "step": 208840 }, { "epoch": 1.35, "learning_rate": 9.780491425547157e-05, "loss": 0.0295, "step": 208850 }, { "epoch": 1.35, "learning_rate": 9.779523290111463e-05, "loss": 0.0239, "step": 208860 }, { "epoch": 1.35, "learning_rate": 9.778555154675771e-05, "loss": 0.0269, "step": 208870 }, { "epoch": 1.35, "learning_rate": 9.777587019240077e-05, "loss": 0.0334, "step": 208880 }, { "epoch": 1.35, "learning_rate": 9.776618883804385e-05, "loss": 0.0323, "step": 208890 }, { "epoch": 1.35, "learning_rate": 9.775650748368691e-05, "loss": 0.0267, "step": 208900 }, { "epoch": 1.35, "learning_rate": 9.774682612932997e-05, "loss": 0.0257, "step": 208910 }, { "epoch": 1.35, "learning_rate": 9.773714477497305e-05, "loss": 0.0325, "step": 208920 }, { "epoch": 1.35, "learning_rate": 9.772746342061611e-05, "loss": 0.0305, "step": 208930 }, { "epoch": 1.35, "learning_rate": 9.771778206625919e-05, "loss": 0.0303, "step": 208940 }, { "epoch": 1.35, "learning_rate": 9.770810071190224e-05, "loss": 0.0266, "step": 208950 }, { "epoch": 1.35, "learning_rate": 9.769841935754531e-05, "loss": 0.0333, "step": 208960 }, { "epoch": 1.35, "learning_rate": 9.768873800318839e-05, "loss": 0.0313, "step": 208970 }, { "epoch": 1.35, "learning_rate": 9.767905664883144e-05, "loss": 0.0286, "step": 208980 }, { "epoch": 1.35, "learning_rate": 9.766937529447452e-05, "loss": 0.0304, "step": 208990 }, { "epoch": 1.35, "learning_rate": 9.765969394011759e-05, "loss": 0.0341, "step": 209000 }, { "epoch": 1.35, "eval_cer": 0.919940345723647, "eval_loss": 0.021424537524580956, "eval_runtime": 120.0847, "eval_samples_per_second": 16.655, "eval_steps_per_second": 4.164, "step": 209000 }, { "epoch": 1.35, "learning_rate": 9.765001258576066e-05, "loss": 0.0322, "step": 209010 }, { "epoch": 1.35, "learning_rate": 9.764033123140372e-05, "loss": 0.0329, "step": 209020 }, { "epoch": 1.35, "learning_rate": 9.763064987704679e-05, "loss": 0.033, "step": 209030 }, { "epoch": 1.35, "learning_rate": 9.762096852268987e-05, "loss": 0.0318, "step": 209040 }, { "epoch": 1.35, "learning_rate": 9.761128716833292e-05, "loss": 0.0308, "step": 209050 }, { "epoch": 1.35, "learning_rate": 9.760160581397599e-05, "loss": 0.027, "step": 209060 }, { "epoch": 1.35, "learning_rate": 9.759192445961907e-05, "loss": 0.0289, "step": 209070 }, { "epoch": 1.35, "learning_rate": 9.758224310526213e-05, "loss": 0.0294, "step": 209080 }, { "epoch": 1.35, "learning_rate": 9.75725617509052e-05, "loss": 0.0308, "step": 209090 }, { "epoch": 1.35, "learning_rate": 9.756288039654827e-05, "loss": 0.026, "step": 209100 }, { "epoch": 1.35, "learning_rate": 9.755319904219133e-05, "loss": 0.0319, "step": 209110 }, { "epoch": 1.35, "learning_rate": 9.75435176878344e-05, "loss": 0.0304, "step": 209120 }, { "epoch": 1.35, "learning_rate": 9.753383633347746e-05, "loss": 0.0266, "step": 209130 }, { "epoch": 1.35, "learning_rate": 9.752415497912054e-05, "loss": 0.0327, "step": 209140 }, { "epoch": 1.35, "learning_rate": 9.751447362476361e-05, "loss": 0.0238, "step": 209150 }, { "epoch": 1.35, "learning_rate": 9.750479227040666e-05, "loss": 0.033, "step": 209160 }, { "epoch": 1.35, "learning_rate": 9.749511091604974e-05, "loss": 0.0298, "step": 209170 }, { "epoch": 1.35, "learning_rate": 9.748542956169281e-05, "loss": 0.0324, "step": 209180 }, { "epoch": 1.35, "learning_rate": 9.747574820733587e-05, "loss": 0.0268, "step": 209190 }, { "epoch": 1.35, "learning_rate": 9.746606685297894e-05, "loss": 0.0278, "step": 209200 }, { "epoch": 1.35, "learning_rate": 9.745638549862201e-05, "loss": 0.03, "step": 209210 }, { "epoch": 1.35, "learning_rate": 9.744670414426509e-05, "loss": 0.0323, "step": 209220 }, { "epoch": 1.35, "learning_rate": 9.743702278990814e-05, "loss": 0.0285, "step": 209230 }, { "epoch": 1.35, "learning_rate": 9.742734143555122e-05, "loss": 0.0308, "step": 209240 }, { "epoch": 1.35, "learning_rate": 9.741766008119429e-05, "loss": 0.0297, "step": 209250 }, { "epoch": 1.35, "learning_rate": 9.740797872683734e-05, "loss": 0.035, "step": 209260 }, { "epoch": 1.35, "learning_rate": 9.739829737248042e-05, "loss": 0.0303, "step": 209270 }, { "epoch": 1.35, "learning_rate": 9.738861601812348e-05, "loss": 0.0303, "step": 209280 }, { "epoch": 1.35, "learning_rate": 9.737893466376656e-05, "loss": 0.0297, "step": 209290 }, { "epoch": 1.35, "learning_rate": 9.736925330940962e-05, "loss": 0.0295, "step": 209300 }, { "epoch": 1.35, "learning_rate": 9.735957195505268e-05, "loss": 0.0262, "step": 209310 }, { "epoch": 1.35, "learning_rate": 9.734989060069576e-05, "loss": 0.0346, "step": 209320 }, { "epoch": 1.35, "learning_rate": 9.734020924633882e-05, "loss": 0.0272, "step": 209330 }, { "epoch": 1.35, "learning_rate": 9.73305278919819e-05, "loss": 0.0289, "step": 209340 }, { "epoch": 1.35, "learning_rate": 9.732084653762496e-05, "loss": 0.0227, "step": 209350 }, { "epoch": 1.35, "learning_rate": 9.731116518326804e-05, "loss": 0.0285, "step": 209360 }, { "epoch": 1.35, "learning_rate": 9.73014838289111e-05, "loss": 0.0292, "step": 209370 }, { "epoch": 1.35, "learning_rate": 9.729180247455416e-05, "loss": 0.026, "step": 209380 }, { "epoch": 1.35, "learning_rate": 9.728212112019724e-05, "loss": 0.0269, "step": 209390 }, { "epoch": 1.35, "learning_rate": 9.727243976584029e-05, "loss": 0.0291, "step": 209400 }, { "epoch": 1.35, "learning_rate": 9.726275841148336e-05, "loss": 0.028, "step": 209410 }, { "epoch": 1.35, "learning_rate": 9.725307705712644e-05, "loss": 0.0292, "step": 209420 }, { "epoch": 1.35, "learning_rate": 9.72433957027695e-05, "loss": 0.03, "step": 209430 }, { "epoch": 1.35, "learning_rate": 9.723371434841257e-05, "loss": 0.0288, "step": 209440 }, { "epoch": 1.35, "learning_rate": 9.722403299405564e-05, "loss": 0.0306, "step": 209450 }, { "epoch": 1.35, "learning_rate": 9.721435163969872e-05, "loss": 0.0279, "step": 209460 }, { "epoch": 1.35, "learning_rate": 9.720467028534177e-05, "loss": 0.0315, "step": 209470 }, { "epoch": 1.35, "learning_rate": 9.719498893098484e-05, "loss": 0.0268, "step": 209480 }, { "epoch": 1.35, "learning_rate": 9.718530757662792e-05, "loss": 0.0324, "step": 209490 }, { "epoch": 1.35, "learning_rate": 9.717562622227098e-05, "loss": 0.0253, "step": 209500 }, { "epoch": 1.35, "learning_rate": 9.716594486791404e-05, "loss": 0.0345, "step": 209510 }, { "epoch": 1.35, "learning_rate": 9.715626351355711e-05, "loss": 0.028, "step": 209520 }, { "epoch": 1.35, "learning_rate": 9.714658215920018e-05, "loss": 0.0296, "step": 209530 }, { "epoch": 1.35, "learning_rate": 9.713690080484325e-05, "loss": 0.0348, "step": 209540 }, { "epoch": 1.35, "learning_rate": 9.712721945048631e-05, "loss": 0.0311, "step": 209550 }, { "epoch": 1.35, "learning_rate": 9.71175380961294e-05, "loss": 0.0243, "step": 209560 }, { "epoch": 1.35, "learning_rate": 9.710785674177246e-05, "loss": 0.0288, "step": 209570 }, { "epoch": 1.35, "learning_rate": 9.709817538741551e-05, "loss": 0.0306, "step": 209580 }, { "epoch": 1.35, "learning_rate": 9.708849403305859e-05, "loss": 0.0327, "step": 209590 }, { "epoch": 1.35, "learning_rate": 9.707881267870166e-05, "loss": 0.0321, "step": 209600 }, { "epoch": 1.35, "learning_rate": 9.706913132434471e-05, "loss": 0.026, "step": 209610 }, { "epoch": 1.35, "learning_rate": 9.705944996998779e-05, "loss": 0.0254, "step": 209620 }, { "epoch": 1.35, "learning_rate": 9.704976861563086e-05, "loss": 0.0326, "step": 209630 }, { "epoch": 1.35, "learning_rate": 9.704008726127394e-05, "loss": 0.0301, "step": 209640 }, { "epoch": 1.35, "learning_rate": 9.703040590691699e-05, "loss": 0.0292, "step": 209650 }, { "epoch": 1.35, "learning_rate": 9.702072455256007e-05, "loss": 0.0305, "step": 209660 }, { "epoch": 1.35, "learning_rate": 9.701104319820314e-05, "loss": 0.0292, "step": 209670 }, { "epoch": 1.35, "learning_rate": 9.700136184384619e-05, "loss": 0.0334, "step": 209680 }, { "epoch": 1.35, "learning_rate": 9.699168048948927e-05, "loss": 0.0314, "step": 209690 }, { "epoch": 1.35, "learning_rate": 9.698199913513233e-05, "loss": 0.028, "step": 209700 }, { "epoch": 1.35, "learning_rate": 9.697231778077541e-05, "loss": 0.0282, "step": 209710 }, { "epoch": 1.35, "learning_rate": 9.696263642641847e-05, "loss": 0.0296, "step": 209720 }, { "epoch": 1.35, "learning_rate": 9.695295507206153e-05, "loss": 0.0283, "step": 209730 }, { "epoch": 1.35, "learning_rate": 9.694327371770461e-05, "loss": 0.0367, "step": 209740 }, { "epoch": 1.35, "learning_rate": 9.693359236334767e-05, "loss": 0.0296, "step": 209750 }, { "epoch": 1.35, "learning_rate": 9.692391100899075e-05, "loss": 0.0251, "step": 209760 }, { "epoch": 1.35, "learning_rate": 9.691422965463381e-05, "loss": 0.0273, "step": 209770 }, { "epoch": 1.35, "learning_rate": 9.690454830027689e-05, "loss": 0.0304, "step": 209780 }, { "epoch": 1.35, "learning_rate": 9.689486694591994e-05, "loss": 0.0334, "step": 209790 }, { "epoch": 1.35, "learning_rate": 9.688518559156301e-05, "loss": 0.0327, "step": 209800 }, { "epoch": 1.35, "learning_rate": 9.687550423720609e-05, "loss": 0.0308, "step": 209810 }, { "epoch": 1.35, "learning_rate": 9.686582288284914e-05, "loss": 0.0267, "step": 209820 }, { "epoch": 1.35, "learning_rate": 9.685614152849221e-05, "loss": 0.0293, "step": 209830 }, { "epoch": 1.35, "learning_rate": 9.684646017413529e-05, "loss": 0.0328, "step": 209840 }, { "epoch": 1.35, "learning_rate": 9.683677881977836e-05, "loss": 0.0307, "step": 209850 }, { "epoch": 1.35, "learning_rate": 9.682709746542142e-05, "loss": 0.0323, "step": 209860 }, { "epoch": 1.35, "learning_rate": 9.681741611106449e-05, "loss": 0.0255, "step": 209870 }, { "epoch": 1.35, "learning_rate": 9.680773475670757e-05, "loss": 0.0291, "step": 209880 }, { "epoch": 1.35, "learning_rate": 9.679805340235062e-05, "loss": 0.0323, "step": 209890 }, { "epoch": 1.35, "learning_rate": 9.678837204799369e-05, "loss": 0.0256, "step": 209900 }, { "epoch": 1.35, "learning_rate": 9.677869069363677e-05, "loss": 0.0319, "step": 209910 }, { "epoch": 1.35, "learning_rate": 9.676900933927983e-05, "loss": 0.036, "step": 209920 }, { "epoch": 1.35, "learning_rate": 9.675932798492289e-05, "loss": 0.0298, "step": 209930 }, { "epoch": 1.35, "learning_rate": 9.674964663056596e-05, "loss": 0.0284, "step": 209940 }, { "epoch": 1.36, "learning_rate": 9.673996527620903e-05, "loss": 0.0312, "step": 209950 }, { "epoch": 1.36, "learning_rate": 9.67302839218521e-05, "loss": 0.0301, "step": 209960 }, { "epoch": 1.36, "learning_rate": 9.672060256749516e-05, "loss": 0.0285, "step": 209970 }, { "epoch": 1.36, "learning_rate": 9.671092121313824e-05, "loss": 0.0422, "step": 209980 }, { "epoch": 1.36, "learning_rate": 9.670123985878131e-05, "loss": 0.0268, "step": 209990 }, { "epoch": 1.36, "learning_rate": 9.669155850442436e-05, "loss": 0.029, "step": 210000 }, { "epoch": 1.36, "eval_cer": 0.9199105185854706, "eval_loss": 0.021298963576555252, "eval_runtime": 120.106, "eval_samples_per_second": 16.652, "eval_steps_per_second": 4.163, "step": 210000 }, { "epoch": 1.36, "learning_rate": 9.668187715006744e-05, "loss": 0.0273, "step": 210010 }, { "epoch": 1.36, "learning_rate": 9.667219579571051e-05, "loss": 0.0299, "step": 210020 }, { "epoch": 1.36, "learning_rate": 9.666251444135356e-05, "loss": 0.0283, "step": 210030 }, { "epoch": 1.36, "learning_rate": 9.665283308699664e-05, "loss": 0.0274, "step": 210040 }, { "epoch": 1.36, "learning_rate": 9.664315173263971e-05, "loss": 0.0297, "step": 210050 }, { "epoch": 1.36, "learning_rate": 9.663347037828279e-05, "loss": 0.0345, "step": 210060 }, { "epoch": 1.36, "learning_rate": 9.662378902392584e-05, "loss": 0.0268, "step": 210070 }, { "epoch": 1.36, "learning_rate": 9.661410766956892e-05, "loss": 0.0269, "step": 210080 }, { "epoch": 1.36, "learning_rate": 9.660442631521199e-05, "loss": 0.0306, "step": 210090 }, { "epoch": 1.36, "learning_rate": 9.659474496085504e-05, "loss": 0.0261, "step": 210100 }, { "epoch": 1.36, "learning_rate": 9.658506360649812e-05, "loss": 0.0302, "step": 210110 }, { "epoch": 1.36, "learning_rate": 9.657538225214118e-05, "loss": 0.0309, "step": 210120 }, { "epoch": 1.36, "learning_rate": 9.656570089778426e-05, "loss": 0.034, "step": 210130 }, { "epoch": 1.36, "learning_rate": 9.655601954342732e-05, "loss": 0.0275, "step": 210140 }, { "epoch": 1.36, "learning_rate": 9.654633818907038e-05, "loss": 0.027, "step": 210150 }, { "epoch": 1.36, "learning_rate": 9.653665683471346e-05, "loss": 0.0365, "step": 210160 }, { "epoch": 1.36, "learning_rate": 9.652697548035652e-05, "loss": 0.0301, "step": 210170 }, { "epoch": 1.36, "learning_rate": 9.65172941259996e-05, "loss": 0.0259, "step": 210180 }, { "epoch": 1.36, "learning_rate": 9.650761277164266e-05, "loss": 0.0345, "step": 210190 }, { "epoch": 1.36, "learning_rate": 9.649793141728573e-05, "loss": 0.0331, "step": 210200 }, { "epoch": 1.36, "learning_rate": 9.64882500629288e-05, "loss": 0.0372, "step": 210210 }, { "epoch": 1.36, "learning_rate": 9.647856870857186e-05, "loss": 0.0323, "step": 210220 }, { "epoch": 1.36, "learning_rate": 9.646888735421494e-05, "loss": 0.0277, "step": 210230 }, { "epoch": 1.36, "learning_rate": 9.645920599985799e-05, "loss": 0.0301, "step": 210240 }, { "epoch": 1.36, "learning_rate": 9.644952464550106e-05, "loss": 0.0289, "step": 210250 }, { "epoch": 1.36, "learning_rate": 9.643984329114414e-05, "loss": 0.0238, "step": 210260 }, { "epoch": 1.36, "learning_rate": 9.64301619367872e-05, "loss": 0.0293, "step": 210270 }, { "epoch": 1.36, "learning_rate": 9.642048058243027e-05, "loss": 0.0241, "step": 210280 }, { "epoch": 1.36, "learning_rate": 9.641079922807334e-05, "loss": 0.0268, "step": 210290 }, { "epoch": 1.36, "learning_rate": 9.64011178737164e-05, "loss": 0.0286, "step": 210300 }, { "epoch": 1.36, "learning_rate": 9.639143651935947e-05, "loss": 0.0267, "step": 210310 }, { "epoch": 1.36, "learning_rate": 9.638175516500254e-05, "loss": 0.0277, "step": 210320 }, { "epoch": 1.36, "learning_rate": 9.637207381064562e-05, "loss": 0.03, "step": 210330 }, { "epoch": 1.36, "learning_rate": 9.636239245628868e-05, "loss": 0.0284, "step": 210340 }, { "epoch": 1.36, "learning_rate": 9.635271110193173e-05, "loss": 0.0316, "step": 210350 }, { "epoch": 1.36, "learning_rate": 9.634302974757481e-05, "loss": 0.0271, "step": 210360 }, { "epoch": 1.36, "learning_rate": 9.633334839321788e-05, "loss": 0.0259, "step": 210370 }, { "epoch": 1.36, "learning_rate": 9.632366703886095e-05, "loss": 0.0277, "step": 210380 }, { "epoch": 1.36, "learning_rate": 9.631398568450401e-05, "loss": 0.0325, "step": 210390 }, { "epoch": 1.36, "learning_rate": 9.630430433014708e-05, "loss": 0.0279, "step": 210400 }, { "epoch": 1.36, "learning_rate": 9.629462297579016e-05, "loss": 0.0301, "step": 210410 }, { "epoch": 1.36, "learning_rate": 9.628494162143321e-05, "loss": 0.0263, "step": 210420 }, { "epoch": 1.36, "learning_rate": 9.627526026707629e-05, "loss": 0.032, "step": 210430 }, { "epoch": 1.36, "learning_rate": 9.626557891271936e-05, "loss": 0.029, "step": 210440 }, { "epoch": 1.36, "learning_rate": 9.625589755836241e-05, "loss": 0.0287, "step": 210450 }, { "epoch": 1.36, "learning_rate": 9.624621620400549e-05, "loss": 0.0297, "step": 210460 }, { "epoch": 1.36, "learning_rate": 9.623653484964856e-05, "loss": 0.0325, "step": 210470 }, { "epoch": 1.36, "learning_rate": 9.622685349529164e-05, "loss": 0.0329, "step": 210480 }, { "epoch": 1.36, "learning_rate": 9.621717214093469e-05, "loss": 0.026, "step": 210490 }, { "epoch": 1.36, "learning_rate": 9.620749078657776e-05, "loss": 0.0288, "step": 210500 }, { "epoch": 1.36, "learning_rate": 9.619780943222084e-05, "loss": 0.0314, "step": 210510 }, { "epoch": 1.36, "learning_rate": 9.618812807786389e-05, "loss": 0.0305, "step": 210520 }, { "epoch": 1.36, "learning_rate": 9.617844672350697e-05, "loss": 0.0336, "step": 210530 }, { "epoch": 1.36, "learning_rate": 9.616876536915003e-05, "loss": 0.0336, "step": 210540 }, { "epoch": 1.36, "learning_rate": 9.615908401479311e-05, "loss": 0.0247, "step": 210550 }, { "epoch": 1.36, "learning_rate": 9.614940266043617e-05, "loss": 0.034, "step": 210560 }, { "epoch": 1.36, "learning_rate": 9.613972130607923e-05, "loss": 0.0268, "step": 210570 }, { "epoch": 1.36, "learning_rate": 9.613003995172231e-05, "loss": 0.0299, "step": 210580 }, { "epoch": 1.36, "learning_rate": 9.612035859736537e-05, "loss": 0.0296, "step": 210590 }, { "epoch": 1.36, "learning_rate": 9.611067724300843e-05, "loss": 0.0327, "step": 210600 }, { "epoch": 1.36, "learning_rate": 9.610099588865151e-05, "loss": 0.0295, "step": 210610 }, { "epoch": 1.36, "learning_rate": 9.609131453429458e-05, "loss": 0.0282, "step": 210620 }, { "epoch": 1.36, "learning_rate": 9.608163317993764e-05, "loss": 0.0303, "step": 210630 }, { "epoch": 1.36, "learning_rate": 9.607195182558071e-05, "loss": 0.0271, "step": 210640 }, { "epoch": 1.36, "learning_rate": 9.606227047122379e-05, "loss": 0.0281, "step": 210650 }, { "epoch": 1.36, "learning_rate": 9.605258911686684e-05, "loss": 0.0263, "step": 210660 }, { "epoch": 1.36, "learning_rate": 9.604290776250991e-05, "loss": 0.0342, "step": 210670 }, { "epoch": 1.36, "learning_rate": 9.603322640815299e-05, "loss": 0.029, "step": 210680 }, { "epoch": 1.36, "learning_rate": 9.602354505379605e-05, "loss": 0.0265, "step": 210690 }, { "epoch": 1.36, "learning_rate": 9.601386369943911e-05, "loss": 0.0308, "step": 210700 }, { "epoch": 1.36, "learning_rate": 9.600418234508219e-05, "loss": 0.032, "step": 210710 }, { "epoch": 1.36, "learning_rate": 9.599450099072525e-05, "loss": 0.0326, "step": 210720 }, { "epoch": 1.36, "learning_rate": 9.598481963636832e-05, "loss": 0.0345, "step": 210730 }, { "epoch": 1.36, "learning_rate": 9.597513828201139e-05, "loss": 0.0286, "step": 210740 }, { "epoch": 1.36, "learning_rate": 9.596545692765447e-05, "loss": 0.0351, "step": 210750 }, { "epoch": 1.36, "learning_rate": 9.595577557329753e-05, "loss": 0.0347, "step": 210760 }, { "epoch": 1.36, "learning_rate": 9.594609421894058e-05, "loss": 0.0311, "step": 210770 }, { "epoch": 1.36, "learning_rate": 9.593641286458366e-05, "loss": 0.032, "step": 210780 }, { "epoch": 1.36, "learning_rate": 9.592673151022673e-05, "loss": 0.0342, "step": 210790 }, { "epoch": 1.36, "learning_rate": 9.59170501558698e-05, "loss": 0.0299, "step": 210800 }, { "epoch": 1.36, "learning_rate": 9.590736880151286e-05, "loss": 0.0325, "step": 210810 }, { "epoch": 1.36, "learning_rate": 9.589768744715593e-05, "loss": 0.0276, "step": 210820 }, { "epoch": 1.36, "learning_rate": 9.588800609279901e-05, "loss": 0.0263, "step": 210830 }, { "epoch": 1.36, "learning_rate": 9.587832473844206e-05, "loss": 0.0302, "step": 210840 }, { "epoch": 1.36, "learning_rate": 9.586864338408514e-05, "loss": 0.0309, "step": 210850 }, { "epoch": 1.36, "learning_rate": 9.585896202972821e-05, "loss": 0.0341, "step": 210860 }, { "epoch": 1.36, "learning_rate": 9.584928067537126e-05, "loss": 0.0299, "step": 210870 }, { "epoch": 1.36, "learning_rate": 9.583959932101434e-05, "loss": 0.0334, "step": 210880 }, { "epoch": 1.36, "learning_rate": 9.58299179666574e-05, "loss": 0.0275, "step": 210890 }, { "epoch": 1.36, "learning_rate": 9.582023661230049e-05, "loss": 0.0332, "step": 210900 }, { "epoch": 1.36, "learning_rate": 9.581055525794354e-05, "loss": 0.0327, "step": 210910 }, { "epoch": 1.36, "learning_rate": 9.58008739035866e-05, "loss": 0.0275, "step": 210920 }, { "epoch": 1.36, "learning_rate": 9.579119254922969e-05, "loss": 0.0292, "step": 210930 }, { "epoch": 1.36, "learning_rate": 9.578151119487274e-05, "loss": 0.0264, "step": 210940 }, { "epoch": 1.36, "learning_rate": 9.577182984051582e-05, "loss": 0.028, "step": 210950 }, { "epoch": 1.36, "learning_rate": 9.576214848615888e-05, "loss": 0.031, "step": 210960 }, { "epoch": 1.36, "learning_rate": 9.575246713180196e-05, "loss": 0.0295, "step": 210970 }, { "epoch": 1.36, "learning_rate": 9.574278577744502e-05, "loss": 0.0311, "step": 210980 }, { "epoch": 1.36, "learning_rate": 9.573310442308808e-05, "loss": 0.0286, "step": 210990 }, { "epoch": 1.36, "learning_rate": 9.572342306873116e-05, "loss": 0.0281, "step": 211000 }, { "epoch": 1.36, "eval_cer": 0.9198364026663653, "eval_loss": 0.021836968138813972, "eval_runtime": 120.1382, "eval_samples_per_second": 16.647, "eval_steps_per_second": 4.162, "step": 211000 }, { "epoch": 1.36, "learning_rate": 9.571374171437422e-05, "loss": 0.0298, "step": 211010 }, { "epoch": 1.36, "learning_rate": 9.570406036001728e-05, "loss": 0.0298, "step": 211020 }, { "epoch": 1.36, "learning_rate": 9.569437900566036e-05, "loss": 0.0268, "step": 211030 }, { "epoch": 1.36, "learning_rate": 9.568469765130343e-05, "loss": 0.0221, "step": 211040 }, { "epoch": 1.36, "learning_rate": 9.56750162969465e-05, "loss": 0.0275, "step": 211050 }, { "epoch": 1.36, "learning_rate": 9.566533494258956e-05, "loss": 0.0284, "step": 211060 }, { "epoch": 1.36, "learning_rate": 9.565565358823264e-05, "loss": 0.0303, "step": 211070 }, { "epoch": 1.36, "learning_rate": 9.564597223387569e-05, "loss": 0.0323, "step": 211080 }, { "epoch": 1.36, "learning_rate": 9.563629087951876e-05, "loss": 0.0308, "step": 211090 }, { "epoch": 1.36, "learning_rate": 9.562660952516184e-05, "loss": 0.033, "step": 211100 }, { "epoch": 1.36, "learning_rate": 9.56169281708049e-05, "loss": 0.0396, "step": 211110 }, { "epoch": 1.36, "learning_rate": 9.560724681644796e-05, "loss": 0.0297, "step": 211120 }, { "epoch": 1.36, "learning_rate": 9.559756546209104e-05, "loss": 0.0239, "step": 211130 }, { "epoch": 1.36, "learning_rate": 9.55878841077341e-05, "loss": 0.0275, "step": 211140 }, { "epoch": 1.36, "learning_rate": 9.557820275337717e-05, "loss": 0.0243, "step": 211150 }, { "epoch": 1.36, "learning_rate": 9.556852139902024e-05, "loss": 0.0292, "step": 211160 }, { "epoch": 1.36, "learning_rate": 9.555884004466332e-05, "loss": 0.0267, "step": 211170 }, { "epoch": 1.36, "learning_rate": 9.554915869030638e-05, "loss": 0.0296, "step": 211180 }, { "epoch": 1.36, "learning_rate": 9.553947733594943e-05, "loss": 0.0318, "step": 211190 }, { "epoch": 1.36, "learning_rate": 9.552979598159251e-05, "loss": 0.0307, "step": 211200 }, { "epoch": 1.36, "learning_rate": 9.552011462723558e-05, "loss": 0.0275, "step": 211210 }, { "epoch": 1.36, "learning_rate": 9.551043327287863e-05, "loss": 0.0328, "step": 211220 }, { "epoch": 1.36, "learning_rate": 9.550075191852171e-05, "loss": 0.0315, "step": 211230 }, { "epoch": 1.36, "learning_rate": 9.549107056416478e-05, "loss": 0.0325, "step": 211240 }, { "epoch": 1.36, "learning_rate": 9.548138920980786e-05, "loss": 0.0323, "step": 211250 }, { "epoch": 1.36, "learning_rate": 9.547170785545091e-05, "loss": 0.0299, "step": 211260 }, { "epoch": 1.36, "learning_rate": 9.546202650109399e-05, "loss": 0.0315, "step": 211270 }, { "epoch": 1.36, "learning_rate": 9.545234514673706e-05, "loss": 0.0291, "step": 211280 }, { "epoch": 1.36, "learning_rate": 9.544266379238011e-05, "loss": 0.0306, "step": 211290 }, { "epoch": 1.36, "learning_rate": 9.543298243802319e-05, "loss": 0.0265, "step": 211300 }, { "epoch": 1.36, "learning_rate": 9.542330108366626e-05, "loss": 0.0268, "step": 211310 }, { "epoch": 1.36, "learning_rate": 9.541361972930934e-05, "loss": 0.0309, "step": 211320 }, { "epoch": 1.36, "learning_rate": 9.540393837495239e-05, "loss": 0.0358, "step": 211330 }, { "epoch": 1.36, "learning_rate": 9.539425702059546e-05, "loss": 0.0314, "step": 211340 }, { "epoch": 1.36, "learning_rate": 9.538457566623853e-05, "loss": 0.0308, "step": 211350 }, { "epoch": 1.36, "learning_rate": 9.537489431188159e-05, "loss": 0.0346, "step": 211360 }, { "epoch": 1.36, "learning_rate": 9.536521295752467e-05, "loss": 0.031, "step": 211370 }, { "epoch": 1.36, "learning_rate": 9.535553160316773e-05, "loss": 0.0287, "step": 211380 }, { "epoch": 1.36, "learning_rate": 9.534585024881081e-05, "loss": 0.0329, "step": 211390 }, { "epoch": 1.36, "learning_rate": 9.533616889445387e-05, "loss": 0.0307, "step": 211400 }, { "epoch": 1.36, "learning_rate": 9.532648754009693e-05, "loss": 0.0239, "step": 211410 }, { "epoch": 1.36, "learning_rate": 9.531680618574001e-05, "loss": 0.0351, "step": 211420 }, { "epoch": 1.36, "learning_rate": 9.530712483138306e-05, "loss": 0.0351, "step": 211430 }, { "epoch": 1.36, "learning_rate": 9.529744347702613e-05, "loss": 0.0248, "step": 211440 }, { "epoch": 1.36, "learning_rate": 9.528776212266921e-05, "loss": 0.0309, "step": 211450 }, { "epoch": 1.36, "learning_rate": 9.527808076831228e-05, "loss": 0.0283, "step": 211460 }, { "epoch": 1.36, "learning_rate": 9.526839941395534e-05, "loss": 0.0319, "step": 211470 }, { "epoch": 1.36, "learning_rate": 9.525871805959841e-05, "loss": 0.0307, "step": 211480 }, { "epoch": 1.37, "learning_rate": 9.524903670524149e-05, "loss": 0.0277, "step": 211490 }, { "epoch": 1.37, "learning_rate": 9.523935535088454e-05, "loss": 0.0287, "step": 211500 }, { "epoch": 1.37, "learning_rate": 9.522967399652761e-05, "loss": 0.0272, "step": 211510 }, { "epoch": 1.37, "learning_rate": 9.521999264217069e-05, "loss": 0.0353, "step": 211520 }, { "epoch": 1.37, "learning_rate": 9.521031128781375e-05, "loss": 0.036, "step": 211530 }, { "epoch": 1.37, "learning_rate": 9.520062993345681e-05, "loss": 0.0358, "step": 211540 }, { "epoch": 1.37, "learning_rate": 9.519094857909989e-05, "loss": 0.029, "step": 211550 }, { "epoch": 1.37, "learning_rate": 9.518126722474295e-05, "loss": 0.0279, "step": 211560 }, { "epoch": 1.37, "learning_rate": 9.517158587038602e-05, "loss": 0.0261, "step": 211570 }, { "epoch": 1.37, "learning_rate": 9.516190451602909e-05, "loss": 0.0238, "step": 211580 }, { "epoch": 1.37, "learning_rate": 9.515222316167217e-05, "loss": 0.0356, "step": 211590 }, { "epoch": 1.37, "learning_rate": 9.514254180731523e-05, "loss": 0.0315, "step": 211600 }, { "epoch": 1.37, "learning_rate": 9.513286045295828e-05, "loss": 0.0274, "step": 211610 }, { "epoch": 1.37, "learning_rate": 9.512317909860136e-05, "loss": 0.0335, "step": 211620 }, { "epoch": 1.37, "learning_rate": 9.511349774424443e-05, "loss": 0.026, "step": 211630 }, { "epoch": 1.37, "learning_rate": 9.510381638988748e-05, "loss": 0.0333, "step": 211640 }, { "epoch": 1.37, "learning_rate": 9.509413503553056e-05, "loss": 0.032, "step": 211650 }, { "epoch": 1.37, "learning_rate": 9.508445368117363e-05, "loss": 0.0321, "step": 211660 }, { "epoch": 1.37, "learning_rate": 9.507477232681671e-05, "loss": 0.0289, "step": 211670 }, { "epoch": 1.37, "learning_rate": 9.506509097245976e-05, "loss": 0.0323, "step": 211680 }, { "epoch": 1.37, "learning_rate": 9.505540961810284e-05, "loss": 0.0254, "step": 211690 }, { "epoch": 1.37, "learning_rate": 9.504572826374591e-05, "loss": 0.026, "step": 211700 }, { "epoch": 1.37, "learning_rate": 9.503604690938896e-05, "loss": 0.0301, "step": 211710 }, { "epoch": 1.37, "learning_rate": 9.502636555503204e-05, "loss": 0.0263, "step": 211720 }, { "epoch": 1.37, "learning_rate": 9.50166842006751e-05, "loss": 0.0274, "step": 211730 }, { "epoch": 1.37, "learning_rate": 9.500700284631819e-05, "loss": 0.0265, "step": 211740 }, { "epoch": 1.37, "learning_rate": 9.499732149196124e-05, "loss": 0.0303, "step": 211750 }, { "epoch": 1.37, "learning_rate": 9.49876401376043e-05, "loss": 0.0291, "step": 211760 }, { "epoch": 1.37, "learning_rate": 9.497795878324738e-05, "loss": 0.028, "step": 211770 }, { "epoch": 1.37, "learning_rate": 9.496827742889044e-05, "loss": 0.0261, "step": 211780 }, { "epoch": 1.37, "learning_rate": 9.495859607453352e-05, "loss": 0.0254, "step": 211790 }, { "epoch": 1.37, "learning_rate": 9.494891472017658e-05, "loss": 0.0271, "step": 211800 }, { "epoch": 1.37, "learning_rate": 9.493923336581964e-05, "loss": 0.0257, "step": 211810 }, { "epoch": 1.37, "learning_rate": 9.492955201146272e-05, "loss": 0.0275, "step": 211820 }, { "epoch": 1.37, "learning_rate": 9.491987065710578e-05, "loss": 0.0356, "step": 211830 }, { "epoch": 1.37, "learning_rate": 9.491018930274886e-05, "loss": 0.0316, "step": 211840 }, { "epoch": 1.37, "learning_rate": 9.490050794839191e-05, "loss": 0.0253, "step": 211850 }, { "epoch": 1.37, "learning_rate": 9.489082659403498e-05, "loss": 0.0281, "step": 211860 }, { "epoch": 1.37, "learning_rate": 9.488114523967806e-05, "loss": 0.0296, "step": 211870 }, { "epoch": 1.37, "learning_rate": 9.487146388532111e-05, "loss": 0.0262, "step": 211880 }, { "epoch": 1.37, "learning_rate": 9.486178253096419e-05, "loss": 0.0335, "step": 211890 }, { "epoch": 1.37, "learning_rate": 9.485210117660726e-05, "loss": 0.0386, "step": 211900 }, { "epoch": 1.37, "learning_rate": 9.484241982225033e-05, "loss": 0.0279, "step": 211910 }, { "epoch": 1.37, "learning_rate": 9.483273846789339e-05, "loss": 0.0287, "step": 211920 }, { "epoch": 1.37, "learning_rate": 9.482305711353646e-05, "loss": 0.0318, "step": 211930 }, { "epoch": 1.37, "learning_rate": 9.481337575917954e-05, "loss": 0.0283, "step": 211940 }, { "epoch": 1.37, "learning_rate": 9.480369440482259e-05, "loss": 0.0253, "step": 211950 }, { "epoch": 1.37, "learning_rate": 9.479401305046566e-05, "loss": 0.0319, "step": 211960 }, { "epoch": 1.37, "learning_rate": 9.478433169610874e-05, "loss": 0.0348, "step": 211970 }, { "epoch": 1.37, "learning_rate": 9.47746503417518e-05, "loss": 0.0284, "step": 211980 }, { "epoch": 1.37, "learning_rate": 9.476496898739487e-05, "loss": 0.0302, "step": 211990 }, { "epoch": 1.37, "learning_rate": 9.475528763303794e-05, "loss": 0.033, "step": 212000 }, { "epoch": 1.37, "eval_cer": 0.9199132301434866, "eval_loss": 0.02124147117137909, "eval_runtime": 120.2274, "eval_samples_per_second": 16.635, "eval_steps_per_second": 4.159, "step": 212000 }, { "epoch": 1.37, "learning_rate": 9.4745606278681e-05, "loss": 0.0337, "step": 212010 }, { "epoch": 1.37, "learning_rate": 9.473592492432407e-05, "loss": 0.0298, "step": 212020 }, { "epoch": 1.37, "learning_rate": 9.472624356996713e-05, "loss": 0.0331, "step": 212030 }, { "epoch": 1.37, "learning_rate": 9.471656221561021e-05, "loss": 0.0277, "step": 212040 }, { "epoch": 1.37, "learning_rate": 9.470688086125328e-05, "loss": 0.0339, "step": 212050 }, { "epoch": 1.37, "learning_rate": 9.469719950689633e-05, "loss": 0.0311, "step": 212060 }, { "epoch": 1.37, "learning_rate": 9.468751815253941e-05, "loss": 0.0252, "step": 212070 }, { "epoch": 1.37, "learning_rate": 9.467783679818248e-05, "loss": 0.0308, "step": 212080 }, { "epoch": 1.37, "learning_rate": 9.466815544382555e-05, "loss": 0.0276, "step": 212090 }, { "epoch": 1.37, "learning_rate": 9.465847408946861e-05, "loss": 0.0352, "step": 212100 }, { "epoch": 1.37, "learning_rate": 9.464879273511168e-05, "loss": 0.0293, "step": 212110 }, { "epoch": 1.37, "learning_rate": 9.463911138075476e-05, "loss": 0.0283, "step": 212120 }, { "epoch": 1.37, "learning_rate": 9.462943002639781e-05, "loss": 0.0284, "step": 212130 }, { "epoch": 1.37, "learning_rate": 9.461974867204089e-05, "loss": 0.0315, "step": 212140 }, { "epoch": 1.37, "learning_rate": 9.461006731768396e-05, "loss": 0.032, "step": 212150 }, { "epoch": 1.37, "learning_rate": 9.460038596332701e-05, "loss": 0.0269, "step": 212160 }, { "epoch": 1.37, "learning_rate": 9.459070460897009e-05, "loss": 0.0308, "step": 212170 }, { "epoch": 1.37, "learning_rate": 9.458102325461315e-05, "loss": 0.0266, "step": 212180 }, { "epoch": 1.37, "learning_rate": 9.457134190025623e-05, "loss": 0.0292, "step": 212190 }, { "epoch": 1.37, "learning_rate": 9.456166054589929e-05, "loss": 0.0278, "step": 212200 }, { "epoch": 1.37, "learning_rate": 9.455197919154235e-05, "loss": 0.0321, "step": 212210 }, { "epoch": 1.37, "learning_rate": 9.454229783718543e-05, "loss": 0.0336, "step": 212220 }, { "epoch": 1.37, "learning_rate": 9.453261648282849e-05, "loss": 0.0227, "step": 212230 }, { "epoch": 1.37, "learning_rate": 9.452293512847157e-05, "loss": 0.0256, "step": 212240 }, { "epoch": 1.37, "learning_rate": 9.451325377411463e-05, "loss": 0.0277, "step": 212250 }, { "epoch": 1.37, "learning_rate": 9.450357241975771e-05, "loss": 0.0296, "step": 212260 }, { "epoch": 1.37, "learning_rate": 9.449389106540076e-05, "loss": 0.026, "step": 212270 }, { "epoch": 1.37, "learning_rate": 9.448420971104383e-05, "loss": 0.0245, "step": 212280 }, { "epoch": 1.37, "learning_rate": 9.447452835668691e-05, "loss": 0.032, "step": 212290 }, { "epoch": 1.37, "learning_rate": 9.446484700232996e-05, "loss": 0.0286, "step": 212300 }, { "epoch": 1.37, "learning_rate": 9.445516564797303e-05, "loss": 0.0285, "step": 212310 }, { "epoch": 1.37, "learning_rate": 9.444548429361611e-05, "loss": 0.0286, "step": 212320 }, { "epoch": 1.37, "learning_rate": 9.443580293925918e-05, "loss": 0.0297, "step": 212330 }, { "epoch": 1.37, "learning_rate": 9.442612158490224e-05, "loss": 0.0333, "step": 212340 }, { "epoch": 1.37, "learning_rate": 9.441644023054531e-05, "loss": 0.0281, "step": 212350 }, { "epoch": 1.37, "learning_rate": 9.440675887618839e-05, "loss": 0.0299, "step": 212360 }, { "epoch": 1.37, "learning_rate": 9.439707752183144e-05, "loss": 0.0292, "step": 212370 }, { "epoch": 1.37, "learning_rate": 9.43873961674745e-05, "loss": 0.0278, "step": 212380 }, { "epoch": 1.37, "learning_rate": 9.437771481311759e-05, "loss": 0.0326, "step": 212390 }, { "epoch": 1.37, "learning_rate": 9.436803345876065e-05, "loss": 0.0276, "step": 212400 }, { "epoch": 1.37, "learning_rate": 9.43583521044037e-05, "loss": 0.0266, "step": 212410 }, { "epoch": 1.37, "learning_rate": 9.434867075004679e-05, "loss": 0.0271, "step": 212420 }, { "epoch": 1.37, "learning_rate": 9.433898939568985e-05, "loss": 0.0297, "step": 212430 }, { "epoch": 1.37, "learning_rate": 9.432930804133292e-05, "loss": 0.0261, "step": 212440 }, { "epoch": 1.37, "learning_rate": 9.431962668697598e-05, "loss": 0.0258, "step": 212450 }, { "epoch": 1.37, "learning_rate": 9.430994533261906e-05, "loss": 0.0304, "step": 212460 }, { "epoch": 1.37, "learning_rate": 9.430026397826213e-05, "loss": 0.0316, "step": 212470 }, { "epoch": 1.37, "learning_rate": 9.429058262390518e-05, "loss": 0.0241, "step": 212480 }, { "epoch": 1.37, "learning_rate": 9.428090126954826e-05, "loss": 0.027, "step": 212490 }, { "epoch": 1.37, "learning_rate": 9.427121991519133e-05, "loss": 0.0318, "step": 212500 }, { "epoch": 1.37, "learning_rate": 9.426153856083438e-05, "loss": 0.0272, "step": 212510 }, { "epoch": 1.37, "learning_rate": 9.425185720647746e-05, "loss": 0.0335, "step": 212520 }, { "epoch": 1.37, "learning_rate": 9.424217585212053e-05, "loss": 0.0275, "step": 212530 }, { "epoch": 1.37, "learning_rate": 9.423249449776361e-05, "loss": 0.0384, "step": 212540 }, { "epoch": 1.37, "learning_rate": 9.422281314340666e-05, "loss": 0.0268, "step": 212550 }, { "epoch": 1.37, "learning_rate": 9.421313178904974e-05, "loss": 0.0363, "step": 212560 }, { "epoch": 1.37, "learning_rate": 9.42034504346928e-05, "loss": 0.028, "step": 212570 }, { "epoch": 1.37, "learning_rate": 9.419376908033586e-05, "loss": 0.0293, "step": 212580 }, { "epoch": 1.37, "learning_rate": 9.418408772597894e-05, "loss": 0.0246, "step": 212590 }, { "epoch": 1.37, "learning_rate": 9.4174406371622e-05, "loss": 0.0316, "step": 212600 }, { "epoch": 1.37, "learning_rate": 9.416472501726508e-05, "loss": 0.0304, "step": 212610 }, { "epoch": 1.37, "learning_rate": 9.415504366290814e-05, "loss": 0.0318, "step": 212620 }, { "epoch": 1.37, "learning_rate": 9.41453623085512e-05, "loss": 0.0276, "step": 212630 }, { "epoch": 1.37, "learning_rate": 9.413568095419428e-05, "loss": 0.0295, "step": 212640 }, { "epoch": 1.37, "learning_rate": 9.412599959983734e-05, "loss": 0.029, "step": 212650 }, { "epoch": 1.37, "learning_rate": 9.411631824548042e-05, "loss": 0.024, "step": 212660 }, { "epoch": 1.37, "learning_rate": 9.410663689112348e-05, "loss": 0.0267, "step": 212670 }, { "epoch": 1.37, "learning_rate": 9.409695553676656e-05, "loss": 0.026, "step": 212680 }, { "epoch": 1.37, "learning_rate": 9.408727418240961e-05, "loss": 0.0278, "step": 212690 }, { "epoch": 1.37, "learning_rate": 9.407759282805268e-05, "loss": 0.0276, "step": 212700 }, { "epoch": 1.37, "learning_rate": 9.406791147369576e-05, "loss": 0.034, "step": 212710 }, { "epoch": 1.37, "learning_rate": 9.405823011933881e-05, "loss": 0.0282, "step": 212720 }, { "epoch": 1.37, "learning_rate": 9.404854876498188e-05, "loss": 0.0243, "step": 212730 }, { "epoch": 1.37, "learning_rate": 9.403886741062496e-05, "loss": 0.0282, "step": 212740 }, { "epoch": 1.37, "learning_rate": 9.402918605626803e-05, "loss": 0.0279, "step": 212750 }, { "epoch": 1.37, "learning_rate": 9.401950470191109e-05, "loss": 0.0332, "step": 212760 }, { "epoch": 1.37, "learning_rate": 9.400982334755416e-05, "loss": 0.0265, "step": 212770 }, { "epoch": 1.37, "learning_rate": 9.400014199319724e-05, "loss": 0.0267, "step": 212780 }, { "epoch": 1.37, "learning_rate": 9.399046063884029e-05, "loss": 0.0246, "step": 212790 }, { "epoch": 1.37, "learning_rate": 9.398077928448336e-05, "loss": 0.0364, "step": 212800 }, { "epoch": 1.37, "learning_rate": 9.397109793012644e-05, "loss": 0.0283, "step": 212810 }, { "epoch": 1.37, "learning_rate": 9.39614165757695e-05, "loss": 0.0267, "step": 212820 }, { "epoch": 1.37, "learning_rate": 9.395173522141256e-05, "loss": 0.0272, "step": 212830 }, { "epoch": 1.37, "learning_rate": 9.394205386705563e-05, "loss": 0.0332, "step": 212840 }, { "epoch": 1.37, "learning_rate": 9.39323725126987e-05, "loss": 0.0297, "step": 212850 }, { "epoch": 1.37, "learning_rate": 9.392269115834177e-05, "loss": 0.0298, "step": 212860 }, { "epoch": 1.37, "learning_rate": 9.391300980398483e-05, "loss": 0.0282, "step": 212870 }, { "epoch": 1.37, "learning_rate": 9.390332844962791e-05, "loss": 0.0291, "step": 212880 }, { "epoch": 1.37, "learning_rate": 9.389364709527098e-05, "loss": 0.0338, "step": 212890 }, { "epoch": 1.37, "learning_rate": 9.388396574091403e-05, "loss": 0.0303, "step": 212900 }, { "epoch": 1.37, "learning_rate": 9.387428438655711e-05, "loss": 0.0301, "step": 212910 }, { "epoch": 1.37, "learning_rate": 9.386460303220018e-05, "loss": 0.0275, "step": 212920 }, { "epoch": 1.37, "learning_rate": 9.385492167784323e-05, "loss": 0.0287, "step": 212930 }, { "epoch": 1.37, "learning_rate": 9.384524032348631e-05, "loss": 0.0274, "step": 212940 }, { "epoch": 1.37, "learning_rate": 9.383555896912938e-05, "loss": 0.0265, "step": 212950 }, { "epoch": 1.37, "learning_rate": 9.382587761477246e-05, "loss": 0.0297, "step": 212960 }, { "epoch": 1.37, "learning_rate": 9.381619626041551e-05, "loss": 0.0245, "step": 212970 }, { "epoch": 1.37, "learning_rate": 9.380651490605859e-05, "loss": 0.0262, "step": 212980 }, { "epoch": 1.37, "learning_rate": 9.379683355170166e-05, "loss": 0.0315, "step": 212990 }, { "epoch": 1.37, "learning_rate": 9.378715219734471e-05, "loss": 0.0348, "step": 213000 }, { "epoch": 1.37, "eval_cer": 0.9199240763755507, "eval_loss": 0.021109996363520622, "eval_runtime": 120.0643, "eval_samples_per_second": 16.658, "eval_steps_per_second": 4.164, "step": 213000 }, { "epoch": 1.37, "learning_rate": 9.377747084298779e-05, "loss": 0.0329, "step": 213010 }, { "epoch": 1.37, "learning_rate": 9.376778948863085e-05, "loss": 0.028, "step": 213020 }, { "epoch": 1.37, "learning_rate": 9.375810813427393e-05, "loss": 0.0259, "step": 213030 }, { "epoch": 1.38, "learning_rate": 9.374842677991699e-05, "loss": 0.0295, "step": 213040 }, { "epoch": 1.38, "learning_rate": 9.373874542556005e-05, "loss": 0.0225, "step": 213050 }, { "epoch": 1.38, "learning_rate": 9.372906407120313e-05, "loss": 0.0313, "step": 213060 }, { "epoch": 1.38, "learning_rate": 9.371938271684619e-05, "loss": 0.0326, "step": 213070 }, { "epoch": 1.38, "learning_rate": 9.370970136248927e-05, "loss": 0.0246, "step": 213080 }, { "epoch": 1.38, "learning_rate": 9.370002000813233e-05, "loss": 0.0299, "step": 213090 }, { "epoch": 1.38, "learning_rate": 9.36903386537754e-05, "loss": 0.0282, "step": 213100 }, { "epoch": 1.38, "learning_rate": 9.368065729941846e-05, "loss": 0.0282, "step": 213110 }, { "epoch": 1.38, "learning_rate": 9.367097594506153e-05, "loss": 0.0279, "step": 213120 }, { "epoch": 1.38, "learning_rate": 9.366129459070461e-05, "loss": 0.0359, "step": 213130 }, { "epoch": 1.38, "learning_rate": 9.365161323634766e-05, "loss": 0.0349, "step": 213140 }, { "epoch": 1.38, "learning_rate": 9.364193188199073e-05, "loss": 0.0306, "step": 213150 }, { "epoch": 1.38, "learning_rate": 9.363225052763381e-05, "loss": 0.0315, "step": 213160 }, { "epoch": 1.38, "learning_rate": 9.362256917327688e-05, "loss": 0.0384, "step": 213170 }, { "epoch": 1.38, "learning_rate": 9.361288781891994e-05, "loss": 0.0275, "step": 213180 }, { "epoch": 1.38, "learning_rate": 9.360320646456301e-05, "loss": 0.0255, "step": 213190 }, { "epoch": 1.38, "learning_rate": 9.359352511020607e-05, "loss": 0.0335, "step": 213200 }, { "epoch": 1.38, "learning_rate": 9.358384375584914e-05, "loss": 0.0287, "step": 213210 }, { "epoch": 1.38, "learning_rate": 9.35741624014922e-05, "loss": 0.026, "step": 213220 }, { "epoch": 1.38, "learning_rate": 9.356448104713529e-05, "loss": 0.0272, "step": 213230 }, { "epoch": 1.38, "learning_rate": 9.355479969277835e-05, "loss": 0.0314, "step": 213240 }, { "epoch": 1.38, "learning_rate": 9.35451183384214e-05, "loss": 0.0376, "step": 213250 }, { "epoch": 1.38, "learning_rate": 9.353543698406448e-05, "loss": 0.0278, "step": 213260 }, { "epoch": 1.38, "learning_rate": 9.352575562970755e-05, "loss": 0.0261, "step": 213270 }, { "epoch": 1.38, "learning_rate": 9.351607427535062e-05, "loss": 0.025, "step": 213280 }, { "epoch": 1.38, "learning_rate": 9.350639292099368e-05, "loss": 0.0288, "step": 213290 }, { "epoch": 1.38, "learning_rate": 9.349671156663675e-05, "loss": 0.0359, "step": 213300 }, { "epoch": 1.38, "learning_rate": 9.348703021227983e-05, "loss": 0.0353, "step": 213310 }, { "epoch": 1.38, "learning_rate": 9.347734885792288e-05, "loss": 0.0315, "step": 213320 }, { "epoch": 1.38, "learning_rate": 9.346766750356596e-05, "loss": 0.0285, "step": 213330 }, { "epoch": 1.38, "learning_rate": 9.345798614920903e-05, "loss": 0.0306, "step": 213340 }, { "epoch": 1.38, "learning_rate": 9.344830479485208e-05, "loss": 0.0281, "step": 213350 }, { "epoch": 1.38, "learning_rate": 9.343862344049516e-05, "loss": 0.0307, "step": 213360 }, { "epoch": 1.38, "learning_rate": 9.342894208613823e-05, "loss": 0.0298, "step": 213370 }, { "epoch": 1.38, "learning_rate": 9.34192607317813e-05, "loss": 0.0276, "step": 213380 }, { "epoch": 1.38, "learning_rate": 9.340957937742436e-05, "loss": 0.031, "step": 213390 }, { "epoch": 1.38, "learning_rate": 9.339989802306743e-05, "loss": 0.0268, "step": 213400 }, { "epoch": 1.38, "learning_rate": 9.33902166687105e-05, "loss": 0.028, "step": 213410 }, { "epoch": 1.38, "learning_rate": 9.338053531435356e-05, "loss": 0.036, "step": 213420 }, { "epoch": 1.38, "learning_rate": 9.337085395999664e-05, "loss": 0.0267, "step": 213430 }, { "epoch": 1.38, "learning_rate": 9.33611726056397e-05, "loss": 0.0287, "step": 213440 }, { "epoch": 1.38, "learning_rate": 9.335149125128278e-05, "loss": 0.0336, "step": 213450 }, { "epoch": 1.38, "learning_rate": 9.334180989692584e-05, "loss": 0.0263, "step": 213460 }, { "epoch": 1.38, "learning_rate": 9.33321285425689e-05, "loss": 0.0345, "step": 213470 }, { "epoch": 1.38, "learning_rate": 9.332244718821198e-05, "loss": 0.0292, "step": 213480 }, { "epoch": 1.38, "learning_rate": 9.331276583385504e-05, "loss": 0.0264, "step": 213490 }, { "epoch": 1.38, "learning_rate": 9.33030844794981e-05, "loss": 0.0244, "step": 213500 }, { "epoch": 1.38, "learning_rate": 9.329340312514118e-05, "loss": 0.0274, "step": 213510 }, { "epoch": 1.38, "learning_rate": 9.328372177078425e-05, "loss": 0.0302, "step": 213520 }, { "epoch": 1.38, "learning_rate": 9.327404041642731e-05, "loss": 0.0326, "step": 213530 }, { "epoch": 1.38, "learning_rate": 9.326435906207038e-05, "loss": 0.0269, "step": 213540 }, { "epoch": 1.38, "learning_rate": 9.325467770771346e-05, "loss": 0.038, "step": 213550 }, { "epoch": 1.38, "learning_rate": 9.324499635335651e-05, "loss": 0.0319, "step": 213560 }, { "epoch": 1.38, "learning_rate": 9.323531499899958e-05, "loss": 0.0303, "step": 213570 }, { "epoch": 1.38, "learning_rate": 9.322563364464266e-05, "loss": 0.024, "step": 213580 }, { "epoch": 1.38, "learning_rate": 9.321595229028572e-05, "loss": 0.0336, "step": 213590 }, { "epoch": 1.38, "learning_rate": 9.320627093592878e-05, "loss": 0.0285, "step": 213600 }, { "epoch": 1.38, "learning_rate": 9.319658958157186e-05, "loss": 0.0308, "step": 213610 }, { "epoch": 1.38, "learning_rate": 9.318690822721492e-05, "loss": 0.0359, "step": 213620 }, { "epoch": 1.38, "learning_rate": 9.317722687285799e-05, "loss": 0.0289, "step": 213630 }, { "epoch": 1.38, "learning_rate": 9.316754551850106e-05, "loss": 0.0336, "step": 213640 }, { "epoch": 1.38, "learning_rate": 9.315786416414414e-05, "loss": 0.0254, "step": 213650 }, { "epoch": 1.38, "learning_rate": 9.31481828097872e-05, "loss": 0.0282, "step": 213660 }, { "epoch": 1.38, "learning_rate": 9.313850145543025e-05, "loss": 0.0316, "step": 213670 }, { "epoch": 1.38, "learning_rate": 9.312882010107333e-05, "loss": 0.026, "step": 213680 }, { "epoch": 1.38, "learning_rate": 9.31191387467164e-05, "loss": 0.0307, "step": 213690 }, { "epoch": 1.38, "learning_rate": 9.310945739235945e-05, "loss": 0.0284, "step": 213700 }, { "epoch": 1.38, "learning_rate": 9.309977603800253e-05, "loss": 0.0278, "step": 213710 }, { "epoch": 1.38, "learning_rate": 9.30900946836456e-05, "loss": 0.0266, "step": 213720 }, { "epoch": 1.38, "learning_rate": 9.308041332928868e-05, "loss": 0.0297, "step": 213730 }, { "epoch": 1.38, "learning_rate": 9.307073197493173e-05, "loss": 0.031, "step": 213740 }, { "epoch": 1.38, "learning_rate": 9.306105062057481e-05, "loss": 0.0261, "step": 213750 }, { "epoch": 1.38, "learning_rate": 9.305136926621788e-05, "loss": 0.0325, "step": 213760 }, { "epoch": 1.38, "learning_rate": 9.304168791186093e-05, "loss": 0.0278, "step": 213770 }, { "epoch": 1.38, "learning_rate": 9.303200655750401e-05, "loss": 0.0268, "step": 213780 }, { "epoch": 1.38, "learning_rate": 9.302232520314708e-05, "loss": 0.0282, "step": 213790 }, { "epoch": 1.38, "learning_rate": 9.301264384879016e-05, "loss": 0.0368, "step": 213800 }, { "epoch": 1.38, "learning_rate": 9.300296249443321e-05, "loss": 0.0294, "step": 213810 }, { "epoch": 1.38, "learning_rate": 9.299328114007628e-05, "loss": 0.0346, "step": 213820 }, { "epoch": 1.38, "learning_rate": 9.298359978571936e-05, "loss": 0.0267, "step": 213830 }, { "epoch": 1.38, "learning_rate": 9.297391843136241e-05, "loss": 0.0317, "step": 213840 }, { "epoch": 1.38, "learning_rate": 9.296423707700549e-05, "loss": 0.0267, "step": 213850 }, { "epoch": 1.38, "learning_rate": 9.295455572264855e-05, "loss": 0.03, "step": 213860 }, { "epoch": 1.38, "learning_rate": 9.294487436829163e-05, "loss": 0.0319, "step": 213870 }, { "epoch": 1.38, "learning_rate": 9.293519301393469e-05, "loss": 0.0273, "step": 213880 }, { "epoch": 1.38, "learning_rate": 9.292551165957775e-05, "loss": 0.0357, "step": 213890 }, { "epoch": 1.38, "learning_rate": 9.291583030522083e-05, "loss": 0.0261, "step": 213900 }, { "epoch": 1.38, "learning_rate": 9.290614895086389e-05, "loss": 0.0295, "step": 213910 }, { "epoch": 1.38, "learning_rate": 9.289646759650695e-05, "loss": 0.0285, "step": 213920 }, { "epoch": 1.38, "learning_rate": 9.288678624215003e-05, "loss": 0.0287, "step": 213930 }, { "epoch": 1.38, "learning_rate": 9.28771048877931e-05, "loss": 0.0306, "step": 213940 }, { "epoch": 1.38, "learning_rate": 9.286742353343616e-05, "loss": 0.0302, "step": 213950 }, { "epoch": 1.38, "learning_rate": 9.285774217907923e-05, "loss": 0.0328, "step": 213960 }, { "epoch": 1.38, "learning_rate": 9.284806082472231e-05, "loss": 0.0276, "step": 213970 }, { "epoch": 1.38, "learning_rate": 9.283837947036536e-05, "loss": 0.0287, "step": 213980 }, { "epoch": 1.38, "learning_rate": 9.282869811600843e-05, "loss": 0.0361, "step": 213990 }, { "epoch": 1.38, "learning_rate": 9.281901676165151e-05, "loss": 0.0291, "step": 214000 }, { "epoch": 1.38, "eval_cer": 0.919937634165631, "eval_loss": 0.02141990140080452, "eval_runtime": 120.0948, "eval_samples_per_second": 16.654, "eval_steps_per_second": 4.163, "step": 214000 }, { "epoch": 1.38, "learning_rate": 9.280933540729457e-05, "loss": 0.0352, "step": 214010 }, { "epoch": 1.38, "learning_rate": 9.279965405293763e-05, "loss": 0.0293, "step": 214020 }, { "epoch": 1.38, "learning_rate": 9.278997269858071e-05, "loss": 0.0261, "step": 214030 }, { "epoch": 1.38, "learning_rate": 9.278029134422377e-05, "loss": 0.0275, "step": 214040 }, { "epoch": 1.38, "learning_rate": 9.277060998986684e-05, "loss": 0.0337, "step": 214050 }, { "epoch": 1.38, "learning_rate": 9.27609286355099e-05, "loss": 0.0306, "step": 214060 }, { "epoch": 1.38, "learning_rate": 9.275124728115299e-05, "loss": 0.0319, "step": 214070 }, { "epoch": 1.38, "learning_rate": 9.274156592679605e-05, "loss": 0.0284, "step": 214080 }, { "epoch": 1.38, "learning_rate": 9.27318845724391e-05, "loss": 0.0292, "step": 214090 }, { "epoch": 1.38, "learning_rate": 9.272220321808218e-05, "loss": 0.0311, "step": 214100 }, { "epoch": 1.38, "learning_rate": 9.271252186372525e-05, "loss": 0.029, "step": 214110 }, { "epoch": 1.38, "learning_rate": 9.27028405093683e-05, "loss": 0.0304, "step": 214120 }, { "epoch": 1.38, "learning_rate": 9.269315915501138e-05, "loss": 0.0256, "step": 214130 }, { "epoch": 1.38, "learning_rate": 9.268347780065445e-05, "loss": 0.0317, "step": 214140 }, { "epoch": 1.38, "learning_rate": 9.267379644629753e-05, "loss": 0.0291, "step": 214150 }, { "epoch": 1.38, "learning_rate": 9.266411509194058e-05, "loss": 0.0299, "step": 214160 }, { "epoch": 1.38, "learning_rate": 9.265443373758366e-05, "loss": 0.0297, "step": 214170 }, { "epoch": 1.38, "learning_rate": 9.264475238322673e-05, "loss": 0.0237, "step": 214180 }, { "epoch": 1.38, "learning_rate": 9.263507102886978e-05, "loss": 0.0249, "step": 214190 }, { "epoch": 1.38, "learning_rate": 9.262538967451286e-05, "loss": 0.0269, "step": 214200 }, { "epoch": 1.38, "learning_rate": 9.261570832015593e-05, "loss": 0.0285, "step": 214210 }, { "epoch": 1.38, "learning_rate": 9.2606026965799e-05, "loss": 0.0308, "step": 214220 }, { "epoch": 1.38, "learning_rate": 9.259634561144206e-05, "loss": 0.0335, "step": 214230 }, { "epoch": 1.38, "learning_rate": 9.258666425708513e-05, "loss": 0.0259, "step": 214240 }, { "epoch": 1.38, "learning_rate": 9.25769829027282e-05, "loss": 0.0318, "step": 214250 }, { "epoch": 1.38, "learning_rate": 9.256730154837126e-05, "loss": 0.0321, "step": 214260 }, { "epoch": 1.38, "learning_rate": 9.255762019401434e-05, "loss": 0.0296, "step": 214270 }, { "epoch": 1.38, "learning_rate": 9.25479388396574e-05, "loss": 0.0309, "step": 214280 }, { "epoch": 1.38, "learning_rate": 9.253825748530047e-05, "loss": 0.0309, "step": 214290 }, { "epoch": 1.38, "learning_rate": 9.252857613094354e-05, "loss": 0.0319, "step": 214300 }, { "epoch": 1.38, "learning_rate": 9.25188947765866e-05, "loss": 0.0276, "step": 214310 }, { "epoch": 1.38, "learning_rate": 9.250921342222968e-05, "loss": 0.0312, "step": 214320 }, { "epoch": 1.38, "learning_rate": 9.249953206787273e-05, "loss": 0.0301, "step": 214330 }, { "epoch": 1.38, "learning_rate": 9.24898507135158e-05, "loss": 0.0269, "step": 214340 }, { "epoch": 1.38, "learning_rate": 9.248016935915888e-05, "loss": 0.0278, "step": 214350 }, { "epoch": 1.38, "learning_rate": 9.247048800480195e-05, "loss": 0.0284, "step": 214360 }, { "epoch": 1.38, "learning_rate": 9.246080665044501e-05, "loss": 0.0297, "step": 214370 }, { "epoch": 1.38, "learning_rate": 9.245112529608808e-05, "loss": 0.0295, "step": 214380 }, { "epoch": 1.38, "learning_rate": 9.244144394173115e-05, "loss": 0.0262, "step": 214390 }, { "epoch": 1.38, "learning_rate": 9.243176258737421e-05, "loss": 0.0271, "step": 214400 }, { "epoch": 1.38, "learning_rate": 9.242208123301728e-05, "loss": 0.0308, "step": 214410 }, { "epoch": 1.38, "learning_rate": 9.241239987866036e-05, "loss": 0.0249, "step": 214420 }, { "epoch": 1.38, "learning_rate": 9.240271852430342e-05, "loss": 0.0306, "step": 214430 }, { "epoch": 1.38, "learning_rate": 9.239303716994648e-05, "loss": 0.0347, "step": 214440 }, { "epoch": 1.38, "learning_rate": 9.238335581558956e-05, "loss": 0.0278, "step": 214450 }, { "epoch": 1.38, "learning_rate": 9.237367446123262e-05, "loss": 0.0264, "step": 214460 }, { "epoch": 1.38, "learning_rate": 9.236399310687569e-05, "loss": 0.0255, "step": 214470 }, { "epoch": 1.38, "learning_rate": 9.235431175251876e-05, "loss": 0.0283, "step": 214480 }, { "epoch": 1.38, "learning_rate": 9.234463039816182e-05, "loss": 0.0282, "step": 214490 }, { "epoch": 1.38, "learning_rate": 9.23349490438049e-05, "loss": 0.0241, "step": 214500 }, { "epoch": 1.38, "learning_rate": 9.232526768944795e-05, "loss": 0.0268, "step": 214510 }, { "epoch": 1.38, "learning_rate": 9.231558633509103e-05, "loss": 0.0273, "step": 214520 }, { "epoch": 1.38, "learning_rate": 9.23059049807341e-05, "loss": 0.0254, "step": 214530 }, { "epoch": 1.38, "learning_rate": 9.229622362637715e-05, "loss": 0.027, "step": 214540 }, { "epoch": 1.38, "learning_rate": 9.228654227202023e-05, "loss": 0.0307, "step": 214550 }, { "epoch": 1.38, "learning_rate": 9.22768609176633e-05, "loss": 0.0361, "step": 214560 }, { "epoch": 1.38, "learning_rate": 9.226717956330638e-05, "loss": 0.0271, "step": 214570 }, { "epoch": 1.38, "learning_rate": 9.225749820894943e-05, "loss": 0.0304, "step": 214580 }, { "epoch": 1.39, "learning_rate": 9.22478168545925e-05, "loss": 0.0304, "step": 214590 }, { "epoch": 1.39, "learning_rate": 9.223813550023558e-05, "loss": 0.0262, "step": 214600 }, { "epoch": 1.39, "learning_rate": 9.222845414587863e-05, "loss": 0.0285, "step": 214610 }, { "epoch": 1.39, "learning_rate": 9.221877279152171e-05, "loss": 0.0285, "step": 214620 }, { "epoch": 1.39, "learning_rate": 9.220909143716478e-05, "loss": 0.0265, "step": 214630 }, { "epoch": 1.39, "learning_rate": 9.219941008280786e-05, "loss": 0.025, "step": 214640 }, { "epoch": 1.39, "learning_rate": 9.218972872845091e-05, "loss": 0.0256, "step": 214650 }, { "epoch": 1.39, "learning_rate": 9.218004737409398e-05, "loss": 0.0306, "step": 214660 }, { "epoch": 1.39, "learning_rate": 9.217036601973705e-05, "loss": 0.0346, "step": 214670 }, { "epoch": 1.39, "learning_rate": 9.216068466538011e-05, "loss": 0.0296, "step": 214680 }, { "epoch": 1.39, "learning_rate": 9.215100331102317e-05, "loss": 0.0324, "step": 214690 }, { "epoch": 1.39, "learning_rate": 9.214132195666625e-05, "loss": 0.0323, "step": 214700 }, { "epoch": 1.39, "learning_rate": 9.213164060230932e-05, "loss": 0.0281, "step": 214710 }, { "epoch": 1.39, "learning_rate": 9.212195924795239e-05, "loss": 0.0312, "step": 214720 }, { "epoch": 1.39, "learning_rate": 9.211227789359545e-05, "loss": 0.0276, "step": 214730 }, { "epoch": 1.39, "learning_rate": 9.210259653923853e-05, "loss": 0.0334, "step": 214740 }, { "epoch": 1.39, "learning_rate": 9.209291518488158e-05, "loss": 0.0267, "step": 214750 }, { "epoch": 1.39, "learning_rate": 9.208323383052465e-05, "loss": 0.0332, "step": 214760 }, { "epoch": 1.39, "learning_rate": 9.207355247616773e-05, "loss": 0.0301, "step": 214770 }, { "epoch": 1.39, "learning_rate": 9.20638711218108e-05, "loss": 0.029, "step": 214780 }, { "epoch": 1.39, "learning_rate": 9.205418976745385e-05, "loss": 0.03, "step": 214790 }, { "epoch": 1.39, "learning_rate": 9.204450841309693e-05, "loss": 0.0297, "step": 214800 }, { "epoch": 1.39, "learning_rate": 9.203482705874e-05, "loss": 0.0268, "step": 214810 }, { "epoch": 1.39, "learning_rate": 9.202514570438306e-05, "loss": 0.0272, "step": 214820 }, { "epoch": 1.39, "learning_rate": 9.201546435002613e-05, "loss": 0.0258, "step": 214830 }, { "epoch": 1.39, "learning_rate": 9.200578299566921e-05, "loss": 0.0299, "step": 214840 }, { "epoch": 1.39, "learning_rate": 9.199610164131227e-05, "loss": 0.0308, "step": 214850 }, { "epoch": 1.39, "learning_rate": 9.198642028695533e-05, "loss": 0.0316, "step": 214860 }, { "epoch": 1.39, "learning_rate": 9.19767389325984e-05, "loss": 0.0206, "step": 214870 }, { "epoch": 1.39, "learning_rate": 9.196705757824147e-05, "loss": 0.028, "step": 214880 }, { "epoch": 1.39, "learning_rate": 9.195737622388453e-05, "loss": 0.0256, "step": 214890 }, { "epoch": 1.39, "learning_rate": 9.19476948695276e-05, "loss": 0.0287, "step": 214900 }, { "epoch": 1.39, "learning_rate": 9.193801351517067e-05, "loss": 0.0258, "step": 214910 }, { "epoch": 1.39, "learning_rate": 9.192833216081375e-05, "loss": 0.0326, "step": 214920 }, { "epoch": 1.39, "learning_rate": 9.19186508064568e-05, "loss": 0.0279, "step": 214930 }, { "epoch": 1.39, "learning_rate": 9.190896945209988e-05, "loss": 0.0304, "step": 214940 }, { "epoch": 1.39, "learning_rate": 9.189928809774295e-05, "loss": 0.0262, "step": 214950 }, { "epoch": 1.39, "learning_rate": 9.1889606743386e-05, "loss": 0.0304, "step": 214960 }, { "epoch": 1.39, "learning_rate": 9.187992538902908e-05, "loss": 0.0274, "step": 214970 }, { "epoch": 1.39, "learning_rate": 9.187024403467215e-05, "loss": 0.0275, "step": 214980 }, { "epoch": 1.39, "learning_rate": 9.186056268031523e-05, "loss": 0.0253, "step": 214990 }, { "epoch": 1.39, "learning_rate": 9.185088132595828e-05, "loss": 0.0353, "step": 215000 }, { "epoch": 1.39, "eval_cer": 0.9198843068579822, "eval_loss": 0.021198125556111336, "eval_runtime": 120.2091, "eval_samples_per_second": 16.638, "eval_steps_per_second": 4.159, "step": 215000 }, { "epoch": 1.39, "learning_rate": 9.184119997160135e-05, "loss": 0.0293, "step": 215010 }, { "epoch": 1.39, "learning_rate": 9.183151861724443e-05, "loss": 0.0336, "step": 215020 }, { "epoch": 1.39, "learning_rate": 9.182183726288748e-05, "loss": 0.0365, "step": 215030 }, { "epoch": 1.39, "learning_rate": 9.181215590853056e-05, "loss": 0.0335, "step": 215040 }, { "epoch": 1.39, "learning_rate": 9.180247455417363e-05, "loss": 0.0239, "step": 215050 }, { "epoch": 1.39, "learning_rate": 9.17927931998167e-05, "loss": 0.0283, "step": 215060 }, { "epoch": 1.39, "learning_rate": 9.178311184545976e-05, "loss": 0.0254, "step": 215070 }, { "epoch": 1.39, "learning_rate": 9.177343049110282e-05, "loss": 0.0271, "step": 215080 }, { "epoch": 1.39, "learning_rate": 9.17637491367459e-05, "loss": 0.0338, "step": 215090 }, { "epoch": 1.39, "learning_rate": 9.175406778238896e-05, "loss": 0.026, "step": 215100 }, { "epoch": 1.39, "learning_rate": 9.174438642803202e-05, "loss": 0.0311, "step": 215110 }, { "epoch": 1.39, "learning_rate": 9.17347050736751e-05, "loss": 0.0319, "step": 215120 }, { "epoch": 1.39, "learning_rate": 9.172502371931817e-05, "loss": 0.0232, "step": 215130 }, { "epoch": 1.39, "learning_rate": 9.171534236496124e-05, "loss": 0.037, "step": 215140 }, { "epoch": 1.39, "learning_rate": 9.17056610106043e-05, "loss": 0.0367, "step": 215150 }, { "epoch": 1.39, "learning_rate": 9.169597965624738e-05, "loss": 0.0299, "step": 215160 }, { "epoch": 1.39, "learning_rate": 9.168629830189043e-05, "loss": 0.027, "step": 215170 }, { "epoch": 1.39, "learning_rate": 9.16766169475335e-05, "loss": 0.0277, "step": 215180 }, { "epoch": 1.39, "learning_rate": 9.166693559317658e-05, "loss": 0.033, "step": 215190 }, { "epoch": 1.39, "learning_rate": 9.165725423881963e-05, "loss": 0.0306, "step": 215200 }, { "epoch": 1.39, "learning_rate": 9.16475728844627e-05, "loss": 0.0293, "step": 215210 }, { "epoch": 1.39, "learning_rate": 9.163789153010578e-05, "loss": 0.0362, "step": 215220 }, { "epoch": 1.39, "learning_rate": 9.162821017574885e-05, "loss": 0.0249, "step": 215230 }, { "epoch": 1.39, "learning_rate": 9.161852882139191e-05, "loss": 0.028, "step": 215240 }, { "epoch": 1.39, "learning_rate": 9.160884746703498e-05, "loss": 0.0201, "step": 215250 }, { "epoch": 1.39, "learning_rate": 9.159916611267806e-05, "loss": 0.0261, "step": 215260 }, { "epoch": 1.39, "learning_rate": 9.158948475832111e-05, "loss": 0.0316, "step": 215270 }, { "epoch": 1.39, "learning_rate": 9.157980340396418e-05, "loss": 0.0267, "step": 215280 }, { "epoch": 1.39, "learning_rate": 9.157012204960726e-05, "loss": 0.0281, "step": 215290 }, { "epoch": 1.39, "learning_rate": 9.156044069525032e-05, "loss": 0.0336, "step": 215300 }, { "epoch": 1.39, "learning_rate": 9.155075934089338e-05, "loss": 0.0287, "step": 215310 }, { "epoch": 1.39, "learning_rate": 9.154107798653646e-05, "loss": 0.0279, "step": 215320 }, { "epoch": 1.39, "learning_rate": 9.153139663217952e-05, "loss": 0.0335, "step": 215330 }, { "epoch": 1.39, "learning_rate": 9.152171527782259e-05, "loss": 0.0235, "step": 215340 }, { "epoch": 1.39, "learning_rate": 9.151203392346565e-05, "loss": 0.025, "step": 215350 }, { "epoch": 1.39, "learning_rate": 9.150235256910873e-05, "loss": 0.0275, "step": 215360 }, { "epoch": 1.39, "learning_rate": 9.14926712147518e-05, "loss": 0.0278, "step": 215370 }, { "epoch": 1.39, "learning_rate": 9.148298986039485e-05, "loss": 0.028, "step": 215380 }, { "epoch": 1.39, "learning_rate": 9.147330850603793e-05, "loss": 0.0298, "step": 215390 }, { "epoch": 1.39, "learning_rate": 9.1463627151681e-05, "loss": 0.027, "step": 215400 }, { "epoch": 1.39, "learning_rate": 9.145394579732405e-05, "loss": 0.0316, "step": 215410 }, { "epoch": 1.39, "learning_rate": 9.144426444296713e-05, "loss": 0.0331, "step": 215420 }, { "epoch": 1.39, "learning_rate": 9.14345830886102e-05, "loss": 0.0319, "step": 215430 }, { "epoch": 1.39, "learning_rate": 9.142490173425328e-05, "loss": 0.027, "step": 215440 }, { "epoch": 1.39, "learning_rate": 9.141522037989633e-05, "loss": 0.0264, "step": 215450 }, { "epoch": 1.39, "learning_rate": 9.140553902553941e-05, "loss": 0.0318, "step": 215460 }, { "epoch": 1.39, "learning_rate": 9.139585767118248e-05, "loss": 0.0296, "step": 215470 }, { "epoch": 1.39, "learning_rate": 9.138617631682553e-05, "loss": 0.0263, "step": 215480 }, { "epoch": 1.39, "learning_rate": 9.137649496246861e-05, "loss": 0.0271, "step": 215490 }, { "epoch": 1.39, "learning_rate": 9.136681360811167e-05, "loss": 0.0301, "step": 215500 }, { "epoch": 1.39, "learning_rate": 9.135713225375475e-05, "loss": 0.0358, "step": 215510 }, { "epoch": 1.39, "learning_rate": 9.134745089939781e-05, "loss": 0.0277, "step": 215520 }, { "epoch": 1.39, "learning_rate": 9.133776954504087e-05, "loss": 0.025, "step": 215530 }, { "epoch": 1.39, "learning_rate": 9.132808819068395e-05, "loss": 0.0259, "step": 215540 }, { "epoch": 1.39, "learning_rate": 9.1318406836327e-05, "loss": 0.028, "step": 215550 }, { "epoch": 1.39, "learning_rate": 9.130872548197009e-05, "loss": 0.0293, "step": 215560 }, { "epoch": 1.39, "learning_rate": 9.129904412761315e-05, "loss": 0.0243, "step": 215570 }, { "epoch": 1.39, "learning_rate": 9.128936277325623e-05, "loss": 0.0251, "step": 215580 }, { "epoch": 1.39, "learning_rate": 9.127968141889928e-05, "loss": 0.0269, "step": 215590 }, { "epoch": 1.39, "learning_rate": 9.127000006454235e-05, "loss": 0.0325, "step": 215600 }, { "epoch": 1.39, "learning_rate": 9.126031871018543e-05, "loss": 0.026, "step": 215610 }, { "epoch": 1.39, "learning_rate": 9.125063735582848e-05, "loss": 0.0258, "step": 215620 }, { "epoch": 1.39, "learning_rate": 9.124095600147155e-05, "loss": 0.0299, "step": 215630 }, { "epoch": 1.39, "learning_rate": 9.123127464711463e-05, "loss": 0.0284, "step": 215640 }, { "epoch": 1.39, "learning_rate": 9.12215932927577e-05, "loss": 0.0305, "step": 215650 }, { "epoch": 1.39, "learning_rate": 9.121191193840076e-05, "loss": 0.0292, "step": 215660 }, { "epoch": 1.39, "learning_rate": 9.120223058404383e-05, "loss": 0.0234, "step": 215670 }, { "epoch": 1.39, "learning_rate": 9.119254922968691e-05, "loss": 0.0338, "step": 215680 }, { "epoch": 1.39, "learning_rate": 9.118286787532996e-05, "loss": 0.034, "step": 215690 }, { "epoch": 1.39, "learning_rate": 9.117318652097303e-05, "loss": 0.0286, "step": 215700 }, { "epoch": 1.39, "learning_rate": 9.11635051666161e-05, "loss": 0.0272, "step": 215710 }, { "epoch": 1.39, "learning_rate": 9.115382381225917e-05, "loss": 0.0257, "step": 215720 }, { "epoch": 1.39, "learning_rate": 9.114414245790223e-05, "loss": 0.0296, "step": 215730 }, { "epoch": 1.39, "learning_rate": 9.11344611035453e-05, "loss": 0.0324, "step": 215740 }, { "epoch": 1.39, "learning_rate": 9.112477974918837e-05, "loss": 0.0326, "step": 215750 }, { "epoch": 1.39, "learning_rate": 9.111509839483144e-05, "loss": 0.0302, "step": 215760 }, { "epoch": 1.39, "learning_rate": 9.11054170404745e-05, "loss": 0.026, "step": 215770 }, { "epoch": 1.39, "learning_rate": 9.109573568611758e-05, "loss": 0.033, "step": 215780 }, { "epoch": 1.39, "learning_rate": 9.108605433176065e-05, "loss": 0.0281, "step": 215790 }, { "epoch": 1.39, "learning_rate": 9.10763729774037e-05, "loss": 0.0243, "step": 215800 }, { "epoch": 1.39, "learning_rate": 9.106669162304678e-05, "loss": 0.0266, "step": 215810 }, { "epoch": 1.39, "learning_rate": 9.105701026868985e-05, "loss": 0.0286, "step": 215820 }, { "epoch": 1.39, "learning_rate": 9.10473289143329e-05, "loss": 0.0302, "step": 215830 }, { "epoch": 1.39, "learning_rate": 9.103764755997598e-05, "loss": 0.0277, "step": 215840 }, { "epoch": 1.39, "learning_rate": 9.102796620561905e-05, "loss": 0.026, "step": 215850 }, { "epoch": 1.39, "learning_rate": 9.101828485126213e-05, "loss": 0.0261, "step": 215860 }, { "epoch": 1.39, "learning_rate": 9.100860349690518e-05, "loss": 0.029, "step": 215870 }, { "epoch": 1.39, "learning_rate": 9.099892214254826e-05, "loss": 0.028, "step": 215880 }, { "epoch": 1.39, "learning_rate": 9.098924078819133e-05, "loss": 0.0271, "step": 215890 }, { "epoch": 1.39, "learning_rate": 9.097955943383438e-05, "loss": 0.032, "step": 215900 }, { "epoch": 1.39, "learning_rate": 9.096987807947746e-05, "loss": 0.0312, "step": 215910 }, { "epoch": 1.39, "learning_rate": 9.096019672512052e-05, "loss": 0.0259, "step": 215920 }, { "epoch": 1.39, "learning_rate": 9.09505153707636e-05, "loss": 0.0275, "step": 215930 }, { "epoch": 1.39, "learning_rate": 9.094083401640666e-05, "loss": 0.0248, "step": 215940 }, { "epoch": 1.39, "learning_rate": 9.093115266204972e-05, "loss": 0.029, "step": 215950 }, { "epoch": 1.39, "learning_rate": 9.09214713076928e-05, "loss": 0.0321, "step": 215960 }, { "epoch": 1.39, "learning_rate": 9.091178995333586e-05, "loss": 0.0305, "step": 215970 }, { "epoch": 1.39, "learning_rate": 9.090210859897894e-05, "loss": 0.0296, "step": 215980 }, { "epoch": 1.39, "learning_rate": 9.0892427244622e-05, "loss": 0.0301, "step": 215990 }, { "epoch": 1.39, "learning_rate": 9.088274589026507e-05, "loss": 0.0324, "step": 216000 }, { "epoch": 1.39, "eval_cer": 0.9199457688396792, "eval_loss": 0.020877143368124962, "eval_runtime": 120.2616, "eval_samples_per_second": 16.63, "eval_steps_per_second": 4.158, "step": 216000 }, { "epoch": 1.39, "learning_rate": 9.087306453590813e-05, "loss": 0.031, "step": 216010 }, { "epoch": 1.39, "learning_rate": 9.08633831815512e-05, "loss": 0.0263, "step": 216020 }, { "epoch": 1.39, "learning_rate": 9.085370182719428e-05, "loss": 0.0279, "step": 216030 }, { "epoch": 1.39, "learning_rate": 9.084402047283733e-05, "loss": 0.03, "step": 216040 }, { "epoch": 1.39, "learning_rate": 9.08343391184804e-05, "loss": 0.0259, "step": 216050 }, { "epoch": 1.39, "learning_rate": 9.082465776412348e-05, "loss": 0.0288, "step": 216060 }, { "epoch": 1.39, "learning_rate": 9.081497640976655e-05, "loss": 0.0304, "step": 216070 }, { "epoch": 1.39, "learning_rate": 9.080529505540961e-05, "loss": 0.0328, "step": 216080 }, { "epoch": 1.39, "learning_rate": 9.079561370105268e-05, "loss": 0.0269, "step": 216090 }, { "epoch": 1.39, "learning_rate": 9.078593234669574e-05, "loss": 0.0287, "step": 216100 }, { "epoch": 1.39, "learning_rate": 9.077625099233881e-05, "loss": 0.0318, "step": 216110 }, { "epoch": 1.39, "learning_rate": 9.076656963798188e-05, "loss": 0.0272, "step": 216120 }, { "epoch": 1.39, "learning_rate": 9.075688828362496e-05, "loss": 0.0272, "step": 216130 }, { "epoch": 1.4, "learning_rate": 9.074720692926802e-05, "loss": 0.0261, "step": 216140 }, { "epoch": 1.4, "learning_rate": 9.073752557491108e-05, "loss": 0.0278, "step": 216150 }, { "epoch": 1.4, "learning_rate": 9.072784422055415e-05, "loss": 0.0278, "step": 216160 }, { "epoch": 1.4, "learning_rate": 9.071816286619722e-05, "loss": 0.0286, "step": 216170 }, { "epoch": 1.4, "learning_rate": 9.070848151184029e-05, "loss": 0.0318, "step": 216180 }, { "epoch": 1.4, "learning_rate": 9.069880015748335e-05, "loss": 0.0308, "step": 216190 }, { "epoch": 1.4, "learning_rate": 9.068911880312642e-05, "loss": 0.0266, "step": 216200 }, { "epoch": 1.4, "learning_rate": 9.06794374487695e-05, "loss": 0.0285, "step": 216210 }, { "epoch": 1.4, "learning_rate": 9.066975609441255e-05, "loss": 0.0289, "step": 216220 }, { "epoch": 1.4, "learning_rate": 9.066007474005563e-05, "loss": 0.0309, "step": 216230 }, { "epoch": 1.4, "learning_rate": 9.06503933856987e-05, "loss": 0.0294, "step": 216240 }, { "epoch": 1.4, "learning_rate": 9.064071203134175e-05, "loss": 0.0259, "step": 216250 }, { "epoch": 1.4, "learning_rate": 9.063103067698483e-05, "loss": 0.0257, "step": 216260 }, { "epoch": 1.4, "learning_rate": 9.06213493226279e-05, "loss": 0.0367, "step": 216270 }, { "epoch": 1.4, "learning_rate": 9.061166796827098e-05, "loss": 0.0253, "step": 216280 }, { "epoch": 1.4, "learning_rate": 9.060198661391403e-05, "loss": 0.0266, "step": 216290 }, { "epoch": 1.4, "learning_rate": 9.05923052595571e-05, "loss": 0.0301, "step": 216300 }, { "epoch": 1.4, "learning_rate": 9.058262390520018e-05, "loss": 0.0238, "step": 216310 }, { "epoch": 1.4, "learning_rate": 9.057294255084323e-05, "loss": 0.0302, "step": 216320 }, { "epoch": 1.4, "learning_rate": 9.056326119648631e-05, "loss": 0.0305, "step": 216330 }, { "epoch": 1.4, "learning_rate": 9.055357984212937e-05, "loss": 0.0276, "step": 216340 }, { "epoch": 1.4, "learning_rate": 9.054389848777245e-05, "loss": 0.0332, "step": 216350 }, { "epoch": 1.4, "learning_rate": 9.053421713341551e-05, "loss": 0.0248, "step": 216360 }, { "epoch": 1.4, "learning_rate": 9.052453577905857e-05, "loss": 0.0307, "step": 216370 }, { "epoch": 1.4, "learning_rate": 9.051485442470165e-05, "loss": 0.0299, "step": 216380 }, { "epoch": 1.4, "learning_rate": 9.05051730703447e-05, "loss": 0.0345, "step": 216390 }, { "epoch": 1.4, "learning_rate": 9.049549171598777e-05, "loss": 0.0335, "step": 216400 }, { "epoch": 1.4, "learning_rate": 9.048581036163085e-05, "loss": 0.033, "step": 216410 }, { "epoch": 1.4, "learning_rate": 9.047612900727392e-05, "loss": 0.0302, "step": 216420 }, { "epoch": 1.4, "learning_rate": 9.046644765291698e-05, "loss": 0.0268, "step": 216430 }, { "epoch": 1.4, "learning_rate": 9.045676629856005e-05, "loss": 0.03, "step": 216440 }, { "epoch": 1.4, "learning_rate": 9.044708494420313e-05, "loss": 0.0234, "step": 216450 }, { "epoch": 1.4, "learning_rate": 9.043740358984618e-05, "loss": 0.0323, "step": 216460 }, { "epoch": 1.4, "learning_rate": 9.042772223548925e-05, "loss": 0.0254, "step": 216470 }, { "epoch": 1.4, "learning_rate": 9.041804088113233e-05, "loss": 0.0318, "step": 216480 }, { "epoch": 1.4, "learning_rate": 9.04083595267754e-05, "loss": 0.0264, "step": 216490 }, { "epoch": 1.4, "learning_rate": 9.039867817241845e-05, "loss": 0.0293, "step": 216500 }, { "epoch": 1.4, "learning_rate": 9.038899681806153e-05, "loss": 0.0267, "step": 216510 }, { "epoch": 1.4, "learning_rate": 9.03793154637046e-05, "loss": 0.0293, "step": 216520 }, { "epoch": 1.4, "learning_rate": 9.036963410934766e-05, "loss": 0.0281, "step": 216530 }, { "epoch": 1.4, "learning_rate": 9.035995275499073e-05, "loss": 0.0295, "step": 216540 }, { "epoch": 1.4, "learning_rate": 9.03502714006338e-05, "loss": 0.0275, "step": 216550 }, { "epoch": 1.4, "learning_rate": 9.034059004627687e-05, "loss": 0.0277, "step": 216560 }, { "epoch": 1.4, "learning_rate": 9.033090869191992e-05, "loss": 0.0339, "step": 216570 }, { "epoch": 1.4, "learning_rate": 9.0321227337563e-05, "loss": 0.0271, "step": 216580 }, { "epoch": 1.4, "learning_rate": 9.031154598320607e-05, "loss": 0.0289, "step": 216590 }, { "epoch": 1.4, "learning_rate": 9.030186462884912e-05, "loss": 0.0303, "step": 216600 }, { "epoch": 1.4, "learning_rate": 9.02921832744922e-05, "loss": 0.0257, "step": 216610 }, { "epoch": 1.4, "learning_rate": 9.028250192013527e-05, "loss": 0.0263, "step": 216620 }, { "epoch": 1.4, "learning_rate": 9.027282056577835e-05, "loss": 0.0313, "step": 216630 }, { "epoch": 1.4, "learning_rate": 9.02631392114214e-05, "loss": 0.0285, "step": 216640 }, { "epoch": 1.4, "learning_rate": 9.025345785706448e-05, "loss": 0.0376, "step": 216650 }, { "epoch": 1.4, "learning_rate": 9.024377650270755e-05, "loss": 0.0282, "step": 216660 }, { "epoch": 1.4, "learning_rate": 9.02340951483506e-05, "loss": 0.0352, "step": 216670 }, { "epoch": 1.4, "learning_rate": 9.022441379399368e-05, "loss": 0.0281, "step": 216680 }, { "epoch": 1.4, "learning_rate": 9.021473243963675e-05, "loss": 0.0276, "step": 216690 }, { "epoch": 1.4, "learning_rate": 9.020505108527983e-05, "loss": 0.0295, "step": 216700 }, { "epoch": 1.4, "learning_rate": 9.019536973092288e-05, "loss": 0.03, "step": 216710 }, { "epoch": 1.4, "learning_rate": 9.018568837656595e-05, "loss": 0.0317, "step": 216720 }, { "epoch": 1.4, "learning_rate": 9.017600702220903e-05, "loss": 0.0227, "step": 216730 }, { "epoch": 1.4, "learning_rate": 9.016632566785208e-05, "loss": 0.0332, "step": 216740 }, { "epoch": 1.4, "learning_rate": 9.015664431349516e-05, "loss": 0.0276, "step": 216750 }, { "epoch": 1.4, "learning_rate": 9.014696295913822e-05, "loss": 0.0309, "step": 216760 }, { "epoch": 1.4, "learning_rate": 9.01372816047813e-05, "loss": 0.0262, "step": 216770 }, { "epoch": 1.4, "learning_rate": 9.012760025042436e-05, "loss": 0.0338, "step": 216780 }, { "epoch": 1.4, "learning_rate": 9.011791889606742e-05, "loss": 0.0234, "step": 216790 }, { "epoch": 1.4, "learning_rate": 9.01082375417105e-05, "loss": 0.0263, "step": 216800 }, { "epoch": 1.4, "learning_rate": 9.009855618735356e-05, "loss": 0.0284, "step": 216810 }, { "epoch": 1.4, "learning_rate": 9.008887483299662e-05, "loss": 0.0285, "step": 216820 }, { "epoch": 1.4, "learning_rate": 9.00791934786397e-05, "loss": 0.0299, "step": 216830 }, { "epoch": 1.4, "learning_rate": 9.006951212428277e-05, "loss": 0.0287, "step": 216840 }, { "epoch": 1.4, "learning_rate": 9.005983076992583e-05, "loss": 0.0258, "step": 216850 }, { "epoch": 1.4, "learning_rate": 9.00501494155689e-05, "loss": 0.0371, "step": 216860 }, { "epoch": 1.4, "learning_rate": 9.004046806121198e-05, "loss": 0.0293, "step": 216870 }, { "epoch": 1.4, "learning_rate": 9.003078670685503e-05, "loss": 0.0258, "step": 216880 }, { "epoch": 1.4, "learning_rate": 9.00211053524981e-05, "loss": 0.0239, "step": 216890 }, { "epoch": 1.4, "learning_rate": 9.001142399814118e-05, "loss": 0.0303, "step": 216900 }, { "epoch": 1.4, "learning_rate": 9.000174264378424e-05, "loss": 0.0259, "step": 216910 }, { "epoch": 1.4, "learning_rate": 8.99920612894273e-05, "loss": 0.0233, "step": 216920 }, { "epoch": 1.4, "learning_rate": 8.998237993507038e-05, "loss": 0.0266, "step": 216930 }, { "epoch": 1.4, "learning_rate": 8.997269858071344e-05, "loss": 0.0258, "step": 216940 }, { "epoch": 1.4, "learning_rate": 8.996301722635651e-05, "loss": 0.0301, "step": 216950 }, { "epoch": 1.4, "learning_rate": 8.995333587199958e-05, "loss": 0.0306, "step": 216960 }, { "epoch": 1.4, "learning_rate": 8.994365451764266e-05, "loss": 0.0301, "step": 216970 }, { "epoch": 1.4, "learning_rate": 8.993397316328572e-05, "loss": 0.0357, "step": 216980 }, { "epoch": 1.4, "learning_rate": 8.992429180892877e-05, "loss": 0.0262, "step": 216990 }, { "epoch": 1.4, "learning_rate": 8.991461045457185e-05, "loss": 0.0342, "step": 217000 }, { "epoch": 1.4, "eval_cer": 0.9198969607953904, "eval_loss": 0.020930752158164978, "eval_runtime": 120.4671, "eval_samples_per_second": 16.602, "eval_steps_per_second": 4.151, "step": 217000 }, { "epoch": 1.4, "learning_rate": 8.990492910021492e-05, "loss": 0.025, "step": 217010 }, { "epoch": 1.4, "learning_rate": 8.989524774585797e-05, "loss": 0.0321, "step": 217020 }, { "epoch": 1.4, "learning_rate": 8.988556639150105e-05, "loss": 0.0283, "step": 217030 }, { "epoch": 1.4, "learning_rate": 8.987588503714412e-05, "loss": 0.0282, "step": 217040 }, { "epoch": 1.4, "learning_rate": 8.98662036827872e-05, "loss": 0.0263, "step": 217050 }, { "epoch": 1.4, "learning_rate": 8.985652232843025e-05, "loss": 0.0265, "step": 217060 }, { "epoch": 1.4, "learning_rate": 8.984684097407333e-05, "loss": 0.0281, "step": 217070 }, { "epoch": 1.4, "learning_rate": 8.98371596197164e-05, "loss": 0.0311, "step": 217080 }, { "epoch": 1.4, "learning_rate": 8.982747826535945e-05, "loss": 0.0271, "step": 217090 }, { "epoch": 1.4, "learning_rate": 8.981779691100253e-05, "loss": 0.027, "step": 217100 }, { "epoch": 1.4, "learning_rate": 8.98081155566456e-05, "loss": 0.0322, "step": 217110 }, { "epoch": 1.4, "learning_rate": 8.979843420228868e-05, "loss": 0.0309, "step": 217120 }, { "epoch": 1.4, "learning_rate": 8.978875284793173e-05, "loss": 0.0281, "step": 217130 }, { "epoch": 1.4, "learning_rate": 8.97790714935748e-05, "loss": 0.0271, "step": 217140 }, { "epoch": 1.4, "learning_rate": 8.976939013921788e-05, "loss": 0.0261, "step": 217150 }, { "epoch": 1.4, "learning_rate": 8.975970878486093e-05, "loss": 0.0285, "step": 217160 }, { "epoch": 1.4, "learning_rate": 8.975002743050401e-05, "loss": 0.031, "step": 217170 }, { "epoch": 1.4, "learning_rate": 8.974034607614707e-05, "loss": 0.0345, "step": 217180 }, { "epoch": 1.4, "learning_rate": 8.973066472179014e-05, "loss": 0.0312, "step": 217190 }, { "epoch": 1.4, "learning_rate": 8.97209833674332e-05, "loss": 0.028, "step": 217200 }, { "epoch": 1.4, "learning_rate": 8.971130201307627e-05, "loss": 0.0291, "step": 217210 }, { "epoch": 1.4, "learning_rate": 8.970162065871935e-05, "loss": 0.0251, "step": 217220 }, { "epoch": 1.4, "learning_rate": 8.96919393043624e-05, "loss": 0.0332, "step": 217230 }, { "epoch": 1.4, "learning_rate": 8.968225795000547e-05, "loss": 0.0289, "step": 217240 }, { "epoch": 1.4, "learning_rate": 8.967257659564855e-05, "loss": 0.0239, "step": 217250 }, { "epoch": 1.4, "learning_rate": 8.966289524129162e-05, "loss": 0.0285, "step": 217260 }, { "epoch": 1.4, "learning_rate": 8.965321388693468e-05, "loss": 0.0338, "step": 217270 }, { "epoch": 1.4, "learning_rate": 8.964353253257775e-05, "loss": 0.0359, "step": 217280 }, { "epoch": 1.4, "learning_rate": 8.963385117822082e-05, "loss": 0.0325, "step": 217290 }, { "epoch": 1.4, "learning_rate": 8.962416982386388e-05, "loss": 0.0333, "step": 217300 }, { "epoch": 1.4, "learning_rate": 8.961448846950695e-05, "loss": 0.0273, "step": 217310 }, { "epoch": 1.4, "learning_rate": 8.960480711515003e-05, "loss": 0.03, "step": 217320 }, { "epoch": 1.4, "learning_rate": 8.95951257607931e-05, "loss": 0.0313, "step": 217330 }, { "epoch": 1.4, "learning_rate": 8.958544440643615e-05, "loss": 0.0247, "step": 217340 }, { "epoch": 1.4, "learning_rate": 8.957576305207923e-05, "loss": 0.0281, "step": 217350 }, { "epoch": 1.4, "learning_rate": 8.95660816977223e-05, "loss": 0.0277, "step": 217360 }, { "epoch": 1.4, "learning_rate": 8.955640034336536e-05, "loss": 0.0271, "step": 217370 }, { "epoch": 1.4, "learning_rate": 8.954671898900843e-05, "loss": 0.0261, "step": 217380 }, { "epoch": 1.4, "learning_rate": 8.953703763465149e-05, "loss": 0.0286, "step": 217390 }, { "epoch": 1.4, "learning_rate": 8.952735628029457e-05, "loss": 0.0376, "step": 217400 }, { "epoch": 1.4, "learning_rate": 8.951767492593762e-05, "loss": 0.0303, "step": 217410 }, { "epoch": 1.4, "learning_rate": 8.95079935715807e-05, "loss": 0.0286, "step": 217420 }, { "epoch": 1.4, "learning_rate": 8.949831221722377e-05, "loss": 0.0289, "step": 217430 }, { "epoch": 1.4, "learning_rate": 8.948863086286682e-05, "loss": 0.0311, "step": 217440 }, { "epoch": 1.4, "learning_rate": 8.94789495085099e-05, "loss": 0.0264, "step": 217450 }, { "epoch": 1.4, "learning_rate": 8.946926815415297e-05, "loss": 0.027, "step": 217460 }, { "epoch": 1.4, "learning_rate": 8.945958679979605e-05, "loss": 0.0306, "step": 217470 }, { "epoch": 1.4, "learning_rate": 8.94499054454391e-05, "loss": 0.0307, "step": 217480 }, { "epoch": 1.4, "learning_rate": 8.944022409108217e-05, "loss": 0.0229, "step": 217490 }, { "epoch": 1.4, "learning_rate": 8.943054273672525e-05, "loss": 0.028, "step": 217500 }, { "epoch": 1.4, "learning_rate": 8.94208613823683e-05, "loss": 0.0284, "step": 217510 }, { "epoch": 1.4, "learning_rate": 8.941118002801138e-05, "loss": 0.0233, "step": 217520 }, { "epoch": 1.4, "learning_rate": 8.940149867365445e-05, "loss": 0.0267, "step": 217530 }, { "epoch": 1.4, "learning_rate": 8.939181731929753e-05, "loss": 0.0236, "step": 217540 }, { "epoch": 1.4, "learning_rate": 8.938213596494058e-05, "loss": 0.0306, "step": 217550 }, { "epoch": 1.4, "learning_rate": 8.937245461058365e-05, "loss": 0.0318, "step": 217560 }, { "epoch": 1.4, "learning_rate": 8.936277325622673e-05, "loss": 0.0244, "step": 217570 }, { "epoch": 1.4, "learning_rate": 8.935309190186978e-05, "loss": 0.0258, "step": 217580 }, { "epoch": 1.4, "learning_rate": 8.934341054751284e-05, "loss": 0.0249, "step": 217590 }, { "epoch": 1.4, "learning_rate": 8.933372919315592e-05, "loss": 0.0237, "step": 217600 }, { "epoch": 1.4, "learning_rate": 8.932404783879899e-05, "loss": 0.0251, "step": 217610 }, { "epoch": 1.4, "learning_rate": 8.931436648444206e-05, "loss": 0.0302, "step": 217620 }, { "epoch": 1.4, "learning_rate": 8.930468513008512e-05, "loss": 0.0259, "step": 217630 }, { "epoch": 1.4, "learning_rate": 8.92950037757282e-05, "loss": 0.0279, "step": 217640 }, { "epoch": 1.4, "learning_rate": 8.928532242137125e-05, "loss": 0.0291, "step": 217650 }, { "epoch": 1.4, "learning_rate": 8.927564106701432e-05, "loss": 0.029, "step": 217660 }, { "epoch": 1.4, "learning_rate": 8.92659597126574e-05, "loss": 0.0274, "step": 217670 }, { "epoch": 1.4, "learning_rate": 8.925627835830047e-05, "loss": 0.0367, "step": 217680 }, { "epoch": 1.41, "learning_rate": 8.924659700394352e-05, "loss": 0.029, "step": 217690 }, { "epoch": 1.41, "learning_rate": 8.92369156495866e-05, "loss": 0.0306, "step": 217700 }, { "epoch": 1.41, "learning_rate": 8.922723429522967e-05, "loss": 0.0361, "step": 217710 }, { "epoch": 1.41, "learning_rate": 8.921755294087273e-05, "loss": 0.0288, "step": 217720 }, { "epoch": 1.41, "learning_rate": 8.92078715865158e-05, "loss": 0.0333, "step": 217730 }, { "epoch": 1.41, "learning_rate": 8.919819023215888e-05, "loss": 0.0334, "step": 217740 }, { "epoch": 1.41, "learning_rate": 8.918850887780194e-05, "loss": 0.0276, "step": 217750 }, { "epoch": 1.41, "learning_rate": 8.9178827523445e-05, "loss": 0.0289, "step": 217760 }, { "epoch": 1.41, "learning_rate": 8.916914616908808e-05, "loss": 0.0244, "step": 217770 }, { "epoch": 1.41, "learning_rate": 8.915946481473114e-05, "loss": 0.0327, "step": 217780 }, { "epoch": 1.41, "learning_rate": 8.91497834603742e-05, "loss": 0.0319, "step": 217790 }, { "epoch": 1.41, "learning_rate": 8.914010210601728e-05, "loss": 0.0233, "step": 217800 }, { "epoch": 1.41, "learning_rate": 8.913042075166034e-05, "loss": 0.0261, "step": 217810 }, { "epoch": 1.41, "learning_rate": 8.912073939730342e-05, "loss": 0.031, "step": 217820 }, { "epoch": 1.41, "learning_rate": 8.911105804294647e-05, "loss": 0.0249, "step": 217830 }, { "epoch": 1.41, "learning_rate": 8.910137668858955e-05, "loss": 0.0309, "step": 217840 }, { "epoch": 1.41, "learning_rate": 8.909169533423262e-05, "loss": 0.0349, "step": 217850 }, { "epoch": 1.41, "learning_rate": 8.908201397987567e-05, "loss": 0.0269, "step": 217860 }, { "epoch": 1.41, "learning_rate": 8.907233262551875e-05, "loss": 0.033, "step": 217870 }, { "epoch": 1.41, "learning_rate": 8.906265127116182e-05, "loss": 0.027, "step": 217880 }, { "epoch": 1.41, "learning_rate": 8.90529699168049e-05, "loss": 0.0244, "step": 217890 }, { "epoch": 1.41, "learning_rate": 8.904328856244795e-05, "loss": 0.0264, "step": 217900 }, { "epoch": 1.41, "learning_rate": 8.903360720809102e-05, "loss": 0.0324, "step": 217910 }, { "epoch": 1.41, "learning_rate": 8.90239258537341e-05, "loss": 0.027, "step": 217920 }, { "epoch": 1.41, "learning_rate": 8.901424449937715e-05, "loss": 0.0232, "step": 217930 }, { "epoch": 1.41, "learning_rate": 8.900456314502023e-05, "loss": 0.031, "step": 217940 }, { "epoch": 1.41, "learning_rate": 8.89948817906633e-05, "loss": 0.0304, "step": 217950 }, { "epoch": 1.41, "learning_rate": 8.898520043630638e-05, "loss": 0.0341, "step": 217960 }, { "epoch": 1.41, "learning_rate": 8.897551908194943e-05, "loss": 0.0309, "step": 217970 }, { "epoch": 1.41, "learning_rate": 8.89658377275925e-05, "loss": 0.0257, "step": 217980 }, { "epoch": 1.41, "learning_rate": 8.895615637323557e-05, "loss": 0.03, "step": 217990 }, { "epoch": 1.41, "learning_rate": 8.894647501887863e-05, "loss": 0.0293, "step": 218000 }, { "epoch": 1.41, "eval_cer": 0.9199186532595187, "eval_loss": 0.02118774503469467, "eval_runtime": 120.0083, "eval_samples_per_second": 16.666, "eval_steps_per_second": 4.166, "step": 218000 }, { "epoch": 1.41, "learning_rate": 8.89367936645217e-05, "loss": 0.0284, "step": 218010 }, { "epoch": 1.41, "learning_rate": 8.892711231016477e-05, "loss": 0.0282, "step": 218020 }, { "epoch": 1.41, "learning_rate": 8.891743095580784e-05, "loss": 0.0264, "step": 218030 }, { "epoch": 1.41, "learning_rate": 8.89077496014509e-05, "loss": 0.0312, "step": 218040 }, { "epoch": 1.41, "learning_rate": 8.889806824709397e-05, "loss": 0.0278, "step": 218050 }, { "epoch": 1.41, "learning_rate": 8.888838689273705e-05, "loss": 0.0239, "step": 218060 }, { "epoch": 1.41, "learning_rate": 8.88787055383801e-05, "loss": 0.0258, "step": 218070 }, { "epoch": 1.41, "learning_rate": 8.886902418402317e-05, "loss": 0.0275, "step": 218080 }, { "epoch": 1.41, "learning_rate": 8.885934282966625e-05, "loss": 0.0327, "step": 218090 }, { "epoch": 1.41, "learning_rate": 8.884966147530932e-05, "loss": 0.0341, "step": 218100 }, { "epoch": 1.41, "learning_rate": 8.883998012095237e-05, "loss": 0.0226, "step": 218110 }, { "epoch": 1.41, "learning_rate": 8.883029876659545e-05, "loss": 0.0254, "step": 218120 }, { "epoch": 1.41, "learning_rate": 8.882061741223852e-05, "loss": 0.0259, "step": 218130 }, { "epoch": 1.41, "learning_rate": 8.881093605788158e-05, "loss": 0.0278, "step": 218140 }, { "epoch": 1.41, "learning_rate": 8.880125470352465e-05, "loss": 0.0291, "step": 218150 }, { "epoch": 1.41, "learning_rate": 8.879157334916773e-05, "loss": 0.0315, "step": 218160 }, { "epoch": 1.41, "learning_rate": 8.87818919948108e-05, "loss": 0.0262, "step": 218170 }, { "epoch": 1.41, "learning_rate": 8.877221064045385e-05, "loss": 0.0274, "step": 218180 }, { "epoch": 1.41, "learning_rate": 8.876252928609693e-05, "loss": 0.0235, "step": 218190 }, { "epoch": 1.41, "learning_rate": 8.875284793173999e-05, "loss": 0.0271, "step": 218200 }, { "epoch": 1.41, "learning_rate": 8.874316657738305e-05, "loss": 0.0254, "step": 218210 }, { "epoch": 1.41, "learning_rate": 8.873348522302613e-05, "loss": 0.0242, "step": 218220 }, { "epoch": 1.41, "learning_rate": 8.872380386866919e-05, "loss": 0.0346, "step": 218230 }, { "epoch": 1.41, "learning_rate": 8.871412251431227e-05, "loss": 0.028, "step": 218240 }, { "epoch": 1.41, "learning_rate": 8.870444115995532e-05, "loss": 0.0299, "step": 218250 }, { "epoch": 1.41, "learning_rate": 8.86947598055984e-05, "loss": 0.0308, "step": 218260 }, { "epoch": 1.41, "learning_rate": 8.868507845124147e-05, "loss": 0.0267, "step": 218270 }, { "epoch": 1.41, "learning_rate": 8.867539709688452e-05, "loss": 0.0339, "step": 218280 }, { "epoch": 1.41, "learning_rate": 8.86657157425276e-05, "loss": 0.0254, "step": 218290 }, { "epoch": 1.41, "learning_rate": 8.865603438817067e-05, "loss": 0.0298, "step": 218300 }, { "epoch": 1.41, "learning_rate": 8.864635303381375e-05, "loss": 0.0306, "step": 218310 }, { "epoch": 1.41, "learning_rate": 8.86366716794568e-05, "loss": 0.0278, "step": 218320 }, { "epoch": 1.41, "learning_rate": 8.862699032509987e-05, "loss": 0.0302, "step": 218330 }, { "epoch": 1.41, "learning_rate": 8.861730897074295e-05, "loss": 0.0282, "step": 218340 }, { "epoch": 1.41, "learning_rate": 8.8607627616386e-05, "loss": 0.0263, "step": 218350 }, { "epoch": 1.41, "learning_rate": 8.859794626202908e-05, "loss": 0.0336, "step": 218360 }, { "epoch": 1.41, "learning_rate": 8.858826490767215e-05, "loss": 0.0354, "step": 218370 }, { "epoch": 1.41, "learning_rate": 8.857858355331521e-05, "loss": 0.031, "step": 218380 }, { "epoch": 1.41, "learning_rate": 8.856890219895828e-05, "loss": 0.0304, "step": 218390 }, { "epoch": 1.41, "learning_rate": 8.855922084460134e-05, "loss": 0.0321, "step": 218400 }, { "epoch": 1.41, "learning_rate": 8.854953949024442e-05, "loss": 0.0271, "step": 218410 }, { "epoch": 1.41, "learning_rate": 8.853985813588748e-05, "loss": 0.032, "step": 218420 }, { "epoch": 1.41, "learning_rate": 8.853017678153054e-05, "loss": 0.0285, "step": 218430 }, { "epoch": 1.41, "learning_rate": 8.852049542717362e-05, "loss": 0.0292, "step": 218440 }, { "epoch": 1.41, "learning_rate": 8.851081407281669e-05, "loss": 0.0314, "step": 218450 }, { "epoch": 1.41, "learning_rate": 8.850113271845976e-05, "loss": 0.0363, "step": 218460 }, { "epoch": 1.41, "learning_rate": 8.849145136410282e-05, "loss": 0.036, "step": 218470 }, { "epoch": 1.41, "learning_rate": 8.848177000974589e-05, "loss": 0.0387, "step": 218480 }, { "epoch": 1.41, "learning_rate": 8.847208865538895e-05, "loss": 0.0275, "step": 218490 }, { "epoch": 1.41, "learning_rate": 8.846240730103202e-05, "loss": 0.0292, "step": 218500 }, { "epoch": 1.41, "learning_rate": 8.84527259466751e-05, "loss": 0.0303, "step": 218510 }, { "epoch": 1.41, "learning_rate": 8.844304459231817e-05, "loss": 0.0312, "step": 218520 }, { "epoch": 1.41, "learning_rate": 8.843336323796122e-05, "loss": 0.0296, "step": 218530 }, { "epoch": 1.41, "learning_rate": 8.84236818836043e-05, "loss": 0.0299, "step": 218540 }, { "epoch": 1.41, "learning_rate": 8.841400052924737e-05, "loss": 0.0275, "step": 218550 }, { "epoch": 1.41, "learning_rate": 8.840431917489043e-05, "loss": 0.0314, "step": 218560 }, { "epoch": 1.41, "learning_rate": 8.83946378205335e-05, "loss": 0.0256, "step": 218570 }, { "epoch": 1.41, "learning_rate": 8.838495646617656e-05, "loss": 0.0317, "step": 218580 }, { "epoch": 1.41, "learning_rate": 8.837527511181964e-05, "loss": 0.0315, "step": 218590 }, { "epoch": 1.41, "learning_rate": 8.83655937574627e-05, "loss": 0.0279, "step": 218600 }, { "epoch": 1.41, "learning_rate": 8.835591240310578e-05, "loss": 0.0278, "step": 218610 }, { "epoch": 1.41, "learning_rate": 8.834623104874884e-05, "loss": 0.023, "step": 218620 }, { "epoch": 1.41, "learning_rate": 8.83365496943919e-05, "loss": 0.0297, "step": 218630 }, { "epoch": 1.41, "learning_rate": 8.832686834003498e-05, "loss": 0.0247, "step": 218640 }, { "epoch": 1.41, "learning_rate": 8.831718698567804e-05, "loss": 0.0304, "step": 218650 }, { "epoch": 1.41, "learning_rate": 8.830750563132111e-05, "loss": 0.0257, "step": 218660 }, { "epoch": 1.41, "learning_rate": 8.829782427696417e-05, "loss": 0.0281, "step": 218670 }, { "epoch": 1.41, "learning_rate": 8.828814292260724e-05, "loss": 0.0276, "step": 218680 }, { "epoch": 1.41, "learning_rate": 8.827846156825032e-05, "loss": 0.0221, "step": 218690 }, { "epoch": 1.41, "learning_rate": 8.826878021389337e-05, "loss": 0.0332, "step": 218700 }, { "epoch": 1.41, "learning_rate": 8.825909885953645e-05, "loss": 0.0288, "step": 218710 }, { "epoch": 1.41, "learning_rate": 8.824941750517952e-05, "loss": 0.0291, "step": 218720 }, { "epoch": 1.41, "learning_rate": 8.823973615082257e-05, "loss": 0.0246, "step": 218730 }, { "epoch": 1.41, "learning_rate": 8.823005479646565e-05, "loss": 0.0267, "step": 218740 }, { "epoch": 1.41, "learning_rate": 8.822037344210872e-05, "loss": 0.0271, "step": 218750 }, { "epoch": 1.41, "learning_rate": 8.82106920877518e-05, "loss": 0.0287, "step": 218760 }, { "epoch": 1.41, "learning_rate": 8.820101073339485e-05, "loss": 0.0342, "step": 218770 }, { "epoch": 1.41, "learning_rate": 8.819132937903792e-05, "loss": 0.0306, "step": 218780 }, { "epoch": 1.41, "learning_rate": 8.8181648024681e-05, "loss": 0.0314, "step": 218790 }, { "epoch": 1.41, "learning_rate": 8.817196667032405e-05, "loss": 0.0359, "step": 218800 }, { "epoch": 1.41, "learning_rate": 8.816228531596713e-05, "loss": 0.0238, "step": 218810 }, { "epoch": 1.41, "learning_rate": 8.81526039616102e-05, "loss": 0.0297, "step": 218820 }, { "epoch": 1.41, "learning_rate": 8.814292260725327e-05, "loss": 0.0336, "step": 218830 }, { "epoch": 1.41, "learning_rate": 8.813324125289633e-05, "loss": 0.0258, "step": 218840 }, { "epoch": 1.41, "learning_rate": 8.81235598985394e-05, "loss": 0.0244, "step": 218850 }, { "epoch": 1.41, "learning_rate": 8.811387854418247e-05, "loss": 0.0287, "step": 218860 }, { "epoch": 1.41, "learning_rate": 8.810419718982553e-05, "loss": 0.0253, "step": 218870 }, { "epoch": 1.41, "learning_rate": 8.809451583546859e-05, "loss": 0.035, "step": 218880 }, { "epoch": 1.41, "learning_rate": 8.808483448111167e-05, "loss": 0.0318, "step": 218890 }, { "epoch": 1.41, "learning_rate": 8.807515312675474e-05, "loss": 0.0294, "step": 218900 }, { "epoch": 1.41, "learning_rate": 8.80654717723978e-05, "loss": 0.0262, "step": 218910 }, { "epoch": 1.41, "learning_rate": 8.805579041804087e-05, "loss": 0.028, "step": 218920 }, { "epoch": 1.41, "learning_rate": 8.804610906368395e-05, "loss": 0.0291, "step": 218930 }, { "epoch": 1.41, "learning_rate": 8.8036427709327e-05, "loss": 0.0342, "step": 218940 }, { "epoch": 1.41, "learning_rate": 8.802674635497007e-05, "loss": 0.0271, "step": 218950 }, { "epoch": 1.41, "learning_rate": 8.801706500061315e-05, "loss": 0.0273, "step": 218960 }, { "epoch": 1.41, "learning_rate": 8.800738364625622e-05, "loss": 0.0305, "step": 218970 }, { "epoch": 1.41, "learning_rate": 8.799770229189927e-05, "loss": 0.0309, "step": 218980 }, { "epoch": 1.41, "learning_rate": 8.798802093754235e-05, "loss": 0.0292, "step": 218990 }, { "epoch": 1.41, "learning_rate": 8.797833958318541e-05, "loss": 0.0281, "step": 219000 }, { "epoch": 1.41, "eval_cer": 0.9199114224381426, "eval_loss": 0.020875846967101097, "eval_runtime": 120.3649, "eval_samples_per_second": 16.616, "eval_steps_per_second": 4.154, "step": 219000 }, { "epoch": 1.41, "learning_rate": 8.796865822882848e-05, "loss": 0.029, "step": 219010 }, { "epoch": 1.41, "learning_rate": 8.795897687447155e-05, "loss": 0.0278, "step": 219020 }, { "epoch": 1.41, "learning_rate": 8.794929552011463e-05, "loss": 0.0298, "step": 219030 }, { "epoch": 1.41, "learning_rate": 8.793961416575769e-05, "loss": 0.0317, "step": 219040 }, { "epoch": 1.41, "learning_rate": 8.792993281140075e-05, "loss": 0.0408, "step": 219050 }, { "epoch": 1.41, "learning_rate": 8.792025145704383e-05, "loss": 0.0263, "step": 219060 }, { "epoch": 1.41, "learning_rate": 8.791057010268689e-05, "loss": 0.0247, "step": 219070 }, { "epoch": 1.41, "learning_rate": 8.790088874832994e-05, "loss": 0.0266, "step": 219080 }, { "epoch": 1.41, "learning_rate": 8.789120739397302e-05, "loss": 0.026, "step": 219090 }, { "epoch": 1.41, "learning_rate": 8.788152603961609e-05, "loss": 0.0251, "step": 219100 }, { "epoch": 1.41, "learning_rate": 8.787184468525917e-05, "loss": 0.023, "step": 219110 }, { "epoch": 1.41, "learning_rate": 8.786216333090222e-05, "loss": 0.0243, "step": 219120 }, { "epoch": 1.41, "learning_rate": 8.78524819765453e-05, "loss": 0.0238, "step": 219130 }, { "epoch": 1.41, "learning_rate": 8.784280062218837e-05, "loss": 0.0268, "step": 219140 }, { "epoch": 1.41, "learning_rate": 8.783311926783142e-05, "loss": 0.0304, "step": 219150 }, { "epoch": 1.41, "learning_rate": 8.78234379134745e-05, "loss": 0.0228, "step": 219160 }, { "epoch": 1.41, "learning_rate": 8.781375655911757e-05, "loss": 0.0381, "step": 219170 }, { "epoch": 1.41, "learning_rate": 8.780407520476065e-05, "loss": 0.0305, "step": 219180 }, { "epoch": 1.41, "learning_rate": 8.77943938504037e-05, "loss": 0.0282, "step": 219190 }, { "epoch": 1.41, "learning_rate": 8.778471249604677e-05, "loss": 0.0325, "step": 219200 }, { "epoch": 1.41, "learning_rate": 8.777503114168985e-05, "loss": 0.0234, "step": 219210 }, { "epoch": 1.41, "learning_rate": 8.77653497873329e-05, "loss": 0.0273, "step": 219220 }, { "epoch": 1.41, "learning_rate": 8.775566843297598e-05, "loss": 0.0305, "step": 219230 }, { "epoch": 1.42, "learning_rate": 8.774598707861904e-05, "loss": 0.0287, "step": 219240 }, { "epoch": 1.42, "learning_rate": 8.773630572426212e-05, "loss": 0.0304, "step": 219250 }, { "epoch": 1.42, "learning_rate": 8.772662436990518e-05, "loss": 0.0311, "step": 219260 }, { "epoch": 1.42, "learning_rate": 8.771694301554824e-05, "loss": 0.0281, "step": 219270 }, { "epoch": 1.42, "learning_rate": 8.770726166119132e-05, "loss": 0.0264, "step": 219280 }, { "epoch": 1.42, "learning_rate": 8.769758030683438e-05, "loss": 0.0296, "step": 219290 }, { "epoch": 1.42, "learning_rate": 8.768789895247744e-05, "loss": 0.0289, "step": 219300 }, { "epoch": 1.42, "learning_rate": 8.767821759812052e-05, "loss": 0.0292, "step": 219310 }, { "epoch": 1.42, "learning_rate": 8.766853624376359e-05, "loss": 0.0341, "step": 219320 }, { "epoch": 1.42, "learning_rate": 8.765885488940665e-05, "loss": 0.0286, "step": 219330 }, { "epoch": 1.42, "learning_rate": 8.764917353504972e-05, "loss": 0.0296, "step": 219340 }, { "epoch": 1.42, "learning_rate": 8.76394921806928e-05, "loss": 0.029, "step": 219350 }, { "epoch": 1.42, "learning_rate": 8.762981082633585e-05, "loss": 0.0238, "step": 219360 }, { "epoch": 1.42, "learning_rate": 8.762012947197892e-05, "loss": 0.0288, "step": 219370 }, { "epoch": 1.42, "learning_rate": 8.7610448117622e-05, "loss": 0.0307, "step": 219380 }, { "epoch": 1.42, "learning_rate": 8.760076676326507e-05, "loss": 0.0308, "step": 219390 }, { "epoch": 1.42, "learning_rate": 8.759108540890812e-05, "loss": 0.0278, "step": 219400 }, { "epoch": 1.42, "learning_rate": 8.75814040545512e-05, "loss": 0.0296, "step": 219410 }, { "epoch": 1.42, "learning_rate": 8.757172270019426e-05, "loss": 0.0271, "step": 219420 }, { "epoch": 1.42, "learning_rate": 8.756204134583733e-05, "loss": 0.0321, "step": 219430 }, { "epoch": 1.42, "learning_rate": 8.75523599914804e-05, "loss": 0.0341, "step": 219440 }, { "epoch": 1.42, "learning_rate": 8.754267863712348e-05, "loss": 0.0277, "step": 219450 }, { "epoch": 1.42, "learning_rate": 8.753299728276654e-05, "loss": 0.0312, "step": 219460 }, { "epoch": 1.42, "learning_rate": 8.75233159284096e-05, "loss": 0.0291, "step": 219470 }, { "epoch": 1.42, "learning_rate": 8.751363457405267e-05, "loss": 0.0258, "step": 219480 }, { "epoch": 1.42, "learning_rate": 8.750395321969574e-05, "loss": 0.0255, "step": 219490 }, { "epoch": 1.42, "learning_rate": 8.74942718653388e-05, "loss": 0.0285, "step": 219500 }, { "epoch": 1.42, "learning_rate": 8.748459051098187e-05, "loss": 0.0323, "step": 219510 }, { "epoch": 1.42, "learning_rate": 8.747490915662494e-05, "loss": 0.0268, "step": 219520 }, { "epoch": 1.42, "learning_rate": 8.746522780226802e-05, "loss": 0.0269, "step": 219530 }, { "epoch": 1.42, "learning_rate": 8.745554644791107e-05, "loss": 0.0297, "step": 219540 }, { "epoch": 1.42, "learning_rate": 8.744586509355415e-05, "loss": 0.0264, "step": 219550 }, { "epoch": 1.42, "learning_rate": 8.743618373919722e-05, "loss": 0.0258, "step": 219560 }, { "epoch": 1.42, "learning_rate": 8.742650238484027e-05, "loss": 0.0284, "step": 219570 }, { "epoch": 1.42, "learning_rate": 8.741682103048335e-05, "loss": 0.0278, "step": 219580 }, { "epoch": 1.42, "learning_rate": 8.740713967612642e-05, "loss": 0.0288, "step": 219590 }, { "epoch": 1.42, "learning_rate": 8.73974583217695e-05, "loss": 0.0278, "step": 219600 }, { "epoch": 1.42, "learning_rate": 8.738777696741255e-05, "loss": 0.0242, "step": 219610 }, { "epoch": 1.42, "learning_rate": 8.737809561305562e-05, "loss": 0.0237, "step": 219620 }, { "epoch": 1.42, "learning_rate": 8.73684142586987e-05, "loss": 0.0294, "step": 219630 }, { "epoch": 1.42, "learning_rate": 8.735873290434175e-05, "loss": 0.0303, "step": 219640 }, { "epoch": 1.42, "learning_rate": 8.734905154998483e-05, "loss": 0.0303, "step": 219650 }, { "epoch": 1.42, "learning_rate": 8.73393701956279e-05, "loss": 0.0282, "step": 219660 }, { "epoch": 1.42, "learning_rate": 8.732968884127096e-05, "loss": 0.0257, "step": 219670 }, { "epoch": 1.42, "learning_rate": 8.732000748691403e-05, "loss": 0.0281, "step": 219680 }, { "epoch": 1.42, "learning_rate": 8.731032613255709e-05, "loss": 0.0271, "step": 219690 }, { "epoch": 1.42, "learning_rate": 8.730064477820017e-05, "loss": 0.0223, "step": 219700 }, { "epoch": 1.42, "learning_rate": 8.729096342384323e-05, "loss": 0.0207, "step": 219710 }, { "epoch": 1.42, "learning_rate": 8.728128206948629e-05, "loss": 0.0319, "step": 219720 }, { "epoch": 1.42, "learning_rate": 8.727160071512937e-05, "loss": 0.0304, "step": 219730 }, { "epoch": 1.42, "learning_rate": 8.726191936077244e-05, "loss": 0.0289, "step": 219740 }, { "epoch": 1.42, "learning_rate": 8.72522380064155e-05, "loss": 0.0326, "step": 219750 }, { "epoch": 1.42, "learning_rate": 8.724255665205857e-05, "loss": 0.0238, "step": 219760 }, { "epoch": 1.42, "learning_rate": 8.723287529770164e-05, "loss": 0.0278, "step": 219770 }, { "epoch": 1.42, "learning_rate": 8.72231939433447e-05, "loss": 0.0321, "step": 219780 }, { "epoch": 1.42, "learning_rate": 8.721351258898777e-05, "loss": 0.0248, "step": 219790 }, { "epoch": 1.42, "learning_rate": 8.720383123463085e-05, "loss": 0.0269, "step": 219800 }, { "epoch": 1.42, "learning_rate": 8.719414988027391e-05, "loss": 0.032, "step": 219810 }, { "epoch": 1.42, "learning_rate": 8.718446852591697e-05, "loss": 0.027, "step": 219820 }, { "epoch": 1.42, "learning_rate": 8.717478717156005e-05, "loss": 0.0287, "step": 219830 }, { "epoch": 1.42, "learning_rate": 8.716510581720311e-05, "loss": 0.027, "step": 219840 }, { "epoch": 1.42, "learning_rate": 8.715542446284618e-05, "loss": 0.027, "step": 219850 }, { "epoch": 1.42, "learning_rate": 8.714574310848925e-05, "loss": 0.0276, "step": 219860 }, { "epoch": 1.42, "learning_rate": 8.713606175413233e-05, "loss": 0.0305, "step": 219870 }, { "epoch": 1.42, "learning_rate": 8.712638039977539e-05, "loss": 0.028, "step": 219880 }, { "epoch": 1.42, "learning_rate": 8.711669904541844e-05, "loss": 0.0272, "step": 219890 }, { "epoch": 1.42, "learning_rate": 8.710701769106152e-05, "loss": 0.0259, "step": 219900 }, { "epoch": 1.42, "learning_rate": 8.709733633670459e-05, "loss": 0.0329, "step": 219910 }, { "epoch": 1.42, "learning_rate": 8.708765498234764e-05, "loss": 0.0285, "step": 219920 }, { "epoch": 1.42, "learning_rate": 8.707797362799072e-05, "loss": 0.0296, "step": 219930 }, { "epoch": 1.42, "learning_rate": 8.706829227363379e-05, "loss": 0.0243, "step": 219940 }, { "epoch": 1.42, "learning_rate": 8.705861091927687e-05, "loss": 0.0274, "step": 219950 }, { "epoch": 1.42, "learning_rate": 8.704892956491992e-05, "loss": 0.0319, "step": 219960 }, { "epoch": 1.42, "learning_rate": 8.7039248210563e-05, "loss": 0.0299, "step": 219970 }, { "epoch": 1.42, "learning_rate": 8.702956685620607e-05, "loss": 0.029, "step": 219980 }, { "epoch": 1.42, "learning_rate": 8.701988550184912e-05, "loss": 0.0277, "step": 219990 }, { "epoch": 1.42, "learning_rate": 8.70102041474922e-05, "loss": 0.0286, "step": 220000 }, { "epoch": 1.42, "eval_cer": 0.9197812676533725, "eval_loss": 0.02094407007098198, "eval_runtime": 120.2687, "eval_samples_per_second": 16.629, "eval_steps_per_second": 4.157, "step": 220000 }, { "epoch": 1.42, "learning_rate": 8.700052279313527e-05, "loss": 0.0248, "step": 220010 }, { "epoch": 1.42, "learning_rate": 8.699084143877835e-05, "loss": 0.0287, "step": 220020 }, { "epoch": 1.42, "learning_rate": 8.69811600844214e-05, "loss": 0.0262, "step": 220030 }, { "epoch": 1.42, "learning_rate": 8.697147873006447e-05, "loss": 0.0293, "step": 220040 }, { "epoch": 1.42, "learning_rate": 8.696179737570755e-05, "loss": 0.0248, "step": 220050 }, { "epoch": 1.42, "learning_rate": 8.69521160213506e-05, "loss": 0.026, "step": 220060 }, { "epoch": 1.42, "learning_rate": 8.694243466699368e-05, "loss": 0.0303, "step": 220070 }, { "epoch": 1.42, "learning_rate": 8.693275331263674e-05, "loss": 0.0323, "step": 220080 }, { "epoch": 1.42, "learning_rate": 8.692307195827981e-05, "loss": 0.0306, "step": 220090 }, { "epoch": 1.42, "learning_rate": 8.691339060392288e-05, "loss": 0.0322, "step": 220100 }, { "epoch": 1.42, "learning_rate": 8.690370924956594e-05, "loss": 0.0276, "step": 220110 }, { "epoch": 1.42, "learning_rate": 8.689402789520902e-05, "loss": 0.0282, "step": 220120 }, { "epoch": 1.42, "learning_rate": 8.688434654085208e-05, "loss": 0.0335, "step": 220130 }, { "epoch": 1.42, "learning_rate": 8.687466518649514e-05, "loss": 0.0301, "step": 220140 }, { "epoch": 1.42, "learning_rate": 8.686498383213822e-05, "loss": 0.0294, "step": 220150 }, { "epoch": 1.42, "learning_rate": 8.685530247778129e-05, "loss": 0.0268, "step": 220160 }, { "epoch": 1.42, "learning_rate": 8.684562112342435e-05, "loss": 0.0302, "step": 220170 }, { "epoch": 1.42, "learning_rate": 8.683593976906742e-05, "loss": 0.0297, "step": 220180 }, { "epoch": 1.42, "learning_rate": 8.682625841471049e-05, "loss": 0.0249, "step": 220190 }, { "epoch": 1.42, "learning_rate": 8.681657706035355e-05, "loss": 0.0291, "step": 220200 }, { "epoch": 1.42, "learning_rate": 8.680689570599662e-05, "loss": 0.0248, "step": 220210 }, { "epoch": 1.42, "learning_rate": 8.67972143516397e-05, "loss": 0.0288, "step": 220220 }, { "epoch": 1.42, "learning_rate": 8.678753299728276e-05, "loss": 0.0235, "step": 220230 }, { "epoch": 1.42, "learning_rate": 8.677785164292582e-05, "loss": 0.0308, "step": 220240 }, { "epoch": 1.42, "learning_rate": 8.67681702885689e-05, "loss": 0.0312, "step": 220250 }, { "epoch": 1.42, "learning_rate": 8.675848893421196e-05, "loss": 0.0293, "step": 220260 }, { "epoch": 1.42, "learning_rate": 8.674880757985503e-05, "loss": 0.0302, "step": 220270 }, { "epoch": 1.42, "learning_rate": 8.67391262254981e-05, "loss": 0.0265, "step": 220280 }, { "epoch": 1.42, "learning_rate": 8.672944487114116e-05, "loss": 0.0347, "step": 220290 }, { "epoch": 1.42, "learning_rate": 8.671976351678424e-05, "loss": 0.0382, "step": 220300 }, { "epoch": 1.42, "learning_rate": 8.67100821624273e-05, "loss": 0.0296, "step": 220310 }, { "epoch": 1.42, "learning_rate": 8.670040080807037e-05, "loss": 0.0283, "step": 220320 }, { "epoch": 1.42, "learning_rate": 8.669071945371344e-05, "loss": 0.0231, "step": 220330 }, { "epoch": 1.42, "learning_rate": 8.66810380993565e-05, "loss": 0.0287, "step": 220340 }, { "epoch": 1.42, "learning_rate": 8.667135674499957e-05, "loss": 0.0318, "step": 220350 }, { "epoch": 1.42, "learning_rate": 8.666167539064264e-05, "loss": 0.0261, "step": 220360 }, { "epoch": 1.42, "learning_rate": 8.665199403628572e-05, "loss": 0.0241, "step": 220370 }, { "epoch": 1.42, "learning_rate": 8.664231268192877e-05, "loss": 0.0328, "step": 220380 }, { "epoch": 1.42, "learning_rate": 8.663263132757184e-05, "loss": 0.0272, "step": 220390 }, { "epoch": 1.42, "learning_rate": 8.662294997321492e-05, "loss": 0.0301, "step": 220400 }, { "epoch": 1.42, "learning_rate": 8.661326861885797e-05, "loss": 0.0244, "step": 220410 }, { "epoch": 1.42, "learning_rate": 8.660358726450105e-05, "loss": 0.0281, "step": 220420 }, { "epoch": 1.42, "learning_rate": 8.659390591014412e-05, "loss": 0.024, "step": 220430 }, { "epoch": 1.42, "learning_rate": 8.65842245557872e-05, "loss": 0.0313, "step": 220440 }, { "epoch": 1.42, "learning_rate": 8.657454320143025e-05, "loss": 0.0303, "step": 220450 }, { "epoch": 1.42, "learning_rate": 8.656486184707332e-05, "loss": 0.0257, "step": 220460 }, { "epoch": 1.42, "learning_rate": 8.65551804927164e-05, "loss": 0.0259, "step": 220470 }, { "epoch": 1.42, "learning_rate": 8.654549913835945e-05, "loss": 0.0268, "step": 220480 }, { "epoch": 1.42, "learning_rate": 8.653581778400251e-05, "loss": 0.0283, "step": 220490 }, { "epoch": 1.42, "learning_rate": 8.65261364296456e-05, "loss": 0.0251, "step": 220500 }, { "epoch": 1.42, "learning_rate": 8.651645507528866e-05, "loss": 0.026, "step": 220510 }, { "epoch": 1.42, "learning_rate": 8.650677372093173e-05, "loss": 0.0233, "step": 220520 }, { "epoch": 1.42, "learning_rate": 8.649709236657479e-05, "loss": 0.0329, "step": 220530 }, { "epoch": 1.42, "learning_rate": 8.648741101221787e-05, "loss": 0.0331, "step": 220540 }, { "epoch": 1.42, "learning_rate": 8.647772965786093e-05, "loss": 0.0301, "step": 220550 }, { "epoch": 1.42, "learning_rate": 8.646804830350399e-05, "loss": 0.0248, "step": 220560 }, { "epoch": 1.42, "learning_rate": 8.645836694914707e-05, "loss": 0.026, "step": 220570 }, { "epoch": 1.42, "learning_rate": 8.644868559479014e-05, "loss": 0.0295, "step": 220580 }, { "epoch": 1.42, "learning_rate": 8.643900424043319e-05, "loss": 0.0251, "step": 220590 }, { "epoch": 1.42, "learning_rate": 8.642932288607627e-05, "loss": 0.0271, "step": 220600 }, { "epoch": 1.42, "learning_rate": 8.641964153171934e-05, "loss": 0.0224, "step": 220610 }, { "epoch": 1.42, "learning_rate": 8.64099601773624e-05, "loss": 0.0286, "step": 220620 }, { "epoch": 1.42, "learning_rate": 8.640027882300547e-05, "loss": 0.0257, "step": 220630 }, { "epoch": 1.42, "learning_rate": 8.639059746864855e-05, "loss": 0.0267, "step": 220640 }, { "epoch": 1.42, "learning_rate": 8.638091611429161e-05, "loss": 0.0315, "step": 220650 }, { "epoch": 1.42, "learning_rate": 8.637123475993467e-05, "loss": 0.0293, "step": 220660 }, { "epoch": 1.42, "learning_rate": 8.636155340557775e-05, "loss": 0.0255, "step": 220670 }, { "epoch": 1.42, "learning_rate": 8.635187205122081e-05, "loss": 0.0312, "step": 220680 }, { "epoch": 1.42, "learning_rate": 8.634219069686387e-05, "loss": 0.0282, "step": 220690 }, { "epoch": 1.42, "learning_rate": 8.633250934250695e-05, "loss": 0.0241, "step": 220700 }, { "epoch": 1.42, "learning_rate": 8.632282798815001e-05, "loss": 0.0289, "step": 220710 }, { "epoch": 1.42, "learning_rate": 8.631314663379309e-05, "loss": 0.0269, "step": 220720 }, { "epoch": 1.42, "learning_rate": 8.630346527943614e-05, "loss": 0.0327, "step": 220730 }, { "epoch": 1.42, "learning_rate": 8.629378392507922e-05, "loss": 0.0265, "step": 220740 }, { "epoch": 1.42, "learning_rate": 8.628410257072229e-05, "loss": 0.0323, "step": 220750 }, { "epoch": 1.42, "learning_rate": 8.627442121636534e-05, "loss": 0.0311, "step": 220760 }, { "epoch": 1.42, "learning_rate": 8.626473986200842e-05, "loss": 0.0339, "step": 220770 }, { "epoch": 1.42, "learning_rate": 8.625505850765149e-05, "loss": 0.028, "step": 220780 }, { "epoch": 1.43, "learning_rate": 8.624537715329457e-05, "loss": 0.03, "step": 220790 }, { "epoch": 1.43, "learning_rate": 8.623569579893762e-05, "loss": 0.0232, "step": 220800 }, { "epoch": 1.43, "learning_rate": 8.622601444458069e-05, "loss": 0.0298, "step": 220810 }, { "epoch": 1.43, "learning_rate": 8.621633309022377e-05, "loss": 0.0379, "step": 220820 }, { "epoch": 1.43, "learning_rate": 8.620665173586682e-05, "loss": 0.0273, "step": 220830 }, { "epoch": 1.43, "learning_rate": 8.61969703815099e-05, "loss": 0.0266, "step": 220840 }, { "epoch": 1.43, "learning_rate": 8.618728902715297e-05, "loss": 0.0302, "step": 220850 }, { "epoch": 1.43, "learning_rate": 8.617760767279605e-05, "loss": 0.0271, "step": 220860 }, { "epoch": 1.43, "learning_rate": 8.61679263184391e-05, "loss": 0.0289, "step": 220870 }, { "epoch": 1.43, "learning_rate": 8.615824496408217e-05, "loss": 0.0208, "step": 220880 }, { "epoch": 1.43, "learning_rate": 8.614856360972524e-05, "loss": 0.0278, "step": 220890 }, { "epoch": 1.43, "learning_rate": 8.61388822553683e-05, "loss": 0.0297, "step": 220900 }, { "epoch": 1.43, "learning_rate": 8.612920090101136e-05, "loss": 0.0309, "step": 220910 }, { "epoch": 1.43, "learning_rate": 8.611951954665444e-05, "loss": 0.0256, "step": 220920 }, { "epoch": 1.43, "learning_rate": 8.610983819229751e-05, "loss": 0.0314, "step": 220930 }, { "epoch": 1.43, "learning_rate": 8.610015683794058e-05, "loss": 0.0218, "step": 220940 }, { "epoch": 1.43, "learning_rate": 8.609047548358364e-05, "loss": 0.032, "step": 220950 }, { "epoch": 1.43, "learning_rate": 8.608079412922672e-05, "loss": 0.0306, "step": 220960 }, { "epoch": 1.43, "learning_rate": 8.607111277486977e-05, "loss": 0.0331, "step": 220970 }, { "epoch": 1.43, "learning_rate": 8.606143142051284e-05, "loss": 0.0312, "step": 220980 }, { "epoch": 1.43, "learning_rate": 8.605175006615592e-05, "loss": 0.0303, "step": 220990 }, { "epoch": 1.43, "learning_rate": 8.604206871179899e-05, "loss": 0.0297, "step": 221000 }, { "epoch": 1.43, "eval_cer": 0.9199529996610553, "eval_loss": 0.02053585834801197, "eval_runtime": 120.2097, "eval_samples_per_second": 16.638, "eval_steps_per_second": 4.159, "step": 221000 }, { "epoch": 1.43, "learning_rate": 8.603238735744204e-05, "loss": 0.0319, "step": 221010 }, { "epoch": 1.43, "learning_rate": 8.602270600308512e-05, "loss": 0.0258, "step": 221020 }, { "epoch": 1.43, "learning_rate": 8.601302464872819e-05, "loss": 0.0343, "step": 221030 }, { "epoch": 1.43, "learning_rate": 8.600334329437125e-05, "loss": 0.0301, "step": 221040 }, { "epoch": 1.43, "learning_rate": 8.599366194001432e-05, "loss": 0.0243, "step": 221050 }, { "epoch": 1.43, "learning_rate": 8.59839805856574e-05, "loss": 0.0247, "step": 221060 }, { "epoch": 1.43, "learning_rate": 8.597429923130046e-05, "loss": 0.0256, "step": 221070 }, { "epoch": 1.43, "learning_rate": 8.596461787694352e-05, "loss": 0.0336, "step": 221080 }, { "epoch": 1.43, "learning_rate": 8.59549365225866e-05, "loss": 0.0282, "step": 221090 }, { "epoch": 1.43, "learning_rate": 8.594525516822966e-05, "loss": 0.0302, "step": 221100 }, { "epoch": 1.43, "learning_rate": 8.593557381387272e-05, "loss": 0.0264, "step": 221110 }, { "epoch": 1.43, "learning_rate": 8.59258924595158e-05, "loss": 0.03, "step": 221120 }, { "epoch": 1.43, "learning_rate": 8.591621110515886e-05, "loss": 0.0272, "step": 221130 }, { "epoch": 1.43, "learning_rate": 8.590652975080194e-05, "loss": 0.0258, "step": 221140 }, { "epoch": 1.43, "learning_rate": 8.5896848396445e-05, "loss": 0.0244, "step": 221150 }, { "epoch": 1.43, "learning_rate": 8.588716704208807e-05, "loss": 0.0269, "step": 221160 }, { "epoch": 1.43, "learning_rate": 8.587748568773114e-05, "loss": 0.0216, "step": 221170 }, { "epoch": 1.43, "learning_rate": 8.586780433337419e-05, "loss": 0.03, "step": 221180 }, { "epoch": 1.43, "learning_rate": 8.585812297901727e-05, "loss": 0.0256, "step": 221190 }, { "epoch": 1.43, "learning_rate": 8.584844162466034e-05, "loss": 0.0251, "step": 221200 }, { "epoch": 1.43, "learning_rate": 8.583876027030342e-05, "loss": 0.0274, "step": 221210 }, { "epoch": 1.43, "learning_rate": 8.582907891594647e-05, "loss": 0.0372, "step": 221220 }, { "epoch": 1.43, "learning_rate": 8.581939756158954e-05, "loss": 0.0321, "step": 221230 }, { "epoch": 1.43, "learning_rate": 8.580971620723262e-05, "loss": 0.0288, "step": 221240 }, { "epoch": 1.43, "learning_rate": 8.580003485287567e-05, "loss": 0.025, "step": 221250 }, { "epoch": 1.43, "learning_rate": 8.579035349851875e-05, "loss": 0.0291, "step": 221260 }, { "epoch": 1.43, "learning_rate": 8.578067214416182e-05, "loss": 0.0281, "step": 221270 }, { "epoch": 1.43, "learning_rate": 8.577099078980488e-05, "loss": 0.0332, "step": 221280 }, { "epoch": 1.43, "learning_rate": 8.576130943544795e-05, "loss": 0.0284, "step": 221290 }, { "epoch": 1.43, "learning_rate": 8.575162808109101e-05, "loss": 0.0274, "step": 221300 }, { "epoch": 1.43, "learning_rate": 8.57419467267341e-05, "loss": 0.031, "step": 221310 }, { "epoch": 1.43, "learning_rate": 8.573226537237715e-05, "loss": 0.032, "step": 221320 }, { "epoch": 1.43, "learning_rate": 8.572258401802021e-05, "loss": 0.0329, "step": 221330 }, { "epoch": 1.43, "learning_rate": 8.57129026636633e-05, "loss": 0.0244, "step": 221340 }, { "epoch": 1.43, "learning_rate": 8.570322130930636e-05, "loss": 0.0301, "step": 221350 }, { "epoch": 1.43, "learning_rate": 8.569353995494943e-05, "loss": 0.0271, "step": 221360 }, { "epoch": 1.43, "learning_rate": 8.568385860059249e-05, "loss": 0.0299, "step": 221370 }, { "epoch": 1.43, "learning_rate": 8.567417724623556e-05, "loss": 0.0286, "step": 221380 }, { "epoch": 1.43, "learning_rate": 8.566449589187862e-05, "loss": 0.0312, "step": 221390 }, { "epoch": 1.43, "learning_rate": 8.565481453752169e-05, "loss": 0.0243, "step": 221400 }, { "epoch": 1.43, "learning_rate": 8.564513318316477e-05, "loss": 0.0298, "step": 221410 }, { "epoch": 1.43, "learning_rate": 8.563545182880784e-05, "loss": 0.0315, "step": 221420 }, { "epoch": 1.43, "learning_rate": 8.562577047445089e-05, "loss": 0.0316, "step": 221430 }, { "epoch": 1.43, "learning_rate": 8.561608912009397e-05, "loss": 0.0292, "step": 221440 }, { "epoch": 1.43, "learning_rate": 8.560640776573704e-05, "loss": 0.0314, "step": 221450 }, { "epoch": 1.43, "learning_rate": 8.55967264113801e-05, "loss": 0.0252, "step": 221460 }, { "epoch": 1.43, "learning_rate": 8.558704505702317e-05, "loss": 0.0325, "step": 221470 }, { "epoch": 1.43, "learning_rate": 8.557736370266623e-05, "loss": 0.0289, "step": 221480 }, { "epoch": 1.43, "learning_rate": 8.556768234830931e-05, "loss": 0.0294, "step": 221490 }, { "epoch": 1.43, "learning_rate": 8.555800099395237e-05, "loss": 0.0267, "step": 221500 }, { "epoch": 1.43, "learning_rate": 8.554831963959545e-05, "loss": 0.0305, "step": 221510 }, { "epoch": 1.43, "learning_rate": 8.553863828523851e-05, "loss": 0.0302, "step": 221520 }, { "epoch": 1.43, "learning_rate": 8.552895693088157e-05, "loss": 0.0243, "step": 221530 }, { "epoch": 1.43, "learning_rate": 8.551927557652465e-05, "loss": 0.0225, "step": 221540 }, { "epoch": 1.43, "learning_rate": 8.550959422216771e-05, "loss": 0.0257, "step": 221550 }, { "epoch": 1.43, "learning_rate": 8.549991286781079e-05, "loss": 0.0282, "step": 221560 }, { "epoch": 1.43, "learning_rate": 8.549023151345384e-05, "loss": 0.0229, "step": 221570 }, { "epoch": 1.43, "learning_rate": 8.548055015909691e-05, "loss": 0.027, "step": 221580 }, { "epoch": 1.43, "learning_rate": 8.547086880473999e-05, "loss": 0.0316, "step": 221590 }, { "epoch": 1.43, "learning_rate": 8.546118745038304e-05, "loss": 0.0277, "step": 221600 }, { "epoch": 1.43, "learning_rate": 8.545150609602612e-05, "loss": 0.0358, "step": 221610 }, { "epoch": 1.43, "learning_rate": 8.544182474166919e-05, "loss": 0.0269, "step": 221620 }, { "epoch": 1.43, "learning_rate": 8.543214338731227e-05, "loss": 0.0277, "step": 221630 }, { "epoch": 1.43, "learning_rate": 8.542246203295532e-05, "loss": 0.0309, "step": 221640 }, { "epoch": 1.43, "learning_rate": 8.541278067859839e-05, "loss": 0.0247, "step": 221650 }, { "epoch": 1.43, "learning_rate": 8.540309932424147e-05, "loss": 0.0319, "step": 221660 }, { "epoch": 1.43, "learning_rate": 8.539341796988452e-05, "loss": 0.0274, "step": 221670 }, { "epoch": 1.43, "learning_rate": 8.538373661552759e-05, "loss": 0.0271, "step": 221680 }, { "epoch": 1.43, "learning_rate": 8.537405526117067e-05, "loss": 0.0299, "step": 221690 }, { "epoch": 1.43, "learning_rate": 8.536437390681373e-05, "loss": 0.0329, "step": 221700 }, { "epoch": 1.43, "learning_rate": 8.53546925524568e-05, "loss": 0.0309, "step": 221710 }, { "epoch": 1.43, "learning_rate": 8.534501119809986e-05, "loss": 0.0326, "step": 221720 }, { "epoch": 1.43, "learning_rate": 8.533532984374294e-05, "loss": 0.0269, "step": 221730 }, { "epoch": 1.43, "learning_rate": 8.5325648489386e-05, "loss": 0.0328, "step": 221740 }, { "epoch": 1.43, "learning_rate": 8.531596713502906e-05, "loss": 0.0289, "step": 221750 }, { "epoch": 1.43, "learning_rate": 8.530628578067214e-05, "loss": 0.0298, "step": 221760 }, { "epoch": 1.43, "learning_rate": 8.529660442631521e-05, "loss": 0.0333, "step": 221770 }, { "epoch": 1.43, "learning_rate": 8.528692307195826e-05, "loss": 0.031, "step": 221780 }, { "epoch": 1.43, "learning_rate": 8.527724171760134e-05, "loss": 0.0295, "step": 221790 }, { "epoch": 1.43, "learning_rate": 8.526756036324441e-05, "loss": 0.0273, "step": 221800 }, { "epoch": 1.43, "learning_rate": 8.525787900888747e-05, "loss": 0.0291, "step": 221810 }, { "epoch": 1.43, "learning_rate": 8.524819765453054e-05, "loss": 0.0256, "step": 221820 }, { "epoch": 1.43, "learning_rate": 8.523851630017362e-05, "loss": 0.029, "step": 221830 }, { "epoch": 1.43, "learning_rate": 8.522883494581669e-05, "loss": 0.0276, "step": 221840 }, { "epoch": 1.43, "learning_rate": 8.521915359145974e-05, "loss": 0.0285, "step": 221850 }, { "epoch": 1.43, "learning_rate": 8.520947223710282e-05, "loss": 0.0271, "step": 221860 }, { "epoch": 1.43, "learning_rate": 8.519979088274589e-05, "loss": 0.0306, "step": 221870 }, { "epoch": 1.43, "learning_rate": 8.519010952838894e-05, "loss": 0.0391, "step": 221880 }, { "epoch": 1.43, "learning_rate": 8.518042817403202e-05, "loss": 0.0293, "step": 221890 }, { "epoch": 1.43, "learning_rate": 8.517074681967508e-05, "loss": 0.0323, "step": 221900 }, { "epoch": 1.43, "learning_rate": 8.516106546531816e-05, "loss": 0.0249, "step": 221910 }, { "epoch": 1.43, "learning_rate": 8.515138411096122e-05, "loss": 0.0333, "step": 221920 }, { "epoch": 1.43, "learning_rate": 8.51417027566043e-05, "loss": 0.0261, "step": 221930 }, { "epoch": 1.43, "learning_rate": 8.513202140224736e-05, "loss": 0.0259, "step": 221940 }, { "epoch": 1.43, "learning_rate": 8.512234004789042e-05, "loss": 0.026, "step": 221950 }, { "epoch": 1.43, "learning_rate": 8.51126586935335e-05, "loss": 0.0304, "step": 221960 }, { "epoch": 1.43, "learning_rate": 8.510297733917656e-05, "loss": 0.0265, "step": 221970 }, { "epoch": 1.43, "learning_rate": 8.509329598481964e-05, "loss": 0.027, "step": 221980 }, { "epoch": 1.43, "learning_rate": 8.50836146304627e-05, "loss": 0.0273, "step": 221990 }, { "epoch": 1.43, "learning_rate": 8.507393327610576e-05, "loss": 0.0256, "step": 222000 }, { "epoch": 1.43, "eval_cer": 0.9199059993221105, "eval_loss": 0.02071262337267399, "eval_runtime": 120.0993, "eval_samples_per_second": 16.653, "eval_steps_per_second": 4.163, "step": 222000 }, { "epoch": 1.43, "learning_rate": 8.506425192174884e-05, "loss": 0.027, "step": 222010 }, { "epoch": 1.43, "learning_rate": 8.505457056739189e-05, "loss": 0.0239, "step": 222020 }, { "epoch": 1.43, "learning_rate": 8.504488921303497e-05, "loss": 0.0306, "step": 222030 }, { "epoch": 1.43, "learning_rate": 8.503520785867804e-05, "loss": 0.0346, "step": 222040 }, { "epoch": 1.43, "learning_rate": 8.502552650432112e-05, "loss": 0.0284, "step": 222050 }, { "epoch": 1.43, "learning_rate": 8.501584514996417e-05, "loss": 0.0311, "step": 222060 }, { "epoch": 1.43, "learning_rate": 8.500616379560724e-05, "loss": 0.0287, "step": 222070 }, { "epoch": 1.43, "learning_rate": 8.499648244125032e-05, "loss": 0.0241, "step": 222080 }, { "epoch": 1.43, "learning_rate": 8.498680108689337e-05, "loss": 0.0282, "step": 222090 }, { "epoch": 1.43, "learning_rate": 8.497711973253644e-05, "loss": 0.0251, "step": 222100 }, { "epoch": 1.43, "learning_rate": 8.496743837817952e-05, "loss": 0.0273, "step": 222110 }, { "epoch": 1.43, "learning_rate": 8.495775702382257e-05, "loss": 0.0244, "step": 222120 }, { "epoch": 1.43, "learning_rate": 8.494807566946565e-05, "loss": 0.0295, "step": 222130 }, { "epoch": 1.43, "learning_rate": 8.493839431510871e-05, "loss": 0.0261, "step": 222140 }, { "epoch": 1.43, "learning_rate": 8.49287129607518e-05, "loss": 0.0255, "step": 222150 }, { "epoch": 1.43, "learning_rate": 8.491903160639485e-05, "loss": 0.0257, "step": 222160 }, { "epoch": 1.43, "learning_rate": 8.490935025203791e-05, "loss": 0.0263, "step": 222170 }, { "epoch": 1.43, "learning_rate": 8.489966889768099e-05, "loss": 0.0345, "step": 222180 }, { "epoch": 1.43, "learning_rate": 8.488998754332405e-05, "loss": 0.0259, "step": 222190 }, { "epoch": 1.43, "learning_rate": 8.488030618896711e-05, "loss": 0.0312, "step": 222200 }, { "epoch": 1.43, "learning_rate": 8.487062483461019e-05, "loss": 0.0296, "step": 222210 }, { "epoch": 1.43, "learning_rate": 8.486094348025326e-05, "loss": 0.0262, "step": 222220 }, { "epoch": 1.43, "learning_rate": 8.485126212589632e-05, "loss": 0.0282, "step": 222230 }, { "epoch": 1.43, "learning_rate": 8.484158077153939e-05, "loss": 0.0267, "step": 222240 }, { "epoch": 1.43, "learning_rate": 8.483189941718247e-05, "loss": 0.0321, "step": 222250 }, { "epoch": 1.43, "learning_rate": 8.482221806282552e-05, "loss": 0.0277, "step": 222260 }, { "epoch": 1.43, "learning_rate": 8.481253670846859e-05, "loss": 0.0289, "step": 222270 }, { "epoch": 1.43, "learning_rate": 8.480285535411167e-05, "loss": 0.0261, "step": 222280 }, { "epoch": 1.43, "learning_rate": 8.479317399975474e-05, "loss": 0.0261, "step": 222290 }, { "epoch": 1.43, "learning_rate": 8.478349264539779e-05, "loss": 0.0267, "step": 222300 }, { "epoch": 1.43, "learning_rate": 8.477381129104087e-05, "loss": 0.0232, "step": 222310 }, { "epoch": 1.43, "learning_rate": 8.476412993668393e-05, "loss": 0.031, "step": 222320 }, { "epoch": 1.43, "learning_rate": 8.4754448582327e-05, "loss": 0.0301, "step": 222330 }, { "epoch": 1.44, "learning_rate": 8.474476722797007e-05, "loss": 0.0322, "step": 222340 }, { "epoch": 1.44, "learning_rate": 8.473508587361315e-05, "loss": 0.0278, "step": 222350 }, { "epoch": 1.44, "learning_rate": 8.472540451925621e-05, "loss": 0.029, "step": 222360 }, { "epoch": 1.44, "learning_rate": 8.471572316489927e-05, "loss": 0.033, "step": 222370 }, { "epoch": 1.44, "learning_rate": 8.470604181054234e-05, "loss": 0.029, "step": 222380 }, { "epoch": 1.44, "learning_rate": 8.469636045618541e-05, "loss": 0.0243, "step": 222390 }, { "epoch": 1.44, "learning_rate": 8.468667910182846e-05, "loss": 0.0286, "step": 222400 }, { "epoch": 1.44, "learning_rate": 8.467699774747154e-05, "loss": 0.0304, "step": 222410 }, { "epoch": 1.44, "learning_rate": 8.466731639311461e-05, "loss": 0.0306, "step": 222420 }, { "epoch": 1.44, "learning_rate": 8.465763503875769e-05, "loss": 0.0258, "step": 222430 }, { "epoch": 1.44, "learning_rate": 8.464795368440074e-05, "loss": 0.0311, "step": 222440 }, { "epoch": 1.44, "learning_rate": 8.463827233004382e-05, "loss": 0.0306, "step": 222450 }, { "epoch": 1.44, "learning_rate": 8.462859097568689e-05, "loss": 0.0274, "step": 222460 }, { "epoch": 1.44, "learning_rate": 8.461890962132994e-05, "loss": 0.0246, "step": 222470 }, { "epoch": 1.44, "learning_rate": 8.460922826697302e-05, "loss": 0.0259, "step": 222480 }, { "epoch": 1.44, "learning_rate": 8.459954691261609e-05, "loss": 0.0249, "step": 222490 }, { "epoch": 1.44, "learning_rate": 8.458986555825917e-05, "loss": 0.0304, "step": 222500 }, { "epoch": 1.44, "learning_rate": 8.458018420390222e-05, "loss": 0.0329, "step": 222510 }, { "epoch": 1.44, "learning_rate": 8.457050284954529e-05, "loss": 0.0248, "step": 222520 }, { "epoch": 1.44, "learning_rate": 8.456082149518837e-05, "loss": 0.0283, "step": 222530 }, { "epoch": 1.44, "learning_rate": 8.455114014083142e-05, "loss": 0.0249, "step": 222540 }, { "epoch": 1.44, "learning_rate": 8.45414587864745e-05, "loss": 0.0232, "step": 222550 }, { "epoch": 1.44, "learning_rate": 8.453177743211756e-05, "loss": 0.0234, "step": 222560 }, { "epoch": 1.44, "learning_rate": 8.452209607776063e-05, "loss": 0.0257, "step": 222570 }, { "epoch": 1.44, "learning_rate": 8.45124147234037e-05, "loss": 0.027, "step": 222580 }, { "epoch": 1.44, "learning_rate": 8.450273336904676e-05, "loss": 0.0291, "step": 222590 }, { "epoch": 1.44, "learning_rate": 8.449305201468984e-05, "loss": 0.0267, "step": 222600 }, { "epoch": 1.44, "learning_rate": 8.44833706603329e-05, "loss": 0.0307, "step": 222610 }, { "epoch": 1.44, "learning_rate": 8.447368930597596e-05, "loss": 0.0288, "step": 222620 }, { "epoch": 1.44, "learning_rate": 8.446400795161904e-05, "loss": 0.035, "step": 222630 }, { "epoch": 1.44, "learning_rate": 8.445432659726211e-05, "loss": 0.0283, "step": 222640 }, { "epoch": 1.44, "learning_rate": 8.444464524290517e-05, "loss": 0.0237, "step": 222650 }, { "epoch": 1.44, "learning_rate": 8.443496388854824e-05, "loss": 0.0294, "step": 222660 }, { "epoch": 1.44, "learning_rate": 8.44252825341913e-05, "loss": 0.0244, "step": 222670 }, { "epoch": 1.44, "learning_rate": 8.441560117983437e-05, "loss": 0.026, "step": 222680 }, { "epoch": 1.44, "learning_rate": 8.440591982547744e-05, "loss": 0.0363, "step": 222690 }, { "epoch": 1.44, "learning_rate": 8.439623847112052e-05, "loss": 0.026, "step": 222700 }, { "epoch": 1.44, "learning_rate": 8.438655711676359e-05, "loss": 0.0284, "step": 222710 }, { "epoch": 1.44, "learning_rate": 8.437687576240664e-05, "loss": 0.0302, "step": 222720 }, { "epoch": 1.44, "learning_rate": 8.436719440804972e-05, "loss": 0.0256, "step": 222730 }, { "epoch": 1.44, "learning_rate": 8.435751305369278e-05, "loss": 0.0285, "step": 222740 }, { "epoch": 1.44, "learning_rate": 8.434783169933585e-05, "loss": 0.0267, "step": 222750 }, { "epoch": 1.44, "learning_rate": 8.433815034497892e-05, "loss": 0.0249, "step": 222760 }, { "epoch": 1.44, "learning_rate": 8.432846899062198e-05, "loss": 0.0355, "step": 222770 }, { "epoch": 1.44, "learning_rate": 8.431878763626506e-05, "loss": 0.025, "step": 222780 }, { "epoch": 1.44, "learning_rate": 8.430910628190811e-05, "loss": 0.0285, "step": 222790 }, { "epoch": 1.44, "learning_rate": 8.42994249275512e-05, "loss": 0.0286, "step": 222800 }, { "epoch": 1.44, "learning_rate": 8.428974357319426e-05, "loss": 0.0267, "step": 222810 }, { "epoch": 1.44, "learning_rate": 8.428006221883731e-05, "loss": 0.0304, "step": 222820 }, { "epoch": 1.44, "learning_rate": 8.42703808644804e-05, "loss": 0.0365, "step": 222830 }, { "epoch": 1.44, "learning_rate": 8.426069951012346e-05, "loss": 0.0288, "step": 222840 }, { "epoch": 1.44, "learning_rate": 8.425101815576654e-05, "loss": 0.0323, "step": 222850 }, { "epoch": 1.44, "learning_rate": 8.424133680140959e-05, "loss": 0.0293, "step": 222860 }, { "epoch": 1.44, "learning_rate": 8.423165544705266e-05, "loss": 0.029, "step": 222870 }, { "epoch": 1.44, "learning_rate": 8.422197409269574e-05, "loss": 0.0291, "step": 222880 }, { "epoch": 1.44, "learning_rate": 8.421229273833879e-05, "loss": 0.0274, "step": 222890 }, { "epoch": 1.44, "learning_rate": 8.420261138398187e-05, "loss": 0.0288, "step": 222900 }, { "epoch": 1.44, "learning_rate": 8.419293002962494e-05, "loss": 0.0266, "step": 222910 }, { "epoch": 1.44, "learning_rate": 8.418324867526802e-05, "loss": 0.0237, "step": 222920 }, { "epoch": 1.44, "learning_rate": 8.417356732091107e-05, "loss": 0.0252, "step": 222930 }, { "epoch": 1.44, "learning_rate": 8.416388596655414e-05, "loss": 0.0311, "step": 222940 }, { "epoch": 1.44, "learning_rate": 8.415420461219722e-05, "loss": 0.0317, "step": 222950 }, { "epoch": 1.44, "learning_rate": 8.414452325784027e-05, "loss": 0.0255, "step": 222960 }, { "epoch": 1.44, "learning_rate": 8.413484190348333e-05, "loss": 0.0257, "step": 222970 }, { "epoch": 1.44, "learning_rate": 8.412516054912641e-05, "loss": 0.0279, "step": 222980 }, { "epoch": 1.44, "learning_rate": 8.411547919476948e-05, "loss": 0.0249, "step": 222990 }, { "epoch": 1.44, "learning_rate": 8.410579784041255e-05, "loss": 0.0261, "step": 223000 }, { "epoch": 1.44, "eval_cer": 0.9198445373404135, "eval_loss": 0.02085886336863041, "eval_runtime": 120.1768, "eval_samples_per_second": 16.642, "eval_steps_per_second": 4.161, "step": 223000 }, { "epoch": 1.44, "learning_rate": 8.409611648605561e-05, "loss": 0.0336, "step": 223010 }, { "epoch": 1.44, "learning_rate": 8.408643513169869e-05, "loss": 0.0425, "step": 223020 }, { "epoch": 1.44, "learning_rate": 8.407675377734175e-05, "loss": 0.0325, "step": 223030 }, { "epoch": 1.44, "learning_rate": 8.406707242298481e-05, "loss": 0.0303, "step": 223040 }, { "epoch": 1.44, "learning_rate": 8.405739106862789e-05, "loss": 0.0317, "step": 223050 }, { "epoch": 1.44, "learning_rate": 8.404770971427096e-05, "loss": 0.0246, "step": 223060 }, { "epoch": 1.44, "learning_rate": 8.403802835991401e-05, "loss": 0.0294, "step": 223070 }, { "epoch": 1.44, "learning_rate": 8.402834700555709e-05, "loss": 0.0238, "step": 223080 }, { "epoch": 1.44, "learning_rate": 8.401866565120016e-05, "loss": 0.0277, "step": 223090 }, { "epoch": 1.44, "learning_rate": 8.400898429684322e-05, "loss": 0.0318, "step": 223100 }, { "epoch": 1.44, "learning_rate": 8.399930294248629e-05, "loss": 0.0278, "step": 223110 }, { "epoch": 1.44, "learning_rate": 8.398962158812937e-05, "loss": 0.0319, "step": 223120 }, { "epoch": 1.44, "learning_rate": 8.397994023377243e-05, "loss": 0.0304, "step": 223130 }, { "epoch": 1.44, "learning_rate": 8.397025887941549e-05, "loss": 0.0342, "step": 223140 }, { "epoch": 1.44, "learning_rate": 8.396057752505857e-05, "loss": 0.0323, "step": 223150 }, { "epoch": 1.44, "learning_rate": 8.395089617070163e-05, "loss": 0.0353, "step": 223160 }, { "epoch": 1.44, "learning_rate": 8.394121481634469e-05, "loss": 0.0292, "step": 223170 }, { "epoch": 1.44, "learning_rate": 8.393153346198777e-05, "loss": 0.0292, "step": 223180 }, { "epoch": 1.44, "learning_rate": 8.392185210763083e-05, "loss": 0.0274, "step": 223190 }, { "epoch": 1.44, "learning_rate": 8.391217075327391e-05, "loss": 0.0222, "step": 223200 }, { "epoch": 1.44, "learning_rate": 8.390248939891696e-05, "loss": 0.0286, "step": 223210 }, { "epoch": 1.44, "learning_rate": 8.389280804456004e-05, "loss": 0.0288, "step": 223220 }, { "epoch": 1.44, "learning_rate": 8.388312669020311e-05, "loss": 0.0258, "step": 223230 }, { "epoch": 1.44, "learning_rate": 8.387344533584616e-05, "loss": 0.03, "step": 223240 }, { "epoch": 1.44, "learning_rate": 8.386376398148924e-05, "loss": 0.0321, "step": 223250 }, { "epoch": 1.44, "learning_rate": 8.385408262713231e-05, "loss": 0.0287, "step": 223260 }, { "epoch": 1.44, "learning_rate": 8.384440127277539e-05, "loss": 0.0269, "step": 223270 }, { "epoch": 1.44, "learning_rate": 8.383471991841844e-05, "loss": 0.0256, "step": 223280 }, { "epoch": 1.44, "learning_rate": 8.382503856406151e-05, "loss": 0.027, "step": 223290 }, { "epoch": 1.44, "learning_rate": 8.381535720970459e-05, "loss": 0.0301, "step": 223300 }, { "epoch": 1.44, "learning_rate": 8.380567585534764e-05, "loss": 0.0328, "step": 223310 }, { "epoch": 1.44, "learning_rate": 8.379599450099072e-05, "loss": 0.0314, "step": 223320 }, { "epoch": 1.44, "learning_rate": 8.378631314663379e-05, "loss": 0.0294, "step": 223330 }, { "epoch": 1.44, "learning_rate": 8.377663179227687e-05, "loss": 0.0324, "step": 223340 }, { "epoch": 1.44, "learning_rate": 8.376695043791992e-05, "loss": 0.0297, "step": 223350 }, { "epoch": 1.44, "learning_rate": 8.375726908356299e-05, "loss": 0.0356, "step": 223360 }, { "epoch": 1.44, "learning_rate": 8.374758772920607e-05, "loss": 0.0267, "step": 223370 }, { "epoch": 1.44, "learning_rate": 8.373790637484912e-05, "loss": 0.0261, "step": 223380 }, { "epoch": 1.44, "learning_rate": 8.372822502049218e-05, "loss": 0.028, "step": 223390 }, { "epoch": 1.44, "learning_rate": 8.371854366613526e-05, "loss": 0.0281, "step": 223400 }, { "epoch": 1.44, "learning_rate": 8.370886231177833e-05, "loss": 0.0249, "step": 223410 }, { "epoch": 1.44, "learning_rate": 8.36991809574214e-05, "loss": 0.0242, "step": 223420 }, { "epoch": 1.44, "learning_rate": 8.368949960306446e-05, "loss": 0.025, "step": 223430 }, { "epoch": 1.44, "learning_rate": 8.367981824870754e-05, "loss": 0.0308, "step": 223440 }, { "epoch": 1.44, "learning_rate": 8.36701368943506e-05, "loss": 0.0286, "step": 223450 }, { "epoch": 1.44, "learning_rate": 8.366045553999366e-05, "loss": 0.0286, "step": 223460 }, { "epoch": 1.44, "learning_rate": 8.365077418563674e-05, "loss": 0.0295, "step": 223470 }, { "epoch": 1.44, "learning_rate": 8.364109283127981e-05, "loss": 0.0247, "step": 223480 }, { "epoch": 1.44, "learning_rate": 8.363141147692286e-05, "loss": 0.0277, "step": 223490 }, { "epoch": 1.44, "learning_rate": 8.362173012256594e-05, "loss": 0.0304, "step": 223500 }, { "epoch": 1.44, "learning_rate": 8.3612048768209e-05, "loss": 0.0274, "step": 223510 }, { "epoch": 1.44, "learning_rate": 8.360236741385207e-05, "loss": 0.034, "step": 223520 }, { "epoch": 1.44, "learning_rate": 8.359268605949514e-05, "loss": 0.0327, "step": 223530 }, { "epoch": 1.44, "learning_rate": 8.358300470513822e-05, "loss": 0.025, "step": 223540 }, { "epoch": 1.44, "learning_rate": 8.357332335078128e-05, "loss": 0.0289, "step": 223550 }, { "epoch": 1.44, "learning_rate": 8.356364199642434e-05, "loss": 0.0269, "step": 223560 }, { "epoch": 1.44, "learning_rate": 8.355396064206742e-05, "loss": 0.03, "step": 223570 }, { "epoch": 1.44, "learning_rate": 8.354427928771048e-05, "loss": 0.0283, "step": 223580 }, { "epoch": 1.44, "learning_rate": 8.353459793335354e-05, "loss": 0.0247, "step": 223590 }, { "epoch": 1.44, "learning_rate": 8.352491657899662e-05, "loss": 0.0277, "step": 223600 }, { "epoch": 1.44, "learning_rate": 8.351523522463968e-05, "loss": 0.0301, "step": 223610 }, { "epoch": 1.44, "learning_rate": 8.350555387028276e-05, "loss": 0.0265, "step": 223620 }, { "epoch": 1.44, "learning_rate": 8.349587251592581e-05, "loss": 0.0269, "step": 223630 }, { "epoch": 1.44, "learning_rate": 8.34861911615689e-05, "loss": 0.0293, "step": 223640 }, { "epoch": 1.44, "learning_rate": 8.347650980721196e-05, "loss": 0.0273, "step": 223650 }, { "epoch": 1.44, "learning_rate": 8.346682845285501e-05, "loss": 0.0258, "step": 223660 }, { "epoch": 1.44, "learning_rate": 8.345714709849809e-05, "loss": 0.0305, "step": 223670 }, { "epoch": 1.44, "learning_rate": 8.344746574414116e-05, "loss": 0.0326, "step": 223680 }, { "epoch": 1.44, "learning_rate": 8.343778438978424e-05, "loss": 0.0307, "step": 223690 }, { "epoch": 1.44, "learning_rate": 8.342810303542729e-05, "loss": 0.0311, "step": 223700 }, { "epoch": 1.44, "learning_rate": 8.341842168107036e-05, "loss": 0.0311, "step": 223710 }, { "epoch": 1.44, "learning_rate": 8.340874032671344e-05, "loss": 0.0349, "step": 223720 }, { "epoch": 1.44, "learning_rate": 8.339905897235649e-05, "loss": 0.037, "step": 223730 }, { "epoch": 1.44, "learning_rate": 8.338937761799957e-05, "loss": 0.0314, "step": 223740 }, { "epoch": 1.44, "learning_rate": 8.337969626364264e-05, "loss": 0.0294, "step": 223750 }, { "epoch": 1.44, "learning_rate": 8.33700149092857e-05, "loss": 0.0258, "step": 223760 }, { "epoch": 1.44, "learning_rate": 8.336033355492877e-05, "loss": 0.0266, "step": 223770 }, { "epoch": 1.44, "learning_rate": 8.335065220057184e-05, "loss": 0.0298, "step": 223780 }, { "epoch": 1.44, "learning_rate": 8.334097084621492e-05, "loss": 0.0278, "step": 223790 }, { "epoch": 1.44, "learning_rate": 8.333128949185797e-05, "loss": 0.0256, "step": 223800 }, { "epoch": 1.44, "learning_rate": 8.332160813750103e-05, "loss": 0.0259, "step": 223810 }, { "epoch": 1.44, "learning_rate": 8.331192678314411e-05, "loss": 0.0219, "step": 223820 }, { "epoch": 1.44, "learning_rate": 8.330224542878718e-05, "loss": 0.0293, "step": 223830 }, { "epoch": 1.44, "learning_rate": 8.329256407443025e-05, "loss": 0.0303, "step": 223840 }, { "epoch": 1.44, "learning_rate": 8.328288272007331e-05, "loss": 0.023, "step": 223850 }, { "epoch": 1.44, "learning_rate": 8.327320136571638e-05, "loss": 0.0293, "step": 223860 }, { "epoch": 1.44, "learning_rate": 8.326352001135945e-05, "loss": 0.0324, "step": 223870 }, { "epoch": 1.44, "learning_rate": 8.325383865700251e-05, "loss": 0.0255, "step": 223880 }, { "epoch": 1.45, "learning_rate": 8.324415730264559e-05, "loss": 0.0313, "step": 223890 }, { "epoch": 1.45, "learning_rate": 8.323447594828866e-05, "loss": 0.0269, "step": 223900 }, { "epoch": 1.45, "learning_rate": 8.322479459393171e-05, "loss": 0.0277, "step": 223910 }, { "epoch": 1.45, "learning_rate": 8.321511323957479e-05, "loss": 0.0267, "step": 223920 }, { "epoch": 1.45, "learning_rate": 8.320543188521786e-05, "loss": 0.0264, "step": 223930 }, { "epoch": 1.45, "learning_rate": 8.319575053086092e-05, "loss": 0.032, "step": 223940 }, { "epoch": 1.45, "learning_rate": 8.318606917650399e-05, "loss": 0.0338, "step": 223950 }, { "epoch": 1.45, "learning_rate": 8.317638782214705e-05, "loss": 0.0267, "step": 223960 }, { "epoch": 1.45, "learning_rate": 8.316670646779013e-05, "loss": 0.0253, "step": 223970 }, { "epoch": 1.45, "learning_rate": 8.315702511343319e-05, "loss": 0.0233, "step": 223980 }, { "epoch": 1.45, "learning_rate": 8.314734375907627e-05, "loss": 0.0293, "step": 223990 }, { "epoch": 1.45, "learning_rate": 8.313766240471933e-05, "loss": 0.0274, "step": 224000 }, { "epoch": 1.45, "eval_cer": 0.9198824991526381, "eval_loss": 0.020434506237506866, "eval_runtime": 120.0541, "eval_samples_per_second": 16.659, "eval_steps_per_second": 4.165, "step": 224000 }, { "epoch": 1.45, "learning_rate": 8.312798105036239e-05, "loss": 0.0298, "step": 224010 }, { "epoch": 1.45, "learning_rate": 8.311829969600547e-05, "loss": 0.0326, "step": 224020 }, { "epoch": 1.45, "learning_rate": 8.310861834164853e-05, "loss": 0.0247, "step": 224030 }, { "epoch": 1.45, "learning_rate": 8.309893698729161e-05, "loss": 0.0236, "step": 224040 }, { "epoch": 1.45, "learning_rate": 8.308925563293466e-05, "loss": 0.0275, "step": 224050 }, { "epoch": 1.45, "learning_rate": 8.307957427857773e-05, "loss": 0.0272, "step": 224060 }, { "epoch": 1.45, "learning_rate": 8.306989292422081e-05, "loss": 0.0317, "step": 224070 }, { "epoch": 1.45, "learning_rate": 8.306021156986386e-05, "loss": 0.0269, "step": 224080 }, { "epoch": 1.45, "learning_rate": 8.305053021550694e-05, "loss": 0.0259, "step": 224090 }, { "epoch": 1.45, "learning_rate": 8.304084886115001e-05, "loss": 0.0292, "step": 224100 }, { "epoch": 1.45, "learning_rate": 8.303116750679309e-05, "loss": 0.0287, "step": 224110 }, { "epoch": 1.45, "learning_rate": 8.302148615243614e-05, "loss": 0.0272, "step": 224120 }, { "epoch": 1.45, "learning_rate": 8.301180479807921e-05, "loss": 0.0265, "step": 224130 }, { "epoch": 1.45, "learning_rate": 8.300212344372229e-05, "loss": 0.0259, "step": 224140 }, { "epoch": 1.45, "learning_rate": 8.299244208936534e-05, "loss": 0.0261, "step": 224150 }, { "epoch": 1.45, "learning_rate": 8.298276073500842e-05, "loss": 0.0303, "step": 224160 }, { "epoch": 1.45, "learning_rate": 8.297307938065149e-05, "loss": 0.0248, "step": 224170 }, { "epoch": 1.45, "learning_rate": 8.296339802629455e-05, "loss": 0.0288, "step": 224180 }, { "epoch": 1.45, "learning_rate": 8.295371667193762e-05, "loss": 0.0311, "step": 224190 }, { "epoch": 1.45, "learning_rate": 8.294403531758069e-05, "loss": 0.0362, "step": 224200 }, { "epoch": 1.45, "learning_rate": 8.293435396322376e-05, "loss": 0.0229, "step": 224210 }, { "epoch": 1.45, "learning_rate": 8.292467260886682e-05, "loss": 0.0284, "step": 224220 }, { "epoch": 1.45, "learning_rate": 8.291499125450988e-05, "loss": 0.0306, "step": 224230 }, { "epoch": 1.45, "learning_rate": 8.290530990015296e-05, "loss": 0.0308, "step": 224240 }, { "epoch": 1.45, "learning_rate": 8.289562854579603e-05, "loss": 0.0279, "step": 224250 }, { "epoch": 1.45, "learning_rate": 8.28859471914391e-05, "loss": 0.0259, "step": 224260 }, { "epoch": 1.45, "learning_rate": 8.287626583708216e-05, "loss": 0.0275, "step": 224270 }, { "epoch": 1.45, "learning_rate": 8.286658448272523e-05, "loss": 0.0255, "step": 224280 }, { "epoch": 1.45, "learning_rate": 8.28569031283683e-05, "loss": 0.0299, "step": 224290 }, { "epoch": 1.45, "learning_rate": 8.284722177401136e-05, "loss": 0.027, "step": 224300 }, { "epoch": 1.45, "learning_rate": 8.283754041965444e-05, "loss": 0.0232, "step": 224310 }, { "epoch": 1.45, "learning_rate": 8.282785906529751e-05, "loss": 0.0271, "step": 224320 }, { "epoch": 1.45, "learning_rate": 8.281817771094056e-05, "loss": 0.0258, "step": 224330 }, { "epoch": 1.45, "learning_rate": 8.280849635658364e-05, "loss": 0.0253, "step": 224340 }, { "epoch": 1.45, "learning_rate": 8.27988150022267e-05, "loss": 0.0235, "step": 224350 }, { "epoch": 1.45, "learning_rate": 8.278913364786977e-05, "loss": 0.0303, "step": 224360 }, { "epoch": 1.45, "learning_rate": 8.277945229351284e-05, "loss": 0.0285, "step": 224370 }, { "epoch": 1.45, "learning_rate": 8.27697709391559e-05, "loss": 0.0259, "step": 224380 }, { "epoch": 1.45, "learning_rate": 8.276008958479898e-05, "loss": 0.0265, "step": 224390 }, { "epoch": 1.45, "learning_rate": 8.275040823044204e-05, "loss": 0.0336, "step": 224400 }, { "epoch": 1.45, "learning_rate": 8.274072687608512e-05, "loss": 0.0244, "step": 224410 }, { "epoch": 1.45, "learning_rate": 8.273104552172818e-05, "loss": 0.025, "step": 224420 }, { "epoch": 1.45, "learning_rate": 8.272136416737124e-05, "loss": 0.0289, "step": 224430 }, { "epoch": 1.45, "learning_rate": 8.271168281301432e-05, "loss": 0.0275, "step": 224440 }, { "epoch": 1.45, "learning_rate": 8.270200145865738e-05, "loss": 0.034, "step": 224450 }, { "epoch": 1.45, "learning_rate": 8.269232010430046e-05, "loss": 0.0256, "step": 224460 }, { "epoch": 1.45, "learning_rate": 8.268263874994351e-05, "loss": 0.0304, "step": 224470 }, { "epoch": 1.45, "learning_rate": 8.267295739558658e-05, "loss": 0.0261, "step": 224480 }, { "epoch": 1.45, "learning_rate": 8.266327604122966e-05, "loss": 0.0293, "step": 224490 }, { "epoch": 1.45, "learning_rate": 8.265359468687271e-05, "loss": 0.0239, "step": 224500 }, { "epoch": 1.45, "learning_rate": 8.264391333251579e-05, "loss": 0.0282, "step": 224510 }, { "epoch": 1.45, "learning_rate": 8.263423197815886e-05, "loss": 0.0266, "step": 224520 }, { "epoch": 1.45, "learning_rate": 8.262455062380194e-05, "loss": 0.0244, "step": 224530 }, { "epoch": 1.45, "learning_rate": 8.261486926944499e-05, "loss": 0.0278, "step": 224540 }, { "epoch": 1.45, "learning_rate": 8.260518791508806e-05, "loss": 0.0288, "step": 224550 }, { "epoch": 1.45, "learning_rate": 8.259550656073114e-05, "loss": 0.0279, "step": 224560 }, { "epoch": 1.45, "learning_rate": 8.258582520637419e-05, "loss": 0.0262, "step": 224570 }, { "epoch": 1.45, "learning_rate": 8.257614385201726e-05, "loss": 0.0282, "step": 224580 }, { "epoch": 1.45, "learning_rate": 8.256646249766034e-05, "loss": 0.0235, "step": 224590 }, { "epoch": 1.45, "learning_rate": 8.25567811433034e-05, "loss": 0.0311, "step": 224600 }, { "epoch": 1.45, "learning_rate": 8.254709978894647e-05, "loss": 0.0302, "step": 224610 }, { "epoch": 1.45, "learning_rate": 8.253741843458953e-05, "loss": 0.0315, "step": 224620 }, { "epoch": 1.45, "learning_rate": 8.252773708023261e-05, "loss": 0.0292, "step": 224630 }, { "epoch": 1.45, "learning_rate": 8.251805572587567e-05, "loss": 0.0262, "step": 224640 }, { "epoch": 1.45, "learning_rate": 8.250837437151873e-05, "loss": 0.024, "step": 224650 }, { "epoch": 1.45, "learning_rate": 8.249869301716181e-05, "loss": 0.0242, "step": 224660 }, { "epoch": 1.45, "learning_rate": 8.248901166280488e-05, "loss": 0.0278, "step": 224670 }, { "epoch": 1.45, "learning_rate": 8.247933030844793e-05, "loss": 0.0242, "step": 224680 }, { "epoch": 1.45, "learning_rate": 8.246964895409101e-05, "loss": 0.0288, "step": 224690 }, { "epoch": 1.45, "learning_rate": 8.245996759973408e-05, "loss": 0.0318, "step": 224700 }, { "epoch": 1.45, "learning_rate": 8.245028624537714e-05, "loss": 0.0299, "step": 224710 }, { "epoch": 1.45, "learning_rate": 8.244060489102021e-05, "loss": 0.0253, "step": 224720 }, { "epoch": 1.45, "learning_rate": 8.243092353666329e-05, "loss": 0.025, "step": 224730 }, { "epoch": 1.45, "learning_rate": 8.242124218230636e-05, "loss": 0.0244, "step": 224740 }, { "epoch": 1.45, "learning_rate": 8.241156082794941e-05, "loss": 0.0337, "step": 224750 }, { "epoch": 1.45, "learning_rate": 8.240187947359249e-05, "loss": 0.0249, "step": 224760 }, { "epoch": 1.45, "learning_rate": 8.239219811923556e-05, "loss": 0.0259, "step": 224770 }, { "epoch": 1.45, "learning_rate": 8.238251676487861e-05, "loss": 0.0242, "step": 224780 }, { "epoch": 1.45, "learning_rate": 8.237283541052169e-05, "loss": 0.0329, "step": 224790 }, { "epoch": 1.45, "learning_rate": 8.236315405616475e-05, "loss": 0.0277, "step": 224800 }, { "epoch": 1.45, "learning_rate": 8.235347270180783e-05, "loss": 0.0291, "step": 224810 }, { "epoch": 1.45, "learning_rate": 8.234379134745089e-05, "loss": 0.0257, "step": 224820 }, { "epoch": 1.45, "learning_rate": 8.233410999309397e-05, "loss": 0.0265, "step": 224830 }, { "epoch": 1.45, "learning_rate": 8.232442863873703e-05, "loss": 0.0272, "step": 224840 }, { "epoch": 1.45, "learning_rate": 8.231474728438009e-05, "loss": 0.0256, "step": 224850 }, { "epoch": 1.45, "learning_rate": 8.230506593002317e-05, "loss": 0.0223, "step": 224860 }, { "epoch": 1.45, "learning_rate": 8.229538457566623e-05, "loss": 0.0301, "step": 224870 }, { "epoch": 1.45, "learning_rate": 8.228570322130931e-05, "loss": 0.028, "step": 224880 }, { "epoch": 1.45, "learning_rate": 8.227602186695236e-05, "loss": 0.025, "step": 224890 }, { "epoch": 1.45, "learning_rate": 8.226634051259543e-05, "loss": 0.0291, "step": 224900 }, { "epoch": 1.45, "learning_rate": 8.225665915823851e-05, "loss": 0.0304, "step": 224910 }, { "epoch": 1.45, "learning_rate": 8.224697780388156e-05, "loss": 0.0267, "step": 224920 }, { "epoch": 1.45, "learning_rate": 8.223729644952464e-05, "loss": 0.028, "step": 224930 }, { "epoch": 1.45, "learning_rate": 8.222761509516771e-05, "loss": 0.0282, "step": 224940 }, { "epoch": 1.45, "learning_rate": 8.221793374081079e-05, "loss": 0.0244, "step": 224950 }, { "epoch": 1.45, "learning_rate": 8.220825238645384e-05, "loss": 0.0295, "step": 224960 }, { "epoch": 1.45, "learning_rate": 8.219857103209691e-05, "loss": 0.0241, "step": 224970 }, { "epoch": 1.45, "learning_rate": 8.218888967773999e-05, "loss": 0.0317, "step": 224980 }, { "epoch": 1.45, "learning_rate": 8.217920832338304e-05, "loss": 0.0324, "step": 224990 }, { "epoch": 1.45, "learning_rate": 8.21695269690261e-05, "loss": 0.0343, "step": 225000 }, { "epoch": 1.45, "eval_cer": 0.9198978646480623, "eval_loss": 0.020093819126486778, "eval_runtime": 120.1806, "eval_samples_per_second": 16.642, "eval_steps_per_second": 4.16, "step": 225000 }, { "epoch": 1.45, "learning_rate": 8.215984561466919e-05, "loss": 0.0234, "step": 225010 }, { "epoch": 1.45, "learning_rate": 8.215016426031225e-05, "loss": 0.0293, "step": 225020 }, { "epoch": 1.45, "learning_rate": 8.214048290595532e-05, "loss": 0.0252, "step": 225030 }, { "epoch": 1.45, "learning_rate": 8.213080155159838e-05, "loss": 0.0238, "step": 225040 }, { "epoch": 1.45, "learning_rate": 8.212112019724146e-05, "loss": 0.0307, "step": 225050 }, { "epoch": 1.45, "learning_rate": 8.211143884288452e-05, "loss": 0.0236, "step": 225060 }, { "epoch": 1.45, "learning_rate": 8.210175748852758e-05, "loss": 0.0292, "step": 225070 }, { "epoch": 1.45, "learning_rate": 8.209207613417066e-05, "loss": 0.0343, "step": 225080 }, { "epoch": 1.45, "learning_rate": 8.208239477981373e-05, "loss": 0.0258, "step": 225090 }, { "epoch": 1.45, "learning_rate": 8.207271342545678e-05, "loss": 0.0315, "step": 225100 }, { "epoch": 1.45, "learning_rate": 8.206303207109986e-05, "loss": 0.0237, "step": 225110 }, { "epoch": 1.45, "learning_rate": 8.205335071674293e-05, "loss": 0.0277, "step": 225120 }, { "epoch": 1.45, "learning_rate": 8.2043669362386e-05, "loss": 0.0307, "step": 225130 }, { "epoch": 1.45, "learning_rate": 8.203398800802906e-05, "loss": 0.0369, "step": 225140 }, { "epoch": 1.45, "learning_rate": 8.202430665367214e-05, "loss": 0.0296, "step": 225150 }, { "epoch": 1.45, "learning_rate": 8.20146252993152e-05, "loss": 0.0264, "step": 225160 }, { "epoch": 1.45, "learning_rate": 8.200494394495826e-05, "loss": 0.0335, "step": 225170 }, { "epoch": 1.45, "learning_rate": 8.199526259060134e-05, "loss": 0.0266, "step": 225180 }, { "epoch": 1.45, "learning_rate": 8.19855812362444e-05, "loss": 0.0244, "step": 225190 }, { "epoch": 1.45, "learning_rate": 8.197589988188746e-05, "loss": 0.0269, "step": 225200 }, { "epoch": 1.45, "learning_rate": 8.196621852753054e-05, "loss": 0.0286, "step": 225210 }, { "epoch": 1.45, "learning_rate": 8.19565371731736e-05, "loss": 0.0302, "step": 225220 }, { "epoch": 1.45, "learning_rate": 8.194685581881668e-05, "loss": 0.025, "step": 225230 }, { "epoch": 1.45, "learning_rate": 8.193717446445974e-05, "loss": 0.0285, "step": 225240 }, { "epoch": 1.45, "learning_rate": 8.192749311010282e-05, "loss": 0.0256, "step": 225250 }, { "epoch": 1.45, "learning_rate": 8.191781175574588e-05, "loss": 0.0251, "step": 225260 }, { "epoch": 1.45, "learning_rate": 8.190813040138894e-05, "loss": 0.0306, "step": 225270 }, { "epoch": 1.45, "learning_rate": 8.189844904703202e-05, "loss": 0.0247, "step": 225280 }, { "epoch": 1.45, "learning_rate": 8.188876769267508e-05, "loss": 0.0276, "step": 225290 }, { "epoch": 1.45, "learning_rate": 8.187908633831816e-05, "loss": 0.0275, "step": 225300 }, { "epoch": 1.45, "learning_rate": 8.186940498396121e-05, "loss": 0.0234, "step": 225310 }, { "epoch": 1.45, "learning_rate": 8.185972362960428e-05, "loss": 0.0266, "step": 225320 }, { "epoch": 1.45, "learning_rate": 8.185004227524736e-05, "loss": 0.0324, "step": 225330 }, { "epoch": 1.45, "learning_rate": 8.184036092089041e-05, "loss": 0.0304, "step": 225340 }, { "epoch": 1.45, "learning_rate": 8.183067956653349e-05, "loss": 0.0304, "step": 225350 }, { "epoch": 1.45, "learning_rate": 8.182099821217656e-05, "loss": 0.0256, "step": 225360 }, { "epoch": 1.45, "learning_rate": 8.181131685781962e-05, "loss": 0.0346, "step": 225370 }, { "epoch": 1.45, "learning_rate": 8.180163550346269e-05, "loss": 0.0284, "step": 225380 }, { "epoch": 1.45, "learning_rate": 8.179195414910576e-05, "loss": 0.0318, "step": 225390 }, { "epoch": 1.45, "learning_rate": 8.178227279474884e-05, "loss": 0.0256, "step": 225400 }, { "epoch": 1.45, "learning_rate": 8.177259144039189e-05, "loss": 0.0279, "step": 225410 }, { "epoch": 1.45, "learning_rate": 8.176291008603496e-05, "loss": 0.0291, "step": 225420 }, { "epoch": 1.45, "learning_rate": 8.175322873167804e-05, "loss": 0.0315, "step": 225430 }, { "epoch": 1.46, "learning_rate": 8.17435473773211e-05, "loss": 0.0243, "step": 225440 }, { "epoch": 1.46, "learning_rate": 8.173386602296417e-05, "loss": 0.0256, "step": 225450 }, { "epoch": 1.46, "learning_rate": 8.172418466860723e-05, "loss": 0.0258, "step": 225460 }, { "epoch": 1.46, "learning_rate": 8.17145033142503e-05, "loss": 0.0311, "step": 225470 }, { "epoch": 1.46, "learning_rate": 8.170482195989337e-05, "loss": 0.025, "step": 225480 }, { "epoch": 1.46, "learning_rate": 8.169514060553643e-05, "loss": 0.0292, "step": 225490 }, { "epoch": 1.46, "learning_rate": 8.168545925117951e-05, "loss": 0.0296, "step": 225500 }, { "epoch": 1.46, "learning_rate": 8.167577789682258e-05, "loss": 0.0285, "step": 225510 }, { "epoch": 1.46, "learning_rate": 8.166609654246563e-05, "loss": 0.0277, "step": 225520 }, { "epoch": 1.46, "learning_rate": 8.165641518810871e-05, "loss": 0.0273, "step": 225530 }, { "epoch": 1.46, "learning_rate": 8.164673383375178e-05, "loss": 0.027, "step": 225540 }, { "epoch": 1.46, "learning_rate": 8.163705247939484e-05, "loss": 0.0311, "step": 225550 }, { "epoch": 1.46, "learning_rate": 8.162737112503791e-05, "loss": 0.0294, "step": 225560 }, { "epoch": 1.46, "learning_rate": 8.161768977068098e-05, "loss": 0.0271, "step": 225570 }, { "epoch": 1.46, "learning_rate": 8.160800841632404e-05, "loss": 0.0262, "step": 225580 }, { "epoch": 1.46, "learning_rate": 8.159832706196711e-05, "loss": 0.0302, "step": 225590 }, { "epoch": 1.46, "learning_rate": 8.158864570761019e-05, "loss": 0.0408, "step": 225600 }, { "epoch": 1.46, "learning_rate": 8.157896435325326e-05, "loss": 0.0296, "step": 225610 }, { "epoch": 1.46, "learning_rate": 8.156928299889631e-05, "loss": 0.0333, "step": 225620 }, { "epoch": 1.46, "learning_rate": 8.155960164453939e-05, "loss": 0.0235, "step": 225630 }, { "epoch": 1.46, "learning_rate": 8.154992029018245e-05, "loss": 0.0306, "step": 225640 }, { "epoch": 1.46, "learning_rate": 8.154023893582552e-05, "loss": 0.0304, "step": 225650 }, { "epoch": 1.46, "learning_rate": 8.153055758146859e-05, "loss": 0.0308, "step": 225660 }, { "epoch": 1.46, "learning_rate": 8.152087622711165e-05, "loss": 0.0248, "step": 225670 }, { "epoch": 1.46, "learning_rate": 8.151119487275473e-05, "loss": 0.026, "step": 225680 }, { "epoch": 1.46, "learning_rate": 8.150151351839779e-05, "loss": 0.0294, "step": 225690 }, { "epoch": 1.46, "learning_rate": 8.149183216404086e-05, "loss": 0.0287, "step": 225700 }, { "epoch": 1.46, "learning_rate": 8.148215080968393e-05, "loss": 0.0296, "step": 225710 }, { "epoch": 1.46, "learning_rate": 8.147246945532698e-05, "loss": 0.0244, "step": 225720 }, { "epoch": 1.46, "learning_rate": 8.146278810097006e-05, "loss": 0.0317, "step": 225730 }, { "epoch": 1.46, "learning_rate": 8.145310674661313e-05, "loss": 0.0283, "step": 225740 }, { "epoch": 1.46, "learning_rate": 8.144342539225621e-05, "loss": 0.0267, "step": 225750 }, { "epoch": 1.46, "learning_rate": 8.143374403789926e-05, "loss": 0.0297, "step": 225760 }, { "epoch": 1.46, "learning_rate": 8.142406268354233e-05, "loss": 0.0211, "step": 225770 }, { "epoch": 1.46, "learning_rate": 8.141438132918541e-05, "loss": 0.0262, "step": 225780 }, { "epoch": 1.46, "learning_rate": 8.140469997482846e-05, "loss": 0.0318, "step": 225790 }, { "epoch": 1.46, "learning_rate": 8.139501862047154e-05, "loss": 0.0278, "step": 225800 }, { "epoch": 1.46, "learning_rate": 8.138533726611461e-05, "loss": 0.032, "step": 225810 }, { "epoch": 1.46, "learning_rate": 8.137565591175769e-05, "loss": 0.027, "step": 225820 }, { "epoch": 1.46, "learning_rate": 8.136597455740074e-05, "loss": 0.0248, "step": 225830 }, { "epoch": 1.46, "learning_rate": 8.13562932030438e-05, "loss": 0.0275, "step": 225840 }, { "epoch": 1.46, "learning_rate": 8.134661184868689e-05, "loss": 0.0276, "step": 225850 }, { "epoch": 1.46, "learning_rate": 8.133693049432994e-05, "loss": 0.0294, "step": 225860 }, { "epoch": 1.46, "learning_rate": 8.1327249139973e-05, "loss": 0.0326, "step": 225870 }, { "epoch": 1.46, "learning_rate": 8.131756778561608e-05, "loss": 0.028, "step": 225880 }, { "epoch": 1.46, "learning_rate": 8.130788643125915e-05, "loss": 0.0254, "step": 225890 }, { "epoch": 1.46, "learning_rate": 8.129820507690222e-05, "loss": 0.0322, "step": 225900 }, { "epoch": 1.46, "learning_rate": 8.128852372254528e-05, "loss": 0.031, "step": 225910 }, { "epoch": 1.46, "learning_rate": 8.127884236818836e-05, "loss": 0.0284, "step": 225920 }, { "epoch": 1.46, "learning_rate": 8.126916101383142e-05, "loss": 0.028, "step": 225930 }, { "epoch": 1.46, "learning_rate": 8.125947965947448e-05, "loss": 0.0273, "step": 225940 }, { "epoch": 1.46, "learning_rate": 8.124979830511756e-05, "loss": 0.0267, "step": 225950 }, { "epoch": 1.46, "learning_rate": 8.124011695076063e-05, "loss": 0.0236, "step": 225960 }, { "epoch": 1.46, "learning_rate": 8.123043559640368e-05, "loss": 0.0285, "step": 225970 }, { "epoch": 1.46, "learning_rate": 8.122075424204676e-05, "loss": 0.0295, "step": 225980 }, { "epoch": 1.46, "learning_rate": 8.121107288768983e-05, "loss": 0.0289, "step": 225990 }, { "epoch": 1.46, "learning_rate": 8.120139153333289e-05, "loss": 0.0249, "step": 226000 }, { "epoch": 1.46, "eval_cer": 0.9199150378488307, "eval_loss": 0.020439114421606064, "eval_runtime": 120.1357, "eval_samples_per_second": 16.648, "eval_steps_per_second": 4.162, "step": 226000 }, { "epoch": 1.46, "learning_rate": 8.119171017897596e-05, "loss": 0.0261, "step": 226010 }, { "epoch": 1.46, "learning_rate": 8.118202882461904e-05, "loss": 0.0253, "step": 226020 }, { "epoch": 1.46, "learning_rate": 8.11723474702621e-05, "loss": 0.0216, "step": 226030 }, { "epoch": 1.46, "learning_rate": 8.116266611590516e-05, "loss": 0.0257, "step": 226040 }, { "epoch": 1.46, "learning_rate": 8.115298476154824e-05, "loss": 0.0288, "step": 226050 }, { "epoch": 1.46, "learning_rate": 8.11433034071913e-05, "loss": 0.0269, "step": 226060 }, { "epoch": 1.46, "learning_rate": 8.113362205283436e-05, "loss": 0.0255, "step": 226070 }, { "epoch": 1.46, "learning_rate": 8.112394069847744e-05, "loss": 0.0238, "step": 226080 }, { "epoch": 1.46, "learning_rate": 8.11142593441205e-05, "loss": 0.0347, "step": 226090 }, { "epoch": 1.46, "learning_rate": 8.110457798976358e-05, "loss": 0.0283, "step": 226100 }, { "epoch": 1.46, "learning_rate": 8.109489663540663e-05, "loss": 0.0235, "step": 226110 }, { "epoch": 1.46, "learning_rate": 8.108521528104971e-05, "loss": 0.0273, "step": 226120 }, { "epoch": 1.46, "learning_rate": 8.107553392669278e-05, "loss": 0.0323, "step": 226130 }, { "epoch": 1.46, "learning_rate": 8.106585257233583e-05, "loss": 0.0275, "step": 226140 }, { "epoch": 1.46, "learning_rate": 8.105617121797891e-05, "loss": 0.0293, "step": 226150 }, { "epoch": 1.46, "learning_rate": 8.104648986362198e-05, "loss": 0.0281, "step": 226160 }, { "epoch": 1.46, "learning_rate": 8.103680850926506e-05, "loss": 0.0252, "step": 226170 }, { "epoch": 1.46, "learning_rate": 8.102712715490811e-05, "loss": 0.0259, "step": 226180 }, { "epoch": 1.46, "learning_rate": 8.101744580055118e-05, "loss": 0.0294, "step": 226190 }, { "epoch": 1.46, "learning_rate": 8.100776444619426e-05, "loss": 0.0241, "step": 226200 }, { "epoch": 1.46, "learning_rate": 8.099808309183731e-05, "loss": 0.0253, "step": 226210 }, { "epoch": 1.46, "learning_rate": 8.098840173748039e-05, "loss": 0.0252, "step": 226220 }, { "epoch": 1.46, "learning_rate": 8.097872038312346e-05, "loss": 0.0292, "step": 226230 }, { "epoch": 1.46, "learning_rate": 8.096903902876654e-05, "loss": 0.0359, "step": 226240 }, { "epoch": 1.46, "learning_rate": 8.095935767440959e-05, "loss": 0.027, "step": 226250 }, { "epoch": 1.46, "learning_rate": 8.094967632005266e-05, "loss": 0.0284, "step": 226260 }, { "epoch": 1.46, "learning_rate": 8.093999496569574e-05, "loss": 0.0295, "step": 226270 }, { "epoch": 1.46, "learning_rate": 8.093031361133879e-05, "loss": 0.0221, "step": 226280 }, { "epoch": 1.46, "learning_rate": 8.092063225698185e-05, "loss": 0.0277, "step": 226290 }, { "epoch": 1.46, "learning_rate": 8.091095090262493e-05, "loss": 0.0269, "step": 226300 }, { "epoch": 1.46, "learning_rate": 8.0901269548268e-05, "loss": 0.0286, "step": 226310 }, { "epoch": 1.46, "learning_rate": 8.089158819391107e-05, "loss": 0.0327, "step": 226320 }, { "epoch": 1.46, "learning_rate": 8.088190683955413e-05, "loss": 0.0259, "step": 226330 }, { "epoch": 1.46, "learning_rate": 8.087222548519721e-05, "loss": 0.029, "step": 226340 }, { "epoch": 1.46, "learning_rate": 8.086254413084027e-05, "loss": 0.0301, "step": 226350 }, { "epoch": 1.46, "learning_rate": 8.085286277648333e-05, "loss": 0.0274, "step": 226360 }, { "epoch": 1.46, "learning_rate": 8.084318142212641e-05, "loss": 0.027, "step": 226370 }, { "epoch": 1.46, "learning_rate": 8.083350006776948e-05, "loss": 0.0303, "step": 226380 }, { "epoch": 1.46, "learning_rate": 8.082381871341253e-05, "loss": 0.0228, "step": 226390 }, { "epoch": 1.46, "learning_rate": 8.081413735905561e-05, "loss": 0.0247, "step": 226400 }, { "epoch": 1.46, "learning_rate": 8.080445600469868e-05, "loss": 0.0252, "step": 226410 }, { "epoch": 1.46, "learning_rate": 8.079477465034174e-05, "loss": 0.0307, "step": 226420 }, { "epoch": 1.46, "learning_rate": 8.078509329598481e-05, "loss": 0.0252, "step": 226430 }, { "epoch": 1.46, "learning_rate": 8.077541194162789e-05, "loss": 0.0299, "step": 226440 }, { "epoch": 1.46, "learning_rate": 8.076573058727095e-05, "loss": 0.0289, "step": 226450 }, { "epoch": 1.46, "learning_rate": 8.075604923291401e-05, "loss": 0.0325, "step": 226460 }, { "epoch": 1.46, "learning_rate": 8.074636787855709e-05, "loss": 0.0278, "step": 226470 }, { "epoch": 1.46, "learning_rate": 8.073668652420015e-05, "loss": 0.0277, "step": 226480 }, { "epoch": 1.46, "learning_rate": 8.07270051698432e-05, "loss": 0.0291, "step": 226490 }, { "epoch": 1.46, "learning_rate": 8.071732381548629e-05, "loss": 0.0248, "step": 226500 }, { "epoch": 1.46, "learning_rate": 8.070764246112935e-05, "loss": 0.0246, "step": 226510 }, { "epoch": 1.46, "learning_rate": 8.069796110677243e-05, "loss": 0.025, "step": 226520 }, { "epoch": 1.46, "learning_rate": 8.068827975241548e-05, "loss": 0.0271, "step": 226530 }, { "epoch": 1.46, "learning_rate": 8.067859839805856e-05, "loss": 0.0249, "step": 226540 }, { "epoch": 1.46, "learning_rate": 8.066891704370163e-05, "loss": 0.0291, "step": 226550 }, { "epoch": 1.46, "learning_rate": 8.065923568934468e-05, "loss": 0.0335, "step": 226560 }, { "epoch": 1.46, "learning_rate": 8.064955433498776e-05, "loss": 0.0346, "step": 226570 }, { "epoch": 1.46, "learning_rate": 8.063987298063083e-05, "loss": 0.0291, "step": 226580 }, { "epoch": 1.46, "learning_rate": 8.063019162627391e-05, "loss": 0.0283, "step": 226590 }, { "epoch": 1.46, "learning_rate": 8.062051027191696e-05, "loss": 0.0274, "step": 226600 }, { "epoch": 1.46, "learning_rate": 8.061082891756003e-05, "loss": 0.0314, "step": 226610 }, { "epoch": 1.46, "learning_rate": 8.060114756320311e-05, "loss": 0.0264, "step": 226620 }, { "epoch": 1.46, "learning_rate": 8.059146620884616e-05, "loss": 0.0256, "step": 226630 }, { "epoch": 1.46, "learning_rate": 8.058178485448924e-05, "loss": 0.0286, "step": 226640 }, { "epoch": 1.46, "learning_rate": 8.05721035001323e-05, "loss": 0.0332, "step": 226650 }, { "epoch": 1.46, "learning_rate": 8.056242214577537e-05, "loss": 0.0248, "step": 226660 }, { "epoch": 1.46, "learning_rate": 8.055274079141844e-05, "loss": 0.0268, "step": 226670 }, { "epoch": 1.46, "learning_rate": 8.05430594370615e-05, "loss": 0.0302, "step": 226680 }, { "epoch": 1.46, "learning_rate": 8.053337808270459e-05, "loss": 0.0301, "step": 226690 }, { "epoch": 1.46, "learning_rate": 8.052369672834764e-05, "loss": 0.0272, "step": 226700 }, { "epoch": 1.46, "learning_rate": 8.05140153739907e-05, "loss": 0.0287, "step": 226710 }, { "epoch": 1.46, "learning_rate": 8.050433401963378e-05, "loss": 0.0286, "step": 226720 }, { "epoch": 1.46, "learning_rate": 8.049465266527685e-05, "loss": 0.0269, "step": 226730 }, { "epoch": 1.46, "learning_rate": 8.048497131091992e-05, "loss": 0.0301, "step": 226740 }, { "epoch": 1.46, "learning_rate": 8.047528995656298e-05, "loss": 0.0264, "step": 226750 }, { "epoch": 1.46, "learning_rate": 8.046560860220605e-05, "loss": 0.0268, "step": 226760 }, { "epoch": 1.46, "learning_rate": 8.045592724784912e-05, "loss": 0.0305, "step": 226770 }, { "epoch": 1.46, "learning_rate": 8.044624589349218e-05, "loss": 0.0272, "step": 226780 }, { "epoch": 1.46, "learning_rate": 8.043656453913526e-05, "loss": 0.0342, "step": 226790 }, { "epoch": 1.46, "learning_rate": 8.042688318477833e-05, "loss": 0.0348, "step": 226800 }, { "epoch": 1.46, "learning_rate": 8.041720183042138e-05, "loss": 0.0329, "step": 226810 }, { "epoch": 1.46, "learning_rate": 8.040752047606446e-05, "loss": 0.0268, "step": 226820 }, { "epoch": 1.46, "learning_rate": 8.039783912170753e-05, "loss": 0.0353, "step": 226830 }, { "epoch": 1.46, "learning_rate": 8.038815776735059e-05, "loss": 0.0332, "step": 226840 }, { "epoch": 1.46, "learning_rate": 8.037847641299366e-05, "loss": 0.0321, "step": 226850 }, { "epoch": 1.46, "learning_rate": 8.036879505863672e-05, "loss": 0.0322, "step": 226860 }, { "epoch": 1.46, "learning_rate": 8.03591137042798e-05, "loss": 0.0318, "step": 226870 }, { "epoch": 1.46, "learning_rate": 8.034943234992286e-05, "loss": 0.0269, "step": 226880 }, { "epoch": 1.46, "learning_rate": 8.033975099556594e-05, "loss": 0.0285, "step": 226890 }, { "epoch": 1.46, "learning_rate": 8.0330069641209e-05, "loss": 0.0348, "step": 226900 }, { "epoch": 1.46, "learning_rate": 8.032038828685206e-05, "loss": 0.0239, "step": 226910 }, { "epoch": 1.46, "learning_rate": 8.031070693249514e-05, "loss": 0.0294, "step": 226920 }, { "epoch": 1.46, "learning_rate": 8.03010255781382e-05, "loss": 0.0244, "step": 226930 }, { "epoch": 1.46, "learning_rate": 8.029134422378128e-05, "loss": 0.0299, "step": 226940 }, { "epoch": 1.46, "learning_rate": 8.028166286942433e-05, "loss": 0.0252, "step": 226950 }, { "epoch": 1.46, "learning_rate": 8.02719815150674e-05, "loss": 0.0246, "step": 226960 }, { "epoch": 1.46, "learning_rate": 8.026230016071048e-05, "loss": 0.0277, "step": 226970 }, { "epoch": 1.46, "learning_rate": 8.025261880635353e-05, "loss": 0.0298, "step": 226980 }, { "epoch": 1.47, "learning_rate": 8.024293745199661e-05, "loss": 0.0316, "step": 226990 }, { "epoch": 1.47, "learning_rate": 8.023325609763968e-05, "loss": 0.0267, "step": 227000 }, { "epoch": 1.47, "eval_cer": 0.9199240763755507, "eval_loss": 0.020223721861839294, "eval_runtime": 120.1186, "eval_samples_per_second": 16.65, "eval_steps_per_second": 4.163, "step": 227000 }, { "epoch": 1.47, "learning_rate": 8.022357474328276e-05, "loss": 0.0293, "step": 227010 }, { "epoch": 1.47, "learning_rate": 8.021389338892581e-05, "loss": 0.0351, "step": 227020 }, { "epoch": 1.47, "learning_rate": 8.020421203456888e-05, "loss": 0.0342, "step": 227030 }, { "epoch": 1.47, "learning_rate": 8.019453068021196e-05, "loss": 0.0375, "step": 227040 }, { "epoch": 1.47, "learning_rate": 8.018484932585501e-05, "loss": 0.0237, "step": 227050 }, { "epoch": 1.47, "learning_rate": 8.017516797149808e-05, "loss": 0.0317, "step": 227060 }, { "epoch": 1.47, "learning_rate": 8.016548661714116e-05, "loss": 0.0276, "step": 227070 }, { "epoch": 1.47, "learning_rate": 8.015580526278422e-05, "loss": 0.0258, "step": 227080 }, { "epoch": 1.47, "learning_rate": 8.014612390842729e-05, "loss": 0.0287, "step": 227090 }, { "epoch": 1.47, "learning_rate": 8.013644255407036e-05, "loss": 0.0214, "step": 227100 }, { "epoch": 1.47, "learning_rate": 8.012676119971344e-05, "loss": 0.0253, "step": 227110 }, { "epoch": 1.47, "learning_rate": 8.011707984535649e-05, "loss": 0.0298, "step": 227120 }, { "epoch": 1.47, "learning_rate": 8.010739849099955e-05, "loss": 0.0258, "step": 227130 }, { "epoch": 1.47, "learning_rate": 8.009771713664263e-05, "loss": 0.0337, "step": 227140 }, { "epoch": 1.47, "learning_rate": 8.00880357822857e-05, "loss": 0.0277, "step": 227150 }, { "epoch": 1.47, "learning_rate": 8.007835442792875e-05, "loss": 0.0291, "step": 227160 }, { "epoch": 1.47, "learning_rate": 8.006867307357183e-05, "loss": 0.0274, "step": 227170 }, { "epoch": 1.47, "learning_rate": 8.00589917192149e-05, "loss": 0.0289, "step": 227180 }, { "epoch": 1.47, "learning_rate": 8.004931036485796e-05, "loss": 0.0271, "step": 227190 }, { "epoch": 1.47, "learning_rate": 8.003962901050103e-05, "loss": 0.0287, "step": 227200 }, { "epoch": 1.47, "learning_rate": 8.002994765614411e-05, "loss": 0.0262, "step": 227210 }, { "epoch": 1.47, "learning_rate": 8.002026630178718e-05, "loss": 0.0281, "step": 227220 }, { "epoch": 1.47, "learning_rate": 8.001058494743023e-05, "loss": 0.0254, "step": 227230 }, { "epoch": 1.47, "learning_rate": 8.000090359307331e-05, "loss": 0.0267, "step": 227240 }, { "epoch": 1.47, "learning_rate": 7.999122223871638e-05, "loss": 0.0283, "step": 227250 }, { "epoch": 1.47, "learning_rate": 7.998154088435943e-05, "loss": 0.026, "step": 227260 }, { "epoch": 1.47, "learning_rate": 7.997185953000251e-05, "loss": 0.0289, "step": 227270 }, { "epoch": 1.47, "learning_rate": 7.996217817564557e-05, "loss": 0.0308, "step": 227280 }, { "epoch": 1.47, "learning_rate": 7.995249682128865e-05, "loss": 0.0327, "step": 227290 }, { "epoch": 1.47, "learning_rate": 7.994281546693171e-05, "loss": 0.0269, "step": 227300 }, { "epoch": 1.47, "learning_rate": 7.993313411257479e-05, "loss": 0.0282, "step": 227310 }, { "epoch": 1.47, "learning_rate": 7.992345275821785e-05, "loss": 0.0253, "step": 227320 }, { "epoch": 1.47, "learning_rate": 7.99137714038609e-05, "loss": 0.0364, "step": 227330 }, { "epoch": 1.47, "learning_rate": 7.990409004950399e-05, "loss": 0.0239, "step": 227340 }, { "epoch": 1.47, "learning_rate": 7.989440869514705e-05, "loss": 0.0235, "step": 227350 }, { "epoch": 1.47, "learning_rate": 7.988472734079013e-05, "loss": 0.0241, "step": 227360 }, { "epoch": 1.47, "learning_rate": 7.987504598643318e-05, "loss": 0.0228, "step": 227370 }, { "epoch": 1.47, "learning_rate": 7.986536463207625e-05, "loss": 0.0338, "step": 227380 }, { "epoch": 1.47, "learning_rate": 7.985568327771933e-05, "loss": 0.0249, "step": 227390 }, { "epoch": 1.47, "learning_rate": 7.984600192336238e-05, "loss": 0.0321, "step": 227400 }, { "epoch": 1.47, "learning_rate": 7.983632056900546e-05, "loss": 0.0292, "step": 227410 }, { "epoch": 1.47, "learning_rate": 7.982663921464853e-05, "loss": 0.0323, "step": 227420 }, { "epoch": 1.47, "learning_rate": 7.981695786029161e-05, "loss": 0.0295, "step": 227430 }, { "epoch": 1.47, "learning_rate": 7.980727650593466e-05, "loss": 0.0289, "step": 227440 }, { "epoch": 1.47, "learning_rate": 7.979759515157773e-05, "loss": 0.0276, "step": 227450 }, { "epoch": 1.47, "learning_rate": 7.978791379722081e-05, "loss": 0.0268, "step": 227460 }, { "epoch": 1.47, "learning_rate": 7.977823244286386e-05, "loss": 0.0235, "step": 227470 }, { "epoch": 1.47, "learning_rate": 7.976855108850693e-05, "loss": 0.0294, "step": 227480 }, { "epoch": 1.47, "learning_rate": 7.975886973415e-05, "loss": 0.0268, "step": 227490 }, { "epoch": 1.47, "learning_rate": 7.974918837979307e-05, "loss": 0.0261, "step": 227500 }, { "epoch": 1.47, "learning_rate": 7.973950702543614e-05, "loss": 0.0298, "step": 227510 }, { "epoch": 1.47, "learning_rate": 7.97298256710792e-05, "loss": 0.0226, "step": 227520 }, { "epoch": 1.47, "learning_rate": 7.972014431672228e-05, "loss": 0.0301, "step": 227530 }, { "epoch": 1.47, "learning_rate": 7.971046296236534e-05, "loss": 0.0259, "step": 227540 }, { "epoch": 1.47, "learning_rate": 7.97007816080084e-05, "loss": 0.0275, "step": 227550 }, { "epoch": 1.47, "learning_rate": 7.969110025365148e-05, "loss": 0.0292, "step": 227560 }, { "epoch": 1.47, "learning_rate": 7.968141889929455e-05, "loss": 0.0312, "step": 227570 }, { "epoch": 1.47, "learning_rate": 7.96717375449376e-05, "loss": 0.0362, "step": 227580 }, { "epoch": 1.47, "learning_rate": 7.966205619058068e-05, "loss": 0.0274, "step": 227590 }, { "epoch": 1.47, "learning_rate": 7.965237483622375e-05, "loss": 0.0301, "step": 227600 }, { "epoch": 1.47, "learning_rate": 7.964269348186681e-05, "loss": 0.0242, "step": 227610 }, { "epoch": 1.47, "learning_rate": 7.963301212750988e-05, "loss": 0.0264, "step": 227620 }, { "epoch": 1.47, "learning_rate": 7.962333077315296e-05, "loss": 0.0286, "step": 227630 }, { "epoch": 1.47, "learning_rate": 7.961364941879603e-05, "loss": 0.0256, "step": 227640 }, { "epoch": 1.47, "learning_rate": 7.960396806443908e-05, "loss": 0.0244, "step": 227650 }, { "epoch": 1.47, "learning_rate": 7.959428671008216e-05, "loss": 0.0268, "step": 227660 }, { "epoch": 1.47, "learning_rate": 7.958460535572523e-05, "loss": 0.0325, "step": 227670 }, { "epoch": 1.47, "learning_rate": 7.957492400136828e-05, "loss": 0.0296, "step": 227680 }, { "epoch": 1.47, "learning_rate": 7.956524264701136e-05, "loss": 0.0314, "step": 227690 }, { "epoch": 1.47, "learning_rate": 7.955556129265442e-05, "loss": 0.0275, "step": 227700 }, { "epoch": 1.47, "learning_rate": 7.95458799382975e-05, "loss": 0.0312, "step": 227710 }, { "epoch": 1.47, "learning_rate": 7.953619858394056e-05, "loss": 0.0255, "step": 227720 }, { "epoch": 1.47, "learning_rate": 7.952651722958364e-05, "loss": 0.0299, "step": 227730 }, { "epoch": 1.47, "learning_rate": 7.95168358752267e-05, "loss": 0.0269, "step": 227740 }, { "epoch": 1.47, "learning_rate": 7.950715452086976e-05, "loss": 0.0331, "step": 227750 }, { "epoch": 1.47, "learning_rate": 7.949747316651284e-05, "loss": 0.0236, "step": 227760 }, { "epoch": 1.47, "learning_rate": 7.94877918121559e-05, "loss": 0.0301, "step": 227770 }, { "epoch": 1.47, "learning_rate": 7.947811045779898e-05, "loss": 0.0287, "step": 227780 }, { "epoch": 1.47, "learning_rate": 7.946842910344203e-05, "loss": 0.0252, "step": 227790 }, { "epoch": 1.47, "learning_rate": 7.94587477490851e-05, "loss": 0.0287, "step": 227800 }, { "epoch": 1.47, "learning_rate": 7.944906639472818e-05, "loss": 0.0269, "step": 227810 }, { "epoch": 1.47, "learning_rate": 7.943938504037123e-05, "loss": 0.0227, "step": 227820 }, { "epoch": 1.47, "learning_rate": 7.942970368601431e-05, "loss": 0.0306, "step": 227830 }, { "epoch": 1.47, "learning_rate": 7.942002233165738e-05, "loss": 0.0285, "step": 227840 }, { "epoch": 1.47, "learning_rate": 7.941034097730045e-05, "loss": 0.0285, "step": 227850 }, { "epoch": 1.47, "learning_rate": 7.940065962294351e-05, "loss": 0.0283, "step": 227860 }, { "epoch": 1.47, "learning_rate": 7.939097826858658e-05, "loss": 0.0283, "step": 227870 }, { "epoch": 1.47, "learning_rate": 7.938129691422966e-05, "loss": 0.0255, "step": 227880 }, { "epoch": 1.47, "learning_rate": 7.937161555987271e-05, "loss": 0.0319, "step": 227890 }, { "epoch": 1.47, "learning_rate": 7.936193420551578e-05, "loss": 0.0266, "step": 227900 }, { "epoch": 1.47, "learning_rate": 7.935225285115886e-05, "loss": 0.0279, "step": 227910 }, { "epoch": 1.47, "learning_rate": 7.934257149680192e-05, "loss": 0.0227, "step": 227920 }, { "epoch": 1.47, "learning_rate": 7.933289014244499e-05, "loss": 0.0304, "step": 227930 }, { "epoch": 1.47, "learning_rate": 7.932320878808805e-05, "loss": 0.0335, "step": 227940 }, { "epoch": 1.47, "learning_rate": 7.931352743373112e-05, "loss": 0.0252, "step": 227950 }, { "epoch": 1.47, "learning_rate": 7.930384607937419e-05, "loss": 0.0292, "step": 227960 }, { "epoch": 1.47, "learning_rate": 7.929416472501725e-05, "loss": 0.0236, "step": 227970 }, { "epoch": 1.47, "learning_rate": 7.928448337066033e-05, "loss": 0.0271, "step": 227980 }, { "epoch": 1.47, "learning_rate": 7.92748020163034e-05, "loss": 0.0315, "step": 227990 }, { "epoch": 1.47, "learning_rate": 7.926512066194645e-05, "loss": 0.0264, "step": 228000 }, { "epoch": 1.47, "eval_cer": 0.9198535758671337, "eval_loss": 0.020223427563905716, "eval_runtime": 119.9893, "eval_samples_per_second": 16.668, "eval_steps_per_second": 4.167, "step": 228000 }, { "epoch": 1.47, "learning_rate": 7.925543930758953e-05, "loss": 0.0268, "step": 228010 }, { "epoch": 1.47, "learning_rate": 7.92457579532326e-05, "loss": 0.0279, "step": 228020 }, { "epoch": 1.47, "learning_rate": 7.923607659887566e-05, "loss": 0.031, "step": 228030 }, { "epoch": 1.47, "learning_rate": 7.922639524451873e-05, "loss": 0.0301, "step": 228040 }, { "epoch": 1.47, "learning_rate": 7.92167138901618e-05, "loss": 0.0332, "step": 228050 }, { "epoch": 1.47, "learning_rate": 7.920703253580488e-05, "loss": 0.029, "step": 228060 }, { "epoch": 1.47, "learning_rate": 7.919735118144793e-05, "loss": 0.0369, "step": 228070 }, { "epoch": 1.47, "learning_rate": 7.918766982709101e-05, "loss": 0.0235, "step": 228080 }, { "epoch": 1.47, "learning_rate": 7.917798847273408e-05, "loss": 0.0306, "step": 228090 }, { "epoch": 1.47, "learning_rate": 7.916830711837713e-05, "loss": 0.0289, "step": 228100 }, { "epoch": 1.47, "learning_rate": 7.915862576402021e-05, "loss": 0.0275, "step": 228110 }, { "epoch": 1.47, "learning_rate": 7.914894440966327e-05, "loss": 0.0258, "step": 228120 }, { "epoch": 1.47, "learning_rate": 7.913926305530635e-05, "loss": 0.0264, "step": 228130 }, { "epoch": 1.47, "learning_rate": 7.91295817009494e-05, "loss": 0.0282, "step": 228140 }, { "epoch": 1.47, "learning_rate": 7.911990034659247e-05, "loss": 0.0304, "step": 228150 }, { "epoch": 1.47, "learning_rate": 7.911021899223555e-05, "loss": 0.0267, "step": 228160 }, { "epoch": 1.47, "learning_rate": 7.91005376378786e-05, "loss": 0.0287, "step": 228170 }, { "epoch": 1.47, "learning_rate": 7.909085628352169e-05, "loss": 0.03, "step": 228180 }, { "epoch": 1.47, "learning_rate": 7.908117492916475e-05, "loss": 0.0293, "step": 228190 }, { "epoch": 1.47, "learning_rate": 7.907149357480783e-05, "loss": 0.0274, "step": 228200 }, { "epoch": 1.47, "learning_rate": 7.906181222045088e-05, "loss": 0.0325, "step": 228210 }, { "epoch": 1.47, "learning_rate": 7.905213086609395e-05, "loss": 0.0246, "step": 228220 }, { "epoch": 1.47, "learning_rate": 7.904244951173703e-05, "loss": 0.0284, "step": 228230 }, { "epoch": 1.47, "learning_rate": 7.903276815738008e-05, "loss": 0.0245, "step": 228240 }, { "epoch": 1.47, "learning_rate": 7.902308680302315e-05, "loss": 0.0264, "step": 228250 }, { "epoch": 1.47, "learning_rate": 7.901340544866623e-05, "loss": 0.0239, "step": 228260 }, { "epoch": 1.47, "learning_rate": 7.90037240943093e-05, "loss": 0.0295, "step": 228270 }, { "epoch": 1.47, "learning_rate": 7.899404273995236e-05, "loss": 0.0242, "step": 228280 }, { "epoch": 1.47, "learning_rate": 7.898436138559543e-05, "loss": 0.0231, "step": 228290 }, { "epoch": 1.47, "learning_rate": 7.897468003123851e-05, "loss": 0.0276, "step": 228300 }, { "epoch": 1.47, "learning_rate": 7.896499867688156e-05, "loss": 0.0281, "step": 228310 }, { "epoch": 1.47, "learning_rate": 7.895531732252463e-05, "loss": 0.0217, "step": 228320 }, { "epoch": 1.47, "learning_rate": 7.89456359681677e-05, "loss": 0.0292, "step": 228330 }, { "epoch": 1.47, "learning_rate": 7.893595461381077e-05, "loss": 0.0242, "step": 228340 }, { "epoch": 1.47, "learning_rate": 7.892627325945382e-05, "loss": 0.0275, "step": 228350 }, { "epoch": 1.47, "learning_rate": 7.89165919050969e-05, "loss": 0.022, "step": 228360 }, { "epoch": 1.47, "learning_rate": 7.890691055073997e-05, "loss": 0.0265, "step": 228370 }, { "epoch": 1.47, "learning_rate": 7.889722919638304e-05, "loss": 0.0317, "step": 228380 }, { "epoch": 1.47, "learning_rate": 7.88875478420261e-05, "loss": 0.0251, "step": 228390 }, { "epoch": 1.47, "learning_rate": 7.887786648766918e-05, "loss": 0.0275, "step": 228400 }, { "epoch": 1.47, "learning_rate": 7.886818513331225e-05, "loss": 0.0285, "step": 228410 }, { "epoch": 1.47, "learning_rate": 7.88585037789553e-05, "loss": 0.0232, "step": 228420 }, { "epoch": 1.47, "learning_rate": 7.884882242459838e-05, "loss": 0.029, "step": 228430 }, { "epoch": 1.47, "learning_rate": 7.883914107024145e-05, "loss": 0.026, "step": 228440 }, { "epoch": 1.47, "learning_rate": 7.882945971588451e-05, "loss": 0.0251, "step": 228450 }, { "epoch": 1.47, "learning_rate": 7.881977836152758e-05, "loss": 0.0265, "step": 228460 }, { "epoch": 1.47, "learning_rate": 7.881009700717065e-05, "loss": 0.0258, "step": 228470 }, { "epoch": 1.47, "learning_rate": 7.880041565281373e-05, "loss": 0.0289, "step": 228480 }, { "epoch": 1.47, "learning_rate": 7.879073429845678e-05, "loss": 0.0329, "step": 228490 }, { "epoch": 1.47, "learning_rate": 7.878105294409986e-05, "loss": 0.0273, "step": 228500 }, { "epoch": 1.47, "learning_rate": 7.877137158974293e-05, "loss": 0.0301, "step": 228510 }, { "epoch": 1.47, "learning_rate": 7.876169023538598e-05, "loss": 0.0261, "step": 228520 }, { "epoch": 1.47, "learning_rate": 7.875200888102906e-05, "loss": 0.0264, "step": 228530 }, { "epoch": 1.48, "learning_rate": 7.874232752667212e-05, "loss": 0.026, "step": 228540 }, { "epoch": 1.48, "learning_rate": 7.87326461723152e-05, "loss": 0.0275, "step": 228550 }, { "epoch": 1.48, "learning_rate": 7.872296481795826e-05, "loss": 0.0295, "step": 228560 }, { "epoch": 1.48, "learning_rate": 7.871328346360132e-05, "loss": 0.0258, "step": 228570 }, { "epoch": 1.48, "learning_rate": 7.87036021092444e-05, "loss": 0.0284, "step": 228580 }, { "epoch": 1.48, "learning_rate": 7.869392075488746e-05, "loss": 0.024, "step": 228590 }, { "epoch": 1.48, "learning_rate": 7.868423940053054e-05, "loss": 0.0252, "step": 228600 }, { "epoch": 1.48, "learning_rate": 7.86745580461736e-05, "loss": 0.0299, "step": 228610 }, { "epoch": 1.48, "learning_rate": 7.866487669181668e-05, "loss": 0.0239, "step": 228620 }, { "epoch": 1.48, "learning_rate": 7.865519533745973e-05, "loss": 0.0266, "step": 228630 }, { "epoch": 1.48, "learning_rate": 7.86455139831028e-05, "loss": 0.0247, "step": 228640 }, { "epoch": 1.48, "learning_rate": 7.863583262874588e-05, "loss": 0.0285, "step": 228650 }, { "epoch": 1.48, "learning_rate": 7.862615127438893e-05, "loss": 0.0311, "step": 228660 }, { "epoch": 1.48, "learning_rate": 7.8616469920032e-05, "loss": 0.029, "step": 228670 }, { "epoch": 1.48, "learning_rate": 7.860678856567508e-05, "loss": 0.0292, "step": 228680 }, { "epoch": 1.48, "learning_rate": 7.859710721131814e-05, "loss": 0.0311, "step": 228690 }, { "epoch": 1.48, "learning_rate": 7.858742585696121e-05, "loss": 0.026, "step": 228700 }, { "epoch": 1.48, "learning_rate": 7.857774450260428e-05, "loss": 0.0304, "step": 228710 }, { "epoch": 1.48, "learning_rate": 7.856806314824736e-05, "loss": 0.0296, "step": 228720 }, { "epoch": 1.48, "learning_rate": 7.855838179389041e-05, "loss": 0.029, "step": 228730 }, { "epoch": 1.48, "learning_rate": 7.854870043953348e-05, "loss": 0.0288, "step": 228740 }, { "epoch": 1.48, "learning_rate": 7.853901908517656e-05, "loss": 0.0265, "step": 228750 }, { "epoch": 1.48, "learning_rate": 7.852933773081962e-05, "loss": 0.0255, "step": 228760 }, { "epoch": 1.48, "learning_rate": 7.851965637646267e-05, "loss": 0.0279, "step": 228770 }, { "epoch": 1.48, "learning_rate": 7.850997502210575e-05, "loss": 0.0314, "step": 228780 }, { "epoch": 1.48, "learning_rate": 7.850029366774882e-05, "loss": 0.0369, "step": 228790 }, { "epoch": 1.48, "learning_rate": 7.849061231339189e-05, "loss": 0.0284, "step": 228800 }, { "epoch": 1.48, "learning_rate": 7.848093095903495e-05, "loss": 0.0323, "step": 228810 }, { "epoch": 1.48, "learning_rate": 7.847124960467803e-05, "loss": 0.0302, "step": 228820 }, { "epoch": 1.48, "learning_rate": 7.84615682503211e-05, "loss": 0.0244, "step": 228830 }, { "epoch": 1.48, "learning_rate": 7.845188689596415e-05, "loss": 0.026, "step": 228840 }, { "epoch": 1.48, "learning_rate": 7.844220554160723e-05, "loss": 0.0281, "step": 228850 }, { "epoch": 1.48, "learning_rate": 7.84325241872503e-05, "loss": 0.0354, "step": 228860 }, { "epoch": 1.48, "learning_rate": 7.842284283289335e-05, "loss": 0.0344, "step": 228870 }, { "epoch": 1.48, "learning_rate": 7.841316147853643e-05, "loss": 0.0257, "step": 228880 }, { "epoch": 1.48, "learning_rate": 7.84034801241795e-05, "loss": 0.0365, "step": 228890 }, { "epoch": 1.48, "learning_rate": 7.839379876982258e-05, "loss": 0.0289, "step": 228900 }, { "epoch": 1.48, "learning_rate": 7.838411741546563e-05, "loss": 0.0287, "step": 228910 }, { "epoch": 1.48, "learning_rate": 7.837443606110871e-05, "loss": 0.0269, "step": 228920 }, { "epoch": 1.48, "learning_rate": 7.836475470675178e-05, "loss": 0.0244, "step": 228930 }, { "epoch": 1.48, "learning_rate": 7.835507335239483e-05, "loss": 0.027, "step": 228940 }, { "epoch": 1.48, "learning_rate": 7.834539199803791e-05, "loss": 0.0255, "step": 228950 }, { "epoch": 1.48, "learning_rate": 7.833571064368097e-05, "loss": 0.0246, "step": 228960 }, { "epoch": 1.48, "learning_rate": 7.832602928932403e-05, "loss": 0.0282, "step": 228970 }, { "epoch": 1.48, "learning_rate": 7.83163479349671e-05, "loss": 0.0264, "step": 228980 }, { "epoch": 1.48, "learning_rate": 7.830666658061017e-05, "loss": 0.0275, "step": 228990 }, { "epoch": 1.48, "learning_rate": 7.829698522625325e-05, "loss": 0.031, "step": 229000 }, { "epoch": 1.48, "eval_cer": 0.9198644220991978, "eval_loss": 0.020123105496168137, "eval_runtime": 120.4002, "eval_samples_per_second": 16.611, "eval_steps_per_second": 4.153, "step": 229000 }, { "epoch": 1.48, "learning_rate": 7.82873038718963e-05, "loss": 0.0289, "step": 229010 }, { "epoch": 1.48, "learning_rate": 7.827762251753938e-05, "loss": 0.0215, "step": 229020 }, { "epoch": 1.48, "learning_rate": 7.826794116318245e-05, "loss": 0.0274, "step": 229030 }, { "epoch": 1.48, "learning_rate": 7.82582598088255e-05, "loss": 0.0282, "step": 229040 }, { "epoch": 1.48, "learning_rate": 7.824857845446858e-05, "loss": 0.0269, "step": 229050 }, { "epoch": 1.48, "learning_rate": 7.823889710011165e-05, "loss": 0.0321, "step": 229060 }, { "epoch": 1.48, "learning_rate": 7.822921574575473e-05, "loss": 0.0245, "step": 229070 }, { "epoch": 1.48, "learning_rate": 7.821953439139778e-05, "loss": 0.0239, "step": 229080 }, { "epoch": 1.48, "learning_rate": 7.820985303704085e-05, "loss": 0.0281, "step": 229090 }, { "epoch": 1.48, "learning_rate": 7.820017168268393e-05, "loss": 0.0311, "step": 229100 }, { "epoch": 1.48, "learning_rate": 7.819049032832698e-05, "loss": 0.0245, "step": 229110 }, { "epoch": 1.48, "learning_rate": 7.818080897397006e-05, "loss": 0.0256, "step": 229120 }, { "epoch": 1.48, "learning_rate": 7.817112761961313e-05, "loss": 0.0281, "step": 229130 }, { "epoch": 1.48, "learning_rate": 7.816144626525621e-05, "loss": 0.0271, "step": 229140 }, { "epoch": 1.48, "learning_rate": 7.815176491089926e-05, "loss": 0.0332, "step": 229150 }, { "epoch": 1.48, "learning_rate": 7.814208355654233e-05, "loss": 0.0288, "step": 229160 }, { "epoch": 1.48, "learning_rate": 7.81324022021854e-05, "loss": 0.027, "step": 229170 }, { "epoch": 1.48, "learning_rate": 7.812272084782846e-05, "loss": 0.0263, "step": 229180 }, { "epoch": 1.48, "learning_rate": 7.811303949347152e-05, "loss": 0.0256, "step": 229190 }, { "epoch": 1.48, "learning_rate": 7.81033581391146e-05, "loss": 0.028, "step": 229200 }, { "epoch": 1.48, "learning_rate": 7.809367678475767e-05, "loss": 0.0336, "step": 229210 }, { "epoch": 1.48, "learning_rate": 7.808399543040074e-05, "loss": 0.0305, "step": 229220 }, { "epoch": 1.48, "learning_rate": 7.80743140760438e-05, "loss": 0.0285, "step": 229230 }, { "epoch": 1.48, "learning_rate": 7.806463272168688e-05, "loss": 0.0266, "step": 229240 }, { "epoch": 1.48, "learning_rate": 7.805495136732994e-05, "loss": 0.0282, "step": 229250 }, { "epoch": 1.48, "learning_rate": 7.8045270012973e-05, "loss": 0.0267, "step": 229260 }, { "epoch": 1.48, "learning_rate": 7.803558865861608e-05, "loss": 0.0287, "step": 229270 }, { "epoch": 1.48, "learning_rate": 7.802590730425915e-05, "loss": 0.0274, "step": 229280 }, { "epoch": 1.48, "learning_rate": 7.80162259499022e-05, "loss": 0.0259, "step": 229290 }, { "epoch": 1.48, "learning_rate": 7.800654459554528e-05, "loss": 0.0252, "step": 229300 }, { "epoch": 1.48, "learning_rate": 7.799686324118835e-05, "loss": 0.0227, "step": 229310 }, { "epoch": 1.48, "learning_rate": 7.798718188683141e-05, "loss": 0.0248, "step": 229320 }, { "epoch": 1.48, "learning_rate": 7.797750053247448e-05, "loss": 0.026, "step": 229330 }, { "epoch": 1.48, "learning_rate": 7.796781917811756e-05, "loss": 0.0253, "step": 229340 }, { "epoch": 1.48, "learning_rate": 7.795813782376062e-05, "loss": 0.0269, "step": 229350 }, { "epoch": 1.48, "learning_rate": 7.794845646940368e-05, "loss": 0.0241, "step": 229360 }, { "epoch": 1.48, "learning_rate": 7.793877511504676e-05, "loss": 0.0294, "step": 229370 }, { "epoch": 1.48, "learning_rate": 7.792909376068982e-05, "loss": 0.022, "step": 229380 }, { "epoch": 1.48, "learning_rate": 7.791941240633288e-05, "loss": 0.0276, "step": 229390 }, { "epoch": 1.48, "learning_rate": 7.790973105197596e-05, "loss": 0.0244, "step": 229400 }, { "epoch": 1.48, "learning_rate": 7.790004969761902e-05, "loss": 0.0258, "step": 229410 }, { "epoch": 1.48, "learning_rate": 7.78903683432621e-05, "loss": 0.0258, "step": 229420 }, { "epoch": 1.48, "learning_rate": 7.788068698890515e-05, "loss": 0.0285, "step": 229430 }, { "epoch": 1.48, "learning_rate": 7.787100563454823e-05, "loss": 0.0239, "step": 229440 }, { "epoch": 1.48, "learning_rate": 7.78613242801913e-05, "loss": 0.0297, "step": 229450 }, { "epoch": 1.48, "learning_rate": 7.785164292583435e-05, "loss": 0.0265, "step": 229460 }, { "epoch": 1.48, "learning_rate": 7.784196157147743e-05, "loss": 0.0235, "step": 229470 }, { "epoch": 1.48, "learning_rate": 7.78322802171205e-05, "loss": 0.0285, "step": 229480 }, { "epoch": 1.48, "learning_rate": 7.782259886276358e-05, "loss": 0.0273, "step": 229490 }, { "epoch": 1.48, "learning_rate": 7.781291750840663e-05, "loss": 0.0288, "step": 229500 }, { "epoch": 1.48, "learning_rate": 7.78032361540497e-05, "loss": 0.0247, "step": 229510 }, { "epoch": 1.48, "learning_rate": 7.779355479969278e-05, "loss": 0.0266, "step": 229520 }, { "epoch": 1.48, "learning_rate": 7.778387344533583e-05, "loss": 0.0239, "step": 229530 }, { "epoch": 1.48, "learning_rate": 7.777419209097891e-05, "loss": 0.0279, "step": 229540 }, { "epoch": 1.48, "learning_rate": 7.776451073662198e-05, "loss": 0.0285, "step": 229550 }, { "epoch": 1.48, "learning_rate": 7.775482938226504e-05, "loss": 0.0244, "step": 229560 }, { "epoch": 1.48, "learning_rate": 7.774514802790811e-05, "loss": 0.0278, "step": 229570 }, { "epoch": 1.48, "learning_rate": 7.773546667355118e-05, "loss": 0.0291, "step": 229580 }, { "epoch": 1.48, "learning_rate": 7.772578531919426e-05, "loss": 0.0254, "step": 229590 }, { "epoch": 1.48, "learning_rate": 7.771610396483731e-05, "loss": 0.0331, "step": 229600 }, { "epoch": 1.48, "learning_rate": 7.770642261048037e-05, "loss": 0.0272, "step": 229610 }, { "epoch": 1.48, "learning_rate": 7.769674125612345e-05, "loss": 0.0273, "step": 229620 }, { "epoch": 1.48, "learning_rate": 7.768705990176652e-05, "loss": 0.0264, "step": 229630 }, { "epoch": 1.48, "learning_rate": 7.767737854740959e-05, "loss": 0.0261, "step": 229640 }, { "epoch": 1.48, "learning_rate": 7.766769719305265e-05, "loss": 0.0248, "step": 229650 }, { "epoch": 1.48, "learning_rate": 7.765801583869572e-05, "loss": 0.0282, "step": 229660 }, { "epoch": 1.48, "learning_rate": 7.764833448433879e-05, "loss": 0.0252, "step": 229670 }, { "epoch": 1.48, "learning_rate": 7.763865312998185e-05, "loss": 0.0277, "step": 229680 }, { "epoch": 1.48, "learning_rate": 7.762897177562493e-05, "loss": 0.0307, "step": 229690 }, { "epoch": 1.48, "learning_rate": 7.7619290421268e-05, "loss": 0.026, "step": 229700 }, { "epoch": 1.48, "learning_rate": 7.760960906691105e-05, "loss": 0.0263, "step": 229710 }, { "epoch": 1.48, "learning_rate": 7.759992771255413e-05, "loss": 0.0278, "step": 229720 }, { "epoch": 1.48, "learning_rate": 7.75902463581972e-05, "loss": 0.0274, "step": 229730 }, { "epoch": 1.48, "learning_rate": 7.758056500384026e-05, "loss": 0.0256, "step": 229740 }, { "epoch": 1.48, "learning_rate": 7.757088364948333e-05, "loss": 0.0288, "step": 229750 }, { "epoch": 1.48, "learning_rate": 7.75612022951264e-05, "loss": 0.0252, "step": 229760 }, { "epoch": 1.48, "learning_rate": 7.755152094076947e-05, "loss": 0.0283, "step": 229770 }, { "epoch": 1.48, "learning_rate": 7.754183958641253e-05, "loss": 0.0241, "step": 229780 }, { "epoch": 1.48, "learning_rate": 7.753215823205561e-05, "loss": 0.0246, "step": 229790 }, { "epoch": 1.48, "learning_rate": 7.752247687769867e-05, "loss": 0.0262, "step": 229800 }, { "epoch": 1.48, "learning_rate": 7.751279552334173e-05, "loss": 0.0298, "step": 229810 }, { "epoch": 1.48, "learning_rate": 7.75031141689848e-05, "loss": 0.0279, "step": 229820 }, { "epoch": 1.48, "learning_rate": 7.749343281462787e-05, "loss": 0.0263, "step": 229830 }, { "epoch": 1.48, "learning_rate": 7.748375146027095e-05, "loss": 0.0296, "step": 229840 }, { "epoch": 1.48, "learning_rate": 7.7474070105914e-05, "loss": 0.0243, "step": 229850 }, { "epoch": 1.48, "learning_rate": 7.746438875155707e-05, "loss": 0.0302, "step": 229860 }, { "epoch": 1.48, "learning_rate": 7.745470739720015e-05, "loss": 0.0303, "step": 229870 }, { "epoch": 1.48, "learning_rate": 7.74450260428432e-05, "loss": 0.0286, "step": 229880 }, { "epoch": 1.48, "learning_rate": 7.743534468848628e-05, "loss": 0.0314, "step": 229890 }, { "epoch": 1.48, "learning_rate": 7.742566333412935e-05, "loss": 0.0299, "step": 229900 }, { "epoch": 1.48, "learning_rate": 7.741598197977243e-05, "loss": 0.0286, "step": 229910 }, { "epoch": 1.48, "learning_rate": 7.740630062541548e-05, "loss": 0.0274, "step": 229920 }, { "epoch": 1.48, "learning_rate": 7.739661927105855e-05, "loss": 0.0314, "step": 229930 }, { "epoch": 1.48, "learning_rate": 7.738693791670163e-05, "loss": 0.0245, "step": 229940 }, { "epoch": 1.48, "learning_rate": 7.737725656234468e-05, "loss": 0.0269, "step": 229950 }, { "epoch": 1.48, "learning_rate": 7.736757520798775e-05, "loss": 0.0443, "step": 229960 }, { "epoch": 1.48, "learning_rate": 7.735789385363083e-05, "loss": 0.0279, "step": 229970 }, { "epoch": 1.48, "learning_rate": 7.734821249927389e-05, "loss": 0.0248, "step": 229980 }, { "epoch": 1.48, "learning_rate": 7.733853114491696e-05, "loss": 0.0229, "step": 229990 }, { "epoch": 1.48, "learning_rate": 7.732884979056003e-05, "loss": 0.0273, "step": 230000 }, { "epoch": 1.48, "eval_cer": 0.919877979889278, "eval_loss": 0.019865069538354874, "eval_runtime": 119.8796, "eval_samples_per_second": 16.683, "eval_steps_per_second": 4.171, "step": 230000 }, { "epoch": 1.48, "learning_rate": 7.73191684362031e-05, "loss": 0.0266, "step": 230010 }, { "epoch": 1.48, "learning_rate": 7.730948708184616e-05, "loss": 0.0322, "step": 230020 }, { "epoch": 1.48, "learning_rate": 7.729980572748922e-05, "loss": 0.022, "step": 230030 }, { "epoch": 1.48, "learning_rate": 7.72901243731323e-05, "loss": 0.0286, "step": 230040 }, { "epoch": 1.48, "learning_rate": 7.728044301877537e-05, "loss": 0.0245, "step": 230050 }, { "epoch": 1.48, "learning_rate": 7.727076166441842e-05, "loss": 0.0246, "step": 230060 }, { "epoch": 1.48, "learning_rate": 7.72610803100615e-05, "loss": 0.0279, "step": 230070 }, { "epoch": 1.48, "learning_rate": 7.725139895570457e-05, "loss": 0.0257, "step": 230080 }, { "epoch": 1.49, "learning_rate": 7.724171760134764e-05, "loss": 0.0219, "step": 230090 }, { "epoch": 1.49, "learning_rate": 7.72320362469907e-05, "loss": 0.0322, "step": 230100 }, { "epoch": 1.49, "learning_rate": 7.722235489263378e-05, "loss": 0.0363, "step": 230110 }, { "epoch": 1.49, "learning_rate": 7.721267353827685e-05, "loss": 0.0275, "step": 230120 }, { "epoch": 1.49, "learning_rate": 7.72029921839199e-05, "loss": 0.0309, "step": 230130 }, { "epoch": 1.49, "learning_rate": 7.719331082956298e-05, "loss": 0.0301, "step": 230140 }, { "epoch": 1.49, "learning_rate": 7.718362947520605e-05, "loss": 0.0275, "step": 230150 }, { "epoch": 1.49, "learning_rate": 7.71739481208491e-05, "loss": 0.0232, "step": 230160 }, { "epoch": 1.49, "learning_rate": 7.716426676649218e-05, "loss": 0.0222, "step": 230170 }, { "epoch": 1.49, "learning_rate": 7.715458541213524e-05, "loss": 0.0367, "step": 230180 }, { "epoch": 1.49, "learning_rate": 7.714490405777832e-05, "loss": 0.0309, "step": 230190 }, { "epoch": 1.49, "learning_rate": 7.713522270342138e-05, "loss": 0.0256, "step": 230200 }, { "epoch": 1.49, "learning_rate": 7.712554134906446e-05, "loss": 0.0282, "step": 230210 }, { "epoch": 1.49, "learning_rate": 7.711585999470752e-05, "loss": 0.0278, "step": 230220 }, { "epoch": 1.49, "learning_rate": 7.710617864035058e-05, "loss": 0.0283, "step": 230230 }, { "epoch": 1.49, "learning_rate": 7.709649728599366e-05, "loss": 0.0286, "step": 230240 }, { "epoch": 1.49, "learning_rate": 7.708681593163672e-05, "loss": 0.0311, "step": 230250 }, { "epoch": 1.49, "learning_rate": 7.70771345772798e-05, "loss": 0.0292, "step": 230260 }, { "epoch": 1.49, "learning_rate": 7.706745322292285e-05, "loss": 0.0299, "step": 230270 }, { "epoch": 1.49, "learning_rate": 7.705777186856592e-05, "loss": 0.0255, "step": 230280 }, { "epoch": 1.49, "learning_rate": 7.7048090514209e-05, "loss": 0.0267, "step": 230290 }, { "epoch": 1.49, "learning_rate": 7.703840915985205e-05, "loss": 0.027, "step": 230300 }, { "epoch": 1.49, "learning_rate": 7.702872780549513e-05, "loss": 0.0234, "step": 230310 }, { "epoch": 1.49, "learning_rate": 7.70190464511382e-05, "loss": 0.031, "step": 230320 }, { "epoch": 1.49, "learning_rate": 7.700936509678128e-05, "loss": 0.0334, "step": 230330 }, { "epoch": 1.49, "learning_rate": 7.699968374242433e-05, "loss": 0.0383, "step": 230340 }, { "epoch": 1.49, "learning_rate": 7.69900023880674e-05, "loss": 0.0265, "step": 230350 }, { "epoch": 1.49, "learning_rate": 7.698032103371048e-05, "loss": 0.023, "step": 230360 }, { "epoch": 1.49, "learning_rate": 7.697063967935353e-05, "loss": 0.0293, "step": 230370 }, { "epoch": 1.49, "learning_rate": 7.69609583249966e-05, "loss": 0.0271, "step": 230380 }, { "epoch": 1.49, "learning_rate": 7.695127697063968e-05, "loss": 0.0273, "step": 230390 }, { "epoch": 1.49, "learning_rate": 7.694159561628274e-05, "loss": 0.0228, "step": 230400 }, { "epoch": 1.49, "learning_rate": 7.693191426192581e-05, "loss": 0.0278, "step": 230410 }, { "epoch": 1.49, "learning_rate": 7.692223290756888e-05, "loss": 0.0222, "step": 230420 }, { "epoch": 1.49, "learning_rate": 7.691255155321195e-05, "loss": 0.0261, "step": 230430 }, { "epoch": 1.49, "learning_rate": 7.690287019885501e-05, "loss": 0.0317, "step": 230440 }, { "epoch": 1.49, "learning_rate": 7.689318884449807e-05, "loss": 0.0254, "step": 230450 }, { "epoch": 1.49, "learning_rate": 7.688350749014115e-05, "loss": 0.0298, "step": 230460 }, { "epoch": 1.49, "learning_rate": 7.687382613578422e-05, "loss": 0.0261, "step": 230470 }, { "epoch": 1.49, "learning_rate": 7.686414478142727e-05, "loss": 0.0304, "step": 230480 }, { "epoch": 1.49, "learning_rate": 7.685446342707035e-05, "loss": 0.0351, "step": 230490 }, { "epoch": 1.49, "learning_rate": 7.684478207271342e-05, "loss": 0.0263, "step": 230500 }, { "epoch": 1.49, "learning_rate": 7.683510071835648e-05, "loss": 0.0272, "step": 230510 }, { "epoch": 1.49, "learning_rate": 7.682541936399955e-05, "loss": 0.0253, "step": 230520 }, { "epoch": 1.49, "learning_rate": 7.681573800964263e-05, "loss": 0.0235, "step": 230530 }, { "epoch": 1.49, "learning_rate": 7.68060566552857e-05, "loss": 0.0285, "step": 230540 }, { "epoch": 1.49, "learning_rate": 7.679637530092875e-05, "loss": 0.0253, "step": 230550 }, { "epoch": 1.49, "learning_rate": 7.678669394657183e-05, "loss": 0.0278, "step": 230560 }, { "epoch": 1.49, "learning_rate": 7.67770125922149e-05, "loss": 0.031, "step": 230570 }, { "epoch": 1.49, "learning_rate": 7.676733123785795e-05, "loss": 0.0276, "step": 230580 }, { "epoch": 1.49, "learning_rate": 7.675764988350103e-05, "loss": 0.0322, "step": 230590 }, { "epoch": 1.49, "learning_rate": 7.67479685291441e-05, "loss": 0.0277, "step": 230600 }, { "epoch": 1.49, "learning_rate": 7.673828717478717e-05, "loss": 0.0278, "step": 230610 }, { "epoch": 1.49, "learning_rate": 7.672860582043023e-05, "loss": 0.0331, "step": 230620 }, { "epoch": 1.49, "learning_rate": 7.671892446607331e-05, "loss": 0.0253, "step": 230630 }, { "epoch": 1.49, "learning_rate": 7.670924311171637e-05, "loss": 0.0291, "step": 230640 }, { "epoch": 1.49, "learning_rate": 7.669956175735943e-05, "loss": 0.0273, "step": 230650 }, { "epoch": 1.49, "learning_rate": 7.66898804030025e-05, "loss": 0.0331, "step": 230660 }, { "epoch": 1.49, "learning_rate": 7.668019904864557e-05, "loss": 0.0287, "step": 230670 }, { "epoch": 1.49, "learning_rate": 7.667051769428865e-05, "loss": 0.0264, "step": 230680 }, { "epoch": 1.49, "learning_rate": 7.66608363399317e-05, "loss": 0.0263, "step": 230690 }, { "epoch": 1.49, "learning_rate": 7.665115498557477e-05, "loss": 0.0363, "step": 230700 }, { "epoch": 1.49, "learning_rate": 7.664147363121785e-05, "loss": 0.0286, "step": 230710 }, { "epoch": 1.49, "learning_rate": 7.66317922768609e-05, "loss": 0.026, "step": 230720 }, { "epoch": 1.49, "learning_rate": 7.662211092250398e-05, "loss": 0.0281, "step": 230730 }, { "epoch": 1.49, "learning_rate": 7.661242956814705e-05, "loss": 0.0232, "step": 230740 }, { "epoch": 1.49, "learning_rate": 7.660274821379012e-05, "loss": 0.025, "step": 230750 }, { "epoch": 1.49, "learning_rate": 7.659306685943318e-05, "loss": 0.0214, "step": 230760 }, { "epoch": 1.49, "learning_rate": 7.658338550507625e-05, "loss": 0.0283, "step": 230770 }, { "epoch": 1.49, "learning_rate": 7.657370415071933e-05, "loss": 0.03, "step": 230780 }, { "epoch": 1.49, "learning_rate": 7.656402279636238e-05, "loss": 0.0277, "step": 230790 }, { "epoch": 1.49, "learning_rate": 7.655434144200545e-05, "loss": 0.0272, "step": 230800 }, { "epoch": 1.49, "learning_rate": 7.654466008764853e-05, "loss": 0.0267, "step": 230810 }, { "epoch": 1.49, "learning_rate": 7.653497873329159e-05, "loss": 0.0273, "step": 230820 }, { "epoch": 1.49, "learning_rate": 7.652529737893466e-05, "loss": 0.0255, "step": 230830 }, { "epoch": 1.49, "learning_rate": 7.651561602457773e-05, "loss": 0.0284, "step": 230840 }, { "epoch": 1.49, "learning_rate": 7.650593467022079e-05, "loss": 0.0284, "step": 230850 }, { "epoch": 1.49, "learning_rate": 7.649625331586386e-05, "loss": 0.0319, "step": 230860 }, { "epoch": 1.49, "learning_rate": 7.648657196150692e-05, "loss": 0.0259, "step": 230870 }, { "epoch": 1.49, "learning_rate": 7.647689060715e-05, "loss": 0.033, "step": 230880 }, { "epoch": 1.49, "learning_rate": 7.646720925279307e-05, "loss": 0.0333, "step": 230890 }, { "epoch": 1.49, "learning_rate": 7.645752789843612e-05, "loss": 0.0257, "step": 230900 }, { "epoch": 1.49, "learning_rate": 7.64478465440792e-05, "loss": 0.0247, "step": 230910 }, { "epoch": 1.49, "learning_rate": 7.643816518972227e-05, "loss": 0.0234, "step": 230920 }, { "epoch": 1.49, "learning_rate": 7.642848383536533e-05, "loss": 0.0275, "step": 230930 }, { "epoch": 1.49, "learning_rate": 7.64188024810084e-05, "loss": 0.0282, "step": 230940 }, { "epoch": 1.49, "learning_rate": 7.640912112665147e-05, "loss": 0.0289, "step": 230950 }, { "epoch": 1.49, "learning_rate": 7.639943977229455e-05, "loss": 0.0305, "step": 230960 }, { "epoch": 1.49, "learning_rate": 7.63897584179376e-05, "loss": 0.0221, "step": 230970 }, { "epoch": 1.49, "learning_rate": 7.638007706358068e-05, "loss": 0.0292, "step": 230980 }, { "epoch": 1.49, "learning_rate": 7.637039570922375e-05, "loss": 0.0276, "step": 230990 }, { "epoch": 1.49, "learning_rate": 7.63607143548668e-05, "loss": 0.024, "step": 231000 }, { "epoch": 1.49, "eval_cer": 0.9199014800587504, "eval_loss": 0.019931979477405548, "eval_runtime": 120.0906, "eval_samples_per_second": 16.654, "eval_steps_per_second": 4.164, "step": 231000 }, { "epoch": 1.49, "learning_rate": 7.635103300050988e-05, "loss": 0.0329, "step": 231010 }, { "epoch": 1.49, "learning_rate": 7.634135164615294e-05, "loss": 0.0307, "step": 231020 }, { "epoch": 1.49, "learning_rate": 7.633167029179602e-05, "loss": 0.025, "step": 231030 }, { "epoch": 1.49, "learning_rate": 7.632198893743908e-05, "loss": 0.027, "step": 231040 }, { "epoch": 1.49, "learning_rate": 7.631230758308214e-05, "loss": 0.0297, "step": 231050 }, { "epoch": 1.49, "learning_rate": 7.630262622872522e-05, "loss": 0.0305, "step": 231060 }, { "epoch": 1.49, "learning_rate": 7.629294487436828e-05, "loss": 0.0267, "step": 231070 }, { "epoch": 1.49, "learning_rate": 7.628326352001136e-05, "loss": 0.0316, "step": 231080 }, { "epoch": 1.49, "learning_rate": 7.627358216565442e-05, "loss": 0.0312, "step": 231090 }, { "epoch": 1.49, "learning_rate": 7.62639008112975e-05, "loss": 0.0283, "step": 231100 }, { "epoch": 1.49, "learning_rate": 7.625421945694055e-05, "loss": 0.0277, "step": 231110 }, { "epoch": 1.49, "learning_rate": 7.624453810258362e-05, "loss": 0.0337, "step": 231120 }, { "epoch": 1.49, "learning_rate": 7.62348567482267e-05, "loss": 0.028, "step": 231130 }, { "epoch": 1.49, "learning_rate": 7.622517539386975e-05, "loss": 0.0307, "step": 231140 }, { "epoch": 1.49, "learning_rate": 7.621549403951282e-05, "loss": 0.0311, "step": 231150 }, { "epoch": 1.49, "learning_rate": 7.62058126851559e-05, "loss": 0.028, "step": 231160 }, { "epoch": 1.49, "learning_rate": 7.619613133079897e-05, "loss": 0.0255, "step": 231170 }, { "epoch": 1.49, "learning_rate": 7.618644997644203e-05, "loss": 0.0285, "step": 231180 }, { "epoch": 1.49, "learning_rate": 7.61767686220851e-05, "loss": 0.0265, "step": 231190 }, { "epoch": 1.49, "learning_rate": 7.616708726772818e-05, "loss": 0.0276, "step": 231200 }, { "epoch": 1.49, "learning_rate": 7.615740591337123e-05, "loss": 0.0271, "step": 231210 }, { "epoch": 1.49, "learning_rate": 7.61477245590143e-05, "loss": 0.0256, "step": 231220 }, { "epoch": 1.49, "learning_rate": 7.613804320465738e-05, "loss": 0.0281, "step": 231230 }, { "epoch": 1.49, "learning_rate": 7.612836185030044e-05, "loss": 0.0283, "step": 231240 }, { "epoch": 1.49, "learning_rate": 7.61186804959435e-05, "loss": 0.0249, "step": 231250 }, { "epoch": 1.49, "learning_rate": 7.610899914158657e-05, "loss": 0.029, "step": 231260 }, { "epoch": 1.49, "learning_rate": 7.609931778722964e-05, "loss": 0.0305, "step": 231270 }, { "epoch": 1.49, "learning_rate": 7.608963643287271e-05, "loss": 0.0261, "step": 231280 }, { "epoch": 1.49, "learning_rate": 7.607995507851577e-05, "loss": 0.0286, "step": 231290 }, { "epoch": 1.49, "learning_rate": 7.607027372415885e-05, "loss": 0.029, "step": 231300 }, { "epoch": 1.49, "learning_rate": 7.606059236980192e-05, "loss": 0.0258, "step": 231310 }, { "epoch": 1.49, "learning_rate": 7.605091101544497e-05, "loss": 0.0247, "step": 231320 }, { "epoch": 1.49, "learning_rate": 7.604122966108805e-05, "loss": 0.0236, "step": 231330 }, { "epoch": 1.49, "learning_rate": 7.603154830673112e-05, "loss": 0.0313, "step": 231340 }, { "epoch": 1.49, "learning_rate": 7.602186695237417e-05, "loss": 0.0331, "step": 231350 }, { "epoch": 1.49, "learning_rate": 7.601218559801725e-05, "loss": 0.0251, "step": 231360 }, { "epoch": 1.49, "learning_rate": 7.600250424366032e-05, "loss": 0.0272, "step": 231370 }, { "epoch": 1.49, "learning_rate": 7.59928228893034e-05, "loss": 0.0267, "step": 231380 }, { "epoch": 1.49, "learning_rate": 7.598314153494645e-05, "loss": 0.0245, "step": 231390 }, { "epoch": 1.49, "learning_rate": 7.597346018058953e-05, "loss": 0.0307, "step": 231400 }, { "epoch": 1.49, "learning_rate": 7.59637788262326e-05, "loss": 0.0312, "step": 231410 }, { "epoch": 1.49, "learning_rate": 7.595409747187565e-05, "loss": 0.0335, "step": 231420 }, { "epoch": 1.49, "learning_rate": 7.594441611751873e-05, "loss": 0.0287, "step": 231430 }, { "epoch": 1.49, "learning_rate": 7.59347347631618e-05, "loss": 0.0257, "step": 231440 }, { "epoch": 1.49, "learning_rate": 7.592505340880487e-05, "loss": 0.0264, "step": 231450 }, { "epoch": 1.49, "learning_rate": 7.591537205444793e-05, "loss": 0.0269, "step": 231460 }, { "epoch": 1.49, "learning_rate": 7.590569070009099e-05, "loss": 0.027, "step": 231470 }, { "epoch": 1.49, "learning_rate": 7.589600934573407e-05, "loss": 0.0309, "step": 231480 }, { "epoch": 1.49, "learning_rate": 7.588632799137713e-05, "loss": 0.0261, "step": 231490 }, { "epoch": 1.49, "learning_rate": 7.58766466370202e-05, "loss": 0.0263, "step": 231500 }, { "epoch": 1.49, "learning_rate": 7.586696528266327e-05, "loss": 0.0239, "step": 231510 }, { "epoch": 1.49, "learning_rate": 7.585728392830635e-05, "loss": 0.0265, "step": 231520 }, { "epoch": 1.49, "learning_rate": 7.58476025739494e-05, "loss": 0.0275, "step": 231530 }, { "epoch": 1.49, "learning_rate": 7.583792121959247e-05, "loss": 0.0262, "step": 231540 }, { "epoch": 1.49, "learning_rate": 7.582823986523555e-05, "loss": 0.0302, "step": 231550 }, { "epoch": 1.49, "learning_rate": 7.58185585108786e-05, "loss": 0.0258, "step": 231560 }, { "epoch": 1.49, "learning_rate": 7.580887715652167e-05, "loss": 0.0261, "step": 231570 }, { "epoch": 1.49, "learning_rate": 7.579919580216475e-05, "loss": 0.0289, "step": 231580 }, { "epoch": 1.49, "learning_rate": 7.578951444780781e-05, "loss": 0.0229, "step": 231590 }, { "epoch": 1.49, "learning_rate": 7.577983309345088e-05, "loss": 0.0323, "step": 231600 }, { "epoch": 1.49, "learning_rate": 7.577015173909395e-05, "loss": 0.0258, "step": 231610 }, { "epoch": 1.49, "learning_rate": 7.576047038473703e-05, "loss": 0.0294, "step": 231620 }, { "epoch": 1.49, "learning_rate": 7.575078903038008e-05, "loss": 0.0308, "step": 231630 }, { "epoch": 1.5, "learning_rate": 7.574110767602315e-05, "loss": 0.0281, "step": 231640 }, { "epoch": 1.5, "learning_rate": 7.573142632166623e-05, "loss": 0.0294, "step": 231650 }, { "epoch": 1.5, "learning_rate": 7.572174496730929e-05, "loss": 0.0259, "step": 231660 }, { "epoch": 1.5, "learning_rate": 7.571206361295234e-05, "loss": 0.0226, "step": 231670 }, { "epoch": 1.5, "learning_rate": 7.570238225859542e-05, "loss": 0.0301, "step": 231680 }, { "epoch": 1.5, "learning_rate": 7.569270090423849e-05, "loss": 0.0271, "step": 231690 }, { "epoch": 1.5, "learning_rate": 7.568301954988156e-05, "loss": 0.0245, "step": 231700 }, { "epoch": 1.5, "learning_rate": 7.567333819552462e-05, "loss": 0.0254, "step": 231710 }, { "epoch": 1.5, "learning_rate": 7.56636568411677e-05, "loss": 0.0316, "step": 231720 }, { "epoch": 1.5, "learning_rate": 7.565397548681077e-05, "loss": 0.0332, "step": 231730 }, { "epoch": 1.5, "learning_rate": 7.564429413245382e-05, "loss": 0.0234, "step": 231740 }, { "epoch": 1.5, "learning_rate": 7.56346127780969e-05, "loss": 0.0307, "step": 231750 }, { "epoch": 1.5, "learning_rate": 7.562493142373997e-05, "loss": 0.0262, "step": 231760 }, { "epoch": 1.5, "learning_rate": 7.561525006938302e-05, "loss": 0.0278, "step": 231770 }, { "epoch": 1.5, "learning_rate": 7.56055687150261e-05, "loss": 0.0284, "step": 231780 }, { "epoch": 1.5, "learning_rate": 7.559588736066917e-05, "loss": 0.0246, "step": 231790 }, { "epoch": 1.5, "learning_rate": 7.558620600631225e-05, "loss": 0.0262, "step": 231800 }, { "epoch": 1.5, "learning_rate": 7.55765246519553e-05, "loss": 0.031, "step": 231810 }, { "epoch": 1.5, "learning_rate": 7.556684329759838e-05, "loss": 0.0265, "step": 231820 }, { "epoch": 1.5, "learning_rate": 7.555716194324145e-05, "loss": 0.0267, "step": 231830 }, { "epoch": 1.5, "learning_rate": 7.55474805888845e-05, "loss": 0.032, "step": 231840 }, { "epoch": 1.5, "learning_rate": 7.553779923452758e-05, "loss": 0.0311, "step": 231850 }, { "epoch": 1.5, "learning_rate": 7.552811788017064e-05, "loss": 0.0285, "step": 231860 }, { "epoch": 1.5, "learning_rate": 7.551843652581372e-05, "loss": 0.0233, "step": 231870 }, { "epoch": 1.5, "learning_rate": 7.550875517145678e-05, "loss": 0.0232, "step": 231880 }, { "epoch": 1.5, "learning_rate": 7.549907381709984e-05, "loss": 0.026, "step": 231890 }, { "epoch": 1.5, "learning_rate": 7.548939246274292e-05, "loss": 0.0286, "step": 231900 }, { "epoch": 1.5, "learning_rate": 7.547971110838598e-05, "loss": 0.029, "step": 231910 }, { "epoch": 1.5, "learning_rate": 7.547002975402906e-05, "loss": 0.0233, "step": 231920 }, { "epoch": 1.5, "learning_rate": 7.546034839967212e-05, "loss": 0.0283, "step": 231930 }, { "epoch": 1.5, "learning_rate": 7.545066704531519e-05, "loss": 0.0281, "step": 231940 }, { "epoch": 1.5, "learning_rate": 7.544098569095825e-05, "loss": 0.0267, "step": 231950 }, { "epoch": 1.5, "learning_rate": 7.543130433660132e-05, "loss": 0.0283, "step": 231960 }, { "epoch": 1.5, "learning_rate": 7.54216229822444e-05, "loss": 0.0324, "step": 231970 }, { "epoch": 1.5, "learning_rate": 7.541194162788745e-05, "loss": 0.0267, "step": 231980 }, { "epoch": 1.5, "learning_rate": 7.540226027353052e-05, "loss": 0.0284, "step": 231990 }, { "epoch": 1.5, "learning_rate": 7.53925789191736e-05, "loss": 0.0295, "step": 232000 }, { "epoch": 1.5, "eval_cer": 0.9198915376793583, "eval_loss": 0.019776683300733566, "eval_runtime": 120.0, "eval_samples_per_second": 16.667, "eval_steps_per_second": 4.167, "step": 232000 }, { "epoch": 1.5, "learning_rate": 7.538289756481666e-05, "loss": 0.0288, "step": 232010 }, { "epoch": 1.5, "learning_rate": 7.537321621045973e-05, "loss": 0.0322, "step": 232020 }, { "epoch": 1.5, "learning_rate": 7.53635348561028e-05, "loss": 0.0271, "step": 232030 }, { "epoch": 1.5, "learning_rate": 7.535385350174586e-05, "loss": 0.0292, "step": 232040 }, { "epoch": 1.5, "learning_rate": 7.534417214738893e-05, "loss": 0.0282, "step": 232050 }, { "epoch": 1.5, "learning_rate": 7.5334490793032e-05, "loss": 0.027, "step": 232060 }, { "epoch": 1.5, "learning_rate": 7.532480943867508e-05, "loss": 0.0252, "step": 232070 }, { "epoch": 1.5, "learning_rate": 7.531512808431814e-05, "loss": 0.0251, "step": 232080 }, { "epoch": 1.5, "learning_rate": 7.53054467299612e-05, "loss": 0.0283, "step": 232090 }, { "epoch": 1.5, "learning_rate": 7.529576537560427e-05, "loss": 0.0244, "step": 232100 }, { "epoch": 1.5, "learning_rate": 7.528608402124734e-05, "loss": 0.0264, "step": 232110 }, { "epoch": 1.5, "learning_rate": 7.527640266689041e-05, "loss": 0.0311, "step": 232120 }, { "epoch": 1.5, "learning_rate": 7.526672131253347e-05, "loss": 0.0276, "step": 232130 }, { "epoch": 1.5, "learning_rate": 7.525703995817654e-05, "loss": 0.0267, "step": 232140 }, { "epoch": 1.5, "learning_rate": 7.524735860381962e-05, "loss": 0.0274, "step": 232150 }, { "epoch": 1.5, "learning_rate": 7.523767724946267e-05, "loss": 0.024, "step": 232160 }, { "epoch": 1.5, "learning_rate": 7.522799589510575e-05, "loss": 0.0312, "step": 232170 }, { "epoch": 1.5, "learning_rate": 7.521831454074882e-05, "loss": 0.0323, "step": 232180 }, { "epoch": 1.5, "learning_rate": 7.520863318639187e-05, "loss": 0.0295, "step": 232190 }, { "epoch": 1.5, "learning_rate": 7.519895183203495e-05, "loss": 0.0269, "step": 232200 }, { "epoch": 1.5, "learning_rate": 7.518927047767802e-05, "loss": 0.0249, "step": 232210 }, { "epoch": 1.5, "learning_rate": 7.51795891233211e-05, "loss": 0.0339, "step": 232220 }, { "epoch": 1.5, "learning_rate": 7.516990776896415e-05, "loss": 0.0288, "step": 232230 }, { "epoch": 1.5, "learning_rate": 7.516022641460722e-05, "loss": 0.0283, "step": 232240 }, { "epoch": 1.5, "learning_rate": 7.51505450602503e-05, "loss": 0.0265, "step": 232250 }, { "epoch": 1.5, "learning_rate": 7.514086370589335e-05, "loss": 0.0268, "step": 232260 }, { "epoch": 1.5, "learning_rate": 7.513118235153643e-05, "loss": 0.0227, "step": 232270 }, { "epoch": 1.5, "learning_rate": 7.51215009971795e-05, "loss": 0.0299, "step": 232280 }, { "epoch": 1.5, "learning_rate": 7.511181964282257e-05, "loss": 0.0269, "step": 232290 }, { "epoch": 1.5, "learning_rate": 7.510213828846563e-05, "loss": 0.0297, "step": 232300 }, { "epoch": 1.5, "learning_rate": 7.509245693410869e-05, "loss": 0.0264, "step": 232310 }, { "epoch": 1.5, "learning_rate": 7.508277557975177e-05, "loss": 0.0255, "step": 232320 }, { "epoch": 1.5, "learning_rate": 7.507309422539483e-05, "loss": 0.0276, "step": 232330 }, { "epoch": 1.5, "learning_rate": 7.506341287103789e-05, "loss": 0.0286, "step": 232340 }, { "epoch": 1.5, "learning_rate": 7.505373151668097e-05, "loss": 0.0236, "step": 232350 }, { "epoch": 1.5, "learning_rate": 7.504405016232404e-05, "loss": 0.0268, "step": 232360 }, { "epoch": 1.5, "learning_rate": 7.50343688079671e-05, "loss": 0.0303, "step": 232370 }, { "epoch": 1.5, "learning_rate": 7.502468745361017e-05, "loss": 0.0275, "step": 232380 }, { "epoch": 1.5, "learning_rate": 7.501500609925325e-05, "loss": 0.0243, "step": 232390 }, { "epoch": 1.5, "learning_rate": 7.50053247448963e-05, "loss": 0.0254, "step": 232400 }, { "epoch": 1.5, "learning_rate": 7.499564339053937e-05, "loss": 0.0307, "step": 232410 }, { "epoch": 1.5, "learning_rate": 7.498596203618245e-05, "loss": 0.0328, "step": 232420 }, { "epoch": 1.5, "learning_rate": 7.497628068182551e-05, "loss": 0.024, "step": 232430 }, { "epoch": 1.5, "learning_rate": 7.496659932746857e-05, "loss": 0.0243, "step": 232440 }, { "epoch": 1.5, "learning_rate": 7.495691797311165e-05, "loss": 0.0249, "step": 232450 }, { "epoch": 1.5, "learning_rate": 7.494723661875471e-05, "loss": 0.0213, "step": 232460 }, { "epoch": 1.5, "learning_rate": 7.493755526439778e-05, "loss": 0.0272, "step": 232470 }, { "epoch": 1.5, "learning_rate": 7.492787391004085e-05, "loss": 0.0273, "step": 232480 }, { "epoch": 1.5, "learning_rate": 7.491819255568393e-05, "loss": 0.0245, "step": 232490 }, { "epoch": 1.5, "learning_rate": 7.490851120132698e-05, "loss": 0.0256, "step": 232500 }, { "epoch": 1.5, "learning_rate": 7.489882984697004e-05, "loss": 0.0287, "step": 232510 }, { "epoch": 1.5, "learning_rate": 7.488914849261312e-05, "loss": 0.0259, "step": 232520 }, { "epoch": 1.5, "learning_rate": 7.487946713825619e-05, "loss": 0.0341, "step": 232530 }, { "epoch": 1.5, "learning_rate": 7.486978578389926e-05, "loss": 0.0245, "step": 232540 }, { "epoch": 1.5, "learning_rate": 7.486010442954232e-05, "loss": 0.0257, "step": 232550 }, { "epoch": 1.5, "learning_rate": 7.485042307518539e-05, "loss": 0.0217, "step": 232560 }, { "epoch": 1.5, "learning_rate": 7.484074172082846e-05, "loss": 0.0227, "step": 232570 }, { "epoch": 1.5, "learning_rate": 7.483106036647152e-05, "loss": 0.0265, "step": 232580 }, { "epoch": 1.5, "learning_rate": 7.48213790121146e-05, "loss": 0.0234, "step": 232590 }, { "epoch": 1.5, "learning_rate": 7.481169765775765e-05, "loss": 0.0287, "step": 232600 }, { "epoch": 1.5, "learning_rate": 7.480201630340073e-05, "loss": 0.0306, "step": 232610 }, { "epoch": 1.5, "learning_rate": 7.47923349490438e-05, "loss": 0.0284, "step": 232620 }, { "epoch": 1.5, "learning_rate": 7.478265359468687e-05, "loss": 0.0332, "step": 232630 }, { "epoch": 1.5, "learning_rate": 7.477297224032993e-05, "loss": 0.0247, "step": 232640 }, { "epoch": 1.5, "learning_rate": 7.4763290885973e-05, "loss": 0.0312, "step": 232650 }, { "epoch": 1.5, "learning_rate": 7.475360953161607e-05, "loss": 0.0276, "step": 232660 }, { "epoch": 1.5, "learning_rate": 7.474392817725913e-05, "loss": 0.0317, "step": 232670 }, { "epoch": 1.5, "learning_rate": 7.473424682290221e-05, "loss": 0.0245, "step": 232680 }, { "epoch": 1.5, "learning_rate": 7.472456546854528e-05, "loss": 0.026, "step": 232690 }, { "epoch": 1.5, "learning_rate": 7.471488411418834e-05, "loss": 0.0262, "step": 232700 }, { "epoch": 1.5, "learning_rate": 7.470520275983141e-05, "loss": 0.0264, "step": 232710 }, { "epoch": 1.5, "learning_rate": 7.469552140547448e-05, "loss": 0.0261, "step": 232720 }, { "epoch": 1.5, "learning_rate": 7.468584005111754e-05, "loss": 0.0281, "step": 232730 }, { "epoch": 1.5, "learning_rate": 7.467615869676061e-05, "loss": 0.0268, "step": 232740 }, { "epoch": 1.5, "learning_rate": 7.466647734240369e-05, "loss": 0.027, "step": 232750 }, { "epoch": 1.5, "learning_rate": 7.465679598804674e-05, "loss": 0.0318, "step": 232760 }, { "epoch": 1.5, "learning_rate": 7.464711463368982e-05, "loss": 0.0204, "step": 232770 }, { "epoch": 1.5, "learning_rate": 7.463743327933289e-05, "loss": 0.0282, "step": 232780 }, { "epoch": 1.5, "learning_rate": 7.462775192497595e-05, "loss": 0.0263, "step": 232790 }, { "epoch": 1.5, "learning_rate": 7.461807057061902e-05, "loss": 0.0259, "step": 232800 }, { "epoch": 1.5, "learning_rate": 7.460838921626209e-05, "loss": 0.0315, "step": 232810 }, { "epoch": 1.5, "learning_rate": 7.459870786190515e-05, "loss": 0.0279, "step": 232820 }, { "epoch": 1.5, "learning_rate": 7.458902650754822e-05, "loss": 0.0235, "step": 232830 }, { "epoch": 1.5, "learning_rate": 7.45793451531913e-05, "loss": 0.0269, "step": 232840 }, { "epoch": 1.5, "learning_rate": 7.456966379883436e-05, "loss": 0.0316, "step": 232850 }, { "epoch": 1.5, "learning_rate": 7.455998244447742e-05, "loss": 0.0241, "step": 232860 }, { "epoch": 1.5, "learning_rate": 7.45503010901205e-05, "loss": 0.029, "step": 232870 }, { "epoch": 1.5, "learning_rate": 7.454061973576356e-05, "loss": 0.0328, "step": 232880 }, { "epoch": 1.5, "learning_rate": 7.453093838140663e-05, "loss": 0.0299, "step": 232890 }, { "epoch": 1.5, "learning_rate": 7.45212570270497e-05, "loss": 0.0323, "step": 232900 }, { "epoch": 1.5, "learning_rate": 7.451157567269278e-05, "loss": 0.0293, "step": 232910 }, { "epoch": 1.5, "learning_rate": 7.450189431833583e-05, "loss": 0.0273, "step": 232920 }, { "epoch": 1.5, "learning_rate": 7.44922129639789e-05, "loss": 0.0317, "step": 232930 }, { "epoch": 1.5, "learning_rate": 7.448253160962197e-05, "loss": 0.0273, "step": 232940 }, { "epoch": 1.5, "learning_rate": 7.447285025526504e-05, "loss": 0.0256, "step": 232950 }, { "epoch": 1.5, "learning_rate": 7.44631689009081e-05, "loss": 0.0313, "step": 232960 }, { "epoch": 1.5, "learning_rate": 7.445348754655117e-05, "loss": 0.0326, "step": 232970 }, { "epoch": 1.5, "learning_rate": 7.444380619219424e-05, "loss": 0.0244, "step": 232980 }, { "epoch": 1.5, "learning_rate": 7.44341248378373e-05, "loss": 0.0271, "step": 232990 }, { "epoch": 1.5, "learning_rate": 7.442444348348037e-05, "loss": 0.0281, "step": 233000 }, { "epoch": 1.5, "eval_cer": 0.9199141339961586, "eval_loss": 0.019634824246168137, "eval_runtime": 120.2752, "eval_samples_per_second": 16.629, "eval_steps_per_second": 4.157, "step": 233000 }, { "epoch": 1.5, "learning_rate": 7.441476212912345e-05, "loss": 0.0279, "step": 233010 }, { "epoch": 1.5, "learning_rate": 7.44050807747665e-05, "loss": 0.0254, "step": 233020 }, { "epoch": 1.5, "learning_rate": 7.439539942040958e-05, "loss": 0.0229, "step": 233030 }, { "epoch": 1.5, "learning_rate": 7.438571806605265e-05, "loss": 0.0317, "step": 233040 }, { "epoch": 1.5, "learning_rate": 7.437603671169572e-05, "loss": 0.0253, "step": 233050 }, { "epoch": 1.5, "learning_rate": 7.436635535733878e-05, "loss": 0.0285, "step": 233060 }, { "epoch": 1.5, "learning_rate": 7.435667400298185e-05, "loss": 0.0252, "step": 233070 }, { "epoch": 1.5, "learning_rate": 7.434699264862491e-05, "loss": 0.0276, "step": 233080 }, { "epoch": 1.5, "learning_rate": 7.433731129426798e-05, "loss": 0.0208, "step": 233090 }, { "epoch": 1.5, "learning_rate": 7.432762993991106e-05, "loss": 0.0236, "step": 233100 }, { "epoch": 1.5, "learning_rate": 7.431794858555413e-05, "loss": 0.0276, "step": 233110 }, { "epoch": 1.5, "learning_rate": 7.43082672311972e-05, "loss": 0.0268, "step": 233120 }, { "epoch": 1.5, "learning_rate": 7.429858587684026e-05, "loss": 0.0252, "step": 233130 }, { "epoch": 1.5, "learning_rate": 7.428890452248333e-05, "loss": 0.0265, "step": 233140 }, { "epoch": 1.5, "learning_rate": 7.427922316812639e-05, "loss": 0.0285, "step": 233150 }, { "epoch": 1.5, "learning_rate": 7.426954181376946e-05, "loss": 0.0288, "step": 233160 }, { "epoch": 1.5, "learning_rate": 7.425986045941254e-05, "loss": 0.028, "step": 233170 }, { "epoch": 1.5, "learning_rate": 7.425017910505559e-05, "loss": 0.0265, "step": 233180 }, { "epoch": 1.51, "learning_rate": 7.424049775069867e-05, "loss": 0.0279, "step": 233190 }, { "epoch": 1.51, "learning_rate": 7.423081639634174e-05, "loss": 0.0275, "step": 233200 }, { "epoch": 1.51, "learning_rate": 7.42211350419848e-05, "loss": 0.0276, "step": 233210 }, { "epoch": 1.51, "learning_rate": 7.421145368762787e-05, "loss": 0.0242, "step": 233220 }, { "epoch": 1.51, "learning_rate": 7.420177233327094e-05, "loss": 0.0235, "step": 233230 }, { "epoch": 1.51, "learning_rate": 7.4192090978914e-05, "loss": 0.0296, "step": 233240 }, { "epoch": 1.51, "learning_rate": 7.418240962455707e-05, "loss": 0.0263, "step": 233250 }, { "epoch": 1.51, "learning_rate": 7.417272827020015e-05, "loss": 0.0299, "step": 233260 }, { "epoch": 1.51, "learning_rate": 7.416304691584321e-05, "loss": 0.0307, "step": 233270 }, { "epoch": 1.51, "learning_rate": 7.415336556148627e-05, "loss": 0.0259, "step": 233280 }, { "epoch": 1.51, "learning_rate": 7.414368420712935e-05, "loss": 0.0261, "step": 233290 }, { "epoch": 1.51, "learning_rate": 7.413400285277241e-05, "loss": 0.0267, "step": 233300 }, { "epoch": 1.51, "learning_rate": 7.412432149841548e-05, "loss": 0.0287, "step": 233310 }, { "epoch": 1.51, "learning_rate": 7.411464014405855e-05, "loss": 0.0249, "step": 233320 }, { "epoch": 1.51, "learning_rate": 7.410495878970161e-05, "loss": 0.0251, "step": 233330 }, { "epoch": 1.51, "learning_rate": 7.409527743534468e-05, "loss": 0.027, "step": 233340 }, { "epoch": 1.51, "learning_rate": 7.408559608098774e-05, "loss": 0.0311, "step": 233350 }, { "epoch": 1.51, "learning_rate": 7.407591472663082e-05, "loss": 0.0307, "step": 233360 }, { "epoch": 1.51, "learning_rate": 7.406623337227389e-05, "loss": 0.0212, "step": 233370 }, { "epoch": 1.51, "learning_rate": 7.405655201791696e-05, "loss": 0.0281, "step": 233380 }, { "epoch": 1.51, "learning_rate": 7.404687066356002e-05, "loss": 0.0262, "step": 233390 }, { "epoch": 1.51, "learning_rate": 7.403718930920309e-05, "loss": 0.0215, "step": 233400 }, { "epoch": 1.51, "learning_rate": 7.402750795484616e-05, "loss": 0.0282, "step": 233410 }, { "epoch": 1.51, "learning_rate": 7.401782660048922e-05, "loss": 0.0247, "step": 233420 }, { "epoch": 1.51, "learning_rate": 7.40081452461323e-05, "loss": 0.0259, "step": 233430 }, { "epoch": 1.51, "learning_rate": 7.399846389177535e-05, "loss": 0.0283, "step": 233440 }, { "epoch": 1.51, "learning_rate": 7.398878253741843e-05, "loss": 0.0319, "step": 233450 }, { "epoch": 1.51, "learning_rate": 7.39791011830615e-05, "loss": 0.0246, "step": 233460 }, { "epoch": 1.51, "learning_rate": 7.396941982870457e-05, "loss": 0.0279, "step": 233470 }, { "epoch": 1.51, "learning_rate": 7.395973847434763e-05, "loss": 0.0272, "step": 233480 }, { "epoch": 1.51, "learning_rate": 7.39500571199907e-05, "loss": 0.0227, "step": 233490 }, { "epoch": 1.51, "learning_rate": 7.394037576563376e-05, "loss": 0.0228, "step": 233500 }, { "epoch": 1.51, "learning_rate": 7.393069441127683e-05, "loss": 0.0259, "step": 233510 }, { "epoch": 1.51, "learning_rate": 7.392101305691991e-05, "loss": 0.0285, "step": 233520 }, { "epoch": 1.51, "learning_rate": 7.391133170256298e-05, "loss": 0.0288, "step": 233530 }, { "epoch": 1.51, "learning_rate": 7.390165034820603e-05, "loss": 0.0311, "step": 233540 }, { "epoch": 1.51, "learning_rate": 7.389196899384911e-05, "loss": 0.0282, "step": 233550 }, { "epoch": 1.51, "learning_rate": 7.388228763949218e-05, "loss": 0.0241, "step": 233560 }, { "epoch": 1.51, "learning_rate": 7.387260628513524e-05, "loss": 0.0284, "step": 233570 }, { "epoch": 1.51, "learning_rate": 7.386292493077831e-05, "loss": 0.0242, "step": 233580 }, { "epoch": 1.51, "learning_rate": 7.385324357642137e-05, "loss": 0.0311, "step": 233590 }, { "epoch": 1.51, "learning_rate": 7.384356222206444e-05, "loss": 0.0278, "step": 233600 }, { "epoch": 1.51, "learning_rate": 7.383388086770751e-05, "loss": 0.0288, "step": 233610 }, { "epoch": 1.51, "learning_rate": 7.382419951335059e-05, "loss": 0.025, "step": 233620 }, { "epoch": 1.51, "learning_rate": 7.381451815899365e-05, "loss": 0.0271, "step": 233630 }, { "epoch": 1.51, "learning_rate": 7.380483680463672e-05, "loss": 0.0305, "step": 233640 }, { "epoch": 1.51, "learning_rate": 7.379515545027979e-05, "loss": 0.0273, "step": 233650 }, { "epoch": 1.51, "learning_rate": 7.378547409592285e-05, "loss": 0.0204, "step": 233660 }, { "epoch": 1.51, "learning_rate": 7.377579274156592e-05, "loss": 0.0277, "step": 233670 }, { "epoch": 1.51, "learning_rate": 7.376611138720898e-05, "loss": 0.0278, "step": 233680 }, { "epoch": 1.51, "learning_rate": 7.375643003285205e-05, "loss": 0.0253, "step": 233690 }, { "epoch": 1.51, "learning_rate": 7.374674867849512e-05, "loss": 0.0254, "step": 233700 }, { "epoch": 1.51, "learning_rate": 7.37370673241382e-05, "loss": 0.0314, "step": 233710 }, { "epoch": 1.51, "learning_rate": 7.372738596978126e-05, "loss": 0.0282, "step": 233720 }, { "epoch": 1.51, "learning_rate": 7.371770461542433e-05, "loss": 0.0271, "step": 233730 }, { "epoch": 1.51, "learning_rate": 7.37080232610674e-05, "loss": 0.0281, "step": 233740 }, { "epoch": 1.51, "learning_rate": 7.369834190671046e-05, "loss": 0.026, "step": 233750 }, { "epoch": 1.51, "learning_rate": 7.368866055235353e-05, "loss": 0.0295, "step": 233760 }, { "epoch": 1.51, "learning_rate": 7.36789791979966e-05, "loss": 0.0273, "step": 233770 }, { "epoch": 1.51, "learning_rate": 7.366929784363967e-05, "loss": 0.029, "step": 233780 }, { "epoch": 1.51, "learning_rate": 7.365961648928273e-05, "loss": 0.0298, "step": 233790 }, { "epoch": 1.51, "learning_rate": 7.36499351349258e-05, "loss": 0.0287, "step": 233800 }, { "epoch": 1.51, "learning_rate": 7.364025378056887e-05, "loss": 0.0271, "step": 233810 }, { "epoch": 1.51, "learning_rate": 7.363057242621194e-05, "loss": 0.0301, "step": 233820 }, { "epoch": 1.51, "learning_rate": 7.3620891071855e-05, "loss": 0.0281, "step": 233830 }, { "epoch": 1.51, "learning_rate": 7.361120971749807e-05, "loss": 0.026, "step": 233840 }, { "epoch": 1.51, "learning_rate": 7.360152836314114e-05, "loss": 0.0263, "step": 233850 }, { "epoch": 1.51, "learning_rate": 7.35918470087842e-05, "loss": 0.0247, "step": 233860 }, { "epoch": 1.51, "learning_rate": 7.358216565442728e-05, "loss": 0.0302, "step": 233870 }, { "epoch": 1.51, "learning_rate": 7.357248430007035e-05, "loss": 0.0248, "step": 233880 }, { "epoch": 1.51, "learning_rate": 7.35628029457134e-05, "loss": 0.0264, "step": 233890 }, { "epoch": 1.51, "learning_rate": 7.355312159135648e-05, "loss": 0.0238, "step": 233900 }, { "epoch": 1.51, "learning_rate": 7.354344023699955e-05, "loss": 0.0278, "step": 233910 }, { "epoch": 1.51, "learning_rate": 7.353375888264261e-05, "loss": 0.0247, "step": 233920 }, { "epoch": 1.51, "learning_rate": 7.352407752828568e-05, "loss": 0.0282, "step": 233930 }, { "epoch": 1.51, "learning_rate": 7.351439617392876e-05, "loss": 0.026, "step": 233940 }, { "epoch": 1.51, "learning_rate": 7.350471481957181e-05, "loss": 0.0245, "step": 233950 }, { "epoch": 1.51, "learning_rate": 7.349503346521488e-05, "loss": 0.0324, "step": 233960 }, { "epoch": 1.51, "learning_rate": 7.348535211085796e-05, "loss": 0.0257, "step": 233970 }, { "epoch": 1.51, "learning_rate": 7.347567075650103e-05, "loss": 0.0251, "step": 233980 }, { "epoch": 1.51, "learning_rate": 7.346598940214409e-05, "loss": 0.0285, "step": 233990 }, { "epoch": 1.51, "learning_rate": 7.345630804778716e-05, "loss": 0.0243, "step": 234000 }, { "epoch": 1.51, "eval_cer": 0.9198472488984295, "eval_loss": 0.019518280401825905, "eval_runtime": 120.3803, "eval_samples_per_second": 16.614, "eval_steps_per_second": 4.154, "step": 234000 }, { "epoch": 1.51, "learning_rate": 7.344662669343022e-05, "loss": 0.0231, "step": 234010 }, { "epoch": 1.51, "learning_rate": 7.343694533907329e-05, "loss": 0.0305, "step": 234020 }, { "epoch": 1.51, "learning_rate": 7.342726398471636e-05, "loss": 0.031, "step": 234030 }, { "epoch": 1.51, "learning_rate": 7.341758263035944e-05, "loss": 0.0231, "step": 234040 }, { "epoch": 1.51, "learning_rate": 7.340790127600249e-05, "loss": 0.024, "step": 234050 }, { "epoch": 1.51, "learning_rate": 7.339821992164557e-05, "loss": 0.0274, "step": 234060 }, { "epoch": 1.51, "learning_rate": 7.338853856728864e-05, "loss": 0.0263, "step": 234070 }, { "epoch": 1.51, "learning_rate": 7.33788572129317e-05, "loss": 0.0282, "step": 234080 }, { "epoch": 1.51, "learning_rate": 7.336917585857477e-05, "loss": 0.0237, "step": 234090 }, { "epoch": 1.51, "learning_rate": 7.335949450421783e-05, "loss": 0.023, "step": 234100 }, { "epoch": 1.51, "learning_rate": 7.33498131498609e-05, "loss": 0.0256, "step": 234110 }, { "epoch": 1.51, "learning_rate": 7.334013179550397e-05, "loss": 0.0262, "step": 234120 }, { "epoch": 1.51, "learning_rate": 7.333045044114705e-05, "loss": 0.0228, "step": 234130 }, { "epoch": 1.51, "learning_rate": 7.332076908679011e-05, "loss": 0.0256, "step": 234140 }, { "epoch": 1.51, "learning_rate": 7.331108773243318e-05, "loss": 0.0274, "step": 234150 }, { "epoch": 1.51, "learning_rate": 7.330140637807624e-05, "loss": 0.0313, "step": 234160 }, { "epoch": 1.51, "learning_rate": 7.329172502371931e-05, "loss": 0.0263, "step": 234170 }, { "epoch": 1.51, "learning_rate": 7.328204366936238e-05, "loss": 0.0238, "step": 234180 }, { "epoch": 1.51, "learning_rate": 7.327236231500544e-05, "loss": 0.0254, "step": 234190 }, { "epoch": 1.51, "learning_rate": 7.326268096064852e-05, "loss": 0.0262, "step": 234200 }, { "epoch": 1.51, "learning_rate": 7.325299960629158e-05, "loss": 0.0293, "step": 234210 }, { "epoch": 1.51, "learning_rate": 7.324331825193466e-05, "loss": 0.0261, "step": 234220 }, { "epoch": 1.51, "learning_rate": 7.323363689757772e-05, "loss": 0.027, "step": 234230 }, { "epoch": 1.51, "learning_rate": 7.322395554322079e-05, "loss": 0.0289, "step": 234240 }, { "epoch": 1.51, "learning_rate": 7.321427418886385e-05, "loss": 0.0278, "step": 234250 }, { "epoch": 1.51, "learning_rate": 7.320459283450692e-05, "loss": 0.0263, "step": 234260 }, { "epoch": 1.51, "learning_rate": 7.319491148014999e-05, "loss": 0.0334, "step": 234270 }, { "epoch": 1.51, "learning_rate": 7.318523012579305e-05, "loss": 0.0224, "step": 234280 }, { "epoch": 1.51, "learning_rate": 7.317554877143613e-05, "loss": 0.0301, "step": 234290 }, { "epoch": 1.51, "learning_rate": 7.31658674170792e-05, "loss": 0.0272, "step": 234300 }, { "epoch": 1.51, "learning_rate": 7.315618606272225e-05, "loss": 0.0282, "step": 234310 }, { "epoch": 1.51, "learning_rate": 7.314650470836533e-05, "loss": 0.0288, "step": 234320 }, { "epoch": 1.51, "learning_rate": 7.31368233540084e-05, "loss": 0.0285, "step": 234330 }, { "epoch": 1.51, "learning_rate": 7.312714199965146e-05, "loss": 0.0233, "step": 234340 }, { "epoch": 1.51, "learning_rate": 7.311746064529453e-05, "loss": 0.0318, "step": 234350 }, { "epoch": 1.51, "learning_rate": 7.310777929093761e-05, "loss": 0.0288, "step": 234360 }, { "epoch": 1.51, "learning_rate": 7.309809793658066e-05, "loss": 0.0269, "step": 234370 }, { "epoch": 1.51, "learning_rate": 7.308841658222373e-05, "loss": 0.0254, "step": 234380 }, { "epoch": 1.51, "learning_rate": 7.307873522786681e-05, "loss": 0.0284, "step": 234390 }, { "epoch": 1.51, "learning_rate": 7.306905387350988e-05, "loss": 0.0273, "step": 234400 }, { "epoch": 1.51, "learning_rate": 7.305937251915294e-05, "loss": 0.0297, "step": 234410 }, { "epoch": 1.51, "learning_rate": 7.304969116479601e-05, "loss": 0.0322, "step": 234420 }, { "epoch": 1.51, "learning_rate": 7.304000981043907e-05, "loss": 0.0254, "step": 234430 }, { "epoch": 1.51, "learning_rate": 7.303032845608214e-05, "loss": 0.025, "step": 234440 }, { "epoch": 1.51, "learning_rate": 7.30206471017252e-05, "loss": 0.0326, "step": 234450 }, { "epoch": 1.51, "learning_rate": 7.301096574736829e-05, "loss": 0.0276, "step": 234460 }, { "epoch": 1.51, "learning_rate": 7.300128439301134e-05, "loss": 0.0235, "step": 234470 }, { "epoch": 1.51, "learning_rate": 7.299160303865442e-05, "loss": 0.0257, "step": 234480 }, { "epoch": 1.51, "learning_rate": 7.298192168429749e-05, "loss": 0.0293, "step": 234490 }, { "epoch": 1.51, "learning_rate": 7.297224032994055e-05, "loss": 0.0306, "step": 234500 }, { "epoch": 1.51, "learning_rate": 7.296255897558362e-05, "loss": 0.0227, "step": 234510 }, { "epoch": 1.51, "learning_rate": 7.295287762122668e-05, "loss": 0.025, "step": 234520 }, { "epoch": 1.51, "learning_rate": 7.294319626686975e-05, "loss": 0.0229, "step": 234530 }, { "epoch": 1.51, "learning_rate": 7.293351491251282e-05, "loss": 0.0255, "step": 234540 }, { "epoch": 1.51, "learning_rate": 7.29238335581559e-05, "loss": 0.0234, "step": 234550 }, { "epoch": 1.51, "learning_rate": 7.291415220379896e-05, "loss": 0.035, "step": 234560 }, { "epoch": 1.51, "learning_rate": 7.290447084944203e-05, "loss": 0.0341, "step": 234570 }, { "epoch": 1.51, "learning_rate": 7.28947894950851e-05, "loss": 0.0209, "step": 234580 }, { "epoch": 1.51, "learning_rate": 7.288510814072816e-05, "loss": 0.0297, "step": 234590 }, { "epoch": 1.51, "learning_rate": 7.287542678637123e-05, "loss": 0.0273, "step": 234600 }, { "epoch": 1.51, "learning_rate": 7.28657454320143e-05, "loss": 0.0264, "step": 234610 }, { "epoch": 1.51, "learning_rate": 7.285606407765737e-05, "loss": 0.0264, "step": 234620 }, { "epoch": 1.51, "learning_rate": 7.284638272330043e-05, "loss": 0.0288, "step": 234630 }, { "epoch": 1.51, "learning_rate": 7.28367013689435e-05, "loss": 0.0266, "step": 234640 }, { "epoch": 1.51, "learning_rate": 7.282702001458657e-05, "loss": 0.0263, "step": 234650 }, { "epoch": 1.51, "learning_rate": 7.281733866022964e-05, "loss": 0.0242, "step": 234660 }, { "epoch": 1.51, "learning_rate": 7.28076573058727e-05, "loss": 0.023, "step": 234670 }, { "epoch": 1.51, "learning_rate": 7.279797595151577e-05, "loss": 0.0285, "step": 234680 }, { "epoch": 1.51, "learning_rate": 7.278829459715884e-05, "loss": 0.0298, "step": 234690 }, { "epoch": 1.51, "learning_rate": 7.27786132428019e-05, "loss": 0.0267, "step": 234700 }, { "epoch": 1.51, "learning_rate": 7.276893188844498e-05, "loss": 0.0248, "step": 234710 }, { "epoch": 1.51, "learning_rate": 7.275925053408805e-05, "loss": 0.0252, "step": 234720 }, { "epoch": 1.51, "learning_rate": 7.27495691797311e-05, "loss": 0.0276, "step": 234730 }, { "epoch": 1.52, "learning_rate": 7.273988782537418e-05, "loss": 0.026, "step": 234740 }, { "epoch": 1.52, "learning_rate": 7.273020647101725e-05, "loss": 0.0291, "step": 234750 }, { "epoch": 1.52, "learning_rate": 7.272052511666031e-05, "loss": 0.0305, "step": 234760 }, { "epoch": 1.52, "learning_rate": 7.271084376230338e-05, "loss": 0.0225, "step": 234770 }, { "epoch": 1.52, "learning_rate": 7.270116240794645e-05, "loss": 0.0292, "step": 234780 }, { "epoch": 1.52, "learning_rate": 7.269148105358951e-05, "loss": 0.0249, "step": 234790 }, { "epoch": 1.52, "learning_rate": 7.268179969923258e-05, "loss": 0.0229, "step": 234800 }, { "epoch": 1.52, "learning_rate": 7.267211834487566e-05, "loss": 0.0233, "step": 234810 }, { "epoch": 1.52, "learning_rate": 7.266243699051873e-05, "loss": 0.0269, "step": 234820 }, { "epoch": 1.52, "learning_rate": 7.265275563616179e-05, "loss": 0.0241, "step": 234830 }, { "epoch": 1.52, "learning_rate": 7.264307428180486e-05, "loss": 0.0272, "step": 234840 }, { "epoch": 1.52, "learning_rate": 7.263339292744792e-05, "loss": 0.0302, "step": 234850 }, { "epoch": 1.52, "learning_rate": 7.262371157309099e-05, "loss": 0.0251, "step": 234860 }, { "epoch": 1.52, "learning_rate": 7.261403021873406e-05, "loss": 0.0233, "step": 234870 }, { "epoch": 1.52, "learning_rate": 7.260434886437712e-05, "loss": 0.0266, "step": 234880 }, { "epoch": 1.52, "learning_rate": 7.259466751002019e-05, "loss": 0.0351, "step": 234890 }, { "epoch": 1.52, "learning_rate": 7.258498615566327e-05, "loss": 0.0327, "step": 234900 }, { "epoch": 1.52, "learning_rate": 7.257530480130633e-05, "loss": 0.026, "step": 234910 }, { "epoch": 1.52, "learning_rate": 7.25656234469494e-05, "loss": 0.0254, "step": 234920 }, { "epoch": 1.52, "learning_rate": 7.255594209259247e-05, "loss": 0.0276, "step": 234930 }, { "epoch": 1.52, "learning_rate": 7.254626073823553e-05, "loss": 0.0296, "step": 234940 }, { "epoch": 1.52, "learning_rate": 7.25365793838786e-05, "loss": 0.0263, "step": 234950 }, { "epoch": 1.52, "learning_rate": 7.252689802952167e-05, "loss": 0.0282, "step": 234960 }, { "epoch": 1.52, "learning_rate": 7.251721667516475e-05, "loss": 0.0293, "step": 234970 }, { "epoch": 1.52, "learning_rate": 7.25075353208078e-05, "loss": 0.0327, "step": 234980 }, { "epoch": 1.52, "learning_rate": 7.249785396645086e-05, "loss": 0.0232, "step": 234990 }, { "epoch": 1.52, "learning_rate": 7.248817261209394e-05, "loss": 0.0258, "step": 235000 }, { "epoch": 1.52, "eval_cer": 0.9198888261213423, "eval_loss": 0.019709018990397453, "eval_runtime": 120.2635, "eval_samples_per_second": 16.63, "eval_steps_per_second": 4.158, "step": 235000 }, { "epoch": 1.52, "learning_rate": 7.247849125773701e-05, "loss": 0.0354, "step": 235010 }, { "epoch": 1.52, "learning_rate": 7.246880990338008e-05, "loss": 0.0305, "step": 235020 }, { "epoch": 1.52, "learning_rate": 7.245912854902314e-05, "loss": 0.0266, "step": 235030 }, { "epoch": 1.52, "learning_rate": 7.244944719466621e-05, "loss": 0.0355, "step": 235040 }, { "epoch": 1.52, "learning_rate": 7.243976584030928e-05, "loss": 0.0263, "step": 235050 }, { "epoch": 1.52, "learning_rate": 7.243008448595234e-05, "loss": 0.0246, "step": 235060 }, { "epoch": 1.52, "learning_rate": 7.242040313159542e-05, "loss": 0.031, "step": 235070 }, { "epoch": 1.52, "learning_rate": 7.241072177723847e-05, "loss": 0.0277, "step": 235080 }, { "epoch": 1.52, "learning_rate": 7.240104042288155e-05, "loss": 0.0258, "step": 235090 }, { "epoch": 1.52, "learning_rate": 7.239135906852462e-05, "loss": 0.0264, "step": 235100 }, { "epoch": 1.52, "learning_rate": 7.238167771416769e-05, "loss": 0.0276, "step": 235110 }, { "epoch": 1.52, "learning_rate": 7.237199635981075e-05, "loss": 0.026, "step": 235120 }, { "epoch": 1.52, "learning_rate": 7.236231500545382e-05, "loss": 0.0277, "step": 235130 }, { "epoch": 1.52, "learning_rate": 7.235263365109689e-05, "loss": 0.0246, "step": 235140 }, { "epoch": 1.52, "learning_rate": 7.234295229673995e-05, "loss": 0.028, "step": 235150 }, { "epoch": 1.52, "learning_rate": 7.233327094238303e-05, "loss": 0.0241, "step": 235160 }, { "epoch": 1.52, "learning_rate": 7.23235895880261e-05, "loss": 0.0272, "step": 235170 }, { "epoch": 1.52, "learning_rate": 7.231390823366916e-05, "loss": 0.0267, "step": 235180 }, { "epoch": 1.52, "learning_rate": 7.230422687931223e-05, "loss": 0.0297, "step": 235190 }, { "epoch": 1.52, "learning_rate": 7.22945455249553e-05, "loss": 0.029, "step": 235200 }, { "epoch": 1.52, "learning_rate": 7.228486417059836e-05, "loss": 0.0283, "step": 235210 }, { "epoch": 1.52, "learning_rate": 7.227518281624143e-05, "loss": 0.0279, "step": 235220 }, { "epoch": 1.52, "learning_rate": 7.226550146188451e-05, "loss": 0.0269, "step": 235230 }, { "epoch": 1.52, "learning_rate": 7.225582010752756e-05, "loss": 0.0249, "step": 235240 }, { "epoch": 1.52, "learning_rate": 7.224613875317064e-05, "loss": 0.0221, "step": 235250 }, { "epoch": 1.52, "learning_rate": 7.223645739881371e-05, "loss": 0.0298, "step": 235260 }, { "epoch": 1.52, "learning_rate": 7.222677604445677e-05, "loss": 0.0286, "step": 235270 }, { "epoch": 1.52, "learning_rate": 7.221709469009984e-05, "loss": 0.0275, "step": 235280 }, { "epoch": 1.52, "learning_rate": 7.22074133357429e-05, "loss": 0.0252, "step": 235290 }, { "epoch": 1.52, "learning_rate": 7.219773198138597e-05, "loss": 0.0231, "step": 235300 }, { "epoch": 1.52, "learning_rate": 7.218805062702904e-05, "loss": 0.0276, "step": 235310 }, { "epoch": 1.52, "learning_rate": 7.217836927267212e-05, "loss": 0.0253, "step": 235320 }, { "epoch": 1.52, "learning_rate": 7.216868791831518e-05, "loss": 0.03, "step": 235330 }, { "epoch": 1.52, "learning_rate": 7.215900656395824e-05, "loss": 0.0285, "step": 235340 }, { "epoch": 1.52, "learning_rate": 7.214932520960132e-05, "loss": 0.028, "step": 235350 }, { "epoch": 1.52, "learning_rate": 7.213964385524438e-05, "loss": 0.0255, "step": 235360 }, { "epoch": 1.52, "learning_rate": 7.212996250088745e-05, "loss": 0.0258, "step": 235370 }, { "epoch": 1.52, "learning_rate": 7.212028114653052e-05, "loss": 0.0357, "step": 235380 }, { "epoch": 1.52, "learning_rate": 7.21105997921736e-05, "loss": 0.0245, "step": 235390 }, { "epoch": 1.52, "learning_rate": 7.210091843781665e-05, "loss": 0.027, "step": 235400 }, { "epoch": 1.52, "learning_rate": 7.209123708345971e-05, "loss": 0.0265, "step": 235410 }, { "epoch": 1.52, "learning_rate": 7.20815557291028e-05, "loss": 0.0254, "step": 235420 }, { "epoch": 1.52, "learning_rate": 7.207187437474586e-05, "loss": 0.0253, "step": 235430 }, { "epoch": 1.52, "learning_rate": 7.206219302038893e-05, "loss": 0.0281, "step": 235440 }, { "epoch": 1.52, "learning_rate": 7.205251166603199e-05, "loss": 0.0265, "step": 235450 }, { "epoch": 1.52, "learning_rate": 7.204283031167506e-05, "loss": 0.0304, "step": 235460 }, { "epoch": 1.52, "learning_rate": 7.203314895731813e-05, "loss": 0.0254, "step": 235470 }, { "epoch": 1.52, "learning_rate": 7.202346760296119e-05, "loss": 0.0294, "step": 235480 }, { "epoch": 1.52, "learning_rate": 7.201378624860427e-05, "loss": 0.025, "step": 235490 }, { "epoch": 1.52, "learning_rate": 7.200410489424732e-05, "loss": 0.0204, "step": 235500 }, { "epoch": 1.52, "learning_rate": 7.19944235398904e-05, "loss": 0.0311, "step": 235510 }, { "epoch": 1.52, "learning_rate": 7.198474218553347e-05, "loss": 0.0213, "step": 235520 }, { "epoch": 1.52, "learning_rate": 7.197506083117654e-05, "loss": 0.0293, "step": 235530 }, { "epoch": 1.52, "learning_rate": 7.19653794768196e-05, "loss": 0.0272, "step": 235540 }, { "epoch": 1.52, "learning_rate": 7.195569812246267e-05, "loss": 0.0243, "step": 235550 }, { "epoch": 1.52, "learning_rate": 7.194601676810574e-05, "loss": 0.0291, "step": 235560 }, { "epoch": 1.52, "learning_rate": 7.19363354137488e-05, "loss": 0.0251, "step": 235570 }, { "epoch": 1.52, "learning_rate": 7.192665405939188e-05, "loss": 0.0224, "step": 235580 }, { "epoch": 1.52, "learning_rate": 7.191697270503495e-05, "loss": 0.0244, "step": 235590 }, { "epoch": 1.52, "learning_rate": 7.190729135067801e-05, "loss": 0.026, "step": 235600 }, { "epoch": 1.52, "learning_rate": 7.189760999632108e-05, "loss": 0.029, "step": 235610 }, { "epoch": 1.52, "learning_rate": 7.188792864196415e-05, "loss": 0.025, "step": 235620 }, { "epoch": 1.52, "learning_rate": 7.187824728760721e-05, "loss": 0.0283, "step": 235630 }, { "epoch": 1.52, "learning_rate": 7.186856593325028e-05, "loss": 0.0265, "step": 235640 }, { "epoch": 1.52, "learning_rate": 7.185888457889336e-05, "loss": 0.0256, "step": 235650 }, { "epoch": 1.52, "learning_rate": 7.184920322453641e-05, "loss": 0.0335, "step": 235660 }, { "epoch": 1.52, "learning_rate": 7.183952187017949e-05, "loss": 0.0282, "step": 235670 }, { "epoch": 1.52, "learning_rate": 7.182984051582256e-05, "loss": 0.0278, "step": 235680 }, { "epoch": 1.52, "learning_rate": 7.182015916146562e-05, "loss": 0.0302, "step": 235690 }, { "epoch": 1.52, "learning_rate": 7.181047780710869e-05, "loss": 0.0334, "step": 235700 }, { "epoch": 1.52, "learning_rate": 7.180079645275176e-05, "loss": 0.0333, "step": 235710 }, { "epoch": 1.52, "learning_rate": 7.179111509839482e-05, "loss": 0.0231, "step": 235720 }, { "epoch": 1.52, "learning_rate": 7.178143374403789e-05, "loss": 0.0255, "step": 235730 }, { "epoch": 1.52, "learning_rate": 7.177175238968097e-05, "loss": 0.0273, "step": 235740 }, { "epoch": 1.52, "learning_rate": 7.176207103532403e-05, "loss": 0.0282, "step": 235750 }, { "epoch": 1.52, "learning_rate": 7.175238968096709e-05, "loss": 0.0268, "step": 235760 }, { "epoch": 1.52, "learning_rate": 7.174270832661017e-05, "loss": 0.0263, "step": 235770 }, { "epoch": 1.52, "learning_rate": 7.173302697225323e-05, "loss": 0.0243, "step": 235780 }, { "epoch": 1.52, "learning_rate": 7.17233456178963e-05, "loss": 0.0288, "step": 235790 }, { "epoch": 1.52, "learning_rate": 7.171366426353937e-05, "loss": 0.0269, "step": 235800 }, { "epoch": 1.52, "learning_rate": 7.170398290918245e-05, "loss": 0.028, "step": 235810 }, { "epoch": 1.52, "learning_rate": 7.16943015548255e-05, "loss": 0.0267, "step": 235820 }, { "epoch": 1.52, "learning_rate": 7.168462020046856e-05, "loss": 0.027, "step": 235830 }, { "epoch": 1.52, "learning_rate": 7.167493884611164e-05, "loss": 0.03, "step": 235840 }, { "epoch": 1.52, "learning_rate": 7.166525749175471e-05, "loss": 0.0349, "step": 235850 }, { "epoch": 1.52, "learning_rate": 7.165557613739778e-05, "loss": 0.0247, "step": 235860 }, { "epoch": 1.52, "learning_rate": 7.164589478304084e-05, "loss": 0.0303, "step": 235870 }, { "epoch": 1.52, "learning_rate": 7.163621342868391e-05, "loss": 0.025, "step": 235880 }, { "epoch": 1.52, "learning_rate": 7.162653207432698e-05, "loss": 0.0253, "step": 235890 }, { "epoch": 1.52, "learning_rate": 7.161685071997004e-05, "loss": 0.0267, "step": 235900 }, { "epoch": 1.52, "learning_rate": 7.160716936561312e-05, "loss": 0.0204, "step": 235910 }, { "epoch": 1.52, "learning_rate": 7.159748801125617e-05, "loss": 0.0288, "step": 235920 }, { "epoch": 1.52, "learning_rate": 7.158780665689925e-05, "loss": 0.0274, "step": 235930 }, { "epoch": 1.52, "learning_rate": 7.157812530254232e-05, "loss": 0.0242, "step": 235940 }, { "epoch": 1.52, "learning_rate": 7.156844394818539e-05, "loss": 0.0281, "step": 235950 }, { "epoch": 1.52, "learning_rate": 7.155876259382845e-05, "loss": 0.0266, "step": 235960 }, { "epoch": 1.52, "learning_rate": 7.154908123947152e-05, "loss": 0.0235, "step": 235970 }, { "epoch": 1.52, "learning_rate": 7.153939988511459e-05, "loss": 0.028, "step": 235980 }, { "epoch": 1.52, "learning_rate": 7.152971853075765e-05, "loss": 0.0279, "step": 235990 }, { "epoch": 1.52, "learning_rate": 7.152003717640073e-05, "loss": 0.0272, "step": 236000 }, { "epoch": 1.52, "eval_cer": 0.9198336911083493, "eval_loss": 0.019630778580904007, "eval_runtime": 120.0957, "eval_samples_per_second": 16.653, "eval_steps_per_second": 4.163, "step": 236000 }, { "epoch": 1.52, "learning_rate": 7.15103558220438e-05, "loss": 0.0283, "step": 236010 }, { "epoch": 1.52, "learning_rate": 7.150067446768686e-05, "loss": 0.0277, "step": 236020 }, { "epoch": 1.52, "learning_rate": 7.149099311332993e-05, "loss": 0.031, "step": 236030 }, { "epoch": 1.52, "learning_rate": 7.1481311758973e-05, "loss": 0.025, "step": 236040 }, { "epoch": 1.52, "learning_rate": 7.147163040461606e-05, "loss": 0.0232, "step": 236050 }, { "epoch": 1.52, "learning_rate": 7.146194905025913e-05, "loss": 0.0339, "step": 236060 }, { "epoch": 1.52, "learning_rate": 7.145226769590221e-05, "loss": 0.0262, "step": 236070 }, { "epoch": 1.52, "learning_rate": 7.144258634154526e-05, "loss": 0.0252, "step": 236080 }, { "epoch": 1.52, "learning_rate": 7.143290498718834e-05, "loss": 0.0237, "step": 236090 }, { "epoch": 1.52, "learning_rate": 7.142322363283141e-05, "loss": 0.0231, "step": 236100 }, { "epoch": 1.52, "learning_rate": 7.141354227847447e-05, "loss": 0.026, "step": 236110 }, { "epoch": 1.52, "learning_rate": 7.140386092411754e-05, "loss": 0.0261, "step": 236120 }, { "epoch": 1.52, "learning_rate": 7.13941795697606e-05, "loss": 0.0294, "step": 236130 }, { "epoch": 1.52, "learning_rate": 7.138449821540367e-05, "loss": 0.0245, "step": 236140 }, { "epoch": 1.52, "learning_rate": 7.137481686104674e-05, "loss": 0.0246, "step": 236150 }, { "epoch": 1.52, "learning_rate": 7.136513550668982e-05, "loss": 0.0305, "step": 236160 }, { "epoch": 1.52, "learning_rate": 7.135545415233288e-05, "loss": 0.0268, "step": 236170 }, { "epoch": 1.52, "learning_rate": 7.134577279797594e-05, "loss": 0.0203, "step": 236180 }, { "epoch": 1.52, "learning_rate": 7.133609144361902e-05, "loss": 0.0296, "step": 236190 }, { "epoch": 1.52, "learning_rate": 7.132641008926208e-05, "loss": 0.0235, "step": 236200 }, { "epoch": 1.52, "learning_rate": 7.131672873490515e-05, "loss": 0.0232, "step": 236210 }, { "epoch": 1.52, "learning_rate": 7.130704738054822e-05, "loss": 0.024, "step": 236220 }, { "epoch": 1.52, "learning_rate": 7.129736602619128e-05, "loss": 0.0299, "step": 236230 }, { "epoch": 1.52, "learning_rate": 7.128768467183435e-05, "loss": 0.0297, "step": 236240 }, { "epoch": 1.52, "learning_rate": 7.127800331747741e-05, "loss": 0.0258, "step": 236250 }, { "epoch": 1.52, "learning_rate": 7.12683219631205e-05, "loss": 0.0217, "step": 236260 }, { "epoch": 1.52, "learning_rate": 7.125864060876356e-05, "loss": 0.0261, "step": 236270 }, { "epoch": 1.53, "learning_rate": 7.124895925440663e-05, "loss": 0.0255, "step": 236280 }, { "epoch": 1.53, "learning_rate": 7.123927790004969e-05, "loss": 0.0259, "step": 236290 }, { "epoch": 1.53, "learning_rate": 7.122959654569276e-05, "loss": 0.0256, "step": 236300 }, { "epoch": 1.53, "learning_rate": 7.121991519133583e-05, "loss": 0.025, "step": 236310 }, { "epoch": 1.53, "learning_rate": 7.121023383697889e-05, "loss": 0.0297, "step": 236320 }, { "epoch": 1.53, "learning_rate": 7.120055248262196e-05, "loss": 0.0287, "step": 236330 }, { "epoch": 1.53, "learning_rate": 7.119087112826502e-05, "loss": 0.0225, "step": 236340 }, { "epoch": 1.53, "learning_rate": 7.11811897739081e-05, "loss": 0.0262, "step": 236350 }, { "epoch": 1.53, "learning_rate": 7.117150841955117e-05, "loss": 0.0282, "step": 236360 }, { "epoch": 1.53, "learning_rate": 7.116182706519424e-05, "loss": 0.0268, "step": 236370 }, { "epoch": 1.53, "learning_rate": 7.11521457108373e-05, "loss": 0.0323, "step": 236380 }, { "epoch": 1.53, "learning_rate": 7.114246435648037e-05, "loss": 0.0275, "step": 236390 }, { "epoch": 1.53, "learning_rate": 7.113278300212343e-05, "loss": 0.0237, "step": 236400 }, { "epoch": 1.53, "learning_rate": 7.11231016477665e-05, "loss": 0.0258, "step": 236410 }, { "epoch": 1.53, "learning_rate": 7.111342029340958e-05, "loss": 0.0333, "step": 236420 }, { "epoch": 1.53, "learning_rate": 7.110373893905263e-05, "loss": 0.0258, "step": 236430 }, { "epoch": 1.53, "learning_rate": 7.109405758469571e-05, "loss": 0.029, "step": 236440 }, { "epoch": 1.53, "learning_rate": 7.108437623033878e-05, "loss": 0.0298, "step": 236450 }, { "epoch": 1.53, "learning_rate": 7.107469487598185e-05, "loss": 0.0223, "step": 236460 }, { "epoch": 1.53, "learning_rate": 7.106501352162491e-05, "loss": 0.0266, "step": 236470 }, { "epoch": 1.53, "learning_rate": 7.105533216726798e-05, "loss": 0.0339, "step": 236480 }, { "epoch": 1.53, "learning_rate": 7.104565081291104e-05, "loss": 0.0274, "step": 236490 }, { "epoch": 1.53, "learning_rate": 7.103596945855411e-05, "loss": 0.0248, "step": 236500 }, { "epoch": 1.53, "learning_rate": 7.102628810419719e-05, "loss": 0.0351, "step": 236510 }, { "epoch": 1.53, "learning_rate": 7.101660674984026e-05, "loss": 0.0202, "step": 236520 }, { "epoch": 1.53, "learning_rate": 7.100692539548331e-05, "loss": 0.0248, "step": 236530 }, { "epoch": 1.53, "learning_rate": 7.099724404112639e-05, "loss": 0.0258, "step": 236540 }, { "epoch": 1.53, "learning_rate": 7.098756268676946e-05, "loss": 0.026, "step": 236550 }, { "epoch": 1.53, "learning_rate": 7.097788133241252e-05, "loss": 0.0295, "step": 236560 }, { "epoch": 1.53, "learning_rate": 7.096819997805559e-05, "loss": 0.0334, "step": 236570 }, { "epoch": 1.53, "learning_rate": 7.095851862369867e-05, "loss": 0.0221, "step": 236580 }, { "epoch": 1.53, "learning_rate": 7.094883726934172e-05, "loss": 0.0213, "step": 236590 }, { "epoch": 1.53, "learning_rate": 7.093915591498479e-05, "loss": 0.0252, "step": 236600 }, { "epoch": 1.53, "learning_rate": 7.092947456062787e-05, "loss": 0.0262, "step": 236610 }, { "epoch": 1.53, "learning_rate": 7.091979320627093e-05, "loss": 0.0272, "step": 236620 }, { "epoch": 1.53, "learning_rate": 7.0910111851914e-05, "loss": 0.0295, "step": 236630 }, { "epoch": 1.53, "learning_rate": 7.090043049755707e-05, "loss": 0.0291, "step": 236640 }, { "epoch": 1.53, "learning_rate": 7.089074914320013e-05, "loss": 0.0263, "step": 236650 }, { "epoch": 1.53, "learning_rate": 7.08810677888432e-05, "loss": 0.0257, "step": 236660 }, { "epoch": 1.53, "learning_rate": 7.087138643448626e-05, "loss": 0.0221, "step": 236670 }, { "epoch": 1.53, "learning_rate": 7.086170508012934e-05, "loss": 0.024, "step": 236680 }, { "epoch": 1.53, "learning_rate": 7.08520237257724e-05, "loss": 0.0314, "step": 236690 }, { "epoch": 1.53, "learning_rate": 7.084234237141548e-05, "loss": 0.0249, "step": 236700 }, { "epoch": 1.53, "learning_rate": 7.083266101705854e-05, "loss": 0.0234, "step": 236710 }, { "epoch": 1.53, "learning_rate": 7.082297966270161e-05, "loss": 0.0315, "step": 236720 }, { "epoch": 1.53, "learning_rate": 7.081329830834467e-05, "loss": 0.0263, "step": 236730 }, { "epoch": 1.53, "learning_rate": 7.080361695398774e-05, "loss": 0.023, "step": 236740 }, { "epoch": 1.53, "learning_rate": 7.079393559963081e-05, "loss": 0.0326, "step": 236750 }, { "epoch": 1.53, "learning_rate": 7.078425424527387e-05, "loss": 0.0284, "step": 236760 }, { "epoch": 1.53, "learning_rate": 7.077457289091695e-05, "loss": 0.026, "step": 236770 }, { "epoch": 1.53, "learning_rate": 7.076489153656002e-05, "loss": 0.0279, "step": 236780 }, { "epoch": 1.53, "learning_rate": 7.075521018220307e-05, "loss": 0.0267, "step": 236790 }, { "epoch": 1.53, "learning_rate": 7.074552882784615e-05, "loss": 0.0241, "step": 236800 }, { "epoch": 1.53, "learning_rate": 7.073584747348922e-05, "loss": 0.0266, "step": 236810 }, { "epoch": 1.53, "learning_rate": 7.072616611913228e-05, "loss": 0.0242, "step": 236820 }, { "epoch": 1.53, "learning_rate": 7.071648476477535e-05, "loss": 0.0279, "step": 236830 }, { "epoch": 1.53, "learning_rate": 7.070680341041843e-05, "loss": 0.0278, "step": 236840 }, { "epoch": 1.53, "learning_rate": 7.069712205606148e-05, "loss": 0.0312, "step": 236850 }, { "epoch": 1.53, "learning_rate": 7.068744070170455e-05, "loss": 0.0274, "step": 236860 }, { "epoch": 1.53, "learning_rate": 7.067775934734763e-05, "loss": 0.0298, "step": 236870 }, { "epoch": 1.53, "learning_rate": 7.06680779929907e-05, "loss": 0.0268, "step": 236880 }, { "epoch": 1.53, "learning_rate": 7.065839663863376e-05, "loss": 0.028, "step": 236890 }, { "epoch": 1.53, "learning_rate": 7.064871528427683e-05, "loss": 0.024, "step": 236900 }, { "epoch": 1.53, "learning_rate": 7.06390339299199e-05, "loss": 0.0265, "step": 236910 }, { "epoch": 1.53, "learning_rate": 7.062935257556296e-05, "loss": 0.0288, "step": 236920 }, { "epoch": 1.53, "learning_rate": 7.061967122120603e-05, "loss": 0.0278, "step": 236930 }, { "epoch": 1.53, "learning_rate": 7.06099898668491e-05, "loss": 0.0253, "step": 236940 }, { "epoch": 1.53, "learning_rate": 7.060030851249216e-05, "loss": 0.028, "step": 236950 }, { "epoch": 1.53, "learning_rate": 7.059062715813524e-05, "loss": 0.0237, "step": 236960 }, { "epoch": 1.53, "learning_rate": 7.05809458037783e-05, "loss": 0.0352, "step": 236970 }, { "epoch": 1.53, "learning_rate": 7.057126444942137e-05, "loss": 0.0235, "step": 236980 }, { "epoch": 1.53, "learning_rate": 7.056158309506444e-05, "loss": 0.031, "step": 236990 }, { "epoch": 1.53, "learning_rate": 7.05519017407075e-05, "loss": 0.0261, "step": 237000 }, { "epoch": 1.53, "eval_cer": 0.9198870184159982, "eval_loss": 0.019820256158709526, "eval_runtime": 120.3827, "eval_samples_per_second": 16.614, "eval_steps_per_second": 4.153, "step": 237000 }, { "epoch": 1.53, "learning_rate": 7.054222038635057e-05, "loss": 0.0272, "step": 237010 }, { "epoch": 1.53, "learning_rate": 7.053253903199364e-05, "loss": 0.02, "step": 237020 }, { "epoch": 1.53, "learning_rate": 7.052285767763672e-05, "loss": 0.0271, "step": 237030 }, { "epoch": 1.53, "learning_rate": 7.051317632327978e-05, "loss": 0.0267, "step": 237040 }, { "epoch": 1.53, "learning_rate": 7.050349496892285e-05, "loss": 0.025, "step": 237050 }, { "epoch": 1.53, "learning_rate": 7.049381361456592e-05, "loss": 0.0304, "step": 237060 }, { "epoch": 1.53, "learning_rate": 7.048413226020898e-05, "loss": 0.0261, "step": 237070 }, { "epoch": 1.53, "learning_rate": 7.047445090585205e-05, "loss": 0.0267, "step": 237080 }, { "epoch": 1.53, "learning_rate": 7.046476955149511e-05, "loss": 0.0262, "step": 237090 }, { "epoch": 1.53, "learning_rate": 7.04550881971382e-05, "loss": 0.03, "step": 237100 }, { "epoch": 1.53, "learning_rate": 7.044540684278125e-05, "loss": 0.0267, "step": 237110 }, { "epoch": 1.53, "learning_rate": 7.043572548842433e-05, "loss": 0.0261, "step": 237120 }, { "epoch": 1.53, "learning_rate": 7.042604413406739e-05, "loss": 0.0239, "step": 237130 }, { "epoch": 1.53, "learning_rate": 7.041636277971046e-05, "loss": 0.0301, "step": 237140 }, { "epoch": 1.53, "learning_rate": 7.040668142535352e-05, "loss": 0.0271, "step": 237150 }, { "epoch": 1.53, "learning_rate": 7.039700007099659e-05, "loss": 0.0273, "step": 237160 }, { "epoch": 1.53, "learning_rate": 7.038731871663966e-05, "loss": 0.0273, "step": 237170 }, { "epoch": 1.53, "learning_rate": 7.037763736228272e-05, "loss": 0.0282, "step": 237180 }, { "epoch": 1.53, "learning_rate": 7.03679560079258e-05, "loss": 0.0268, "step": 237190 }, { "epoch": 1.53, "learning_rate": 7.035827465356887e-05, "loss": 0.0291, "step": 237200 }, { "epoch": 1.53, "learning_rate": 7.034859329921192e-05, "loss": 0.029, "step": 237210 }, { "epoch": 1.53, "learning_rate": 7.0338911944855e-05, "loss": 0.0234, "step": 237220 }, { "epoch": 1.53, "learning_rate": 7.032923059049807e-05, "loss": 0.0284, "step": 237230 }, { "epoch": 1.53, "learning_rate": 7.031954923614113e-05, "loss": 0.0262, "step": 237240 }, { "epoch": 1.53, "learning_rate": 7.03098678817842e-05, "loss": 0.0293, "step": 237250 }, { "epoch": 1.53, "learning_rate": 7.030018652742728e-05, "loss": 0.025, "step": 237260 }, { "epoch": 1.53, "learning_rate": 7.029050517307033e-05, "loss": 0.0286, "step": 237270 }, { "epoch": 1.53, "learning_rate": 7.02808238187134e-05, "loss": 0.0269, "step": 237280 }, { "epoch": 1.53, "learning_rate": 7.027114246435648e-05, "loss": 0.0324, "step": 237290 }, { "epoch": 1.53, "learning_rate": 7.026146110999955e-05, "loss": 0.03, "step": 237300 }, { "epoch": 1.53, "learning_rate": 7.025177975564261e-05, "loss": 0.0237, "step": 237310 }, { "epoch": 1.53, "learning_rate": 7.024209840128568e-05, "loss": 0.0279, "step": 237320 }, { "epoch": 1.53, "learning_rate": 7.023241704692874e-05, "loss": 0.0241, "step": 237330 }, { "epoch": 1.53, "learning_rate": 7.022273569257181e-05, "loss": 0.0247, "step": 237340 }, { "epoch": 1.53, "learning_rate": 7.021305433821488e-05, "loss": 0.0319, "step": 237350 }, { "epoch": 1.53, "learning_rate": 7.020337298385796e-05, "loss": 0.0274, "step": 237360 }, { "epoch": 1.53, "learning_rate": 7.019369162950101e-05, "loss": 0.0251, "step": 237370 }, { "epoch": 1.53, "learning_rate": 7.018401027514409e-05, "loss": 0.0287, "step": 237380 }, { "epoch": 1.53, "learning_rate": 7.017432892078716e-05, "loss": 0.0265, "step": 237390 }, { "epoch": 1.53, "learning_rate": 7.016464756643022e-05, "loss": 0.0239, "step": 237400 }, { "epoch": 1.53, "learning_rate": 7.015496621207329e-05, "loss": 0.0237, "step": 237410 }, { "epoch": 1.53, "learning_rate": 7.014528485771635e-05, "loss": 0.0235, "step": 237420 }, { "epoch": 1.53, "learning_rate": 7.013560350335942e-05, "loss": 0.0343, "step": 237430 }, { "epoch": 1.53, "learning_rate": 7.012592214900249e-05, "loss": 0.0257, "step": 237440 }, { "epoch": 1.53, "learning_rate": 7.011624079464557e-05, "loss": 0.0274, "step": 237450 }, { "epoch": 1.53, "learning_rate": 7.010655944028863e-05, "loss": 0.0279, "step": 237460 }, { "epoch": 1.53, "learning_rate": 7.00968780859317e-05, "loss": 0.0258, "step": 237470 }, { "epoch": 1.53, "learning_rate": 7.008719673157476e-05, "loss": 0.0273, "step": 237480 }, { "epoch": 1.53, "learning_rate": 7.007751537721783e-05, "loss": 0.0235, "step": 237490 }, { "epoch": 1.53, "learning_rate": 7.00678340228609e-05, "loss": 0.0249, "step": 237500 }, { "epoch": 1.53, "learning_rate": 7.005815266850396e-05, "loss": 0.0255, "step": 237510 }, { "epoch": 1.53, "learning_rate": 7.004847131414703e-05, "loss": 0.021, "step": 237520 }, { "epoch": 1.53, "learning_rate": 7.00387899597901e-05, "loss": 0.0256, "step": 237530 }, { "epoch": 1.53, "learning_rate": 7.002910860543318e-05, "loss": 0.0254, "step": 237540 }, { "epoch": 1.53, "learning_rate": 7.001942725107624e-05, "loss": 0.0267, "step": 237550 }, { "epoch": 1.53, "learning_rate": 7.000974589671931e-05, "loss": 0.0257, "step": 237560 }, { "epoch": 1.53, "learning_rate": 7.000006454236237e-05, "loss": 0.023, "step": 237570 }, { "epoch": 1.53, "learning_rate": 6.999038318800544e-05, "loss": 0.0257, "step": 237580 }, { "epoch": 1.53, "learning_rate": 6.998070183364851e-05, "loss": 0.024, "step": 237590 }, { "epoch": 1.53, "learning_rate": 6.997102047929157e-05, "loss": 0.0232, "step": 237600 }, { "epoch": 1.53, "learning_rate": 6.996133912493465e-05, "loss": 0.0291, "step": 237610 }, { "epoch": 1.53, "learning_rate": 6.995165777057772e-05, "loss": 0.0233, "step": 237620 }, { "epoch": 1.53, "learning_rate": 6.994197641622077e-05, "loss": 0.0261, "step": 237630 }, { "epoch": 1.53, "learning_rate": 6.993229506186385e-05, "loss": 0.0333, "step": 237640 }, { "epoch": 1.53, "learning_rate": 6.992261370750692e-05, "loss": 0.0323, "step": 237650 }, { "epoch": 1.53, "learning_rate": 6.991293235314998e-05, "loss": 0.0299, "step": 237660 }, { "epoch": 1.53, "learning_rate": 6.990325099879305e-05, "loss": 0.0265, "step": 237670 }, { "epoch": 1.53, "learning_rate": 6.989356964443612e-05, "loss": 0.0221, "step": 237680 }, { "epoch": 1.53, "learning_rate": 6.988388829007918e-05, "loss": 0.0288, "step": 237690 }, { "epoch": 1.53, "learning_rate": 6.987420693572225e-05, "loss": 0.03, "step": 237700 }, { "epoch": 1.53, "learning_rate": 6.986452558136533e-05, "loss": 0.0289, "step": 237710 }, { "epoch": 1.53, "learning_rate": 6.98548442270084e-05, "loss": 0.0265, "step": 237720 }, { "epoch": 1.53, "learning_rate": 6.984516287265146e-05, "loss": 0.0309, "step": 237730 }, { "epoch": 1.53, "learning_rate": 6.983548151829453e-05, "loss": 0.0219, "step": 237740 }, { "epoch": 1.53, "learning_rate": 6.98258001639376e-05, "loss": 0.0247, "step": 237750 }, { "epoch": 1.53, "learning_rate": 6.981611880958066e-05, "loss": 0.026, "step": 237760 }, { "epoch": 1.53, "learning_rate": 6.980643745522373e-05, "loss": 0.0238, "step": 237770 }, { "epoch": 1.53, "learning_rate": 6.979675610086679e-05, "loss": 0.0269, "step": 237780 }, { "epoch": 1.53, "learning_rate": 6.978707474650986e-05, "loss": 0.0297, "step": 237790 }, { "epoch": 1.53, "learning_rate": 6.977739339215294e-05, "loss": 0.0259, "step": 237800 }, { "epoch": 1.53, "learning_rate": 6.9767712037796e-05, "loss": 0.0236, "step": 237810 }, { "epoch": 1.53, "learning_rate": 6.975803068343907e-05, "loss": 0.0273, "step": 237820 }, { "epoch": 1.54, "learning_rate": 6.974834932908214e-05, "loss": 0.0258, "step": 237830 }, { "epoch": 1.54, "learning_rate": 6.97386679747252e-05, "loss": 0.027, "step": 237840 }, { "epoch": 1.54, "learning_rate": 6.972898662036827e-05, "loss": 0.0259, "step": 237850 }, { "epoch": 1.54, "learning_rate": 6.971930526601134e-05, "loss": 0.0246, "step": 237860 }, { "epoch": 1.54, "learning_rate": 6.970962391165442e-05, "loss": 0.0232, "step": 237870 }, { "epoch": 1.54, "learning_rate": 6.969994255729747e-05, "loss": 0.0337, "step": 237880 }, { "epoch": 1.54, "learning_rate": 6.969026120294055e-05, "loss": 0.0248, "step": 237890 }, { "epoch": 1.54, "learning_rate": 6.968057984858361e-05, "loss": 0.0283, "step": 237900 }, { "epoch": 1.54, "learning_rate": 6.967089849422668e-05, "loss": 0.0264, "step": 237910 }, { "epoch": 1.54, "learning_rate": 6.966121713986975e-05, "loss": 0.0254, "step": 237920 }, { "epoch": 1.54, "learning_rate": 6.965153578551281e-05, "loss": 0.0285, "step": 237930 }, { "epoch": 1.54, "learning_rate": 6.964185443115588e-05, "loss": 0.0219, "step": 237940 }, { "epoch": 1.54, "learning_rate": 6.963217307679895e-05, "loss": 0.021, "step": 237950 }, { "epoch": 1.54, "learning_rate": 6.962249172244203e-05, "loss": 0.0253, "step": 237960 }, { "epoch": 1.54, "learning_rate": 6.961281036808509e-05, "loss": 0.028, "step": 237970 }, { "epoch": 1.54, "learning_rate": 6.960312901372814e-05, "loss": 0.0326, "step": 237980 }, { "epoch": 1.54, "learning_rate": 6.959344765937122e-05, "loss": 0.0261, "step": 237990 }, { "epoch": 1.54, "learning_rate": 6.958376630501429e-05, "loss": 0.0222, "step": 238000 }, { "epoch": 1.54, "eval_cer": 0.9198617105411818, "eval_loss": 0.019788194447755814, "eval_runtime": 119.9476, "eval_samples_per_second": 16.674, "eval_steps_per_second": 4.168, "step": 238000 }, { "epoch": 1.54, "learning_rate": 6.957408495065736e-05, "loss": 0.0316, "step": 238010 }, { "epoch": 1.54, "learning_rate": 6.956440359630042e-05, "loss": 0.0366, "step": 238020 }, { "epoch": 1.54, "learning_rate": 6.95547222419435e-05, "loss": 0.03, "step": 238030 }, { "epoch": 1.54, "learning_rate": 6.954504088758656e-05, "loss": 0.027, "step": 238040 }, { "epoch": 1.54, "learning_rate": 6.953535953322962e-05, "loss": 0.0266, "step": 238050 }, { "epoch": 1.54, "learning_rate": 6.95256781788727e-05, "loss": 0.0316, "step": 238060 }, { "epoch": 1.54, "learning_rate": 6.951599682451577e-05, "loss": 0.0262, "step": 238070 }, { "epoch": 1.54, "learning_rate": 6.950631547015883e-05, "loss": 0.0263, "step": 238080 }, { "epoch": 1.54, "learning_rate": 6.94966341158019e-05, "loss": 0.024, "step": 238090 }, { "epoch": 1.54, "learning_rate": 6.948695276144497e-05, "loss": 0.0264, "step": 238100 }, { "epoch": 1.54, "learning_rate": 6.947727140708803e-05, "loss": 0.0243, "step": 238110 }, { "epoch": 1.54, "learning_rate": 6.94675900527311e-05, "loss": 0.0293, "step": 238120 }, { "epoch": 1.54, "learning_rate": 6.945790869837418e-05, "loss": 0.0283, "step": 238130 }, { "epoch": 1.54, "learning_rate": 6.944822734401723e-05, "loss": 0.0283, "step": 238140 }, { "epoch": 1.54, "learning_rate": 6.943854598966031e-05, "loss": 0.0255, "step": 238150 }, { "epoch": 1.54, "learning_rate": 6.942886463530338e-05, "loss": 0.0241, "step": 238160 }, { "epoch": 1.54, "learning_rate": 6.941918328094644e-05, "loss": 0.0327, "step": 238170 }, { "epoch": 1.54, "learning_rate": 6.940950192658951e-05, "loss": 0.0263, "step": 238180 }, { "epoch": 1.54, "learning_rate": 6.939982057223258e-05, "loss": 0.0242, "step": 238190 }, { "epoch": 1.54, "learning_rate": 6.939013921787564e-05, "loss": 0.0268, "step": 238200 }, { "epoch": 1.54, "learning_rate": 6.938045786351871e-05, "loss": 0.0256, "step": 238210 }, { "epoch": 1.54, "learning_rate": 6.937077650916179e-05, "loss": 0.0255, "step": 238220 }, { "epoch": 1.54, "learning_rate": 6.936109515480485e-05, "loss": 0.0274, "step": 238230 }, { "epoch": 1.54, "learning_rate": 6.935141380044792e-05, "loss": 0.0228, "step": 238240 }, { "epoch": 1.54, "learning_rate": 6.934173244609099e-05, "loss": 0.0229, "step": 238250 }, { "epoch": 1.54, "learning_rate": 6.933205109173405e-05, "loss": 0.0234, "step": 238260 }, { "epoch": 1.54, "learning_rate": 6.932236973737712e-05, "loss": 0.025, "step": 238270 }, { "epoch": 1.54, "learning_rate": 6.931268838302019e-05, "loss": 0.0219, "step": 238280 }, { "epoch": 1.54, "learning_rate": 6.930300702866327e-05, "loss": 0.0251, "step": 238290 }, { "epoch": 1.54, "learning_rate": 6.929332567430632e-05, "loss": 0.0272, "step": 238300 }, { "epoch": 1.54, "learning_rate": 6.92836443199494e-05, "loss": 0.0254, "step": 238310 }, { "epoch": 1.54, "learning_rate": 6.927396296559246e-05, "loss": 0.0272, "step": 238320 }, { "epoch": 1.54, "learning_rate": 6.926428161123553e-05, "loss": 0.0263, "step": 238330 }, { "epoch": 1.54, "learning_rate": 6.92546002568786e-05, "loss": 0.0298, "step": 238340 }, { "epoch": 1.54, "learning_rate": 6.924491890252166e-05, "loss": 0.0269, "step": 238350 }, { "epoch": 1.54, "learning_rate": 6.923523754816473e-05, "loss": 0.0211, "step": 238360 }, { "epoch": 1.54, "learning_rate": 6.92255561938078e-05, "loss": 0.0259, "step": 238370 }, { "epoch": 1.54, "learning_rate": 6.921587483945088e-05, "loss": 0.0329, "step": 238380 }, { "epoch": 1.54, "learning_rate": 6.920619348509394e-05, "loss": 0.0252, "step": 238390 }, { "epoch": 1.54, "learning_rate": 6.9196512130737e-05, "loss": 0.0241, "step": 238400 }, { "epoch": 1.54, "learning_rate": 6.918683077638007e-05, "loss": 0.0268, "step": 238410 }, { "epoch": 1.54, "learning_rate": 6.917714942202314e-05, "loss": 0.0321, "step": 238420 }, { "epoch": 1.54, "learning_rate": 6.91674680676662e-05, "loss": 0.0274, "step": 238430 }, { "epoch": 1.54, "learning_rate": 6.915778671330927e-05, "loss": 0.0241, "step": 238440 }, { "epoch": 1.54, "learning_rate": 6.914810535895234e-05, "loss": 0.027, "step": 238450 }, { "epoch": 1.54, "learning_rate": 6.91384240045954e-05, "loss": 0.0212, "step": 238460 }, { "epoch": 1.54, "learning_rate": 6.912874265023847e-05, "loss": 0.0292, "step": 238470 }, { "epoch": 1.54, "learning_rate": 6.911906129588155e-05, "loss": 0.029, "step": 238480 }, { "epoch": 1.54, "learning_rate": 6.910937994152462e-05, "loss": 0.0268, "step": 238490 }, { "epoch": 1.54, "learning_rate": 6.909969858716768e-05, "loss": 0.0252, "step": 238500 }, { "epoch": 1.54, "learning_rate": 6.909001723281075e-05, "loss": 0.0309, "step": 238510 }, { "epoch": 1.54, "learning_rate": 6.908033587845382e-05, "loss": 0.0229, "step": 238520 }, { "epoch": 1.54, "learning_rate": 6.907065452409688e-05, "loss": 0.0264, "step": 238530 }, { "epoch": 1.54, "learning_rate": 6.906097316973995e-05, "loss": 0.0291, "step": 238540 }, { "epoch": 1.54, "learning_rate": 6.905129181538303e-05, "loss": 0.0274, "step": 238550 }, { "epoch": 1.54, "learning_rate": 6.904161046102608e-05, "loss": 0.0273, "step": 238560 }, { "epoch": 1.54, "learning_rate": 6.903192910666916e-05, "loss": 0.0233, "step": 238570 }, { "epoch": 1.54, "learning_rate": 6.902224775231223e-05, "loss": 0.0274, "step": 238580 }, { "epoch": 1.54, "learning_rate": 6.90125663979553e-05, "loss": 0.0241, "step": 238590 }, { "epoch": 1.54, "learning_rate": 6.900288504359836e-05, "loss": 0.0268, "step": 238600 }, { "epoch": 1.54, "learning_rate": 6.899320368924143e-05, "loss": 0.0301, "step": 238610 }, { "epoch": 1.54, "learning_rate": 6.898352233488449e-05, "loss": 0.0342, "step": 238620 }, { "epoch": 1.54, "learning_rate": 6.897384098052756e-05, "loss": 0.0277, "step": 238630 }, { "epoch": 1.54, "learning_rate": 6.896415962617064e-05, "loss": 0.0246, "step": 238640 }, { "epoch": 1.54, "learning_rate": 6.89544782718137e-05, "loss": 0.0284, "step": 238650 }, { "epoch": 1.54, "learning_rate": 6.894479691745676e-05, "loss": 0.0279, "step": 238660 }, { "epoch": 1.54, "learning_rate": 6.893511556309984e-05, "loss": 0.0266, "step": 238670 }, { "epoch": 1.54, "learning_rate": 6.89254342087429e-05, "loss": 0.0265, "step": 238680 }, { "epoch": 1.54, "learning_rate": 6.891575285438597e-05, "loss": 0.0242, "step": 238690 }, { "epoch": 1.54, "learning_rate": 6.890607150002904e-05, "loss": 0.0256, "step": 238700 }, { "epoch": 1.54, "learning_rate": 6.889639014567212e-05, "loss": 0.0264, "step": 238710 }, { "epoch": 1.54, "learning_rate": 6.888670879131517e-05, "loss": 0.034, "step": 238720 }, { "epoch": 1.54, "learning_rate": 6.887702743695823e-05, "loss": 0.0308, "step": 238730 }, { "epoch": 1.54, "learning_rate": 6.886734608260131e-05, "loss": 0.0241, "step": 238740 }, { "epoch": 1.54, "learning_rate": 6.885766472824438e-05, "loss": 0.0249, "step": 238750 }, { "epoch": 1.54, "learning_rate": 6.884798337388745e-05, "loss": 0.026, "step": 238760 }, { "epoch": 1.54, "learning_rate": 6.883830201953051e-05, "loss": 0.0293, "step": 238770 }, { "epoch": 1.54, "learning_rate": 6.882862066517358e-05, "loss": 0.0233, "step": 238780 }, { "epoch": 1.54, "learning_rate": 6.881893931081665e-05, "loss": 0.0305, "step": 238790 }, { "epoch": 1.54, "learning_rate": 6.880925795645971e-05, "loss": 0.0276, "step": 238800 }, { "epoch": 1.54, "learning_rate": 6.879957660210279e-05, "loss": 0.0278, "step": 238810 }, { "epoch": 1.54, "learning_rate": 6.878989524774584e-05, "loss": 0.0307, "step": 238820 }, { "epoch": 1.54, "learning_rate": 6.878021389338892e-05, "loss": 0.0278, "step": 238830 }, { "epoch": 1.54, "learning_rate": 6.877053253903199e-05, "loss": 0.0227, "step": 238840 }, { "epoch": 1.54, "learning_rate": 6.876085118467506e-05, "loss": 0.0295, "step": 238850 }, { "epoch": 1.54, "learning_rate": 6.875116983031812e-05, "loss": 0.025, "step": 238860 }, { "epoch": 1.54, "learning_rate": 6.874148847596119e-05, "loss": 0.026, "step": 238870 }, { "epoch": 1.54, "learning_rate": 6.873180712160426e-05, "loss": 0.0286, "step": 238880 }, { "epoch": 1.54, "learning_rate": 6.872212576724732e-05, "loss": 0.0244, "step": 238890 }, { "epoch": 1.54, "learning_rate": 6.87124444128904e-05, "loss": 0.0311, "step": 238900 }, { "epoch": 1.54, "learning_rate": 6.870276305853347e-05, "loss": 0.029, "step": 238910 }, { "epoch": 1.54, "learning_rate": 6.869308170417653e-05, "loss": 0.0288, "step": 238920 }, { "epoch": 1.54, "learning_rate": 6.86834003498196e-05, "loss": 0.029, "step": 238930 }, { "epoch": 1.54, "learning_rate": 6.867371899546267e-05, "loss": 0.0269, "step": 238940 }, { "epoch": 1.54, "learning_rate": 6.866403764110573e-05, "loss": 0.0261, "step": 238950 }, { "epoch": 1.54, "learning_rate": 6.86543562867488e-05, "loss": 0.0299, "step": 238960 }, { "epoch": 1.54, "learning_rate": 6.864467493239186e-05, "loss": 0.0264, "step": 238970 }, { "epoch": 1.54, "learning_rate": 6.863499357803493e-05, "loss": 0.0289, "step": 238980 }, { "epoch": 1.54, "learning_rate": 6.862531222367801e-05, "loss": 0.0246, "step": 238990 }, { "epoch": 1.54, "learning_rate": 6.861563086932108e-05, "loss": 0.0259, "step": 239000 }, { "epoch": 1.54, "eval_cer": 0.9199050954694384, "eval_loss": 0.01946895383298397, "eval_runtime": 120.4017, "eval_samples_per_second": 16.611, "eval_steps_per_second": 4.153, "step": 239000 }, { "epoch": 1.54, "learning_rate": 6.860594951496414e-05, "loss": 0.0281, "step": 239010 }, { "epoch": 1.54, "learning_rate": 6.859626816060721e-05, "loss": 0.0324, "step": 239020 }, { "epoch": 1.54, "learning_rate": 6.858658680625028e-05, "loss": 0.0294, "step": 239030 }, { "epoch": 1.54, "learning_rate": 6.857690545189334e-05, "loss": 0.0236, "step": 239040 }, { "epoch": 1.54, "learning_rate": 6.856722409753641e-05, "loss": 0.024, "step": 239050 }, { "epoch": 1.54, "learning_rate": 6.855754274317949e-05, "loss": 0.0266, "step": 239060 }, { "epoch": 1.54, "learning_rate": 6.854786138882254e-05, "loss": 0.0255, "step": 239070 }, { "epoch": 1.54, "learning_rate": 6.853818003446561e-05, "loss": 0.0267, "step": 239080 }, { "epoch": 1.54, "learning_rate": 6.852849868010869e-05, "loss": 0.0257, "step": 239090 }, { "epoch": 1.54, "learning_rate": 6.851881732575175e-05, "loss": 0.0272, "step": 239100 }, { "epoch": 1.54, "learning_rate": 6.850913597139482e-05, "loss": 0.0257, "step": 239110 }, { "epoch": 1.54, "learning_rate": 6.849945461703789e-05, "loss": 0.0258, "step": 239120 }, { "epoch": 1.54, "learning_rate": 6.848977326268095e-05, "loss": 0.0322, "step": 239130 }, { "epoch": 1.54, "learning_rate": 6.848009190832402e-05, "loss": 0.0296, "step": 239140 }, { "epoch": 1.54, "learning_rate": 6.847041055396708e-05, "loss": 0.0258, "step": 239150 }, { "epoch": 1.54, "learning_rate": 6.846072919961016e-05, "loss": 0.0289, "step": 239160 }, { "epoch": 1.54, "learning_rate": 6.845104784525322e-05, "loss": 0.0268, "step": 239170 }, { "epoch": 1.54, "learning_rate": 6.84413664908963e-05, "loss": 0.0251, "step": 239180 }, { "epoch": 1.54, "learning_rate": 6.843168513653936e-05, "loss": 0.0223, "step": 239190 }, { "epoch": 1.54, "learning_rate": 6.842200378218243e-05, "loss": 0.0296, "step": 239200 }, { "epoch": 1.54, "learning_rate": 6.84123224278255e-05, "loss": 0.0242, "step": 239210 }, { "epoch": 1.54, "learning_rate": 6.840264107346856e-05, "loss": 0.024, "step": 239220 }, { "epoch": 1.54, "learning_rate": 6.839295971911163e-05, "loss": 0.0302, "step": 239230 }, { "epoch": 1.54, "learning_rate": 6.83832783647547e-05, "loss": 0.026, "step": 239240 }, { "epoch": 1.54, "learning_rate": 6.837359701039777e-05, "loss": 0.027, "step": 239250 }, { "epoch": 1.54, "learning_rate": 6.836391565604084e-05, "loss": 0.0254, "step": 239260 }, { "epoch": 1.54, "learning_rate": 6.83542343016839e-05, "loss": 0.0294, "step": 239270 }, { "epoch": 1.54, "learning_rate": 6.834455294732697e-05, "loss": 0.0243, "step": 239280 }, { "epoch": 1.54, "learning_rate": 6.833487159297004e-05, "loss": 0.0295, "step": 239290 }, { "epoch": 1.54, "learning_rate": 6.83251902386131e-05, "loss": 0.0286, "step": 239300 }, { "epoch": 1.54, "learning_rate": 6.831550888425617e-05, "loss": 0.0199, "step": 239310 }, { "epoch": 1.54, "learning_rate": 6.830582752989925e-05, "loss": 0.0238, "step": 239320 }, { "epoch": 1.54, "learning_rate": 6.82961461755423e-05, "loss": 0.0231, "step": 239330 }, { "epoch": 1.54, "learning_rate": 6.828646482118538e-05, "loss": 0.0212, "step": 239340 }, { "epoch": 1.54, "learning_rate": 6.827678346682845e-05, "loss": 0.025, "step": 239350 }, { "epoch": 1.54, "learning_rate": 6.826710211247152e-05, "loss": 0.0214, "step": 239360 }, { "epoch": 1.54, "learning_rate": 6.825742075811458e-05, "loss": 0.0248, "step": 239370 }, { "epoch": 1.55, "learning_rate": 6.824773940375765e-05, "loss": 0.029, "step": 239380 }, { "epoch": 1.55, "learning_rate": 6.823805804940071e-05, "loss": 0.0274, "step": 239390 }, { "epoch": 1.55, "learning_rate": 6.822837669504378e-05, "loss": 0.03, "step": 239400 }, { "epoch": 1.55, "learning_rate": 6.821869534068686e-05, "loss": 0.0247, "step": 239410 }, { "epoch": 1.55, "learning_rate": 6.820901398632993e-05, "loss": 0.0254, "step": 239420 }, { "epoch": 1.55, "learning_rate": 6.819933263197298e-05, "loss": 0.0238, "step": 239430 }, { "epoch": 1.55, "learning_rate": 6.818965127761606e-05, "loss": 0.0272, "step": 239440 }, { "epoch": 1.55, "learning_rate": 6.817996992325913e-05, "loss": 0.0262, "step": 239450 }, { "epoch": 1.55, "learning_rate": 6.817028856890219e-05, "loss": 0.0239, "step": 239460 }, { "epoch": 1.55, "learning_rate": 6.816060721454526e-05, "loss": 0.0265, "step": 239470 }, { "epoch": 1.55, "learning_rate": 6.815092586018834e-05, "loss": 0.0303, "step": 239480 }, { "epoch": 1.55, "learning_rate": 6.814124450583139e-05, "loss": 0.027, "step": 239490 }, { "epoch": 1.55, "learning_rate": 6.813156315147446e-05, "loss": 0.0299, "step": 239500 }, { "epoch": 1.55, "learning_rate": 6.812188179711754e-05, "loss": 0.0265, "step": 239510 }, { "epoch": 1.55, "learning_rate": 6.81122004427606e-05, "loss": 0.0287, "step": 239520 }, { "epoch": 1.55, "learning_rate": 6.810251908840367e-05, "loss": 0.0312, "step": 239530 }, { "epoch": 1.55, "learning_rate": 6.809283773404674e-05, "loss": 0.0265, "step": 239540 }, { "epoch": 1.55, "learning_rate": 6.80831563796898e-05, "loss": 0.0223, "step": 239550 }, { "epoch": 1.55, "learning_rate": 6.807347502533287e-05, "loss": 0.025, "step": 239560 }, { "epoch": 1.55, "learning_rate": 6.806379367097593e-05, "loss": 0.0291, "step": 239570 }, { "epoch": 1.55, "learning_rate": 6.805411231661901e-05, "loss": 0.0272, "step": 239580 }, { "epoch": 1.55, "learning_rate": 6.804443096226207e-05, "loss": 0.027, "step": 239590 }, { "epoch": 1.55, "learning_rate": 6.803474960790515e-05, "loss": 0.0283, "step": 239600 }, { "epoch": 1.55, "learning_rate": 6.802506825354821e-05, "loss": 0.0326, "step": 239610 }, { "epoch": 1.55, "learning_rate": 6.801538689919128e-05, "loss": 0.028, "step": 239620 }, { "epoch": 1.55, "learning_rate": 6.800570554483435e-05, "loss": 0.029, "step": 239630 }, { "epoch": 1.55, "learning_rate": 6.799602419047741e-05, "loss": 0.0261, "step": 239640 }, { "epoch": 1.55, "learning_rate": 6.798634283612048e-05, "loss": 0.0259, "step": 239650 }, { "epoch": 1.55, "learning_rate": 6.797666148176354e-05, "loss": 0.025, "step": 239660 }, { "epoch": 1.55, "learning_rate": 6.796698012740662e-05, "loss": 0.0219, "step": 239670 }, { "epoch": 1.55, "learning_rate": 6.795729877304969e-05, "loss": 0.03, "step": 239680 }, { "epoch": 1.55, "learning_rate": 6.794761741869276e-05, "loss": 0.0316, "step": 239690 }, { "epoch": 1.55, "learning_rate": 6.793793606433582e-05, "loss": 0.0281, "step": 239700 }, { "epoch": 1.55, "learning_rate": 6.792825470997889e-05, "loss": 0.03, "step": 239710 }, { "epoch": 1.55, "learning_rate": 6.791857335562195e-05, "loss": 0.0317, "step": 239720 }, { "epoch": 1.55, "learning_rate": 6.790889200126502e-05, "loss": 0.0226, "step": 239730 }, { "epoch": 1.55, "learning_rate": 6.78992106469081e-05, "loss": 0.0252, "step": 239740 }, { "epoch": 1.55, "learning_rate": 6.788952929255115e-05, "loss": 0.0306, "step": 239750 }, { "epoch": 1.55, "learning_rate": 6.787984793819423e-05, "loss": 0.0223, "step": 239760 }, { "epoch": 1.55, "learning_rate": 6.78701665838373e-05, "loss": 0.0374, "step": 239770 }, { "epoch": 1.55, "learning_rate": 6.786048522948037e-05, "loss": 0.0278, "step": 239780 }, { "epoch": 1.55, "learning_rate": 6.785080387512343e-05, "loss": 0.0286, "step": 239790 }, { "epoch": 1.55, "learning_rate": 6.78411225207665e-05, "loss": 0.0277, "step": 239800 }, { "epoch": 1.55, "learning_rate": 6.783144116640956e-05, "loss": 0.0283, "step": 239810 }, { "epoch": 1.55, "learning_rate": 6.782175981205263e-05, "loss": 0.0312, "step": 239820 }, { "epoch": 1.55, "learning_rate": 6.781207845769571e-05, "loss": 0.0268, "step": 239830 }, { "epoch": 1.55, "learning_rate": 6.780239710333878e-05, "loss": 0.0295, "step": 239840 }, { "epoch": 1.55, "learning_rate": 6.779271574898183e-05, "loss": 0.0264, "step": 239850 }, { "epoch": 1.55, "learning_rate": 6.778303439462491e-05, "loss": 0.0325, "step": 239860 }, { "epoch": 1.55, "learning_rate": 6.777335304026798e-05, "loss": 0.0221, "step": 239870 }, { "epoch": 1.55, "learning_rate": 6.776367168591104e-05, "loss": 0.0192, "step": 239880 }, { "epoch": 1.55, "learning_rate": 6.775399033155411e-05, "loss": 0.0299, "step": 239890 }, { "epoch": 1.55, "learning_rate": 6.774430897719719e-05, "loss": 0.0274, "step": 239900 }, { "epoch": 1.55, "learning_rate": 6.773462762284024e-05, "loss": 0.0217, "step": 239910 }, { "epoch": 1.55, "learning_rate": 6.77249462684833e-05, "loss": 0.03, "step": 239920 }, { "epoch": 1.55, "learning_rate": 6.771526491412639e-05, "loss": 0.0288, "step": 239930 }, { "epoch": 1.55, "learning_rate": 6.770558355976945e-05, "loss": 0.0378, "step": 239940 }, { "epoch": 1.55, "learning_rate": 6.769590220541252e-05, "loss": 0.0326, "step": 239950 }, { "epoch": 1.55, "learning_rate": 6.768622085105559e-05, "loss": 0.0275, "step": 239960 }, { "epoch": 1.55, "learning_rate": 6.767653949669865e-05, "loss": 0.0236, "step": 239970 }, { "epoch": 1.55, "learning_rate": 6.766685814234172e-05, "loss": 0.0212, "step": 239980 }, { "epoch": 1.55, "learning_rate": 6.765717678798478e-05, "loss": 0.0237, "step": 239990 }, { "epoch": 1.55, "learning_rate": 6.764749543362786e-05, "loss": 0.0317, "step": 240000 }, { "epoch": 1.55, "eval_cer": 0.9198644220991978, "eval_loss": 0.019400835037231445, "eval_runtime": 119.9567, "eval_samples_per_second": 16.673, "eval_steps_per_second": 4.168, "step": 240000 }, { "epoch": 1.55, "learning_rate": 6.763781407927092e-05, "loss": 0.0272, "step": 240010 }, { "epoch": 1.55, "learning_rate": 6.7628132724914e-05, "loss": 0.0224, "step": 240020 }, { "epoch": 1.55, "learning_rate": 6.761845137055706e-05, "loss": 0.0265, "step": 240030 }, { "epoch": 1.55, "learning_rate": 6.760877001620013e-05, "loss": 0.0284, "step": 240040 }, { "epoch": 1.55, "learning_rate": 6.75990886618432e-05, "loss": 0.0278, "step": 240050 }, { "epoch": 1.55, "learning_rate": 6.758940730748626e-05, "loss": 0.0267, "step": 240060 }, { "epoch": 1.55, "learning_rate": 6.757972595312933e-05, "loss": 0.025, "step": 240070 }, { "epoch": 1.55, "learning_rate": 6.75700445987724e-05, "loss": 0.0245, "step": 240080 }, { "epoch": 1.55, "learning_rate": 6.756036324441547e-05, "loss": 0.0335, "step": 240090 }, { "epoch": 1.55, "learning_rate": 6.755068189005854e-05, "loss": 0.0251, "step": 240100 }, { "epoch": 1.55, "learning_rate": 6.75410005357016e-05, "loss": 0.0252, "step": 240110 }, { "epoch": 1.55, "learning_rate": 6.753131918134467e-05, "loss": 0.0224, "step": 240120 }, { "epoch": 1.55, "learning_rate": 6.752163782698774e-05, "loss": 0.0321, "step": 240130 }, { "epoch": 1.55, "learning_rate": 6.75119564726308e-05, "loss": 0.0261, "step": 240140 }, { "epoch": 1.55, "learning_rate": 6.750227511827387e-05, "loss": 0.0305, "step": 240150 }, { "epoch": 1.55, "learning_rate": 6.749259376391695e-05, "loss": 0.0251, "step": 240160 }, { "epoch": 1.55, "learning_rate": 6.748291240956e-05, "loss": 0.0275, "step": 240170 }, { "epoch": 1.55, "learning_rate": 6.747323105520307e-05, "loss": 0.0246, "step": 240180 }, { "epoch": 1.55, "learning_rate": 6.746354970084615e-05, "loss": 0.0233, "step": 240190 }, { "epoch": 1.55, "learning_rate": 6.745386834648922e-05, "loss": 0.0296, "step": 240200 }, { "epoch": 1.55, "learning_rate": 6.744418699213228e-05, "loss": 0.0255, "step": 240210 }, { "epoch": 1.55, "learning_rate": 6.743450563777535e-05, "loss": 0.0295, "step": 240220 }, { "epoch": 1.55, "learning_rate": 6.742482428341841e-05, "loss": 0.0232, "step": 240230 }, { "epoch": 1.55, "learning_rate": 6.741514292906148e-05, "loss": 0.0234, "step": 240240 }, { "epoch": 1.55, "learning_rate": 6.740546157470455e-05, "loss": 0.0247, "step": 240250 }, { "epoch": 1.55, "learning_rate": 6.739578022034763e-05, "loss": 0.0245, "step": 240260 }, { "epoch": 1.55, "learning_rate": 6.738609886599068e-05, "loss": 0.0372, "step": 240270 }, { "epoch": 1.55, "learning_rate": 6.737641751163376e-05, "loss": 0.0258, "step": 240280 }, { "epoch": 1.55, "learning_rate": 6.736673615727683e-05, "loss": 0.0293, "step": 240290 }, { "epoch": 1.55, "learning_rate": 6.735705480291989e-05, "loss": 0.0224, "step": 240300 }, { "epoch": 1.55, "learning_rate": 6.734737344856296e-05, "loss": 0.0274, "step": 240310 }, { "epoch": 1.55, "learning_rate": 6.733769209420602e-05, "loss": 0.0275, "step": 240320 }, { "epoch": 1.55, "learning_rate": 6.732801073984909e-05, "loss": 0.0292, "step": 240330 }, { "epoch": 1.55, "learning_rate": 6.731832938549216e-05, "loss": 0.0231, "step": 240340 }, { "epoch": 1.55, "learning_rate": 6.730864803113524e-05, "loss": 0.0287, "step": 240350 }, { "epoch": 1.55, "learning_rate": 6.72989666767783e-05, "loss": 0.0289, "step": 240360 }, { "epoch": 1.55, "learning_rate": 6.728928532242137e-05, "loss": 0.0278, "step": 240370 }, { "epoch": 1.55, "learning_rate": 6.727960396806444e-05, "loss": 0.0237, "step": 240380 }, { "epoch": 1.55, "learning_rate": 6.72699226137075e-05, "loss": 0.0288, "step": 240390 }, { "epoch": 1.55, "learning_rate": 6.726024125935057e-05, "loss": 0.0232, "step": 240400 }, { "epoch": 1.55, "learning_rate": 6.725055990499363e-05, "loss": 0.026, "step": 240410 }, { "epoch": 1.55, "learning_rate": 6.72408785506367e-05, "loss": 0.0271, "step": 240420 }, { "epoch": 1.55, "learning_rate": 6.723119719627977e-05, "loss": 0.0276, "step": 240430 }, { "epoch": 1.55, "learning_rate": 6.722151584192285e-05, "loss": 0.026, "step": 240440 }, { "epoch": 1.55, "learning_rate": 6.721183448756591e-05, "loss": 0.0264, "step": 240450 }, { "epoch": 1.55, "learning_rate": 6.720215313320898e-05, "loss": 0.0235, "step": 240460 }, { "epoch": 1.55, "learning_rate": 6.719247177885204e-05, "loss": 0.0252, "step": 240470 }, { "epoch": 1.55, "learning_rate": 6.718279042449511e-05, "loss": 0.0264, "step": 240480 }, { "epoch": 1.55, "learning_rate": 6.717310907013818e-05, "loss": 0.0256, "step": 240490 }, { "epoch": 1.55, "learning_rate": 6.716342771578124e-05, "loss": 0.0278, "step": 240500 }, { "epoch": 1.55, "learning_rate": 6.715374636142432e-05, "loss": 0.026, "step": 240510 }, { "epoch": 1.55, "learning_rate": 6.714406500706738e-05, "loss": 0.0243, "step": 240520 }, { "epoch": 1.55, "learning_rate": 6.713438365271044e-05, "loss": 0.0289, "step": 240530 }, { "epoch": 1.55, "learning_rate": 6.712470229835352e-05, "loss": 0.0239, "step": 240540 }, { "epoch": 1.55, "learning_rate": 6.711502094399659e-05, "loss": 0.0212, "step": 240550 }, { "epoch": 1.55, "learning_rate": 6.710533958963965e-05, "loss": 0.0237, "step": 240560 }, { "epoch": 1.55, "learning_rate": 6.709565823528272e-05, "loss": 0.0235, "step": 240570 }, { "epoch": 1.55, "learning_rate": 6.708597688092579e-05, "loss": 0.0287, "step": 240580 }, { "epoch": 1.55, "learning_rate": 6.707629552656885e-05, "loss": 0.0319, "step": 240590 }, { "epoch": 1.55, "learning_rate": 6.706661417221192e-05, "loss": 0.0251, "step": 240600 }, { "epoch": 1.55, "learning_rate": 6.7056932817855e-05, "loss": 0.0211, "step": 240610 }, { "epoch": 1.55, "learning_rate": 6.704725146349805e-05, "loss": 0.0233, "step": 240620 }, { "epoch": 1.55, "learning_rate": 6.703757010914113e-05, "loss": 0.0247, "step": 240630 }, { "epoch": 1.55, "learning_rate": 6.70278887547842e-05, "loss": 0.0283, "step": 240640 }, { "epoch": 1.55, "learning_rate": 6.701820740042726e-05, "loss": 0.0253, "step": 240650 }, { "epoch": 1.55, "learning_rate": 6.700852604607033e-05, "loss": 0.0293, "step": 240660 }, { "epoch": 1.55, "learning_rate": 6.69988446917134e-05, "loss": 0.0266, "step": 240670 }, { "epoch": 1.55, "learning_rate": 6.698916333735646e-05, "loss": 0.025, "step": 240680 }, { "epoch": 1.55, "learning_rate": 6.697948198299953e-05, "loss": 0.0231, "step": 240690 }, { "epoch": 1.55, "learning_rate": 6.696980062864261e-05, "loss": 0.0259, "step": 240700 }, { "epoch": 1.55, "learning_rate": 6.696011927428568e-05, "loss": 0.0275, "step": 240710 }, { "epoch": 1.55, "learning_rate": 6.695043791992874e-05, "loss": 0.0251, "step": 240720 }, { "epoch": 1.55, "learning_rate": 6.694075656557181e-05, "loss": 0.0256, "step": 240730 }, { "epoch": 1.55, "learning_rate": 6.693107521121487e-05, "loss": 0.0255, "step": 240740 }, { "epoch": 1.55, "learning_rate": 6.692139385685794e-05, "loss": 0.0203, "step": 240750 }, { "epoch": 1.55, "learning_rate": 6.6911712502501e-05, "loss": 0.0251, "step": 240760 }, { "epoch": 1.55, "learning_rate": 6.690203114814409e-05, "loss": 0.0225, "step": 240770 }, { "epoch": 1.55, "learning_rate": 6.689234979378714e-05, "loss": 0.0271, "step": 240780 }, { "epoch": 1.55, "learning_rate": 6.688266843943022e-05, "loss": 0.0268, "step": 240790 }, { "epoch": 1.55, "learning_rate": 6.687298708507328e-05, "loss": 0.023, "step": 240800 }, { "epoch": 1.55, "learning_rate": 6.686330573071635e-05, "loss": 0.0233, "step": 240810 }, { "epoch": 1.55, "learning_rate": 6.685362437635942e-05, "loss": 0.0258, "step": 240820 }, { "epoch": 1.55, "learning_rate": 6.684394302200248e-05, "loss": 0.0276, "step": 240830 }, { "epoch": 1.55, "learning_rate": 6.683426166764555e-05, "loss": 0.0215, "step": 240840 }, { "epoch": 1.55, "learning_rate": 6.682458031328862e-05, "loss": 0.0225, "step": 240850 }, { "epoch": 1.55, "learning_rate": 6.68148989589317e-05, "loss": 0.0265, "step": 240860 }, { "epoch": 1.55, "learning_rate": 6.680521760457476e-05, "loss": 0.0247, "step": 240870 }, { "epoch": 1.55, "learning_rate": 6.679553625021781e-05, "loss": 0.0268, "step": 240880 }, { "epoch": 1.55, "learning_rate": 6.67858548958609e-05, "loss": 0.0299, "step": 240890 }, { "epoch": 1.55, "learning_rate": 6.677617354150396e-05, "loss": 0.0254, "step": 240900 }, { "epoch": 1.55, "learning_rate": 6.676649218714703e-05, "loss": 0.0252, "step": 240910 }, { "epoch": 1.55, "learning_rate": 6.67568108327901e-05, "loss": 0.0302, "step": 240920 }, { "epoch": 1.56, "learning_rate": 6.674712947843317e-05, "loss": 0.0227, "step": 240930 }, { "epoch": 1.56, "learning_rate": 6.673744812407623e-05, "loss": 0.0259, "step": 240940 }, { "epoch": 1.56, "learning_rate": 6.672776676971929e-05, "loss": 0.023, "step": 240950 }, { "epoch": 1.56, "learning_rate": 6.671808541536237e-05, "loss": 0.0256, "step": 240960 }, { "epoch": 1.56, "learning_rate": 6.670840406100544e-05, "loss": 0.0271, "step": 240970 }, { "epoch": 1.56, "learning_rate": 6.66987227066485e-05, "loss": 0.0295, "step": 240980 }, { "epoch": 1.56, "learning_rate": 6.668904135229157e-05, "loss": 0.0253, "step": 240990 }, { "epoch": 1.56, "learning_rate": 6.667935999793464e-05, "loss": 0.0266, "step": 241000 }, { "epoch": 1.56, "eval_cer": 0.9198906338266862, "eval_loss": 0.019124064594507217, "eval_runtime": 120.0034, "eval_samples_per_second": 16.666, "eval_steps_per_second": 4.167, "step": 241000 }, { "epoch": 1.56, "learning_rate": 6.66696786435777e-05, "loss": 0.0262, "step": 241010 }, { "epoch": 1.56, "learning_rate": 6.665999728922077e-05, "loss": 0.025, "step": 241020 }, { "epoch": 1.56, "learning_rate": 6.665031593486385e-05, "loss": 0.0251, "step": 241030 }, { "epoch": 1.56, "learning_rate": 6.66406345805069e-05, "loss": 0.0287, "step": 241040 }, { "epoch": 1.56, "learning_rate": 6.663095322614998e-05, "loss": 0.0262, "step": 241050 }, { "epoch": 1.56, "learning_rate": 6.662127187179305e-05, "loss": 0.0244, "step": 241060 }, { "epoch": 1.56, "learning_rate": 6.661159051743611e-05, "loss": 0.0248, "step": 241070 }, { "epoch": 1.56, "learning_rate": 6.660190916307918e-05, "loss": 0.0241, "step": 241080 }, { "epoch": 1.56, "learning_rate": 6.659222780872225e-05, "loss": 0.0257, "step": 241090 }, { "epoch": 1.56, "learning_rate": 6.658254645436531e-05, "loss": 0.0322, "step": 241100 }, { "epoch": 1.56, "learning_rate": 6.657286510000838e-05, "loss": 0.0252, "step": 241110 }, { "epoch": 1.56, "learning_rate": 6.656318374565146e-05, "loss": 0.0274, "step": 241120 }, { "epoch": 1.56, "learning_rate": 6.655350239129452e-05, "loss": 0.0268, "step": 241130 }, { "epoch": 1.56, "learning_rate": 6.654382103693759e-05, "loss": 0.0257, "step": 241140 }, { "epoch": 1.56, "learning_rate": 6.653413968258066e-05, "loss": 0.034, "step": 241150 }, { "epoch": 1.56, "learning_rate": 6.652445832822372e-05, "loss": 0.0275, "step": 241160 }, { "epoch": 1.56, "learning_rate": 6.651477697386679e-05, "loss": 0.0226, "step": 241170 }, { "epoch": 1.56, "learning_rate": 6.650509561950986e-05, "loss": 0.0254, "step": 241180 }, { "epoch": 1.56, "learning_rate": 6.649541426515294e-05, "loss": 0.022, "step": 241190 }, { "epoch": 1.56, "learning_rate": 6.648573291079599e-05, "loss": 0.0255, "step": 241200 }, { "epoch": 1.56, "learning_rate": 6.647605155643907e-05, "loss": 0.029, "step": 241210 }, { "epoch": 1.56, "learning_rate": 6.646637020208213e-05, "loss": 0.0261, "step": 241220 }, { "epoch": 1.56, "learning_rate": 6.64566888477252e-05, "loss": 0.0249, "step": 241230 }, { "epoch": 1.56, "learning_rate": 6.644700749336827e-05, "loss": 0.0261, "step": 241240 }, { "epoch": 1.56, "learning_rate": 6.643732613901133e-05, "loss": 0.0258, "step": 241250 }, { "epoch": 1.56, "learning_rate": 6.64276447846544e-05, "loss": 0.0266, "step": 241260 }, { "epoch": 1.56, "learning_rate": 6.641796343029747e-05, "loss": 0.035, "step": 241270 }, { "epoch": 1.56, "learning_rate": 6.640828207594055e-05, "loss": 0.0283, "step": 241280 }, { "epoch": 1.56, "learning_rate": 6.639860072158361e-05, "loss": 0.0234, "step": 241290 }, { "epoch": 1.56, "learning_rate": 6.638891936722666e-05, "loss": 0.0254, "step": 241300 }, { "epoch": 1.56, "learning_rate": 6.637923801286974e-05, "loss": 0.0296, "step": 241310 }, { "epoch": 1.56, "learning_rate": 6.636955665851281e-05, "loss": 0.027, "step": 241320 }, { "epoch": 1.56, "learning_rate": 6.635987530415588e-05, "loss": 0.029, "step": 241330 }, { "epoch": 1.56, "learning_rate": 6.635019394979894e-05, "loss": 0.0282, "step": 241340 }, { "epoch": 1.56, "learning_rate": 6.634051259544202e-05, "loss": 0.0281, "step": 241350 }, { "epoch": 1.56, "learning_rate": 6.633083124108508e-05, "loss": 0.0261, "step": 241360 }, { "epoch": 1.56, "learning_rate": 6.632114988672814e-05, "loss": 0.0317, "step": 241370 }, { "epoch": 1.56, "learning_rate": 6.631146853237122e-05, "loss": 0.0203, "step": 241380 }, { "epoch": 1.56, "learning_rate": 6.630178717801429e-05, "loss": 0.0291, "step": 241390 }, { "epoch": 1.56, "learning_rate": 6.629210582365735e-05, "loss": 0.0252, "step": 241400 }, { "epoch": 1.56, "learning_rate": 6.628242446930042e-05, "loss": 0.0245, "step": 241410 }, { "epoch": 1.56, "learning_rate": 6.627274311494349e-05, "loss": 0.0221, "step": 241420 }, { "epoch": 1.56, "learning_rate": 6.626306176058655e-05, "loss": 0.0273, "step": 241430 }, { "epoch": 1.56, "learning_rate": 6.625338040622962e-05, "loss": 0.0325, "step": 241440 }, { "epoch": 1.56, "learning_rate": 6.62436990518727e-05, "loss": 0.024, "step": 241450 }, { "epoch": 1.56, "learning_rate": 6.623401769751575e-05, "loss": 0.0215, "step": 241460 }, { "epoch": 1.56, "learning_rate": 6.622433634315883e-05, "loss": 0.0244, "step": 241470 }, { "epoch": 1.56, "learning_rate": 6.62146549888019e-05, "loss": 0.0291, "step": 241480 }, { "epoch": 1.56, "learning_rate": 6.620497363444496e-05, "loss": 0.0261, "step": 241490 }, { "epoch": 1.56, "learning_rate": 6.619529228008803e-05, "loss": 0.026, "step": 241500 }, { "epoch": 1.56, "learning_rate": 6.61856109257311e-05, "loss": 0.0307, "step": 241510 }, { "epoch": 1.56, "learning_rate": 6.617592957137416e-05, "loss": 0.0251, "step": 241520 }, { "epoch": 1.56, "learning_rate": 6.616624821701723e-05, "loss": 0.0254, "step": 241530 }, { "epoch": 1.56, "learning_rate": 6.615656686266031e-05, "loss": 0.0247, "step": 241540 }, { "epoch": 1.56, "learning_rate": 6.614688550830337e-05, "loss": 0.0313, "step": 241550 }, { "epoch": 1.56, "learning_rate": 6.613720415394644e-05, "loss": 0.0287, "step": 241560 }, { "epoch": 1.56, "learning_rate": 6.612752279958951e-05, "loss": 0.0305, "step": 241570 }, { "epoch": 1.56, "learning_rate": 6.611784144523257e-05, "loss": 0.0292, "step": 241580 }, { "epoch": 1.56, "learning_rate": 6.610816009087564e-05, "loss": 0.0256, "step": 241590 }, { "epoch": 1.56, "learning_rate": 6.60984787365187e-05, "loss": 0.024, "step": 241600 }, { "epoch": 1.56, "learning_rate": 6.608879738216177e-05, "loss": 0.0245, "step": 241610 }, { "epoch": 1.56, "learning_rate": 6.607911602780484e-05, "loss": 0.0253, "step": 241620 }, { "epoch": 1.56, "learning_rate": 6.606943467344792e-05, "loss": 0.0272, "step": 241630 }, { "epoch": 1.56, "learning_rate": 6.605975331909098e-05, "loss": 0.0239, "step": 241640 }, { "epoch": 1.56, "learning_rate": 6.605007196473405e-05, "loss": 0.0275, "step": 241650 }, { "epoch": 1.56, "learning_rate": 6.604039061037712e-05, "loss": 0.0318, "step": 241660 }, { "epoch": 1.56, "learning_rate": 6.603070925602018e-05, "loss": 0.0317, "step": 241670 }, { "epoch": 1.56, "learning_rate": 6.602102790166325e-05, "loss": 0.0278, "step": 241680 }, { "epoch": 1.56, "learning_rate": 6.601134654730632e-05, "loss": 0.0251, "step": 241690 }, { "epoch": 1.56, "learning_rate": 6.60016651929494e-05, "loss": 0.0247, "step": 241700 }, { "epoch": 1.56, "learning_rate": 6.599198383859245e-05, "loss": 0.0278, "step": 241710 }, { "epoch": 1.56, "learning_rate": 6.598230248423551e-05, "loss": 0.0265, "step": 241720 }, { "epoch": 1.56, "learning_rate": 6.59726211298786e-05, "loss": 0.026, "step": 241730 }, { "epoch": 1.56, "learning_rate": 6.596293977552166e-05, "loss": 0.0256, "step": 241740 }, { "epoch": 1.56, "learning_rate": 6.595325842116473e-05, "loss": 0.0298, "step": 241750 }, { "epoch": 1.56, "learning_rate": 6.594357706680779e-05, "loss": 0.0293, "step": 241760 }, { "epoch": 1.56, "learning_rate": 6.593389571245086e-05, "loss": 0.026, "step": 241770 }, { "epoch": 1.56, "learning_rate": 6.592421435809393e-05, "loss": 0.0241, "step": 241780 }, { "epoch": 1.56, "learning_rate": 6.591453300373699e-05, "loss": 0.0281, "step": 241790 }, { "epoch": 1.56, "learning_rate": 6.590485164938007e-05, "loss": 0.0221, "step": 241800 }, { "epoch": 1.56, "learning_rate": 6.589517029502312e-05, "loss": 0.0288, "step": 241810 }, { "epoch": 1.56, "learning_rate": 6.58854889406662e-05, "loss": 0.0316, "step": 241820 }, { "epoch": 1.56, "learning_rate": 6.587580758630927e-05, "loss": 0.0322, "step": 241830 }, { "epoch": 1.56, "learning_rate": 6.586612623195234e-05, "loss": 0.0256, "step": 241840 }, { "epoch": 1.56, "learning_rate": 6.58564448775954e-05, "loss": 0.0237, "step": 241850 }, { "epoch": 1.56, "learning_rate": 6.584676352323847e-05, "loss": 0.0236, "step": 241860 }, { "epoch": 1.56, "learning_rate": 6.583708216888154e-05, "loss": 0.0247, "step": 241870 }, { "epoch": 1.56, "learning_rate": 6.58274008145246e-05, "loss": 0.0235, "step": 241880 }, { "epoch": 1.56, "learning_rate": 6.581771946016768e-05, "loss": 0.0248, "step": 241890 }, { "epoch": 1.56, "learning_rate": 6.580803810581075e-05, "loss": 0.0278, "step": 241900 }, { "epoch": 1.56, "learning_rate": 6.579835675145381e-05, "loss": 0.0271, "step": 241910 }, { "epoch": 1.56, "learning_rate": 6.578867539709688e-05, "loss": 0.0288, "step": 241920 }, { "epoch": 1.56, "learning_rate": 6.577899404273995e-05, "loss": 0.0286, "step": 241930 }, { "epoch": 1.56, "learning_rate": 6.576931268838301e-05, "loss": 0.0279, "step": 241940 }, { "epoch": 1.56, "learning_rate": 6.575963133402608e-05, "loss": 0.0279, "step": 241950 }, { "epoch": 1.56, "learning_rate": 6.574994997966916e-05, "loss": 0.0262, "step": 241960 }, { "epoch": 1.56, "learning_rate": 6.574026862531221e-05, "loss": 0.0244, "step": 241970 }, { "epoch": 1.56, "learning_rate": 6.573058727095528e-05, "loss": 0.0287, "step": 241980 }, { "epoch": 1.56, "learning_rate": 6.572090591659836e-05, "loss": 0.0228, "step": 241990 }, { "epoch": 1.56, "learning_rate": 6.571122456224142e-05, "loss": 0.0272, "step": 242000 }, { "epoch": 1.56, "eval_cer": 0.9198599028358377, "eval_loss": 0.019341401755809784, "eval_runtime": 120.0186, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 242000 }, { "epoch": 1.56, "learning_rate": 6.570154320788449e-05, "loss": 0.0295, "step": 242010 }, { "epoch": 1.56, "learning_rate": 6.569186185352756e-05, "loss": 0.0279, "step": 242020 }, { "epoch": 1.56, "learning_rate": 6.568218049917062e-05, "loss": 0.0264, "step": 242030 }, { "epoch": 1.56, "learning_rate": 6.567249914481369e-05, "loss": 0.0254, "step": 242040 }, { "epoch": 1.56, "learning_rate": 6.566281779045675e-05, "loss": 0.0301, "step": 242050 }, { "epoch": 1.56, "learning_rate": 6.565313643609983e-05, "loss": 0.0256, "step": 242060 }, { "epoch": 1.56, "learning_rate": 6.564345508174289e-05, "loss": 0.0276, "step": 242070 }, { "epoch": 1.56, "learning_rate": 6.563377372738597e-05, "loss": 0.0284, "step": 242080 }, { "epoch": 1.56, "learning_rate": 6.562409237302903e-05, "loss": 0.0275, "step": 242090 }, { "epoch": 1.56, "learning_rate": 6.56144110186721e-05, "loss": 0.0287, "step": 242100 }, { "epoch": 1.56, "learning_rate": 6.560472966431517e-05, "loss": 0.0259, "step": 242110 }, { "epoch": 1.56, "learning_rate": 6.559504830995823e-05, "loss": 0.0223, "step": 242120 }, { "epoch": 1.56, "learning_rate": 6.55853669556013e-05, "loss": 0.0262, "step": 242130 }, { "epoch": 1.56, "learning_rate": 6.557568560124436e-05, "loss": 0.0265, "step": 242140 }, { "epoch": 1.56, "learning_rate": 6.556600424688744e-05, "loss": 0.0251, "step": 242150 }, { "epoch": 1.56, "learning_rate": 6.555632289253051e-05, "loss": 0.0257, "step": 242160 }, { "epoch": 1.56, "learning_rate": 6.554664153817358e-05, "loss": 0.0243, "step": 242170 }, { "epoch": 1.56, "learning_rate": 6.553696018381664e-05, "loss": 0.0242, "step": 242180 }, { "epoch": 1.56, "learning_rate": 6.552727882945971e-05, "loss": 0.0243, "step": 242190 }, { "epoch": 1.56, "learning_rate": 6.551759747510278e-05, "loss": 0.0227, "step": 242200 }, { "epoch": 1.56, "learning_rate": 6.550791612074584e-05, "loss": 0.0239, "step": 242210 }, { "epoch": 1.56, "learning_rate": 6.549823476638892e-05, "loss": 0.0246, "step": 242220 }, { "epoch": 1.56, "learning_rate": 6.548855341203197e-05, "loss": 0.0286, "step": 242230 }, { "epoch": 1.56, "learning_rate": 6.547887205767505e-05, "loss": 0.0305, "step": 242240 }, { "epoch": 1.56, "learning_rate": 6.546919070331812e-05, "loss": 0.0253, "step": 242250 }, { "epoch": 1.56, "learning_rate": 6.545950934896119e-05, "loss": 0.0286, "step": 242260 }, { "epoch": 1.56, "learning_rate": 6.544982799460425e-05, "loss": 0.0257, "step": 242270 }, { "epoch": 1.56, "learning_rate": 6.544014664024732e-05, "loss": 0.0255, "step": 242280 }, { "epoch": 1.56, "learning_rate": 6.543046528589038e-05, "loss": 0.0253, "step": 242290 }, { "epoch": 1.56, "learning_rate": 6.542078393153345e-05, "loss": 0.0254, "step": 242300 }, { "epoch": 1.56, "learning_rate": 6.541110257717653e-05, "loss": 0.026, "step": 242310 }, { "epoch": 1.56, "learning_rate": 6.54014212228196e-05, "loss": 0.0243, "step": 242320 }, { "epoch": 1.56, "learning_rate": 6.539173986846265e-05, "loss": 0.0233, "step": 242330 }, { "epoch": 1.56, "learning_rate": 6.538205851410573e-05, "loss": 0.0259, "step": 242340 }, { "epoch": 1.56, "learning_rate": 6.53723771597488e-05, "loss": 0.0253, "step": 242350 }, { "epoch": 1.56, "learning_rate": 6.536269580539186e-05, "loss": 0.0253, "step": 242360 }, { "epoch": 1.56, "learning_rate": 6.535301445103493e-05, "loss": 0.0282, "step": 242370 }, { "epoch": 1.56, "learning_rate": 6.534333309667801e-05, "loss": 0.0236, "step": 242380 }, { "epoch": 1.56, "learning_rate": 6.533365174232106e-05, "loss": 0.0241, "step": 242390 }, { "epoch": 1.56, "learning_rate": 6.532397038796413e-05, "loss": 0.0274, "step": 242400 }, { "epoch": 1.56, "learning_rate": 6.531428903360721e-05, "loss": 0.0231, "step": 242410 }, { "epoch": 1.56, "learning_rate": 6.530460767925027e-05, "loss": 0.0295, "step": 242420 }, { "epoch": 1.56, "learning_rate": 6.529492632489334e-05, "loss": 0.0267, "step": 242430 }, { "epoch": 1.56, "learning_rate": 6.52852449705364e-05, "loss": 0.0269, "step": 242440 }, { "epoch": 1.56, "learning_rate": 6.527556361617947e-05, "loss": 0.0259, "step": 242450 }, { "epoch": 1.56, "learning_rate": 6.526588226182254e-05, "loss": 0.0313, "step": 242460 }, { "epoch": 1.56, "learning_rate": 6.52562009074656e-05, "loss": 0.0229, "step": 242470 }, { "epoch": 1.57, "learning_rate": 6.524651955310868e-05, "loss": 0.0303, "step": 242480 }, { "epoch": 1.57, "learning_rate": 6.523683819875174e-05, "loss": 0.0268, "step": 242490 }, { "epoch": 1.57, "learning_rate": 6.522715684439482e-05, "loss": 0.0307, "step": 242500 }, { "epoch": 1.57, "learning_rate": 6.521747549003788e-05, "loss": 0.0301, "step": 242510 }, { "epoch": 1.57, "learning_rate": 6.520779413568095e-05, "loss": 0.0324, "step": 242520 }, { "epoch": 1.57, "learning_rate": 6.519811278132402e-05, "loss": 0.0251, "step": 242530 }, { "epoch": 1.57, "learning_rate": 6.518843142696708e-05, "loss": 0.0276, "step": 242540 }, { "epoch": 1.57, "learning_rate": 6.517875007261015e-05, "loss": 0.0233, "step": 242550 }, { "epoch": 1.57, "learning_rate": 6.516906871825321e-05, "loss": 0.0261, "step": 242560 }, { "epoch": 1.57, "learning_rate": 6.51593873638963e-05, "loss": 0.0302, "step": 242570 }, { "epoch": 1.57, "learning_rate": 6.514970600953936e-05, "loss": 0.0335, "step": 242580 }, { "epoch": 1.57, "learning_rate": 6.514002465518243e-05, "loss": 0.0288, "step": 242590 }, { "epoch": 1.57, "learning_rate": 6.513034330082549e-05, "loss": 0.0378, "step": 242600 }, { "epoch": 1.57, "learning_rate": 6.512066194646856e-05, "loss": 0.0269, "step": 242610 }, { "epoch": 1.57, "learning_rate": 6.511098059211162e-05, "loss": 0.0266, "step": 242620 }, { "epoch": 1.57, "learning_rate": 6.510129923775469e-05, "loss": 0.0253, "step": 242630 }, { "epoch": 1.57, "learning_rate": 6.509161788339777e-05, "loss": 0.0278, "step": 242640 }, { "epoch": 1.57, "learning_rate": 6.508193652904082e-05, "loss": 0.023, "step": 242650 }, { "epoch": 1.57, "learning_rate": 6.50722551746839e-05, "loss": 0.0278, "step": 242660 }, { "epoch": 1.57, "learning_rate": 6.506257382032697e-05, "loss": 0.0246, "step": 242670 }, { "epoch": 1.57, "learning_rate": 6.505289246597004e-05, "loss": 0.0223, "step": 242680 }, { "epoch": 1.57, "learning_rate": 6.50432111116131e-05, "loss": 0.0275, "step": 242690 }, { "epoch": 1.57, "learning_rate": 6.503352975725617e-05, "loss": 0.0235, "step": 242700 }, { "epoch": 1.57, "learning_rate": 6.502384840289923e-05, "loss": 0.0265, "step": 242710 }, { "epoch": 1.57, "learning_rate": 6.50141670485423e-05, "loss": 0.0268, "step": 242720 }, { "epoch": 1.57, "learning_rate": 6.500448569418538e-05, "loss": 0.0322, "step": 242730 }, { "epoch": 1.57, "learning_rate": 6.499480433982845e-05, "loss": 0.0224, "step": 242740 }, { "epoch": 1.57, "learning_rate": 6.49851229854715e-05, "loss": 0.032, "step": 242750 }, { "epoch": 1.57, "learning_rate": 6.497544163111458e-05, "loss": 0.0293, "step": 242760 }, { "epoch": 1.57, "learning_rate": 6.496576027675765e-05, "loss": 0.0321, "step": 242770 }, { "epoch": 1.57, "learning_rate": 6.495607892240071e-05, "loss": 0.0272, "step": 242780 }, { "epoch": 1.57, "learning_rate": 6.494639756804378e-05, "loss": 0.0237, "step": 242790 }, { "epoch": 1.57, "learning_rate": 6.493671621368686e-05, "loss": 0.03, "step": 242800 }, { "epoch": 1.57, "learning_rate": 6.492703485932991e-05, "loss": 0.0276, "step": 242810 }, { "epoch": 1.57, "learning_rate": 6.491735350497298e-05, "loss": 0.0261, "step": 242820 }, { "epoch": 1.57, "learning_rate": 6.490767215061606e-05, "loss": 0.0278, "step": 242830 }, { "epoch": 1.57, "learning_rate": 6.489799079625912e-05, "loss": 0.0292, "step": 242840 }, { "epoch": 1.57, "learning_rate": 6.488830944190219e-05, "loss": 0.0245, "step": 242850 }, { "epoch": 1.57, "learning_rate": 6.487862808754526e-05, "loss": 0.0264, "step": 242860 }, { "epoch": 1.57, "learning_rate": 6.486894673318832e-05, "loss": 0.0326, "step": 242870 }, { "epoch": 1.57, "learning_rate": 6.485926537883139e-05, "loss": 0.0243, "step": 242880 }, { "epoch": 1.57, "learning_rate": 6.484958402447445e-05, "loss": 0.0238, "step": 242890 }, { "epoch": 1.57, "learning_rate": 6.483990267011753e-05, "loss": 0.0261, "step": 242900 }, { "epoch": 1.57, "learning_rate": 6.483022131576059e-05, "loss": 0.0279, "step": 242910 }, { "epoch": 1.57, "learning_rate": 6.482053996140367e-05, "loss": 0.0286, "step": 242920 }, { "epoch": 1.57, "learning_rate": 6.481085860704673e-05, "loss": 0.0312, "step": 242930 }, { "epoch": 1.57, "learning_rate": 6.48011772526898e-05, "loss": 0.0362, "step": 242940 }, { "epoch": 1.57, "learning_rate": 6.479149589833287e-05, "loss": 0.0275, "step": 242950 }, { "epoch": 1.57, "learning_rate": 6.478181454397593e-05, "loss": 0.0343, "step": 242960 }, { "epoch": 1.57, "learning_rate": 6.4772133189619e-05, "loss": 0.0283, "step": 242970 }, { "epoch": 1.57, "learning_rate": 6.476245183526206e-05, "loss": 0.0279, "step": 242980 }, { "epoch": 1.57, "learning_rate": 6.475277048090514e-05, "loss": 0.0267, "step": 242990 }, { "epoch": 1.57, "learning_rate": 6.474308912654821e-05, "loss": 0.0236, "step": 243000 }, { "epoch": 1.57, "eval_cer": 0.9198508643091177, "eval_loss": 0.019448544830083847, "eval_runtime": 120.0183, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 243000 }, { "epoch": 1.57, "learning_rate": 6.473340777219128e-05, "loss": 0.0247, "step": 243010 }, { "epoch": 1.57, "learning_rate": 6.472372641783434e-05, "loss": 0.0266, "step": 243020 }, { "epoch": 1.57, "learning_rate": 6.471404506347741e-05, "loss": 0.0275, "step": 243030 }, { "epoch": 1.57, "learning_rate": 6.470436370912047e-05, "loss": 0.0265, "step": 243040 }, { "epoch": 1.57, "learning_rate": 6.469468235476354e-05, "loss": 0.0346, "step": 243050 }, { "epoch": 1.57, "learning_rate": 6.468500100040661e-05, "loss": 0.0299, "step": 243060 }, { "epoch": 1.57, "learning_rate": 6.467531964604967e-05, "loss": 0.0315, "step": 243070 }, { "epoch": 1.57, "learning_rate": 6.466563829169275e-05, "loss": 0.0286, "step": 243080 }, { "epoch": 1.57, "learning_rate": 6.465595693733582e-05, "loss": 0.0229, "step": 243090 }, { "epoch": 1.57, "learning_rate": 6.464627558297889e-05, "loss": 0.0295, "step": 243100 }, { "epoch": 1.57, "learning_rate": 6.463659422862195e-05, "loss": 0.0272, "step": 243110 }, { "epoch": 1.57, "learning_rate": 6.462691287426502e-05, "loss": 0.0256, "step": 243120 }, { "epoch": 1.57, "learning_rate": 6.461723151990808e-05, "loss": 0.0239, "step": 243130 }, { "epoch": 1.57, "learning_rate": 6.460755016555115e-05, "loss": 0.0243, "step": 243140 }, { "epoch": 1.57, "learning_rate": 6.459786881119423e-05, "loss": 0.0243, "step": 243150 }, { "epoch": 1.57, "learning_rate": 6.458818745683728e-05, "loss": 0.0251, "step": 243160 }, { "epoch": 1.57, "learning_rate": 6.457850610248035e-05, "loss": 0.0302, "step": 243170 }, { "epoch": 1.57, "learning_rate": 6.456882474812343e-05, "loss": 0.0311, "step": 243180 }, { "epoch": 1.57, "learning_rate": 6.45591433937665e-05, "loss": 0.0279, "step": 243190 }, { "epoch": 1.57, "learning_rate": 6.454946203940956e-05, "loss": 0.026, "step": 243200 }, { "epoch": 1.57, "learning_rate": 6.453978068505263e-05, "loss": 0.0248, "step": 243210 }, { "epoch": 1.57, "learning_rate": 6.45300993306957e-05, "loss": 0.0273, "step": 243220 }, { "epoch": 1.57, "learning_rate": 6.452041797633876e-05, "loss": 0.0283, "step": 243230 }, { "epoch": 1.57, "learning_rate": 6.451073662198183e-05, "loss": 0.0413, "step": 243240 }, { "epoch": 1.57, "learning_rate": 6.45010552676249e-05, "loss": 0.0299, "step": 243250 }, { "epoch": 1.57, "learning_rate": 6.449137391326796e-05, "loss": 0.0197, "step": 243260 }, { "epoch": 1.57, "learning_rate": 6.448169255891104e-05, "loss": 0.0242, "step": 243270 }, { "epoch": 1.57, "learning_rate": 6.44720112045541e-05, "loss": 0.0261, "step": 243280 }, { "epoch": 1.57, "learning_rate": 6.446232985019717e-05, "loss": 0.0304, "step": 243290 }, { "epoch": 1.57, "learning_rate": 6.445264849584024e-05, "loss": 0.0242, "step": 243300 }, { "epoch": 1.57, "learning_rate": 6.44429671414833e-05, "loss": 0.0299, "step": 243310 }, { "epoch": 1.57, "learning_rate": 6.443328578712637e-05, "loss": 0.0285, "step": 243320 }, { "epoch": 1.57, "learning_rate": 6.442360443276944e-05, "loss": 0.0228, "step": 243330 }, { "epoch": 1.57, "learning_rate": 6.441392307841252e-05, "loss": 0.0249, "step": 243340 }, { "epoch": 1.57, "learning_rate": 6.440424172405558e-05, "loss": 0.0263, "step": 243350 }, { "epoch": 1.57, "learning_rate": 6.439456036969865e-05, "loss": 0.0267, "step": 243360 }, { "epoch": 1.57, "learning_rate": 6.438487901534171e-05, "loss": 0.0242, "step": 243370 }, { "epoch": 1.57, "learning_rate": 6.437519766098478e-05, "loss": 0.027, "step": 243380 }, { "epoch": 1.57, "learning_rate": 6.436551630662785e-05, "loss": 0.0325, "step": 243390 }, { "epoch": 1.57, "learning_rate": 6.435583495227091e-05, "loss": 0.0242, "step": 243400 }, { "epoch": 1.57, "learning_rate": 6.4346153597914e-05, "loss": 0.0312, "step": 243410 }, { "epoch": 1.57, "learning_rate": 6.433647224355705e-05, "loss": 0.029, "step": 243420 }, { "epoch": 1.57, "learning_rate": 6.432679088920013e-05, "loss": 0.0227, "step": 243430 }, { "epoch": 1.57, "learning_rate": 6.431710953484319e-05, "loss": 0.023, "step": 243440 }, { "epoch": 1.57, "learning_rate": 6.430742818048626e-05, "loss": 0.0213, "step": 243450 }, { "epoch": 1.57, "learning_rate": 6.429774682612932e-05, "loss": 0.0329, "step": 243460 }, { "epoch": 1.57, "learning_rate": 6.428806547177239e-05, "loss": 0.0279, "step": 243470 }, { "epoch": 1.57, "learning_rate": 6.427838411741546e-05, "loss": 0.0322, "step": 243480 }, { "epoch": 1.57, "learning_rate": 6.426870276305852e-05, "loss": 0.0228, "step": 243490 }, { "epoch": 1.57, "learning_rate": 6.42590214087016e-05, "loss": 0.0244, "step": 243500 }, { "epoch": 1.57, "learning_rate": 6.424934005434467e-05, "loss": 0.0247, "step": 243510 }, { "epoch": 1.57, "learning_rate": 6.423965869998772e-05, "loss": 0.0286, "step": 243520 }, { "epoch": 1.57, "learning_rate": 6.42299773456308e-05, "loss": 0.0274, "step": 243530 }, { "epoch": 1.57, "learning_rate": 6.422029599127387e-05, "loss": 0.026, "step": 243540 }, { "epoch": 1.57, "learning_rate": 6.421061463691693e-05, "loss": 0.0314, "step": 243550 }, { "epoch": 1.57, "learning_rate": 6.420093328256e-05, "loss": 0.0262, "step": 243560 }, { "epoch": 1.57, "learning_rate": 6.419125192820308e-05, "loss": 0.024, "step": 243570 }, { "epoch": 1.57, "learning_rate": 6.418157057384613e-05, "loss": 0.0274, "step": 243580 }, { "epoch": 1.57, "learning_rate": 6.41718892194892e-05, "loss": 0.0247, "step": 243590 }, { "epoch": 1.57, "learning_rate": 6.416220786513228e-05, "loss": 0.027, "step": 243600 }, { "epoch": 1.57, "learning_rate": 6.415252651077535e-05, "loss": 0.025, "step": 243610 }, { "epoch": 1.57, "learning_rate": 6.414284515641841e-05, "loss": 0.0257, "step": 243620 }, { "epoch": 1.57, "learning_rate": 6.413316380206148e-05, "loss": 0.0268, "step": 243630 }, { "epoch": 1.57, "learning_rate": 6.412348244770454e-05, "loss": 0.0235, "step": 243640 }, { "epoch": 1.57, "learning_rate": 6.411380109334761e-05, "loss": 0.0317, "step": 243650 }, { "epoch": 1.57, "learning_rate": 6.410411973899068e-05, "loss": 0.025, "step": 243660 }, { "epoch": 1.57, "learning_rate": 6.409443838463376e-05, "loss": 0.0255, "step": 243670 }, { "epoch": 1.57, "learning_rate": 6.408475703027681e-05, "loss": 0.0269, "step": 243680 }, { "epoch": 1.57, "learning_rate": 6.407507567591989e-05, "loss": 0.0219, "step": 243690 }, { "epoch": 1.57, "learning_rate": 6.406539432156295e-05, "loss": 0.0237, "step": 243700 }, { "epoch": 1.57, "learning_rate": 6.405571296720602e-05, "loss": 0.0219, "step": 243710 }, { "epoch": 1.57, "learning_rate": 6.404603161284909e-05, "loss": 0.0265, "step": 243720 }, { "epoch": 1.57, "learning_rate": 6.403635025849215e-05, "loss": 0.0218, "step": 243730 }, { "epoch": 1.57, "learning_rate": 6.402666890413522e-05, "loss": 0.0298, "step": 243740 }, { "epoch": 1.57, "learning_rate": 6.401698754977829e-05, "loss": 0.0238, "step": 243750 }, { "epoch": 1.57, "learning_rate": 6.400730619542137e-05, "loss": 0.0298, "step": 243760 }, { "epoch": 1.57, "learning_rate": 6.399762484106443e-05, "loss": 0.0219, "step": 243770 }, { "epoch": 1.57, "learning_rate": 6.398794348670748e-05, "loss": 0.0242, "step": 243780 }, { "epoch": 1.57, "learning_rate": 6.397826213235056e-05, "loss": 0.0282, "step": 243790 }, { "epoch": 1.57, "learning_rate": 6.396858077799363e-05, "loss": 0.0224, "step": 243800 }, { "epoch": 1.57, "learning_rate": 6.39588994236367e-05, "loss": 0.0275, "step": 243810 }, { "epoch": 1.57, "learning_rate": 6.394921806927976e-05, "loss": 0.026, "step": 243820 }, { "epoch": 1.57, "learning_rate": 6.393953671492284e-05, "loss": 0.0276, "step": 243830 }, { "epoch": 1.57, "learning_rate": 6.39298553605659e-05, "loss": 0.0288, "step": 243840 }, { "epoch": 1.57, "learning_rate": 6.392017400620896e-05, "loss": 0.0267, "step": 243850 }, { "epoch": 1.57, "learning_rate": 6.391049265185204e-05, "loss": 0.028, "step": 243860 }, { "epoch": 1.57, "learning_rate": 6.390081129749511e-05, "loss": 0.0217, "step": 243870 }, { "epoch": 1.57, "learning_rate": 6.389112994313817e-05, "loss": 0.0274, "step": 243880 }, { "epoch": 1.57, "learning_rate": 6.388144858878124e-05, "loss": 0.0291, "step": 243890 }, { "epoch": 1.57, "learning_rate": 6.387176723442431e-05, "loss": 0.0252, "step": 243900 }, { "epoch": 1.57, "learning_rate": 6.386208588006737e-05, "loss": 0.0269, "step": 243910 }, { "epoch": 1.57, "learning_rate": 6.385240452571044e-05, "loss": 0.0253, "step": 243920 }, { "epoch": 1.57, "learning_rate": 6.384272317135352e-05, "loss": 0.0232, "step": 243930 }, { "epoch": 1.57, "learning_rate": 6.383304181699657e-05, "loss": 0.0255, "step": 243940 }, { "epoch": 1.57, "learning_rate": 6.382336046263965e-05, "loss": 0.026, "step": 243950 }, { "epoch": 1.57, "learning_rate": 6.381367910828272e-05, "loss": 0.0305, "step": 243960 }, { "epoch": 1.57, "learning_rate": 6.380399775392578e-05, "loss": 0.0273, "step": 243970 }, { "epoch": 1.57, "learning_rate": 6.379431639956885e-05, "loss": 0.0213, "step": 243980 }, { "epoch": 1.57, "learning_rate": 6.378463504521192e-05, "loss": 0.0256, "step": 243990 }, { "epoch": 1.57, "learning_rate": 6.377495369085498e-05, "loss": 0.0266, "step": 244000 }, { "epoch": 1.57, "eval_cer": 0.9198400180770534, "eval_loss": 0.019307343289256096, "eval_runtime": 120.042, "eval_samples_per_second": 16.661, "eval_steps_per_second": 4.165, "step": 244000 }, { "epoch": 1.57, "learning_rate": 6.376527233649805e-05, "loss": 0.0235, "step": 244010 }, { "epoch": 1.57, "learning_rate": 6.375559098214113e-05, "loss": 0.0252, "step": 244020 }, { "epoch": 1.58, "learning_rate": 6.37459096277842e-05, "loss": 0.0287, "step": 244030 }, { "epoch": 1.58, "learning_rate": 6.373622827342726e-05, "loss": 0.035, "step": 244040 }, { "epoch": 1.58, "learning_rate": 6.372654691907033e-05, "loss": 0.0262, "step": 244050 }, { "epoch": 1.58, "learning_rate": 6.37168655647134e-05, "loss": 0.0305, "step": 244060 }, { "epoch": 1.58, "learning_rate": 6.370718421035646e-05, "loss": 0.0224, "step": 244070 }, { "epoch": 1.58, "learning_rate": 6.369750285599953e-05, "loss": 0.0272, "step": 244080 }, { "epoch": 1.58, "learning_rate": 6.36878215016426e-05, "loss": 0.0239, "step": 244090 }, { "epoch": 1.58, "learning_rate": 6.367814014728566e-05, "loss": 0.0223, "step": 244100 }, { "epoch": 1.58, "learning_rate": 6.366845879292874e-05, "loss": 0.0264, "step": 244110 }, { "epoch": 1.58, "learning_rate": 6.36587774385718e-05, "loss": 0.0255, "step": 244120 }, { "epoch": 1.58, "learning_rate": 6.364909608421487e-05, "loss": 0.0236, "step": 244130 }, { "epoch": 1.58, "learning_rate": 6.363941472985794e-05, "loss": 0.0275, "step": 244140 }, { "epoch": 1.58, "learning_rate": 6.3629733375501e-05, "loss": 0.0298, "step": 244150 }, { "epoch": 1.58, "learning_rate": 6.362005202114407e-05, "loss": 0.027, "step": 244160 }, { "epoch": 1.58, "learning_rate": 6.361037066678714e-05, "loss": 0.0215, "step": 244170 }, { "epoch": 1.58, "learning_rate": 6.360068931243022e-05, "loss": 0.0251, "step": 244180 }, { "epoch": 1.58, "learning_rate": 6.359100795807328e-05, "loss": 0.0255, "step": 244190 }, { "epoch": 1.58, "learning_rate": 6.358132660371633e-05, "loss": 0.0225, "step": 244200 }, { "epoch": 1.58, "learning_rate": 6.357164524935941e-05, "loss": 0.0273, "step": 244210 }, { "epoch": 1.58, "learning_rate": 6.356196389500248e-05, "loss": 0.0285, "step": 244220 }, { "epoch": 1.58, "learning_rate": 6.355228254064555e-05, "loss": 0.0205, "step": 244230 }, { "epoch": 1.58, "learning_rate": 6.354260118628861e-05, "loss": 0.0337, "step": 244240 }, { "epoch": 1.58, "learning_rate": 6.353291983193168e-05, "loss": 0.03, "step": 244250 }, { "epoch": 1.58, "learning_rate": 6.352323847757475e-05, "loss": 0.0247, "step": 244260 }, { "epoch": 1.58, "learning_rate": 6.351355712321781e-05, "loss": 0.0275, "step": 244270 }, { "epoch": 1.58, "learning_rate": 6.350387576886089e-05, "loss": 0.0254, "step": 244280 }, { "epoch": 1.58, "learning_rate": 6.349419441450396e-05, "loss": 0.0276, "step": 244290 }, { "epoch": 1.58, "learning_rate": 6.348451306014702e-05, "loss": 0.0265, "step": 244300 }, { "epoch": 1.58, "learning_rate": 6.347483170579009e-05, "loss": 0.0244, "step": 244310 }, { "epoch": 1.58, "learning_rate": 6.346515035143316e-05, "loss": 0.0261, "step": 244320 }, { "epoch": 1.58, "learning_rate": 6.345546899707622e-05, "loss": 0.025, "step": 244330 }, { "epoch": 1.58, "learning_rate": 6.344578764271929e-05, "loss": 0.0238, "step": 244340 }, { "epoch": 1.58, "learning_rate": 6.343610628836237e-05, "loss": 0.0266, "step": 244350 }, { "epoch": 1.58, "learning_rate": 6.342642493400542e-05, "loss": 0.0249, "step": 244360 }, { "epoch": 1.58, "learning_rate": 6.34167435796485e-05, "loss": 0.028, "step": 244370 }, { "epoch": 1.58, "learning_rate": 6.340706222529157e-05, "loss": 0.0261, "step": 244380 }, { "epoch": 1.58, "learning_rate": 6.339738087093463e-05, "loss": 0.0286, "step": 244390 }, { "epoch": 1.58, "learning_rate": 6.33876995165777e-05, "loss": 0.0236, "step": 244400 }, { "epoch": 1.58, "learning_rate": 6.337801816222077e-05, "loss": 0.0271, "step": 244410 }, { "epoch": 1.58, "learning_rate": 6.336833680786383e-05, "loss": 0.0255, "step": 244420 }, { "epoch": 1.58, "learning_rate": 6.33586554535069e-05, "loss": 0.0226, "step": 244430 }, { "epoch": 1.58, "learning_rate": 6.334897409914998e-05, "loss": 0.0298, "step": 244440 }, { "epoch": 1.58, "learning_rate": 6.333929274479304e-05, "loss": 0.0296, "step": 244450 }, { "epoch": 1.58, "learning_rate": 6.332961139043611e-05, "loss": 0.0223, "step": 244460 }, { "epoch": 1.58, "learning_rate": 6.331993003607918e-05, "loss": 0.0267, "step": 244470 }, { "epoch": 1.58, "learning_rate": 6.331024868172224e-05, "loss": 0.0249, "step": 244480 }, { "epoch": 1.58, "learning_rate": 6.330056732736531e-05, "loss": 0.0225, "step": 244490 }, { "epoch": 1.58, "learning_rate": 6.329088597300838e-05, "loss": 0.0303, "step": 244500 }, { "epoch": 1.58, "learning_rate": 6.328120461865144e-05, "loss": 0.0277, "step": 244510 }, { "epoch": 1.58, "learning_rate": 6.327152326429451e-05, "loss": 0.028, "step": 244520 }, { "epoch": 1.58, "learning_rate": 6.326184190993759e-05, "loss": 0.0251, "step": 244530 }, { "epoch": 1.58, "learning_rate": 6.325216055558065e-05, "loss": 0.0282, "step": 244540 }, { "epoch": 1.58, "learning_rate": 6.324247920122372e-05, "loss": 0.0226, "step": 244550 }, { "epoch": 1.58, "learning_rate": 6.323279784686679e-05, "loss": 0.0229, "step": 244560 }, { "epoch": 1.58, "learning_rate": 6.322311649250985e-05, "loss": 0.0288, "step": 244570 }, { "epoch": 1.58, "learning_rate": 6.321343513815292e-05, "loss": 0.0276, "step": 244580 }, { "epoch": 1.58, "learning_rate": 6.320375378379599e-05, "loss": 0.0261, "step": 244590 }, { "epoch": 1.58, "learning_rate": 6.319407242943907e-05, "loss": 0.0316, "step": 244600 }, { "epoch": 1.58, "learning_rate": 6.318439107508212e-05, "loss": 0.0322, "step": 244610 }, { "epoch": 1.58, "learning_rate": 6.317470972072518e-05, "loss": 0.0228, "step": 244620 }, { "epoch": 1.58, "learning_rate": 6.316502836636826e-05, "loss": 0.028, "step": 244630 }, { "epoch": 1.58, "learning_rate": 6.315534701201133e-05, "loss": 0.0325, "step": 244640 }, { "epoch": 1.58, "learning_rate": 6.31456656576544e-05, "loss": 0.03, "step": 244650 }, { "epoch": 1.58, "learning_rate": 6.313598430329746e-05, "loss": 0.0275, "step": 244660 }, { "epoch": 1.58, "learning_rate": 6.312630294894053e-05, "loss": 0.0266, "step": 244670 }, { "epoch": 1.58, "learning_rate": 6.31166215945836e-05, "loss": 0.0244, "step": 244680 }, { "epoch": 1.58, "learning_rate": 6.310694024022666e-05, "loss": 0.0255, "step": 244690 }, { "epoch": 1.58, "learning_rate": 6.309725888586974e-05, "loss": 0.0231, "step": 244700 }, { "epoch": 1.58, "learning_rate": 6.30875775315128e-05, "loss": 0.0251, "step": 244710 }, { "epoch": 1.58, "learning_rate": 6.307789617715587e-05, "loss": 0.0286, "step": 244720 }, { "epoch": 1.58, "learning_rate": 6.306821482279894e-05, "loss": 0.0266, "step": 244730 }, { "epoch": 1.58, "learning_rate": 6.3058533468442e-05, "loss": 0.0293, "step": 244740 }, { "epoch": 1.58, "learning_rate": 6.304885211408507e-05, "loss": 0.0271, "step": 244750 }, { "epoch": 1.58, "learning_rate": 6.303917075972814e-05, "loss": 0.0235, "step": 244760 }, { "epoch": 1.58, "learning_rate": 6.30294894053712e-05, "loss": 0.0203, "step": 244770 }, { "epoch": 1.58, "learning_rate": 6.301980805101427e-05, "loss": 0.0238, "step": 244780 }, { "epoch": 1.58, "learning_rate": 6.301012669665735e-05, "loss": 0.0304, "step": 244790 }, { "epoch": 1.58, "learning_rate": 6.300044534230042e-05, "loss": 0.0302, "step": 244800 }, { "epoch": 1.58, "learning_rate": 6.299076398794348e-05, "loss": 0.0314, "step": 244810 }, { "epoch": 1.58, "learning_rate": 6.298108263358655e-05, "loss": 0.0246, "step": 244820 }, { "epoch": 1.58, "learning_rate": 6.297140127922962e-05, "loss": 0.0286, "step": 244830 }, { "epoch": 1.58, "learning_rate": 6.296171992487268e-05, "loss": 0.019, "step": 244840 }, { "epoch": 1.58, "learning_rate": 6.295203857051575e-05, "loss": 0.0223, "step": 244850 }, { "epoch": 1.58, "learning_rate": 6.294235721615883e-05, "loss": 0.0254, "step": 244860 }, { "epoch": 1.58, "learning_rate": 6.293267586180188e-05, "loss": 0.0255, "step": 244870 }, { "epoch": 1.58, "learning_rate": 6.292299450744496e-05, "loss": 0.02, "step": 244880 }, { "epoch": 1.58, "learning_rate": 6.291331315308803e-05, "loss": 0.0227, "step": 244890 }, { "epoch": 1.58, "learning_rate": 6.29036317987311e-05, "loss": 0.0278, "step": 244900 }, { "epoch": 1.58, "learning_rate": 6.289395044437416e-05, "loss": 0.0246, "step": 244910 }, { "epoch": 1.58, "learning_rate": 6.288426909001723e-05, "loss": 0.034, "step": 244920 }, { "epoch": 1.58, "learning_rate": 6.287458773566029e-05, "loss": 0.029, "step": 244930 }, { "epoch": 1.58, "learning_rate": 6.286490638130336e-05, "loss": 0.0276, "step": 244940 }, { "epoch": 1.58, "learning_rate": 6.285522502694644e-05, "loss": 0.0233, "step": 244950 }, { "epoch": 1.58, "learning_rate": 6.28455436725895e-05, "loss": 0.0215, "step": 244960 }, { "epoch": 1.58, "learning_rate": 6.283586231823256e-05, "loss": 0.024, "step": 244970 }, { "epoch": 1.58, "learning_rate": 6.282618096387564e-05, "loss": 0.0269, "step": 244980 }, { "epoch": 1.58, "learning_rate": 6.28164996095187e-05, "loss": 0.0255, "step": 244990 }, { "epoch": 1.58, "learning_rate": 6.280681825516177e-05, "loss": 0.027, "step": 245000 }, { "epoch": 1.58, "eval_cer": 0.9198960569427184, "eval_loss": 0.01949627697467804, "eval_runtime": 120.0652, "eval_samples_per_second": 16.658, "eval_steps_per_second": 4.164, "step": 245000 }, { "epoch": 1.58, "learning_rate": 6.279713690080484e-05, "loss": 0.0205, "step": 245010 }, { "epoch": 1.58, "learning_rate": 6.278745554644792e-05, "loss": 0.0261, "step": 245020 }, { "epoch": 1.58, "learning_rate": 6.277777419209097e-05, "loss": 0.028, "step": 245030 }, { "epoch": 1.58, "learning_rate": 6.276809283773403e-05, "loss": 0.0325, "step": 245040 }, { "epoch": 1.58, "learning_rate": 6.275841148337711e-05, "loss": 0.0253, "step": 245050 }, { "epoch": 1.58, "learning_rate": 6.274873012902018e-05, "loss": 0.0254, "step": 245060 }, { "epoch": 1.58, "learning_rate": 6.273904877466325e-05, "loss": 0.0289, "step": 245070 }, { "epoch": 1.58, "learning_rate": 6.272936742030631e-05, "loss": 0.0265, "step": 245080 }, { "epoch": 1.58, "learning_rate": 6.271968606594938e-05, "loss": 0.0293, "step": 245090 }, { "epoch": 1.58, "learning_rate": 6.271000471159245e-05, "loss": 0.0266, "step": 245100 }, { "epoch": 1.58, "learning_rate": 6.270032335723551e-05, "loss": 0.025, "step": 245110 }, { "epoch": 1.58, "learning_rate": 6.269064200287859e-05, "loss": 0.0307, "step": 245120 }, { "epoch": 1.58, "learning_rate": 6.268096064852164e-05, "loss": 0.0271, "step": 245130 }, { "epoch": 1.58, "learning_rate": 6.267127929416472e-05, "loss": 0.0267, "step": 245140 }, { "epoch": 1.58, "learning_rate": 6.266159793980779e-05, "loss": 0.0281, "step": 245150 }, { "epoch": 1.58, "learning_rate": 6.265191658545086e-05, "loss": 0.0277, "step": 245160 }, { "epoch": 1.58, "learning_rate": 6.264223523109392e-05, "loss": 0.0236, "step": 245170 }, { "epoch": 1.58, "learning_rate": 6.263255387673699e-05, "loss": 0.0302, "step": 245180 }, { "epoch": 1.58, "learning_rate": 6.262287252238006e-05, "loss": 0.0255, "step": 245190 }, { "epoch": 1.58, "learning_rate": 6.261319116802312e-05, "loss": 0.035, "step": 245200 }, { "epoch": 1.58, "learning_rate": 6.26035098136662e-05, "loss": 0.0223, "step": 245210 }, { "epoch": 1.58, "learning_rate": 6.259382845930927e-05, "loss": 0.0279, "step": 245220 }, { "epoch": 1.58, "learning_rate": 6.258414710495233e-05, "loss": 0.0283, "step": 245230 }, { "epoch": 1.58, "learning_rate": 6.25744657505954e-05, "loss": 0.0236, "step": 245240 }, { "epoch": 1.58, "learning_rate": 6.256478439623847e-05, "loss": 0.0271, "step": 245250 }, { "epoch": 1.58, "learning_rate": 6.255510304188153e-05, "loss": 0.0239, "step": 245260 }, { "epoch": 1.58, "learning_rate": 6.25454216875246e-05, "loss": 0.0248, "step": 245270 }, { "epoch": 1.58, "learning_rate": 6.253574033316768e-05, "loss": 0.0255, "step": 245280 }, { "epoch": 1.58, "learning_rate": 6.252605897881073e-05, "loss": 0.027, "step": 245290 }, { "epoch": 1.58, "learning_rate": 6.251637762445381e-05, "loss": 0.0258, "step": 245300 }, { "epoch": 1.58, "learning_rate": 6.250669627009688e-05, "loss": 0.0267, "step": 245310 }, { "epoch": 1.58, "learning_rate": 6.249701491573994e-05, "loss": 0.0318, "step": 245320 }, { "epoch": 1.58, "learning_rate": 6.248733356138301e-05, "loss": 0.0264, "step": 245330 }, { "epoch": 1.58, "learning_rate": 6.247765220702608e-05, "loss": 0.027, "step": 245340 }, { "epoch": 1.58, "learning_rate": 6.246797085266914e-05, "loss": 0.0248, "step": 245350 }, { "epoch": 1.58, "learning_rate": 6.245828949831221e-05, "loss": 0.0276, "step": 245360 }, { "epoch": 1.58, "learning_rate": 6.244860814395527e-05, "loss": 0.0263, "step": 245370 }, { "epoch": 1.58, "learning_rate": 6.243892678959835e-05, "loss": 0.0266, "step": 245380 }, { "epoch": 1.58, "learning_rate": 6.242924543524141e-05, "loss": 0.0254, "step": 245390 }, { "epoch": 1.58, "learning_rate": 6.241956408088449e-05, "loss": 0.029, "step": 245400 }, { "epoch": 1.58, "learning_rate": 6.240988272652755e-05, "loss": 0.0244, "step": 245410 }, { "epoch": 1.58, "learning_rate": 6.240020137217062e-05, "loss": 0.0368, "step": 245420 }, { "epoch": 1.58, "learning_rate": 6.239052001781369e-05, "loss": 0.0287, "step": 245430 }, { "epoch": 1.58, "learning_rate": 6.238083866345675e-05, "loss": 0.0283, "step": 245440 }, { "epoch": 1.58, "learning_rate": 6.237115730909982e-05, "loss": 0.0286, "step": 245450 }, { "epoch": 1.58, "learning_rate": 6.236147595474288e-05, "loss": 0.0279, "step": 245460 }, { "epoch": 1.58, "learning_rate": 6.235179460038596e-05, "loss": 0.0314, "step": 245470 }, { "epoch": 1.58, "learning_rate": 6.234211324602903e-05, "loss": 0.037, "step": 245480 }, { "epoch": 1.58, "learning_rate": 6.23324318916721e-05, "loss": 0.0223, "step": 245490 }, { "epoch": 1.58, "learning_rate": 6.232275053731516e-05, "loss": 0.0257, "step": 245500 }, { "epoch": 1.58, "learning_rate": 6.231306918295823e-05, "loss": 0.0288, "step": 245510 }, { "epoch": 1.58, "learning_rate": 6.23033878286013e-05, "loss": 0.0254, "step": 245520 }, { "epoch": 1.58, "learning_rate": 6.229370647424436e-05, "loss": 0.0336, "step": 245530 }, { "epoch": 1.58, "learning_rate": 6.228402511988744e-05, "loss": 0.0265, "step": 245540 }, { "epoch": 1.58, "learning_rate": 6.22743437655305e-05, "loss": 0.0264, "step": 245550 }, { "epoch": 1.58, "learning_rate": 6.226466241117357e-05, "loss": 0.0288, "step": 245560 }, { "epoch": 1.58, "learning_rate": 6.225498105681664e-05, "loss": 0.0239, "step": 245570 }, { "epoch": 1.59, "learning_rate": 6.22452997024597e-05, "loss": 0.031, "step": 245580 }, { "epoch": 1.59, "learning_rate": 6.223561834810277e-05, "loss": 0.0231, "step": 245590 }, { "epoch": 1.59, "learning_rate": 6.222593699374584e-05, "loss": 0.0242, "step": 245600 }, { "epoch": 1.59, "learning_rate": 6.22162556393889e-05, "loss": 0.0241, "step": 245610 }, { "epoch": 1.59, "learning_rate": 6.220657428503197e-05, "loss": 0.0261, "step": 245620 }, { "epoch": 1.59, "learning_rate": 6.219689293067505e-05, "loss": 0.0272, "step": 245630 }, { "epoch": 1.59, "learning_rate": 6.218721157631812e-05, "loss": 0.0272, "step": 245640 }, { "epoch": 1.59, "learning_rate": 6.217753022196117e-05, "loss": 0.0309, "step": 245650 }, { "epoch": 1.59, "learning_rate": 6.216784886760425e-05, "loss": 0.0272, "step": 245660 }, { "epoch": 1.59, "learning_rate": 6.215816751324732e-05, "loss": 0.0225, "step": 245670 }, { "epoch": 1.59, "learning_rate": 6.214848615889038e-05, "loss": 0.0272, "step": 245680 }, { "epoch": 1.59, "learning_rate": 6.213880480453345e-05, "loss": 0.0256, "step": 245690 }, { "epoch": 1.59, "learning_rate": 6.212912345017651e-05, "loss": 0.0267, "step": 245700 }, { "epoch": 1.59, "learning_rate": 6.211944209581958e-05, "loss": 0.0309, "step": 245710 }, { "epoch": 1.59, "learning_rate": 6.210976074146265e-05, "loss": 0.0295, "step": 245720 }, { "epoch": 1.59, "learning_rate": 6.210007938710573e-05, "loss": 0.0251, "step": 245730 }, { "epoch": 1.59, "learning_rate": 6.209039803274879e-05, "loss": 0.0231, "step": 245740 }, { "epoch": 1.59, "learning_rate": 6.208071667839186e-05, "loss": 0.0286, "step": 245750 }, { "epoch": 1.59, "learning_rate": 6.207103532403493e-05, "loss": 0.0246, "step": 245760 }, { "epoch": 1.59, "learning_rate": 6.206135396967799e-05, "loss": 0.0273, "step": 245770 }, { "epoch": 1.59, "learning_rate": 6.205167261532106e-05, "loss": 0.026, "step": 245780 }, { "epoch": 1.59, "learning_rate": 6.204199126096412e-05, "loss": 0.032, "step": 245790 }, { "epoch": 1.59, "learning_rate": 6.203230990660719e-05, "loss": 0.0247, "step": 245800 }, { "epoch": 1.59, "learning_rate": 6.202262855225026e-05, "loss": 0.0228, "step": 245810 }, { "epoch": 1.59, "learning_rate": 6.201294719789334e-05, "loss": 0.0236, "step": 245820 }, { "epoch": 1.59, "learning_rate": 6.20032658435364e-05, "loss": 0.0227, "step": 245830 }, { "epoch": 1.59, "learning_rate": 6.199358448917947e-05, "loss": 0.024, "step": 245840 }, { "epoch": 1.59, "learning_rate": 6.198390313482254e-05, "loss": 0.0299, "step": 245850 }, { "epoch": 1.59, "learning_rate": 6.19742217804656e-05, "loss": 0.0266, "step": 245860 }, { "epoch": 1.59, "learning_rate": 6.196454042610867e-05, "loss": 0.0315, "step": 245870 }, { "epoch": 1.59, "learning_rate": 6.195485907175173e-05, "loss": 0.0223, "step": 245880 }, { "epoch": 1.59, "learning_rate": 6.194517771739481e-05, "loss": 0.0257, "step": 245890 }, { "epoch": 1.59, "learning_rate": 6.193549636303787e-05, "loss": 0.0261, "step": 245900 }, { "epoch": 1.59, "learning_rate": 6.192581500868095e-05, "loss": 0.0238, "step": 245910 }, { "epoch": 1.59, "learning_rate": 6.191613365432401e-05, "loss": 0.0309, "step": 245920 }, { "epoch": 1.59, "learning_rate": 6.190645229996708e-05, "loss": 0.0247, "step": 245930 }, { "epoch": 1.59, "learning_rate": 6.189677094561014e-05, "loss": 0.0265, "step": 245940 }, { "epoch": 1.59, "learning_rate": 6.188708959125321e-05, "loss": 0.027, "step": 245950 }, { "epoch": 1.59, "learning_rate": 6.187740823689628e-05, "loss": 0.0258, "step": 245960 }, { "epoch": 1.59, "learning_rate": 6.186772688253934e-05, "loss": 0.0269, "step": 245970 }, { "epoch": 1.59, "learning_rate": 6.185804552818242e-05, "loss": 0.0278, "step": 245980 }, { "epoch": 1.59, "learning_rate": 6.184836417382549e-05, "loss": 0.03, "step": 245990 }, { "epoch": 1.59, "learning_rate": 6.183868281946854e-05, "loss": 0.0257, "step": 246000 }, { "epoch": 1.59, "eval_cer": 0.9198806914472941, "eval_loss": 0.01917816512286663, "eval_runtime": 120.0373, "eval_samples_per_second": 16.661, "eval_steps_per_second": 4.165, "step": 246000 }, { "epoch": 1.59, "learning_rate": 6.182900146511162e-05, "loss": 0.028, "step": 246010 }, { "epoch": 1.59, "learning_rate": 6.181932011075469e-05, "loss": 0.026, "step": 246020 }, { "epoch": 1.59, "learning_rate": 6.180963875639775e-05, "loss": 0.0262, "step": 246030 }, { "epoch": 1.59, "learning_rate": 6.179995740204082e-05, "loss": 0.031, "step": 246040 }, { "epoch": 1.59, "learning_rate": 6.17902760476839e-05, "loss": 0.0259, "step": 246050 }, { "epoch": 1.59, "learning_rate": 6.178059469332695e-05, "loss": 0.0288, "step": 246060 }, { "epoch": 1.59, "learning_rate": 6.177091333897002e-05, "loss": 0.0232, "step": 246070 }, { "epoch": 1.59, "learning_rate": 6.17612319846131e-05, "loss": 0.0236, "step": 246080 }, { "epoch": 1.59, "learning_rate": 6.175155063025617e-05, "loss": 0.0278, "step": 246090 }, { "epoch": 1.59, "learning_rate": 6.174186927589923e-05, "loss": 0.0291, "step": 246100 }, { "epoch": 1.59, "learning_rate": 6.17321879215423e-05, "loss": 0.025, "step": 246110 }, { "epoch": 1.59, "learning_rate": 6.172250656718536e-05, "loss": 0.033, "step": 246120 }, { "epoch": 1.59, "learning_rate": 6.171282521282843e-05, "loss": 0.0368, "step": 246130 }, { "epoch": 1.59, "learning_rate": 6.17031438584715e-05, "loss": 0.0261, "step": 246140 }, { "epoch": 1.59, "learning_rate": 6.169346250411458e-05, "loss": 0.0236, "step": 246150 }, { "epoch": 1.59, "learning_rate": 6.168378114975763e-05, "loss": 0.0221, "step": 246160 }, { "epoch": 1.59, "learning_rate": 6.167409979540071e-05, "loss": 0.0229, "step": 246170 }, { "epoch": 1.59, "learning_rate": 6.166441844104378e-05, "loss": 0.03, "step": 246180 }, { "epoch": 1.59, "learning_rate": 6.165473708668684e-05, "loss": 0.0226, "step": 246190 }, { "epoch": 1.59, "learning_rate": 6.164505573232991e-05, "loss": 0.0262, "step": 246200 }, { "epoch": 1.59, "learning_rate": 6.163537437797297e-05, "loss": 0.0236, "step": 246210 }, { "epoch": 1.59, "learning_rate": 6.162569302361604e-05, "loss": 0.026, "step": 246220 }, { "epoch": 1.59, "learning_rate": 6.16160116692591e-05, "loss": 0.025, "step": 246230 }, { "epoch": 1.59, "learning_rate": 6.160633031490219e-05, "loss": 0.0254, "step": 246240 }, { "epoch": 1.59, "learning_rate": 6.159664896054525e-05, "loss": 0.0251, "step": 246250 }, { "epoch": 1.59, "learning_rate": 6.158696760618832e-05, "loss": 0.0325, "step": 246260 }, { "epoch": 1.59, "learning_rate": 6.157728625183139e-05, "loss": 0.03, "step": 246270 }, { "epoch": 1.59, "learning_rate": 6.156760489747445e-05, "loss": 0.0251, "step": 246280 }, { "epoch": 1.59, "learning_rate": 6.155792354311752e-05, "loss": 0.0333, "step": 246290 }, { "epoch": 1.59, "learning_rate": 6.154824218876058e-05, "loss": 0.0289, "step": 246300 }, { "epoch": 1.59, "learning_rate": 6.153856083440366e-05, "loss": 0.027, "step": 246310 }, { "epoch": 1.59, "learning_rate": 6.152887948004672e-05, "loss": 0.0279, "step": 246320 }, { "epoch": 1.59, "learning_rate": 6.15191981256898e-05, "loss": 0.022, "step": 246330 }, { "epoch": 1.59, "learning_rate": 6.150951677133286e-05, "loss": 0.0271, "step": 246340 }, { "epoch": 1.59, "learning_rate": 6.149983541697593e-05, "loss": 0.0288, "step": 246350 }, { "epoch": 1.59, "learning_rate": 6.1490154062619e-05, "loss": 0.0247, "step": 246360 }, { "epoch": 1.59, "learning_rate": 6.148047270826206e-05, "loss": 0.0292, "step": 246370 }, { "epoch": 1.59, "learning_rate": 6.147079135390513e-05, "loss": 0.0227, "step": 246380 }, { "epoch": 1.59, "learning_rate": 6.14611099995482e-05, "loss": 0.0254, "step": 246390 }, { "epoch": 1.59, "learning_rate": 6.145142864519127e-05, "loss": 0.0233, "step": 246400 }, { "epoch": 1.59, "learning_rate": 6.144174729083434e-05, "loss": 0.0263, "step": 246410 }, { "epoch": 1.59, "learning_rate": 6.143206593647739e-05, "loss": 0.0247, "step": 246420 }, { "epoch": 1.59, "learning_rate": 6.142238458212047e-05, "loss": 0.0233, "step": 246430 }, { "epoch": 1.59, "learning_rate": 6.141270322776354e-05, "loss": 0.0254, "step": 246440 }, { "epoch": 1.59, "learning_rate": 6.14030218734066e-05, "loss": 0.0251, "step": 246450 }, { "epoch": 1.59, "learning_rate": 6.139334051904967e-05, "loss": 0.0277, "step": 246460 }, { "epoch": 1.59, "learning_rate": 6.138365916469275e-05, "loss": 0.0256, "step": 246470 }, { "epoch": 1.59, "learning_rate": 6.13739778103358e-05, "loss": 0.0243, "step": 246480 }, { "epoch": 1.59, "learning_rate": 6.136429645597887e-05, "loss": 0.0335, "step": 246490 }, { "epoch": 1.59, "learning_rate": 6.135461510162195e-05, "loss": 0.0247, "step": 246500 }, { "epoch": 1.59, "learning_rate": 6.134493374726502e-05, "loss": 0.0237, "step": 246510 }, { "epoch": 1.59, "learning_rate": 6.133525239290808e-05, "loss": 0.0255, "step": 246520 }, { "epoch": 1.59, "learning_rate": 6.132557103855115e-05, "loss": 0.0252, "step": 246530 }, { "epoch": 1.59, "learning_rate": 6.131588968419421e-05, "loss": 0.0292, "step": 246540 }, { "epoch": 1.59, "learning_rate": 6.130620832983728e-05, "loss": 0.0236, "step": 246550 }, { "epoch": 1.59, "learning_rate": 6.129652697548035e-05, "loss": 0.0243, "step": 246560 }, { "epoch": 1.59, "learning_rate": 6.128684562112343e-05, "loss": 0.0274, "step": 246570 }, { "epoch": 1.59, "learning_rate": 6.127716426676648e-05, "loss": 0.0275, "step": 246580 }, { "epoch": 1.59, "learning_rate": 6.126748291240956e-05, "loss": 0.0246, "step": 246590 }, { "epoch": 1.59, "learning_rate": 6.125780155805263e-05, "loss": 0.0222, "step": 246600 }, { "epoch": 1.59, "learning_rate": 6.124812020369569e-05, "loss": 0.027, "step": 246610 }, { "epoch": 1.59, "learning_rate": 6.123843884933876e-05, "loss": 0.0235, "step": 246620 }, { "epoch": 1.59, "learning_rate": 6.122875749498182e-05, "loss": 0.0283, "step": 246630 }, { "epoch": 1.59, "learning_rate": 6.121907614062489e-05, "loss": 0.0227, "step": 246640 }, { "epoch": 1.59, "learning_rate": 6.120939478626796e-05, "loss": 0.0252, "step": 246650 }, { "epoch": 1.59, "learning_rate": 6.119971343191104e-05, "loss": 0.0241, "step": 246660 }, { "epoch": 1.59, "learning_rate": 6.11900320775541e-05, "loss": 0.0235, "step": 246670 }, { "epoch": 1.59, "learning_rate": 6.118035072319717e-05, "loss": 0.0311, "step": 246680 }, { "epoch": 1.59, "learning_rate": 6.117066936884023e-05, "loss": 0.0279, "step": 246690 }, { "epoch": 1.59, "learning_rate": 6.11609880144833e-05, "loss": 0.0282, "step": 246700 }, { "epoch": 1.59, "learning_rate": 6.115130666012637e-05, "loss": 0.0252, "step": 246710 }, { "epoch": 1.59, "learning_rate": 6.114162530576943e-05, "loss": 0.0223, "step": 246720 }, { "epoch": 1.59, "learning_rate": 6.113194395141251e-05, "loss": 0.0277, "step": 246730 }, { "epoch": 1.59, "learning_rate": 6.112226259705557e-05, "loss": 0.0285, "step": 246740 }, { "epoch": 1.59, "learning_rate": 6.111258124269865e-05, "loss": 0.0362, "step": 246750 }, { "epoch": 1.59, "learning_rate": 6.110289988834171e-05, "loss": 0.0231, "step": 246760 }, { "epoch": 1.59, "learning_rate": 6.109321853398478e-05, "loss": 0.0265, "step": 246770 }, { "epoch": 1.59, "learning_rate": 6.108353717962784e-05, "loss": 0.0333, "step": 246780 }, { "epoch": 1.59, "learning_rate": 6.107385582527091e-05, "loss": 0.0233, "step": 246790 }, { "epoch": 1.59, "learning_rate": 6.106417447091398e-05, "loss": 0.0267, "step": 246800 }, { "epoch": 1.59, "learning_rate": 6.105449311655704e-05, "loss": 0.0253, "step": 246810 }, { "epoch": 1.59, "learning_rate": 6.104481176220012e-05, "loss": 0.023, "step": 246820 }, { "epoch": 1.59, "learning_rate": 6.103513040784318e-05, "loss": 0.0266, "step": 246830 }, { "epoch": 1.59, "learning_rate": 6.102544905348625e-05, "loss": 0.0259, "step": 246840 }, { "epoch": 1.59, "learning_rate": 6.101576769912932e-05, "loss": 0.0254, "step": 246850 }, { "epoch": 1.59, "learning_rate": 6.100608634477238e-05, "loss": 0.0259, "step": 246860 }, { "epoch": 1.59, "learning_rate": 6.0996404990415454e-05, "loss": 0.0286, "step": 246870 }, { "epoch": 1.59, "learning_rate": 6.098672363605852e-05, "loss": 0.0258, "step": 246880 }, { "epoch": 1.59, "learning_rate": 6.0977042281701593e-05, "loss": 0.025, "step": 246890 }, { "epoch": 1.59, "learning_rate": 6.096736092734466e-05, "loss": 0.0263, "step": 246900 }, { "epoch": 1.59, "learning_rate": 6.095767957298772e-05, "loss": 0.0335, "step": 246910 }, { "epoch": 1.59, "learning_rate": 6.094799821863079e-05, "loss": 0.0223, "step": 246920 }, { "epoch": 1.59, "learning_rate": 6.093831686427386e-05, "loss": 0.0256, "step": 246930 }, { "epoch": 1.59, "learning_rate": 6.092863550991693e-05, "loss": 0.0249, "step": 246940 }, { "epoch": 1.59, "learning_rate": 6.091895415556e-05, "loss": 0.0256, "step": 246950 }, { "epoch": 1.59, "learning_rate": 6.090927280120307e-05, "loss": 0.0295, "step": 246960 }, { "epoch": 1.59, "learning_rate": 6.089959144684613e-05, "loss": 0.0235, "step": 246970 }, { "epoch": 1.59, "learning_rate": 6.0889910092489196e-05, "loss": 0.0232, "step": 246980 }, { "epoch": 1.59, "learning_rate": 6.088022873813227e-05, "loss": 0.0253, "step": 246990 }, { "epoch": 1.59, "learning_rate": 6.0870547383775336e-05, "loss": 0.0276, "step": 247000 }, { "epoch": 1.59, "eval_cer": 0.9198824991526381, "eval_loss": 0.019043434411287308, "eval_runtime": 120.2331, "eval_samples_per_second": 16.634, "eval_steps_per_second": 4.159, "step": 247000 }, { "epoch": 1.59, "learning_rate": 6.086086602941841e-05, "loss": 0.0211, "step": 247010 }, { "epoch": 1.59, "learning_rate": 6.085118467506147e-05, "loss": 0.0253, "step": 247020 }, { "epoch": 1.59, "learning_rate": 6.084150332070454e-05, "loss": 0.0319, "step": 247030 }, { "epoch": 1.59, "learning_rate": 6.083182196634761e-05, "loss": 0.024, "step": 247040 }, { "epoch": 1.59, "learning_rate": 6.0822140611990674e-05, "loss": 0.0267, "step": 247050 }, { "epoch": 1.59, "learning_rate": 6.081245925763375e-05, "loss": 0.0268, "step": 247060 }, { "epoch": 1.59, "learning_rate": 6.0802777903276806e-05, "loss": 0.0318, "step": 247070 }, { "epoch": 1.59, "learning_rate": 6.079309654891988e-05, "loss": 0.027, "step": 247080 }, { "epoch": 1.59, "learning_rate": 6.0783415194562945e-05, "loss": 0.0288, "step": 247090 }, { "epoch": 1.59, "learning_rate": 6.077373384020601e-05, "loss": 0.0268, "step": 247100 }, { "epoch": 1.59, "learning_rate": 6.0764052485849085e-05, "loss": 0.0284, "step": 247110 }, { "epoch": 1.59, "learning_rate": 6.0754371131492144e-05, "loss": 0.0286, "step": 247120 }, { "epoch": 1.6, "learning_rate": 6.074468977713522e-05, "loss": 0.0266, "step": 247130 }, { "epoch": 1.6, "learning_rate": 6.073500842277828e-05, "loss": 0.0257, "step": 247140 }, { "epoch": 1.6, "learning_rate": 6.0725327068421356e-05, "loss": 0.021, "step": 247150 }, { "epoch": 1.6, "learning_rate": 6.071564571406442e-05, "loss": 0.026, "step": 247160 }, { "epoch": 1.6, "learning_rate": 6.070596435970748e-05, "loss": 0.0279, "step": 247170 }, { "epoch": 1.6, "learning_rate": 6.0696283005350555e-05, "loss": 0.0213, "step": 247180 }, { "epoch": 1.6, "learning_rate": 6.068660165099362e-05, "loss": 0.0241, "step": 247190 }, { "epoch": 1.6, "learning_rate": 6.0676920296636694e-05, "loss": 0.0249, "step": 247200 }, { "epoch": 1.6, "learning_rate": 6.066723894227976e-05, "loss": 0.0287, "step": 247210 }, { "epoch": 1.6, "learning_rate": 6.0657557587922834e-05, "loss": 0.0276, "step": 247220 }, { "epoch": 1.6, "learning_rate": 6.064787623356589e-05, "loss": 0.0266, "step": 247230 }, { "epoch": 1.6, "learning_rate": 6.063819487920896e-05, "loss": 0.0226, "step": 247240 }, { "epoch": 1.6, "learning_rate": 6.062851352485203e-05, "loss": 0.0257, "step": 247250 }, { "epoch": 1.6, "learning_rate": 6.06188321704951e-05, "loss": 0.0284, "step": 247260 }, { "epoch": 1.6, "learning_rate": 6.060915081613817e-05, "loss": 0.0255, "step": 247270 }, { "epoch": 1.6, "learning_rate": 6.059946946178123e-05, "loss": 0.0211, "step": 247280 }, { "epoch": 1.6, "learning_rate": 6.0589788107424304e-05, "loss": 0.0206, "step": 247290 }, { "epoch": 1.6, "learning_rate": 6.058010675306737e-05, "loss": 0.0205, "step": 247300 }, { "epoch": 1.6, "learning_rate": 6.0570425398710437e-05, "loss": 0.0261, "step": 247310 }, { "epoch": 1.6, "learning_rate": 6.056074404435351e-05, "loss": 0.0262, "step": 247320 }, { "epoch": 1.6, "learning_rate": 6.055106268999657e-05, "loss": 0.0206, "step": 247330 }, { "epoch": 1.6, "learning_rate": 6.054138133563964e-05, "loss": 0.0284, "step": 247340 }, { "epoch": 1.6, "learning_rate": 6.053169998128271e-05, "loss": 0.0247, "step": 247350 }, { "epoch": 1.6, "learning_rate": 6.052201862692578e-05, "loss": 0.0228, "step": 247360 }, { "epoch": 1.6, "learning_rate": 6.051233727256885e-05, "loss": 0.0241, "step": 247370 }, { "epoch": 1.6, "learning_rate": 6.050265591821191e-05, "loss": 0.0237, "step": 247380 }, { "epoch": 1.6, "learning_rate": 6.049297456385498e-05, "loss": 0.0255, "step": 247390 }, { "epoch": 1.6, "learning_rate": 6.0483293209498046e-05, "loss": 0.0312, "step": 247400 }, { "epoch": 1.6, "learning_rate": 6.047361185514112e-05, "loss": 0.0218, "step": 247410 }, { "epoch": 1.6, "learning_rate": 6.0463930500784185e-05, "loss": 0.0271, "step": 247420 }, { "epoch": 1.6, "learning_rate": 6.045424914642726e-05, "loss": 0.0246, "step": 247430 }, { "epoch": 1.6, "learning_rate": 6.044456779207032e-05, "loss": 0.0268, "step": 247440 }, { "epoch": 1.6, "learning_rate": 6.0434886437713384e-05, "loss": 0.0236, "step": 247450 }, { "epoch": 1.6, "learning_rate": 6.042520508335646e-05, "loss": 0.0225, "step": 247460 }, { "epoch": 1.6, "learning_rate": 6.0415523728999523e-05, "loss": 0.0277, "step": 247470 }, { "epoch": 1.6, "learning_rate": 6.0405842374642596e-05, "loss": 0.029, "step": 247480 }, { "epoch": 1.6, "learning_rate": 6.0396161020285656e-05, "loss": 0.0263, "step": 247490 }, { "epoch": 1.6, "learning_rate": 6.038647966592873e-05, "loss": 0.0267, "step": 247500 }, { "epoch": 1.6, "learning_rate": 6.0376798311571795e-05, "loss": 0.0297, "step": 247510 }, { "epoch": 1.6, "learning_rate": 6.036711695721486e-05, "loss": 0.0229, "step": 247520 }, { "epoch": 1.6, "learning_rate": 6.0357435602857934e-05, "loss": 0.024, "step": 247530 }, { "epoch": 1.6, "learning_rate": 6.0347754248500994e-05, "loss": 0.0355, "step": 247540 }, { "epoch": 1.6, "learning_rate": 6.033807289414407e-05, "loss": 0.0239, "step": 247550 }, { "epoch": 1.6, "learning_rate": 6.032839153978713e-05, "loss": 0.0246, "step": 247560 }, { "epoch": 1.6, "learning_rate": 6.0318710185430206e-05, "loss": 0.0211, "step": 247570 }, { "epoch": 1.6, "learning_rate": 6.030902883107327e-05, "loss": 0.0333, "step": 247580 }, { "epoch": 1.6, "learning_rate": 6.029934747671633e-05, "loss": 0.0223, "step": 247590 }, { "epoch": 1.6, "learning_rate": 6.0289666122359405e-05, "loss": 0.0241, "step": 247600 }, { "epoch": 1.6, "learning_rate": 6.027998476800247e-05, "loss": 0.0269, "step": 247610 }, { "epoch": 1.6, "learning_rate": 6.0270303413645544e-05, "loss": 0.0242, "step": 247620 }, { "epoch": 1.6, "learning_rate": 6.026062205928861e-05, "loss": 0.0236, "step": 247630 }, { "epoch": 1.6, "learning_rate": 6.0250940704931683e-05, "loss": 0.0293, "step": 247640 }, { "epoch": 1.6, "learning_rate": 6.024125935057474e-05, "loss": 0.0311, "step": 247650 }, { "epoch": 1.6, "learning_rate": 6.023157799621781e-05, "loss": 0.0287, "step": 247660 }, { "epoch": 1.6, "learning_rate": 6.022189664186088e-05, "loss": 0.0267, "step": 247670 }, { "epoch": 1.6, "learning_rate": 6.021221528750395e-05, "loss": 0.0288, "step": 247680 }, { "epoch": 1.6, "learning_rate": 6.020253393314702e-05, "loss": 0.0295, "step": 247690 }, { "epoch": 1.6, "learning_rate": 6.019285257879008e-05, "loss": 0.0223, "step": 247700 }, { "epoch": 1.6, "learning_rate": 6.0183171224433154e-05, "loss": 0.0254, "step": 247710 }, { "epoch": 1.6, "learning_rate": 6.017348987007622e-05, "loss": 0.0195, "step": 247720 }, { "epoch": 1.6, "learning_rate": 6.0163808515719286e-05, "loss": 0.0274, "step": 247730 }, { "epoch": 1.6, "learning_rate": 6.015412716136236e-05, "loss": 0.0237, "step": 247740 }, { "epoch": 1.6, "learning_rate": 6.014444580700542e-05, "loss": 0.0234, "step": 247750 }, { "epoch": 1.6, "learning_rate": 6.013476445264849e-05, "loss": 0.0304, "step": 247760 }, { "epoch": 1.6, "learning_rate": 6.012508309829156e-05, "loss": 0.0275, "step": 247770 }, { "epoch": 1.6, "learning_rate": 6.011540174393463e-05, "loss": 0.03, "step": 247780 }, { "epoch": 1.6, "learning_rate": 6.01057203895777e-05, "loss": 0.0253, "step": 247790 }, { "epoch": 1.6, "learning_rate": 6.009603903522076e-05, "loss": 0.0201, "step": 247800 }, { "epoch": 1.6, "learning_rate": 6.008635768086383e-05, "loss": 0.0211, "step": 247810 }, { "epoch": 1.6, "learning_rate": 6.0076676326506896e-05, "loss": 0.027, "step": 247820 }, { "epoch": 1.6, "learning_rate": 6.006699497214997e-05, "loss": 0.0298, "step": 247830 }, { "epoch": 1.6, "learning_rate": 6.0057313617793035e-05, "loss": 0.021, "step": 247840 }, { "epoch": 1.6, "learning_rate": 6.00476322634361e-05, "loss": 0.0241, "step": 247850 }, { "epoch": 1.6, "learning_rate": 6.003795090907917e-05, "loss": 0.0259, "step": 247860 }, { "epoch": 1.6, "learning_rate": 6.0028269554722234e-05, "loss": 0.0289, "step": 247870 }, { "epoch": 1.6, "learning_rate": 6.001858820036531e-05, "loss": 0.027, "step": 247880 }, { "epoch": 1.6, "learning_rate": 6.000890684600837e-05, "loss": 0.0231, "step": 247890 }, { "epoch": 1.6, "learning_rate": 5.999922549165144e-05, "loss": 0.0254, "step": 247900 }, { "epoch": 1.6, "learning_rate": 5.9989544137294506e-05, "loss": 0.02, "step": 247910 }, { "epoch": 1.6, "learning_rate": 5.997986278293758e-05, "loss": 0.0229, "step": 247920 }, { "epoch": 1.6, "learning_rate": 5.9970181428580645e-05, "loss": 0.0235, "step": 247930 }, { "epoch": 1.6, "learning_rate": 5.996050007422371e-05, "loss": 0.0264, "step": 247940 }, { "epoch": 1.6, "learning_rate": 5.995081871986678e-05, "loss": 0.0303, "step": 247950 }, { "epoch": 1.6, "learning_rate": 5.9941137365509844e-05, "loss": 0.0278, "step": 247960 }, { "epoch": 1.6, "learning_rate": 5.993145601115292e-05, "loss": 0.0273, "step": 247970 }, { "epoch": 1.6, "learning_rate": 5.992177465679598e-05, "loss": 0.0245, "step": 247980 }, { "epoch": 1.6, "learning_rate": 5.9912093302439056e-05, "loss": 0.0282, "step": 247990 }, { "epoch": 1.6, "learning_rate": 5.9902411948082115e-05, "loss": 0.0238, "step": 248000 }, { "epoch": 1.6, "eval_cer": 0.9198852107106542, "eval_loss": 0.01876279152929783, "eval_runtime": 120.3747, "eval_samples_per_second": 16.615, "eval_steps_per_second": 4.154, "step": 248000 }, { "epoch": 1.6, "learning_rate": 5.989273059372518e-05, "loss": 0.025, "step": 248010 }, { "epoch": 1.6, "learning_rate": 5.9883049239368255e-05, "loss": 0.0193, "step": 248020 }, { "epoch": 1.6, "learning_rate": 5.987336788501132e-05, "loss": 0.0249, "step": 248030 }, { "epoch": 1.6, "learning_rate": 5.9863686530654394e-05, "loss": 0.0252, "step": 248040 }, { "epoch": 1.6, "learning_rate": 5.9854005176297453e-05, "loss": 0.0226, "step": 248050 }, { "epoch": 1.6, "learning_rate": 5.9844323821940526e-05, "loss": 0.0258, "step": 248060 }, { "epoch": 1.6, "learning_rate": 5.983464246758359e-05, "loss": 0.0232, "step": 248070 }, { "epoch": 1.6, "learning_rate": 5.982496111322666e-05, "loss": 0.0221, "step": 248080 }, { "epoch": 1.6, "learning_rate": 5.981527975886973e-05, "loss": 0.0266, "step": 248090 }, { "epoch": 1.6, "learning_rate": 5.980559840451279e-05, "loss": 0.0225, "step": 248100 }, { "epoch": 1.6, "learning_rate": 5.9795917050155864e-05, "loss": 0.0248, "step": 248110 }, { "epoch": 1.6, "learning_rate": 5.978623569579893e-05, "loss": 0.0314, "step": 248120 }, { "epoch": 1.6, "learning_rate": 5.9776554341442004e-05, "loss": 0.0252, "step": 248130 }, { "epoch": 1.6, "learning_rate": 5.976687298708507e-05, "loss": 0.0247, "step": 248140 }, { "epoch": 1.6, "learning_rate": 5.975719163272813e-05, "loss": 0.0242, "step": 248150 }, { "epoch": 1.6, "learning_rate": 5.97475102783712e-05, "loss": 0.0312, "step": 248160 }, { "epoch": 1.6, "learning_rate": 5.973782892401427e-05, "loss": 0.0231, "step": 248170 }, { "epoch": 1.6, "learning_rate": 5.972814756965734e-05, "loss": 0.0281, "step": 248180 }, { "epoch": 1.6, "learning_rate": 5.971846621530041e-05, "loss": 0.0241, "step": 248190 }, { "epoch": 1.6, "learning_rate": 5.970878486094348e-05, "loss": 0.0248, "step": 248200 }, { "epoch": 1.6, "learning_rate": 5.969910350658654e-05, "loss": 0.0245, "step": 248210 }, { "epoch": 1.6, "learning_rate": 5.9689422152229607e-05, "loss": 0.0294, "step": 248220 }, { "epoch": 1.6, "learning_rate": 5.967974079787268e-05, "loss": 0.0213, "step": 248230 }, { "epoch": 1.6, "learning_rate": 5.9670059443515746e-05, "loss": 0.0219, "step": 248240 }, { "epoch": 1.6, "learning_rate": 5.966037808915882e-05, "loss": 0.025, "step": 248250 }, { "epoch": 1.6, "learning_rate": 5.965069673480188e-05, "loss": 0.0228, "step": 248260 }, { "epoch": 1.6, "learning_rate": 5.964101538044495e-05, "loss": 0.0263, "step": 248270 }, { "epoch": 1.6, "learning_rate": 5.963133402608802e-05, "loss": 0.0219, "step": 248280 }, { "epoch": 1.6, "learning_rate": 5.9621652671731084e-05, "loss": 0.0305, "step": 248290 }, { "epoch": 1.6, "learning_rate": 5.961197131737416e-05, "loss": 0.0216, "step": 248300 }, { "epoch": 1.6, "learning_rate": 5.9602289963017216e-05, "loss": 0.0239, "step": 248310 }, { "epoch": 1.6, "learning_rate": 5.959260860866029e-05, "loss": 0.0278, "step": 248320 }, { "epoch": 1.6, "learning_rate": 5.9582927254303356e-05, "loss": 0.0279, "step": 248330 }, { "epoch": 1.6, "learning_rate": 5.957324589994643e-05, "loss": 0.0242, "step": 248340 }, { "epoch": 1.6, "learning_rate": 5.9563564545589495e-05, "loss": 0.0281, "step": 248350 }, { "epoch": 1.6, "learning_rate": 5.9553883191232554e-05, "loss": 0.0272, "step": 248360 }, { "epoch": 1.6, "learning_rate": 5.954420183687563e-05, "loss": 0.0258, "step": 248370 }, { "epoch": 1.6, "learning_rate": 5.9534520482518694e-05, "loss": 0.0246, "step": 248380 }, { "epoch": 1.6, "learning_rate": 5.9524839128161767e-05, "loss": 0.0264, "step": 248390 }, { "epoch": 1.6, "learning_rate": 5.951515777380483e-05, "loss": 0.0274, "step": 248400 }, { "epoch": 1.6, "learning_rate": 5.9505476419447906e-05, "loss": 0.0243, "step": 248410 }, { "epoch": 1.6, "learning_rate": 5.9495795065090965e-05, "loss": 0.026, "step": 248420 }, { "epoch": 1.6, "learning_rate": 5.948611371073403e-05, "loss": 0.0249, "step": 248430 }, { "epoch": 1.6, "learning_rate": 5.9476432356377105e-05, "loss": 0.0233, "step": 248440 }, { "epoch": 1.6, "learning_rate": 5.946675100202017e-05, "loss": 0.028, "step": 248450 }, { "epoch": 1.6, "learning_rate": 5.9457069647663244e-05, "loss": 0.0267, "step": 248460 }, { "epoch": 1.6, "learning_rate": 5.94473882933063e-05, "loss": 0.0287, "step": 248470 }, { "epoch": 1.6, "learning_rate": 5.9437706938949376e-05, "loss": 0.0252, "step": 248480 }, { "epoch": 1.6, "learning_rate": 5.942802558459244e-05, "loss": 0.0251, "step": 248490 }, { "epoch": 1.6, "learning_rate": 5.941834423023551e-05, "loss": 0.0239, "step": 248500 }, { "epoch": 1.6, "learning_rate": 5.940866287587858e-05, "loss": 0.0255, "step": 248510 }, { "epoch": 1.6, "learning_rate": 5.939898152152164e-05, "loss": 0.0244, "step": 248520 }, { "epoch": 1.6, "learning_rate": 5.9389300167164714e-05, "loss": 0.0271, "step": 248530 }, { "epoch": 1.6, "learning_rate": 5.937961881280778e-05, "loss": 0.0273, "step": 248540 }, { "epoch": 1.6, "learning_rate": 5.9369937458450853e-05, "loss": 0.0251, "step": 248550 }, { "epoch": 1.6, "learning_rate": 5.936025610409392e-05, "loss": 0.0241, "step": 248560 }, { "epoch": 1.6, "learning_rate": 5.935057474973698e-05, "loss": 0.031, "step": 248570 }, { "epoch": 1.6, "learning_rate": 5.934089339538005e-05, "loss": 0.0264, "step": 248580 }, { "epoch": 1.6, "learning_rate": 5.933121204102312e-05, "loss": 0.0258, "step": 248590 }, { "epoch": 1.6, "learning_rate": 5.932153068666619e-05, "loss": 0.0256, "step": 248600 }, { "epoch": 1.6, "learning_rate": 5.931184933230926e-05, "loss": 0.0262, "step": 248610 }, { "epoch": 1.6, "learning_rate": 5.930216797795233e-05, "loss": 0.0271, "step": 248620 }, { "epoch": 1.6, "learning_rate": 5.929248662359539e-05, "loss": 0.0202, "step": 248630 }, { "epoch": 1.6, "learning_rate": 5.9282805269238456e-05, "loss": 0.0306, "step": 248640 }, { "epoch": 1.6, "learning_rate": 5.927312391488153e-05, "loss": 0.0243, "step": 248650 }, { "epoch": 1.6, "learning_rate": 5.9263442560524596e-05, "loss": 0.0253, "step": 248660 }, { "epoch": 1.6, "learning_rate": 5.925376120616767e-05, "loss": 0.0218, "step": 248670 }, { "epoch": 1.61, "learning_rate": 5.924407985181073e-05, "loss": 0.0228, "step": 248680 }, { "epoch": 1.61, "learning_rate": 5.92343984974538e-05, "loss": 0.0296, "step": 248690 }, { "epoch": 1.61, "learning_rate": 5.922471714309687e-05, "loss": 0.0279, "step": 248700 }, { "epoch": 1.61, "learning_rate": 5.9215035788739934e-05, "loss": 0.0293, "step": 248710 }, { "epoch": 1.61, "learning_rate": 5.920535443438301e-05, "loss": 0.0292, "step": 248720 }, { "epoch": 1.61, "learning_rate": 5.9195673080026066e-05, "loss": 0.0289, "step": 248730 }, { "epoch": 1.61, "learning_rate": 5.918599172566914e-05, "loss": 0.0253, "step": 248740 }, { "epoch": 1.61, "learning_rate": 5.9176310371312205e-05, "loss": 0.0285, "step": 248750 }, { "epoch": 1.61, "learning_rate": 5.916662901695527e-05, "loss": 0.0244, "step": 248760 }, { "epoch": 1.61, "learning_rate": 5.9156947662598345e-05, "loss": 0.025, "step": 248770 }, { "epoch": 1.61, "learning_rate": 5.9147266308241404e-05, "loss": 0.0247, "step": 248780 }, { "epoch": 1.61, "learning_rate": 5.913758495388448e-05, "loss": 0.0284, "step": 248790 }, { "epoch": 1.61, "learning_rate": 5.912790359952754e-05, "loss": 0.0244, "step": 248800 }, { "epoch": 1.61, "learning_rate": 5.9118222245170616e-05, "loss": 0.0254, "step": 248810 }, { "epoch": 1.61, "learning_rate": 5.910854089081368e-05, "loss": 0.0315, "step": 248820 }, { "epoch": 1.61, "learning_rate": 5.909885953645674e-05, "loss": 0.0247, "step": 248830 }, { "epoch": 1.61, "learning_rate": 5.9089178182099815e-05, "loss": 0.0264, "step": 248840 }, { "epoch": 1.61, "learning_rate": 5.907949682774288e-05, "loss": 0.0252, "step": 248850 }, { "epoch": 1.61, "learning_rate": 5.9069815473385954e-05, "loss": 0.027, "step": 248860 }, { "epoch": 1.61, "learning_rate": 5.906013411902902e-05, "loss": 0.0276, "step": 248870 }, { "epoch": 1.61, "learning_rate": 5.9050452764672094e-05, "loss": 0.0283, "step": 248880 }, { "epoch": 1.61, "learning_rate": 5.904077141031515e-05, "loss": 0.0235, "step": 248890 }, { "epoch": 1.61, "learning_rate": 5.903109005595822e-05, "loss": 0.0307, "step": 248900 }, { "epoch": 1.61, "learning_rate": 5.902140870160129e-05, "loss": 0.0244, "step": 248910 }, { "epoch": 1.61, "learning_rate": 5.901172734724436e-05, "loss": 0.0272, "step": 248920 }, { "epoch": 1.61, "learning_rate": 5.900204599288743e-05, "loss": 0.0285, "step": 248930 }, { "epoch": 1.61, "learning_rate": 5.899236463853049e-05, "loss": 0.0246, "step": 248940 }, { "epoch": 1.61, "learning_rate": 5.8982683284173564e-05, "loss": 0.0266, "step": 248950 }, { "epoch": 1.61, "learning_rate": 5.897300192981663e-05, "loss": 0.0287, "step": 248960 }, { "epoch": 1.61, "learning_rate": 5.8963320575459696e-05, "loss": 0.032, "step": 248970 }, { "epoch": 1.61, "learning_rate": 5.895363922110277e-05, "loss": 0.0229, "step": 248980 }, { "epoch": 1.61, "learning_rate": 5.894395786674583e-05, "loss": 0.0233, "step": 248990 }, { "epoch": 1.61, "learning_rate": 5.89342765123889e-05, "loss": 0.0301, "step": 249000 }, { "epoch": 1.61, "eval_cer": 0.9198562874251497, "eval_loss": 0.018836012110114098, "eval_runtime": 120.0, "eval_samples_per_second": 16.667, "eval_steps_per_second": 4.167, "step": 249000 }, { "epoch": 1.61, "learning_rate": 5.892459515803197e-05, "loss": 0.0268, "step": 249010 }, { "epoch": 1.61, "learning_rate": 5.891491380367504e-05, "loss": 0.0318, "step": 249020 }, { "epoch": 1.61, "learning_rate": 5.890523244931811e-05, "loss": 0.024, "step": 249030 }, { "epoch": 1.61, "learning_rate": 5.889555109496117e-05, "loss": 0.0307, "step": 249040 }, { "epoch": 1.61, "learning_rate": 5.888586974060424e-05, "loss": 0.0245, "step": 249050 }, { "epoch": 1.61, "learning_rate": 5.8876188386247306e-05, "loss": 0.0296, "step": 249060 }, { "epoch": 1.61, "learning_rate": 5.886650703189038e-05, "loss": 0.0253, "step": 249070 }, { "epoch": 1.61, "learning_rate": 5.8856825677533445e-05, "loss": 0.03, "step": 249080 }, { "epoch": 1.61, "learning_rate": 5.884714432317651e-05, "loss": 0.0341, "step": 249090 }, { "epoch": 1.61, "learning_rate": 5.883746296881958e-05, "loss": 0.0277, "step": 249100 }, { "epoch": 1.61, "learning_rate": 5.8827781614462644e-05, "loss": 0.0286, "step": 249110 }, { "epoch": 1.61, "learning_rate": 5.881810026010572e-05, "loss": 0.0244, "step": 249120 }, { "epoch": 1.61, "learning_rate": 5.8808418905748783e-05, "loss": 0.0233, "step": 249130 }, { "epoch": 1.61, "learning_rate": 5.879873755139185e-05, "loss": 0.0271, "step": 249140 }, { "epoch": 1.61, "learning_rate": 5.8789056197034916e-05, "loss": 0.0218, "step": 249150 }, { "epoch": 1.61, "learning_rate": 5.877937484267799e-05, "loss": 0.0267, "step": 249160 }, { "epoch": 1.61, "learning_rate": 5.8769693488321055e-05, "loss": 0.0234, "step": 249170 }, { "epoch": 1.61, "learning_rate": 5.876001213396412e-05, "loss": 0.0207, "step": 249180 }, { "epoch": 1.61, "learning_rate": 5.875033077960719e-05, "loss": 0.0216, "step": 249190 }, { "epoch": 1.61, "learning_rate": 5.8740649425250254e-05, "loss": 0.0263, "step": 249200 }, { "epoch": 1.61, "learning_rate": 5.873096807089333e-05, "loss": 0.0251, "step": 249210 }, { "epoch": 1.61, "learning_rate": 5.872128671653639e-05, "loss": 0.0301, "step": 249220 }, { "epoch": 1.61, "learning_rate": 5.8711605362179466e-05, "loss": 0.0243, "step": 249230 }, { "epoch": 1.61, "learning_rate": 5.8701924007822526e-05, "loss": 0.0262, "step": 249240 }, { "epoch": 1.61, "learning_rate": 5.869224265346559e-05, "loss": 0.0205, "step": 249250 }, { "epoch": 1.61, "learning_rate": 5.8682561299108665e-05, "loss": 0.0252, "step": 249260 }, { "epoch": 1.61, "learning_rate": 5.867287994475173e-05, "loss": 0.0258, "step": 249270 }, { "epoch": 1.61, "learning_rate": 5.8663198590394804e-05, "loss": 0.0241, "step": 249280 }, { "epoch": 1.61, "learning_rate": 5.8653517236037864e-05, "loss": 0.0271, "step": 249290 }, { "epoch": 1.61, "learning_rate": 5.8643835881680937e-05, "loss": 0.0286, "step": 249300 }, { "epoch": 1.61, "learning_rate": 5.8634154527324e-05, "loss": 0.0257, "step": 249310 }, { "epoch": 1.61, "learning_rate": 5.862447317296707e-05, "loss": 0.0264, "step": 249320 }, { "epoch": 1.61, "learning_rate": 5.861479181861014e-05, "loss": 0.0234, "step": 249330 }, { "epoch": 1.61, "learning_rate": 5.86051104642532e-05, "loss": 0.0227, "step": 249340 }, { "epoch": 1.61, "learning_rate": 5.8595429109896275e-05, "loss": 0.0315, "step": 249350 }, { "epoch": 1.61, "learning_rate": 5.858574775553934e-05, "loss": 0.0252, "step": 249360 }, { "epoch": 1.61, "learning_rate": 5.8576066401182414e-05, "loss": 0.0272, "step": 249370 }, { "epoch": 1.61, "learning_rate": 5.856638504682548e-05, "loss": 0.0275, "step": 249380 }, { "epoch": 1.61, "learning_rate": 5.855670369246854e-05, "loss": 0.0191, "step": 249390 }, { "epoch": 1.61, "learning_rate": 5.854702233811161e-05, "loss": 0.0282, "step": 249400 }, { "epoch": 1.61, "learning_rate": 5.853734098375468e-05, "loss": 0.0241, "step": 249410 }, { "epoch": 1.61, "learning_rate": 5.852765962939775e-05, "loss": 0.0265, "step": 249420 }, { "epoch": 1.61, "learning_rate": 5.851797827504082e-05, "loss": 0.0268, "step": 249430 }, { "epoch": 1.61, "learning_rate": 5.850829692068389e-05, "loss": 0.022, "step": 249440 }, { "epoch": 1.61, "learning_rate": 5.849861556632695e-05, "loss": 0.0276, "step": 249450 }, { "epoch": 1.61, "learning_rate": 5.848893421197002e-05, "loss": 0.026, "step": 249460 }, { "epoch": 1.61, "learning_rate": 5.847925285761309e-05, "loss": 0.0225, "step": 249470 }, { "epoch": 1.61, "learning_rate": 5.8469571503256156e-05, "loss": 0.0243, "step": 249480 }, { "epoch": 1.61, "learning_rate": 5.845989014889923e-05, "loss": 0.0251, "step": 249490 }, { "epoch": 1.61, "learning_rate": 5.845020879454229e-05, "loss": 0.0257, "step": 249500 }, { "epoch": 1.61, "learning_rate": 5.844052744018536e-05, "loss": 0.0231, "step": 249510 }, { "epoch": 1.61, "learning_rate": 5.843084608582843e-05, "loss": 0.0292, "step": 249520 }, { "epoch": 1.61, "learning_rate": 5.8421164731471494e-05, "loss": 0.0322, "step": 249530 }, { "epoch": 1.61, "learning_rate": 5.841148337711457e-05, "loss": 0.0278, "step": 249540 }, { "epoch": 1.61, "learning_rate": 5.8401802022757626e-05, "loss": 0.0203, "step": 249550 }, { "epoch": 1.61, "learning_rate": 5.83921206684007e-05, "loss": 0.0251, "step": 249560 }, { "epoch": 1.61, "learning_rate": 5.8382439314043766e-05, "loss": 0.0267, "step": 249570 }, { "epoch": 1.61, "learning_rate": 5.837275795968684e-05, "loss": 0.0233, "step": 249580 }, { "epoch": 1.61, "learning_rate": 5.8363076605329905e-05, "loss": 0.0267, "step": 249590 }, { "epoch": 1.61, "learning_rate": 5.8353395250972964e-05, "loss": 0.0229, "step": 249600 }, { "epoch": 1.61, "learning_rate": 5.834371389661604e-05, "loss": 0.0226, "step": 249610 }, { "epoch": 1.61, "learning_rate": 5.8334032542259104e-05, "loss": 0.0343, "step": 249620 }, { "epoch": 1.61, "learning_rate": 5.832435118790218e-05, "loss": 0.0235, "step": 249630 }, { "epoch": 1.61, "learning_rate": 5.831466983354524e-05, "loss": 0.02, "step": 249640 }, { "epoch": 1.61, "learning_rate": 5.8304988479188316e-05, "loss": 0.029, "step": 249650 }, { "epoch": 1.61, "learning_rate": 5.8295307124831375e-05, "loss": 0.0327, "step": 249660 }, { "epoch": 1.61, "learning_rate": 5.828562577047444e-05, "loss": 0.0244, "step": 249670 }, { "epoch": 1.61, "learning_rate": 5.8275944416117515e-05, "loss": 0.0265, "step": 249680 }, { "epoch": 1.61, "learning_rate": 5.826626306176058e-05, "loss": 0.0251, "step": 249690 }, { "epoch": 1.61, "learning_rate": 5.8256581707403654e-05, "loss": 0.028, "step": 249700 }, { "epoch": 1.61, "learning_rate": 5.8246900353046713e-05, "loss": 0.0271, "step": 249710 }, { "epoch": 1.61, "learning_rate": 5.8237218998689786e-05, "loss": 0.0272, "step": 249720 }, { "epoch": 1.61, "learning_rate": 5.822753764433285e-05, "loss": 0.0314, "step": 249730 }, { "epoch": 1.61, "learning_rate": 5.821785628997592e-05, "loss": 0.022, "step": 249740 }, { "epoch": 1.61, "learning_rate": 5.820817493561899e-05, "loss": 0.0237, "step": 249750 }, { "epoch": 1.61, "learning_rate": 5.819849358126205e-05, "loss": 0.0252, "step": 249760 }, { "epoch": 1.61, "learning_rate": 5.8188812226905124e-05, "loss": 0.0224, "step": 249770 }, { "epoch": 1.61, "learning_rate": 5.817913087254819e-05, "loss": 0.0232, "step": 249780 }, { "epoch": 1.61, "learning_rate": 5.8169449518191264e-05, "loss": 0.0285, "step": 249790 }, { "epoch": 1.61, "learning_rate": 5.815976816383433e-05, "loss": 0.0212, "step": 249800 }, { "epoch": 1.61, "learning_rate": 5.815008680947739e-05, "loss": 0.0261, "step": 249810 }, { "epoch": 1.61, "learning_rate": 5.814040545512046e-05, "loss": 0.0232, "step": 249820 }, { "epoch": 1.61, "learning_rate": 5.813072410076353e-05, "loss": 0.0278, "step": 249830 }, { "epoch": 1.61, "learning_rate": 5.81210427464066e-05, "loss": 0.0262, "step": 249840 }, { "epoch": 1.61, "learning_rate": 5.811136139204967e-05, "loss": 0.0271, "step": 249850 }, { "epoch": 1.61, "learning_rate": 5.810168003769274e-05, "loss": 0.0284, "step": 249860 }, { "epoch": 1.61, "learning_rate": 5.80919986833358e-05, "loss": 0.0236, "step": 249870 }, { "epoch": 1.61, "learning_rate": 5.8082317328978867e-05, "loss": 0.0263, "step": 249880 }, { "epoch": 1.61, "learning_rate": 5.807263597462194e-05, "loss": 0.0246, "step": 249890 }, { "epoch": 1.61, "learning_rate": 5.8062954620265006e-05, "loss": 0.0256, "step": 249900 }, { "epoch": 1.61, "learning_rate": 5.805327326590808e-05, "loss": 0.0233, "step": 249910 }, { "epoch": 1.61, "learning_rate": 5.804359191155114e-05, "loss": 0.0235, "step": 249920 }, { "epoch": 1.61, "learning_rate": 5.803391055719421e-05, "loss": 0.0242, "step": 249930 }, { "epoch": 1.61, "learning_rate": 5.802422920283728e-05, "loss": 0.0237, "step": 249940 }, { "epoch": 1.61, "learning_rate": 5.8014547848480344e-05, "loss": 0.03, "step": 249950 }, { "epoch": 1.61, "learning_rate": 5.800486649412342e-05, "loss": 0.0265, "step": 249960 }, { "epoch": 1.61, "learning_rate": 5.7995185139766476e-05, "loss": 0.0331, "step": 249970 }, { "epoch": 1.61, "learning_rate": 5.798550378540955e-05, "loss": 0.0273, "step": 249980 }, { "epoch": 1.61, "learning_rate": 5.7975822431052616e-05, "loss": 0.0246, "step": 249990 }, { "epoch": 1.61, "learning_rate": 5.796614107669569e-05, "loss": 0.0273, "step": 250000 }, { "epoch": 1.61, "eval_cer": 0.919873460625918, "eval_loss": 0.018918007612228394, "eval_runtime": 119.9798, "eval_samples_per_second": 16.669, "eval_steps_per_second": 4.167, "step": 250000 }, { "epoch": 1.61, "learning_rate": 5.7956459722338755e-05, "loss": 0.0251, "step": 250010 }, { "epoch": 1.61, "learning_rate": 5.7946778367981814e-05, "loss": 0.0285, "step": 250020 }, { "epoch": 1.61, "learning_rate": 5.793709701362489e-05, "loss": 0.0237, "step": 250030 }, { "epoch": 1.61, "learning_rate": 5.7927415659267953e-05, "loss": 0.0238, "step": 250040 }, { "epoch": 1.61, "learning_rate": 5.7917734304911027e-05, "loss": 0.0246, "step": 250050 }, { "epoch": 1.61, "learning_rate": 5.790805295055409e-05, "loss": 0.0298, "step": 250060 }, { "epoch": 1.61, "learning_rate": 5.7898371596197166e-05, "loss": 0.0242, "step": 250070 }, { "epoch": 1.61, "learning_rate": 5.7888690241840225e-05, "loss": 0.0295, "step": 250080 }, { "epoch": 1.61, "learning_rate": 5.787900888748329e-05, "loss": 0.0223, "step": 250090 }, { "epoch": 1.61, "learning_rate": 5.7869327533126364e-05, "loss": 0.0229, "step": 250100 }, { "epoch": 1.61, "learning_rate": 5.785964617876943e-05, "loss": 0.0247, "step": 250110 }, { "epoch": 1.61, "learning_rate": 5.7849964824412504e-05, "loss": 0.0257, "step": 250120 }, { "epoch": 1.61, "learning_rate": 5.784028347005556e-05, "loss": 0.0283, "step": 250130 }, { "epoch": 1.61, "learning_rate": 5.7830602115698636e-05, "loss": 0.0261, "step": 250140 }, { "epoch": 1.61, "learning_rate": 5.78209207613417e-05, "loss": 0.0212, "step": 250150 }, { "epoch": 1.61, "learning_rate": 5.781123940698477e-05, "loss": 0.0292, "step": 250160 }, { "epoch": 1.61, "learning_rate": 5.780155805262784e-05, "loss": 0.0293, "step": 250170 }, { "epoch": 1.61, "learning_rate": 5.77918766982709e-05, "loss": 0.0257, "step": 250180 }, { "epoch": 1.61, "learning_rate": 5.7782195343913974e-05, "loss": 0.0288, "step": 250190 }, { "epoch": 1.61, "learning_rate": 5.777251398955704e-05, "loss": 0.0269, "step": 250200 }, { "epoch": 1.61, "learning_rate": 5.7762832635200113e-05, "loss": 0.0229, "step": 250210 }, { "epoch": 1.61, "learning_rate": 5.775315128084318e-05, "loss": 0.0237, "step": 250220 }, { "epoch": 1.62, "learning_rate": 5.774346992648624e-05, "loss": 0.0231, "step": 250230 }, { "epoch": 1.62, "learning_rate": 5.773378857212931e-05, "loss": 0.027, "step": 250240 }, { "epoch": 1.62, "learning_rate": 5.772410721777238e-05, "loss": 0.026, "step": 250250 }, { "epoch": 1.62, "learning_rate": 5.771442586341545e-05, "loss": 0.027, "step": 250260 }, { "epoch": 1.62, "learning_rate": 5.770474450905852e-05, "loss": 0.0259, "step": 250270 }, { "epoch": 1.62, "learning_rate": 5.769506315470159e-05, "loss": 0.0252, "step": 250280 }, { "epoch": 1.62, "learning_rate": 5.768538180034465e-05, "loss": 0.029, "step": 250290 }, { "epoch": 1.62, "learning_rate": 5.7675700445987716e-05, "loss": 0.0275, "step": 250300 }, { "epoch": 1.62, "learning_rate": 5.766601909163079e-05, "loss": 0.0232, "step": 250310 }, { "epoch": 1.62, "learning_rate": 5.7656337737273856e-05, "loss": 0.0222, "step": 250320 }, { "epoch": 1.62, "learning_rate": 5.764665638291693e-05, "loss": 0.0266, "step": 250330 }, { "epoch": 1.62, "learning_rate": 5.763697502855999e-05, "loss": 0.0276, "step": 250340 }, { "epoch": 1.62, "learning_rate": 5.762729367420306e-05, "loss": 0.0255, "step": 250350 }, { "epoch": 1.62, "learning_rate": 5.761761231984613e-05, "loss": 0.0286, "step": 250360 }, { "epoch": 1.62, "learning_rate": 5.7607930965489194e-05, "loss": 0.0262, "step": 250370 }, { "epoch": 1.62, "learning_rate": 5.7598249611132267e-05, "loss": 0.0276, "step": 250380 }, { "epoch": 1.62, "learning_rate": 5.7588568256775326e-05, "loss": 0.0243, "step": 250390 }, { "epoch": 1.62, "learning_rate": 5.75788869024184e-05, "loss": 0.0279, "step": 250400 }, { "epoch": 1.62, "learning_rate": 5.7569205548061465e-05, "loss": 0.0299, "step": 250410 }, { "epoch": 1.62, "learning_rate": 5.755952419370454e-05, "loss": 0.025, "step": 250420 }, { "epoch": 1.62, "learning_rate": 5.7549842839347605e-05, "loss": 0.0247, "step": 250430 }, { "epoch": 1.62, "learning_rate": 5.7540161484990664e-05, "loss": 0.035, "step": 250440 }, { "epoch": 1.62, "learning_rate": 5.753048013063374e-05, "loss": 0.025, "step": 250450 }, { "epoch": 1.62, "learning_rate": 5.75207987762768e-05, "loss": 0.02, "step": 250460 }, { "epoch": 1.62, "learning_rate": 5.7511117421919876e-05, "loss": 0.0279, "step": 250470 }, { "epoch": 1.62, "learning_rate": 5.750143606756294e-05, "loss": 0.0229, "step": 250480 }, { "epoch": 1.62, "learning_rate": 5.7491754713206e-05, "loss": 0.0298, "step": 250490 }, { "epoch": 1.62, "learning_rate": 5.7482073358849075e-05, "loss": 0.0247, "step": 250500 }, { "epoch": 1.62, "learning_rate": 5.747239200449214e-05, "loss": 0.0264, "step": 250510 }, { "epoch": 1.62, "learning_rate": 5.7462710650135214e-05, "loss": 0.0272, "step": 250520 }, { "epoch": 1.62, "learning_rate": 5.745302929577828e-05, "loss": 0.0227, "step": 250530 }, { "epoch": 1.62, "learning_rate": 5.744334794142135e-05, "loss": 0.0225, "step": 250540 }, { "epoch": 1.62, "learning_rate": 5.743366658706441e-05, "loss": 0.022, "step": 250550 }, { "epoch": 1.62, "learning_rate": 5.742398523270748e-05, "loss": 0.0233, "step": 250560 }, { "epoch": 1.62, "learning_rate": 5.741430387835055e-05, "loss": 0.0198, "step": 250570 }, { "epoch": 1.62, "learning_rate": 5.740462252399362e-05, "loss": 0.0212, "step": 250580 }, { "epoch": 1.62, "learning_rate": 5.7394941169636685e-05, "loss": 0.0278, "step": 250590 }, { "epoch": 1.62, "learning_rate": 5.738525981527975e-05, "loss": 0.0266, "step": 250600 }, { "epoch": 1.62, "learning_rate": 5.7375578460922824e-05, "loss": 0.0216, "step": 250610 }, { "epoch": 1.62, "learning_rate": 5.736589710656589e-05, "loss": 0.0235, "step": 250620 }, { "epoch": 1.62, "learning_rate": 5.7356215752208956e-05, "loss": 0.0311, "step": 250630 }, { "epoch": 1.62, "learning_rate": 5.734653439785202e-05, "loss": 0.0232, "step": 250640 }, { "epoch": 1.62, "learning_rate": 5.733685304349509e-05, "loss": 0.0252, "step": 250650 }, { "epoch": 1.62, "learning_rate": 5.732717168913816e-05, "loss": 0.0274, "step": 250660 }, { "epoch": 1.62, "learning_rate": 5.731749033478123e-05, "loss": 0.0232, "step": 250670 }, { "epoch": 1.62, "learning_rate": 5.73078089804243e-05, "loss": 0.0237, "step": 250680 }, { "epoch": 1.62, "learning_rate": 5.729812762606736e-05, "loss": 0.0282, "step": 250690 }, { "epoch": 1.62, "learning_rate": 5.728844627171043e-05, "loss": 0.0239, "step": 250700 }, { "epoch": 1.62, "learning_rate": 5.72787649173535e-05, "loss": 0.0214, "step": 250710 }, { "epoch": 1.62, "learning_rate": 5.7269083562996566e-05, "loss": 0.023, "step": 250720 }, { "epoch": 1.62, "learning_rate": 5.725940220863964e-05, "loss": 0.0275, "step": 250730 }, { "epoch": 1.62, "learning_rate": 5.72497208542827e-05, "loss": 0.0237, "step": 250740 }, { "epoch": 1.62, "learning_rate": 5.724003949992577e-05, "loss": 0.027, "step": 250750 }, { "epoch": 1.62, "learning_rate": 5.723035814556884e-05, "loss": 0.0266, "step": 250760 }, { "epoch": 1.62, "learning_rate": 5.7220676791211904e-05, "loss": 0.0275, "step": 250770 }, { "epoch": 1.62, "learning_rate": 5.721099543685498e-05, "loss": 0.0217, "step": 250780 }, { "epoch": 1.62, "learning_rate": 5.720131408249804e-05, "loss": 0.0263, "step": 250790 }, { "epoch": 1.62, "learning_rate": 5.719163272814111e-05, "loss": 0.0231, "step": 250800 }, { "epoch": 1.62, "learning_rate": 5.7181951373784176e-05, "loss": 0.022, "step": 250810 }, { "epoch": 1.62, "learning_rate": 5.717227001942725e-05, "loss": 0.0286, "step": 250820 }, { "epoch": 1.62, "learning_rate": 5.7162588665070315e-05, "loss": 0.0273, "step": 250830 }, { "epoch": 1.62, "learning_rate": 5.7152907310713375e-05, "loss": 0.0241, "step": 250840 }, { "epoch": 1.62, "learning_rate": 5.714322595635645e-05, "loss": 0.0235, "step": 250850 }, { "epoch": 1.62, "learning_rate": 5.7133544601999514e-05, "loss": 0.0292, "step": 250860 }, { "epoch": 1.62, "learning_rate": 5.712386324764259e-05, "loss": 0.0353, "step": 250870 }, { "epoch": 1.62, "learning_rate": 5.711418189328565e-05, "loss": 0.0231, "step": 250880 }, { "epoch": 1.62, "learning_rate": 5.7104500538928726e-05, "loss": 0.0283, "step": 250890 }, { "epoch": 1.62, "learning_rate": 5.7094819184571786e-05, "loss": 0.0208, "step": 250900 }, { "epoch": 1.62, "learning_rate": 5.708513783021485e-05, "loss": 0.0284, "step": 250910 }, { "epoch": 1.62, "learning_rate": 5.7075456475857925e-05, "loss": 0.0308, "step": 250920 }, { "epoch": 1.62, "learning_rate": 5.706577512150099e-05, "loss": 0.0252, "step": 250930 }, { "epoch": 1.62, "learning_rate": 5.7056093767144064e-05, "loss": 0.027, "step": 250940 }, { "epoch": 1.62, "learning_rate": 5.7046412412787124e-05, "loss": 0.0276, "step": 250950 }, { "epoch": 1.62, "learning_rate": 5.7036731058430197e-05, "loss": 0.0265, "step": 250960 }, { "epoch": 1.62, "learning_rate": 5.702704970407326e-05, "loss": 0.0305, "step": 250970 }, { "epoch": 1.62, "learning_rate": 5.701736834971633e-05, "loss": 0.04, "step": 250980 }, { "epoch": 1.62, "learning_rate": 5.70076869953594e-05, "loss": 0.0228, "step": 250990 }, { "epoch": 1.62, "learning_rate": 5.699800564100246e-05, "loss": 0.0246, "step": 251000 }, { "epoch": 1.62, "eval_cer": 0.9198400180770534, "eval_loss": 0.018709488213062286, "eval_runtime": 120.2758, "eval_samples_per_second": 16.628, "eval_steps_per_second": 4.157, "step": 251000 }, { "epoch": 1.62, "learning_rate": 5.6988324286645535e-05, "loss": 0.0307, "step": 251010 }, { "epoch": 1.62, "learning_rate": 5.69786429322886e-05, "loss": 0.0268, "step": 251020 }, { "epoch": 1.62, "learning_rate": 5.6968961577931674e-05, "loss": 0.022, "step": 251030 }, { "epoch": 1.62, "learning_rate": 5.695928022357474e-05, "loss": 0.0245, "step": 251040 }, { "epoch": 1.62, "learning_rate": 5.69495988692178e-05, "loss": 0.0296, "step": 251050 }, { "epoch": 1.62, "learning_rate": 5.693991751486087e-05, "loss": 0.0287, "step": 251060 }, { "epoch": 1.62, "learning_rate": 5.693023616050394e-05, "loss": 0.0268, "step": 251070 }, { "epoch": 1.62, "learning_rate": 5.692055480614701e-05, "loss": 0.0219, "step": 251080 }, { "epoch": 1.62, "learning_rate": 5.691087345179008e-05, "loss": 0.0243, "step": 251090 }, { "epoch": 1.62, "learning_rate": 5.690119209743315e-05, "loss": 0.0253, "step": 251100 }, { "epoch": 1.62, "learning_rate": 5.689151074307621e-05, "loss": 0.0217, "step": 251110 }, { "epoch": 1.62, "learning_rate": 5.688182938871928e-05, "loss": 0.0251, "step": 251120 }, { "epoch": 1.62, "learning_rate": 5.687214803436235e-05, "loss": 0.0283, "step": 251130 }, { "epoch": 1.62, "learning_rate": 5.6862466680005416e-05, "loss": 0.0257, "step": 251140 }, { "epoch": 1.62, "learning_rate": 5.685278532564849e-05, "loss": 0.0286, "step": 251150 }, { "epoch": 1.62, "learning_rate": 5.684310397129155e-05, "loss": 0.0305, "step": 251160 }, { "epoch": 1.62, "learning_rate": 5.683342261693462e-05, "loss": 0.0265, "step": 251170 }, { "epoch": 1.62, "learning_rate": 5.682374126257769e-05, "loss": 0.0255, "step": 251180 }, { "epoch": 1.62, "learning_rate": 5.6814059908220754e-05, "loss": 0.0232, "step": 251190 }, { "epoch": 1.62, "learning_rate": 5.680437855386383e-05, "loss": 0.0254, "step": 251200 }, { "epoch": 1.62, "learning_rate": 5.6794697199506886e-05, "loss": 0.0214, "step": 251210 }, { "epoch": 1.62, "learning_rate": 5.678501584514996e-05, "loss": 0.0292, "step": 251220 }, { "epoch": 1.62, "learning_rate": 5.6775334490793026e-05, "loss": 0.0237, "step": 251230 }, { "epoch": 1.62, "learning_rate": 5.67656531364361e-05, "loss": 0.0238, "step": 251240 }, { "epoch": 1.62, "learning_rate": 5.6755971782079165e-05, "loss": 0.0291, "step": 251250 }, { "epoch": 1.62, "learning_rate": 5.6746290427722224e-05, "loss": 0.024, "step": 251260 }, { "epoch": 1.62, "learning_rate": 5.67366090733653e-05, "loss": 0.0204, "step": 251270 }, { "epoch": 1.62, "learning_rate": 5.6726927719008364e-05, "loss": 0.024, "step": 251280 }, { "epoch": 1.62, "learning_rate": 5.671724636465144e-05, "loss": 0.0297, "step": 251290 }, { "epoch": 1.62, "learning_rate": 5.67075650102945e-05, "loss": 0.0196, "step": 251300 }, { "epoch": 1.62, "learning_rate": 5.6697883655937576e-05, "loss": 0.0242, "step": 251310 }, { "epoch": 1.62, "learning_rate": 5.6688202301580635e-05, "loss": 0.0251, "step": 251320 }, { "epoch": 1.62, "learning_rate": 5.66785209472237e-05, "loss": 0.027, "step": 251330 }, { "epoch": 1.62, "learning_rate": 5.6668839592866775e-05, "loss": 0.0301, "step": 251340 }, { "epoch": 1.62, "learning_rate": 5.665915823850984e-05, "loss": 0.0227, "step": 251350 }, { "epoch": 1.62, "learning_rate": 5.6649476884152914e-05, "loss": 0.0262, "step": 251360 }, { "epoch": 1.62, "learning_rate": 5.663979552979597e-05, "loss": 0.0278, "step": 251370 }, { "epoch": 1.62, "learning_rate": 5.6630114175439046e-05, "loss": 0.0255, "step": 251380 }, { "epoch": 1.62, "learning_rate": 5.662043282108211e-05, "loss": 0.0242, "step": 251390 }, { "epoch": 1.62, "learning_rate": 5.661075146672518e-05, "loss": 0.0307, "step": 251400 }, { "epoch": 1.62, "learning_rate": 5.660107011236825e-05, "loss": 0.0226, "step": 251410 }, { "epoch": 1.62, "learning_rate": 5.659138875801131e-05, "loss": 0.0293, "step": 251420 }, { "epoch": 1.62, "learning_rate": 5.6581707403654384e-05, "loss": 0.029, "step": 251430 }, { "epoch": 1.62, "learning_rate": 5.657202604929745e-05, "loss": 0.0274, "step": 251440 }, { "epoch": 1.62, "learning_rate": 5.6562344694940524e-05, "loss": 0.024, "step": 251450 }, { "epoch": 1.62, "learning_rate": 5.655266334058359e-05, "loss": 0.0268, "step": 251460 }, { "epoch": 1.62, "learning_rate": 5.654298198622665e-05, "loss": 0.0249, "step": 251470 }, { "epoch": 1.62, "learning_rate": 5.653330063186972e-05, "loss": 0.0313, "step": 251480 }, { "epoch": 1.62, "learning_rate": 5.652361927751279e-05, "loss": 0.0294, "step": 251490 }, { "epoch": 1.62, "learning_rate": 5.651393792315586e-05, "loss": 0.0268, "step": 251500 }, { "epoch": 1.62, "learning_rate": 5.650425656879893e-05, "loss": 0.0214, "step": 251510 }, { "epoch": 1.62, "learning_rate": 5.6494575214442e-05, "loss": 0.0244, "step": 251520 }, { "epoch": 1.62, "learning_rate": 5.648489386008506e-05, "loss": 0.0252, "step": 251530 }, { "epoch": 1.62, "learning_rate": 5.6475212505728127e-05, "loss": 0.0287, "step": 251540 }, { "epoch": 1.62, "learning_rate": 5.64655311513712e-05, "loss": 0.028, "step": 251550 }, { "epoch": 1.62, "learning_rate": 5.6455849797014266e-05, "loss": 0.0264, "step": 251560 }, { "epoch": 1.62, "learning_rate": 5.644616844265734e-05, "loss": 0.0286, "step": 251570 }, { "epoch": 1.62, "learning_rate": 5.64364870883004e-05, "loss": 0.0251, "step": 251580 }, { "epoch": 1.62, "learning_rate": 5.642680573394347e-05, "loss": 0.0267, "step": 251590 }, { "epoch": 1.62, "learning_rate": 5.641712437958654e-05, "loss": 0.0249, "step": 251600 }, { "epoch": 1.62, "learning_rate": 5.6407443025229604e-05, "loss": 0.0267, "step": 251610 }, { "epoch": 1.62, "learning_rate": 5.639776167087268e-05, "loss": 0.0284, "step": 251620 }, { "epoch": 1.62, "learning_rate": 5.6388080316515736e-05, "loss": 0.0279, "step": 251630 }, { "epoch": 1.62, "learning_rate": 5.637839896215881e-05, "loss": 0.0274, "step": 251640 }, { "epoch": 1.62, "learning_rate": 5.6368717607801875e-05, "loss": 0.0261, "step": 251650 }, { "epoch": 1.62, "learning_rate": 5.635903625344495e-05, "loss": 0.0295, "step": 251660 }, { "epoch": 1.62, "learning_rate": 5.6349354899088015e-05, "loss": 0.0272, "step": 251670 }, { "epoch": 1.62, "learning_rate": 5.6339673544731074e-05, "loss": 0.0265, "step": 251680 }, { "epoch": 1.62, "learning_rate": 5.632999219037415e-05, "loss": 0.0235, "step": 251690 }, { "epoch": 1.62, "learning_rate": 5.6320310836017213e-05, "loss": 0.0252, "step": 251700 }, { "epoch": 1.62, "learning_rate": 5.6310629481660286e-05, "loss": 0.0259, "step": 251710 }, { "epoch": 1.62, "learning_rate": 5.630094812730335e-05, "loss": 0.0292, "step": 251720 }, { "epoch": 1.62, "learning_rate": 5.629126677294642e-05, "loss": 0.0332, "step": 251730 }, { "epoch": 1.62, "learning_rate": 5.6281585418589485e-05, "loss": 0.0263, "step": 251740 }, { "epoch": 1.62, "learning_rate": 5.627190406423255e-05, "loss": 0.0327, "step": 251750 }, { "epoch": 1.62, "learning_rate": 5.6262222709875624e-05, "loss": 0.0219, "step": 251760 }, { "epoch": 1.62, "learning_rate": 5.625254135551869e-05, "loss": 0.0295, "step": 251770 }, { "epoch": 1.63, "learning_rate": 5.624286000116176e-05, "loss": 0.0264, "step": 251780 }, { "epoch": 1.63, "learning_rate": 5.623317864680482e-05, "loss": 0.0233, "step": 251790 }, { "epoch": 1.63, "learning_rate": 5.6223497292447896e-05, "loss": 0.0297, "step": 251800 }, { "epoch": 1.63, "learning_rate": 5.621381593809096e-05, "loss": 0.0279, "step": 251810 }, { "epoch": 1.63, "learning_rate": 5.620413458373403e-05, "loss": 0.0285, "step": 251820 }, { "epoch": 1.63, "learning_rate": 5.6194453229377095e-05, "loss": 0.0254, "step": 251830 }, { "epoch": 1.63, "learning_rate": 5.618477187502016e-05, "loss": 0.0267, "step": 251840 }, { "epoch": 1.63, "learning_rate": 5.6175090520663234e-05, "loss": 0.0224, "step": 251850 }, { "epoch": 1.63, "learning_rate": 5.61654091663063e-05, "loss": 0.0204, "step": 251860 }, { "epoch": 1.63, "learning_rate": 5.6155727811949373e-05, "loss": 0.0217, "step": 251870 }, { "epoch": 1.63, "learning_rate": 5.614604645759243e-05, "loss": 0.0258, "step": 251880 }, { "epoch": 1.63, "learning_rate": 5.61363651032355e-05, "loss": 0.0277, "step": 251890 }, { "epoch": 1.63, "learning_rate": 5.612668374887857e-05, "loss": 0.0276, "step": 251900 }, { "epoch": 1.63, "learning_rate": 5.611700239452164e-05, "loss": 0.0194, "step": 251910 }, { "epoch": 1.63, "learning_rate": 5.610732104016471e-05, "loss": 0.0227, "step": 251920 }, { "epoch": 1.63, "learning_rate": 5.609763968580778e-05, "loss": 0.0265, "step": 251930 }, { "epoch": 1.63, "learning_rate": 5.6087958331450844e-05, "loss": 0.0308, "step": 251940 }, { "epoch": 1.63, "learning_rate": 5.607827697709391e-05, "loss": 0.0227, "step": 251950 }, { "epoch": 1.63, "learning_rate": 5.6068595622736976e-05, "loss": 0.0262, "step": 251960 }, { "epoch": 1.63, "learning_rate": 5.605891426838005e-05, "loss": 0.0285, "step": 251970 }, { "epoch": 1.63, "learning_rate": 5.6049232914023116e-05, "loss": 0.0289, "step": 251980 }, { "epoch": 1.63, "learning_rate": 5.603955155966618e-05, "loss": 0.0272, "step": 251990 }, { "epoch": 1.63, "learning_rate": 5.602987020530925e-05, "loss": 0.0309, "step": 252000 }, { "epoch": 1.63, "eval_cer": 0.9198192294655971, "eval_loss": 0.018738944083452225, "eval_runtime": 120.2162, "eval_samples_per_second": 16.637, "eval_steps_per_second": 4.159, "step": 252000 }, { "epoch": 1.63, "learning_rate": 5.602018885095232e-05, "loss": 0.0267, "step": 252010 }, { "epoch": 1.63, "learning_rate": 5.601050749659539e-05, "loss": 0.0254, "step": 252020 }, { "epoch": 1.63, "learning_rate": 5.6000826142238454e-05, "loss": 0.0268, "step": 252030 }, { "epoch": 1.63, "learning_rate": 5.599114478788152e-05, "loss": 0.0209, "step": 252040 }, { "epoch": 1.63, "learning_rate": 5.5981463433524586e-05, "loss": 0.0259, "step": 252050 }, { "epoch": 1.63, "learning_rate": 5.597178207916766e-05, "loss": 0.0269, "step": 252060 }, { "epoch": 1.63, "learning_rate": 5.5962100724810725e-05, "loss": 0.0256, "step": 252070 }, { "epoch": 1.63, "learning_rate": 5.59524193704538e-05, "loss": 0.0279, "step": 252080 }, { "epoch": 1.63, "learning_rate": 5.594273801609686e-05, "loss": 0.0268, "step": 252090 }, { "epoch": 1.63, "learning_rate": 5.5933056661739924e-05, "loss": 0.0254, "step": 252100 }, { "epoch": 1.63, "learning_rate": 5.5923375307383e-05, "loss": 0.03, "step": 252110 }, { "epoch": 1.63, "learning_rate": 5.591369395302606e-05, "loss": 0.0277, "step": 252120 }, { "epoch": 1.63, "learning_rate": 5.5904012598669136e-05, "loss": 0.022, "step": 252130 }, { "epoch": 1.63, "learning_rate": 5.5894331244312196e-05, "loss": 0.0235, "step": 252140 }, { "epoch": 1.63, "learning_rate": 5.588464988995527e-05, "loss": 0.0256, "step": 252150 }, { "epoch": 1.63, "learning_rate": 5.5874968535598335e-05, "loss": 0.0233, "step": 252160 }, { "epoch": 1.63, "learning_rate": 5.58652871812414e-05, "loss": 0.0247, "step": 252170 }, { "epoch": 1.63, "learning_rate": 5.5855605826884474e-05, "loss": 0.0283, "step": 252180 }, { "epoch": 1.63, "learning_rate": 5.5845924472527534e-05, "loss": 0.0329, "step": 252190 }, { "epoch": 1.63, "learning_rate": 5.583624311817061e-05, "loss": 0.0258, "step": 252200 }, { "epoch": 1.63, "learning_rate": 5.582656176381367e-05, "loss": 0.0247, "step": 252210 }, { "epoch": 1.63, "learning_rate": 5.581688040945674e-05, "loss": 0.0244, "step": 252220 }, { "epoch": 1.63, "learning_rate": 5.580719905509981e-05, "loss": 0.0271, "step": 252230 }, { "epoch": 1.63, "learning_rate": 5.579751770074287e-05, "loss": 0.027, "step": 252240 }, { "epoch": 1.63, "learning_rate": 5.5787836346385945e-05, "loss": 0.0259, "step": 252250 }, { "epoch": 1.63, "learning_rate": 5.577815499202901e-05, "loss": 0.0253, "step": 252260 }, { "epoch": 1.63, "learning_rate": 5.5768473637672084e-05, "loss": 0.0321, "step": 252270 }, { "epoch": 1.63, "learning_rate": 5.575879228331515e-05, "loss": 0.0231, "step": 252280 }, { "epoch": 1.63, "learning_rate": 5.574911092895821e-05, "loss": 0.0227, "step": 252290 }, { "epoch": 1.63, "learning_rate": 5.573942957460128e-05, "loss": 0.0248, "step": 252300 }, { "epoch": 1.63, "learning_rate": 5.572974822024435e-05, "loss": 0.0231, "step": 252310 }, { "epoch": 1.63, "learning_rate": 5.572006686588742e-05, "loss": 0.0274, "step": 252320 }, { "epoch": 1.63, "learning_rate": 5.571038551153049e-05, "loss": 0.0276, "step": 252330 }, { "epoch": 1.63, "learning_rate": 5.570070415717356e-05, "loss": 0.0255, "step": 252340 }, { "epoch": 1.63, "learning_rate": 5.569102280281662e-05, "loss": 0.0257, "step": 252350 }, { "epoch": 1.63, "learning_rate": 5.568134144845969e-05, "loss": 0.024, "step": 252360 }, { "epoch": 1.63, "learning_rate": 5.567166009410276e-05, "loss": 0.0258, "step": 252370 }, { "epoch": 1.63, "learning_rate": 5.5661978739745826e-05, "loss": 0.0264, "step": 252380 }, { "epoch": 1.63, "learning_rate": 5.56522973853889e-05, "loss": 0.0244, "step": 252390 }, { "epoch": 1.63, "learning_rate": 5.564261603103196e-05, "loss": 0.0238, "step": 252400 }, { "epoch": 1.63, "learning_rate": 5.563293467667503e-05, "loss": 0.0224, "step": 252410 }, { "epoch": 1.63, "learning_rate": 5.56232533223181e-05, "loss": 0.0337, "step": 252420 }, { "epoch": 1.63, "learning_rate": 5.5613571967961164e-05, "loss": 0.0267, "step": 252430 }, { "epoch": 1.63, "learning_rate": 5.560389061360424e-05, "loss": 0.0269, "step": 252440 }, { "epoch": 1.63, "learning_rate": 5.5594209259247297e-05, "loss": 0.0289, "step": 252450 }, { "epoch": 1.63, "learning_rate": 5.558452790489037e-05, "loss": 0.0216, "step": 252460 }, { "epoch": 1.63, "learning_rate": 5.5574846550533436e-05, "loss": 0.0241, "step": 252470 }, { "epoch": 1.63, "learning_rate": 5.556516519617651e-05, "loss": 0.0261, "step": 252480 }, { "epoch": 1.63, "learning_rate": 5.5555483841819575e-05, "loss": 0.0251, "step": 252490 }, { "epoch": 1.63, "learning_rate": 5.5545802487462635e-05, "loss": 0.0258, "step": 252500 }, { "epoch": 1.63, "learning_rate": 5.553612113310571e-05, "loss": 0.0277, "step": 252510 }, { "epoch": 1.63, "learning_rate": 5.5526439778748774e-05, "loss": 0.0255, "step": 252520 }, { "epoch": 1.63, "learning_rate": 5.551675842439185e-05, "loss": 0.0273, "step": 252530 }, { "epoch": 1.63, "learning_rate": 5.550707707003491e-05, "loss": 0.0253, "step": 252540 }, { "epoch": 1.63, "learning_rate": 5.5497395715677986e-05, "loss": 0.0253, "step": 252550 }, { "epoch": 1.63, "learning_rate": 5.5487714361321046e-05, "loss": 0.024, "step": 252560 }, { "epoch": 1.63, "learning_rate": 5.547803300696411e-05, "loss": 0.0357, "step": 252570 }, { "epoch": 1.63, "learning_rate": 5.5468351652607185e-05, "loss": 0.0196, "step": 252580 }, { "epoch": 1.63, "learning_rate": 5.545867029825025e-05, "loss": 0.0288, "step": 252590 }, { "epoch": 1.63, "learning_rate": 5.5448988943893324e-05, "loss": 0.0281, "step": 252600 }, { "epoch": 1.63, "learning_rate": 5.5439307589536384e-05, "loss": 0.0294, "step": 252610 }, { "epoch": 1.63, "learning_rate": 5.5429626235179457e-05, "loss": 0.0239, "step": 252620 }, { "epoch": 1.63, "learning_rate": 5.541994488082252e-05, "loss": 0.0226, "step": 252630 }, { "epoch": 1.63, "learning_rate": 5.541026352646559e-05, "loss": 0.0251, "step": 252640 }, { "epoch": 1.63, "learning_rate": 5.540058217210866e-05, "loss": 0.0247, "step": 252650 }, { "epoch": 1.63, "learning_rate": 5.539090081775172e-05, "loss": 0.027, "step": 252660 }, { "epoch": 1.63, "learning_rate": 5.5381219463394795e-05, "loss": 0.0227, "step": 252670 }, { "epoch": 1.63, "learning_rate": 5.537153810903786e-05, "loss": 0.0232, "step": 252680 }, { "epoch": 1.63, "learning_rate": 5.5361856754680934e-05, "loss": 0.0238, "step": 252690 }, { "epoch": 1.63, "learning_rate": 5.5352175400324e-05, "loss": 0.0234, "step": 252700 }, { "epoch": 1.63, "learning_rate": 5.534249404596706e-05, "loss": 0.0272, "step": 252710 }, { "epoch": 1.63, "learning_rate": 5.533281269161013e-05, "loss": 0.0227, "step": 252720 }, { "epoch": 1.63, "learning_rate": 5.53231313372532e-05, "loss": 0.0257, "step": 252730 }, { "epoch": 1.63, "learning_rate": 5.531344998289627e-05, "loss": 0.0222, "step": 252740 }, { "epoch": 1.63, "learning_rate": 5.530376862853934e-05, "loss": 0.0218, "step": 252750 }, { "epoch": 1.63, "learning_rate": 5.529408727418241e-05, "loss": 0.0259, "step": 252760 }, { "epoch": 1.63, "learning_rate": 5.528440591982547e-05, "loss": 0.0227, "step": 252770 }, { "epoch": 1.63, "learning_rate": 5.527472456546854e-05, "loss": 0.0309, "step": 252780 }, { "epoch": 1.63, "learning_rate": 5.526504321111161e-05, "loss": 0.0217, "step": 252790 }, { "epoch": 1.63, "learning_rate": 5.5255361856754676e-05, "loss": 0.022, "step": 252800 }, { "epoch": 1.63, "learning_rate": 5.524568050239775e-05, "loss": 0.0231, "step": 252810 }, { "epoch": 1.63, "learning_rate": 5.523599914804081e-05, "loss": 0.0237, "step": 252820 }, { "epoch": 1.63, "learning_rate": 5.522631779368388e-05, "loss": 0.0259, "step": 252830 }, { "epoch": 1.63, "learning_rate": 5.521663643932695e-05, "loss": 0.0266, "step": 252840 }, { "epoch": 1.63, "learning_rate": 5.5206955084970014e-05, "loss": 0.0313, "step": 252850 }, { "epoch": 1.63, "learning_rate": 5.519727373061309e-05, "loss": 0.0228, "step": 252860 }, { "epoch": 1.63, "learning_rate": 5.5187592376256146e-05, "loss": 0.0307, "step": 252870 }, { "epoch": 1.63, "learning_rate": 5.517791102189922e-05, "loss": 0.0219, "step": 252880 }, { "epoch": 1.63, "learning_rate": 5.5168229667542286e-05, "loss": 0.0254, "step": 252890 }, { "epoch": 1.63, "learning_rate": 5.515854831318536e-05, "loss": 0.0263, "step": 252900 }, { "epoch": 1.63, "learning_rate": 5.5148866958828425e-05, "loss": 0.0256, "step": 252910 }, { "epoch": 1.63, "learning_rate": 5.5139185604471484e-05, "loss": 0.024, "step": 252920 }, { "epoch": 1.63, "learning_rate": 5.512950425011456e-05, "loss": 0.0212, "step": 252930 }, { "epoch": 1.63, "learning_rate": 5.5119822895757624e-05, "loss": 0.023, "step": 252940 }, { "epoch": 1.63, "learning_rate": 5.51101415414007e-05, "loss": 0.0353, "step": 252950 }, { "epoch": 1.63, "learning_rate": 5.510046018704376e-05, "loss": 0.027, "step": 252960 }, { "epoch": 1.63, "learning_rate": 5.5090778832686836e-05, "loss": 0.0242, "step": 252970 }, { "epoch": 1.63, "learning_rate": 5.5081097478329895e-05, "loss": 0.0246, "step": 252980 }, { "epoch": 1.63, "learning_rate": 5.507141612397296e-05, "loss": 0.0271, "step": 252990 }, { "epoch": 1.63, "learning_rate": 5.5061734769616035e-05, "loss": 0.0237, "step": 253000 }, { "epoch": 1.63, "eval_cer": 0.9198508643091177, "eval_loss": 0.018802916631102562, "eval_runtime": 119.9935, "eval_samples_per_second": 16.668, "eval_steps_per_second": 4.167, "step": 253000 }, { "epoch": 1.63, "learning_rate": 5.50520534152591e-05, "loss": 0.0292, "step": 253010 }, { "epoch": 1.63, "learning_rate": 5.5042372060902174e-05, "loss": 0.0239, "step": 253020 }, { "epoch": 1.63, "learning_rate": 5.503269070654523e-05, "loss": 0.0221, "step": 253030 }, { "epoch": 1.63, "learning_rate": 5.5023009352188306e-05, "loss": 0.0239, "step": 253040 }, { "epoch": 1.63, "learning_rate": 5.501332799783137e-05, "loss": 0.023, "step": 253050 }, { "epoch": 1.63, "learning_rate": 5.500364664347444e-05, "loss": 0.0234, "step": 253060 }, { "epoch": 1.63, "learning_rate": 5.499396528911751e-05, "loss": 0.0289, "step": 253070 }, { "epoch": 1.63, "learning_rate": 5.498428393476057e-05, "loss": 0.0263, "step": 253080 }, { "epoch": 1.63, "learning_rate": 5.4974602580403644e-05, "loss": 0.0207, "step": 253090 }, { "epoch": 1.63, "learning_rate": 5.496492122604671e-05, "loss": 0.0227, "step": 253100 }, { "epoch": 1.63, "learning_rate": 5.4955239871689784e-05, "loss": 0.0216, "step": 253110 }, { "epoch": 1.63, "learning_rate": 5.494555851733285e-05, "loss": 0.0287, "step": 253120 }, { "epoch": 1.63, "learning_rate": 5.493587716297591e-05, "loss": 0.0237, "step": 253130 }, { "epoch": 1.63, "learning_rate": 5.492619580861898e-05, "loss": 0.0278, "step": 253140 }, { "epoch": 1.63, "learning_rate": 5.491651445426205e-05, "loss": 0.0215, "step": 253150 }, { "epoch": 1.63, "learning_rate": 5.490683309990512e-05, "loss": 0.0302, "step": 253160 }, { "epoch": 1.63, "learning_rate": 5.489715174554819e-05, "loss": 0.0266, "step": 253170 }, { "epoch": 1.63, "learning_rate": 5.4887470391191254e-05, "loss": 0.029, "step": 253180 }, { "epoch": 1.63, "learning_rate": 5.487778903683432e-05, "loss": 0.0227, "step": 253190 }, { "epoch": 1.63, "learning_rate": 5.4868107682477387e-05, "loss": 0.0254, "step": 253200 }, { "epoch": 1.63, "learning_rate": 5.485842632812046e-05, "loss": 0.0245, "step": 253210 }, { "epoch": 1.63, "learning_rate": 5.4848744973763526e-05, "loss": 0.0251, "step": 253220 }, { "epoch": 1.63, "learning_rate": 5.483906361940659e-05, "loss": 0.0233, "step": 253230 }, { "epoch": 1.63, "learning_rate": 5.482938226504966e-05, "loss": 0.0211, "step": 253240 }, { "epoch": 1.63, "learning_rate": 5.481970091069273e-05, "loss": 0.0263, "step": 253250 }, { "epoch": 1.63, "learning_rate": 5.48100195563358e-05, "loss": 0.0246, "step": 253260 }, { "epoch": 1.63, "learning_rate": 5.4800338201978864e-05, "loss": 0.0257, "step": 253270 }, { "epoch": 1.63, "learning_rate": 5.479065684762193e-05, "loss": 0.0238, "step": 253280 }, { "epoch": 1.63, "learning_rate": 5.4780975493264996e-05, "loss": 0.0259, "step": 253290 }, { "epoch": 1.63, "learning_rate": 5.477129413890807e-05, "loss": 0.0283, "step": 253300 }, { "epoch": 1.63, "learning_rate": 5.4761612784551135e-05, "loss": 0.0229, "step": 253310 }, { "epoch": 1.63, "learning_rate": 5.475193143019421e-05, "loss": 0.0334, "step": 253320 }, { "epoch": 1.64, "learning_rate": 5.474225007583727e-05, "loss": 0.0274, "step": 253330 }, { "epoch": 1.64, "learning_rate": 5.4732568721480334e-05, "loss": 0.0244, "step": 253340 }, { "epoch": 1.64, "learning_rate": 5.472288736712341e-05, "loss": 0.0265, "step": 253350 }, { "epoch": 1.64, "learning_rate": 5.4713206012766473e-05, "loss": 0.0249, "step": 253360 }, { "epoch": 1.64, "learning_rate": 5.4703524658409546e-05, "loss": 0.0264, "step": 253370 }, { "epoch": 1.64, "learning_rate": 5.4693843304052606e-05, "loss": 0.0217, "step": 253380 }, { "epoch": 1.64, "learning_rate": 5.468416194969568e-05, "loss": 0.026, "step": 253390 }, { "epoch": 1.64, "learning_rate": 5.4674480595338745e-05, "loss": 0.0224, "step": 253400 }, { "epoch": 1.64, "learning_rate": 5.466479924098181e-05, "loss": 0.0242, "step": 253410 }, { "epoch": 1.64, "learning_rate": 5.4655117886624884e-05, "loss": 0.0252, "step": 253420 }, { "epoch": 1.64, "learning_rate": 5.4645436532267944e-05, "loss": 0.0237, "step": 253430 }, { "epoch": 1.64, "learning_rate": 5.463575517791102e-05, "loss": 0.0317, "step": 253440 }, { "epoch": 1.64, "learning_rate": 5.462607382355408e-05, "loss": 0.0287, "step": 253450 }, { "epoch": 1.64, "learning_rate": 5.4616392469197156e-05, "loss": 0.0237, "step": 253460 }, { "epoch": 1.64, "learning_rate": 5.460671111484022e-05, "loss": 0.0242, "step": 253470 }, { "epoch": 1.64, "learning_rate": 5.459702976048328e-05, "loss": 0.0202, "step": 253480 }, { "epoch": 1.64, "learning_rate": 5.4587348406126355e-05, "loss": 0.027, "step": 253490 }, { "epoch": 1.64, "learning_rate": 5.457766705176942e-05, "loss": 0.0237, "step": 253500 }, { "epoch": 1.64, "learning_rate": 5.4567985697412494e-05, "loss": 0.0231, "step": 253510 }, { "epoch": 1.64, "learning_rate": 5.455830434305556e-05, "loss": 0.0269, "step": 253520 }, { "epoch": 1.64, "learning_rate": 5.454862298869863e-05, "loss": 0.0269, "step": 253530 }, { "epoch": 1.64, "learning_rate": 5.453894163434169e-05, "loss": 0.0237, "step": 253540 }, { "epoch": 1.64, "learning_rate": 5.452926027998476e-05, "loss": 0.0261, "step": 253550 }, { "epoch": 1.64, "learning_rate": 5.451957892562783e-05, "loss": 0.0301, "step": 253560 }, { "epoch": 1.64, "learning_rate": 5.45098975712709e-05, "loss": 0.0238, "step": 253570 }, { "epoch": 1.64, "learning_rate": 5.450021621691397e-05, "loss": 0.0251, "step": 253580 }, { "epoch": 1.64, "learning_rate": 5.449053486255703e-05, "loss": 0.0247, "step": 253590 }, { "epoch": 1.64, "learning_rate": 5.4480853508200104e-05, "loss": 0.0231, "step": 253600 }, { "epoch": 1.64, "learning_rate": 5.447117215384317e-05, "loss": 0.029, "step": 253610 }, { "epoch": 1.64, "learning_rate": 5.4461490799486236e-05, "loss": 0.0263, "step": 253620 }, { "epoch": 1.64, "learning_rate": 5.445180944512931e-05, "loss": 0.025, "step": 253630 }, { "epoch": 1.64, "learning_rate": 5.444212809077237e-05, "loss": 0.0263, "step": 253640 }, { "epoch": 1.64, "learning_rate": 5.443244673641544e-05, "loss": 0.0232, "step": 253650 }, { "epoch": 1.64, "learning_rate": 5.442276538205851e-05, "loss": 0.0269, "step": 253660 }, { "epoch": 1.64, "learning_rate": 5.441308402770158e-05, "loss": 0.0225, "step": 253670 }, { "epoch": 1.64, "learning_rate": 5.440340267334465e-05, "loss": 0.0244, "step": 253680 }, { "epoch": 1.64, "learning_rate": 5.439372131898771e-05, "loss": 0.0224, "step": 253690 }, { "epoch": 1.64, "learning_rate": 5.438403996463078e-05, "loss": 0.0244, "step": 253700 }, { "epoch": 1.64, "learning_rate": 5.4374358610273846e-05, "loss": 0.0271, "step": 253710 }, { "epoch": 1.64, "learning_rate": 5.436467725591692e-05, "loss": 0.0331, "step": 253720 }, { "epoch": 1.64, "learning_rate": 5.4354995901559985e-05, "loss": 0.0212, "step": 253730 }, { "epoch": 1.64, "learning_rate": 5.434531454720306e-05, "loss": 0.0284, "step": 253740 }, { "epoch": 1.64, "learning_rate": 5.433563319284612e-05, "loss": 0.0246, "step": 253750 }, { "epoch": 1.64, "learning_rate": 5.4325951838489184e-05, "loss": 0.026, "step": 253760 }, { "epoch": 1.64, "learning_rate": 5.431627048413226e-05, "loss": 0.0235, "step": 253770 }, { "epoch": 1.64, "learning_rate": 5.430658912977532e-05, "loss": 0.023, "step": 253780 }, { "epoch": 1.64, "learning_rate": 5.4296907775418396e-05, "loss": 0.0242, "step": 253790 }, { "epoch": 1.64, "learning_rate": 5.4287226421061456e-05, "loss": 0.0225, "step": 253800 }, { "epoch": 1.64, "learning_rate": 5.427754506670453e-05, "loss": 0.0262, "step": 253810 }, { "epoch": 1.64, "learning_rate": 5.4267863712347595e-05, "loss": 0.0235, "step": 253820 }, { "epoch": 1.64, "learning_rate": 5.425818235799066e-05, "loss": 0.0251, "step": 253830 }, { "epoch": 1.64, "learning_rate": 5.4248501003633734e-05, "loss": 0.0278, "step": 253840 }, { "epoch": 1.64, "learning_rate": 5.4238819649276794e-05, "loss": 0.0229, "step": 253850 }, { "epoch": 1.64, "learning_rate": 5.422913829491987e-05, "loss": 0.0241, "step": 253860 }, { "epoch": 1.64, "learning_rate": 5.421945694056293e-05, "loss": 0.0286, "step": 253870 }, { "epoch": 1.64, "learning_rate": 5.4209775586206006e-05, "loss": 0.0257, "step": 253880 }, { "epoch": 1.64, "learning_rate": 5.420009423184907e-05, "loss": 0.0224, "step": 253890 }, { "epoch": 1.64, "learning_rate": 5.419041287749213e-05, "loss": 0.0241, "step": 253900 }, { "epoch": 1.64, "learning_rate": 5.4180731523135205e-05, "loss": 0.0294, "step": 253910 }, { "epoch": 1.64, "learning_rate": 5.417105016877827e-05, "loss": 0.0259, "step": 253920 }, { "epoch": 1.64, "learning_rate": 5.4161368814421344e-05, "loss": 0.0233, "step": 253930 }, { "epoch": 1.64, "learning_rate": 5.415168746006441e-05, "loss": 0.0252, "step": 253940 }, { "epoch": 1.64, "learning_rate": 5.414200610570747e-05, "loss": 0.0248, "step": 253950 }, { "epoch": 1.64, "learning_rate": 5.413232475135054e-05, "loss": 0.026, "step": 253960 }, { "epoch": 1.64, "learning_rate": 5.412264339699361e-05, "loss": 0.0242, "step": 253970 }, { "epoch": 1.64, "learning_rate": 5.411296204263668e-05, "loss": 0.027, "step": 253980 }, { "epoch": 1.64, "learning_rate": 5.410328068827975e-05, "loss": 0.0233, "step": 253990 }, { "epoch": 1.64, "learning_rate": 5.409359933392282e-05, "loss": 0.0234, "step": 254000 }, { "epoch": 1.64, "eval_cer": 0.9198201333182692, "eval_loss": 0.01838851161301136, "eval_runtime": 120.0869, "eval_samples_per_second": 16.655, "eval_steps_per_second": 4.164, "step": 254000 }, { "epoch": 1.64, "learning_rate": 5.408391797956588e-05, "loss": 0.0227, "step": 254010 }, { "epoch": 1.64, "learning_rate": 5.407423662520895e-05, "loss": 0.0244, "step": 254020 }, { "epoch": 1.64, "learning_rate": 5.406455527085202e-05, "loss": 0.0237, "step": 254030 }, { "epoch": 1.64, "learning_rate": 5.4054873916495086e-05, "loss": 0.0224, "step": 254040 }, { "epoch": 1.64, "learning_rate": 5.404519256213816e-05, "loss": 0.0221, "step": 254050 }, { "epoch": 1.64, "learning_rate": 5.403551120778122e-05, "loss": 0.0259, "step": 254060 }, { "epoch": 1.64, "learning_rate": 5.402582985342429e-05, "loss": 0.0229, "step": 254070 }, { "epoch": 1.64, "learning_rate": 5.401614849906736e-05, "loss": 0.0246, "step": 254080 }, { "epoch": 1.64, "learning_rate": 5.4006467144710424e-05, "loss": 0.024, "step": 254090 }, { "epoch": 1.64, "learning_rate": 5.39967857903535e-05, "loss": 0.0302, "step": 254100 }, { "epoch": 1.64, "learning_rate": 5.3987104435996557e-05, "loss": 0.0237, "step": 254110 }, { "epoch": 1.64, "learning_rate": 5.397742308163963e-05, "loss": 0.0236, "step": 254120 }, { "epoch": 1.64, "learning_rate": 5.3967741727282696e-05, "loss": 0.0219, "step": 254130 }, { "epoch": 1.64, "learning_rate": 5.395806037292577e-05, "loss": 0.0232, "step": 254140 }, { "epoch": 1.64, "learning_rate": 5.3948379018568835e-05, "loss": 0.0292, "step": 254150 }, { "epoch": 1.64, "learning_rate": 5.3938697664211895e-05, "loss": 0.0238, "step": 254160 }, { "epoch": 1.64, "learning_rate": 5.392901630985497e-05, "loss": 0.0253, "step": 254170 }, { "epoch": 1.64, "learning_rate": 5.3919334955498034e-05, "loss": 0.0259, "step": 254180 }, { "epoch": 1.64, "learning_rate": 5.390965360114111e-05, "loss": 0.0247, "step": 254190 }, { "epoch": 1.64, "learning_rate": 5.389997224678417e-05, "loss": 0.0235, "step": 254200 }, { "epoch": 1.64, "learning_rate": 5.3890290892427246e-05, "loss": 0.0269, "step": 254210 }, { "epoch": 1.64, "learning_rate": 5.3880609538070306e-05, "loss": 0.0279, "step": 254220 }, { "epoch": 1.64, "learning_rate": 5.387092818371337e-05, "loss": 0.03, "step": 254230 }, { "epoch": 1.64, "learning_rate": 5.3861246829356445e-05, "loss": 0.0279, "step": 254240 }, { "epoch": 1.64, "learning_rate": 5.385156547499951e-05, "loss": 0.0247, "step": 254250 }, { "epoch": 1.64, "learning_rate": 5.3841884120642584e-05, "loss": 0.0236, "step": 254260 }, { "epoch": 1.64, "learning_rate": 5.3832202766285644e-05, "loss": 0.0248, "step": 254270 }, { "epoch": 1.64, "learning_rate": 5.3822521411928717e-05, "loss": 0.0212, "step": 254280 }, { "epoch": 1.64, "learning_rate": 5.381284005757178e-05, "loss": 0.0295, "step": 254290 }, { "epoch": 1.64, "learning_rate": 5.380315870321485e-05, "loss": 0.026, "step": 254300 }, { "epoch": 1.64, "learning_rate": 5.379347734885792e-05, "loss": 0.0244, "step": 254310 }, { "epoch": 1.64, "learning_rate": 5.378379599450098e-05, "loss": 0.0253, "step": 254320 }, { "epoch": 1.64, "learning_rate": 5.3774114640144054e-05, "loss": 0.026, "step": 254330 }, { "epoch": 1.64, "learning_rate": 5.376443328578712e-05, "loss": 0.0227, "step": 254340 }, { "epoch": 1.64, "learning_rate": 5.3754751931430194e-05, "loss": 0.0215, "step": 254350 }, { "epoch": 1.64, "learning_rate": 5.374507057707326e-05, "loss": 0.0266, "step": 254360 }, { "epoch": 1.64, "learning_rate": 5.373538922271632e-05, "loss": 0.0266, "step": 254370 }, { "epoch": 1.64, "learning_rate": 5.372570786835939e-05, "loss": 0.0225, "step": 254380 }, { "epoch": 1.64, "learning_rate": 5.371602651400246e-05, "loss": 0.0206, "step": 254390 }, { "epoch": 1.64, "learning_rate": 5.370634515964553e-05, "loss": 0.025, "step": 254400 }, { "epoch": 1.64, "learning_rate": 5.36966638052886e-05, "loss": 0.0263, "step": 254410 }, { "epoch": 1.64, "learning_rate": 5.368698245093167e-05, "loss": 0.0275, "step": 254420 }, { "epoch": 1.64, "learning_rate": 5.367730109657473e-05, "loss": 0.0293, "step": 254430 }, { "epoch": 1.64, "learning_rate": 5.36676197422178e-05, "loss": 0.0231, "step": 254440 }, { "epoch": 1.64, "learning_rate": 5.365793838786087e-05, "loss": 0.0314, "step": 254450 }, { "epoch": 1.64, "learning_rate": 5.3648257033503936e-05, "loss": 0.0325, "step": 254460 }, { "epoch": 1.64, "learning_rate": 5.363857567914701e-05, "loss": 0.0306, "step": 254470 }, { "epoch": 1.64, "learning_rate": 5.362889432479007e-05, "loss": 0.0256, "step": 254480 }, { "epoch": 1.64, "learning_rate": 5.361921297043314e-05, "loss": 0.0277, "step": 254490 }, { "epoch": 1.64, "learning_rate": 5.360953161607621e-05, "loss": 0.025, "step": 254500 }, { "epoch": 1.64, "learning_rate": 5.3599850261719274e-05, "loss": 0.0248, "step": 254510 }, { "epoch": 1.64, "learning_rate": 5.359016890736235e-05, "loss": 0.0259, "step": 254520 }, { "epoch": 1.64, "learning_rate": 5.3580487553005406e-05, "loss": 0.0265, "step": 254530 }, { "epoch": 1.64, "learning_rate": 5.357080619864848e-05, "loss": 0.0194, "step": 254540 }, { "epoch": 1.64, "learning_rate": 5.3561124844291546e-05, "loss": 0.0249, "step": 254550 }, { "epoch": 1.64, "learning_rate": 5.355144348993462e-05, "loss": 0.0244, "step": 254560 }, { "epoch": 1.64, "learning_rate": 5.3541762135577685e-05, "loss": 0.0259, "step": 254570 }, { "epoch": 1.64, "learning_rate": 5.3532080781220744e-05, "loss": 0.0266, "step": 254580 }, { "epoch": 1.64, "learning_rate": 5.352239942686382e-05, "loss": 0.032, "step": 254590 }, { "epoch": 1.64, "learning_rate": 5.3512718072506884e-05, "loss": 0.0216, "step": 254600 }, { "epoch": 1.64, "learning_rate": 5.350303671814996e-05, "loss": 0.0248, "step": 254610 }, { "epoch": 1.64, "learning_rate": 5.349335536379302e-05, "loss": 0.0246, "step": 254620 }, { "epoch": 1.64, "learning_rate": 5.348367400943609e-05, "loss": 0.0252, "step": 254630 }, { "epoch": 1.64, "learning_rate": 5.3473992655079155e-05, "loss": 0.0247, "step": 254640 }, { "epoch": 1.64, "learning_rate": 5.346431130072222e-05, "loss": 0.0242, "step": 254650 }, { "epoch": 1.64, "learning_rate": 5.3454629946365295e-05, "loss": 0.0317, "step": 254660 }, { "epoch": 1.64, "learning_rate": 5.344494859200836e-05, "loss": 0.0231, "step": 254670 }, { "epoch": 1.64, "learning_rate": 5.343526723765143e-05, "loss": 0.0221, "step": 254680 }, { "epoch": 1.64, "learning_rate": 5.342558588329449e-05, "loss": 0.0258, "step": 254690 }, { "epoch": 1.64, "learning_rate": 5.3415904528937566e-05, "loss": 0.0268, "step": 254700 }, { "epoch": 1.64, "learning_rate": 5.340622317458063e-05, "loss": 0.0252, "step": 254710 }, { "epoch": 1.64, "learning_rate": 5.33965418202237e-05, "loss": 0.0228, "step": 254720 }, { "epoch": 1.64, "learning_rate": 5.3386860465866765e-05, "loss": 0.0235, "step": 254730 }, { "epoch": 1.64, "learning_rate": 5.337717911150983e-05, "loss": 0.0282, "step": 254740 }, { "epoch": 1.64, "learning_rate": 5.3367497757152904e-05, "loss": 0.0274, "step": 254750 }, { "epoch": 1.64, "learning_rate": 5.335781640279597e-05, "loss": 0.0251, "step": 254760 }, { "epoch": 1.64, "learning_rate": 5.3348135048439044e-05, "loss": 0.0264, "step": 254770 }, { "epoch": 1.64, "learning_rate": 5.33384536940821e-05, "loss": 0.0232, "step": 254780 }, { "epoch": 1.64, "learning_rate": 5.332877233972517e-05, "loss": 0.025, "step": 254790 }, { "epoch": 1.64, "learning_rate": 5.331909098536824e-05, "loss": 0.0317, "step": 254800 }, { "epoch": 1.64, "learning_rate": 5.330940963101131e-05, "loss": 0.0257, "step": 254810 }, { "epoch": 1.64, "learning_rate": 5.329972827665438e-05, "loss": 0.0372, "step": 254820 }, { "epoch": 1.64, "learning_rate": 5.329004692229744e-05, "loss": 0.0227, "step": 254830 }, { "epoch": 1.64, "learning_rate": 5.3280365567940514e-05, "loss": 0.0203, "step": 254840 }, { "epoch": 1.64, "learning_rate": 5.327068421358358e-05, "loss": 0.0259, "step": 254850 }, { "epoch": 1.64, "learning_rate": 5.3261002859226646e-05, "loss": 0.028, "step": 254860 }, { "epoch": 1.64, "learning_rate": 5.325132150486972e-05, "loss": 0.0316, "step": 254870 }, { "epoch": 1.65, "learning_rate": 5.324164015051278e-05, "loss": 0.0266, "step": 254880 }, { "epoch": 1.65, "learning_rate": 5.323195879615585e-05, "loss": 0.0227, "step": 254890 }, { "epoch": 1.65, "learning_rate": 5.322227744179892e-05, "loss": 0.0244, "step": 254900 }, { "epoch": 1.65, "learning_rate": 5.321259608744199e-05, "loss": 0.0243, "step": 254910 }, { "epoch": 1.65, "learning_rate": 5.320291473308506e-05, "loss": 0.0303, "step": 254920 }, { "epoch": 1.65, "learning_rate": 5.319323337872812e-05, "loss": 0.0243, "step": 254930 }, { "epoch": 1.65, "learning_rate": 5.318355202437119e-05, "loss": 0.0246, "step": 254940 }, { "epoch": 1.65, "learning_rate": 5.3173870670014256e-05, "loss": 0.0264, "step": 254950 }, { "epoch": 1.65, "learning_rate": 5.316418931565733e-05, "loss": 0.0242, "step": 254960 }, { "epoch": 1.65, "learning_rate": 5.3154507961300395e-05, "loss": 0.025, "step": 254970 }, { "epoch": 1.65, "learning_rate": 5.314482660694347e-05, "loss": 0.0258, "step": 254980 }, { "epoch": 1.65, "learning_rate": 5.313514525258653e-05, "loss": 0.0302, "step": 254990 }, { "epoch": 1.65, "learning_rate": 5.3125463898229594e-05, "loss": 0.0246, "step": 255000 }, { "epoch": 1.65, "eval_cer": 0.9198255564343012, "eval_loss": 0.018629562109708786, "eval_runtime": 120.0069, "eval_samples_per_second": 16.666, "eval_steps_per_second": 4.166, "step": 255000 }, { "epoch": 1.65, "learning_rate": 5.311578254387267e-05, "loss": 0.0264, "step": 255010 }, { "epoch": 1.65, "learning_rate": 5.3106101189515733e-05, "loss": 0.0253, "step": 255020 }, { "epoch": 1.65, "learning_rate": 5.3096419835158806e-05, "loss": 0.0293, "step": 255030 }, { "epoch": 1.65, "learning_rate": 5.3086738480801866e-05, "loss": 0.0254, "step": 255040 }, { "epoch": 1.65, "learning_rate": 5.307705712644494e-05, "loss": 0.0287, "step": 255050 }, { "epoch": 1.65, "learning_rate": 5.3067375772088005e-05, "loss": 0.0244, "step": 255060 }, { "epoch": 1.65, "learning_rate": 5.305769441773107e-05, "loss": 0.0248, "step": 255070 }, { "epoch": 1.65, "learning_rate": 5.3048013063374144e-05, "loss": 0.0252, "step": 255080 }, { "epoch": 1.65, "learning_rate": 5.3038331709017204e-05, "loss": 0.0268, "step": 255090 }, { "epoch": 1.65, "learning_rate": 5.302865035466028e-05, "loss": 0.0259, "step": 255100 }, { "epoch": 1.65, "learning_rate": 5.301896900030334e-05, "loss": 0.0274, "step": 255110 }, { "epoch": 1.65, "learning_rate": 5.3009287645946416e-05, "loss": 0.0252, "step": 255120 }, { "epoch": 1.65, "learning_rate": 5.299960629158948e-05, "loss": 0.0216, "step": 255130 }, { "epoch": 1.65, "learning_rate": 5.298992493723254e-05, "loss": 0.0259, "step": 255140 }, { "epoch": 1.65, "learning_rate": 5.2980243582875615e-05, "loss": 0.0232, "step": 255150 }, { "epoch": 1.65, "learning_rate": 5.297056222851868e-05, "loss": 0.0235, "step": 255160 }, { "epoch": 1.65, "learning_rate": 5.2960880874161754e-05, "loss": 0.0254, "step": 255170 }, { "epoch": 1.65, "learning_rate": 5.295119951980482e-05, "loss": 0.0244, "step": 255180 }, { "epoch": 1.65, "learning_rate": 5.294151816544789e-05, "loss": 0.0257, "step": 255190 }, { "epoch": 1.65, "learning_rate": 5.293183681109095e-05, "loss": 0.0261, "step": 255200 }, { "epoch": 1.65, "learning_rate": 5.292215545673402e-05, "loss": 0.0312, "step": 255210 }, { "epoch": 1.65, "learning_rate": 5.291247410237709e-05, "loss": 0.0251, "step": 255220 }, { "epoch": 1.65, "learning_rate": 5.290279274802016e-05, "loss": 0.0275, "step": 255230 }, { "epoch": 1.65, "learning_rate": 5.289311139366323e-05, "loss": 0.0238, "step": 255240 }, { "epoch": 1.65, "learning_rate": 5.288343003930629e-05, "loss": 0.024, "step": 255250 }, { "epoch": 1.65, "learning_rate": 5.2873748684949364e-05, "loss": 0.0272, "step": 255260 }, { "epoch": 1.65, "learning_rate": 5.286406733059243e-05, "loss": 0.0282, "step": 255270 }, { "epoch": 1.65, "learning_rate": 5.2854385976235496e-05, "loss": 0.0259, "step": 255280 }, { "epoch": 1.65, "learning_rate": 5.284470462187857e-05, "loss": 0.0293, "step": 255290 }, { "epoch": 1.65, "learning_rate": 5.283502326752163e-05, "loss": 0.0252, "step": 255300 }, { "epoch": 1.65, "learning_rate": 5.28253419131647e-05, "loss": 0.0227, "step": 255310 }, { "epoch": 1.65, "learning_rate": 5.281566055880777e-05, "loss": 0.0306, "step": 255320 }, { "epoch": 1.65, "learning_rate": 5.280597920445084e-05, "loss": 0.0253, "step": 255330 }, { "epoch": 1.65, "learning_rate": 5.279629785009391e-05, "loss": 0.0273, "step": 255340 }, { "epoch": 1.65, "learning_rate": 5.278661649573697e-05, "loss": 0.0287, "step": 255350 }, { "epoch": 1.65, "learning_rate": 5.277693514138004e-05, "loss": 0.0235, "step": 255360 }, { "epoch": 1.65, "learning_rate": 5.2767253787023106e-05, "loss": 0.022, "step": 255370 }, { "epoch": 1.65, "learning_rate": 5.275757243266618e-05, "loss": 0.0245, "step": 255380 }, { "epoch": 1.65, "learning_rate": 5.2747891078309245e-05, "loss": 0.0211, "step": 255390 }, { "epoch": 1.65, "learning_rate": 5.273820972395232e-05, "loss": 0.0237, "step": 255400 }, { "epoch": 1.65, "learning_rate": 5.272852836959538e-05, "loss": 0.0276, "step": 255410 }, { "epoch": 1.65, "learning_rate": 5.2718847015238444e-05, "loss": 0.0211, "step": 255420 }, { "epoch": 1.65, "learning_rate": 5.270916566088152e-05, "loss": 0.022, "step": 255430 }, { "epoch": 1.65, "learning_rate": 5.269948430652458e-05, "loss": 0.028, "step": 255440 }, { "epoch": 1.65, "learning_rate": 5.2689802952167656e-05, "loss": 0.0282, "step": 255450 }, { "epoch": 1.65, "learning_rate": 5.2680121597810716e-05, "loss": 0.028, "step": 255460 }, { "epoch": 1.65, "learning_rate": 5.267044024345379e-05, "loss": 0.0224, "step": 255470 }, { "epoch": 1.65, "learning_rate": 5.2660758889096855e-05, "loss": 0.0225, "step": 255480 }, { "epoch": 1.65, "learning_rate": 5.265107753473992e-05, "loss": 0.0235, "step": 255490 }, { "epoch": 1.65, "learning_rate": 5.2641396180382994e-05, "loss": 0.0247, "step": 255500 }, { "epoch": 1.65, "learning_rate": 5.2631714826026054e-05, "loss": 0.0225, "step": 255510 }, { "epoch": 1.65, "learning_rate": 5.262203347166913e-05, "loss": 0.0326, "step": 255520 }, { "epoch": 1.65, "learning_rate": 5.261235211731219e-05, "loss": 0.0274, "step": 255530 }, { "epoch": 1.65, "learning_rate": 5.2602670762955266e-05, "loss": 0.0286, "step": 255540 }, { "epoch": 1.65, "learning_rate": 5.259298940859833e-05, "loss": 0.0216, "step": 255550 }, { "epoch": 1.65, "learning_rate": 5.258330805424139e-05, "loss": 0.0238, "step": 255560 }, { "epoch": 1.65, "learning_rate": 5.2573626699884465e-05, "loss": 0.0204, "step": 255570 }, { "epoch": 1.65, "learning_rate": 5.256394534552753e-05, "loss": 0.0242, "step": 255580 }, { "epoch": 1.65, "learning_rate": 5.2554263991170604e-05, "loss": 0.0272, "step": 255590 }, { "epoch": 1.65, "learning_rate": 5.254458263681367e-05, "loss": 0.024, "step": 255600 }, { "epoch": 1.65, "learning_rate": 5.253490128245674e-05, "loss": 0.0243, "step": 255610 }, { "epoch": 1.65, "learning_rate": 5.25252199280998e-05, "loss": 0.023, "step": 255620 }, { "epoch": 1.65, "learning_rate": 5.251553857374287e-05, "loss": 0.022, "step": 255630 }, { "epoch": 1.65, "learning_rate": 5.250585721938594e-05, "loss": 0.0249, "step": 255640 }, { "epoch": 1.65, "learning_rate": 5.249617586502901e-05, "loss": 0.0247, "step": 255650 }, { "epoch": 1.65, "learning_rate": 5.248649451067208e-05, "loss": 0.0223, "step": 255660 }, { "epoch": 1.65, "learning_rate": 5.247681315631514e-05, "loss": 0.0293, "step": 255670 }, { "epoch": 1.65, "learning_rate": 5.246713180195821e-05, "loss": 0.0271, "step": 255680 }, { "epoch": 1.65, "learning_rate": 5.245745044760128e-05, "loss": 0.0226, "step": 255690 }, { "epoch": 1.65, "learning_rate": 5.2447769093244346e-05, "loss": 0.0237, "step": 255700 }, { "epoch": 1.65, "learning_rate": 5.243808773888742e-05, "loss": 0.0227, "step": 255710 }, { "epoch": 1.65, "learning_rate": 5.242840638453048e-05, "loss": 0.0245, "step": 255720 }, { "epoch": 1.65, "learning_rate": 5.241872503017355e-05, "loss": 0.0268, "step": 255730 }, { "epoch": 1.65, "learning_rate": 5.240904367581662e-05, "loss": 0.0264, "step": 255740 }, { "epoch": 1.65, "learning_rate": 5.2399362321459684e-05, "loss": 0.0217, "step": 255750 }, { "epoch": 1.65, "learning_rate": 5.238968096710276e-05, "loss": 0.0281, "step": 255760 }, { "epoch": 1.65, "learning_rate": 5.2379999612745817e-05, "loss": 0.0232, "step": 255770 }, { "epoch": 1.65, "learning_rate": 5.237031825838889e-05, "loss": 0.0208, "step": 255780 }, { "epoch": 1.65, "learning_rate": 5.2360636904031956e-05, "loss": 0.0299, "step": 255790 }, { "epoch": 1.65, "learning_rate": 5.235095554967503e-05, "loss": 0.0237, "step": 255800 }, { "epoch": 1.65, "learning_rate": 5.2341274195318095e-05, "loss": 0.0243, "step": 255810 }, { "epoch": 1.65, "learning_rate": 5.2331592840961155e-05, "loss": 0.0248, "step": 255820 }, { "epoch": 1.65, "learning_rate": 5.232191148660423e-05, "loss": 0.0226, "step": 255830 }, { "epoch": 1.65, "learning_rate": 5.2312230132247294e-05, "loss": 0.0232, "step": 255840 }, { "epoch": 1.65, "learning_rate": 5.230254877789037e-05, "loss": 0.026, "step": 255850 }, { "epoch": 1.65, "learning_rate": 5.229286742353343e-05, "loss": 0.0209, "step": 255860 }, { "epoch": 1.65, "learning_rate": 5.22831860691765e-05, "loss": 0.0185, "step": 255870 }, { "epoch": 1.65, "learning_rate": 5.2273504714819566e-05, "loss": 0.0249, "step": 255880 }, { "epoch": 1.65, "learning_rate": 5.226382336046263e-05, "loss": 0.0215, "step": 255890 }, { "epoch": 1.65, "learning_rate": 5.2254142006105705e-05, "loss": 0.0246, "step": 255900 }, { "epoch": 1.65, "learning_rate": 5.224446065174877e-05, "loss": 0.0265, "step": 255910 }, { "epoch": 1.65, "learning_rate": 5.223477929739184e-05, "loss": 0.0228, "step": 255920 }, { "epoch": 1.65, "learning_rate": 5.2225097943034903e-05, "loss": 0.0235, "step": 255930 }, { "epoch": 1.65, "learning_rate": 5.2215416588677976e-05, "loss": 0.0233, "step": 255940 }, { "epoch": 1.65, "learning_rate": 5.220573523432104e-05, "loss": 0.025, "step": 255950 }, { "epoch": 1.65, "learning_rate": 5.219605387996411e-05, "loss": 0.0236, "step": 255960 }, { "epoch": 1.65, "learning_rate": 5.2186372525607175e-05, "loss": 0.0238, "step": 255970 }, { "epoch": 1.65, "learning_rate": 5.217669117125024e-05, "loss": 0.0246, "step": 255980 }, { "epoch": 1.65, "learning_rate": 5.2167009816893314e-05, "loss": 0.023, "step": 255990 }, { "epoch": 1.65, "learning_rate": 5.215732846253638e-05, "loss": 0.0213, "step": 256000 }, { "epoch": 1.65, "eval_cer": 0.9198852107106542, "eval_loss": 0.018240749835968018, "eval_runtime": 120.0265, "eval_samples_per_second": 16.663, "eval_steps_per_second": 4.166, "step": 256000 }, { "epoch": 1.65, "learning_rate": 5.2147647108179454e-05, "loss": 0.0221, "step": 256010 }, { "epoch": 1.65, "learning_rate": 5.213796575382251e-05, "loss": 0.0277, "step": 256020 }, { "epoch": 1.65, "learning_rate": 5.212828439946558e-05, "loss": 0.0244, "step": 256030 }, { "epoch": 1.65, "learning_rate": 5.211860304510865e-05, "loss": 0.0221, "step": 256040 }, { "epoch": 1.65, "learning_rate": 5.210892169075172e-05, "loss": 0.0308, "step": 256050 }, { "epoch": 1.65, "learning_rate": 5.209924033639479e-05, "loss": 0.0227, "step": 256060 }, { "epoch": 1.65, "learning_rate": 5.208955898203785e-05, "loss": 0.0282, "step": 256070 }, { "epoch": 1.65, "learning_rate": 5.2079877627680924e-05, "loss": 0.0243, "step": 256080 }, { "epoch": 1.65, "learning_rate": 5.207019627332399e-05, "loss": 0.0243, "step": 256090 }, { "epoch": 1.65, "learning_rate": 5.206051491896706e-05, "loss": 0.0246, "step": 256100 }, { "epoch": 1.65, "learning_rate": 5.205083356461013e-05, "loss": 0.0224, "step": 256110 }, { "epoch": 1.65, "learning_rate": 5.204115221025319e-05, "loss": 0.0233, "step": 256120 }, { "epoch": 1.65, "learning_rate": 5.203147085589626e-05, "loss": 0.0204, "step": 256130 }, { "epoch": 1.65, "learning_rate": 5.202178950153933e-05, "loss": 0.0253, "step": 256140 }, { "epoch": 1.65, "learning_rate": 5.20121081471824e-05, "loss": 0.0201, "step": 256150 }, { "epoch": 1.65, "learning_rate": 5.200242679282547e-05, "loss": 0.0241, "step": 256160 }, { "epoch": 1.65, "learning_rate": 5.199274543846853e-05, "loss": 0.028, "step": 256170 }, { "epoch": 1.65, "learning_rate": 5.19830640841116e-05, "loss": 0.0233, "step": 256180 }, { "epoch": 1.65, "learning_rate": 5.1973382729754666e-05, "loss": 0.029, "step": 256190 }, { "epoch": 1.65, "learning_rate": 5.196370137539774e-05, "loss": 0.031, "step": 256200 }, { "epoch": 1.65, "learning_rate": 5.1954020021040806e-05, "loss": 0.0274, "step": 256210 }, { "epoch": 1.65, "learning_rate": 5.194433866668388e-05, "loss": 0.0261, "step": 256220 }, { "epoch": 1.65, "learning_rate": 5.193465731232694e-05, "loss": 0.0257, "step": 256230 }, { "epoch": 1.65, "learning_rate": 5.1924975957970004e-05, "loss": 0.0277, "step": 256240 }, { "epoch": 1.65, "learning_rate": 5.191529460361308e-05, "loss": 0.0307, "step": 256250 }, { "epoch": 1.65, "learning_rate": 5.1905613249256144e-05, "loss": 0.0229, "step": 256260 }, { "epoch": 1.65, "learning_rate": 5.1895931894899217e-05, "loss": 0.0226, "step": 256270 }, { "epoch": 1.65, "learning_rate": 5.1886250540542276e-05, "loss": 0.0218, "step": 256280 }, { "epoch": 1.65, "learning_rate": 5.187656918618535e-05, "loss": 0.0256, "step": 256290 }, { "epoch": 1.65, "learning_rate": 5.1866887831828415e-05, "loss": 0.024, "step": 256300 }, { "epoch": 1.65, "learning_rate": 5.185720647747148e-05, "loss": 0.0236, "step": 256310 }, { "epoch": 1.65, "learning_rate": 5.1847525123114555e-05, "loss": 0.0238, "step": 256320 }, { "epoch": 1.65, "learning_rate": 5.1837843768757614e-05, "loss": 0.0225, "step": 256330 }, { "epoch": 1.65, "learning_rate": 5.182816241440069e-05, "loss": 0.0232, "step": 256340 }, { "epoch": 1.65, "learning_rate": 5.181848106004375e-05, "loss": 0.0231, "step": 256350 }, { "epoch": 1.65, "learning_rate": 5.1808799705686826e-05, "loss": 0.0253, "step": 256360 }, { "epoch": 1.65, "learning_rate": 5.179911835132989e-05, "loss": 0.0269, "step": 256370 }, { "epoch": 1.65, "learning_rate": 5.178943699697295e-05, "loss": 0.0256, "step": 256380 }, { "epoch": 1.65, "learning_rate": 5.1779755642616025e-05, "loss": 0.0227, "step": 256390 }, { "epoch": 1.65, "learning_rate": 5.177007428825909e-05, "loss": 0.0213, "step": 256400 }, { "epoch": 1.65, "learning_rate": 5.1760392933902164e-05, "loss": 0.0261, "step": 256410 }, { "epoch": 1.65, "learning_rate": 5.175071157954523e-05, "loss": 0.0254, "step": 256420 }, { "epoch": 1.66, "learning_rate": 5.1741030225188304e-05, "loss": 0.0246, "step": 256430 }, { "epoch": 1.66, "learning_rate": 5.173134887083136e-05, "loss": 0.0212, "step": 256440 }, { "epoch": 1.66, "learning_rate": 5.172166751647443e-05, "loss": 0.0241, "step": 256450 }, { "epoch": 1.66, "learning_rate": 5.17119861621175e-05, "loss": 0.0231, "step": 256460 }, { "epoch": 1.66, "learning_rate": 5.170230480776057e-05, "loss": 0.0272, "step": 256470 }, { "epoch": 1.66, "learning_rate": 5.169262345340364e-05, "loss": 0.0256, "step": 256480 }, { "epoch": 1.66, "learning_rate": 5.16829420990467e-05, "loss": 0.0263, "step": 256490 }, { "epoch": 1.66, "learning_rate": 5.1673260744689774e-05, "loss": 0.0216, "step": 256500 }, { "epoch": 1.66, "learning_rate": 5.166357939033284e-05, "loss": 0.0302, "step": 256510 }, { "epoch": 1.66, "learning_rate": 5.1653898035975906e-05, "loss": 0.0285, "step": 256520 }, { "epoch": 1.66, "learning_rate": 5.164421668161898e-05, "loss": 0.0324, "step": 256530 }, { "epoch": 1.66, "learning_rate": 5.163453532726204e-05, "loss": 0.0252, "step": 256540 }, { "epoch": 1.66, "learning_rate": 5.162485397290511e-05, "loss": 0.0209, "step": 256550 }, { "epoch": 1.66, "learning_rate": 5.161517261854818e-05, "loss": 0.0251, "step": 256560 }, { "epoch": 1.66, "learning_rate": 5.160549126419125e-05, "loss": 0.0247, "step": 256570 }, { "epoch": 1.66, "learning_rate": 5.159580990983432e-05, "loss": 0.0272, "step": 256580 }, { "epoch": 1.66, "learning_rate": 5.158612855547738e-05, "loss": 0.0256, "step": 256590 }, { "epoch": 1.66, "learning_rate": 5.157644720112045e-05, "loss": 0.0202, "step": 256600 }, { "epoch": 1.66, "learning_rate": 5.1566765846763516e-05, "loss": 0.031, "step": 256610 }, { "epoch": 1.66, "learning_rate": 5.155708449240659e-05, "loss": 0.0253, "step": 256620 }, { "epoch": 1.66, "learning_rate": 5.1547403138049655e-05, "loss": 0.026, "step": 256630 }, { "epoch": 1.66, "learning_rate": 5.153772178369273e-05, "loss": 0.026, "step": 256640 }, { "epoch": 1.66, "learning_rate": 5.152804042933579e-05, "loss": 0.023, "step": 256650 }, { "epoch": 1.66, "learning_rate": 5.1518359074978854e-05, "loss": 0.0238, "step": 256660 }, { "epoch": 1.66, "learning_rate": 5.150867772062193e-05, "loss": 0.0229, "step": 256670 }, { "epoch": 1.66, "learning_rate": 5.149899636626499e-05, "loss": 0.025, "step": 256680 }, { "epoch": 1.66, "learning_rate": 5.1489315011908066e-05, "loss": 0.0276, "step": 256690 }, { "epoch": 1.66, "learning_rate": 5.1479633657551126e-05, "loss": 0.0275, "step": 256700 }, { "epoch": 1.66, "learning_rate": 5.14699523031942e-05, "loss": 0.0288, "step": 256710 }, { "epoch": 1.66, "learning_rate": 5.1460270948837265e-05, "loss": 0.0208, "step": 256720 }, { "epoch": 1.66, "learning_rate": 5.145058959448033e-05, "loss": 0.0225, "step": 256730 }, { "epoch": 1.66, "learning_rate": 5.1440908240123404e-05, "loss": 0.0244, "step": 256740 }, { "epoch": 1.66, "learning_rate": 5.1431226885766464e-05, "loss": 0.0228, "step": 256750 }, { "epoch": 1.66, "learning_rate": 5.142154553140954e-05, "loss": 0.0252, "step": 256760 }, { "epoch": 1.66, "learning_rate": 5.14118641770526e-05, "loss": 0.0229, "step": 256770 }, { "epoch": 1.66, "learning_rate": 5.1402182822695676e-05, "loss": 0.0254, "step": 256780 }, { "epoch": 1.66, "learning_rate": 5.139250146833874e-05, "loss": 0.0196, "step": 256790 }, { "epoch": 1.66, "learning_rate": 5.13828201139818e-05, "loss": 0.0284, "step": 256800 }, { "epoch": 1.66, "learning_rate": 5.1373138759624875e-05, "loss": 0.0244, "step": 256810 }, { "epoch": 1.66, "learning_rate": 5.136345740526794e-05, "loss": 0.0243, "step": 256820 }, { "epoch": 1.66, "learning_rate": 5.1353776050911014e-05, "loss": 0.0291, "step": 256830 }, { "epoch": 1.66, "learning_rate": 5.134409469655408e-05, "loss": 0.0254, "step": 256840 }, { "epoch": 1.66, "learning_rate": 5.133441334219715e-05, "loss": 0.0201, "step": 256850 }, { "epoch": 1.66, "learning_rate": 5.132473198784021e-05, "loss": 0.0275, "step": 256860 }, { "epoch": 1.66, "learning_rate": 5.131505063348328e-05, "loss": 0.0202, "step": 256870 }, { "epoch": 1.66, "learning_rate": 5.130536927912635e-05, "loss": 0.02, "step": 256880 }, { "epoch": 1.66, "learning_rate": 5.129568792476942e-05, "loss": 0.0234, "step": 256890 }, { "epoch": 1.66, "learning_rate": 5.128600657041249e-05, "loss": 0.0211, "step": 256900 }, { "epoch": 1.66, "learning_rate": 5.127632521605555e-05, "loss": 0.0208, "step": 256910 }, { "epoch": 1.66, "learning_rate": 5.1266643861698624e-05, "loss": 0.0257, "step": 256920 }, { "epoch": 1.66, "learning_rate": 5.125696250734169e-05, "loss": 0.0256, "step": 256930 }, { "epoch": 1.66, "learning_rate": 5.1247281152984756e-05, "loss": 0.0203, "step": 256940 }, { "epoch": 1.66, "learning_rate": 5.123759979862783e-05, "loss": 0.03, "step": 256950 }, { "epoch": 1.66, "learning_rate": 5.122791844427089e-05, "loss": 0.0251, "step": 256960 }, { "epoch": 1.66, "learning_rate": 5.121823708991396e-05, "loss": 0.0238, "step": 256970 }, { "epoch": 1.66, "learning_rate": 5.120855573555703e-05, "loss": 0.024, "step": 256980 }, { "epoch": 1.66, "learning_rate": 5.11988743812001e-05, "loss": 0.0221, "step": 256990 }, { "epoch": 1.66, "learning_rate": 5.118919302684317e-05, "loss": 0.0251, "step": 257000 }, { "epoch": 1.66, "eval_cer": 0.9198481527511015, "eval_loss": 0.018239615485072136, "eval_runtime": 120.1756, "eval_samples_per_second": 16.642, "eval_steps_per_second": 4.161, "step": 257000 }, { "epoch": 1.66, "learning_rate": 5.117951167248623e-05, "loss": 0.0253, "step": 257010 }, { "epoch": 1.66, "learning_rate": 5.11698303181293e-05, "loss": 0.0239, "step": 257020 }, { "epoch": 1.66, "learning_rate": 5.1160148963772366e-05, "loss": 0.0207, "step": 257030 }, { "epoch": 1.66, "learning_rate": 5.115046760941544e-05, "loss": 0.0246, "step": 257040 }, { "epoch": 1.66, "learning_rate": 5.1140786255058505e-05, "loss": 0.031, "step": 257050 }, { "epoch": 1.66, "learning_rate": 5.113110490070158e-05, "loss": 0.0264, "step": 257060 }, { "epoch": 1.66, "learning_rate": 5.112142354634464e-05, "loss": 0.0231, "step": 257070 }, { "epoch": 1.66, "learning_rate": 5.1111742191987704e-05, "loss": 0.0209, "step": 257080 }, { "epoch": 1.66, "learning_rate": 5.110206083763078e-05, "loss": 0.0233, "step": 257090 }, { "epoch": 1.66, "learning_rate": 5.109237948327384e-05, "loss": 0.0229, "step": 257100 }, { "epoch": 1.66, "learning_rate": 5.1082698128916916e-05, "loss": 0.0223, "step": 257110 }, { "epoch": 1.66, "learning_rate": 5.1073016774559976e-05, "loss": 0.0279, "step": 257120 }, { "epoch": 1.66, "learning_rate": 5.106333542020305e-05, "loss": 0.0223, "step": 257130 }, { "epoch": 1.66, "learning_rate": 5.1053654065846115e-05, "loss": 0.0272, "step": 257140 }, { "epoch": 1.66, "learning_rate": 5.104397271148918e-05, "loss": 0.0284, "step": 257150 }, { "epoch": 1.66, "learning_rate": 5.1034291357132254e-05, "loss": 0.0212, "step": 257160 }, { "epoch": 1.66, "learning_rate": 5.1024610002775314e-05, "loss": 0.0253, "step": 257170 }, { "epoch": 1.66, "learning_rate": 5.101492864841839e-05, "loss": 0.0214, "step": 257180 }, { "epoch": 1.66, "learning_rate": 5.100524729406145e-05, "loss": 0.0284, "step": 257190 }, { "epoch": 1.66, "learning_rate": 5.0995565939704526e-05, "loss": 0.0224, "step": 257200 }, { "epoch": 1.66, "learning_rate": 5.098588458534759e-05, "loss": 0.0243, "step": 257210 }, { "epoch": 1.66, "learning_rate": 5.097620323099065e-05, "loss": 0.0263, "step": 257220 }, { "epoch": 1.66, "learning_rate": 5.0966521876633725e-05, "loss": 0.0223, "step": 257230 }, { "epoch": 1.66, "learning_rate": 5.095684052227679e-05, "loss": 0.0283, "step": 257240 }, { "epoch": 1.66, "learning_rate": 5.0947159167919864e-05, "loss": 0.0261, "step": 257250 }, { "epoch": 1.66, "learning_rate": 5.093747781356293e-05, "loss": 0.0231, "step": 257260 }, { "epoch": 1.66, "learning_rate": 5.0927796459205996e-05, "loss": 0.0238, "step": 257270 }, { "epoch": 1.66, "learning_rate": 5.091811510484906e-05, "loss": 0.0238, "step": 257280 }, { "epoch": 1.66, "learning_rate": 5.090843375049213e-05, "loss": 0.0261, "step": 257290 }, { "epoch": 1.66, "learning_rate": 5.08987523961352e-05, "loss": 0.0235, "step": 257300 }, { "epoch": 1.66, "learning_rate": 5.088907104177827e-05, "loss": 0.0233, "step": 257310 }, { "epoch": 1.66, "learning_rate": 5.0879389687421334e-05, "loss": 0.03, "step": 257320 }, { "epoch": 1.66, "learning_rate": 5.08697083330644e-05, "loss": 0.0264, "step": 257330 }, { "epoch": 1.66, "learning_rate": 5.0860026978707474e-05, "loss": 0.0261, "step": 257340 }, { "epoch": 1.66, "learning_rate": 5.085034562435054e-05, "loss": 0.0286, "step": 257350 }, { "epoch": 1.66, "learning_rate": 5.0840664269993606e-05, "loss": 0.0285, "step": 257360 }, { "epoch": 1.66, "learning_rate": 5.083098291563667e-05, "loss": 0.0258, "step": 257370 }, { "epoch": 1.66, "learning_rate": 5.082130156127974e-05, "loss": 0.0223, "step": 257380 }, { "epoch": 1.66, "learning_rate": 5.081162020692281e-05, "loss": 0.0285, "step": 257390 }, { "epoch": 1.66, "learning_rate": 5.080193885256588e-05, "loss": 0.0267, "step": 257400 }, { "epoch": 1.66, "learning_rate": 5.0792257498208944e-05, "loss": 0.0285, "step": 257410 }, { "epoch": 1.66, "learning_rate": 5.078257614385201e-05, "loss": 0.0194, "step": 257420 }, { "epoch": 1.66, "learning_rate": 5.0772894789495077e-05, "loss": 0.0314, "step": 257430 }, { "epoch": 1.66, "learning_rate": 5.076321343513815e-05, "loss": 0.0273, "step": 257440 }, { "epoch": 1.66, "learning_rate": 5.0753532080781216e-05, "loss": 0.0293, "step": 257450 }, { "epoch": 1.66, "learning_rate": 5.074385072642429e-05, "loss": 0.0219, "step": 257460 }, { "epoch": 1.66, "learning_rate": 5.073416937206735e-05, "loss": 0.0265, "step": 257470 }, { "epoch": 1.66, "learning_rate": 5.0724488017710414e-05, "loss": 0.0227, "step": 257480 }, { "epoch": 1.66, "learning_rate": 5.071480666335349e-05, "loss": 0.0225, "step": 257490 }, { "epoch": 1.66, "learning_rate": 5.0705125308996554e-05, "loss": 0.0217, "step": 257500 }, { "epoch": 1.66, "learning_rate": 5.069544395463963e-05, "loss": 0.0259, "step": 257510 }, { "epoch": 1.66, "learning_rate": 5.0685762600282686e-05, "loss": 0.0256, "step": 257520 }, { "epoch": 1.66, "learning_rate": 5.067608124592576e-05, "loss": 0.0295, "step": 257530 }, { "epoch": 1.66, "learning_rate": 5.0666399891568825e-05, "loss": 0.0217, "step": 257540 }, { "epoch": 1.66, "learning_rate": 5.065671853721189e-05, "loss": 0.0292, "step": 257550 }, { "epoch": 1.66, "learning_rate": 5.0647037182854965e-05, "loss": 0.0207, "step": 257560 }, { "epoch": 1.66, "learning_rate": 5.0637355828498024e-05, "loss": 0.0243, "step": 257570 }, { "epoch": 1.66, "learning_rate": 5.06276744741411e-05, "loss": 0.026, "step": 257580 }, { "epoch": 1.66, "learning_rate": 5.0617993119784163e-05, "loss": 0.0215, "step": 257590 }, { "epoch": 1.66, "learning_rate": 5.0608311765427236e-05, "loss": 0.0289, "step": 257600 }, { "epoch": 1.66, "learning_rate": 5.05986304110703e-05, "loss": 0.0292, "step": 257610 }, { "epoch": 1.66, "learning_rate": 5.058894905671336e-05, "loss": 0.0268, "step": 257620 }, { "epoch": 1.66, "learning_rate": 5.0579267702356435e-05, "loss": 0.0269, "step": 257630 }, { "epoch": 1.66, "learning_rate": 5.05695863479995e-05, "loss": 0.0237, "step": 257640 }, { "epoch": 1.66, "learning_rate": 5.0559904993642574e-05, "loss": 0.0307, "step": 257650 }, { "epoch": 1.66, "learning_rate": 5.055022363928564e-05, "loss": 0.0245, "step": 257660 }, { "epoch": 1.66, "learning_rate": 5.0540542284928714e-05, "loss": 0.023, "step": 257670 }, { "epoch": 1.66, "learning_rate": 5.053086093057177e-05, "loss": 0.0202, "step": 257680 }, { "epoch": 1.66, "learning_rate": 5.052117957621484e-05, "loss": 0.0255, "step": 257690 }, { "epoch": 1.66, "learning_rate": 5.051149822185791e-05, "loss": 0.0224, "step": 257700 }, { "epoch": 1.66, "learning_rate": 5.050181686750098e-05, "loss": 0.0279, "step": 257710 }, { "epoch": 1.66, "learning_rate": 5.049213551314405e-05, "loss": 0.0235, "step": 257720 }, { "epoch": 1.66, "learning_rate": 5.048245415878711e-05, "loss": 0.0264, "step": 257730 }, { "epoch": 1.66, "learning_rate": 5.0472772804430184e-05, "loss": 0.0275, "step": 257740 }, { "epoch": 1.66, "learning_rate": 5.046309145007325e-05, "loss": 0.0275, "step": 257750 }, { "epoch": 1.66, "learning_rate": 5.045341009571632e-05, "loss": 0.0242, "step": 257760 }, { "epoch": 1.66, "learning_rate": 5.044372874135939e-05, "loss": 0.0223, "step": 257770 }, { "epoch": 1.66, "learning_rate": 5.043404738700245e-05, "loss": 0.0265, "step": 257780 }, { "epoch": 1.66, "learning_rate": 5.042436603264552e-05, "loss": 0.0277, "step": 257790 }, { "epoch": 1.66, "learning_rate": 5.041468467828859e-05, "loss": 0.0235, "step": 257800 }, { "epoch": 1.66, "learning_rate": 5.040500332393166e-05, "loss": 0.0216, "step": 257810 }, { "epoch": 1.66, "learning_rate": 5.039532196957473e-05, "loss": 0.0241, "step": 257820 }, { "epoch": 1.66, "learning_rate": 5.038564061521779e-05, "loss": 0.0264, "step": 257830 }, { "epoch": 1.66, "learning_rate": 5.037595926086086e-05, "loss": 0.0254, "step": 257840 }, { "epoch": 1.66, "learning_rate": 5.0366277906503926e-05, "loss": 0.0212, "step": 257850 }, { "epoch": 1.66, "learning_rate": 5.0356596552147e-05, "loss": 0.0246, "step": 257860 }, { "epoch": 1.66, "learning_rate": 5.0346915197790066e-05, "loss": 0.0274, "step": 257870 }, { "epoch": 1.66, "learning_rate": 5.033723384343314e-05, "loss": 0.0232, "step": 257880 }, { "epoch": 1.66, "learning_rate": 5.03275524890762e-05, "loss": 0.0216, "step": 257890 }, { "epoch": 1.66, "learning_rate": 5.0317871134719264e-05, "loss": 0.0229, "step": 257900 }, { "epoch": 1.66, "learning_rate": 5.030818978036234e-05, "loss": 0.0341, "step": 257910 }, { "epoch": 1.66, "learning_rate": 5.0298508426005404e-05, "loss": 0.0236, "step": 257920 }, { "epoch": 1.66, "learning_rate": 5.0288827071648477e-05, "loss": 0.0238, "step": 257930 }, { "epoch": 1.66, "learning_rate": 5.0279145717291536e-05, "loss": 0.0234, "step": 257940 }, { "epoch": 1.66, "learning_rate": 5.026946436293461e-05, "loss": 0.0226, "step": 257950 }, { "epoch": 1.66, "learning_rate": 5.0259783008577675e-05, "loss": 0.0212, "step": 257960 }, { "epoch": 1.66, "learning_rate": 5.025010165422074e-05, "loss": 0.025, "step": 257970 }, { "epoch": 1.67, "learning_rate": 5.0240420299863815e-05, "loss": 0.0282, "step": 257980 }, { "epoch": 1.67, "learning_rate": 5.0230738945506874e-05, "loss": 0.0277, "step": 257990 }, { "epoch": 1.67, "learning_rate": 5.022105759114995e-05, "loss": 0.0236, "step": 258000 }, { "epoch": 1.67, "eval_cer": 0.9198228448762852, "eval_loss": 0.018363136798143387, "eval_runtime": 120.066, "eval_samples_per_second": 16.658, "eval_steps_per_second": 4.164, "step": 258000 }, { "epoch": 1.67, "learning_rate": 5.021137623679301e-05, "loss": 0.0231, "step": 258010 }, { "epoch": 1.67, "learning_rate": 5.0201694882436086e-05, "loss": 0.0217, "step": 258020 }, { "epoch": 1.67, "learning_rate": 5.019201352807915e-05, "loss": 0.0247, "step": 258030 }, { "epoch": 1.67, "learning_rate": 5.018233217372221e-05, "loss": 0.0248, "step": 258040 }, { "epoch": 1.67, "learning_rate": 5.0172650819365285e-05, "loss": 0.0276, "step": 258050 }, { "epoch": 1.67, "learning_rate": 5.016296946500835e-05, "loss": 0.0213, "step": 258060 }, { "epoch": 1.67, "learning_rate": 5.0153288110651424e-05, "loss": 0.0285, "step": 258070 }, { "epoch": 1.67, "learning_rate": 5.014360675629449e-05, "loss": 0.0236, "step": 258080 }, { "epoch": 1.67, "learning_rate": 5.0133925401937564e-05, "loss": 0.029, "step": 258090 }, { "epoch": 1.67, "learning_rate": 5.012424404758062e-05, "loss": 0.0282, "step": 258100 }, { "epoch": 1.67, "learning_rate": 5.011456269322369e-05, "loss": 0.0244, "step": 258110 }, { "epoch": 1.67, "learning_rate": 5.010488133886676e-05, "loss": 0.0251, "step": 258120 }, { "epoch": 1.67, "learning_rate": 5.009519998450983e-05, "loss": 0.0268, "step": 258130 }, { "epoch": 1.67, "learning_rate": 5.00855186301529e-05, "loss": 0.0268, "step": 258140 }, { "epoch": 1.67, "learning_rate": 5.007583727579596e-05, "loss": 0.021, "step": 258150 }, { "epoch": 1.67, "learning_rate": 5.0066155921439034e-05, "loss": 0.0272, "step": 258160 }, { "epoch": 1.67, "learning_rate": 5.00564745670821e-05, "loss": 0.0218, "step": 258170 }, { "epoch": 1.67, "learning_rate": 5.0046793212725166e-05, "loss": 0.0211, "step": 258180 }, { "epoch": 1.67, "learning_rate": 5.003711185836824e-05, "loss": 0.0262, "step": 258190 }, { "epoch": 1.67, "learning_rate": 5.00274305040113e-05, "loss": 0.0314, "step": 258200 }, { "epoch": 1.67, "learning_rate": 5.001774914965437e-05, "loss": 0.022, "step": 258210 }, { "epoch": 1.67, "learning_rate": 5.000806779529744e-05, "loss": 0.0269, "step": 258220 }, { "epoch": 1.67, "learning_rate": 4.999838644094051e-05, "loss": 0.0252, "step": 258230 }, { "epoch": 1.67, "learning_rate": 4.998870508658358e-05, "loss": 0.0305, "step": 258240 }, { "epoch": 1.67, "learning_rate": 4.997902373222664e-05, "loss": 0.0223, "step": 258250 }, { "epoch": 1.67, "learning_rate": 4.996934237786971e-05, "loss": 0.027, "step": 258260 }, { "epoch": 1.67, "learning_rate": 4.9959661023512776e-05, "loss": 0.0249, "step": 258270 }, { "epoch": 1.67, "learning_rate": 4.994997966915585e-05, "loss": 0.0279, "step": 258280 }, { "epoch": 1.67, "learning_rate": 4.9940298314798915e-05, "loss": 0.0271, "step": 258290 }, { "epoch": 1.67, "learning_rate": 4.993061696044199e-05, "loss": 0.0249, "step": 258300 }, { "epoch": 1.67, "learning_rate": 4.992093560608505e-05, "loss": 0.0224, "step": 258310 }, { "epoch": 1.67, "learning_rate": 4.9911254251728114e-05, "loss": 0.0253, "step": 258320 }, { "epoch": 1.67, "learning_rate": 4.990157289737119e-05, "loss": 0.0244, "step": 258330 }, { "epoch": 1.67, "learning_rate": 4.989189154301425e-05, "loss": 0.0198, "step": 258340 }, { "epoch": 1.67, "learning_rate": 4.9882210188657326e-05, "loss": 0.0225, "step": 258350 }, { "epoch": 1.67, "learning_rate": 4.9872528834300386e-05, "loss": 0.0259, "step": 258360 }, { "epoch": 1.67, "learning_rate": 4.986284747994346e-05, "loss": 0.0225, "step": 258370 }, { "epoch": 1.67, "learning_rate": 4.9853166125586525e-05, "loss": 0.025, "step": 258380 }, { "epoch": 1.67, "learning_rate": 4.984348477122959e-05, "loss": 0.0277, "step": 258390 }, { "epoch": 1.67, "learning_rate": 4.9833803416872664e-05, "loss": 0.0241, "step": 258400 }, { "epoch": 1.67, "learning_rate": 4.9824122062515724e-05, "loss": 0.0199, "step": 258410 }, { "epoch": 1.67, "learning_rate": 4.98144407081588e-05, "loss": 0.0266, "step": 258420 }, { "epoch": 1.67, "learning_rate": 4.980475935380186e-05, "loss": 0.0311, "step": 258430 }, { "epoch": 1.67, "learning_rate": 4.9795077999444936e-05, "loss": 0.023, "step": 258440 }, { "epoch": 1.67, "learning_rate": 4.9785396645088e-05, "loss": 0.0227, "step": 258450 }, { "epoch": 1.67, "learning_rate": 4.977571529073106e-05, "loss": 0.0229, "step": 258460 }, { "epoch": 1.67, "learning_rate": 4.9766033936374135e-05, "loss": 0.023, "step": 258470 }, { "epoch": 1.67, "learning_rate": 4.97563525820172e-05, "loss": 0.0265, "step": 258480 }, { "epoch": 1.67, "learning_rate": 4.9746671227660274e-05, "loss": 0.0224, "step": 258490 }, { "epoch": 1.67, "learning_rate": 4.973698987330334e-05, "loss": 0.0288, "step": 258500 }, { "epoch": 1.67, "learning_rate": 4.9727308518946407e-05, "loss": 0.0257, "step": 258510 }, { "epoch": 1.67, "learning_rate": 4.971762716458947e-05, "loss": 0.0226, "step": 258520 }, { "epoch": 1.67, "learning_rate": 4.970794581023254e-05, "loss": 0.0279, "step": 258530 }, { "epoch": 1.67, "learning_rate": 4.969826445587561e-05, "loss": 0.0219, "step": 258540 }, { "epoch": 1.67, "learning_rate": 4.968858310151868e-05, "loss": 0.0259, "step": 258550 }, { "epoch": 1.67, "learning_rate": 4.9678901747161745e-05, "loss": 0.0225, "step": 258560 }, { "epoch": 1.67, "learning_rate": 4.966922039280481e-05, "loss": 0.0251, "step": 258570 }, { "epoch": 1.67, "learning_rate": 4.9659539038447884e-05, "loss": 0.0198, "step": 258580 }, { "epoch": 1.67, "learning_rate": 4.964985768409095e-05, "loss": 0.0239, "step": 258590 }, { "epoch": 1.67, "learning_rate": 4.9640176329734016e-05, "loss": 0.0308, "step": 258600 }, { "epoch": 1.67, "learning_rate": 4.963049497537708e-05, "loss": 0.0219, "step": 258610 }, { "epoch": 1.67, "learning_rate": 4.962081362102015e-05, "loss": 0.027, "step": 258620 }, { "epoch": 1.67, "learning_rate": 4.961113226666322e-05, "loss": 0.027, "step": 258630 }, { "epoch": 1.67, "learning_rate": 4.960145091230629e-05, "loss": 0.0333, "step": 258640 }, { "epoch": 1.67, "learning_rate": 4.959176955794936e-05, "loss": 0.0237, "step": 258650 }, { "epoch": 1.67, "learning_rate": 4.958208820359243e-05, "loss": 0.024, "step": 258660 }, { "epoch": 1.67, "learning_rate": 4.957240684923549e-05, "loss": 0.0245, "step": 258670 }, { "epoch": 1.67, "learning_rate": 4.956272549487856e-05, "loss": 0.029, "step": 258680 }, { "epoch": 1.67, "learning_rate": 4.9553044140521626e-05, "loss": 0.02, "step": 258690 }, { "epoch": 1.67, "learning_rate": 4.95433627861647e-05, "loss": 0.0243, "step": 258700 }, { "epoch": 1.67, "learning_rate": 4.9533681431807765e-05, "loss": 0.0325, "step": 258710 }, { "epoch": 1.67, "learning_rate": 4.952400007745083e-05, "loss": 0.0234, "step": 258720 }, { "epoch": 1.67, "learning_rate": 4.95143187230939e-05, "loss": 0.0287, "step": 258730 }, { "epoch": 1.67, "learning_rate": 4.9504637368736964e-05, "loss": 0.0238, "step": 258740 }, { "epoch": 1.67, "learning_rate": 4.949495601438004e-05, "loss": 0.0244, "step": 258750 }, { "epoch": 1.67, "learning_rate": 4.94852746600231e-05, "loss": 0.0255, "step": 258760 }, { "epoch": 1.67, "learning_rate": 4.947559330566617e-05, "loss": 0.0196, "step": 258770 }, { "epoch": 1.67, "learning_rate": 4.9465911951309236e-05, "loss": 0.0203, "step": 258780 }, { "epoch": 1.67, "learning_rate": 4.945623059695231e-05, "loss": 0.0263, "step": 258790 }, { "epoch": 1.67, "learning_rate": 4.9446549242595375e-05, "loss": 0.0233, "step": 258800 }, { "epoch": 1.67, "learning_rate": 4.943686788823844e-05, "loss": 0.0249, "step": 258810 }, { "epoch": 1.67, "learning_rate": 4.942718653388151e-05, "loss": 0.0279, "step": 258820 }, { "epoch": 1.67, "learning_rate": 4.9417505179524574e-05, "loss": 0.0273, "step": 258830 }, { "epoch": 1.67, "learning_rate": 4.940782382516765e-05, "loss": 0.0263, "step": 258840 }, { "epoch": 1.67, "learning_rate": 4.939814247081071e-05, "loss": 0.0254, "step": 258850 }, { "epoch": 1.67, "learning_rate": 4.9388461116453786e-05, "loss": 0.0247, "step": 258860 }, { "epoch": 1.67, "learning_rate": 4.9378779762096845e-05, "loss": 0.0267, "step": 258870 }, { "epoch": 1.67, "learning_rate": 4.936909840773991e-05, "loss": 0.0255, "step": 258880 }, { "epoch": 1.67, "learning_rate": 4.9359417053382985e-05, "loss": 0.0194, "step": 258890 }, { "epoch": 1.67, "learning_rate": 4.934973569902605e-05, "loss": 0.0205, "step": 258900 }, { "epoch": 1.67, "learning_rate": 4.9340054344669124e-05, "loss": 0.0238, "step": 258910 }, { "epoch": 1.67, "learning_rate": 4.933037299031218e-05, "loss": 0.0268, "step": 258920 }, { "epoch": 1.67, "learning_rate": 4.9320691635955256e-05, "loss": 0.0248, "step": 258930 }, { "epoch": 1.67, "learning_rate": 4.931101028159832e-05, "loss": 0.0222, "step": 258940 }, { "epoch": 1.67, "learning_rate": 4.930132892724139e-05, "loss": 0.0219, "step": 258950 }, { "epoch": 1.67, "learning_rate": 4.929164757288446e-05, "loss": 0.0255, "step": 258960 }, { "epoch": 1.67, "learning_rate": 4.928196621852752e-05, "loss": 0.026, "step": 258970 }, { "epoch": 1.67, "learning_rate": 4.9272284864170594e-05, "loss": 0.0208, "step": 258980 }, { "epoch": 1.67, "learning_rate": 4.926260350981366e-05, "loss": 0.0239, "step": 258990 }, { "epoch": 1.67, "learning_rate": 4.9252922155456734e-05, "loss": 0.0276, "step": 259000 }, { "epoch": 1.67, "eval_cer": 0.9198409219297254, "eval_loss": 0.018455343320965767, "eval_runtime": 120.0636, "eval_samples_per_second": 16.658, "eval_steps_per_second": 4.164, "step": 259000 }, { "epoch": 1.67, "learning_rate": 4.92432408010998e-05, "loss": 0.0202, "step": 259010 }, { "epoch": 1.67, "learning_rate": 4.923355944674286e-05, "loss": 0.0241, "step": 259020 }, { "epoch": 1.67, "learning_rate": 4.922387809238593e-05, "loss": 0.0316, "step": 259030 }, { "epoch": 1.67, "learning_rate": 4.9214196738029e-05, "loss": 0.0258, "step": 259040 }, { "epoch": 1.67, "learning_rate": 4.920451538367207e-05, "loss": 0.0275, "step": 259050 }, { "epoch": 1.67, "learning_rate": 4.919483402931514e-05, "loss": 0.0228, "step": 259060 }, { "epoch": 1.67, "learning_rate": 4.918515267495821e-05, "loss": 0.024, "step": 259070 }, { "epoch": 1.67, "learning_rate": 4.917547132060127e-05, "loss": 0.0237, "step": 259080 }, { "epoch": 1.67, "learning_rate": 4.9165789966244336e-05, "loss": 0.0252, "step": 259090 }, { "epoch": 1.67, "learning_rate": 4.915610861188741e-05, "loss": 0.0263, "step": 259100 }, { "epoch": 1.67, "learning_rate": 4.9146427257530476e-05, "loss": 0.0264, "step": 259110 }, { "epoch": 1.67, "learning_rate": 4.913674590317355e-05, "loss": 0.0225, "step": 259120 }, { "epoch": 1.67, "learning_rate": 4.912706454881661e-05, "loss": 0.0285, "step": 259130 }, { "epoch": 1.67, "learning_rate": 4.9117383194459674e-05, "loss": 0.0228, "step": 259140 }, { "epoch": 1.67, "learning_rate": 4.910770184010275e-05, "loss": 0.0208, "step": 259150 }, { "epoch": 1.67, "learning_rate": 4.9098020485745814e-05, "loss": 0.0213, "step": 259160 }, { "epoch": 1.67, "learning_rate": 4.908833913138889e-05, "loss": 0.0222, "step": 259170 }, { "epoch": 1.67, "learning_rate": 4.9078657777031946e-05, "loss": 0.0243, "step": 259180 }, { "epoch": 1.67, "learning_rate": 4.906897642267502e-05, "loss": 0.0233, "step": 259190 }, { "epoch": 1.67, "learning_rate": 4.9059295068318085e-05, "loss": 0.0256, "step": 259200 }, { "epoch": 1.67, "learning_rate": 4.904961371396115e-05, "loss": 0.0223, "step": 259210 }, { "epoch": 1.67, "learning_rate": 4.9039932359604225e-05, "loss": 0.0238, "step": 259220 }, { "epoch": 1.67, "learning_rate": 4.9030251005247284e-05, "loss": 0.024, "step": 259230 }, { "epoch": 1.67, "learning_rate": 4.902056965089036e-05, "loss": 0.0273, "step": 259240 }, { "epoch": 1.67, "learning_rate": 4.9010888296533423e-05, "loss": 0.0265, "step": 259250 }, { "epoch": 1.67, "learning_rate": 4.9001206942176496e-05, "loss": 0.0264, "step": 259260 }, { "epoch": 1.67, "learning_rate": 4.899152558781956e-05, "loss": 0.023, "step": 259270 }, { "epoch": 1.67, "learning_rate": 4.898184423346262e-05, "loss": 0.0259, "step": 259280 }, { "epoch": 1.67, "learning_rate": 4.8972162879105695e-05, "loss": 0.0282, "step": 259290 }, { "epoch": 1.67, "learning_rate": 4.896248152474876e-05, "loss": 0.0212, "step": 259300 }, { "epoch": 1.67, "learning_rate": 4.8952800170391834e-05, "loss": 0.026, "step": 259310 }, { "epoch": 1.67, "learning_rate": 4.89431188160349e-05, "loss": 0.027, "step": 259320 }, { "epoch": 1.67, "learning_rate": 4.8933437461677974e-05, "loss": 0.0243, "step": 259330 }, { "epoch": 1.67, "learning_rate": 4.892375610732103e-05, "loss": 0.0214, "step": 259340 }, { "epoch": 1.67, "learning_rate": 4.89140747529641e-05, "loss": 0.0286, "step": 259350 }, { "epoch": 1.67, "learning_rate": 4.890439339860717e-05, "loss": 0.0276, "step": 259360 }, { "epoch": 1.67, "learning_rate": 4.889471204425024e-05, "loss": 0.0244, "step": 259370 }, { "epoch": 1.67, "learning_rate": 4.888503068989331e-05, "loss": 0.0191, "step": 259380 }, { "epoch": 1.67, "learning_rate": 4.887534933553637e-05, "loss": 0.0289, "step": 259390 }, { "epoch": 1.67, "learning_rate": 4.8865667981179444e-05, "loss": 0.0225, "step": 259400 }, { "epoch": 1.67, "learning_rate": 4.885598662682251e-05, "loss": 0.0231, "step": 259410 }, { "epoch": 1.67, "learning_rate": 4.8846305272465577e-05, "loss": 0.0264, "step": 259420 }, { "epoch": 1.67, "learning_rate": 4.883662391810865e-05, "loss": 0.0237, "step": 259430 }, { "epoch": 1.67, "learning_rate": 4.882694256375171e-05, "loss": 0.0242, "step": 259440 }, { "epoch": 1.67, "learning_rate": 4.881726120939478e-05, "loss": 0.0199, "step": 259450 }, { "epoch": 1.67, "learning_rate": 4.880757985503785e-05, "loss": 0.0208, "step": 259460 }, { "epoch": 1.67, "learning_rate": 4.879789850068092e-05, "loss": 0.0239, "step": 259470 }, { "epoch": 1.67, "learning_rate": 4.878821714632399e-05, "loss": 0.0227, "step": 259480 }, { "epoch": 1.67, "learning_rate": 4.877853579196705e-05, "loss": 0.0253, "step": 259490 }, { "epoch": 1.67, "learning_rate": 4.876885443761012e-05, "loss": 0.0242, "step": 259500 }, { "epoch": 1.67, "learning_rate": 4.8759173083253186e-05, "loss": 0.0275, "step": 259510 }, { "epoch": 1.67, "learning_rate": 4.874949172889626e-05, "loss": 0.0233, "step": 259520 }, { "epoch": 1.68, "learning_rate": 4.8739810374539326e-05, "loss": 0.0242, "step": 259530 }, { "epoch": 1.68, "learning_rate": 4.87301290201824e-05, "loss": 0.0265, "step": 259540 }, { "epoch": 1.68, "learning_rate": 4.872044766582546e-05, "loss": 0.0222, "step": 259550 }, { "epoch": 1.68, "learning_rate": 4.8710766311468524e-05, "loss": 0.0262, "step": 259560 }, { "epoch": 1.68, "learning_rate": 4.87010849571116e-05, "loss": 0.0209, "step": 259570 }, { "epoch": 1.68, "learning_rate": 4.8691403602754664e-05, "loss": 0.0215, "step": 259580 }, { "epoch": 1.68, "learning_rate": 4.8681722248397737e-05, "loss": 0.0303, "step": 259590 }, { "epoch": 1.68, "learning_rate": 4.8672040894040796e-05, "loss": 0.0254, "step": 259600 }, { "epoch": 1.68, "learning_rate": 4.866235953968387e-05, "loss": 0.0268, "step": 259610 }, { "epoch": 1.68, "learning_rate": 4.8652678185326935e-05, "loss": 0.0224, "step": 259620 }, { "epoch": 1.68, "learning_rate": 4.864299683097e-05, "loss": 0.0215, "step": 259630 }, { "epoch": 1.68, "learning_rate": 4.8633315476613075e-05, "loss": 0.024, "step": 259640 }, { "epoch": 1.68, "learning_rate": 4.8623634122256134e-05, "loss": 0.0235, "step": 259650 }, { "epoch": 1.68, "learning_rate": 4.861395276789921e-05, "loss": 0.0247, "step": 259660 }, { "epoch": 1.68, "learning_rate": 4.860427141354227e-05, "loss": 0.028, "step": 259670 }, { "epoch": 1.68, "learning_rate": 4.8594590059185346e-05, "loss": 0.0244, "step": 259680 }, { "epoch": 1.68, "learning_rate": 4.858490870482841e-05, "loss": 0.0223, "step": 259690 }, { "epoch": 1.68, "learning_rate": 4.857522735047147e-05, "loss": 0.0264, "step": 259700 }, { "epoch": 1.68, "learning_rate": 4.8565545996114545e-05, "loss": 0.0249, "step": 259710 }, { "epoch": 1.68, "learning_rate": 4.855586464175761e-05, "loss": 0.0239, "step": 259720 }, { "epoch": 1.68, "learning_rate": 4.8546183287400684e-05, "loss": 0.0242, "step": 259730 }, { "epoch": 1.68, "learning_rate": 4.853650193304375e-05, "loss": 0.0244, "step": 259740 }, { "epoch": 1.68, "learning_rate": 4.8526820578686823e-05, "loss": 0.0273, "step": 259750 }, { "epoch": 1.68, "learning_rate": 4.851713922432988e-05, "loss": 0.0288, "step": 259760 }, { "epoch": 1.68, "learning_rate": 4.850745786997295e-05, "loss": 0.0242, "step": 259770 }, { "epoch": 1.68, "learning_rate": 4.849777651561602e-05, "loss": 0.0219, "step": 259780 }, { "epoch": 1.68, "learning_rate": 4.848809516125909e-05, "loss": 0.0287, "step": 259790 }, { "epoch": 1.68, "learning_rate": 4.847841380690216e-05, "loss": 0.0286, "step": 259800 }, { "epoch": 1.68, "learning_rate": 4.846873245254522e-05, "loss": 0.0283, "step": 259810 }, { "epoch": 1.68, "learning_rate": 4.8459051098188294e-05, "loss": 0.0226, "step": 259820 }, { "epoch": 1.68, "learning_rate": 4.844936974383136e-05, "loss": 0.0278, "step": 259830 }, { "epoch": 1.68, "learning_rate": 4.8439688389474426e-05, "loss": 0.0253, "step": 259840 }, { "epoch": 1.68, "learning_rate": 4.84300070351175e-05, "loss": 0.0227, "step": 259850 }, { "epoch": 1.68, "learning_rate": 4.842032568076056e-05, "loss": 0.0229, "step": 259860 }, { "epoch": 1.68, "learning_rate": 4.841064432640363e-05, "loss": 0.0218, "step": 259870 }, { "epoch": 1.68, "learning_rate": 4.84009629720467e-05, "loss": 0.0292, "step": 259880 }, { "epoch": 1.68, "learning_rate": 4.839128161768977e-05, "loss": 0.0256, "step": 259890 }, { "epoch": 1.68, "learning_rate": 4.838160026333284e-05, "loss": 0.0299, "step": 259900 }, { "epoch": 1.68, "learning_rate": 4.83719189089759e-05, "loss": 0.0241, "step": 259910 }, { "epoch": 1.68, "learning_rate": 4.836223755461897e-05, "loss": 0.0316, "step": 259920 }, { "epoch": 1.68, "learning_rate": 4.8352556200262036e-05, "loss": 0.0271, "step": 259930 }, { "epoch": 1.68, "learning_rate": 4.834287484590511e-05, "loss": 0.0249, "step": 259940 }, { "epoch": 1.68, "learning_rate": 4.8333193491548175e-05, "loss": 0.0227, "step": 259950 }, { "epoch": 1.68, "learning_rate": 4.832351213719124e-05, "loss": 0.0259, "step": 259960 }, { "epoch": 1.68, "learning_rate": 4.831383078283431e-05, "loss": 0.0235, "step": 259970 }, { "epoch": 1.68, "learning_rate": 4.8304149428477374e-05, "loss": 0.0284, "step": 259980 }, { "epoch": 1.68, "learning_rate": 4.829446807412045e-05, "loss": 0.0224, "step": 259990 }, { "epoch": 1.68, "learning_rate": 4.828478671976351e-05, "loss": 0.0233, "step": 260000 }, { "epoch": 1.68, "eval_cer": 0.9198653259518699, "eval_loss": 0.018204906955361366, "eval_runtime": 119.9898, "eval_samples_per_second": 16.668, "eval_steps_per_second": 4.167, "step": 260000 }, { "epoch": 1.68, "learning_rate": 4.827510536540658e-05, "loss": 0.0275, "step": 260010 }, { "epoch": 1.68, "learning_rate": 4.8265424011049646e-05, "loss": 0.0224, "step": 260020 }, { "epoch": 1.68, "learning_rate": 4.825574265669272e-05, "loss": 0.0241, "step": 260030 }, { "epoch": 1.68, "learning_rate": 4.8246061302335785e-05, "loss": 0.0214, "step": 260040 }, { "epoch": 1.68, "learning_rate": 4.823637994797885e-05, "loss": 0.0222, "step": 260050 }, { "epoch": 1.68, "learning_rate": 4.822669859362192e-05, "loss": 0.022, "step": 260060 }, { "epoch": 1.68, "learning_rate": 4.8217017239264984e-05, "loss": 0.0247, "step": 260070 }, { "epoch": 1.68, "learning_rate": 4.820733588490806e-05, "loss": 0.0288, "step": 260080 }, { "epoch": 1.68, "learning_rate": 4.819765453055112e-05, "loss": 0.0286, "step": 260090 }, { "epoch": 1.68, "learning_rate": 4.8187973176194196e-05, "loss": 0.025, "step": 260100 }, { "epoch": 1.68, "learning_rate": 4.8178291821837256e-05, "loss": 0.0235, "step": 260110 }, { "epoch": 1.68, "learning_rate": 4.816861046748032e-05, "loss": 0.0249, "step": 260120 }, { "epoch": 1.68, "learning_rate": 4.8158929113123395e-05, "loss": 0.0222, "step": 260130 }, { "epoch": 1.68, "learning_rate": 4.814924775876646e-05, "loss": 0.0282, "step": 260140 }, { "epoch": 1.68, "learning_rate": 4.8139566404409534e-05, "loss": 0.0264, "step": 260150 }, { "epoch": 1.68, "learning_rate": 4.8129885050052593e-05, "loss": 0.0257, "step": 260160 }, { "epoch": 1.68, "learning_rate": 4.8120203695695667e-05, "loss": 0.0275, "step": 260170 }, { "epoch": 1.68, "learning_rate": 4.811052234133873e-05, "loss": 0.0241, "step": 260180 }, { "epoch": 1.68, "learning_rate": 4.81008409869818e-05, "loss": 0.0224, "step": 260190 }, { "epoch": 1.68, "learning_rate": 4.809115963262487e-05, "loss": 0.0258, "step": 260200 }, { "epoch": 1.68, "learning_rate": 4.808147827826793e-05, "loss": 0.0234, "step": 260210 }, { "epoch": 1.68, "learning_rate": 4.8071796923911004e-05, "loss": 0.0241, "step": 260220 }, { "epoch": 1.68, "learning_rate": 4.806211556955407e-05, "loss": 0.0231, "step": 260230 }, { "epoch": 1.68, "learning_rate": 4.8052434215197144e-05, "loss": 0.0283, "step": 260240 }, { "epoch": 1.68, "learning_rate": 4.804275286084021e-05, "loss": 0.0231, "step": 260250 }, { "epoch": 1.68, "learning_rate": 4.803307150648327e-05, "loss": 0.023, "step": 260260 }, { "epoch": 1.68, "learning_rate": 4.802339015212634e-05, "loss": 0.0274, "step": 260270 }, { "epoch": 1.68, "learning_rate": 4.801370879776941e-05, "loss": 0.0231, "step": 260280 }, { "epoch": 1.68, "learning_rate": 4.800402744341248e-05, "loss": 0.0222, "step": 260290 }, { "epoch": 1.68, "learning_rate": 4.799434608905555e-05, "loss": 0.024, "step": 260300 }, { "epoch": 1.68, "learning_rate": 4.798466473469862e-05, "loss": 0.0248, "step": 260310 }, { "epoch": 1.68, "learning_rate": 4.797498338034168e-05, "loss": 0.0262, "step": 260320 }, { "epoch": 1.68, "learning_rate": 4.796530202598475e-05, "loss": 0.0217, "step": 260330 }, { "epoch": 1.68, "learning_rate": 4.795562067162782e-05, "loss": 0.0253, "step": 260340 }, { "epoch": 1.68, "learning_rate": 4.7945939317270886e-05, "loss": 0.0248, "step": 260350 }, { "epoch": 1.68, "learning_rate": 4.793625796291396e-05, "loss": 0.0306, "step": 260360 }, { "epoch": 1.68, "learning_rate": 4.792657660855702e-05, "loss": 0.0234, "step": 260370 }, { "epoch": 1.68, "learning_rate": 4.791689525420009e-05, "loss": 0.0229, "step": 260380 }, { "epoch": 1.68, "learning_rate": 4.790721389984316e-05, "loss": 0.0204, "step": 260390 }, { "epoch": 1.68, "learning_rate": 4.7897532545486224e-05, "loss": 0.0246, "step": 260400 }, { "epoch": 1.68, "learning_rate": 4.78878511911293e-05, "loss": 0.0205, "step": 260410 }, { "epoch": 1.68, "learning_rate": 4.7878169836772356e-05, "loss": 0.029, "step": 260420 }, { "epoch": 1.68, "learning_rate": 4.786848848241543e-05, "loss": 0.0236, "step": 260430 }, { "epoch": 1.68, "learning_rate": 4.7858807128058496e-05, "loss": 0.0227, "step": 260440 }, { "epoch": 1.68, "learning_rate": 4.784912577370157e-05, "loss": 0.0229, "step": 260450 }, { "epoch": 1.68, "learning_rate": 4.7839444419344635e-05, "loss": 0.0278, "step": 260460 }, { "epoch": 1.68, "learning_rate": 4.7829763064987694e-05, "loss": 0.0264, "step": 260470 }, { "epoch": 1.68, "learning_rate": 4.782008171063077e-05, "loss": 0.0228, "step": 260480 }, { "epoch": 1.68, "learning_rate": 4.7810400356273834e-05, "loss": 0.026, "step": 260490 }, { "epoch": 1.68, "learning_rate": 4.7800719001916907e-05, "loss": 0.028, "step": 260500 }, { "epoch": 1.68, "learning_rate": 4.779103764755997e-05, "loss": 0.0246, "step": 260510 }, { "epoch": 1.68, "learning_rate": 4.7781356293203046e-05, "loss": 0.0248, "step": 260520 }, { "epoch": 1.68, "learning_rate": 4.7771674938846105e-05, "loss": 0.0241, "step": 260530 }, { "epoch": 1.68, "learning_rate": 4.776199358448917e-05, "loss": 0.0224, "step": 260540 }, { "epoch": 1.68, "learning_rate": 4.7752312230132245e-05, "loss": 0.0253, "step": 260550 }, { "epoch": 1.68, "learning_rate": 4.774263087577531e-05, "loss": 0.0272, "step": 260560 }, { "epoch": 1.68, "learning_rate": 4.7732949521418384e-05, "loss": 0.0272, "step": 260570 }, { "epoch": 1.68, "learning_rate": 4.772326816706144e-05, "loss": 0.0284, "step": 260580 }, { "epoch": 1.68, "learning_rate": 4.7713586812704516e-05, "loss": 0.0215, "step": 260590 }, { "epoch": 1.68, "learning_rate": 4.770390545834758e-05, "loss": 0.0219, "step": 260600 }, { "epoch": 1.68, "learning_rate": 4.769422410399065e-05, "loss": 0.0244, "step": 260610 }, { "epoch": 1.68, "learning_rate": 4.768454274963372e-05, "loss": 0.0213, "step": 260620 }, { "epoch": 1.68, "learning_rate": 4.767486139527678e-05, "loss": 0.0295, "step": 260630 }, { "epoch": 1.68, "learning_rate": 4.7665180040919854e-05, "loss": 0.0205, "step": 260640 }, { "epoch": 1.68, "learning_rate": 4.765549868656292e-05, "loss": 0.0241, "step": 260650 }, { "epoch": 1.68, "learning_rate": 4.7645817332205994e-05, "loss": 0.0254, "step": 260660 }, { "epoch": 1.68, "learning_rate": 4.763613597784906e-05, "loss": 0.0249, "step": 260670 }, { "epoch": 1.68, "learning_rate": 4.762645462349212e-05, "loss": 0.0217, "step": 260680 }, { "epoch": 1.68, "learning_rate": 4.761677326913519e-05, "loss": 0.0233, "step": 260690 }, { "epoch": 1.68, "learning_rate": 4.760709191477826e-05, "loss": 0.0219, "step": 260700 }, { "epoch": 1.68, "learning_rate": 4.759741056042133e-05, "loss": 0.0287, "step": 260710 }, { "epoch": 1.68, "learning_rate": 4.75877292060644e-05, "loss": 0.0231, "step": 260720 }, { "epoch": 1.68, "learning_rate": 4.757804785170747e-05, "loss": 0.0236, "step": 260730 }, { "epoch": 1.68, "learning_rate": 4.756836649735053e-05, "loss": 0.0219, "step": 260740 }, { "epoch": 1.68, "learning_rate": 4.7558685142993596e-05, "loss": 0.0277, "step": 260750 }, { "epoch": 1.68, "learning_rate": 4.754900378863667e-05, "loss": 0.0254, "step": 260760 }, { "epoch": 1.68, "learning_rate": 4.7539322434279736e-05, "loss": 0.0252, "step": 260770 }, { "epoch": 1.68, "learning_rate": 4.752964107992281e-05, "loss": 0.0226, "step": 260780 }, { "epoch": 1.68, "learning_rate": 4.751995972556587e-05, "loss": 0.0253, "step": 260790 }, { "epoch": 1.68, "learning_rate": 4.751027837120894e-05, "loss": 0.0246, "step": 260800 }, { "epoch": 1.68, "learning_rate": 4.750059701685201e-05, "loss": 0.0216, "step": 260810 }, { "epoch": 1.68, "learning_rate": 4.7490915662495074e-05, "loss": 0.0217, "step": 260820 }, { "epoch": 1.68, "learning_rate": 4.748123430813815e-05, "loss": 0.0196, "step": 260830 }, { "epoch": 1.68, "learning_rate": 4.7471552953781206e-05, "loss": 0.026, "step": 260840 }, { "epoch": 1.68, "learning_rate": 4.746187159942428e-05, "loss": 0.0252, "step": 260850 }, { "epoch": 1.68, "learning_rate": 4.7452190245067345e-05, "loss": 0.0214, "step": 260860 }, { "epoch": 1.68, "learning_rate": 4.744250889071041e-05, "loss": 0.0235, "step": 260870 }, { "epoch": 1.68, "learning_rate": 4.7432827536353485e-05, "loss": 0.0242, "step": 260880 }, { "epoch": 1.68, "learning_rate": 4.7423146181996544e-05, "loss": 0.0235, "step": 260890 }, { "epoch": 1.68, "learning_rate": 4.741346482763962e-05, "loss": 0.0246, "step": 260900 }, { "epoch": 1.68, "learning_rate": 4.7403783473282683e-05, "loss": 0.0241, "step": 260910 }, { "epoch": 1.68, "learning_rate": 4.7394102118925756e-05, "loss": 0.0234, "step": 260920 }, { "epoch": 1.68, "learning_rate": 4.738442076456882e-05, "loss": 0.0261, "step": 260930 }, { "epoch": 1.68, "learning_rate": 4.737473941021188e-05, "loss": 0.0269, "step": 260940 }, { "epoch": 1.68, "learning_rate": 4.7365058055854955e-05, "loss": 0.0301, "step": 260950 }, { "epoch": 1.68, "learning_rate": 4.735537670149802e-05, "loss": 0.0247, "step": 260960 }, { "epoch": 1.68, "learning_rate": 4.7345695347141094e-05, "loss": 0.0272, "step": 260970 }, { "epoch": 1.68, "learning_rate": 4.733601399278416e-05, "loss": 0.0261, "step": 260980 }, { "epoch": 1.68, "learning_rate": 4.7326332638427234e-05, "loss": 0.0291, "step": 260990 }, { "epoch": 1.68, "learning_rate": 4.731665128407029e-05, "loss": 0.0205, "step": 261000 }, { "epoch": 1.68, "eval_cer": 0.919811998644221, "eval_loss": 0.01825707219541073, "eval_runtime": 120.0532, "eval_samples_per_second": 16.659, "eval_steps_per_second": 4.165, "step": 261000 }, { "epoch": 1.68, "learning_rate": 4.730696992971336e-05, "loss": 0.022, "step": 261010 }, { "epoch": 1.68, "learning_rate": 4.729728857535643e-05, "loss": 0.0277, "step": 261020 }, { "epoch": 1.68, "learning_rate": 4.72876072209995e-05, "loss": 0.0285, "step": 261030 }, { "epoch": 1.68, "learning_rate": 4.727792586664257e-05, "loss": 0.0276, "step": 261040 }, { "epoch": 1.68, "learning_rate": 4.726824451228563e-05, "loss": 0.0256, "step": 261050 }, { "epoch": 1.68, "learning_rate": 4.7258563157928704e-05, "loss": 0.0254, "step": 261060 }, { "epoch": 1.69, "learning_rate": 4.724888180357177e-05, "loss": 0.0299, "step": 261070 }, { "epoch": 1.69, "learning_rate": 4.7239200449214837e-05, "loss": 0.0303, "step": 261080 }, { "epoch": 1.69, "learning_rate": 4.722951909485791e-05, "loss": 0.025, "step": 261090 }, { "epoch": 1.69, "learning_rate": 4.721983774050097e-05, "loss": 0.0265, "step": 261100 }, { "epoch": 1.69, "learning_rate": 4.721015638614404e-05, "loss": 0.025, "step": 261110 }, { "epoch": 1.69, "learning_rate": 4.720047503178711e-05, "loss": 0.0245, "step": 261120 }, { "epoch": 1.69, "learning_rate": 4.719079367743018e-05, "loss": 0.0268, "step": 261130 }, { "epoch": 1.69, "learning_rate": 4.718111232307325e-05, "loss": 0.0267, "step": 261140 }, { "epoch": 1.69, "learning_rate": 4.717143096871631e-05, "loss": 0.024, "step": 261150 }, { "epoch": 1.69, "learning_rate": 4.716174961435938e-05, "loss": 0.0222, "step": 261160 }, { "epoch": 1.69, "learning_rate": 4.7152068260002446e-05, "loss": 0.0251, "step": 261170 }, { "epoch": 1.69, "learning_rate": 4.714238690564552e-05, "loss": 0.0275, "step": 261180 }, { "epoch": 1.69, "learning_rate": 4.7132705551288586e-05, "loss": 0.0285, "step": 261190 }, { "epoch": 1.69, "learning_rate": 4.712302419693166e-05, "loss": 0.0219, "step": 261200 }, { "epoch": 1.69, "learning_rate": 4.711334284257472e-05, "loss": 0.0244, "step": 261210 }, { "epoch": 1.69, "learning_rate": 4.7103661488217784e-05, "loss": 0.027, "step": 261220 }, { "epoch": 1.69, "learning_rate": 4.709398013386086e-05, "loss": 0.0301, "step": 261230 }, { "epoch": 1.69, "learning_rate": 4.7084298779503924e-05, "loss": 0.0251, "step": 261240 }, { "epoch": 1.69, "learning_rate": 4.7074617425146997e-05, "loss": 0.0255, "step": 261250 }, { "epoch": 1.69, "learning_rate": 4.7064936070790056e-05, "loss": 0.0224, "step": 261260 }, { "epoch": 1.69, "learning_rate": 4.705525471643313e-05, "loss": 0.0299, "step": 261270 }, { "epoch": 1.69, "learning_rate": 4.7045573362076195e-05, "loss": 0.0256, "step": 261280 }, { "epoch": 1.69, "learning_rate": 4.703589200771926e-05, "loss": 0.0254, "step": 261290 }, { "epoch": 1.69, "learning_rate": 4.7026210653362334e-05, "loss": 0.0216, "step": 261300 }, { "epoch": 1.69, "learning_rate": 4.7016529299005394e-05, "loss": 0.026, "step": 261310 }, { "epoch": 1.69, "learning_rate": 4.700684794464847e-05, "loss": 0.0246, "step": 261320 }, { "epoch": 1.69, "learning_rate": 4.699716659029153e-05, "loss": 0.0241, "step": 261330 }, { "epoch": 1.69, "learning_rate": 4.6987485235934606e-05, "loss": 0.0299, "step": 261340 }, { "epoch": 1.69, "learning_rate": 4.697780388157767e-05, "loss": 0.0217, "step": 261350 }, { "epoch": 1.69, "learning_rate": 4.696812252722073e-05, "loss": 0.0246, "step": 261360 }, { "epoch": 1.69, "learning_rate": 4.6958441172863805e-05, "loss": 0.0252, "step": 261370 }, { "epoch": 1.69, "learning_rate": 4.694875981850687e-05, "loss": 0.0218, "step": 261380 }, { "epoch": 1.69, "learning_rate": 4.6939078464149944e-05, "loss": 0.0217, "step": 261390 }, { "epoch": 1.69, "learning_rate": 4.692939710979301e-05, "loss": 0.0274, "step": 261400 }, { "epoch": 1.69, "learning_rate": 4.691971575543608e-05, "loss": 0.025, "step": 261410 }, { "epoch": 1.69, "learning_rate": 4.691003440107914e-05, "loss": 0.0226, "step": 261420 }, { "epoch": 1.69, "learning_rate": 4.690035304672221e-05, "loss": 0.0241, "step": 261430 }, { "epoch": 1.69, "learning_rate": 4.689067169236528e-05, "loss": 0.0233, "step": 261440 }, { "epoch": 1.69, "learning_rate": 4.688099033800835e-05, "loss": 0.0299, "step": 261450 }, { "epoch": 1.69, "learning_rate": 4.6871308983651415e-05, "loss": 0.0215, "step": 261460 }, { "epoch": 1.69, "learning_rate": 4.686162762929448e-05, "loss": 0.0244, "step": 261470 }, { "epoch": 1.69, "learning_rate": 4.6851946274937554e-05, "loss": 0.0232, "step": 261480 }, { "epoch": 1.69, "learning_rate": 4.684226492058062e-05, "loss": 0.0224, "step": 261490 }, { "epoch": 1.69, "learning_rate": 4.6832583566223686e-05, "loss": 0.0236, "step": 261500 }, { "epoch": 1.69, "learning_rate": 4.682290221186675e-05, "loss": 0.0227, "step": 261510 }, { "epoch": 1.69, "learning_rate": 4.681322085750982e-05, "loss": 0.027, "step": 261520 }, { "epoch": 1.69, "learning_rate": 4.680353950315289e-05, "loss": 0.0248, "step": 261530 }, { "epoch": 1.69, "learning_rate": 4.679385814879596e-05, "loss": 0.0261, "step": 261540 }, { "epoch": 1.69, "learning_rate": 4.678417679443903e-05, "loss": 0.0228, "step": 261550 }, { "epoch": 1.69, "learning_rate": 4.677449544008209e-05, "loss": 0.0226, "step": 261560 }, { "epoch": 1.69, "learning_rate": 4.676481408572516e-05, "loss": 0.0227, "step": 261570 }, { "epoch": 1.69, "learning_rate": 4.675513273136823e-05, "loss": 0.0272, "step": 261580 }, { "epoch": 1.69, "learning_rate": 4.6745451377011296e-05, "loss": 0.0249, "step": 261590 }, { "epoch": 1.69, "learning_rate": 4.673577002265437e-05, "loss": 0.0257, "step": 261600 }, { "epoch": 1.69, "learning_rate": 4.672608866829743e-05, "loss": 0.0225, "step": 261610 }, { "epoch": 1.69, "learning_rate": 4.67164073139405e-05, "loss": 0.024, "step": 261620 }, { "epoch": 1.69, "learning_rate": 4.670672595958357e-05, "loss": 0.0253, "step": 261630 }, { "epoch": 1.69, "learning_rate": 4.6697044605226634e-05, "loss": 0.0248, "step": 261640 }, { "epoch": 1.69, "learning_rate": 4.668736325086971e-05, "loss": 0.0255, "step": 261650 }, { "epoch": 1.69, "learning_rate": 4.6677681896512767e-05, "loss": 0.0208, "step": 261660 }, { "epoch": 1.69, "learning_rate": 4.666800054215584e-05, "loss": 0.0263, "step": 261670 }, { "epoch": 1.69, "learning_rate": 4.6658319187798906e-05, "loss": 0.0259, "step": 261680 }, { "epoch": 1.69, "learning_rate": 4.664863783344198e-05, "loss": 0.0376, "step": 261690 }, { "epoch": 1.69, "learning_rate": 4.6638956479085045e-05, "loss": 0.0238, "step": 261700 }, { "epoch": 1.69, "learning_rate": 4.6629275124728105e-05, "loss": 0.0229, "step": 261710 }, { "epoch": 1.69, "learning_rate": 4.661959377037118e-05, "loss": 0.0356, "step": 261720 }, { "epoch": 1.69, "learning_rate": 4.6609912416014244e-05, "loss": 0.0321, "step": 261730 }, { "epoch": 1.69, "learning_rate": 4.660023106165732e-05, "loss": 0.0251, "step": 261740 }, { "epoch": 1.69, "learning_rate": 4.659054970730038e-05, "loss": 0.0241, "step": 261750 }, { "epoch": 1.69, "learning_rate": 4.6580868352943456e-05, "loss": 0.027, "step": 261760 }, { "epoch": 1.69, "learning_rate": 4.6571186998586515e-05, "loss": 0.0228, "step": 261770 }, { "epoch": 1.69, "learning_rate": 4.656150564422958e-05, "loss": 0.0266, "step": 261780 }, { "epoch": 1.69, "learning_rate": 4.6551824289872655e-05, "loss": 0.0249, "step": 261790 }, { "epoch": 1.69, "learning_rate": 4.654214293551572e-05, "loss": 0.0235, "step": 261800 }, { "epoch": 1.69, "learning_rate": 4.6532461581158794e-05, "loss": 0.0236, "step": 261810 }, { "epoch": 1.69, "learning_rate": 4.6522780226801853e-05, "loss": 0.0263, "step": 261820 }, { "epoch": 1.69, "learning_rate": 4.6513098872444926e-05, "loss": 0.021, "step": 261830 }, { "epoch": 1.69, "learning_rate": 4.650341751808799e-05, "loss": 0.0234, "step": 261840 }, { "epoch": 1.69, "learning_rate": 4.649373616373106e-05, "loss": 0.0247, "step": 261850 }, { "epoch": 1.69, "learning_rate": 4.648405480937413e-05, "loss": 0.0272, "step": 261860 }, { "epoch": 1.69, "learning_rate": 4.647437345501719e-05, "loss": 0.0306, "step": 261870 }, { "epoch": 1.69, "learning_rate": 4.6464692100660264e-05, "loss": 0.0244, "step": 261880 }, { "epoch": 1.69, "learning_rate": 4.645501074630333e-05, "loss": 0.0208, "step": 261890 }, { "epoch": 1.69, "learning_rate": 4.6445329391946404e-05, "loss": 0.0235, "step": 261900 }, { "epoch": 1.69, "learning_rate": 4.643564803758947e-05, "loss": 0.0287, "step": 261910 }, { "epoch": 1.69, "learning_rate": 4.642596668323253e-05, "loss": 0.0271, "step": 261920 }, { "epoch": 1.69, "learning_rate": 4.64162853288756e-05, "loss": 0.0216, "step": 261930 }, { "epoch": 1.69, "learning_rate": 4.640660397451867e-05, "loss": 0.0293, "step": 261940 }, { "epoch": 1.69, "learning_rate": 4.639692262016174e-05, "loss": 0.0269, "step": 261950 }, { "epoch": 1.69, "learning_rate": 4.638724126580481e-05, "loss": 0.0255, "step": 261960 }, { "epoch": 1.69, "learning_rate": 4.637755991144788e-05, "loss": 0.0223, "step": 261970 }, { "epoch": 1.69, "learning_rate": 4.636787855709094e-05, "loss": 0.0286, "step": 261980 }, { "epoch": 1.69, "learning_rate": 4.635819720273401e-05, "loss": 0.026, "step": 261990 }, { "epoch": 1.69, "learning_rate": 4.634851584837708e-05, "loss": 0.0253, "step": 262000 }, { "epoch": 1.69, "eval_cer": 0.9198499604564456, "eval_loss": 0.018117111176252365, "eval_runtime": 120.1178, "eval_samples_per_second": 16.65, "eval_steps_per_second": 4.163, "step": 262000 }, { "epoch": 1.69, "learning_rate": 4.6338834494020146e-05, "loss": 0.0266, "step": 262010 }, { "epoch": 1.69, "learning_rate": 4.632915313966322e-05, "loss": 0.0256, "step": 262020 }, { "epoch": 1.69, "learning_rate": 4.631947178530628e-05, "loss": 0.0262, "step": 262030 }, { "epoch": 1.69, "learning_rate": 4.630979043094935e-05, "loss": 0.027, "step": 262040 }, { "epoch": 1.69, "learning_rate": 4.630010907659242e-05, "loss": 0.0222, "step": 262050 }, { "epoch": 1.69, "learning_rate": 4.6290427722235484e-05, "loss": 0.0248, "step": 262060 }, { "epoch": 1.69, "learning_rate": 4.628074636787856e-05, "loss": 0.0236, "step": 262070 }, { "epoch": 1.69, "learning_rate": 4.6271065013521616e-05, "loss": 0.0251, "step": 262080 }, { "epoch": 1.69, "learning_rate": 4.626138365916469e-05, "loss": 0.0252, "step": 262090 }, { "epoch": 1.69, "learning_rate": 4.6251702304807756e-05, "loss": 0.0216, "step": 262100 }, { "epoch": 1.69, "learning_rate": 4.624202095045083e-05, "loss": 0.0248, "step": 262110 }, { "epoch": 1.69, "learning_rate": 4.6232339596093895e-05, "loss": 0.0227, "step": 262120 }, { "epoch": 1.69, "learning_rate": 4.6222658241736954e-05, "loss": 0.0279, "step": 262130 }, { "epoch": 1.69, "learning_rate": 4.621297688738003e-05, "loss": 0.0247, "step": 262140 }, { "epoch": 1.69, "learning_rate": 4.6203295533023094e-05, "loss": 0.0248, "step": 262150 }, { "epoch": 1.69, "learning_rate": 4.6193614178666167e-05, "loss": 0.0263, "step": 262160 }, { "epoch": 1.69, "learning_rate": 4.618393282430923e-05, "loss": 0.0225, "step": 262170 }, { "epoch": 1.69, "learning_rate": 4.6174251469952306e-05, "loss": 0.0214, "step": 262180 }, { "epoch": 1.69, "learning_rate": 4.6164570115595365e-05, "loss": 0.0259, "step": 262190 }, { "epoch": 1.69, "learning_rate": 4.615488876123843e-05, "loss": 0.0313, "step": 262200 }, { "epoch": 1.69, "learning_rate": 4.6145207406881505e-05, "loss": 0.0223, "step": 262210 }, { "epoch": 1.69, "learning_rate": 4.613552605252457e-05, "loss": 0.0242, "step": 262220 }, { "epoch": 1.69, "learning_rate": 4.6125844698167644e-05, "loss": 0.0224, "step": 262230 }, { "epoch": 1.69, "learning_rate": 4.61161633438107e-05, "loss": 0.0232, "step": 262240 }, { "epoch": 1.69, "learning_rate": 4.6106481989453776e-05, "loss": 0.029, "step": 262250 }, { "epoch": 1.69, "learning_rate": 4.609680063509684e-05, "loss": 0.0205, "step": 262260 }, { "epoch": 1.69, "learning_rate": 4.608711928073991e-05, "loss": 0.0252, "step": 262270 }, { "epoch": 1.69, "learning_rate": 4.607743792638298e-05, "loss": 0.0243, "step": 262280 }, { "epoch": 1.69, "learning_rate": 4.606775657202604e-05, "loss": 0.0242, "step": 262290 }, { "epoch": 1.69, "learning_rate": 4.6058075217669114e-05, "loss": 0.0278, "step": 262300 }, { "epoch": 1.69, "learning_rate": 4.604839386331218e-05, "loss": 0.0243, "step": 262310 }, { "epoch": 1.69, "learning_rate": 4.6038712508955254e-05, "loss": 0.0265, "step": 262320 }, { "epoch": 1.69, "learning_rate": 4.602903115459832e-05, "loss": 0.0239, "step": 262330 }, { "epoch": 1.69, "learning_rate": 4.601934980024138e-05, "loss": 0.0205, "step": 262340 }, { "epoch": 1.69, "learning_rate": 4.600966844588445e-05, "loss": 0.019, "step": 262350 }, { "epoch": 1.69, "learning_rate": 4.599998709152752e-05, "loss": 0.0271, "step": 262360 }, { "epoch": 1.69, "learning_rate": 4.599030573717059e-05, "loss": 0.0227, "step": 262370 }, { "epoch": 1.69, "learning_rate": 4.598062438281366e-05, "loss": 0.0204, "step": 262380 }, { "epoch": 1.69, "learning_rate": 4.597094302845673e-05, "loss": 0.026, "step": 262390 }, { "epoch": 1.69, "learning_rate": 4.596126167409979e-05, "loss": 0.0242, "step": 262400 }, { "epoch": 1.69, "learning_rate": 4.5951580319742856e-05, "loss": 0.0271, "step": 262410 }, { "epoch": 1.69, "learning_rate": 4.594189896538593e-05, "loss": 0.0277, "step": 262420 }, { "epoch": 1.69, "learning_rate": 4.5932217611028996e-05, "loss": 0.0297, "step": 262430 }, { "epoch": 1.69, "learning_rate": 4.592253625667207e-05, "loss": 0.0233, "step": 262440 }, { "epoch": 1.69, "learning_rate": 4.591285490231513e-05, "loss": 0.0213, "step": 262450 }, { "epoch": 1.69, "learning_rate": 4.59031735479582e-05, "loss": 0.0269, "step": 262460 }, { "epoch": 1.69, "learning_rate": 4.589349219360127e-05, "loss": 0.0266, "step": 262470 }, { "epoch": 1.69, "learning_rate": 4.5883810839244334e-05, "loss": 0.024, "step": 262480 }, { "epoch": 1.69, "learning_rate": 4.587412948488741e-05, "loss": 0.036, "step": 262490 }, { "epoch": 1.69, "learning_rate": 4.5864448130530466e-05, "loss": 0.0239, "step": 262500 }, { "epoch": 1.69, "learning_rate": 4.585476677617354e-05, "loss": 0.022, "step": 262510 }, { "epoch": 1.69, "learning_rate": 4.5845085421816605e-05, "loss": 0.0194, "step": 262520 }, { "epoch": 1.69, "learning_rate": 4.583540406745968e-05, "loss": 0.0249, "step": 262530 }, { "epoch": 1.69, "learning_rate": 4.5825722713102745e-05, "loss": 0.022, "step": 262540 }, { "epoch": 1.69, "learning_rate": 4.5816041358745804e-05, "loss": 0.0263, "step": 262550 }, { "epoch": 1.69, "learning_rate": 4.580636000438888e-05, "loss": 0.0241, "step": 262560 }, { "epoch": 1.69, "learning_rate": 4.579667865003194e-05, "loss": 0.0268, "step": 262570 }, { "epoch": 1.69, "learning_rate": 4.5786997295675016e-05, "loss": 0.029, "step": 262580 }, { "epoch": 1.69, "learning_rate": 4.577731594131808e-05, "loss": 0.0226, "step": 262590 }, { "epoch": 1.69, "learning_rate": 4.576763458696114e-05, "loss": 0.0292, "step": 262600 }, { "epoch": 1.69, "learning_rate": 4.5757953232604215e-05, "loss": 0.0278, "step": 262610 }, { "epoch": 1.7, "learning_rate": 4.574827187824728e-05, "loss": 0.0263, "step": 262620 }, { "epoch": 1.7, "learning_rate": 4.5738590523890354e-05, "loss": 0.0224, "step": 262630 }, { "epoch": 1.7, "learning_rate": 4.572890916953342e-05, "loss": 0.022, "step": 262640 }, { "epoch": 1.7, "learning_rate": 4.571922781517649e-05, "loss": 0.0252, "step": 262650 }, { "epoch": 1.7, "learning_rate": 4.570954646081955e-05, "loss": 0.0262, "step": 262660 }, { "epoch": 1.7, "learning_rate": 4.569986510646262e-05, "loss": 0.0214, "step": 262670 }, { "epoch": 1.7, "learning_rate": 4.569018375210569e-05, "loss": 0.0205, "step": 262680 }, { "epoch": 1.7, "learning_rate": 4.568050239774876e-05, "loss": 0.0263, "step": 262690 }, { "epoch": 1.7, "learning_rate": 4.5670821043391825e-05, "loss": 0.0234, "step": 262700 }, { "epoch": 1.7, "learning_rate": 4.566113968903489e-05, "loss": 0.026, "step": 262710 }, { "epoch": 1.7, "learning_rate": 4.5651458334677964e-05, "loss": 0.0239, "step": 262720 }, { "epoch": 1.7, "learning_rate": 4.564177698032103e-05, "loss": 0.021, "step": 262730 }, { "epoch": 1.7, "learning_rate": 4.5632095625964097e-05, "loss": 0.0267, "step": 262740 }, { "epoch": 1.7, "learning_rate": 4.562241427160716e-05, "loss": 0.0247, "step": 262750 }, { "epoch": 1.7, "learning_rate": 4.561273291725023e-05, "loss": 0.0239, "step": 262760 }, { "epoch": 1.7, "learning_rate": 4.56030515628933e-05, "loss": 0.0233, "step": 262770 }, { "epoch": 1.7, "learning_rate": 4.559337020853637e-05, "loss": 0.0308, "step": 262780 }, { "epoch": 1.7, "learning_rate": 4.558368885417944e-05, "loss": 0.0232, "step": 262790 }, { "epoch": 1.7, "learning_rate": 4.55740074998225e-05, "loss": 0.029, "step": 262800 }, { "epoch": 1.7, "learning_rate": 4.556432614546557e-05, "loss": 0.0323, "step": 262810 }, { "epoch": 1.7, "learning_rate": 4.555464479110864e-05, "loss": 0.0262, "step": 262820 }, { "epoch": 1.7, "learning_rate": 4.5544963436751706e-05, "loss": 0.0236, "step": 262830 }, { "epoch": 1.7, "learning_rate": 4.553528208239478e-05, "loss": 0.0197, "step": 262840 }, { "epoch": 1.7, "learning_rate": 4.552560072803784e-05, "loss": 0.0265, "step": 262850 }, { "epoch": 1.7, "learning_rate": 4.551591937368091e-05, "loss": 0.0235, "step": 262860 }, { "epoch": 1.7, "learning_rate": 4.550623801932398e-05, "loss": 0.0236, "step": 262870 }, { "epoch": 1.7, "learning_rate": 4.5496556664967044e-05, "loss": 0.0209, "step": 262880 }, { "epoch": 1.7, "learning_rate": 4.548687531061012e-05, "loss": 0.0257, "step": 262890 }, { "epoch": 1.7, "learning_rate": 4.547719395625318e-05, "loss": 0.0253, "step": 262900 }, { "epoch": 1.7, "learning_rate": 4.546751260189625e-05, "loss": 0.0265, "step": 262910 }, { "epoch": 1.7, "learning_rate": 4.5457831247539316e-05, "loss": 0.0237, "step": 262920 }, { "epoch": 1.7, "learning_rate": 4.544814989318239e-05, "loss": 0.0254, "step": 262930 }, { "epoch": 1.7, "learning_rate": 4.5438468538825455e-05, "loss": 0.0326, "step": 262940 }, { "epoch": 1.7, "learning_rate": 4.542878718446852e-05, "loss": 0.0304, "step": 262950 }, { "epoch": 1.7, "learning_rate": 4.541910583011159e-05, "loss": 0.0236, "step": 262960 }, { "epoch": 1.7, "learning_rate": 4.5409424475754654e-05, "loss": 0.0271, "step": 262970 }, { "epoch": 1.7, "learning_rate": 4.539974312139773e-05, "loss": 0.0261, "step": 262980 }, { "epoch": 1.7, "learning_rate": 4.539006176704079e-05, "loss": 0.027, "step": 262990 }, { "epoch": 1.7, "learning_rate": 4.5380380412683866e-05, "loss": 0.0221, "step": 263000 }, { "epoch": 1.7, "eval_cer": 0.9198345949610214, "eval_loss": 0.018028145655989647, "eval_runtime": 120.064, "eval_samples_per_second": 16.658, "eval_steps_per_second": 4.164, "step": 263000 }, { "epoch": 1.7, "learning_rate": 4.5370699058326926e-05, "loss": 0.0251, "step": 263010 }, { "epoch": 1.7, "learning_rate": 4.536101770396999e-05, "loss": 0.0274, "step": 263020 }, { "epoch": 1.7, "learning_rate": 4.5351336349613065e-05, "loss": 0.0202, "step": 263030 }, { "epoch": 1.7, "learning_rate": 4.534165499525613e-05, "loss": 0.0232, "step": 263040 }, { "epoch": 1.7, "learning_rate": 4.5331973640899204e-05, "loss": 0.0253, "step": 263050 }, { "epoch": 1.7, "learning_rate": 4.5322292286542264e-05, "loss": 0.0236, "step": 263060 }, { "epoch": 1.7, "learning_rate": 4.531261093218534e-05, "loss": 0.0263, "step": 263070 }, { "epoch": 1.7, "learning_rate": 4.53029295778284e-05, "loss": 0.0239, "step": 263080 }, { "epoch": 1.7, "learning_rate": 4.529324822347147e-05, "loss": 0.0228, "step": 263090 }, { "epoch": 1.7, "learning_rate": 4.528356686911454e-05, "loss": 0.0256, "step": 263100 }, { "epoch": 1.7, "learning_rate": 4.52738855147576e-05, "loss": 0.025, "step": 263110 }, { "epoch": 1.7, "learning_rate": 4.5264204160400675e-05, "loss": 0.027, "step": 263120 }, { "epoch": 1.7, "learning_rate": 4.525452280604374e-05, "loss": 0.0267, "step": 263130 }, { "epoch": 1.7, "learning_rate": 4.5244841451686814e-05, "loss": 0.0283, "step": 263140 }, { "epoch": 1.7, "learning_rate": 4.523516009732988e-05, "loss": 0.0278, "step": 263150 }, { "epoch": 1.7, "learning_rate": 4.522547874297294e-05, "loss": 0.0275, "step": 263160 }, { "epoch": 1.7, "learning_rate": 4.521579738861601e-05, "loss": 0.0202, "step": 263170 }, { "epoch": 1.7, "learning_rate": 4.520611603425908e-05, "loss": 0.0275, "step": 263180 }, { "epoch": 1.7, "learning_rate": 4.519643467990215e-05, "loss": 0.0259, "step": 263190 }, { "epoch": 1.7, "learning_rate": 4.518675332554522e-05, "loss": 0.0273, "step": 263200 }, { "epoch": 1.7, "learning_rate": 4.517707197118829e-05, "loss": 0.0271, "step": 263210 }, { "epoch": 1.7, "learning_rate": 4.516739061683135e-05, "loss": 0.0214, "step": 263220 }, { "epoch": 1.7, "learning_rate": 4.515770926247442e-05, "loss": 0.027, "step": 263230 }, { "epoch": 1.7, "learning_rate": 4.514802790811749e-05, "loss": 0.0262, "step": 263240 }, { "epoch": 1.7, "learning_rate": 4.5138346553760556e-05, "loss": 0.0253, "step": 263250 }, { "epoch": 1.7, "learning_rate": 4.512866519940363e-05, "loss": 0.0201, "step": 263260 }, { "epoch": 1.7, "learning_rate": 4.511898384504669e-05, "loss": 0.0281, "step": 263270 }, { "epoch": 1.7, "learning_rate": 4.510930249068976e-05, "loss": 0.0262, "step": 263280 }, { "epoch": 1.7, "learning_rate": 4.509962113633283e-05, "loss": 0.0228, "step": 263290 }, { "epoch": 1.7, "learning_rate": 4.5089939781975894e-05, "loss": 0.0293, "step": 263300 }, { "epoch": 1.7, "learning_rate": 4.508025842761897e-05, "loss": 0.0234, "step": 263310 }, { "epoch": 1.7, "learning_rate": 4.5070577073262027e-05, "loss": 0.0295, "step": 263320 }, { "epoch": 1.7, "learning_rate": 4.50608957189051e-05, "loss": 0.0273, "step": 263330 }, { "epoch": 1.7, "learning_rate": 4.5051214364548166e-05, "loss": 0.0231, "step": 263340 }, { "epoch": 1.7, "learning_rate": 4.504153301019124e-05, "loss": 0.0236, "step": 263350 }, { "epoch": 1.7, "learning_rate": 4.5031851655834305e-05, "loss": 0.0254, "step": 263360 }, { "epoch": 1.7, "learning_rate": 4.5022170301477364e-05, "loss": 0.0255, "step": 263370 }, { "epoch": 1.7, "learning_rate": 4.501248894712044e-05, "loss": 0.022, "step": 263380 }, { "epoch": 1.7, "learning_rate": 4.5002807592763504e-05, "loss": 0.0267, "step": 263390 }, { "epoch": 1.7, "learning_rate": 4.499312623840658e-05, "loss": 0.0256, "step": 263400 }, { "epoch": 1.7, "learning_rate": 4.498344488404964e-05, "loss": 0.028, "step": 263410 }, { "epoch": 1.7, "learning_rate": 4.4973763529692716e-05, "loss": 0.0282, "step": 263420 }, { "epoch": 1.7, "learning_rate": 4.4964082175335775e-05, "loss": 0.0244, "step": 263430 }, { "epoch": 1.7, "learning_rate": 4.495440082097884e-05, "loss": 0.0263, "step": 263440 }, { "epoch": 1.7, "learning_rate": 4.4944719466621915e-05, "loss": 0.0243, "step": 263450 }, { "epoch": 1.7, "learning_rate": 4.493503811226498e-05, "loss": 0.024, "step": 263460 }, { "epoch": 1.7, "learning_rate": 4.4925356757908054e-05, "loss": 0.0237, "step": 263470 }, { "epoch": 1.7, "learning_rate": 4.4915675403551113e-05, "loss": 0.0261, "step": 263480 }, { "epoch": 1.7, "learning_rate": 4.4905994049194186e-05, "loss": 0.0316, "step": 263490 }, { "epoch": 1.7, "learning_rate": 4.489631269483725e-05, "loss": 0.0239, "step": 263500 }, { "epoch": 1.7, "learning_rate": 4.488663134048032e-05, "loss": 0.0214, "step": 263510 }, { "epoch": 1.7, "learning_rate": 4.487694998612339e-05, "loss": 0.0223, "step": 263520 }, { "epoch": 1.7, "learning_rate": 4.486726863176645e-05, "loss": 0.0248, "step": 263530 }, { "epoch": 1.7, "learning_rate": 4.4857587277409524e-05, "loss": 0.0253, "step": 263540 }, { "epoch": 1.7, "learning_rate": 4.484790592305259e-05, "loss": 0.0244, "step": 263550 }, { "epoch": 1.7, "learning_rate": 4.4838224568695664e-05, "loss": 0.026, "step": 263560 }, { "epoch": 1.7, "learning_rate": 4.482854321433873e-05, "loss": 0.0229, "step": 263570 }, { "epoch": 1.7, "learning_rate": 4.481886185998179e-05, "loss": 0.0211, "step": 263580 }, { "epoch": 1.7, "learning_rate": 4.480918050562486e-05, "loss": 0.0245, "step": 263590 }, { "epoch": 1.7, "learning_rate": 4.479949915126793e-05, "loss": 0.0215, "step": 263600 }, { "epoch": 1.7, "learning_rate": 4.4789817796911e-05, "loss": 0.0235, "step": 263610 }, { "epoch": 1.7, "learning_rate": 4.478013644255407e-05, "loss": 0.0251, "step": 263620 }, { "epoch": 1.7, "learning_rate": 4.477045508819714e-05, "loss": 0.0297, "step": 263630 }, { "epoch": 1.7, "learning_rate": 4.47607737338402e-05, "loss": 0.0249, "step": 263640 }, { "epoch": 1.7, "learning_rate": 4.4751092379483267e-05, "loss": 0.0305, "step": 263650 }, { "epoch": 1.7, "learning_rate": 4.474141102512634e-05, "loss": 0.0243, "step": 263660 }, { "epoch": 1.7, "learning_rate": 4.4731729670769406e-05, "loss": 0.0225, "step": 263670 }, { "epoch": 1.7, "learning_rate": 4.472204831641248e-05, "loss": 0.0205, "step": 263680 }, { "epoch": 1.7, "learning_rate": 4.471236696205554e-05, "loss": 0.0315, "step": 263690 }, { "epoch": 1.7, "learning_rate": 4.470268560769861e-05, "loss": 0.0242, "step": 263700 }, { "epoch": 1.7, "learning_rate": 4.469300425334168e-05, "loss": 0.0213, "step": 263710 }, { "epoch": 1.7, "learning_rate": 4.4683322898984744e-05, "loss": 0.0243, "step": 263720 }, { "epoch": 1.7, "learning_rate": 4.467364154462782e-05, "loss": 0.0212, "step": 263730 }, { "epoch": 1.7, "learning_rate": 4.4663960190270876e-05, "loss": 0.0268, "step": 263740 }, { "epoch": 1.7, "learning_rate": 4.465427883591395e-05, "loss": 0.023, "step": 263750 }, { "epoch": 1.7, "learning_rate": 4.4644597481557016e-05, "loss": 0.0248, "step": 263760 }, { "epoch": 1.7, "learning_rate": 4.463491612720009e-05, "loss": 0.0237, "step": 263770 }, { "epoch": 1.7, "learning_rate": 4.4625234772843155e-05, "loss": 0.0257, "step": 263780 }, { "epoch": 1.7, "learning_rate": 4.4615553418486214e-05, "loss": 0.0209, "step": 263790 }, { "epoch": 1.7, "learning_rate": 4.460587206412929e-05, "loss": 0.0283, "step": 263800 }, { "epoch": 1.7, "learning_rate": 4.4596190709772354e-05, "loss": 0.0213, "step": 263810 }, { "epoch": 1.7, "learning_rate": 4.4586509355415427e-05, "loss": 0.0241, "step": 263820 }, { "epoch": 1.7, "learning_rate": 4.457682800105849e-05, "loss": 0.0241, "step": 263830 }, { "epoch": 1.7, "learning_rate": 4.4567146646701566e-05, "loss": 0.0247, "step": 263840 }, { "epoch": 1.7, "learning_rate": 4.4557465292344625e-05, "loss": 0.0199, "step": 263850 }, { "epoch": 1.7, "learning_rate": 4.454778393798769e-05, "loss": 0.0223, "step": 263860 }, { "epoch": 1.7, "learning_rate": 4.4538102583630765e-05, "loss": 0.0197, "step": 263870 }, { "epoch": 1.7, "learning_rate": 4.452842122927383e-05, "loss": 0.0223, "step": 263880 }, { "epoch": 1.7, "learning_rate": 4.4518739874916904e-05, "loss": 0.0225, "step": 263890 }, { "epoch": 1.7, "learning_rate": 4.450905852055996e-05, "loss": 0.0207, "step": 263900 }, { "epoch": 1.7, "learning_rate": 4.4499377166203036e-05, "loss": 0.0226, "step": 263910 }, { "epoch": 1.7, "learning_rate": 4.44896958118461e-05, "loss": 0.0219, "step": 263920 }, { "epoch": 1.7, "learning_rate": 4.448001445748917e-05, "loss": 0.0193, "step": 263930 }, { "epoch": 1.7, "learning_rate": 4.447033310313224e-05, "loss": 0.0266, "step": 263940 }, { "epoch": 1.7, "learning_rate": 4.44606517487753e-05, "loss": 0.0194, "step": 263950 }, { "epoch": 1.7, "learning_rate": 4.4450970394418374e-05, "loss": 0.0268, "step": 263960 }, { "epoch": 1.7, "learning_rate": 4.444128904006144e-05, "loss": 0.0301, "step": 263970 }, { "epoch": 1.7, "learning_rate": 4.4431607685704513e-05, "loss": 0.0208, "step": 263980 }, { "epoch": 1.7, "learning_rate": 4.442192633134758e-05, "loss": 0.0207, "step": 263990 }, { "epoch": 1.7, "learning_rate": 4.441224497699064e-05, "loss": 0.0228, "step": 264000 }, { "epoch": 1.7, "eval_cer": 0.9198797875946221, "eval_loss": 0.01815461367368698, "eval_runtime": 120.0874, "eval_samples_per_second": 16.655, "eval_steps_per_second": 4.164, "step": 264000 }, { "epoch": 1.7, "learning_rate": 4.440256362263371e-05, "loss": 0.024, "step": 264010 }, { "epoch": 1.7, "learning_rate": 4.439288226827678e-05, "loss": 0.0251, "step": 264020 }, { "epoch": 1.7, "learning_rate": 4.438320091391985e-05, "loss": 0.0223, "step": 264030 }, { "epoch": 1.7, "learning_rate": 4.437351955956292e-05, "loss": 0.0225, "step": 264040 }, { "epoch": 1.7, "learning_rate": 4.4363838205205984e-05, "loss": 0.025, "step": 264050 }, { "epoch": 1.7, "learning_rate": 4.435415685084905e-05, "loss": 0.0219, "step": 264060 }, { "epoch": 1.7, "learning_rate": 4.4344475496492116e-05, "loss": 0.0256, "step": 264070 }, { "epoch": 1.7, "learning_rate": 4.433479414213519e-05, "loss": 0.0216, "step": 264080 }, { "epoch": 1.7, "learning_rate": 4.4325112787778256e-05, "loss": 0.0231, "step": 264090 }, { "epoch": 1.7, "learning_rate": 4.431543143342132e-05, "loss": 0.0198, "step": 264100 }, { "epoch": 1.7, "learning_rate": 4.430575007906439e-05, "loss": 0.0195, "step": 264110 }, { "epoch": 1.7, "learning_rate": 4.429606872470746e-05, "loss": 0.0259, "step": 264120 }, { "epoch": 1.7, "learning_rate": 4.428638737035053e-05, "loss": 0.024, "step": 264130 }, { "epoch": 1.7, "learning_rate": 4.4276706015993594e-05, "loss": 0.0262, "step": 264140 }, { "epoch": 1.7, "learning_rate": 4.426702466163666e-05, "loss": 0.022, "step": 264150 }, { "epoch": 1.7, "learning_rate": 4.4257343307279726e-05, "loss": 0.0241, "step": 264160 }, { "epoch": 1.71, "learning_rate": 4.42476619529228e-05, "loss": 0.0208, "step": 264170 }, { "epoch": 1.71, "learning_rate": 4.4237980598565865e-05, "loss": 0.0248, "step": 264180 }, { "epoch": 1.71, "learning_rate": 4.422829924420894e-05, "loss": 0.0246, "step": 264190 }, { "epoch": 1.71, "learning_rate": 4.4218617889852e-05, "loss": 0.0293, "step": 264200 }, { "epoch": 1.71, "learning_rate": 4.4208936535495064e-05, "loss": 0.0271, "step": 264210 }, { "epoch": 1.71, "learning_rate": 4.419925518113814e-05, "loss": 0.0206, "step": 264220 }, { "epoch": 1.71, "learning_rate": 4.41895738267812e-05, "loss": 0.0246, "step": 264230 }, { "epoch": 1.71, "learning_rate": 4.4179892472424276e-05, "loss": 0.0264, "step": 264240 }, { "epoch": 1.71, "learning_rate": 4.4170211118067336e-05, "loss": 0.022, "step": 264250 }, { "epoch": 1.71, "learning_rate": 4.41605297637104e-05, "loss": 0.0266, "step": 264260 }, { "epoch": 1.71, "learning_rate": 4.4150848409353475e-05, "loss": 0.025, "step": 264270 }, { "epoch": 1.71, "learning_rate": 4.414116705499654e-05, "loss": 0.0262, "step": 264280 }, { "epoch": 1.71, "learning_rate": 4.4131485700639614e-05, "loss": 0.0256, "step": 264290 }, { "epoch": 1.71, "learning_rate": 4.4121804346282674e-05, "loss": 0.0241, "step": 264300 }, { "epoch": 1.71, "learning_rate": 4.411212299192575e-05, "loss": 0.0264, "step": 264310 }, { "epoch": 1.71, "learning_rate": 4.410244163756881e-05, "loss": 0.0257, "step": 264320 }, { "epoch": 1.71, "learning_rate": 4.409276028321188e-05, "loss": 0.0235, "step": 264330 }, { "epoch": 1.71, "learning_rate": 4.408307892885495e-05, "loss": 0.0249, "step": 264340 }, { "epoch": 1.71, "learning_rate": 4.407339757449801e-05, "loss": 0.0226, "step": 264350 }, { "epoch": 1.71, "learning_rate": 4.4063716220141085e-05, "loss": 0.0245, "step": 264360 }, { "epoch": 1.71, "learning_rate": 4.405403486578415e-05, "loss": 0.0294, "step": 264370 }, { "epoch": 1.71, "learning_rate": 4.4044353511427224e-05, "loss": 0.0229, "step": 264380 }, { "epoch": 1.71, "learning_rate": 4.403467215707029e-05, "loss": 0.0252, "step": 264390 }, { "epoch": 1.71, "learning_rate": 4.402499080271335e-05, "loss": 0.025, "step": 264400 }, { "epoch": 1.71, "learning_rate": 4.401530944835642e-05, "loss": 0.0246, "step": 264410 }, { "epoch": 1.71, "learning_rate": 4.400562809399949e-05, "loss": 0.0235, "step": 264420 }, { "epoch": 1.71, "learning_rate": 4.399594673964256e-05, "loss": 0.0261, "step": 264430 }, { "epoch": 1.71, "learning_rate": 4.398626538528563e-05, "loss": 0.0275, "step": 264440 }, { "epoch": 1.71, "learning_rate": 4.39765840309287e-05, "loss": 0.0247, "step": 264450 }, { "epoch": 1.71, "learning_rate": 4.396690267657176e-05, "loss": 0.0229, "step": 264460 }, { "epoch": 1.71, "learning_rate": 4.395722132221483e-05, "loss": 0.0245, "step": 264470 }, { "epoch": 1.71, "learning_rate": 4.39475399678579e-05, "loss": 0.024, "step": 264480 }, { "epoch": 1.71, "learning_rate": 4.3937858613500966e-05, "loss": 0.0251, "step": 264490 }, { "epoch": 1.71, "learning_rate": 4.392817725914404e-05, "loss": 0.0235, "step": 264500 }, { "epoch": 1.71, "learning_rate": 4.39184959047871e-05, "loss": 0.023, "step": 264510 }, { "epoch": 1.71, "learning_rate": 4.390881455043017e-05, "loss": 0.0233, "step": 264520 }, { "epoch": 1.71, "learning_rate": 4.389913319607324e-05, "loss": 0.026, "step": 264530 }, { "epoch": 1.71, "learning_rate": 4.3889451841716304e-05, "loss": 0.0195, "step": 264540 }, { "epoch": 1.71, "learning_rate": 4.387977048735938e-05, "loss": 0.0224, "step": 264550 }, { "epoch": 1.71, "learning_rate": 4.387008913300244e-05, "loss": 0.0276, "step": 264560 }, { "epoch": 1.71, "learning_rate": 4.386040777864551e-05, "loss": 0.0199, "step": 264570 }, { "epoch": 1.71, "learning_rate": 4.3850726424288576e-05, "loss": 0.0247, "step": 264580 }, { "epoch": 1.71, "learning_rate": 4.384104506993165e-05, "loss": 0.0244, "step": 264590 }, { "epoch": 1.71, "learning_rate": 4.3831363715574715e-05, "loss": 0.0253, "step": 264600 }, { "epoch": 1.71, "learning_rate": 4.3821682361217775e-05, "loss": 0.0218, "step": 264610 }, { "epoch": 1.71, "learning_rate": 4.381200100686085e-05, "loss": 0.0231, "step": 264620 }, { "epoch": 1.71, "learning_rate": 4.3802319652503914e-05, "loss": 0.0281, "step": 264630 }, { "epoch": 1.71, "learning_rate": 4.379263829814699e-05, "loss": 0.0254, "step": 264640 }, { "epoch": 1.71, "learning_rate": 4.378295694379005e-05, "loss": 0.022, "step": 264650 }, { "epoch": 1.71, "learning_rate": 4.3773275589433126e-05, "loss": 0.028, "step": 264660 }, { "epoch": 1.71, "learning_rate": 4.3763594235076186e-05, "loss": 0.0219, "step": 264670 }, { "epoch": 1.71, "learning_rate": 4.375391288071925e-05, "loss": 0.025, "step": 264680 }, { "epoch": 1.71, "learning_rate": 4.3744231526362325e-05, "loss": 0.0285, "step": 264690 }, { "epoch": 1.71, "learning_rate": 4.373455017200539e-05, "loss": 0.023, "step": 264700 }, { "epoch": 1.71, "learning_rate": 4.3724868817648464e-05, "loss": 0.0234, "step": 264710 }, { "epoch": 1.71, "learning_rate": 4.3715187463291524e-05, "loss": 0.0245, "step": 264720 }, { "epoch": 1.71, "learning_rate": 4.37055061089346e-05, "loss": 0.0213, "step": 264730 }, { "epoch": 1.71, "learning_rate": 4.369582475457766e-05, "loss": 0.0228, "step": 264740 }, { "epoch": 1.71, "learning_rate": 4.368614340022073e-05, "loss": 0.0252, "step": 264750 }, { "epoch": 1.71, "learning_rate": 4.36764620458638e-05, "loss": 0.0201, "step": 264760 }, { "epoch": 1.71, "learning_rate": 4.366678069150686e-05, "loss": 0.0198, "step": 264770 }, { "epoch": 1.71, "learning_rate": 4.3657099337149935e-05, "loss": 0.028, "step": 264780 }, { "epoch": 1.71, "learning_rate": 4.3647417982793e-05, "loss": 0.0224, "step": 264790 }, { "epoch": 1.71, "learning_rate": 4.3637736628436074e-05, "loss": 0.0264, "step": 264800 }, { "epoch": 1.71, "learning_rate": 4.362805527407914e-05, "loss": 0.0201, "step": 264810 }, { "epoch": 1.71, "learning_rate": 4.36183739197222e-05, "loss": 0.0208, "step": 264820 }, { "epoch": 1.71, "learning_rate": 4.360869256536527e-05, "loss": 0.0259, "step": 264830 }, { "epoch": 1.71, "learning_rate": 4.359901121100834e-05, "loss": 0.0214, "step": 264840 }, { "epoch": 1.71, "learning_rate": 4.358932985665141e-05, "loss": 0.0228, "step": 264850 }, { "epoch": 1.71, "learning_rate": 4.357964850229448e-05, "loss": 0.0249, "step": 264860 }, { "epoch": 1.71, "learning_rate": 4.356996714793755e-05, "loss": 0.0225, "step": 264870 }, { "epoch": 1.71, "learning_rate": 4.356028579358061e-05, "loss": 0.0281, "step": 264880 }, { "epoch": 1.71, "learning_rate": 4.355060443922368e-05, "loss": 0.0195, "step": 264890 }, { "epoch": 1.71, "learning_rate": 4.354092308486675e-05, "loss": 0.0258, "step": 264900 }, { "epoch": 1.71, "learning_rate": 4.3531241730509816e-05, "loss": 0.0251, "step": 264910 }, { "epoch": 1.71, "learning_rate": 4.352156037615289e-05, "loss": 0.0218, "step": 264920 }, { "epoch": 1.71, "learning_rate": 4.351187902179595e-05, "loss": 0.025, "step": 264930 }, { "epoch": 1.71, "learning_rate": 4.350219766743902e-05, "loss": 0.0327, "step": 264940 }, { "epoch": 1.71, "learning_rate": 4.349251631308209e-05, "loss": 0.0228, "step": 264950 }, { "epoch": 1.71, "learning_rate": 4.3482834958725154e-05, "loss": 0.0219, "step": 264960 }, { "epoch": 1.71, "learning_rate": 4.347315360436823e-05, "loss": 0.0227, "step": 264970 }, { "epoch": 1.71, "learning_rate": 4.3463472250011286e-05, "loss": 0.0253, "step": 264980 }, { "epoch": 1.71, "learning_rate": 4.345379089565436e-05, "loss": 0.0188, "step": 264990 }, { "epoch": 1.71, "learning_rate": 4.3444109541297426e-05, "loss": 0.0209, "step": 265000 }, { "epoch": 1.71, "eval_cer": 0.9198490566037736, "eval_loss": 0.01810065098106861, "eval_runtime": 120.1229, "eval_samples_per_second": 16.65, "eval_steps_per_second": 4.162, "step": 265000 }, { "epoch": 1.71, "learning_rate": 4.34344281869405e-05, "loss": 0.0271, "step": 265010 }, { "epoch": 1.71, "learning_rate": 4.3424746832583565e-05, "loss": 0.0219, "step": 265020 }, { "epoch": 1.71, "learning_rate": 4.3415065478226624e-05, "loss": 0.023, "step": 265030 }, { "epoch": 1.71, "learning_rate": 4.34053841238697e-05, "loss": 0.025, "step": 265040 }, { "epoch": 1.71, "learning_rate": 4.3395702769512764e-05, "loss": 0.0251, "step": 265050 }, { "epoch": 1.71, "learning_rate": 4.338602141515584e-05, "loss": 0.0246, "step": 265060 }, { "epoch": 1.71, "learning_rate": 4.33763400607989e-05, "loss": 0.0183, "step": 265070 }, { "epoch": 1.71, "learning_rate": 4.3366658706441976e-05, "loss": 0.0234, "step": 265080 }, { "epoch": 1.71, "learning_rate": 4.3356977352085035e-05, "loss": 0.0269, "step": 265090 }, { "epoch": 1.71, "learning_rate": 4.33472959977281e-05, "loss": 0.0266, "step": 265100 }, { "epoch": 1.71, "learning_rate": 4.3337614643371175e-05, "loss": 0.0239, "step": 265110 }, { "epoch": 1.71, "learning_rate": 4.332793328901424e-05, "loss": 0.0254, "step": 265120 }, { "epoch": 1.71, "learning_rate": 4.3318251934657314e-05, "loss": 0.025, "step": 265130 }, { "epoch": 1.71, "learning_rate": 4.3308570580300373e-05, "loss": 0.0273, "step": 265140 }, { "epoch": 1.71, "learning_rate": 4.3298889225943446e-05, "loss": 0.0241, "step": 265150 }, { "epoch": 1.71, "learning_rate": 4.328920787158651e-05, "loss": 0.0256, "step": 265160 }, { "epoch": 1.71, "learning_rate": 4.327952651722958e-05, "loss": 0.0199, "step": 265170 }, { "epoch": 1.71, "learning_rate": 4.326984516287265e-05, "loss": 0.0198, "step": 265180 }, { "epoch": 1.71, "learning_rate": 4.326016380851571e-05, "loss": 0.026, "step": 265190 }, { "epoch": 1.71, "learning_rate": 4.3250482454158784e-05, "loss": 0.0249, "step": 265200 }, { "epoch": 1.71, "learning_rate": 4.324080109980185e-05, "loss": 0.0226, "step": 265210 }, { "epoch": 1.71, "learning_rate": 4.3231119745444924e-05, "loss": 0.0243, "step": 265220 }, { "epoch": 1.71, "learning_rate": 4.322143839108799e-05, "loss": 0.0259, "step": 265230 }, { "epoch": 1.71, "learning_rate": 4.321175703673105e-05, "loss": 0.0205, "step": 265240 }, { "epoch": 1.71, "learning_rate": 4.320207568237412e-05, "loss": 0.0208, "step": 265250 }, { "epoch": 1.71, "learning_rate": 4.319239432801719e-05, "loss": 0.0211, "step": 265260 }, { "epoch": 1.71, "learning_rate": 4.318271297366026e-05, "loss": 0.0222, "step": 265270 }, { "epoch": 1.71, "learning_rate": 4.317303161930333e-05, "loss": 0.0235, "step": 265280 }, { "epoch": 1.71, "learning_rate": 4.3163350264946394e-05, "loss": 0.0245, "step": 265290 }, { "epoch": 1.71, "learning_rate": 4.315366891058946e-05, "loss": 0.0261, "step": 265300 }, { "epoch": 1.71, "learning_rate": 4.3143987556232527e-05, "loss": 0.0222, "step": 265310 }, { "epoch": 1.71, "learning_rate": 4.31343062018756e-05, "loss": 0.0271, "step": 265320 }, { "epoch": 1.71, "learning_rate": 4.3124624847518666e-05, "loss": 0.0281, "step": 265330 }, { "epoch": 1.71, "learning_rate": 4.311494349316174e-05, "loss": 0.0247, "step": 265340 }, { "epoch": 1.71, "learning_rate": 4.31052621388048e-05, "loss": 0.0238, "step": 265350 }, { "epoch": 1.71, "learning_rate": 4.309558078444787e-05, "loss": 0.0272, "step": 265360 }, { "epoch": 1.71, "learning_rate": 4.308589943009094e-05, "loss": 0.0272, "step": 265370 }, { "epoch": 1.71, "learning_rate": 4.3076218075734004e-05, "loss": 0.0248, "step": 265380 }, { "epoch": 1.71, "learning_rate": 4.306653672137708e-05, "loss": 0.0204, "step": 265390 }, { "epoch": 1.71, "learning_rate": 4.3056855367020136e-05, "loss": 0.0207, "step": 265400 }, { "epoch": 1.71, "learning_rate": 4.304717401266321e-05, "loss": 0.0212, "step": 265410 }, { "epoch": 1.71, "learning_rate": 4.3037492658306276e-05, "loss": 0.0251, "step": 265420 }, { "epoch": 1.71, "learning_rate": 4.302781130394935e-05, "loss": 0.0241, "step": 265430 }, { "epoch": 1.71, "learning_rate": 4.3018129949592415e-05, "loss": 0.0238, "step": 265440 }, { "epoch": 1.71, "learning_rate": 4.3008448595235474e-05, "loss": 0.0271, "step": 265450 }, { "epoch": 1.71, "learning_rate": 4.299876724087855e-05, "loss": 0.0235, "step": 265460 }, { "epoch": 1.71, "learning_rate": 4.2989085886521614e-05, "loss": 0.027, "step": 265470 }, { "epoch": 1.71, "learning_rate": 4.2979404532164687e-05, "loss": 0.0228, "step": 265480 }, { "epoch": 1.71, "learning_rate": 4.296972317780775e-05, "loss": 0.0252, "step": 265490 }, { "epoch": 1.71, "learning_rate": 4.296004182345082e-05, "loss": 0.0174, "step": 265500 }, { "epoch": 1.71, "learning_rate": 4.2950360469093885e-05, "loss": 0.0243, "step": 265510 }, { "epoch": 1.71, "learning_rate": 4.294067911473695e-05, "loss": 0.026, "step": 265520 }, { "epoch": 1.71, "learning_rate": 4.2930997760380024e-05, "loss": 0.0272, "step": 265530 }, { "epoch": 1.71, "learning_rate": 4.292131640602309e-05, "loss": 0.0251, "step": 265540 }, { "epoch": 1.71, "learning_rate": 4.291163505166616e-05, "loss": 0.0284, "step": 265550 }, { "epoch": 1.71, "learning_rate": 4.290195369730922e-05, "loss": 0.0254, "step": 265560 }, { "epoch": 1.71, "learning_rate": 4.2892272342952296e-05, "loss": 0.0261, "step": 265570 }, { "epoch": 1.71, "learning_rate": 4.288259098859536e-05, "loss": 0.0231, "step": 265580 }, { "epoch": 1.71, "learning_rate": 4.287290963423843e-05, "loss": 0.0232, "step": 265590 }, { "epoch": 1.71, "learning_rate": 4.2863228279881495e-05, "loss": 0.0235, "step": 265600 }, { "epoch": 1.71, "learning_rate": 4.285354692552456e-05, "loss": 0.0237, "step": 265610 }, { "epoch": 1.71, "learning_rate": 4.2843865571167634e-05, "loss": 0.0233, "step": 265620 }, { "epoch": 1.71, "learning_rate": 4.28341842168107e-05, "loss": 0.0207, "step": 265630 }, { "epoch": 1.71, "learning_rate": 4.2824502862453773e-05, "loss": 0.0247, "step": 265640 }, { "epoch": 1.71, "learning_rate": 4.281482150809683e-05, "loss": 0.0234, "step": 265650 }, { "epoch": 1.71, "learning_rate": 4.28051401537399e-05, "loss": 0.0273, "step": 265660 }, { "epoch": 1.71, "learning_rate": 4.279545879938297e-05, "loss": 0.0263, "step": 265670 }, { "epoch": 1.71, "learning_rate": 4.278577744502604e-05, "loss": 0.0248, "step": 265680 }, { "epoch": 1.71, "learning_rate": 4.277609609066911e-05, "loss": 0.0234, "step": 265690 }, { "epoch": 1.71, "learning_rate": 4.276641473631217e-05, "loss": 0.0238, "step": 265700 }, { "epoch": 1.71, "learning_rate": 4.2756733381955244e-05, "loss": 0.0286, "step": 265710 }, { "epoch": 1.72, "learning_rate": 4.274705202759831e-05, "loss": 0.0235, "step": 265720 }, { "epoch": 1.72, "learning_rate": 4.2737370673241376e-05, "loss": 0.0238, "step": 265730 }, { "epoch": 1.72, "learning_rate": 4.272768931888445e-05, "loss": 0.0257, "step": 265740 }, { "epoch": 1.72, "learning_rate": 4.271800796452751e-05, "loss": 0.0241, "step": 265750 }, { "epoch": 1.72, "learning_rate": 4.270832661017058e-05, "loss": 0.0276, "step": 265760 }, { "epoch": 1.72, "learning_rate": 4.269864525581365e-05, "loss": 0.0194, "step": 265770 }, { "epoch": 1.72, "learning_rate": 4.268896390145672e-05, "loss": 0.0268, "step": 265780 }, { "epoch": 1.72, "learning_rate": 4.267928254709979e-05, "loss": 0.0219, "step": 265790 }, { "epoch": 1.72, "learning_rate": 4.266960119274285e-05, "loss": 0.0293, "step": 265800 }, { "epoch": 1.72, "learning_rate": 4.265991983838592e-05, "loss": 0.0242, "step": 265810 }, { "epoch": 1.72, "learning_rate": 4.2650238484028986e-05, "loss": 0.0246, "step": 265820 }, { "epoch": 1.72, "learning_rate": 4.264055712967206e-05, "loss": 0.0275, "step": 265830 }, { "epoch": 1.72, "learning_rate": 4.2630875775315125e-05, "loss": 0.0199, "step": 265840 }, { "epoch": 1.72, "learning_rate": 4.26211944209582e-05, "loss": 0.0236, "step": 265850 }, { "epoch": 1.72, "learning_rate": 4.261151306660126e-05, "loss": 0.0238, "step": 265860 }, { "epoch": 1.72, "learning_rate": 4.2601831712244324e-05, "loss": 0.0273, "step": 265870 }, { "epoch": 1.72, "learning_rate": 4.25921503578874e-05, "loss": 0.0211, "step": 265880 }, { "epoch": 1.72, "learning_rate": 4.258246900353046e-05, "loss": 0.0241, "step": 265890 }, { "epoch": 1.72, "learning_rate": 4.2572787649173536e-05, "loss": 0.0206, "step": 265900 }, { "epoch": 1.72, "learning_rate": 4.2563106294816596e-05, "loss": 0.0206, "step": 265910 }, { "epoch": 1.72, "learning_rate": 4.255342494045967e-05, "loss": 0.0258, "step": 265920 }, { "epoch": 1.72, "learning_rate": 4.2543743586102735e-05, "loss": 0.025, "step": 265930 }, { "epoch": 1.72, "learning_rate": 4.25340622317458e-05, "loss": 0.0268, "step": 265940 }, { "epoch": 1.72, "learning_rate": 4.2524380877388874e-05, "loss": 0.0293, "step": 265950 }, { "epoch": 1.72, "learning_rate": 4.2514699523031934e-05, "loss": 0.0286, "step": 265960 }, { "epoch": 1.72, "learning_rate": 4.250501816867501e-05, "loss": 0.0275, "step": 265970 }, { "epoch": 1.72, "learning_rate": 4.249533681431807e-05, "loss": 0.0213, "step": 265980 }, { "epoch": 1.72, "learning_rate": 4.248565545996114e-05, "loss": 0.0307, "step": 265990 }, { "epoch": 1.72, "learning_rate": 4.247597410560421e-05, "loss": 0.0319, "step": 266000 }, { "epoch": 1.72, "eval_cer": 0.9198671336572138, "eval_loss": 0.01788017526268959, "eval_runtime": 120.022, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 266000 }, { "epoch": 1.72, "learning_rate": 4.246629275124727e-05, "loss": 0.025, "step": 266010 }, { "epoch": 1.72, "learning_rate": 4.2456611396890345e-05, "loss": 0.0276, "step": 266020 }, { "epoch": 1.72, "learning_rate": 4.244693004253341e-05, "loss": 0.0299, "step": 266030 }, { "epoch": 1.72, "learning_rate": 4.2437248688176484e-05, "loss": 0.0197, "step": 266040 }, { "epoch": 1.72, "learning_rate": 4.242756733381955e-05, "loss": 0.0212, "step": 266050 }, { "epoch": 1.72, "learning_rate": 4.241788597946261e-05, "loss": 0.0202, "step": 266060 }, { "epoch": 1.72, "learning_rate": 4.240820462510568e-05, "loss": 0.0237, "step": 266070 }, { "epoch": 1.72, "learning_rate": 4.239852327074875e-05, "loss": 0.0237, "step": 266080 }, { "epoch": 1.72, "learning_rate": 4.238884191639182e-05, "loss": 0.0236, "step": 266090 }, { "epoch": 1.72, "learning_rate": 4.237916056203489e-05, "loss": 0.0239, "step": 266100 }, { "epoch": 1.72, "learning_rate": 4.236947920767796e-05, "loss": 0.0193, "step": 266110 }, { "epoch": 1.72, "learning_rate": 4.235979785332102e-05, "loss": 0.0256, "step": 266120 }, { "epoch": 1.72, "learning_rate": 4.235011649896409e-05, "loss": 0.0228, "step": 266130 }, { "epoch": 1.72, "learning_rate": 4.234043514460716e-05, "loss": 0.0202, "step": 266140 }, { "epoch": 1.72, "learning_rate": 4.2330753790250226e-05, "loss": 0.0293, "step": 266150 }, { "epoch": 1.72, "learning_rate": 4.23210724358933e-05, "loss": 0.0173, "step": 266160 }, { "epoch": 1.72, "learning_rate": 4.231139108153636e-05, "loss": 0.0216, "step": 266170 }, { "epoch": 1.72, "learning_rate": 4.230170972717943e-05, "loss": 0.0269, "step": 266180 }, { "epoch": 1.72, "learning_rate": 4.22920283728225e-05, "loss": 0.02, "step": 266190 }, { "epoch": 1.72, "learning_rate": 4.2282347018465564e-05, "loss": 0.0228, "step": 266200 }, { "epoch": 1.72, "learning_rate": 4.227266566410864e-05, "loss": 0.0227, "step": 266210 }, { "epoch": 1.72, "learning_rate": 4.22629843097517e-05, "loss": 0.0233, "step": 266220 }, { "epoch": 1.72, "learning_rate": 4.225330295539477e-05, "loss": 0.0232, "step": 266230 }, { "epoch": 1.72, "learning_rate": 4.2243621601037836e-05, "loss": 0.0295, "step": 266240 }, { "epoch": 1.72, "learning_rate": 4.223394024668091e-05, "loss": 0.0213, "step": 266250 }, { "epoch": 1.72, "learning_rate": 4.2224258892323975e-05, "loss": 0.0251, "step": 266260 }, { "epoch": 1.72, "learning_rate": 4.2214577537967035e-05, "loss": 0.0215, "step": 266270 }, { "epoch": 1.72, "learning_rate": 4.220489618361011e-05, "loss": 0.0239, "step": 266280 }, { "epoch": 1.72, "learning_rate": 4.2195214829253174e-05, "loss": 0.0237, "step": 266290 }, { "epoch": 1.72, "learning_rate": 4.218553347489625e-05, "loss": 0.0194, "step": 266300 }, { "epoch": 1.72, "learning_rate": 4.217585212053931e-05, "loss": 0.0237, "step": 266310 }, { "epoch": 1.72, "learning_rate": 4.2166170766182386e-05, "loss": 0.0213, "step": 266320 }, { "epoch": 1.72, "learning_rate": 4.2156489411825446e-05, "loss": 0.0227, "step": 266330 }, { "epoch": 1.72, "learning_rate": 4.214680805746851e-05, "loss": 0.0251, "step": 266340 }, { "epoch": 1.72, "learning_rate": 4.2137126703111585e-05, "loss": 0.0302, "step": 266350 }, { "epoch": 1.72, "learning_rate": 4.212744534875465e-05, "loss": 0.0219, "step": 266360 }, { "epoch": 1.72, "learning_rate": 4.2117763994397724e-05, "loss": 0.0209, "step": 266370 }, { "epoch": 1.72, "learning_rate": 4.2108082640040784e-05, "loss": 0.0273, "step": 266380 }, { "epoch": 1.72, "learning_rate": 4.2098401285683857e-05, "loss": 0.0282, "step": 266390 }, { "epoch": 1.72, "learning_rate": 4.208871993132692e-05, "loss": 0.027, "step": 266400 }, { "epoch": 1.72, "learning_rate": 4.207903857696999e-05, "loss": 0.0287, "step": 266410 }, { "epoch": 1.72, "learning_rate": 4.206935722261306e-05, "loss": 0.0242, "step": 266420 }, { "epoch": 1.72, "learning_rate": 4.205967586825612e-05, "loss": 0.0252, "step": 266430 }, { "epoch": 1.72, "learning_rate": 4.2049994513899195e-05, "loss": 0.0223, "step": 266440 }, { "epoch": 1.72, "learning_rate": 4.204031315954226e-05, "loss": 0.0261, "step": 266450 }, { "epoch": 1.72, "learning_rate": 4.2030631805185334e-05, "loss": 0.0336, "step": 266460 }, { "epoch": 1.72, "learning_rate": 4.20209504508284e-05, "loss": 0.0217, "step": 266470 }, { "epoch": 1.72, "learning_rate": 4.201126909647146e-05, "loss": 0.0231, "step": 266480 }, { "epoch": 1.72, "learning_rate": 4.200158774211453e-05, "loss": 0.0284, "step": 266490 }, { "epoch": 1.72, "learning_rate": 4.19919063877576e-05, "loss": 0.0275, "step": 266500 }, { "epoch": 1.72, "learning_rate": 4.198222503340067e-05, "loss": 0.0247, "step": 266510 }, { "epoch": 1.72, "learning_rate": 4.197254367904374e-05, "loss": 0.0232, "step": 266520 }, { "epoch": 1.72, "learning_rate": 4.196286232468681e-05, "loss": 0.024, "step": 266530 }, { "epoch": 1.72, "learning_rate": 4.195318097032987e-05, "loss": 0.0172, "step": 266540 }, { "epoch": 1.72, "learning_rate": 4.194349961597294e-05, "loss": 0.0231, "step": 266550 }, { "epoch": 1.72, "learning_rate": 4.193381826161601e-05, "loss": 0.0248, "step": 266560 }, { "epoch": 1.72, "learning_rate": 4.1924136907259076e-05, "loss": 0.0211, "step": 266570 }, { "epoch": 1.72, "learning_rate": 4.191445555290215e-05, "loss": 0.0278, "step": 266580 }, { "epoch": 1.72, "learning_rate": 4.190477419854521e-05, "loss": 0.0233, "step": 266590 }, { "epoch": 1.72, "learning_rate": 4.189509284418828e-05, "loss": 0.0205, "step": 266600 }, { "epoch": 1.72, "learning_rate": 4.188541148983135e-05, "loss": 0.0301, "step": 266610 }, { "epoch": 1.72, "learning_rate": 4.1875730135474414e-05, "loss": 0.0206, "step": 266620 }, { "epoch": 1.72, "learning_rate": 4.186604878111749e-05, "loss": 0.0202, "step": 266630 }, { "epoch": 1.72, "learning_rate": 4.1856367426760546e-05, "loss": 0.0224, "step": 266640 }, { "epoch": 1.72, "learning_rate": 4.184668607240362e-05, "loss": 0.0223, "step": 266650 }, { "epoch": 1.72, "learning_rate": 4.1837004718046686e-05, "loss": 0.0287, "step": 266660 }, { "epoch": 1.72, "learning_rate": 4.182732336368976e-05, "loss": 0.0269, "step": 266670 }, { "epoch": 1.72, "learning_rate": 4.1817642009332825e-05, "loss": 0.0261, "step": 266680 }, { "epoch": 1.72, "learning_rate": 4.1807960654975884e-05, "loss": 0.0226, "step": 266690 }, { "epoch": 1.72, "learning_rate": 4.179827930061896e-05, "loss": 0.021, "step": 266700 }, { "epoch": 1.72, "learning_rate": 4.1788597946262024e-05, "loss": 0.0254, "step": 266710 }, { "epoch": 1.72, "learning_rate": 4.17789165919051e-05, "loss": 0.023, "step": 266720 }, { "epoch": 1.72, "learning_rate": 4.176923523754816e-05, "loss": 0.021, "step": 266730 }, { "epoch": 1.72, "learning_rate": 4.175955388319123e-05, "loss": 0.0256, "step": 266740 }, { "epoch": 1.72, "learning_rate": 4.1749872528834295e-05, "loss": 0.0251, "step": 266750 }, { "epoch": 1.72, "learning_rate": 4.174019117447736e-05, "loss": 0.0216, "step": 266760 }, { "epoch": 1.72, "learning_rate": 4.1730509820120435e-05, "loss": 0.0228, "step": 266770 }, { "epoch": 1.72, "learning_rate": 4.17208284657635e-05, "loss": 0.0213, "step": 266780 }, { "epoch": 1.72, "learning_rate": 4.171114711140657e-05, "loss": 0.0241, "step": 266790 }, { "epoch": 1.72, "learning_rate": 4.170146575704963e-05, "loss": 0.022, "step": 266800 }, { "epoch": 1.72, "learning_rate": 4.1691784402692706e-05, "loss": 0.0253, "step": 266810 }, { "epoch": 1.72, "learning_rate": 4.168210304833577e-05, "loss": 0.0248, "step": 266820 }, { "epoch": 1.72, "learning_rate": 4.167242169397884e-05, "loss": 0.0224, "step": 266830 }, { "epoch": 1.72, "learning_rate": 4.1662740339621905e-05, "loss": 0.0266, "step": 266840 }, { "epoch": 1.72, "learning_rate": 4.165305898526497e-05, "loss": 0.0234, "step": 266850 }, { "epoch": 1.72, "learning_rate": 4.1643377630908044e-05, "loss": 0.0239, "step": 266860 }, { "epoch": 1.72, "learning_rate": 4.163369627655111e-05, "loss": 0.0282, "step": 266870 }, { "epoch": 1.72, "learning_rate": 4.1624014922194184e-05, "loss": 0.0231, "step": 266880 }, { "epoch": 1.72, "learning_rate": 4.161433356783724e-05, "loss": 0.0242, "step": 266890 }, { "epoch": 1.72, "learning_rate": 4.160465221348031e-05, "loss": 0.0276, "step": 266900 }, { "epoch": 1.72, "learning_rate": 4.159497085912338e-05, "loss": 0.0243, "step": 266910 }, { "epoch": 1.72, "learning_rate": 4.158528950476645e-05, "loss": 0.0203, "step": 266920 }, { "epoch": 1.72, "learning_rate": 4.157560815040952e-05, "loss": 0.0268, "step": 266930 }, { "epoch": 1.72, "learning_rate": 4.156592679605258e-05, "loss": 0.0276, "step": 266940 }, { "epoch": 1.72, "learning_rate": 4.1556245441695654e-05, "loss": 0.0227, "step": 266950 }, { "epoch": 1.72, "learning_rate": 4.154656408733872e-05, "loss": 0.0244, "step": 266960 }, { "epoch": 1.72, "learning_rate": 4.1536882732981787e-05, "loss": 0.0202, "step": 266970 }, { "epoch": 1.72, "learning_rate": 4.152720137862486e-05, "loss": 0.0267, "step": 266980 }, { "epoch": 1.72, "learning_rate": 4.151752002426792e-05, "loss": 0.0231, "step": 266990 }, { "epoch": 1.72, "learning_rate": 4.150783866991099e-05, "loss": 0.0236, "step": 267000 }, { "epoch": 1.72, "eval_cer": 0.9198870184159982, "eval_loss": 0.017837153747677803, "eval_runtime": 119.9955, "eval_samples_per_second": 16.667, "eval_steps_per_second": 4.167, "step": 267000 }, { "epoch": 1.72, "learning_rate": 4.149815731555406e-05, "loss": 0.0231, "step": 267010 }, { "epoch": 1.72, "learning_rate": 4.148847596119713e-05, "loss": 0.0239, "step": 267020 }, { "epoch": 1.72, "learning_rate": 4.14787946068402e-05, "loss": 0.0227, "step": 267030 }, { "epoch": 1.72, "learning_rate": 4.146911325248326e-05, "loss": 0.0236, "step": 267040 }, { "epoch": 1.72, "learning_rate": 4.145943189812633e-05, "loss": 0.0262, "step": 267050 }, { "epoch": 1.72, "learning_rate": 4.1449750543769396e-05, "loss": 0.0224, "step": 267060 }, { "epoch": 1.72, "learning_rate": 4.144006918941247e-05, "loss": 0.0239, "step": 267070 }, { "epoch": 1.72, "learning_rate": 4.1430387835055536e-05, "loss": 0.0241, "step": 267080 }, { "epoch": 1.72, "learning_rate": 4.142070648069861e-05, "loss": 0.0261, "step": 267090 }, { "epoch": 1.72, "learning_rate": 4.141102512634167e-05, "loss": 0.0242, "step": 267100 }, { "epoch": 1.72, "learning_rate": 4.1401343771984734e-05, "loss": 0.0266, "step": 267110 }, { "epoch": 1.72, "learning_rate": 4.139166241762781e-05, "loss": 0.0275, "step": 267120 }, { "epoch": 1.72, "learning_rate": 4.1381981063270873e-05, "loss": 0.026, "step": 267130 }, { "epoch": 1.72, "learning_rate": 4.1372299708913947e-05, "loss": 0.0284, "step": 267140 }, { "epoch": 1.72, "learning_rate": 4.1362618354557006e-05, "loss": 0.0263, "step": 267150 }, { "epoch": 1.72, "learning_rate": 4.135293700020008e-05, "loss": 0.0234, "step": 267160 }, { "epoch": 1.72, "learning_rate": 4.1343255645843145e-05, "loss": 0.019, "step": 267170 }, { "epoch": 1.72, "learning_rate": 4.133357429148621e-05, "loss": 0.0302, "step": 267180 }, { "epoch": 1.72, "learning_rate": 4.1323892937129284e-05, "loss": 0.0226, "step": 267190 }, { "epoch": 1.72, "learning_rate": 4.1314211582772344e-05, "loss": 0.027, "step": 267200 }, { "epoch": 1.72, "learning_rate": 4.130453022841542e-05, "loss": 0.0305, "step": 267210 }, { "epoch": 1.72, "learning_rate": 4.129484887405848e-05, "loss": 0.0283, "step": 267220 }, { "epoch": 1.72, "learning_rate": 4.1285167519701556e-05, "loss": 0.024, "step": 267230 }, { "epoch": 1.72, "learning_rate": 4.127548616534462e-05, "loss": 0.0265, "step": 267240 }, { "epoch": 1.72, "learning_rate": 4.126580481098768e-05, "loss": 0.023, "step": 267250 }, { "epoch": 1.72, "learning_rate": 4.1256123456630755e-05, "loss": 0.0236, "step": 267260 }, { "epoch": 1.73, "learning_rate": 4.124644210227382e-05, "loss": 0.0217, "step": 267270 }, { "epoch": 1.73, "learning_rate": 4.1236760747916894e-05, "loss": 0.0217, "step": 267280 }, { "epoch": 1.73, "learning_rate": 4.122707939355996e-05, "loss": 0.0264, "step": 267290 }, { "epoch": 1.73, "learning_rate": 4.1217398039203033e-05, "loss": 0.027, "step": 267300 }, { "epoch": 1.73, "learning_rate": 4.120771668484609e-05, "loss": 0.0212, "step": 267310 }, { "epoch": 1.73, "learning_rate": 4.119803533048916e-05, "loss": 0.0228, "step": 267320 }, { "epoch": 1.73, "learning_rate": 4.118835397613223e-05, "loss": 0.0216, "step": 267330 }, { "epoch": 1.73, "learning_rate": 4.11786726217753e-05, "loss": 0.0277, "step": 267340 }, { "epoch": 1.73, "learning_rate": 4.116899126741837e-05, "loss": 0.0259, "step": 267350 }, { "epoch": 1.73, "learning_rate": 4.115930991306143e-05, "loss": 0.0193, "step": 267360 }, { "epoch": 1.73, "learning_rate": 4.1149628558704504e-05, "loss": 0.0271, "step": 267370 }, { "epoch": 1.73, "learning_rate": 4.113994720434757e-05, "loss": 0.0256, "step": 267380 }, { "epoch": 1.73, "learning_rate": 4.1130265849990636e-05, "loss": 0.0258, "step": 267390 }, { "epoch": 1.73, "learning_rate": 4.112058449563371e-05, "loss": 0.026, "step": 267400 }, { "epoch": 1.73, "learning_rate": 4.111090314127677e-05, "loss": 0.0187, "step": 267410 }, { "epoch": 1.73, "learning_rate": 4.110122178691984e-05, "loss": 0.0199, "step": 267420 }, { "epoch": 1.73, "learning_rate": 4.109154043256291e-05, "loss": 0.0257, "step": 267430 }, { "epoch": 1.73, "learning_rate": 4.108185907820598e-05, "loss": 0.0267, "step": 267440 }, { "epoch": 1.73, "learning_rate": 4.107217772384905e-05, "loss": 0.0237, "step": 267450 }, { "epoch": 1.73, "learning_rate": 4.106249636949211e-05, "loss": 0.0235, "step": 267460 }, { "epoch": 1.73, "learning_rate": 4.105281501513518e-05, "loss": 0.026, "step": 267470 }, { "epoch": 1.73, "learning_rate": 4.1043133660778246e-05, "loss": 0.0247, "step": 267480 }, { "epoch": 1.73, "learning_rate": 4.103345230642132e-05, "loss": 0.0266, "step": 267490 }, { "epoch": 1.73, "learning_rate": 4.1023770952064385e-05, "loss": 0.0225, "step": 267500 }, { "epoch": 1.73, "learning_rate": 4.101408959770746e-05, "loss": 0.0245, "step": 267510 }, { "epoch": 1.73, "learning_rate": 4.100440824335052e-05, "loss": 0.0309, "step": 267520 }, { "epoch": 1.73, "learning_rate": 4.0994726888993584e-05, "loss": 0.0262, "step": 267530 }, { "epoch": 1.73, "learning_rate": 4.098504553463666e-05, "loss": 0.0251, "step": 267540 }, { "epoch": 1.73, "learning_rate": 4.097536418027972e-05, "loss": 0.0266, "step": 267550 }, { "epoch": 1.73, "learning_rate": 4.0965682825922796e-05, "loss": 0.0196, "step": 267560 }, { "epoch": 1.73, "learning_rate": 4.0956001471565856e-05, "loss": 0.0224, "step": 267570 }, { "epoch": 1.73, "learning_rate": 4.094632011720893e-05, "loss": 0.0208, "step": 267580 }, { "epoch": 1.73, "learning_rate": 4.0936638762851995e-05, "loss": 0.0217, "step": 267590 }, { "epoch": 1.73, "learning_rate": 4.092695740849506e-05, "loss": 0.0254, "step": 267600 }, { "epoch": 1.73, "learning_rate": 4.0917276054138134e-05, "loss": 0.0263, "step": 267610 }, { "epoch": 1.73, "learning_rate": 4.0907594699781194e-05, "loss": 0.0221, "step": 267620 }, { "epoch": 1.73, "learning_rate": 4.089791334542427e-05, "loss": 0.0213, "step": 267630 }, { "epoch": 1.73, "learning_rate": 4.088823199106733e-05, "loss": 0.0251, "step": 267640 }, { "epoch": 1.73, "learning_rate": 4.0878550636710406e-05, "loss": 0.0261, "step": 267650 }, { "epoch": 1.73, "learning_rate": 4.086886928235347e-05, "loss": 0.0199, "step": 267660 }, { "epoch": 1.73, "learning_rate": 4.085918792799653e-05, "loss": 0.024, "step": 267670 }, { "epoch": 1.73, "learning_rate": 4.0849506573639605e-05, "loss": 0.025, "step": 267680 }, { "epoch": 1.73, "learning_rate": 4.083982521928267e-05, "loss": 0.0248, "step": 267690 }, { "epoch": 1.73, "learning_rate": 4.0830143864925744e-05, "loss": 0.0283, "step": 267700 }, { "epoch": 1.73, "learning_rate": 4.082046251056881e-05, "loss": 0.0302, "step": 267710 }, { "epoch": 1.73, "learning_rate": 4.081078115621187e-05, "loss": 0.0232, "step": 267720 }, { "epoch": 1.73, "learning_rate": 4.080109980185494e-05, "loss": 0.0251, "step": 267730 }, { "epoch": 1.73, "learning_rate": 4.079141844749801e-05, "loss": 0.0263, "step": 267740 }, { "epoch": 1.73, "learning_rate": 4.078173709314108e-05, "loss": 0.0265, "step": 267750 }, { "epoch": 1.73, "learning_rate": 4.077205573878415e-05, "loss": 0.0196, "step": 267760 }, { "epoch": 1.73, "learning_rate": 4.076237438442722e-05, "loss": 0.0241, "step": 267770 }, { "epoch": 1.73, "learning_rate": 4.075269303007028e-05, "loss": 0.0282, "step": 267780 }, { "epoch": 1.73, "learning_rate": 4.074301167571335e-05, "loss": 0.0262, "step": 267790 }, { "epoch": 1.73, "learning_rate": 4.073333032135642e-05, "loss": 0.0225, "step": 267800 }, { "epoch": 1.73, "learning_rate": 4.0723648966999486e-05, "loss": 0.0287, "step": 267810 }, { "epoch": 1.73, "learning_rate": 4.071396761264256e-05, "loss": 0.0251, "step": 267820 }, { "epoch": 1.73, "learning_rate": 4.070428625828562e-05, "loss": 0.022, "step": 267830 }, { "epoch": 1.73, "learning_rate": 4.069460490392869e-05, "loss": 0.0236, "step": 267840 }, { "epoch": 1.73, "learning_rate": 4.068492354957176e-05, "loss": 0.0251, "step": 267850 }, { "epoch": 1.73, "learning_rate": 4.0675242195214824e-05, "loss": 0.0192, "step": 267860 }, { "epoch": 1.73, "learning_rate": 4.06655608408579e-05, "loss": 0.0204, "step": 267870 }, { "epoch": 1.73, "learning_rate": 4.065587948650096e-05, "loss": 0.0279, "step": 267880 }, { "epoch": 1.73, "learning_rate": 4.064619813214403e-05, "loss": 0.0224, "step": 267890 }, { "epoch": 1.73, "learning_rate": 4.0636516777787096e-05, "loss": 0.0268, "step": 267900 }, { "epoch": 1.73, "learning_rate": 4.062683542343017e-05, "loss": 0.0284, "step": 267910 }, { "epoch": 1.73, "learning_rate": 4.0617154069073235e-05, "loss": 0.0219, "step": 267920 }, { "epoch": 1.73, "learning_rate": 4.0607472714716295e-05, "loss": 0.0287, "step": 267930 }, { "epoch": 1.73, "learning_rate": 4.059779136035937e-05, "loss": 0.0318, "step": 267940 }, { "epoch": 1.73, "learning_rate": 4.0588110006002434e-05, "loss": 0.0248, "step": 267950 }, { "epoch": 1.73, "learning_rate": 4.057842865164551e-05, "loss": 0.0201, "step": 267960 }, { "epoch": 1.73, "learning_rate": 4.056874729728857e-05, "loss": 0.0236, "step": 267970 }, { "epoch": 1.73, "learning_rate": 4.0559065942931646e-05, "loss": 0.0307, "step": 267980 }, { "epoch": 1.73, "learning_rate": 4.0549384588574706e-05, "loss": 0.026, "step": 267990 }, { "epoch": 1.73, "learning_rate": 4.053970323421777e-05, "loss": 0.029, "step": 268000 }, { "epoch": 1.73, "eval_cer": 0.919813806349565, "eval_loss": 0.017884543165564537, "eval_runtime": 120.1776, "eval_samples_per_second": 16.642, "eval_steps_per_second": 4.161, "step": 268000 }, { "epoch": 1.73, "learning_rate": 4.0530021879860845e-05, "loss": 0.0274, "step": 268010 }, { "epoch": 1.73, "learning_rate": 4.052034052550391e-05, "loss": 0.0215, "step": 268020 }, { "epoch": 1.73, "learning_rate": 4.0510659171146984e-05, "loss": 0.0225, "step": 268030 }, { "epoch": 1.73, "learning_rate": 4.0500977816790044e-05, "loss": 0.0263, "step": 268040 }, { "epoch": 1.73, "learning_rate": 4.0491296462433117e-05, "loss": 0.0252, "step": 268050 }, { "epoch": 1.73, "learning_rate": 4.048161510807618e-05, "loss": 0.0221, "step": 268060 }, { "epoch": 1.73, "learning_rate": 4.047193375371925e-05, "loss": 0.0223, "step": 268070 }, { "epoch": 1.73, "learning_rate": 4.046225239936232e-05, "loss": 0.0227, "step": 268080 }, { "epoch": 1.73, "learning_rate": 4.045257104500538e-05, "loss": 0.0238, "step": 268090 }, { "epoch": 1.73, "learning_rate": 4.0442889690648455e-05, "loss": 0.0252, "step": 268100 }, { "epoch": 1.73, "learning_rate": 4.043320833629152e-05, "loss": 0.0345, "step": 268110 }, { "epoch": 1.73, "learning_rate": 4.0423526981934594e-05, "loss": 0.0238, "step": 268120 }, { "epoch": 1.73, "learning_rate": 4.041384562757766e-05, "loss": 0.0238, "step": 268130 }, { "epoch": 1.73, "learning_rate": 4.040416427322072e-05, "loss": 0.0256, "step": 268140 }, { "epoch": 1.73, "learning_rate": 4.039448291886379e-05, "loss": 0.023, "step": 268150 }, { "epoch": 1.73, "learning_rate": 4.038480156450686e-05, "loss": 0.022, "step": 268160 }, { "epoch": 1.73, "learning_rate": 4.037512021014993e-05, "loss": 0.0236, "step": 268170 }, { "epoch": 1.73, "learning_rate": 4.0365438855793e-05, "loss": 0.0247, "step": 268180 }, { "epoch": 1.73, "learning_rate": 4.0355757501436064e-05, "loss": 0.0318, "step": 268190 }, { "epoch": 1.73, "learning_rate": 4.034607614707913e-05, "loss": 0.0311, "step": 268200 }, { "epoch": 1.73, "learning_rate": 4.03363947927222e-05, "loss": 0.0202, "step": 268210 }, { "epoch": 1.73, "learning_rate": 4.032671343836527e-05, "loss": 0.0216, "step": 268220 }, { "epoch": 1.73, "learning_rate": 4.0317032084008336e-05, "loss": 0.0217, "step": 268230 }, { "epoch": 1.73, "learning_rate": 4.03073507296514e-05, "loss": 0.0239, "step": 268240 }, { "epoch": 1.73, "learning_rate": 4.029766937529447e-05, "loss": 0.0242, "step": 268250 }, { "epoch": 1.73, "learning_rate": 4.028798802093754e-05, "loss": 0.0208, "step": 268260 }, { "epoch": 1.73, "learning_rate": 4.027830666658061e-05, "loss": 0.0297, "step": 268270 }, { "epoch": 1.73, "learning_rate": 4.0268625312223674e-05, "loss": 0.0218, "step": 268280 }, { "epoch": 1.73, "learning_rate": 4.025894395786674e-05, "loss": 0.021, "step": 268290 }, { "epoch": 1.73, "learning_rate": 4.0249262603509806e-05, "loss": 0.0227, "step": 268300 }, { "epoch": 1.73, "learning_rate": 4.023958124915288e-05, "loss": 0.0231, "step": 268310 }, { "epoch": 1.73, "learning_rate": 4.0229899894795946e-05, "loss": 0.0236, "step": 268320 }, { "epoch": 1.73, "learning_rate": 4.022021854043902e-05, "loss": 0.0242, "step": 268330 }, { "epoch": 1.73, "learning_rate": 4.021053718608208e-05, "loss": 0.0234, "step": 268340 }, { "epoch": 1.73, "learning_rate": 4.0200855831725144e-05, "loss": 0.0271, "step": 268350 }, { "epoch": 1.73, "learning_rate": 4.019117447736822e-05, "loss": 0.0284, "step": 268360 }, { "epoch": 1.73, "learning_rate": 4.0181493123011284e-05, "loss": 0.0252, "step": 268370 }, { "epoch": 1.73, "learning_rate": 4.017181176865436e-05, "loss": 0.0246, "step": 268380 }, { "epoch": 1.73, "learning_rate": 4.0162130414297416e-05, "loss": 0.0234, "step": 268390 }, { "epoch": 1.73, "learning_rate": 4.015244905994049e-05, "loss": 0.0202, "step": 268400 }, { "epoch": 1.73, "learning_rate": 4.0142767705583555e-05, "loss": 0.03, "step": 268410 }, { "epoch": 1.73, "learning_rate": 4.013308635122662e-05, "loss": 0.0247, "step": 268420 }, { "epoch": 1.73, "learning_rate": 4.0123404996869695e-05, "loss": 0.0234, "step": 268430 }, { "epoch": 1.73, "learning_rate": 4.0113723642512754e-05, "loss": 0.0232, "step": 268440 }, { "epoch": 1.73, "learning_rate": 4.010404228815583e-05, "loss": 0.0302, "step": 268450 }, { "epoch": 1.73, "learning_rate": 4.009436093379889e-05, "loss": 0.0263, "step": 268460 }, { "epoch": 1.73, "learning_rate": 4.0084679579441966e-05, "loss": 0.0241, "step": 268470 }, { "epoch": 1.73, "learning_rate": 4.007499822508503e-05, "loss": 0.0236, "step": 268480 }, { "epoch": 1.73, "learning_rate": 4.006531687072809e-05, "loss": 0.0315, "step": 268490 }, { "epoch": 1.73, "learning_rate": 4.0055635516371165e-05, "loss": 0.0242, "step": 268500 }, { "epoch": 1.73, "learning_rate": 4.004595416201423e-05, "loss": 0.0266, "step": 268510 }, { "epoch": 1.73, "learning_rate": 4.0036272807657304e-05, "loss": 0.0331, "step": 268520 }, { "epoch": 1.73, "learning_rate": 4.002659145330037e-05, "loss": 0.023, "step": 268530 }, { "epoch": 1.73, "learning_rate": 4.0016910098943444e-05, "loss": 0.0228, "step": 268540 }, { "epoch": 1.73, "learning_rate": 4.00072287445865e-05, "loss": 0.0253, "step": 268550 }, { "epoch": 1.73, "learning_rate": 3.999754739022957e-05, "loss": 0.0243, "step": 268560 }, { "epoch": 1.73, "learning_rate": 3.998786603587264e-05, "loss": 0.0236, "step": 268570 }, { "epoch": 1.73, "learning_rate": 3.997818468151571e-05, "loss": 0.0223, "step": 268580 }, { "epoch": 1.73, "learning_rate": 3.996850332715878e-05, "loss": 0.0266, "step": 268590 }, { "epoch": 1.73, "learning_rate": 3.995882197280184e-05, "loss": 0.018, "step": 268600 }, { "epoch": 1.73, "learning_rate": 3.9949140618444914e-05, "loss": 0.0243, "step": 268610 }, { "epoch": 1.73, "learning_rate": 3.993945926408798e-05, "loss": 0.0214, "step": 268620 }, { "epoch": 1.73, "learning_rate": 3.9929777909731047e-05, "loss": 0.024, "step": 268630 }, { "epoch": 1.73, "learning_rate": 3.992009655537412e-05, "loss": 0.0241, "step": 268640 }, { "epoch": 1.73, "learning_rate": 3.991041520101718e-05, "loss": 0.0233, "step": 268650 }, { "epoch": 1.73, "learning_rate": 3.990073384666025e-05, "loss": 0.0249, "step": 268660 }, { "epoch": 1.73, "learning_rate": 3.989105249230332e-05, "loss": 0.0327, "step": 268670 }, { "epoch": 1.73, "learning_rate": 3.988137113794639e-05, "loss": 0.0226, "step": 268680 }, { "epoch": 1.73, "learning_rate": 3.987168978358946e-05, "loss": 0.0252, "step": 268690 }, { "epoch": 1.73, "learning_rate": 3.986200842923252e-05, "loss": 0.0259, "step": 268700 }, { "epoch": 1.73, "learning_rate": 3.985232707487559e-05, "loss": 0.0251, "step": 268710 }, { "epoch": 1.73, "learning_rate": 3.9842645720518656e-05, "loss": 0.0314, "step": 268720 }, { "epoch": 1.73, "learning_rate": 3.983296436616173e-05, "loss": 0.0251, "step": 268730 }, { "epoch": 1.73, "learning_rate": 3.9823283011804795e-05, "loss": 0.0253, "step": 268740 }, { "epoch": 1.73, "learning_rate": 3.981360165744787e-05, "loss": 0.0234, "step": 268750 }, { "epoch": 1.73, "learning_rate": 3.980392030309093e-05, "loss": 0.0217, "step": 268760 }, { "epoch": 1.73, "learning_rate": 3.9794238948733994e-05, "loss": 0.0201, "step": 268770 }, { "epoch": 1.73, "learning_rate": 3.978455759437707e-05, "loss": 0.0266, "step": 268780 }, { "epoch": 1.73, "learning_rate": 3.9774876240020133e-05, "loss": 0.023, "step": 268790 }, { "epoch": 1.73, "learning_rate": 3.9765194885663206e-05, "loss": 0.0225, "step": 268800 }, { "epoch": 1.73, "learning_rate": 3.9755513531306266e-05, "loss": 0.0226, "step": 268810 }, { "epoch": 1.74, "learning_rate": 3.974583217694934e-05, "loss": 0.0252, "step": 268820 }, { "epoch": 1.74, "learning_rate": 3.9736150822592405e-05, "loss": 0.0216, "step": 268830 }, { "epoch": 1.74, "learning_rate": 3.972646946823547e-05, "loss": 0.0202, "step": 268840 }, { "epoch": 1.74, "learning_rate": 3.9716788113878544e-05, "loss": 0.0196, "step": 268850 }, { "epoch": 1.74, "learning_rate": 3.9707106759521604e-05, "loss": 0.0222, "step": 268860 }, { "epoch": 1.74, "learning_rate": 3.969742540516468e-05, "loss": 0.0224, "step": 268870 }, { "epoch": 1.74, "learning_rate": 3.968774405080774e-05, "loss": 0.026, "step": 268880 }, { "epoch": 1.74, "learning_rate": 3.9678062696450816e-05, "loss": 0.0258, "step": 268890 }, { "epoch": 1.74, "learning_rate": 3.966838134209388e-05, "loss": 0.0238, "step": 268900 }, { "epoch": 1.74, "learning_rate": 3.965869998773694e-05, "loss": 0.0217, "step": 268910 }, { "epoch": 1.74, "learning_rate": 3.9649018633380015e-05, "loss": 0.0195, "step": 268920 }, { "epoch": 1.74, "learning_rate": 3.963933727902308e-05, "loss": 0.0263, "step": 268930 }, { "epoch": 1.74, "learning_rate": 3.9629655924666154e-05, "loss": 0.0272, "step": 268940 }, { "epoch": 1.74, "learning_rate": 3.961997457030922e-05, "loss": 0.0232, "step": 268950 }, { "epoch": 1.74, "learning_rate": 3.9610293215952293e-05, "loss": 0.0239, "step": 268960 }, { "epoch": 1.74, "learning_rate": 3.960061186159535e-05, "loss": 0.0218, "step": 268970 }, { "epoch": 1.74, "learning_rate": 3.959093050723842e-05, "loss": 0.025, "step": 268980 }, { "epoch": 1.74, "learning_rate": 3.958124915288149e-05, "loss": 0.0251, "step": 268990 }, { "epoch": 1.74, "learning_rate": 3.957156779852456e-05, "loss": 0.0233, "step": 269000 }, { "epoch": 1.74, "eval_cer": 0.9198192294655971, "eval_loss": 0.0177915096282959, "eval_runtime": 119.9978, "eval_samples_per_second": 16.667, "eval_steps_per_second": 4.167, "step": 269000 }, { "epoch": 1.74, "learning_rate": 3.956188644416763e-05, "loss": 0.0222, "step": 269010 }, { "epoch": 1.74, "learning_rate": 3.955220508981069e-05, "loss": 0.0226, "step": 269020 }, { "epoch": 1.74, "learning_rate": 3.9542523735453764e-05, "loss": 0.0222, "step": 269030 }, { "epoch": 1.74, "learning_rate": 3.953284238109683e-05, "loss": 0.0211, "step": 269040 }, { "epoch": 1.74, "learning_rate": 3.9523161026739896e-05, "loss": 0.0246, "step": 269050 }, { "epoch": 1.74, "learning_rate": 3.951347967238297e-05, "loss": 0.0195, "step": 269060 }, { "epoch": 1.74, "learning_rate": 3.950379831802603e-05, "loss": 0.0295, "step": 269070 }, { "epoch": 1.74, "learning_rate": 3.94941169636691e-05, "loss": 0.024, "step": 269080 }, { "epoch": 1.74, "learning_rate": 3.948443560931217e-05, "loss": 0.0244, "step": 269090 }, { "epoch": 1.74, "learning_rate": 3.947475425495524e-05, "loss": 0.0203, "step": 269100 }, { "epoch": 1.74, "learning_rate": 3.946507290059831e-05, "loss": 0.024, "step": 269110 }, { "epoch": 1.74, "learning_rate": 3.945539154624137e-05, "loss": 0.0238, "step": 269120 }, { "epoch": 1.74, "learning_rate": 3.944571019188444e-05, "loss": 0.0237, "step": 269130 }, { "epoch": 1.74, "learning_rate": 3.9436028837527506e-05, "loss": 0.0264, "step": 269140 }, { "epoch": 1.74, "learning_rate": 3.942634748317058e-05, "loss": 0.0219, "step": 269150 }, { "epoch": 1.74, "learning_rate": 3.9416666128813645e-05, "loss": 0.0224, "step": 269160 }, { "epoch": 1.74, "learning_rate": 3.940698477445672e-05, "loss": 0.0231, "step": 269170 }, { "epoch": 1.74, "learning_rate": 3.939730342009978e-05, "loss": 0.0242, "step": 269180 }, { "epoch": 1.74, "learning_rate": 3.9387622065742844e-05, "loss": 0.0216, "step": 269190 }, { "epoch": 1.74, "learning_rate": 3.937794071138592e-05, "loss": 0.0242, "step": 269200 }, { "epoch": 1.74, "learning_rate": 3.936825935702898e-05, "loss": 0.0245, "step": 269210 }, { "epoch": 1.74, "learning_rate": 3.9358578002672056e-05, "loss": 0.0212, "step": 269220 }, { "epoch": 1.74, "learning_rate": 3.9348896648315116e-05, "loss": 0.0231, "step": 269230 }, { "epoch": 1.74, "learning_rate": 3.933921529395819e-05, "loss": 0.0217, "step": 269240 }, { "epoch": 1.74, "learning_rate": 3.9329533939601255e-05, "loss": 0.0251, "step": 269250 }, { "epoch": 1.74, "learning_rate": 3.931985258524432e-05, "loss": 0.022, "step": 269260 }, { "epoch": 1.74, "learning_rate": 3.9310171230887394e-05, "loss": 0.0283, "step": 269270 }, { "epoch": 1.74, "learning_rate": 3.9300489876530454e-05, "loss": 0.0228, "step": 269280 }, { "epoch": 1.74, "learning_rate": 3.929080852217353e-05, "loss": 0.0207, "step": 269290 }, { "epoch": 1.74, "learning_rate": 3.928112716781659e-05, "loss": 0.0276, "step": 269300 }, { "epoch": 1.74, "learning_rate": 3.9271445813459666e-05, "loss": 0.0279, "step": 269310 }, { "epoch": 1.74, "learning_rate": 3.926176445910273e-05, "loss": 0.0215, "step": 269320 }, { "epoch": 1.74, "learning_rate": 3.925208310474579e-05, "loss": 0.0267, "step": 269330 }, { "epoch": 1.74, "learning_rate": 3.9242401750388865e-05, "loss": 0.023, "step": 269340 }, { "epoch": 1.74, "learning_rate": 3.923272039603193e-05, "loss": 0.0226, "step": 269350 }, { "epoch": 1.74, "learning_rate": 3.9223039041675004e-05, "loss": 0.0255, "step": 269360 }, { "epoch": 1.74, "learning_rate": 3.921335768731807e-05, "loss": 0.0233, "step": 269370 }, { "epoch": 1.74, "learning_rate": 3.9203676332961136e-05, "loss": 0.0268, "step": 269380 }, { "epoch": 1.74, "learning_rate": 3.91939949786042e-05, "loss": 0.0216, "step": 269390 }, { "epoch": 1.74, "learning_rate": 3.918431362424727e-05, "loss": 0.0267, "step": 269400 }, { "epoch": 1.74, "learning_rate": 3.917463226989034e-05, "loss": 0.0251, "step": 269410 }, { "epoch": 1.74, "learning_rate": 3.916495091553341e-05, "loss": 0.0245, "step": 269420 }, { "epoch": 1.74, "learning_rate": 3.9155269561176474e-05, "loss": 0.021, "step": 269430 }, { "epoch": 1.74, "learning_rate": 3.914558820681954e-05, "loss": 0.0212, "step": 269440 }, { "epoch": 1.74, "learning_rate": 3.913590685246261e-05, "loss": 0.0249, "step": 269450 }, { "epoch": 1.74, "learning_rate": 3.912622549810568e-05, "loss": 0.0236, "step": 269460 }, { "epoch": 1.74, "learning_rate": 3.9116544143748746e-05, "loss": 0.024, "step": 269470 }, { "epoch": 1.74, "learning_rate": 3.910686278939181e-05, "loss": 0.0251, "step": 269480 }, { "epoch": 1.74, "learning_rate": 3.909718143503488e-05, "loss": 0.0261, "step": 269490 }, { "epoch": 1.74, "learning_rate": 3.908750008067795e-05, "loss": 0.0229, "step": 269500 }, { "epoch": 1.74, "learning_rate": 3.907781872632102e-05, "loss": 0.0225, "step": 269510 }, { "epoch": 1.74, "learning_rate": 3.9068137371964084e-05, "loss": 0.0242, "step": 269520 }, { "epoch": 1.74, "learning_rate": 3.905845601760715e-05, "loss": 0.0291, "step": 269530 }, { "epoch": 1.74, "learning_rate": 3.9048774663250217e-05, "loss": 0.0229, "step": 269540 }, { "epoch": 1.74, "learning_rate": 3.903909330889329e-05, "loss": 0.0248, "step": 269550 }, { "epoch": 1.74, "learning_rate": 3.9029411954536356e-05, "loss": 0.0248, "step": 269560 }, { "epoch": 1.74, "learning_rate": 3.901973060017943e-05, "loss": 0.028, "step": 269570 }, { "epoch": 1.74, "learning_rate": 3.901004924582249e-05, "loss": 0.0272, "step": 269580 }, { "epoch": 1.74, "learning_rate": 3.9000367891465555e-05, "loss": 0.0225, "step": 269590 }, { "epoch": 1.74, "learning_rate": 3.899068653710863e-05, "loss": 0.0228, "step": 269600 }, { "epoch": 1.74, "learning_rate": 3.8981005182751694e-05, "loss": 0.0257, "step": 269610 }, { "epoch": 1.74, "learning_rate": 3.897132382839477e-05, "loss": 0.0314, "step": 269620 }, { "epoch": 1.74, "learning_rate": 3.8961642474037826e-05, "loss": 0.0231, "step": 269630 }, { "epoch": 1.74, "learning_rate": 3.89519611196809e-05, "loss": 0.0281, "step": 269640 }, { "epoch": 1.74, "learning_rate": 3.8942279765323966e-05, "loss": 0.0235, "step": 269650 }, { "epoch": 1.74, "learning_rate": 3.893259841096703e-05, "loss": 0.0268, "step": 269660 }, { "epoch": 1.74, "learning_rate": 3.8922917056610105e-05, "loss": 0.0265, "step": 269670 }, { "epoch": 1.74, "learning_rate": 3.891323570225317e-05, "loss": 0.0237, "step": 269680 }, { "epoch": 1.74, "learning_rate": 3.890355434789624e-05, "loss": 0.0238, "step": 269690 }, { "epoch": 1.74, "learning_rate": 3.8893872993539304e-05, "loss": 0.0273, "step": 269700 }, { "epoch": 1.74, "learning_rate": 3.8884191639182377e-05, "loss": 0.0233, "step": 269710 }, { "epoch": 1.74, "learning_rate": 3.887451028482544e-05, "loss": 0.028, "step": 269720 }, { "epoch": 1.74, "learning_rate": 3.886482893046851e-05, "loss": 0.0226, "step": 269730 }, { "epoch": 1.74, "learning_rate": 3.8855147576111575e-05, "loss": 0.0212, "step": 269740 }, { "epoch": 1.74, "learning_rate": 3.884546622175464e-05, "loss": 0.0247, "step": 269750 }, { "epoch": 1.74, "learning_rate": 3.8835784867397715e-05, "loss": 0.0227, "step": 269760 }, { "epoch": 1.74, "learning_rate": 3.882610351304078e-05, "loss": 0.0266, "step": 269770 }, { "epoch": 1.74, "learning_rate": 3.8816422158683854e-05, "loss": 0.0256, "step": 269780 }, { "epoch": 1.74, "learning_rate": 3.880674080432691e-05, "loss": 0.0244, "step": 269790 }, { "epoch": 1.74, "learning_rate": 3.879705944996998e-05, "loss": 0.0228, "step": 269800 }, { "epoch": 1.74, "learning_rate": 3.878737809561305e-05, "loss": 0.0197, "step": 269810 }, { "epoch": 1.74, "learning_rate": 3.877769674125612e-05, "loss": 0.024, "step": 269820 }, { "epoch": 1.74, "learning_rate": 3.876801538689919e-05, "loss": 0.0236, "step": 269830 }, { "epoch": 1.74, "learning_rate": 3.875833403254225e-05, "loss": 0.0251, "step": 269840 }, { "epoch": 1.74, "learning_rate": 3.8748652678185324e-05, "loss": 0.0228, "step": 269850 }, { "epoch": 1.74, "learning_rate": 3.873897132382839e-05, "loss": 0.0245, "step": 269860 }, { "epoch": 1.74, "learning_rate": 3.872928996947146e-05, "loss": 0.0198, "step": 269870 }, { "epoch": 1.74, "learning_rate": 3.871960861511453e-05, "loss": 0.0199, "step": 269880 }, { "epoch": 1.74, "learning_rate": 3.870992726075759e-05, "loss": 0.0195, "step": 269890 }, { "epoch": 1.74, "learning_rate": 3.870024590640066e-05, "loss": 0.0255, "step": 269900 }, { "epoch": 1.74, "learning_rate": 3.869056455204373e-05, "loss": 0.0237, "step": 269910 }, { "epoch": 1.74, "learning_rate": 3.86808831976868e-05, "loss": 0.0234, "step": 269920 }, { "epoch": 1.74, "learning_rate": 3.867120184332987e-05, "loss": 0.0275, "step": 269930 }, { "epoch": 1.74, "learning_rate": 3.866152048897293e-05, "loss": 0.0268, "step": 269940 }, { "epoch": 1.74, "learning_rate": 3.8651839134616e-05, "loss": 0.0286, "step": 269950 }, { "epoch": 1.74, "learning_rate": 3.8642157780259066e-05, "loss": 0.0232, "step": 269960 }, { "epoch": 1.74, "learning_rate": 3.863247642590214e-05, "loss": 0.0245, "step": 269970 }, { "epoch": 1.74, "learning_rate": 3.8622795071545206e-05, "loss": 0.0237, "step": 269980 }, { "epoch": 1.74, "learning_rate": 3.861311371718828e-05, "loss": 0.0197, "step": 269990 }, { "epoch": 1.74, "learning_rate": 3.860343236283134e-05, "loss": 0.0248, "step": 270000 }, { "epoch": 1.74, "eval_cer": 0.9198463450457576, "eval_loss": 0.01764541305601597, "eval_runtime": 119.9301, "eval_samples_per_second": 16.676, "eval_steps_per_second": 4.169, "step": 270000 }, { "epoch": 1.74, "learning_rate": 3.8593751008474404e-05, "loss": 0.0227, "step": 270010 }, { "epoch": 1.74, "learning_rate": 3.858406965411748e-05, "loss": 0.0236, "step": 270020 }, { "epoch": 1.74, "learning_rate": 3.8574388299760544e-05, "loss": 0.0244, "step": 270030 }, { "epoch": 1.74, "learning_rate": 3.856470694540362e-05, "loss": 0.0252, "step": 270040 }, { "epoch": 1.74, "learning_rate": 3.8555025591046676e-05, "loss": 0.0235, "step": 270050 }, { "epoch": 1.74, "learning_rate": 3.854534423668975e-05, "loss": 0.0209, "step": 270060 }, { "epoch": 1.74, "learning_rate": 3.8535662882332815e-05, "loss": 0.0219, "step": 270070 }, { "epoch": 1.74, "learning_rate": 3.852598152797588e-05, "loss": 0.027, "step": 270080 }, { "epoch": 1.74, "learning_rate": 3.8516300173618955e-05, "loss": 0.0211, "step": 270090 }, { "epoch": 1.74, "learning_rate": 3.8506618819262014e-05, "loss": 0.0242, "step": 270100 }, { "epoch": 1.74, "learning_rate": 3.849693746490509e-05, "loss": 0.0254, "step": 270110 }, { "epoch": 1.74, "learning_rate": 3.848725611054815e-05, "loss": 0.0271, "step": 270120 }, { "epoch": 1.74, "learning_rate": 3.8477574756191226e-05, "loss": 0.0242, "step": 270130 }, { "epoch": 1.74, "learning_rate": 3.846789340183429e-05, "loss": 0.0222, "step": 270140 }, { "epoch": 1.74, "learning_rate": 3.845821204747735e-05, "loss": 0.0251, "step": 270150 }, { "epoch": 1.74, "learning_rate": 3.8448530693120425e-05, "loss": 0.0207, "step": 270160 }, { "epoch": 1.74, "learning_rate": 3.843884933876349e-05, "loss": 0.0311, "step": 270170 }, { "epoch": 1.74, "learning_rate": 3.8429167984406564e-05, "loss": 0.0266, "step": 270180 }, { "epoch": 1.74, "learning_rate": 3.841948663004963e-05, "loss": 0.0246, "step": 270190 }, { "epoch": 1.74, "learning_rate": 3.8409805275692704e-05, "loss": 0.0215, "step": 270200 }, { "epoch": 1.74, "learning_rate": 3.840012392133576e-05, "loss": 0.0269, "step": 270210 }, { "epoch": 1.74, "learning_rate": 3.839044256697883e-05, "loss": 0.0209, "step": 270220 }, { "epoch": 1.74, "learning_rate": 3.83807612126219e-05, "loss": 0.024, "step": 270230 }, { "epoch": 1.74, "learning_rate": 3.837107985826497e-05, "loss": 0.0229, "step": 270240 }, { "epoch": 1.74, "learning_rate": 3.836139850390804e-05, "loss": 0.0226, "step": 270250 }, { "epoch": 1.74, "learning_rate": 3.83517171495511e-05, "loss": 0.0222, "step": 270260 }, { "epoch": 1.74, "learning_rate": 3.8342035795194174e-05, "loss": 0.0245, "step": 270270 }, { "epoch": 1.74, "learning_rate": 3.833235444083724e-05, "loss": 0.024, "step": 270280 }, { "epoch": 1.74, "learning_rate": 3.8322673086480307e-05, "loss": 0.0206, "step": 270290 }, { "epoch": 1.74, "learning_rate": 3.831299173212338e-05, "loss": 0.0209, "step": 270300 }, { "epoch": 1.74, "learning_rate": 3.830331037776644e-05, "loss": 0.025, "step": 270310 }, { "epoch": 1.74, "learning_rate": 3.829362902340951e-05, "loss": 0.0237, "step": 270320 }, { "epoch": 1.74, "learning_rate": 3.828394766905258e-05, "loss": 0.0242, "step": 270330 }, { "epoch": 1.74, "learning_rate": 3.827426631469565e-05, "loss": 0.0232, "step": 270340 }, { "epoch": 1.74, "learning_rate": 3.826458496033872e-05, "loss": 0.0232, "step": 270350 }, { "epoch": 1.74, "learning_rate": 3.825490360598178e-05, "loss": 0.0267, "step": 270360 }, { "epoch": 1.75, "learning_rate": 3.824522225162485e-05, "loss": 0.0221, "step": 270370 }, { "epoch": 1.75, "learning_rate": 3.8235540897267916e-05, "loss": 0.0205, "step": 270380 }, { "epoch": 1.75, "learning_rate": 3.822585954291099e-05, "loss": 0.0209, "step": 270390 }, { "epoch": 1.75, "learning_rate": 3.8216178188554055e-05, "loss": 0.0232, "step": 270400 }, { "epoch": 1.75, "learning_rate": 3.820649683419713e-05, "loss": 0.0252, "step": 270410 }, { "epoch": 1.75, "learning_rate": 3.819681547984019e-05, "loss": 0.022, "step": 270420 }, { "epoch": 1.75, "learning_rate": 3.8187134125483254e-05, "loss": 0.0227, "step": 270430 }, { "epoch": 1.75, "learning_rate": 3.817745277112633e-05, "loss": 0.0213, "step": 270440 }, { "epoch": 1.75, "learning_rate": 3.8167771416769393e-05, "loss": 0.0215, "step": 270450 }, { "epoch": 1.75, "learning_rate": 3.8158090062412466e-05, "loss": 0.025, "step": 270460 }, { "epoch": 1.75, "learning_rate": 3.8148408708055526e-05, "loss": 0.0259, "step": 270470 }, { "epoch": 1.75, "learning_rate": 3.81387273536986e-05, "loss": 0.0212, "step": 270480 }, { "epoch": 1.75, "learning_rate": 3.8129045999341665e-05, "loss": 0.0267, "step": 270490 }, { "epoch": 1.75, "learning_rate": 3.811936464498473e-05, "loss": 0.0328, "step": 270500 }, { "epoch": 1.75, "learning_rate": 3.8109683290627804e-05, "loss": 0.0188, "step": 270510 }, { "epoch": 1.75, "learning_rate": 3.8100001936270864e-05, "loss": 0.0263, "step": 270520 }, { "epoch": 1.75, "learning_rate": 3.809032058191394e-05, "loss": 0.0211, "step": 270530 }, { "epoch": 1.75, "learning_rate": 3.8080639227557e-05, "loss": 0.0285, "step": 270540 }, { "epoch": 1.75, "learning_rate": 3.8070957873200076e-05, "loss": 0.0242, "step": 270550 }, { "epoch": 1.75, "learning_rate": 3.806127651884314e-05, "loss": 0.019, "step": 270560 }, { "epoch": 1.75, "learning_rate": 3.80515951644862e-05, "loss": 0.0219, "step": 270570 }, { "epoch": 1.75, "learning_rate": 3.8041913810129275e-05, "loss": 0.0249, "step": 270580 }, { "epoch": 1.75, "learning_rate": 3.803223245577234e-05, "loss": 0.0272, "step": 270590 }, { "epoch": 1.75, "learning_rate": 3.8022551101415414e-05, "loss": 0.0252, "step": 270600 }, { "epoch": 1.75, "learning_rate": 3.801286974705848e-05, "loss": 0.0211, "step": 270610 }, { "epoch": 1.75, "learning_rate": 3.800318839270155e-05, "loss": 0.0213, "step": 270620 }, { "epoch": 1.75, "learning_rate": 3.799350703834461e-05, "loss": 0.0245, "step": 270630 }, { "epoch": 1.75, "learning_rate": 3.798382568398768e-05, "loss": 0.0265, "step": 270640 }, { "epoch": 1.75, "learning_rate": 3.797414432963075e-05, "loss": 0.0236, "step": 270650 }, { "epoch": 1.75, "learning_rate": 3.796446297527382e-05, "loss": 0.0227, "step": 270660 }, { "epoch": 1.75, "learning_rate": 3.795478162091689e-05, "loss": 0.0274, "step": 270670 }, { "epoch": 1.75, "learning_rate": 3.794510026655995e-05, "loss": 0.0196, "step": 270680 }, { "epoch": 1.75, "learning_rate": 3.7935418912203024e-05, "loss": 0.024, "step": 270690 }, { "epoch": 1.75, "learning_rate": 3.792573755784609e-05, "loss": 0.0263, "step": 270700 }, { "epoch": 1.75, "learning_rate": 3.7916056203489156e-05, "loss": 0.0239, "step": 270710 }, { "epoch": 1.75, "learning_rate": 3.790637484913223e-05, "loss": 0.0279, "step": 270720 }, { "epoch": 1.75, "learning_rate": 3.789669349477529e-05, "loss": 0.0217, "step": 270730 }, { "epoch": 1.75, "learning_rate": 3.788701214041836e-05, "loss": 0.0219, "step": 270740 }, { "epoch": 1.75, "learning_rate": 3.787733078606143e-05, "loss": 0.0222, "step": 270750 }, { "epoch": 1.75, "learning_rate": 3.78676494317045e-05, "loss": 0.0255, "step": 270760 }, { "epoch": 1.75, "learning_rate": 3.785796807734757e-05, "loss": 0.0252, "step": 270770 }, { "epoch": 1.75, "learning_rate": 3.784828672299063e-05, "loss": 0.025, "step": 270780 }, { "epoch": 1.75, "learning_rate": 3.78386053686337e-05, "loss": 0.0208, "step": 270790 }, { "epoch": 1.75, "learning_rate": 3.7828924014276766e-05, "loss": 0.0221, "step": 270800 }, { "epoch": 1.75, "learning_rate": 3.781924265991984e-05, "loss": 0.0252, "step": 270810 }, { "epoch": 1.75, "learning_rate": 3.7809561305562905e-05, "loss": 0.0242, "step": 270820 }, { "epoch": 1.75, "learning_rate": 3.779987995120597e-05, "loss": 0.0258, "step": 270830 }, { "epoch": 1.75, "learning_rate": 3.779019859684904e-05, "loss": 0.0263, "step": 270840 }, { "epoch": 1.75, "learning_rate": 3.7780517242492104e-05, "loss": 0.021, "step": 270850 }, { "epoch": 1.75, "learning_rate": 3.777083588813518e-05, "loss": 0.022, "step": 270860 }, { "epoch": 1.75, "learning_rate": 3.776115453377824e-05, "loss": 0.0241, "step": 270870 }, { "epoch": 1.75, "learning_rate": 3.775147317942131e-05, "loss": 0.0198, "step": 270880 }, { "epoch": 1.75, "learning_rate": 3.7741791825064376e-05, "loss": 0.0263, "step": 270890 }, { "epoch": 1.75, "learning_rate": 3.773211047070745e-05, "loss": 0.0269, "step": 270900 }, { "epoch": 1.75, "learning_rate": 3.7722429116350515e-05, "loss": 0.0207, "step": 270910 }, { "epoch": 1.75, "learning_rate": 3.771274776199358e-05, "loss": 0.0235, "step": 270920 }, { "epoch": 1.75, "learning_rate": 3.770306640763665e-05, "loss": 0.024, "step": 270930 }, { "epoch": 1.75, "learning_rate": 3.7693385053279714e-05, "loss": 0.017, "step": 270940 }, { "epoch": 1.75, "learning_rate": 3.768370369892279e-05, "loss": 0.019, "step": 270950 }, { "epoch": 1.75, "learning_rate": 3.767402234456585e-05, "loss": 0.0271, "step": 270960 }, { "epoch": 1.75, "learning_rate": 3.7664340990208926e-05, "loss": 0.0256, "step": 270970 }, { "epoch": 1.75, "learning_rate": 3.7654659635851985e-05, "loss": 0.0243, "step": 270980 }, { "epoch": 1.75, "learning_rate": 3.764497828149505e-05, "loss": 0.0229, "step": 270990 }, { "epoch": 1.75, "learning_rate": 3.7635296927138125e-05, "loss": 0.0211, "step": 271000 }, { "epoch": 1.75, "eval_cer": 0.9198490566037736, "eval_loss": 0.01767873205244541, "eval_runtime": 119.9595, "eval_samples_per_second": 16.672, "eval_steps_per_second": 4.168, "step": 271000 }, { "epoch": 1.75, "learning_rate": 3.762561557278119e-05, "loss": 0.0239, "step": 271010 }, { "epoch": 1.75, "learning_rate": 3.7615934218424264e-05, "loss": 0.0231, "step": 271020 }, { "epoch": 1.75, "learning_rate": 3.7606252864067323e-05, "loss": 0.0234, "step": 271030 }, { "epoch": 1.75, "learning_rate": 3.7596571509710396e-05, "loss": 0.0222, "step": 271040 }, { "epoch": 1.75, "learning_rate": 3.758689015535346e-05, "loss": 0.0239, "step": 271050 }, { "epoch": 1.75, "learning_rate": 3.757720880099653e-05, "loss": 0.0275, "step": 271060 }, { "epoch": 1.75, "learning_rate": 3.75675274466396e-05, "loss": 0.03, "step": 271070 }, { "epoch": 1.75, "learning_rate": 3.755784609228266e-05, "loss": 0.0233, "step": 271080 }, { "epoch": 1.75, "learning_rate": 3.7548164737925734e-05, "loss": 0.0258, "step": 271090 }, { "epoch": 1.75, "learning_rate": 3.75384833835688e-05, "loss": 0.021, "step": 271100 }, { "epoch": 1.75, "learning_rate": 3.7528802029211874e-05, "loss": 0.0265, "step": 271110 }, { "epoch": 1.75, "learning_rate": 3.751912067485494e-05, "loss": 0.0223, "step": 271120 }, { "epoch": 1.75, "learning_rate": 3.7509439320498e-05, "loss": 0.0242, "step": 271130 }, { "epoch": 1.75, "learning_rate": 3.749975796614107e-05, "loss": 0.0274, "step": 271140 }, { "epoch": 1.75, "learning_rate": 3.749007661178414e-05, "loss": 0.0292, "step": 271150 }, { "epoch": 1.75, "learning_rate": 3.7480395257427205e-05, "loss": 0.0203, "step": 271160 }, { "epoch": 1.75, "learning_rate": 3.747071390307028e-05, "loss": 0.0284, "step": 271170 }, { "epoch": 1.75, "learning_rate": 3.7461032548713344e-05, "loss": 0.0285, "step": 271180 }, { "epoch": 1.75, "learning_rate": 3.745135119435641e-05, "loss": 0.0247, "step": 271190 }, { "epoch": 1.75, "learning_rate": 3.744166983999948e-05, "loss": 0.0247, "step": 271200 }, { "epoch": 1.75, "learning_rate": 3.743198848564255e-05, "loss": 0.0234, "step": 271210 }, { "epoch": 1.75, "learning_rate": 3.7422307131285616e-05, "loss": 0.0258, "step": 271220 }, { "epoch": 1.75, "learning_rate": 3.741262577692868e-05, "loss": 0.0233, "step": 271230 }, { "epoch": 1.75, "learning_rate": 3.740294442257175e-05, "loss": 0.0269, "step": 271240 }, { "epoch": 1.75, "learning_rate": 3.739326306821482e-05, "loss": 0.0254, "step": 271250 }, { "epoch": 1.75, "learning_rate": 3.738358171385789e-05, "loss": 0.025, "step": 271260 }, { "epoch": 1.75, "learning_rate": 3.7373900359500954e-05, "loss": 0.0222, "step": 271270 }, { "epoch": 1.75, "learning_rate": 3.736421900514403e-05, "loss": 0.0276, "step": 271280 }, { "epoch": 1.75, "learning_rate": 3.7354537650787086e-05, "loss": 0.0246, "step": 271290 }, { "epoch": 1.75, "learning_rate": 3.734485629643016e-05, "loss": 0.0209, "step": 271300 }, { "epoch": 1.75, "learning_rate": 3.7335174942073226e-05, "loss": 0.0242, "step": 271310 }, { "epoch": 1.75, "learning_rate": 3.732549358771629e-05, "loss": 0.0195, "step": 271320 }, { "epoch": 1.75, "learning_rate": 3.7315812233359365e-05, "loss": 0.0253, "step": 271330 }, { "epoch": 1.75, "learning_rate": 3.730613087900243e-05, "loss": 0.0286, "step": 271340 }, { "epoch": 1.75, "learning_rate": 3.72964495246455e-05, "loss": 0.0271, "step": 271350 }, { "epoch": 1.75, "learning_rate": 3.7286768170288563e-05, "loss": 0.0229, "step": 271360 }, { "epoch": 1.75, "learning_rate": 3.727708681593163e-05, "loss": 0.0291, "step": 271370 }, { "epoch": 1.75, "learning_rate": 3.72674054615747e-05, "loss": 0.0246, "step": 271380 }, { "epoch": 1.75, "learning_rate": 3.725772410721777e-05, "loss": 0.0228, "step": 271390 }, { "epoch": 1.75, "learning_rate": 3.7248042752860835e-05, "loss": 0.0276, "step": 271400 }, { "epoch": 1.75, "learning_rate": 3.723836139850391e-05, "loss": 0.0295, "step": 271410 }, { "epoch": 1.75, "learning_rate": 3.7228680044146974e-05, "loss": 0.0225, "step": 271420 }, { "epoch": 1.75, "learning_rate": 3.721899868979004e-05, "loss": 0.0275, "step": 271430 }, { "epoch": 1.75, "learning_rate": 3.720931733543311e-05, "loss": 0.0242, "step": 271440 }, { "epoch": 1.75, "learning_rate": 3.719963598107617e-05, "loss": 0.0217, "step": 271450 }, { "epoch": 1.75, "learning_rate": 3.7189954626719246e-05, "loss": 0.0248, "step": 271460 }, { "epoch": 1.75, "learning_rate": 3.718027327236231e-05, "loss": 0.0237, "step": 271470 }, { "epoch": 1.75, "learning_rate": 3.717059191800538e-05, "loss": 0.0268, "step": 271480 }, { "epoch": 1.75, "learning_rate": 3.716091056364845e-05, "loss": 0.023, "step": 271490 }, { "epoch": 1.75, "learning_rate": 3.715122920929151e-05, "loss": 0.0232, "step": 271500 }, { "epoch": 1.75, "learning_rate": 3.7141547854934584e-05, "loss": 0.0198, "step": 271510 }, { "epoch": 1.75, "learning_rate": 3.713186650057765e-05, "loss": 0.0287, "step": 271520 }, { "epoch": 1.75, "learning_rate": 3.712218514622072e-05, "loss": 0.0327, "step": 271530 }, { "epoch": 1.75, "learning_rate": 3.711250379186379e-05, "loss": 0.0238, "step": 271540 }, { "epoch": 1.75, "learning_rate": 3.7102822437506856e-05, "loss": 0.0208, "step": 271550 }, { "epoch": 1.75, "learning_rate": 3.709314108314992e-05, "loss": 0.0235, "step": 271560 }, { "epoch": 1.75, "learning_rate": 3.708345972879299e-05, "loss": 0.0288, "step": 271570 }, { "epoch": 1.75, "learning_rate": 3.7073778374436055e-05, "loss": 0.0273, "step": 271580 }, { "epoch": 1.75, "learning_rate": 3.706409702007913e-05, "loss": 0.0264, "step": 271590 }, { "epoch": 1.75, "learning_rate": 3.7054415665722194e-05, "loss": 0.0261, "step": 271600 }, { "epoch": 1.75, "learning_rate": 3.704473431136526e-05, "loss": 0.0264, "step": 271610 }, { "epoch": 1.75, "learning_rate": 3.703505295700833e-05, "loss": 0.0201, "step": 271620 }, { "epoch": 1.75, "learning_rate": 3.702537160265139e-05, "loss": 0.0253, "step": 271630 }, { "epoch": 1.75, "learning_rate": 3.7015690248294466e-05, "loss": 0.0249, "step": 271640 }, { "epoch": 1.75, "learning_rate": 3.700600889393753e-05, "loss": 0.0237, "step": 271650 }, { "epoch": 1.75, "learning_rate": 3.69963275395806e-05, "loss": 0.0191, "step": 271660 }, { "epoch": 1.75, "learning_rate": 3.698664618522367e-05, "loss": 0.0237, "step": 271670 }, { "epoch": 1.75, "learning_rate": 3.697696483086674e-05, "loss": 0.0248, "step": 271680 }, { "epoch": 1.75, "learning_rate": 3.6967283476509804e-05, "loss": 0.0247, "step": 271690 }, { "epoch": 1.75, "learning_rate": 3.695760212215287e-05, "loss": 0.0252, "step": 271700 }, { "epoch": 1.75, "learning_rate": 3.6947920767795936e-05, "loss": 0.0208, "step": 271710 }, { "epoch": 1.75, "learning_rate": 3.693823941343901e-05, "loss": 0.0227, "step": 271720 }, { "epoch": 1.75, "learning_rate": 3.6928558059082075e-05, "loss": 0.029, "step": 271730 }, { "epoch": 1.75, "learning_rate": 3.691887670472514e-05, "loss": 0.0261, "step": 271740 }, { "epoch": 1.75, "learning_rate": 3.6909195350368215e-05, "loss": 0.0204, "step": 271750 }, { "epoch": 1.75, "learning_rate": 3.689951399601128e-05, "loss": 0.022, "step": 271760 }, { "epoch": 1.75, "learning_rate": 3.688983264165435e-05, "loss": 0.0188, "step": 271770 }, { "epoch": 1.75, "learning_rate": 3.688015128729741e-05, "loss": 0.0266, "step": 271780 }, { "epoch": 1.75, "learning_rate": 3.687046993294048e-05, "loss": 0.0204, "step": 271790 }, { "epoch": 1.75, "learning_rate": 3.686078857858355e-05, "loss": 0.0261, "step": 271800 }, { "epoch": 1.75, "learning_rate": 3.685110722422662e-05, "loss": 0.0194, "step": 271810 }, { "epoch": 1.75, "learning_rate": 3.6841425869869685e-05, "loss": 0.02, "step": 271820 }, { "epoch": 1.75, "learning_rate": 3.683174451551276e-05, "loss": 0.0253, "step": 271830 }, { "epoch": 1.75, "learning_rate": 3.682206316115582e-05, "loss": 0.0247, "step": 271840 }, { "epoch": 1.75, "learning_rate": 3.681238180679889e-05, "loss": 0.0268, "step": 271850 }, { "epoch": 1.75, "learning_rate": 3.680270045244196e-05, "loss": 0.0213, "step": 271860 }, { "epoch": 1.75, "learning_rate": 3.679301909808502e-05, "loss": 0.0233, "step": 271870 }, { "epoch": 1.75, "learning_rate": 3.6783337743728096e-05, "loss": 0.0261, "step": 271880 }, { "epoch": 1.75, "learning_rate": 3.677365638937116e-05, "loss": 0.0212, "step": 271890 }, { "epoch": 1.75, "learning_rate": 3.676397503501423e-05, "loss": 0.0259, "step": 271900 }, { "epoch": 1.75, "learning_rate": 3.6754293680657295e-05, "loss": 0.0233, "step": 271910 }, { "epoch": 1.76, "learning_rate": 3.674461232630036e-05, "loss": 0.021, "step": 271920 }, { "epoch": 1.76, "learning_rate": 3.6734930971943434e-05, "loss": 0.0281, "step": 271930 }, { "epoch": 1.76, "learning_rate": 3.67252496175865e-05, "loss": 0.0283, "step": 271940 }, { "epoch": 1.76, "learning_rate": 3.6715568263229566e-05, "loss": 0.0243, "step": 271950 }, { "epoch": 1.76, "learning_rate": 3.670588690887264e-05, "loss": 0.0229, "step": 271960 }, { "epoch": 1.76, "learning_rate": 3.6696205554515706e-05, "loss": 0.0257, "step": 271970 }, { "epoch": 1.76, "learning_rate": 3.668652420015877e-05, "loss": 0.0262, "step": 271980 }, { "epoch": 1.76, "learning_rate": 3.667684284580184e-05, "loss": 0.0235, "step": 271990 }, { "epoch": 1.76, "learning_rate": 3.6667161491444904e-05, "loss": 0.0257, "step": 272000 }, { "epoch": 1.76, "eval_cer": 0.9197975370014687, "eval_loss": 0.01773538440465927, "eval_runtime": 119.9524, "eval_samples_per_second": 16.673, "eval_steps_per_second": 4.168, "step": 272000 }, { "epoch": 1.76, "learning_rate": 3.665748013708798e-05, "loss": 0.0232, "step": 272010 }, { "epoch": 1.76, "learning_rate": 3.6647798782731044e-05, "loss": 0.0271, "step": 272020 }, { "epoch": 1.76, "learning_rate": 3.663811742837411e-05, "loss": 0.0254, "step": 272030 }, { "epoch": 1.76, "learning_rate": 3.662843607401718e-05, "loss": 0.0233, "step": 272040 }, { "epoch": 1.76, "learning_rate": 3.661875471966024e-05, "loss": 0.0213, "step": 272050 }, { "epoch": 1.76, "learning_rate": 3.6609073365303315e-05, "loss": 0.0234, "step": 272060 }, { "epoch": 1.76, "learning_rate": 3.659939201094638e-05, "loss": 0.0229, "step": 272070 }, { "epoch": 1.76, "learning_rate": 3.658971065658945e-05, "loss": 0.0236, "step": 272080 }, { "epoch": 1.76, "learning_rate": 3.658002930223252e-05, "loss": 0.0272, "step": 272090 }, { "epoch": 1.76, "learning_rate": 3.657034794787559e-05, "loss": 0.0222, "step": 272100 }, { "epoch": 1.76, "learning_rate": 3.6560666593518653e-05, "loss": 0.0203, "step": 272110 }, { "epoch": 1.76, "learning_rate": 3.655098523916172e-05, "loss": 0.028, "step": 272120 }, { "epoch": 1.76, "learning_rate": 3.6541303884804786e-05, "loss": 0.0247, "step": 272130 }, { "epoch": 1.76, "learning_rate": 3.653162253044786e-05, "loss": 0.0196, "step": 272140 }, { "epoch": 1.76, "learning_rate": 3.6521941176090925e-05, "loss": 0.0251, "step": 272150 }, { "epoch": 1.76, "learning_rate": 3.651225982173399e-05, "loss": 0.0228, "step": 272160 }, { "epoch": 1.76, "learning_rate": 3.6502578467377064e-05, "loss": 0.0235, "step": 272170 }, { "epoch": 1.76, "learning_rate": 3.649289711302013e-05, "loss": 0.023, "step": 272180 }, { "epoch": 1.76, "learning_rate": 3.64832157586632e-05, "loss": 0.0222, "step": 272190 }, { "epoch": 1.76, "learning_rate": 3.647353440430626e-05, "loss": 0.024, "step": 272200 }, { "epoch": 1.76, "learning_rate": 3.646385304994933e-05, "loss": 0.0217, "step": 272210 }, { "epoch": 1.76, "learning_rate": 3.64541716955924e-05, "loss": 0.0258, "step": 272220 }, { "epoch": 1.76, "learning_rate": 3.644449034123547e-05, "loss": 0.0213, "step": 272230 }, { "epoch": 1.76, "learning_rate": 3.6434808986878535e-05, "loss": 0.019, "step": 272240 }, { "epoch": 1.76, "learning_rate": 3.64251276325216e-05, "loss": 0.0217, "step": 272250 }, { "epoch": 1.76, "learning_rate": 3.641544627816467e-05, "loss": 0.0263, "step": 272260 }, { "epoch": 1.76, "learning_rate": 3.640576492380774e-05, "loss": 0.0248, "step": 272270 }, { "epoch": 1.76, "learning_rate": 3.6396083569450807e-05, "loss": 0.0208, "step": 272280 }, { "epoch": 1.76, "learning_rate": 3.638640221509387e-05, "loss": 0.0262, "step": 272290 }, { "epoch": 1.76, "learning_rate": 3.637672086073694e-05, "loss": 0.0263, "step": 272300 }, { "epoch": 1.76, "learning_rate": 3.636703950638001e-05, "loss": 0.0231, "step": 272310 }, { "epoch": 1.76, "learning_rate": 3.635735815202308e-05, "loss": 0.0251, "step": 272320 }, { "epoch": 1.76, "learning_rate": 3.6347676797666145e-05, "loss": 0.0237, "step": 272330 }, { "epoch": 1.76, "learning_rate": 3.633799544330921e-05, "loss": 0.0208, "step": 272340 }, { "epoch": 1.76, "learning_rate": 3.632831408895228e-05, "loss": 0.0211, "step": 272350 }, { "epoch": 1.76, "learning_rate": 3.631863273459535e-05, "loss": 0.0234, "step": 272360 }, { "epoch": 1.76, "learning_rate": 3.6308951380238416e-05, "loss": 0.0228, "step": 272370 }, { "epoch": 1.76, "learning_rate": 3.629927002588148e-05, "loss": 0.0224, "step": 272380 }, { "epoch": 1.76, "learning_rate": 3.6289588671524556e-05, "loss": 0.0237, "step": 272390 }, { "epoch": 1.76, "learning_rate": 3.6279907317167615e-05, "loss": 0.0244, "step": 272400 }, { "epoch": 1.76, "learning_rate": 3.627022596281069e-05, "loss": 0.0244, "step": 272410 }, { "epoch": 1.76, "learning_rate": 3.6260544608453754e-05, "loss": 0.0242, "step": 272420 }, { "epoch": 1.76, "learning_rate": 3.625086325409682e-05, "loss": 0.021, "step": 272430 }, { "epoch": 1.76, "learning_rate": 3.6241181899739894e-05, "loss": 0.0254, "step": 272440 }, { "epoch": 1.76, "learning_rate": 3.623150054538296e-05, "loss": 0.0237, "step": 272450 }, { "epoch": 1.76, "learning_rate": 3.6221819191026026e-05, "loss": 0.0203, "step": 272460 }, { "epoch": 1.76, "learning_rate": 3.621213783666909e-05, "loss": 0.0253, "step": 272470 }, { "epoch": 1.76, "learning_rate": 3.620245648231216e-05, "loss": 0.0245, "step": 272480 }, { "epoch": 1.76, "learning_rate": 3.619277512795523e-05, "loss": 0.019, "step": 272490 }, { "epoch": 1.76, "learning_rate": 3.61830937735983e-05, "loss": 0.0197, "step": 272500 }, { "epoch": 1.76, "learning_rate": 3.6173412419241364e-05, "loss": 0.0213, "step": 272510 }, { "epoch": 1.76, "learning_rate": 3.616373106488444e-05, "loss": 0.0254, "step": 272520 }, { "epoch": 1.76, "learning_rate": 3.6154049710527496e-05, "loss": 0.0267, "step": 272530 }, { "epoch": 1.76, "learning_rate": 3.614436835617057e-05, "loss": 0.0251, "step": 272540 }, { "epoch": 1.76, "learning_rate": 3.6134687001813636e-05, "loss": 0.0281, "step": 272550 }, { "epoch": 1.76, "learning_rate": 3.61250056474567e-05, "loss": 0.0224, "step": 272560 }, { "epoch": 1.76, "learning_rate": 3.6115324293099775e-05, "loss": 0.0301, "step": 272570 }, { "epoch": 1.76, "learning_rate": 3.610564293874284e-05, "loss": 0.0278, "step": 272580 }, { "epoch": 1.76, "learning_rate": 3.609596158438591e-05, "loss": 0.0234, "step": 272590 }, { "epoch": 1.76, "learning_rate": 3.6086280230028974e-05, "loss": 0.0232, "step": 272600 }, { "epoch": 1.76, "learning_rate": 3.607659887567204e-05, "loss": 0.0195, "step": 272610 }, { "epoch": 1.76, "learning_rate": 3.606691752131511e-05, "loss": 0.0243, "step": 272620 }, { "epoch": 1.76, "learning_rate": 3.605723616695818e-05, "loss": 0.0192, "step": 272630 }, { "epoch": 1.76, "learning_rate": 3.6047554812601245e-05, "loss": 0.0225, "step": 272640 }, { "epoch": 1.76, "learning_rate": 3.603787345824432e-05, "loss": 0.0193, "step": 272650 }, { "epoch": 1.76, "learning_rate": 3.6028192103887385e-05, "loss": 0.025, "step": 272660 }, { "epoch": 1.76, "learning_rate": 3.601851074953045e-05, "loss": 0.0233, "step": 272670 }, { "epoch": 1.76, "learning_rate": 3.600882939517352e-05, "loss": 0.0267, "step": 272680 }, { "epoch": 1.76, "learning_rate": 3.599914804081658e-05, "loss": 0.0228, "step": 272690 }, { "epoch": 1.76, "learning_rate": 3.5989466686459656e-05, "loss": 0.0203, "step": 272700 }, { "epoch": 1.76, "learning_rate": 3.597978533210272e-05, "loss": 0.0247, "step": 272710 }, { "epoch": 1.76, "learning_rate": 3.597010397774579e-05, "loss": 0.0227, "step": 272720 }, { "epoch": 1.76, "learning_rate": 3.596042262338886e-05, "loss": 0.027, "step": 272730 }, { "epoch": 1.76, "learning_rate": 3.595074126903192e-05, "loss": 0.0196, "step": 272740 }, { "epoch": 1.76, "learning_rate": 3.5941059914674994e-05, "loss": 0.0209, "step": 272750 }, { "epoch": 1.76, "learning_rate": 3.593137856031806e-05, "loss": 0.0285, "step": 272760 }, { "epoch": 1.76, "learning_rate": 3.592169720596113e-05, "loss": 0.0268, "step": 272770 }, { "epoch": 1.76, "learning_rate": 3.59120158516042e-05, "loss": 0.0316, "step": 272780 }, { "epoch": 1.76, "learning_rate": 3.5902334497247266e-05, "loss": 0.0204, "step": 272790 }, { "epoch": 1.76, "learning_rate": 3.589265314289033e-05, "loss": 0.0267, "step": 272800 }, { "epoch": 1.76, "learning_rate": 3.58829717885334e-05, "loss": 0.0265, "step": 272810 }, { "epoch": 1.76, "learning_rate": 3.5873290434176465e-05, "loss": 0.0263, "step": 272820 }, { "epoch": 1.76, "learning_rate": 3.586360907981954e-05, "loss": 0.0236, "step": 272830 }, { "epoch": 1.76, "learning_rate": 3.5853927725462604e-05, "loss": 0.0252, "step": 272840 }, { "epoch": 1.76, "learning_rate": 3.584424637110567e-05, "loss": 0.0224, "step": 272850 }, { "epoch": 1.76, "learning_rate": 3.583456501674874e-05, "loss": 0.0254, "step": 272860 }, { "epoch": 1.76, "learning_rate": 3.582488366239181e-05, "loss": 0.023, "step": 272870 }, { "epoch": 1.76, "learning_rate": 3.5815202308034876e-05, "loss": 0.0211, "step": 272880 }, { "epoch": 1.76, "learning_rate": 3.580552095367794e-05, "loss": 0.0245, "step": 272890 }, { "epoch": 1.76, "learning_rate": 3.579583959932101e-05, "loss": 0.0207, "step": 272900 }, { "epoch": 1.76, "learning_rate": 3.578615824496408e-05, "loss": 0.026, "step": 272910 }, { "epoch": 1.76, "learning_rate": 3.577647689060715e-05, "loss": 0.0215, "step": 272920 }, { "epoch": 1.76, "learning_rate": 3.5766795536250214e-05, "loss": 0.024, "step": 272930 }, { "epoch": 1.76, "learning_rate": 3.575711418189329e-05, "loss": 0.0196, "step": 272940 }, { "epoch": 1.76, "learning_rate": 3.5747432827536346e-05, "loss": 0.0223, "step": 272950 }, { "epoch": 1.76, "learning_rate": 3.573775147317942e-05, "loss": 0.0237, "step": 272960 }, { "epoch": 1.76, "learning_rate": 3.5728070118822485e-05, "loss": 0.0233, "step": 272970 }, { "epoch": 1.76, "learning_rate": 3.571838876446555e-05, "loss": 0.0255, "step": 272980 }, { "epoch": 1.76, "learning_rate": 3.5708707410108625e-05, "loss": 0.0219, "step": 272990 }, { "epoch": 1.76, "learning_rate": 3.569902605575169e-05, "loss": 0.0247, "step": 273000 }, { "epoch": 1.76, "eval_cer": 0.9198716529205739, "eval_loss": 0.017535319551825523, "eval_runtime": 119.9947, "eval_samples_per_second": 16.667, "eval_steps_per_second": 4.167, "step": 273000 }, { "epoch": 1.76, "learning_rate": 3.568934470139476e-05, "loss": 0.0234, "step": 273010 }, { "epoch": 1.76, "learning_rate": 3.5679663347037823e-05, "loss": 0.026, "step": 273020 }, { "epoch": 1.76, "learning_rate": 3.566998199268089e-05, "loss": 0.0242, "step": 273030 }, { "epoch": 1.76, "learning_rate": 3.566030063832396e-05, "loss": 0.0275, "step": 273040 }, { "epoch": 1.76, "learning_rate": 3.565061928396703e-05, "loss": 0.0208, "step": 273050 }, { "epoch": 1.76, "learning_rate": 3.5640937929610095e-05, "loss": 0.021, "step": 273060 }, { "epoch": 1.76, "learning_rate": 3.563125657525317e-05, "loss": 0.023, "step": 273070 }, { "epoch": 1.76, "learning_rate": 3.5621575220896234e-05, "loss": 0.0286, "step": 273080 }, { "epoch": 1.76, "learning_rate": 3.56118938665393e-05, "loss": 0.0237, "step": 273090 }, { "epoch": 1.76, "learning_rate": 3.560221251218237e-05, "loss": 0.0286, "step": 273100 }, { "epoch": 1.76, "learning_rate": 3.559253115782543e-05, "loss": 0.0224, "step": 273110 }, { "epoch": 1.76, "learning_rate": 3.5582849803468506e-05, "loss": 0.0251, "step": 273120 }, { "epoch": 1.76, "learning_rate": 3.557316844911157e-05, "loss": 0.0227, "step": 273130 }, { "epoch": 1.76, "learning_rate": 3.556348709475464e-05, "loss": 0.0251, "step": 273140 }, { "epoch": 1.76, "learning_rate": 3.555380574039771e-05, "loss": 0.0242, "step": 273150 }, { "epoch": 1.76, "learning_rate": 3.554412438604077e-05, "loss": 0.0219, "step": 273160 }, { "epoch": 1.76, "learning_rate": 3.5534443031683844e-05, "loss": 0.0261, "step": 273170 }, { "epoch": 1.76, "learning_rate": 3.552476167732691e-05, "loss": 0.0254, "step": 273180 }, { "epoch": 1.76, "learning_rate": 3.551508032296998e-05, "loss": 0.02, "step": 273190 }, { "epoch": 1.76, "learning_rate": 3.550539896861305e-05, "loss": 0.0203, "step": 273200 }, { "epoch": 1.76, "learning_rate": 3.5495717614256116e-05, "loss": 0.0249, "step": 273210 }, { "epoch": 1.76, "learning_rate": 3.548603625989918e-05, "loss": 0.023, "step": 273220 }, { "epoch": 1.76, "learning_rate": 3.547635490554225e-05, "loss": 0.0241, "step": 273230 }, { "epoch": 1.76, "learning_rate": 3.5466673551185315e-05, "loss": 0.0225, "step": 273240 }, { "epoch": 1.76, "learning_rate": 3.545699219682839e-05, "loss": 0.0258, "step": 273250 }, { "epoch": 1.76, "learning_rate": 3.5447310842471454e-05, "loss": 0.0203, "step": 273260 }, { "epoch": 1.76, "learning_rate": 3.543762948811452e-05, "loss": 0.0224, "step": 273270 }, { "epoch": 1.76, "learning_rate": 3.542794813375759e-05, "loss": 0.0226, "step": 273280 }, { "epoch": 1.76, "learning_rate": 3.541826677940066e-05, "loss": 0.0301, "step": 273290 }, { "epoch": 1.76, "learning_rate": 3.5408585425043726e-05, "loss": 0.0198, "step": 273300 }, { "epoch": 1.76, "learning_rate": 3.539890407068679e-05, "loss": 0.0267, "step": 273310 }, { "epoch": 1.76, "learning_rate": 3.538922271632986e-05, "loss": 0.0256, "step": 273320 }, { "epoch": 1.76, "learning_rate": 3.537954136197293e-05, "loss": 0.0282, "step": 273330 }, { "epoch": 1.76, "learning_rate": 3.5369860007616e-05, "loss": 0.0225, "step": 273340 }, { "epoch": 1.76, "learning_rate": 3.5360178653259064e-05, "loss": 0.02, "step": 273350 }, { "epoch": 1.76, "learning_rate": 3.535049729890213e-05, "loss": 0.0251, "step": 273360 }, { "epoch": 1.76, "learning_rate": 3.5340815944545196e-05, "loss": 0.0218, "step": 273370 }, { "epoch": 1.76, "learning_rate": 3.533113459018827e-05, "loss": 0.0193, "step": 273380 }, { "epoch": 1.76, "learning_rate": 3.5321453235831335e-05, "loss": 0.018, "step": 273390 }, { "epoch": 1.76, "learning_rate": 3.53117718814744e-05, "loss": 0.0248, "step": 273400 }, { "epoch": 1.76, "learning_rate": 3.5302090527117475e-05, "loss": 0.0211, "step": 273410 }, { "epoch": 1.76, "learning_rate": 3.529240917276054e-05, "loss": 0.0226, "step": 273420 }, { "epoch": 1.76, "learning_rate": 3.528272781840361e-05, "loss": 0.0213, "step": 273430 }, { "epoch": 1.76, "learning_rate": 3.527304646404667e-05, "loss": 0.0238, "step": 273440 }, { "epoch": 1.76, "learning_rate": 3.526336510968974e-05, "loss": 0.0224, "step": 273450 }, { "epoch": 1.76, "learning_rate": 3.525368375533281e-05, "loss": 0.0246, "step": 273460 }, { "epoch": 1.77, "learning_rate": 3.524400240097588e-05, "loss": 0.0258, "step": 273470 }, { "epoch": 1.77, "learning_rate": 3.5234321046618945e-05, "loss": 0.0259, "step": 273480 }, { "epoch": 1.77, "learning_rate": 3.522463969226202e-05, "loss": 0.0241, "step": 273490 }, { "epoch": 1.77, "learning_rate": 3.521495833790508e-05, "loss": 0.0241, "step": 273500 }, { "epoch": 1.77, "learning_rate": 3.520527698354815e-05, "loss": 0.0247, "step": 273510 }, { "epoch": 1.77, "learning_rate": 3.519559562919122e-05, "loss": 0.0206, "step": 273520 }, { "epoch": 1.77, "learning_rate": 3.518591427483428e-05, "loss": 0.0237, "step": 273530 }, { "epoch": 1.77, "learning_rate": 3.5176232920477356e-05, "loss": 0.0222, "step": 273540 }, { "epoch": 1.77, "learning_rate": 3.516655156612042e-05, "loss": 0.0259, "step": 273550 }, { "epoch": 1.77, "learning_rate": 3.515687021176349e-05, "loss": 0.0234, "step": 273560 }, { "epoch": 1.77, "learning_rate": 3.5147188857406555e-05, "loss": 0.0259, "step": 273570 }, { "epoch": 1.77, "learning_rate": 3.513750750304962e-05, "loss": 0.0173, "step": 273580 }, { "epoch": 1.77, "learning_rate": 3.5127826148692694e-05, "loss": 0.0249, "step": 273590 }, { "epoch": 1.77, "learning_rate": 3.511814479433576e-05, "loss": 0.0222, "step": 273600 }, { "epoch": 1.77, "learning_rate": 3.5108463439978826e-05, "loss": 0.0275, "step": 273610 }, { "epoch": 1.77, "learning_rate": 3.509878208562189e-05, "loss": 0.0205, "step": 273620 }, { "epoch": 1.77, "learning_rate": 3.5089100731264966e-05, "loss": 0.0233, "step": 273630 }, { "epoch": 1.77, "learning_rate": 3.507941937690803e-05, "loss": 0.0237, "step": 273640 }, { "epoch": 1.77, "learning_rate": 3.50697380225511e-05, "loss": 0.023, "step": 273650 }, { "epoch": 1.77, "learning_rate": 3.5060056668194164e-05, "loss": 0.0249, "step": 273660 }, { "epoch": 1.77, "learning_rate": 3.505037531383723e-05, "loss": 0.0234, "step": 273670 }, { "epoch": 1.77, "learning_rate": 3.5040693959480304e-05, "loss": 0.0323, "step": 273680 }, { "epoch": 1.77, "learning_rate": 3.503101260512337e-05, "loss": 0.0225, "step": 273690 }, { "epoch": 1.77, "learning_rate": 3.5021331250766436e-05, "loss": 0.0228, "step": 273700 }, { "epoch": 1.77, "learning_rate": 3.50116498964095e-05, "loss": 0.0241, "step": 273710 }, { "epoch": 1.77, "learning_rate": 3.500196854205257e-05, "loss": 0.0228, "step": 273720 }, { "epoch": 1.77, "learning_rate": 3.499228718769564e-05, "loss": 0.0234, "step": 273730 }, { "epoch": 1.77, "learning_rate": 3.498260583333871e-05, "loss": 0.0219, "step": 273740 }, { "epoch": 1.77, "learning_rate": 3.4972924478981774e-05, "loss": 0.0248, "step": 273750 }, { "epoch": 1.77, "learning_rate": 3.496324312462485e-05, "loss": 0.0234, "step": 273760 }, { "epoch": 1.77, "learning_rate": 3.495356177026791e-05, "loss": 0.0276, "step": 273770 }, { "epoch": 1.77, "learning_rate": 3.494388041591098e-05, "loss": 0.023, "step": 273780 }, { "epoch": 1.77, "learning_rate": 3.4934199061554046e-05, "loss": 0.0253, "step": 273790 }, { "epoch": 1.77, "learning_rate": 3.492451770719711e-05, "loss": 0.0204, "step": 273800 }, { "epoch": 1.77, "learning_rate": 3.4914836352840185e-05, "loss": 0.0232, "step": 273810 }, { "epoch": 1.77, "learning_rate": 3.490515499848325e-05, "loss": 0.0187, "step": 273820 }, { "epoch": 1.77, "learning_rate": 3.489547364412632e-05, "loss": 0.024, "step": 273830 }, { "epoch": 1.77, "learning_rate": 3.488579228976939e-05, "loss": 0.0226, "step": 273840 }, { "epoch": 1.77, "learning_rate": 3.487611093541245e-05, "loss": 0.0226, "step": 273850 }, { "epoch": 1.77, "learning_rate": 3.486642958105552e-05, "loss": 0.0292, "step": 273860 }, { "epoch": 1.77, "learning_rate": 3.485674822669859e-05, "loss": 0.023, "step": 273870 }, { "epoch": 1.77, "learning_rate": 3.4847066872341656e-05, "loss": 0.019, "step": 273880 }, { "epoch": 1.77, "learning_rate": 3.483738551798473e-05, "loss": 0.022, "step": 273890 }, { "epoch": 1.77, "learning_rate": 3.4827704163627795e-05, "loss": 0.0236, "step": 273900 }, { "epoch": 1.77, "learning_rate": 3.481802280927086e-05, "loss": 0.0243, "step": 273910 }, { "epoch": 1.77, "learning_rate": 3.480834145491393e-05, "loss": 0.0224, "step": 273920 }, { "epoch": 1.77, "learning_rate": 3.4798660100556994e-05, "loss": 0.0286, "step": 273930 }, { "epoch": 1.77, "learning_rate": 3.4788978746200067e-05, "loss": 0.0249, "step": 273940 }, { "epoch": 1.77, "learning_rate": 3.477929739184313e-05, "loss": 0.0216, "step": 273950 }, { "epoch": 1.77, "learning_rate": 3.47696160374862e-05, "loss": 0.0212, "step": 273960 }, { "epoch": 1.77, "learning_rate": 3.475993468312927e-05, "loss": 0.0264, "step": 273970 }, { "epoch": 1.77, "learning_rate": 3.475025332877234e-05, "loss": 0.0223, "step": 273980 }, { "epoch": 1.77, "learning_rate": 3.4740571974415405e-05, "loss": 0.0199, "step": 273990 }, { "epoch": 1.77, "learning_rate": 3.473089062005847e-05, "loss": 0.0323, "step": 274000 }, { "epoch": 1.77, "eval_cer": 0.9198553835724776, "eval_loss": 0.017592335119843483, "eval_runtime": 119.8118, "eval_samples_per_second": 16.693, "eval_steps_per_second": 4.173, "step": 274000 }, { "epoch": 1.77, "learning_rate": 3.472120926570154e-05, "loss": 0.0225, "step": 274010 }, { "epoch": 1.77, "learning_rate": 3.471152791134461e-05, "loss": 0.0205, "step": 274020 }, { "epoch": 1.77, "learning_rate": 3.4701846556987676e-05, "loss": 0.0267, "step": 274030 }, { "epoch": 1.77, "learning_rate": 3.469216520263074e-05, "loss": 0.0236, "step": 274040 }, { "epoch": 1.77, "learning_rate": 3.4682483848273816e-05, "loss": 0.0201, "step": 274050 }, { "epoch": 1.77, "learning_rate": 3.4672802493916875e-05, "loss": 0.0257, "step": 274060 }, { "epoch": 1.77, "learning_rate": 3.466312113955995e-05, "loss": 0.0254, "step": 274070 }, { "epoch": 1.77, "learning_rate": 3.4653439785203014e-05, "loss": 0.0265, "step": 274080 }, { "epoch": 1.77, "learning_rate": 3.464375843084608e-05, "loss": 0.024, "step": 274090 }, { "epoch": 1.77, "learning_rate": 3.4634077076489153e-05, "loss": 0.0233, "step": 274100 }, { "epoch": 1.77, "learning_rate": 3.462439572213222e-05, "loss": 0.0219, "step": 274110 }, { "epoch": 1.77, "learning_rate": 3.4614714367775286e-05, "loss": 0.0245, "step": 274120 }, { "epoch": 1.77, "learning_rate": 3.460503301341835e-05, "loss": 0.0253, "step": 274130 }, { "epoch": 1.77, "learning_rate": 3.459535165906142e-05, "loss": 0.0248, "step": 274140 }, { "epoch": 1.77, "learning_rate": 3.458567030470449e-05, "loss": 0.0244, "step": 274150 }, { "epoch": 1.77, "learning_rate": 3.457598895034756e-05, "loss": 0.0274, "step": 274160 }, { "epoch": 1.77, "learning_rate": 3.4566307595990624e-05, "loss": 0.0226, "step": 274170 }, { "epoch": 1.77, "learning_rate": 3.45566262416337e-05, "loss": 0.0218, "step": 274180 }, { "epoch": 1.77, "learning_rate": 3.4546944887276756e-05, "loss": 0.0297, "step": 274190 }, { "epoch": 1.77, "learning_rate": 3.453726353291983e-05, "loss": 0.028, "step": 274200 }, { "epoch": 1.77, "learning_rate": 3.4527582178562896e-05, "loss": 0.0209, "step": 274210 }, { "epoch": 1.77, "learning_rate": 3.451790082420596e-05, "loss": 0.0235, "step": 274220 }, { "epoch": 1.77, "learning_rate": 3.4508219469849035e-05, "loss": 0.0261, "step": 274230 }, { "epoch": 1.77, "learning_rate": 3.44985381154921e-05, "loss": 0.0238, "step": 274240 }, { "epoch": 1.77, "learning_rate": 3.448885676113517e-05, "loss": 0.0259, "step": 274250 }, { "epoch": 1.77, "learning_rate": 3.4479175406778234e-05, "loss": 0.0248, "step": 274260 }, { "epoch": 1.77, "learning_rate": 3.44694940524213e-05, "loss": 0.0269, "step": 274270 }, { "epoch": 1.77, "learning_rate": 3.445981269806437e-05, "loss": 0.028, "step": 274280 }, { "epoch": 1.77, "learning_rate": 3.445013134370744e-05, "loss": 0.0215, "step": 274290 }, { "epoch": 1.77, "learning_rate": 3.4440449989350505e-05, "loss": 0.0212, "step": 274300 }, { "epoch": 1.77, "learning_rate": 3.443076863499358e-05, "loss": 0.0218, "step": 274310 }, { "epoch": 1.77, "learning_rate": 3.4421087280636645e-05, "loss": 0.0265, "step": 274320 }, { "epoch": 1.77, "learning_rate": 3.441140592627971e-05, "loss": 0.0255, "step": 274330 }, { "epoch": 1.77, "learning_rate": 3.440172457192278e-05, "loss": 0.0258, "step": 274340 }, { "epoch": 1.77, "learning_rate": 3.439204321756584e-05, "loss": 0.0207, "step": 274350 }, { "epoch": 1.77, "learning_rate": 3.4382361863208916e-05, "loss": 0.025, "step": 274360 }, { "epoch": 1.77, "learning_rate": 3.437268050885198e-05, "loss": 0.0246, "step": 274370 }, { "epoch": 1.77, "learning_rate": 3.436299915449505e-05, "loss": 0.0293, "step": 274380 }, { "epoch": 1.77, "learning_rate": 3.435331780013812e-05, "loss": 0.0268, "step": 274390 }, { "epoch": 1.77, "learning_rate": 3.434363644578118e-05, "loss": 0.0227, "step": 274400 }, { "epoch": 1.77, "learning_rate": 3.4333955091424254e-05, "loss": 0.0229, "step": 274410 }, { "epoch": 1.77, "learning_rate": 3.432427373706732e-05, "loss": 0.0227, "step": 274420 }, { "epoch": 1.77, "learning_rate": 3.431459238271039e-05, "loss": 0.0245, "step": 274430 }, { "epoch": 1.77, "learning_rate": 3.430491102835346e-05, "loss": 0.0248, "step": 274440 }, { "epoch": 1.77, "learning_rate": 3.4295229673996526e-05, "loss": 0.0247, "step": 274450 }, { "epoch": 1.77, "learning_rate": 3.428554831963959e-05, "loss": 0.0218, "step": 274460 }, { "epoch": 1.77, "learning_rate": 3.427586696528266e-05, "loss": 0.0241, "step": 274470 }, { "epoch": 1.77, "learning_rate": 3.4266185610925725e-05, "loss": 0.0232, "step": 274480 }, { "epoch": 1.77, "learning_rate": 3.42565042565688e-05, "loss": 0.0229, "step": 274490 }, { "epoch": 1.77, "learning_rate": 3.4246822902211864e-05, "loss": 0.0274, "step": 274500 }, { "epoch": 1.77, "learning_rate": 3.423714154785493e-05, "loss": 0.0247, "step": 274510 }, { "epoch": 1.77, "learning_rate": 3.4227460193498e-05, "loss": 0.0216, "step": 274520 }, { "epoch": 1.77, "learning_rate": 3.421777883914107e-05, "loss": 0.0231, "step": 274530 }, { "epoch": 1.77, "learning_rate": 3.4208097484784136e-05, "loss": 0.0217, "step": 274540 }, { "epoch": 1.77, "learning_rate": 3.41984161304272e-05, "loss": 0.0215, "step": 274550 }, { "epoch": 1.77, "learning_rate": 3.418873477607027e-05, "loss": 0.0202, "step": 274560 }, { "epoch": 1.77, "learning_rate": 3.417905342171334e-05, "loss": 0.0264, "step": 274570 }, { "epoch": 1.77, "learning_rate": 3.416937206735641e-05, "loss": 0.0252, "step": 274580 }, { "epoch": 1.77, "learning_rate": 3.4159690712999474e-05, "loss": 0.0227, "step": 274590 }, { "epoch": 1.77, "learning_rate": 3.415000935864255e-05, "loss": 0.0256, "step": 274600 }, { "epoch": 1.77, "learning_rate": 3.4140328004285606e-05, "loss": 0.0238, "step": 274610 }, { "epoch": 1.77, "learning_rate": 3.413064664992868e-05, "loss": 0.021, "step": 274620 }, { "epoch": 1.77, "learning_rate": 3.4120965295571745e-05, "loss": 0.0219, "step": 274630 }, { "epoch": 1.77, "learning_rate": 3.411128394121481e-05, "loss": 0.0209, "step": 274640 }, { "epoch": 1.77, "learning_rate": 3.4101602586857885e-05, "loss": 0.0223, "step": 274650 }, { "epoch": 1.77, "learning_rate": 3.409192123250095e-05, "loss": 0.0273, "step": 274660 }, { "epoch": 1.77, "learning_rate": 3.408223987814402e-05, "loss": 0.0226, "step": 274670 }, { "epoch": 1.77, "learning_rate": 3.4072558523787083e-05, "loss": 0.0241, "step": 274680 }, { "epoch": 1.77, "learning_rate": 3.406287716943015e-05, "loss": 0.0185, "step": 274690 }, { "epoch": 1.77, "learning_rate": 3.405319581507322e-05, "loss": 0.0213, "step": 274700 }, { "epoch": 1.77, "learning_rate": 3.404351446071629e-05, "loss": 0.022, "step": 274710 }, { "epoch": 1.77, "learning_rate": 3.4033833106359355e-05, "loss": 0.0211, "step": 274720 }, { "epoch": 1.77, "learning_rate": 3.402415175200243e-05, "loss": 0.026, "step": 274730 }, { "epoch": 1.77, "learning_rate": 3.4014470397645494e-05, "loss": 0.0259, "step": 274740 }, { "epoch": 1.77, "learning_rate": 3.400478904328856e-05, "loss": 0.0208, "step": 274750 }, { "epoch": 1.77, "learning_rate": 3.399510768893163e-05, "loss": 0.0225, "step": 274760 }, { "epoch": 1.77, "learning_rate": 3.398542633457469e-05, "loss": 0.0238, "step": 274770 }, { "epoch": 1.77, "learning_rate": 3.3975744980217766e-05, "loss": 0.0206, "step": 274780 }, { "epoch": 1.77, "learning_rate": 3.396606362586083e-05, "loss": 0.0238, "step": 274790 }, { "epoch": 1.77, "learning_rate": 3.39563822715039e-05, "loss": 0.0207, "step": 274800 }, { "epoch": 1.77, "learning_rate": 3.394670091714697e-05, "loss": 0.0255, "step": 274810 }, { "epoch": 1.77, "learning_rate": 3.393701956279003e-05, "loss": 0.0248, "step": 274820 }, { "epoch": 1.77, "learning_rate": 3.3927338208433104e-05, "loss": 0.0252, "step": 274830 }, { "epoch": 1.77, "learning_rate": 3.391765685407617e-05, "loss": 0.0234, "step": 274840 }, { "epoch": 1.77, "learning_rate": 3.390797549971924e-05, "loss": 0.0237, "step": 274850 }, { "epoch": 1.77, "learning_rate": 3.389829414536231e-05, "loss": 0.0267, "step": 274860 }, { "epoch": 1.77, "learning_rate": 3.3888612791005376e-05, "loss": 0.0198, "step": 274870 }, { "epoch": 1.77, "learning_rate": 3.387893143664844e-05, "loss": 0.0215, "step": 274880 }, { "epoch": 1.77, "learning_rate": 3.386925008229151e-05, "loss": 0.0209, "step": 274890 }, { "epoch": 1.77, "learning_rate": 3.3859568727934575e-05, "loss": 0.0191, "step": 274900 }, { "epoch": 1.77, "learning_rate": 3.384988737357765e-05, "loss": 0.0236, "step": 274910 }, { "epoch": 1.77, "learning_rate": 3.3840206019220714e-05, "loss": 0.0267, "step": 274920 }, { "epoch": 1.77, "learning_rate": 3.383052466486378e-05, "loss": 0.0192, "step": 274930 }, { "epoch": 1.77, "learning_rate": 3.3820843310506846e-05, "loss": 0.0226, "step": 274940 }, { "epoch": 1.77, "learning_rate": 3.381116195614992e-05, "loss": 0.0294, "step": 274950 }, { "epoch": 1.77, "learning_rate": 3.3801480601792986e-05, "loss": 0.0241, "step": 274960 }, { "epoch": 1.77, "learning_rate": 3.379179924743605e-05, "loss": 0.024, "step": 274970 }, { "epoch": 1.77, "learning_rate": 3.378211789307912e-05, "loss": 0.0212, "step": 274980 }, { "epoch": 1.77, "learning_rate": 3.3772436538722184e-05, "loss": 0.024, "step": 274990 }, { "epoch": 1.77, "learning_rate": 3.376275518436526e-05, "loss": 0.0236, "step": 275000 }, { "epoch": 1.77, "eval_cer": 0.9198418257823975, "eval_loss": 0.017496764659881592, "eval_runtime": 119.762, "eval_samples_per_second": 16.7, "eval_steps_per_second": 4.175, "step": 275000 }, { "epoch": 1.77, "learning_rate": 3.3753073830008324e-05, "loss": 0.0252, "step": 275010 }, { "epoch": 1.78, "learning_rate": 3.374339247565139e-05, "loss": 0.0238, "step": 275020 }, { "epoch": 1.78, "learning_rate": 3.3733711121294456e-05, "loss": 0.0222, "step": 275030 }, { "epoch": 1.78, "learning_rate": 3.372402976693752e-05, "loss": 0.0225, "step": 275040 }, { "epoch": 1.78, "learning_rate": 3.3714348412580595e-05, "loss": 0.025, "step": 275050 }, { "epoch": 1.78, "learning_rate": 3.370466705822366e-05, "loss": 0.0213, "step": 275060 }, { "epoch": 1.78, "learning_rate": 3.369498570386673e-05, "loss": 0.0199, "step": 275070 }, { "epoch": 1.78, "learning_rate": 3.36853043495098e-05, "loss": 0.0211, "step": 275080 }, { "epoch": 1.78, "learning_rate": 3.367562299515286e-05, "loss": 0.023, "step": 275090 }, { "epoch": 1.78, "learning_rate": 3.366594164079593e-05, "loss": 0.0233, "step": 275100 }, { "epoch": 1.78, "learning_rate": 3.3656260286439e-05, "loss": 0.0209, "step": 275110 }, { "epoch": 1.78, "learning_rate": 3.3646578932082066e-05, "loss": 0.0227, "step": 275120 }, { "epoch": 1.78, "learning_rate": 3.363689757772514e-05, "loss": 0.0212, "step": 275130 }, { "epoch": 1.78, "learning_rate": 3.3627216223368205e-05, "loss": 0.0245, "step": 275140 }, { "epoch": 1.78, "learning_rate": 3.361753486901127e-05, "loss": 0.0208, "step": 275150 }, { "epoch": 1.78, "learning_rate": 3.360785351465434e-05, "loss": 0.0233, "step": 275160 }, { "epoch": 1.78, "learning_rate": 3.3598172160297404e-05, "loss": 0.023, "step": 275170 }, { "epoch": 1.78, "learning_rate": 3.358849080594048e-05, "loss": 0.0215, "step": 275180 }, { "epoch": 1.78, "learning_rate": 3.357880945158354e-05, "loss": 0.0226, "step": 275190 }, { "epoch": 1.78, "learning_rate": 3.356912809722661e-05, "loss": 0.0221, "step": 275200 }, { "epoch": 1.78, "learning_rate": 3.355944674286968e-05, "loss": 0.0303, "step": 275210 }, { "epoch": 1.78, "learning_rate": 3.354976538851275e-05, "loss": 0.0233, "step": 275220 }, { "epoch": 1.78, "learning_rate": 3.3540084034155815e-05, "loss": 0.0208, "step": 275230 }, { "epoch": 1.78, "learning_rate": 3.353040267979888e-05, "loss": 0.0227, "step": 275240 }, { "epoch": 1.78, "learning_rate": 3.352072132544195e-05, "loss": 0.0234, "step": 275250 }, { "epoch": 1.78, "learning_rate": 3.351103997108502e-05, "loss": 0.0195, "step": 275260 }, { "epoch": 1.78, "learning_rate": 3.3501358616728086e-05, "loss": 0.0233, "step": 275270 }, { "epoch": 1.78, "learning_rate": 3.349167726237115e-05, "loss": 0.0227, "step": 275280 }, { "epoch": 1.78, "learning_rate": 3.3481995908014226e-05, "loss": 0.0244, "step": 275290 }, { "epoch": 1.78, "learning_rate": 3.3472314553657285e-05, "loss": 0.0293, "step": 275300 }, { "epoch": 1.78, "learning_rate": 3.346263319930036e-05, "loss": 0.0291, "step": 275310 }, { "epoch": 1.78, "learning_rate": 3.3452951844943424e-05, "loss": 0.0231, "step": 275320 }, { "epoch": 1.78, "learning_rate": 3.344327049058649e-05, "loss": 0.029, "step": 275330 }, { "epoch": 1.78, "learning_rate": 3.3433589136229564e-05, "loss": 0.0208, "step": 275340 }, { "epoch": 1.78, "learning_rate": 3.342390778187263e-05, "loss": 0.0222, "step": 275350 }, { "epoch": 1.78, "learning_rate": 3.3414226427515696e-05, "loss": 0.0224, "step": 275360 }, { "epoch": 1.78, "learning_rate": 3.340454507315876e-05, "loss": 0.0232, "step": 275370 }, { "epoch": 1.78, "learning_rate": 3.339486371880183e-05, "loss": 0.0207, "step": 275380 }, { "epoch": 1.78, "learning_rate": 3.33851823644449e-05, "loss": 0.0251, "step": 275390 }, { "epoch": 1.78, "learning_rate": 3.337550101008797e-05, "loss": 0.0241, "step": 275400 }, { "epoch": 1.78, "learning_rate": 3.3365819655731034e-05, "loss": 0.025, "step": 275410 }, { "epoch": 1.78, "learning_rate": 3.335613830137411e-05, "loss": 0.0248, "step": 275420 }, { "epoch": 1.78, "learning_rate": 3.334645694701717e-05, "loss": 0.0201, "step": 275430 }, { "epoch": 1.78, "learning_rate": 3.333677559266024e-05, "loss": 0.0198, "step": 275440 }, { "epoch": 1.78, "learning_rate": 3.3327094238303306e-05, "loss": 0.03, "step": 275450 }, { "epoch": 1.78, "learning_rate": 3.331741288394637e-05, "loss": 0.0229, "step": 275460 }, { "epoch": 1.78, "learning_rate": 3.3307731529589445e-05, "loss": 0.0236, "step": 275470 }, { "epoch": 1.78, "learning_rate": 3.329805017523251e-05, "loss": 0.0273, "step": 275480 }, { "epoch": 1.78, "learning_rate": 3.328836882087558e-05, "loss": 0.0237, "step": 275490 }, { "epoch": 1.78, "learning_rate": 3.327868746651865e-05, "loss": 0.0257, "step": 275500 }, { "epoch": 1.78, "learning_rate": 3.326900611216171e-05, "loss": 0.0225, "step": 275510 }, { "epoch": 1.78, "learning_rate": 3.325932475780478e-05, "loss": 0.0293, "step": 275520 }, { "epoch": 1.78, "learning_rate": 3.324964340344785e-05, "loss": 0.0223, "step": 275530 }, { "epoch": 1.78, "learning_rate": 3.3239962049090916e-05, "loss": 0.0209, "step": 275540 }, { "epoch": 1.78, "learning_rate": 3.323028069473399e-05, "loss": 0.0243, "step": 275550 }, { "epoch": 1.78, "learning_rate": 3.3220599340377055e-05, "loss": 0.0255, "step": 275560 }, { "epoch": 1.78, "learning_rate": 3.321091798602012e-05, "loss": 0.0251, "step": 275570 }, { "epoch": 1.78, "learning_rate": 3.320123663166319e-05, "loss": 0.0298, "step": 275580 }, { "epoch": 1.78, "learning_rate": 3.3191555277306254e-05, "loss": 0.0241, "step": 275590 }, { "epoch": 1.78, "learning_rate": 3.3181873922949327e-05, "loss": 0.0241, "step": 275600 }, { "epoch": 1.78, "learning_rate": 3.317219256859239e-05, "loss": 0.0248, "step": 275610 }, { "epoch": 1.78, "learning_rate": 3.316251121423546e-05, "loss": 0.0238, "step": 275620 }, { "epoch": 1.78, "learning_rate": 3.315282985987853e-05, "loss": 0.0207, "step": 275630 }, { "epoch": 1.78, "learning_rate": 3.31431485055216e-05, "loss": 0.0234, "step": 275640 }, { "epoch": 1.78, "learning_rate": 3.3133467151164664e-05, "loss": 0.0299, "step": 275650 }, { "epoch": 1.78, "learning_rate": 3.312378579680773e-05, "loss": 0.023, "step": 275660 }, { "epoch": 1.78, "learning_rate": 3.31141044424508e-05, "loss": 0.0224, "step": 275670 }, { "epoch": 1.78, "learning_rate": 3.310442308809387e-05, "loss": 0.0251, "step": 275680 }, { "epoch": 1.78, "learning_rate": 3.3094741733736936e-05, "loss": 0.0236, "step": 275690 }, { "epoch": 1.78, "learning_rate": 3.308506037938e-05, "loss": 0.0221, "step": 275700 }, { "epoch": 1.78, "learning_rate": 3.3075379025023075e-05, "loss": 0.0289, "step": 275710 }, { "epoch": 1.78, "learning_rate": 3.3065697670666135e-05, "loss": 0.0232, "step": 275720 }, { "epoch": 1.78, "learning_rate": 3.305601631630921e-05, "loss": 0.0264, "step": 275730 }, { "epoch": 1.78, "learning_rate": 3.3046334961952274e-05, "loss": 0.0243, "step": 275740 }, { "epoch": 1.78, "learning_rate": 3.303665360759534e-05, "loss": 0.0206, "step": 275750 }, { "epoch": 1.78, "learning_rate": 3.3026972253238413e-05, "loss": 0.0228, "step": 275760 }, { "epoch": 1.78, "learning_rate": 3.301729089888148e-05, "loss": 0.0233, "step": 275770 }, { "epoch": 1.78, "learning_rate": 3.3007609544524546e-05, "loss": 0.022, "step": 275780 }, { "epoch": 1.78, "learning_rate": 3.299792819016761e-05, "loss": 0.0233, "step": 275790 }, { "epoch": 1.78, "learning_rate": 3.298824683581068e-05, "loss": 0.0262, "step": 275800 }, { "epoch": 1.78, "learning_rate": 3.297856548145375e-05, "loss": 0.0207, "step": 275810 }, { "epoch": 1.78, "learning_rate": 3.296888412709682e-05, "loss": 0.0222, "step": 275820 }, { "epoch": 1.78, "learning_rate": 3.2959202772739884e-05, "loss": 0.0214, "step": 275830 }, { "epoch": 1.78, "learning_rate": 3.294952141838296e-05, "loss": 0.0204, "step": 275840 }, { "epoch": 1.78, "learning_rate": 3.293984006402602e-05, "loss": 0.0252, "step": 275850 }, { "epoch": 1.78, "learning_rate": 3.293015870966909e-05, "loss": 0.0268, "step": 275860 }, { "epoch": 1.78, "learning_rate": 3.2920477355312156e-05, "loss": 0.0249, "step": 275870 }, { "epoch": 1.78, "learning_rate": 3.291079600095522e-05, "loss": 0.0244, "step": 275880 }, { "epoch": 1.78, "learning_rate": 3.2901114646598295e-05, "loss": 0.023, "step": 275890 }, { "epoch": 1.78, "learning_rate": 3.289143329224136e-05, "loss": 0.0191, "step": 275900 }, { "epoch": 1.78, "learning_rate": 3.288175193788443e-05, "loss": 0.0235, "step": 275910 }, { "epoch": 1.78, "learning_rate": 3.2872070583527494e-05, "loss": 0.0266, "step": 275920 }, { "epoch": 1.78, "learning_rate": 3.286238922917056e-05, "loss": 0.0267, "step": 275930 }, { "epoch": 1.78, "learning_rate": 3.285270787481363e-05, "loss": 0.0238, "step": 275940 }, { "epoch": 1.78, "learning_rate": 3.28430265204567e-05, "loss": 0.0255, "step": 275950 }, { "epoch": 1.78, "learning_rate": 3.2833345166099765e-05, "loss": 0.0221, "step": 275960 }, { "epoch": 1.78, "learning_rate": 3.282366381174284e-05, "loss": 0.0244, "step": 275970 }, { "epoch": 1.78, "learning_rate": 3.2813982457385905e-05, "loss": 0.0278, "step": 275980 }, { "epoch": 1.78, "learning_rate": 3.280430110302897e-05, "loss": 0.0245, "step": 275990 }, { "epoch": 1.78, "learning_rate": 3.279461974867204e-05, "loss": 0.0202, "step": 276000 }, { "epoch": 1.78, "eval_cer": 0.9197794599480285, "eval_loss": 0.017633169889450073, "eval_runtime": 120.0188, "eval_samples_per_second": 16.664, "eval_steps_per_second": 4.166, "step": 276000 }, { "epoch": 1.78, "learning_rate": 3.27849383943151e-05, "loss": 0.0197, "step": 276010 }, { "epoch": 1.78, "learning_rate": 3.2775257039958176e-05, "loss": 0.0227, "step": 276020 }, { "epoch": 1.78, "learning_rate": 3.276557568560124e-05, "loss": 0.026, "step": 276030 }, { "epoch": 1.78, "learning_rate": 3.275589433124431e-05, "loss": 0.0253, "step": 276040 }, { "epoch": 1.78, "learning_rate": 3.274621297688738e-05, "loss": 0.0258, "step": 276050 }, { "epoch": 1.78, "learning_rate": 3.273653162253044e-05, "loss": 0.0235, "step": 276060 }, { "epoch": 1.78, "learning_rate": 3.2726850268173514e-05, "loss": 0.0358, "step": 276070 }, { "epoch": 1.78, "learning_rate": 3.271716891381658e-05, "loss": 0.0219, "step": 276080 }, { "epoch": 1.78, "learning_rate": 3.270748755945965e-05, "loss": 0.0241, "step": 276090 }, { "epoch": 1.78, "learning_rate": 3.269780620510272e-05, "loss": 0.0193, "step": 276100 }, { "epoch": 1.78, "learning_rate": 3.2688124850745786e-05, "loss": 0.0227, "step": 276110 }, { "epoch": 1.78, "learning_rate": 3.267844349638885e-05, "loss": 0.024, "step": 276120 }, { "epoch": 1.78, "learning_rate": 3.266876214203192e-05, "loss": 0.0212, "step": 276130 }, { "epoch": 1.78, "learning_rate": 3.2659080787674985e-05, "loss": 0.0241, "step": 276140 }, { "epoch": 1.78, "learning_rate": 3.264939943331806e-05, "loss": 0.0215, "step": 276150 }, { "epoch": 1.78, "learning_rate": 3.2639718078961124e-05, "loss": 0.0226, "step": 276160 }, { "epoch": 1.78, "learning_rate": 3.263003672460419e-05, "loss": 0.0211, "step": 276170 }, { "epoch": 1.78, "learning_rate": 3.262035537024726e-05, "loss": 0.0254, "step": 276180 }, { "epoch": 1.78, "learning_rate": 3.261067401589033e-05, "loss": 0.0228, "step": 276190 }, { "epoch": 1.78, "learning_rate": 3.2600992661533396e-05, "loss": 0.0217, "step": 276200 }, { "epoch": 1.78, "learning_rate": 3.259131130717646e-05, "loss": 0.0242, "step": 276210 }, { "epoch": 1.78, "learning_rate": 3.258162995281953e-05, "loss": 0.0203, "step": 276220 }, { "epoch": 1.78, "learning_rate": 3.25719485984626e-05, "loss": 0.0217, "step": 276230 }, { "epoch": 1.78, "learning_rate": 3.256226724410567e-05, "loss": 0.0216, "step": 276240 }, { "epoch": 1.78, "learning_rate": 3.2552585889748734e-05, "loss": 0.0176, "step": 276250 }, { "epoch": 1.78, "learning_rate": 3.25429045353918e-05, "loss": 0.0233, "step": 276260 }, { "epoch": 1.78, "learning_rate": 3.2533223181034866e-05, "loss": 0.0241, "step": 276270 }, { "epoch": 1.78, "learning_rate": 3.252354182667794e-05, "loss": 0.0239, "step": 276280 }, { "epoch": 1.78, "learning_rate": 3.2513860472321005e-05, "loss": 0.0216, "step": 276290 }, { "epoch": 1.78, "learning_rate": 3.250417911796407e-05, "loss": 0.023, "step": 276300 }, { "epoch": 1.78, "learning_rate": 3.249449776360714e-05, "loss": 0.0213, "step": 276310 }, { "epoch": 1.78, "learning_rate": 3.248481640925021e-05, "loss": 0.0251, "step": 276320 }, { "epoch": 1.78, "learning_rate": 3.247513505489328e-05, "loss": 0.0221, "step": 276330 }, { "epoch": 1.78, "learning_rate": 3.2465453700536343e-05, "loss": 0.0209, "step": 276340 }, { "epoch": 1.78, "learning_rate": 3.245577234617941e-05, "loss": 0.023, "step": 276350 }, { "epoch": 1.78, "learning_rate": 3.244609099182248e-05, "loss": 0.0181, "step": 276360 }, { "epoch": 1.78, "learning_rate": 3.243640963746555e-05, "loss": 0.0235, "step": 276370 }, { "epoch": 1.78, "learning_rate": 3.2426728283108615e-05, "loss": 0.026, "step": 276380 }, { "epoch": 1.78, "learning_rate": 3.241704692875168e-05, "loss": 0.0244, "step": 276390 }, { "epoch": 1.78, "learning_rate": 3.2407365574394754e-05, "loss": 0.0208, "step": 276400 }, { "epoch": 1.78, "learning_rate": 3.239768422003782e-05, "loss": 0.0265, "step": 276410 }, { "epoch": 1.78, "learning_rate": 3.238800286568089e-05, "loss": 0.0205, "step": 276420 }, { "epoch": 1.78, "learning_rate": 3.237832151132395e-05, "loss": 0.0342, "step": 276430 }, { "epoch": 1.78, "learning_rate": 3.236864015696702e-05, "loss": 0.0247, "step": 276440 }, { "epoch": 1.78, "learning_rate": 3.235895880261009e-05, "loss": 0.0229, "step": 276450 }, { "epoch": 1.78, "learning_rate": 3.234927744825316e-05, "loss": 0.0222, "step": 276460 }, { "epoch": 1.78, "learning_rate": 3.2339596093896225e-05, "loss": 0.0227, "step": 276470 }, { "epoch": 1.78, "learning_rate": 3.232991473953929e-05, "loss": 0.0215, "step": 276480 }, { "epoch": 1.78, "learning_rate": 3.232023338518236e-05, "loss": 0.025, "step": 276490 }, { "epoch": 1.78, "learning_rate": 3.231055203082543e-05, "loss": 0.0252, "step": 276500 }, { "epoch": 1.78, "learning_rate": 3.2300870676468497e-05, "loss": 0.0232, "step": 276510 }, { "epoch": 1.78, "learning_rate": 3.229118932211156e-05, "loss": 0.0248, "step": 276520 }, { "epoch": 1.78, "learning_rate": 3.2281507967754636e-05, "loss": 0.0302, "step": 276530 }, { "epoch": 1.78, "learning_rate": 3.22718266133977e-05, "loss": 0.03, "step": 276540 }, { "epoch": 1.78, "learning_rate": 3.226214525904077e-05, "loss": 0.0215, "step": 276550 }, { "epoch": 1.78, "learning_rate": 3.2252463904683835e-05, "loss": 0.0258, "step": 276560 }, { "epoch": 1.79, "learning_rate": 3.22427825503269e-05, "loss": 0.0174, "step": 276570 }, { "epoch": 1.79, "learning_rate": 3.2233101195969974e-05, "loss": 0.024, "step": 276580 }, { "epoch": 1.79, "learning_rate": 3.222341984161304e-05, "loss": 0.0257, "step": 276590 }, { "epoch": 1.79, "learning_rate": 3.2213738487256106e-05, "loss": 0.0241, "step": 276600 }, { "epoch": 1.79, "learning_rate": 3.220405713289918e-05, "loss": 0.0196, "step": 276610 }, { "epoch": 1.79, "learning_rate": 3.219437577854224e-05, "loss": 0.0185, "step": 276620 }, { "epoch": 1.79, "learning_rate": 3.218469442418531e-05, "loss": 0.0233, "step": 276630 }, { "epoch": 1.79, "learning_rate": 3.217501306982838e-05, "loss": 0.0316, "step": 276640 }, { "epoch": 1.79, "learning_rate": 3.2165331715471444e-05, "loss": 0.02, "step": 276650 }, { "epoch": 1.79, "learning_rate": 3.215565036111452e-05, "loss": 0.0236, "step": 276660 }, { "epoch": 1.79, "learning_rate": 3.2145969006757584e-05, "loss": 0.0244, "step": 276670 }, { "epoch": 1.79, "learning_rate": 3.213628765240065e-05, "loss": 0.0216, "step": 276680 }, { "epoch": 1.79, "learning_rate": 3.2126606298043716e-05, "loss": 0.0204, "step": 276690 }, { "epoch": 1.79, "learning_rate": 3.211692494368678e-05, "loss": 0.0281, "step": 276700 }, { "epoch": 1.79, "learning_rate": 3.2107243589329855e-05, "loss": 0.0205, "step": 276710 }, { "epoch": 1.79, "learning_rate": 3.209756223497292e-05, "loss": 0.0292, "step": 276720 }, { "epoch": 1.79, "learning_rate": 3.208788088061599e-05, "loss": 0.0235, "step": 276730 }, { "epoch": 1.79, "learning_rate": 3.207819952625906e-05, "loss": 0.0272, "step": 276740 }, { "epoch": 1.79, "learning_rate": 3.206851817190212e-05, "loss": 0.0216, "step": 276750 }, { "epoch": 1.79, "learning_rate": 3.205883681754519e-05, "loss": 0.0217, "step": 276760 }, { "epoch": 1.79, "learning_rate": 3.204915546318826e-05, "loss": 0.0223, "step": 276770 }, { "epoch": 1.79, "learning_rate": 3.2039474108831326e-05, "loss": 0.0249, "step": 276780 }, { "epoch": 1.79, "learning_rate": 3.20297927544744e-05, "loss": 0.0253, "step": 276790 }, { "epoch": 1.79, "learning_rate": 3.2020111400117465e-05, "loss": 0.0217, "step": 276800 }, { "epoch": 1.79, "learning_rate": 3.201043004576053e-05, "loss": 0.0261, "step": 276810 }, { "epoch": 1.79, "learning_rate": 3.20007486914036e-05, "loss": 0.0197, "step": 276820 }, { "epoch": 1.79, "learning_rate": 3.1991067337046664e-05, "loss": 0.0267, "step": 276830 }, { "epoch": 1.79, "learning_rate": 3.198138598268974e-05, "loss": 0.0213, "step": 276840 }, { "epoch": 1.79, "learning_rate": 3.19717046283328e-05, "loss": 0.0236, "step": 276850 }, { "epoch": 1.79, "learning_rate": 3.196202327397587e-05, "loss": 0.0207, "step": 276860 }, { "epoch": 1.79, "learning_rate": 3.195234191961894e-05, "loss": 0.0269, "step": 276870 }, { "epoch": 1.79, "learning_rate": 3.194266056526201e-05, "loss": 0.027, "step": 276880 }, { "epoch": 1.79, "learning_rate": 3.1932979210905075e-05, "loss": 0.0219, "step": 276890 }, { "epoch": 1.79, "learning_rate": 3.192329785654814e-05, "loss": 0.0246, "step": 276900 }, { "epoch": 1.79, "learning_rate": 3.191361650219121e-05, "loss": 0.021, "step": 276910 }, { "epoch": 1.79, "learning_rate": 3.190393514783428e-05, "loss": 0.0222, "step": 276920 }, { "epoch": 1.79, "learning_rate": 3.1894253793477346e-05, "loss": 0.0219, "step": 276930 }, { "epoch": 1.79, "learning_rate": 3.188457243912041e-05, "loss": 0.0229, "step": 276940 }, { "epoch": 1.79, "learning_rate": 3.1874891084763486e-05, "loss": 0.0263, "step": 276950 }, { "epoch": 1.79, "learning_rate": 3.1865209730406545e-05, "loss": 0.0253, "step": 276960 }, { "epoch": 1.79, "learning_rate": 3.185552837604962e-05, "loss": 0.0195, "step": 276970 }, { "epoch": 1.79, "learning_rate": 3.1845847021692684e-05, "loss": 0.0245, "step": 276980 }, { "epoch": 1.79, "learning_rate": 3.183616566733575e-05, "loss": 0.0246, "step": 276990 }, { "epoch": 1.79, "learning_rate": 3.1826484312978824e-05, "loss": 0.0318, "step": 277000 }, { "epoch": 1.79, "eval_cer": 0.9198689413625579, "eval_loss": 0.01742408238351345, "eval_runtime": 119.8944, "eval_samples_per_second": 16.681, "eval_steps_per_second": 4.17, "step": 277000 }, { "epoch": 1.79, "learning_rate": 3.181680295862189e-05, "loss": 0.0255, "step": 277010 }, { "epoch": 1.79, "learning_rate": 3.1807121604264956e-05, "loss": 0.0216, "step": 277020 }, { "epoch": 1.79, "learning_rate": 3.179744024990802e-05, "loss": 0.0213, "step": 277030 }, { "epoch": 1.79, "learning_rate": 3.178775889555109e-05, "loss": 0.0249, "step": 277040 }, { "epoch": 1.79, "learning_rate": 3.177807754119416e-05, "loss": 0.0203, "step": 277050 }, { "epoch": 1.79, "learning_rate": 3.176839618683723e-05, "loss": 0.0262, "step": 277060 }, { "epoch": 1.79, "learning_rate": 3.1758714832480294e-05, "loss": 0.0298, "step": 277070 }, { "epoch": 1.79, "learning_rate": 3.174903347812337e-05, "loss": 0.0226, "step": 277080 }, { "epoch": 1.79, "learning_rate": 3.173935212376643e-05, "loss": 0.0245, "step": 277090 }, { "epoch": 1.79, "learning_rate": 3.17296707694095e-05, "loss": 0.0241, "step": 277100 }, { "epoch": 1.79, "learning_rate": 3.1719989415052566e-05, "loss": 0.0231, "step": 277110 }, { "epoch": 1.79, "learning_rate": 3.171030806069563e-05, "loss": 0.0195, "step": 277120 }, { "epoch": 1.79, "learning_rate": 3.1700626706338705e-05, "loss": 0.0208, "step": 277130 }, { "epoch": 1.79, "learning_rate": 3.169094535198177e-05, "loss": 0.0218, "step": 277140 }, { "epoch": 1.79, "learning_rate": 3.168126399762484e-05, "loss": 0.0261, "step": 277150 }, { "epoch": 1.79, "learning_rate": 3.167158264326791e-05, "loss": 0.0192, "step": 277160 }, { "epoch": 1.79, "learning_rate": 3.166190128891097e-05, "loss": 0.023, "step": 277170 }, { "epoch": 1.79, "learning_rate": 3.165221993455404e-05, "loss": 0.024, "step": 277180 }, { "epoch": 1.79, "learning_rate": 3.164253858019711e-05, "loss": 0.0266, "step": 277190 }, { "epoch": 1.79, "learning_rate": 3.1632857225840176e-05, "loss": 0.0279, "step": 277200 }, { "epoch": 1.79, "learning_rate": 3.162317587148325e-05, "loss": 0.0226, "step": 277210 }, { "epoch": 1.79, "learning_rate": 3.1613494517126315e-05, "loss": 0.0225, "step": 277220 }, { "epoch": 1.79, "learning_rate": 3.160381316276938e-05, "loss": 0.033, "step": 277230 }, { "epoch": 1.79, "learning_rate": 3.159413180841245e-05, "loss": 0.021, "step": 277240 }, { "epoch": 1.79, "learning_rate": 3.1584450454055513e-05, "loss": 0.0305, "step": 277250 }, { "epoch": 1.79, "learning_rate": 3.1574769099698586e-05, "loss": 0.024, "step": 277260 }, { "epoch": 1.79, "learning_rate": 3.156508774534165e-05, "loss": 0.0233, "step": 277270 }, { "epoch": 1.79, "learning_rate": 3.155540639098472e-05, "loss": 0.0242, "step": 277280 }, { "epoch": 1.79, "learning_rate": 3.154572503662779e-05, "loss": 0.0258, "step": 277290 }, { "epoch": 1.79, "learning_rate": 3.153604368227086e-05, "loss": 0.0286, "step": 277300 }, { "epoch": 1.79, "learning_rate": 3.1526362327913924e-05, "loss": 0.0214, "step": 277310 }, { "epoch": 1.79, "learning_rate": 3.151668097355699e-05, "loss": 0.021, "step": 277320 }, { "epoch": 1.79, "learning_rate": 3.150699961920006e-05, "loss": 0.0226, "step": 277330 }, { "epoch": 1.79, "learning_rate": 3.149731826484313e-05, "loss": 0.0199, "step": 277340 }, { "epoch": 1.79, "learning_rate": 3.1487636910486196e-05, "loss": 0.0222, "step": 277350 }, { "epoch": 1.79, "learning_rate": 3.147795555612926e-05, "loss": 0.0235, "step": 277360 }, { "epoch": 1.79, "learning_rate": 3.1468274201772335e-05, "loss": 0.0236, "step": 277370 }, { "epoch": 1.79, "learning_rate": 3.1458592847415395e-05, "loss": 0.0229, "step": 277380 }, { "epoch": 1.79, "learning_rate": 3.144891149305847e-05, "loss": 0.022, "step": 277390 }, { "epoch": 1.79, "learning_rate": 3.1439230138701534e-05, "loss": 0.0213, "step": 277400 }, { "epoch": 1.79, "learning_rate": 3.14295487843446e-05, "loss": 0.0238, "step": 277410 }, { "epoch": 1.79, "learning_rate": 3.1419867429987673e-05, "loss": 0.0248, "step": 277420 }, { "epoch": 1.79, "learning_rate": 3.141018607563074e-05, "loss": 0.0236, "step": 277430 }, { "epoch": 1.79, "learning_rate": 3.1400504721273806e-05, "loss": 0.0223, "step": 277440 }, { "epoch": 1.79, "learning_rate": 3.139082336691687e-05, "loss": 0.0232, "step": 277450 }, { "epoch": 1.79, "learning_rate": 3.138114201255994e-05, "loss": 0.0217, "step": 277460 }, { "epoch": 1.79, "learning_rate": 3.137146065820301e-05, "loss": 0.0221, "step": 277470 }, { "epoch": 1.79, "learning_rate": 3.136177930384608e-05, "loss": 0.0217, "step": 277480 }, { "epoch": 1.79, "learning_rate": 3.1352097949489144e-05, "loss": 0.0221, "step": 277490 }, { "epoch": 1.79, "learning_rate": 3.134241659513222e-05, "loss": 0.0209, "step": 277500 }, { "epoch": 1.79, "learning_rate": 3.133273524077528e-05, "loss": 0.0267, "step": 277510 }, { "epoch": 1.79, "learning_rate": 3.132305388641835e-05, "loss": 0.0236, "step": 277520 }, { "epoch": 1.79, "learning_rate": 3.1313372532061416e-05, "loss": 0.0261, "step": 277530 }, { "epoch": 1.79, "learning_rate": 3.130369117770448e-05, "loss": 0.022, "step": 277540 }, { "epoch": 1.79, "learning_rate": 3.1294009823347555e-05, "loss": 0.0221, "step": 277550 }, { "epoch": 1.79, "learning_rate": 3.128432846899062e-05, "loss": 0.0194, "step": 277560 }, { "epoch": 1.79, "learning_rate": 3.127464711463369e-05, "loss": 0.0248, "step": 277570 }, { "epoch": 1.79, "learning_rate": 3.126496576027676e-05, "loss": 0.0233, "step": 277580 }, { "epoch": 1.79, "learning_rate": 3.125528440591982e-05, "loss": 0.0255, "step": 277590 }, { "epoch": 1.79, "learning_rate": 3.124560305156289e-05, "loss": 0.0226, "step": 277600 }, { "epoch": 1.79, "learning_rate": 3.123592169720596e-05, "loss": 0.0233, "step": 277610 }, { "epoch": 1.79, "learning_rate": 3.1226240342849025e-05, "loss": 0.0223, "step": 277620 }, { "epoch": 1.79, "learning_rate": 3.12165589884921e-05, "loss": 0.0246, "step": 277630 }, { "epoch": 1.79, "learning_rate": 3.1206877634135165e-05, "loss": 0.0217, "step": 277640 }, { "epoch": 1.79, "learning_rate": 3.119719627977823e-05, "loss": 0.0197, "step": 277650 }, { "epoch": 1.79, "learning_rate": 3.11875149254213e-05, "loss": 0.0267, "step": 277660 }, { "epoch": 1.79, "learning_rate": 3.117783357106436e-05, "loss": 0.0246, "step": 277670 }, { "epoch": 1.79, "learning_rate": 3.1168152216707436e-05, "loss": 0.0264, "step": 277680 }, { "epoch": 1.79, "learning_rate": 3.11584708623505e-05, "loss": 0.0239, "step": 277690 }, { "epoch": 1.79, "learning_rate": 3.114878950799357e-05, "loss": 0.0266, "step": 277700 }, { "epoch": 1.79, "learning_rate": 3.1139108153636635e-05, "loss": 0.0278, "step": 277710 }, { "epoch": 1.79, "learning_rate": 3.11294267992797e-05, "loss": 0.0248, "step": 277720 }, { "epoch": 1.79, "learning_rate": 3.1119745444922774e-05, "loss": 0.0295, "step": 277730 }, { "epoch": 1.79, "learning_rate": 3.111006409056584e-05, "loss": 0.0196, "step": 277740 }, { "epoch": 1.79, "learning_rate": 3.110038273620891e-05, "loss": 0.0207, "step": 277750 }, { "epoch": 1.79, "learning_rate": 3.109070138185197e-05, "loss": 0.0249, "step": 277760 }, { "epoch": 1.79, "learning_rate": 3.1081020027495046e-05, "loss": 0.0233, "step": 277770 }, { "epoch": 1.79, "learning_rate": 3.107133867313811e-05, "loss": 0.0263, "step": 277780 }, { "epoch": 1.79, "learning_rate": 3.106165731878118e-05, "loss": 0.0244, "step": 277790 }, { "epoch": 1.79, "learning_rate": 3.1051975964424245e-05, "loss": 0.0272, "step": 277800 }, { "epoch": 1.79, "learning_rate": 3.104229461006731e-05, "loss": 0.0189, "step": 277810 }, { "epoch": 1.79, "learning_rate": 3.1032613255710384e-05, "loss": 0.0231, "step": 277820 }, { "epoch": 1.79, "learning_rate": 3.102293190135345e-05, "loss": 0.0203, "step": 277830 }, { "epoch": 1.79, "learning_rate": 3.1013250546996516e-05, "loss": 0.0186, "step": 277840 }, { "epoch": 1.79, "learning_rate": 3.100356919263959e-05, "loss": 0.0204, "step": 277850 }, { "epoch": 1.79, "learning_rate": 3.099388783828265e-05, "loss": 0.0259, "step": 277860 }, { "epoch": 1.79, "learning_rate": 3.098420648392572e-05, "loss": 0.0251, "step": 277870 }, { "epoch": 1.79, "learning_rate": 3.097452512956879e-05, "loss": 0.0231, "step": 277880 }, { "epoch": 1.79, "learning_rate": 3.0964843775211854e-05, "loss": 0.0205, "step": 277890 }, { "epoch": 1.79, "learning_rate": 3.095516242085493e-05, "loss": 0.0255, "step": 277900 }, { "epoch": 1.79, "learning_rate": 3.0945481066497994e-05, "loss": 0.0199, "step": 277910 }, { "epoch": 1.79, "learning_rate": 3.093579971214106e-05, "loss": 0.0229, "step": 277920 }, { "epoch": 1.79, "learning_rate": 3.0926118357784126e-05, "loss": 0.0226, "step": 277930 }, { "epoch": 1.79, "learning_rate": 3.091643700342719e-05, "loss": 0.0247, "step": 277940 }, { "epoch": 1.79, "learning_rate": 3.0906755649070265e-05, "loss": 0.0236, "step": 277950 }, { "epoch": 1.79, "learning_rate": 3.089707429471333e-05, "loss": 0.0205, "step": 277960 }, { "epoch": 1.79, "learning_rate": 3.08873929403564e-05, "loss": 0.0273, "step": 277970 }, { "epoch": 1.79, "learning_rate": 3.087771158599947e-05, "loss": 0.0213, "step": 277980 }, { "epoch": 1.79, "learning_rate": 3.086803023164254e-05, "loss": 0.027, "step": 277990 }, { "epoch": 1.79, "learning_rate": 3.0858348877285603e-05, "loss": 0.0206, "step": 278000 }, { "epoch": 1.79, "eval_cer": 0.9198373065190374, "eval_loss": 0.017471129074692726, "eval_runtime": 119.7858, "eval_samples_per_second": 16.696, "eval_steps_per_second": 4.174, "step": 278000 }, { "epoch": 1.79, "learning_rate": 3.084866752292867e-05, "loss": 0.0219, "step": 278010 }, { "epoch": 1.79, "learning_rate": 3.0838986168571736e-05, "loss": 0.0278, "step": 278020 }, { "epoch": 1.79, "learning_rate": 3.082930481421481e-05, "loss": 0.0201, "step": 278030 }, { "epoch": 1.79, "learning_rate": 3.0819623459857875e-05, "loss": 0.0216, "step": 278040 }, { "epoch": 1.79, "learning_rate": 3.080994210550094e-05, "loss": 0.0242, "step": 278050 }, { "epoch": 1.79, "learning_rate": 3.0800260751144014e-05, "loss": 0.0262, "step": 278060 }, { "epoch": 1.79, "learning_rate": 3.0790579396787074e-05, "loss": 0.0192, "step": 278070 }, { "epoch": 1.79, "learning_rate": 3.078089804243015e-05, "loss": 0.0284, "step": 278080 }, { "epoch": 1.79, "learning_rate": 3.077121668807321e-05, "loss": 0.0202, "step": 278090 }, { "epoch": 1.79, "learning_rate": 3.076153533371628e-05, "loss": 0.0216, "step": 278100 }, { "epoch": 1.79, "learning_rate": 3.075185397935935e-05, "loss": 0.0251, "step": 278110 }, { "epoch": 1.8, "learning_rate": 3.074217262500242e-05, "loss": 0.0217, "step": 278120 }, { "epoch": 1.8, "learning_rate": 3.0732491270645485e-05, "loss": 0.0241, "step": 278130 }, { "epoch": 1.8, "learning_rate": 3.072280991628855e-05, "loss": 0.0207, "step": 278140 }, { "epoch": 1.8, "learning_rate": 3.071312856193162e-05, "loss": 0.0252, "step": 278150 }, { "epoch": 1.8, "learning_rate": 3.070344720757469e-05, "loss": 0.0224, "step": 278160 }, { "epoch": 1.8, "learning_rate": 3.0693765853217757e-05, "loss": 0.0254, "step": 278170 }, { "epoch": 1.8, "learning_rate": 3.068408449886082e-05, "loss": 0.0235, "step": 278180 }, { "epoch": 1.8, "learning_rate": 3.0674403144503896e-05, "loss": 0.0235, "step": 278190 }, { "epoch": 1.8, "learning_rate": 3.066472179014696e-05, "loss": 0.0259, "step": 278200 }, { "epoch": 1.8, "learning_rate": 3.065504043579003e-05, "loss": 0.019, "step": 278210 }, { "epoch": 1.8, "learning_rate": 3.0645359081433095e-05, "loss": 0.0214, "step": 278220 }, { "epoch": 1.8, "learning_rate": 3.063567772707616e-05, "loss": 0.0282, "step": 278230 }, { "epoch": 1.8, "learning_rate": 3.0625996372719234e-05, "loss": 0.0241, "step": 278240 }, { "epoch": 1.8, "learning_rate": 3.06163150183623e-05, "loss": 0.0227, "step": 278250 }, { "epoch": 1.8, "learning_rate": 3.0606633664005366e-05, "loss": 0.0258, "step": 278260 }, { "epoch": 1.8, "learning_rate": 3.059695230964844e-05, "loss": 0.0255, "step": 278270 }, { "epoch": 1.8, "learning_rate": 3.05872709552915e-05, "loss": 0.0203, "step": 278280 }, { "epoch": 1.8, "learning_rate": 3.057758960093457e-05, "loss": 0.0231, "step": 278290 }, { "epoch": 1.8, "learning_rate": 3.056790824657764e-05, "loss": 0.0251, "step": 278300 }, { "epoch": 1.8, "learning_rate": 3.0558226892220704e-05, "loss": 0.025, "step": 278310 }, { "epoch": 1.8, "learning_rate": 3.054854553786378e-05, "loss": 0.0226, "step": 278320 }, { "epoch": 1.8, "learning_rate": 3.0538864183506843e-05, "loss": 0.0286, "step": 278330 }, { "epoch": 1.8, "learning_rate": 3.052918282914991e-05, "loss": 0.0236, "step": 278340 }, { "epoch": 1.8, "learning_rate": 3.0519501474792976e-05, "loss": 0.0263, "step": 278350 }, { "epoch": 1.8, "learning_rate": 3.0509820120436046e-05, "loss": 0.0244, "step": 278360 }, { "epoch": 1.8, "learning_rate": 3.0500138766079112e-05, "loss": 0.0285, "step": 278370 }, { "epoch": 1.8, "learning_rate": 3.049045741172218e-05, "loss": 0.0205, "step": 278380 }, { "epoch": 1.8, "learning_rate": 3.048077605736525e-05, "loss": 0.0276, "step": 278390 }, { "epoch": 1.8, "learning_rate": 3.0471094703008317e-05, "loss": 0.0256, "step": 278400 }, { "epoch": 1.8, "learning_rate": 3.0461413348651387e-05, "loss": 0.0264, "step": 278410 }, { "epoch": 1.8, "learning_rate": 3.045173199429445e-05, "loss": 0.0215, "step": 278420 }, { "epoch": 1.8, "learning_rate": 3.044205063993752e-05, "loss": 0.0217, "step": 278430 }, { "epoch": 1.8, "learning_rate": 3.043236928558059e-05, "loss": 0.0261, "step": 278440 }, { "epoch": 1.8, "learning_rate": 3.0422687931223655e-05, "loss": 0.0246, "step": 278450 }, { "epoch": 1.8, "learning_rate": 3.0413006576866725e-05, "loss": 0.0257, "step": 278460 }, { "epoch": 1.8, "learning_rate": 3.0403325222509795e-05, "loss": 0.0284, "step": 278470 }, { "epoch": 1.8, "learning_rate": 3.0393643868152857e-05, "loss": 0.0247, "step": 278480 }, { "epoch": 1.8, "learning_rate": 3.0383962513795927e-05, "loss": 0.0193, "step": 278490 }, { "epoch": 1.8, "learning_rate": 3.0374281159438993e-05, "loss": 0.0243, "step": 278500 }, { "epoch": 1.8, "learning_rate": 3.0364599805082063e-05, "loss": 0.0249, "step": 278510 }, { "epoch": 1.8, "learning_rate": 3.0354918450725133e-05, "loss": 0.0204, "step": 278520 }, { "epoch": 1.8, "learning_rate": 3.03452370963682e-05, "loss": 0.0246, "step": 278530 }, { "epoch": 1.8, "learning_rate": 3.033555574201127e-05, "loss": 0.0279, "step": 278540 }, { "epoch": 1.8, "learning_rate": 3.032587438765433e-05, "loss": 0.0273, "step": 278550 }, { "epoch": 1.8, "learning_rate": 3.03161930332974e-05, "loss": 0.0208, "step": 278560 }, { "epoch": 1.8, "learning_rate": 3.030651167894047e-05, "loss": 0.0268, "step": 278570 }, { "epoch": 1.8, "learning_rate": 3.0296830324583537e-05, "loss": 0.0249, "step": 278580 }, { "epoch": 1.8, "learning_rate": 3.0287148970226606e-05, "loss": 0.0199, "step": 278590 }, { "epoch": 1.8, "learning_rate": 3.0277467615869676e-05, "loss": 0.0306, "step": 278600 }, { "epoch": 1.8, "learning_rate": 3.0267786261512742e-05, "loss": 0.02, "step": 278610 }, { "epoch": 1.8, "learning_rate": 3.025810490715581e-05, "loss": 0.0219, "step": 278620 }, { "epoch": 1.8, "learning_rate": 3.0248423552798875e-05, "loss": 0.0248, "step": 278630 }, { "epoch": 1.8, "learning_rate": 3.0238742198441944e-05, "loss": 0.02, "step": 278640 }, { "epoch": 1.8, "learning_rate": 3.0229060844085014e-05, "loss": 0.021, "step": 278650 }, { "epoch": 1.8, "learning_rate": 3.021937948972808e-05, "loss": 0.0208, "step": 278660 }, { "epoch": 1.8, "learning_rate": 3.020969813537115e-05, "loss": 0.0275, "step": 278670 }, { "epoch": 1.8, "learning_rate": 3.0200016781014216e-05, "loss": 0.028, "step": 278680 }, { "epoch": 1.8, "learning_rate": 3.0190335426657282e-05, "loss": 0.0268, "step": 278690 }, { "epoch": 1.8, "learning_rate": 3.0180654072300352e-05, "loss": 0.0223, "step": 278700 }, { "epoch": 1.8, "learning_rate": 3.0170972717943418e-05, "loss": 0.0251, "step": 278710 }, { "epoch": 1.8, "learning_rate": 3.0161291363586488e-05, "loss": 0.0232, "step": 278720 }, { "epoch": 1.8, "learning_rate": 3.0151610009229554e-05, "loss": 0.0204, "step": 278730 }, { "epoch": 1.8, "learning_rate": 3.0141928654872624e-05, "loss": 0.0241, "step": 278740 }, { "epoch": 1.8, "learning_rate": 3.0132247300515693e-05, "loss": 0.0247, "step": 278750 }, { "epoch": 1.8, "learning_rate": 3.0122565946158756e-05, "loss": 0.0237, "step": 278760 }, { "epoch": 1.8, "learning_rate": 3.0112884591801826e-05, "loss": 0.018, "step": 278770 }, { "epoch": 1.8, "learning_rate": 3.0103203237444892e-05, "loss": 0.0264, "step": 278780 }, { "epoch": 1.8, "learning_rate": 3.009352188308796e-05, "loss": 0.0199, "step": 278790 }, { "epoch": 1.8, "learning_rate": 3.008384052873103e-05, "loss": 0.0208, "step": 278800 }, { "epoch": 1.8, "learning_rate": 3.0074159174374098e-05, "loss": 0.0212, "step": 278810 }, { "epoch": 1.8, "learning_rate": 3.0064477820017167e-05, "loss": 0.0226, "step": 278820 }, { "epoch": 1.8, "learning_rate": 3.005479646566023e-05, "loss": 0.0235, "step": 278830 }, { "epoch": 1.8, "learning_rate": 3.00451151113033e-05, "loss": 0.0215, "step": 278840 }, { "epoch": 1.8, "learning_rate": 3.003543375694637e-05, "loss": 0.0245, "step": 278850 }, { "epoch": 1.8, "learning_rate": 3.0025752402589435e-05, "loss": 0.0226, "step": 278860 }, { "epoch": 1.8, "learning_rate": 3.0016071048232505e-05, "loss": 0.0199, "step": 278870 }, { "epoch": 1.8, "learning_rate": 3.0006389693875575e-05, "loss": 0.028, "step": 278880 }, { "epoch": 1.8, "learning_rate": 2.999670833951864e-05, "loss": 0.0207, "step": 278890 }, { "epoch": 1.8, "learning_rate": 2.9987026985161707e-05, "loss": 0.0261, "step": 278900 }, { "epoch": 1.8, "learning_rate": 2.9977345630804773e-05, "loss": 0.0261, "step": 278910 }, { "epoch": 1.8, "learning_rate": 2.9967664276447843e-05, "loss": 0.0254, "step": 278920 }, { "epoch": 1.8, "learning_rate": 2.9957982922090913e-05, "loss": 0.0281, "step": 278930 }, { "epoch": 1.8, "learning_rate": 2.994830156773398e-05, "loss": 0.0242, "step": 278940 }, { "epoch": 1.8, "learning_rate": 2.993862021337705e-05, "loss": 0.0199, "step": 278950 }, { "epoch": 1.8, "learning_rate": 2.9928938859020118e-05, "loss": 0.0281, "step": 278960 }, { "epoch": 1.8, "learning_rate": 2.991925750466318e-05, "loss": 0.0212, "step": 278970 }, { "epoch": 1.8, "learning_rate": 2.990957615030625e-05, "loss": 0.0198, "step": 278980 }, { "epoch": 1.8, "learning_rate": 2.9899894795949317e-05, "loss": 0.0217, "step": 278990 }, { "epoch": 1.8, "learning_rate": 2.9890213441592387e-05, "loss": 0.0245, "step": 279000 }, { "epoch": 1.8, "eval_cer": 0.9198770760366061, "eval_loss": 0.01735873706638813, "eval_runtime": 119.7924, "eval_samples_per_second": 16.696, "eval_steps_per_second": 4.174, "step": 279000 }, { "epoch": 1.8, "learning_rate": 2.9880532087235456e-05, "loss": 0.0239, "step": 279010 }, { "epoch": 1.8, "learning_rate": 2.9870850732878522e-05, "loss": 0.025, "step": 279020 }, { "epoch": 1.8, "learning_rate": 2.9861169378521592e-05, "loss": 0.0181, "step": 279030 }, { "epoch": 1.8, "learning_rate": 2.9851488024164655e-05, "loss": 0.0233, "step": 279040 }, { "epoch": 1.8, "learning_rate": 2.9841806669807725e-05, "loss": 0.0239, "step": 279050 }, { "epoch": 1.8, "learning_rate": 2.9832125315450794e-05, "loss": 0.0252, "step": 279060 }, { "epoch": 1.8, "learning_rate": 2.982244396109386e-05, "loss": 0.0211, "step": 279070 }, { "epoch": 1.8, "learning_rate": 2.981276260673693e-05, "loss": 0.0202, "step": 279080 }, { "epoch": 1.8, "learning_rate": 2.980308125238e-05, "loss": 0.0246, "step": 279090 }, { "epoch": 1.8, "learning_rate": 2.9793399898023066e-05, "loss": 0.0255, "step": 279100 }, { "epoch": 1.8, "learning_rate": 2.9783718543666132e-05, "loss": 0.0199, "step": 279110 }, { "epoch": 1.8, "learning_rate": 2.97740371893092e-05, "loss": 0.0249, "step": 279120 }, { "epoch": 1.8, "learning_rate": 2.9764355834952268e-05, "loss": 0.0222, "step": 279130 }, { "epoch": 1.8, "learning_rate": 2.9754674480595338e-05, "loss": 0.0282, "step": 279140 }, { "epoch": 1.8, "learning_rate": 2.9744993126238404e-05, "loss": 0.025, "step": 279150 }, { "epoch": 1.8, "learning_rate": 2.9735311771881473e-05, "loss": 0.0211, "step": 279160 }, { "epoch": 1.8, "learning_rate": 2.9725630417524543e-05, "loss": 0.02, "step": 279170 }, { "epoch": 1.8, "learning_rate": 2.9715949063167606e-05, "loss": 0.0219, "step": 279180 }, { "epoch": 1.8, "learning_rate": 2.9706267708810676e-05, "loss": 0.0245, "step": 279190 }, { "epoch": 1.8, "learning_rate": 2.9696586354453742e-05, "loss": 0.0262, "step": 279200 }, { "epoch": 1.8, "learning_rate": 2.968690500009681e-05, "loss": 0.0267, "step": 279210 }, { "epoch": 1.8, "learning_rate": 2.967722364573988e-05, "loss": 0.0233, "step": 279220 }, { "epoch": 1.8, "learning_rate": 2.9667542291382947e-05, "loss": 0.0289, "step": 279230 }, { "epoch": 1.8, "learning_rate": 2.9657860937026017e-05, "loss": 0.0233, "step": 279240 }, { "epoch": 1.8, "learning_rate": 2.964817958266908e-05, "loss": 0.022, "step": 279250 }, { "epoch": 1.8, "learning_rate": 2.963849822831215e-05, "loss": 0.0246, "step": 279260 }, { "epoch": 1.8, "learning_rate": 2.962881687395522e-05, "loss": 0.0227, "step": 279270 }, { "epoch": 1.8, "learning_rate": 2.9619135519598285e-05, "loss": 0.025, "step": 279280 }, { "epoch": 1.8, "learning_rate": 2.9609454165241355e-05, "loss": 0.0215, "step": 279290 }, { "epoch": 1.8, "learning_rate": 2.9599772810884425e-05, "loss": 0.0175, "step": 279300 }, { "epoch": 1.8, "learning_rate": 2.959009145652749e-05, "loss": 0.0234, "step": 279310 }, { "epoch": 1.8, "learning_rate": 2.9580410102170557e-05, "loss": 0.0264, "step": 279320 }, { "epoch": 1.8, "learning_rate": 2.9570728747813623e-05, "loss": 0.0245, "step": 279330 }, { "epoch": 1.8, "learning_rate": 2.9561047393456693e-05, "loss": 0.026, "step": 279340 }, { "epoch": 1.8, "learning_rate": 2.9551366039099763e-05, "loss": 0.0297, "step": 279350 }, { "epoch": 1.8, "learning_rate": 2.954168468474283e-05, "loss": 0.025, "step": 279360 }, { "epoch": 1.8, "learning_rate": 2.95320033303859e-05, "loss": 0.0239, "step": 279370 }, { "epoch": 1.8, "learning_rate": 2.952232197602896e-05, "loss": 0.0215, "step": 279380 }, { "epoch": 1.8, "learning_rate": 2.951264062167203e-05, "loss": 0.0197, "step": 279390 }, { "epoch": 1.8, "learning_rate": 2.95029592673151e-05, "loss": 0.0211, "step": 279400 }, { "epoch": 1.8, "learning_rate": 2.9493277912958167e-05, "loss": 0.0216, "step": 279410 }, { "epoch": 1.8, "learning_rate": 2.9483596558601236e-05, "loss": 0.0234, "step": 279420 }, { "epoch": 1.8, "learning_rate": 2.9473915204244303e-05, "loss": 0.0221, "step": 279430 }, { "epoch": 1.8, "learning_rate": 2.9464233849887372e-05, "loss": 0.0256, "step": 279440 }, { "epoch": 1.8, "learning_rate": 2.945455249553044e-05, "loss": 0.0202, "step": 279450 }, { "epoch": 1.8, "learning_rate": 2.9444871141173505e-05, "loss": 0.0219, "step": 279460 }, { "epoch": 1.8, "learning_rate": 2.9435189786816574e-05, "loss": 0.0224, "step": 279470 }, { "epoch": 1.8, "learning_rate": 2.942550843245964e-05, "loss": 0.0263, "step": 279480 }, { "epoch": 1.8, "learning_rate": 2.941582707810271e-05, "loss": 0.0273, "step": 279490 }, { "epoch": 1.8, "learning_rate": 2.940614572374578e-05, "loss": 0.0256, "step": 279500 }, { "epoch": 1.8, "learning_rate": 2.9396464369388846e-05, "loss": 0.0337, "step": 279510 }, { "epoch": 1.8, "learning_rate": 2.9386783015031912e-05, "loss": 0.0238, "step": 279520 }, { "epoch": 1.8, "learning_rate": 2.937710166067498e-05, "loss": 0.0226, "step": 279530 }, { "epoch": 1.8, "learning_rate": 2.9367420306318048e-05, "loss": 0.0232, "step": 279540 }, { "epoch": 1.8, "learning_rate": 2.9357738951961118e-05, "loss": 0.0192, "step": 279550 }, { "epoch": 1.8, "learning_rate": 2.9348057597604184e-05, "loss": 0.0226, "step": 279560 }, { "epoch": 1.8, "learning_rate": 2.9338376243247254e-05, "loss": 0.0261, "step": 279570 }, { "epoch": 1.8, "learning_rate": 2.9328694888890323e-05, "loss": 0.0253, "step": 279580 }, { "epoch": 1.8, "learning_rate": 2.9319013534533386e-05, "loss": 0.0266, "step": 279590 }, { "epoch": 1.8, "learning_rate": 2.9309332180176456e-05, "loss": 0.0227, "step": 279600 }, { "epoch": 1.8, "learning_rate": 2.9299650825819522e-05, "loss": 0.025, "step": 279610 }, { "epoch": 1.8, "learning_rate": 2.928996947146259e-05, "loss": 0.022, "step": 279620 }, { "epoch": 1.8, "learning_rate": 2.928028811710566e-05, "loss": 0.0203, "step": 279630 }, { "epoch": 1.8, "learning_rate": 2.9270606762748727e-05, "loss": 0.022, "step": 279640 }, { "epoch": 1.8, "learning_rate": 2.9260925408391797e-05, "loss": 0.022, "step": 279650 }, { "epoch": 1.8, "learning_rate": 2.925124405403486e-05, "loss": 0.0231, "step": 279660 }, { "epoch": 1.81, "learning_rate": 2.924156269967793e-05, "loss": 0.0201, "step": 279670 }, { "epoch": 1.81, "learning_rate": 2.9231881345321e-05, "loss": 0.026, "step": 279680 }, { "epoch": 1.81, "learning_rate": 2.9222199990964065e-05, "loss": 0.0235, "step": 279690 }, { "epoch": 1.81, "learning_rate": 2.9212518636607135e-05, "loss": 0.0224, "step": 279700 }, { "epoch": 1.81, "learning_rate": 2.9202837282250205e-05, "loss": 0.0277, "step": 279710 }, { "epoch": 1.81, "learning_rate": 2.919315592789327e-05, "loss": 0.021, "step": 279720 }, { "epoch": 1.81, "learning_rate": 2.9183474573536337e-05, "loss": 0.0208, "step": 279730 }, { "epoch": 1.81, "learning_rate": 2.9173793219179403e-05, "loss": 0.0205, "step": 279740 }, { "epoch": 1.81, "learning_rate": 2.9164111864822473e-05, "loss": 0.0179, "step": 279750 }, { "epoch": 1.81, "learning_rate": 2.9154430510465543e-05, "loss": 0.024, "step": 279760 }, { "epoch": 1.81, "learning_rate": 2.914474915610861e-05, "loss": 0.0264, "step": 279770 }, { "epoch": 1.81, "learning_rate": 2.913506780175168e-05, "loss": 0.0254, "step": 279780 }, { "epoch": 1.81, "learning_rate": 2.9125386447394748e-05, "loss": 0.0221, "step": 279790 }, { "epoch": 1.81, "learning_rate": 2.911570509303781e-05, "loss": 0.0237, "step": 279800 }, { "epoch": 1.81, "learning_rate": 2.910602373868088e-05, "loss": 0.0241, "step": 279810 }, { "epoch": 1.81, "learning_rate": 2.9096342384323947e-05, "loss": 0.0283, "step": 279820 }, { "epoch": 1.81, "learning_rate": 2.9086661029967017e-05, "loss": 0.0176, "step": 279830 }, { "epoch": 1.81, "learning_rate": 2.9076979675610086e-05, "loss": 0.0253, "step": 279840 }, { "epoch": 1.81, "learning_rate": 2.9067298321253152e-05, "loss": 0.0209, "step": 279850 }, { "epoch": 1.81, "learning_rate": 2.9057616966896222e-05, "loss": 0.0247, "step": 279860 }, { "epoch": 1.81, "learning_rate": 2.9047935612539285e-05, "loss": 0.0205, "step": 279870 }, { "epoch": 1.81, "learning_rate": 2.9038254258182355e-05, "loss": 0.0252, "step": 279880 }, { "epoch": 1.81, "learning_rate": 2.9028572903825424e-05, "loss": 0.0224, "step": 279890 }, { "epoch": 1.81, "learning_rate": 2.901889154946849e-05, "loss": 0.0235, "step": 279900 }, { "epoch": 1.81, "learning_rate": 2.900921019511156e-05, "loss": 0.0267, "step": 279910 }, { "epoch": 1.81, "learning_rate": 2.899952884075463e-05, "loss": 0.0242, "step": 279920 }, { "epoch": 1.81, "learning_rate": 2.8989847486397696e-05, "loss": 0.0193, "step": 279930 }, { "epoch": 1.81, "learning_rate": 2.8980166132040762e-05, "loss": 0.0204, "step": 279940 }, { "epoch": 1.81, "learning_rate": 2.897048477768383e-05, "loss": 0.0238, "step": 279950 }, { "epoch": 1.81, "learning_rate": 2.8960803423326898e-05, "loss": 0.0209, "step": 279960 }, { "epoch": 1.81, "learning_rate": 2.8951122068969968e-05, "loss": 0.0212, "step": 279970 }, { "epoch": 1.81, "learning_rate": 2.8941440714613034e-05, "loss": 0.0236, "step": 279980 }, { "epoch": 1.81, "learning_rate": 2.8931759360256103e-05, "loss": 0.0203, "step": 279990 }, { "epoch": 1.81, "learning_rate": 2.892207800589917e-05, "loss": 0.0177, "step": 280000 }, { "epoch": 1.81, "eval_cer": 0.9198617105411818, "eval_loss": 0.017406921833753586, "eval_runtime": 119.8646, "eval_samples_per_second": 16.685, "eval_steps_per_second": 4.171, "step": 280000 }, { "epoch": 1.81, "learning_rate": 2.8912396651542236e-05, "loss": 0.02, "step": 280010 }, { "epoch": 1.81, "learning_rate": 2.8902715297185306e-05, "loss": 0.0184, "step": 280020 }, { "epoch": 1.81, "learning_rate": 2.8893033942828372e-05, "loss": 0.0206, "step": 280030 }, { "epoch": 1.81, "learning_rate": 2.888335258847144e-05, "loss": 0.0251, "step": 280040 }, { "epoch": 1.81, "learning_rate": 2.8873671234114508e-05, "loss": 0.0217, "step": 280050 }, { "epoch": 1.81, "learning_rate": 2.8863989879757577e-05, "loss": 0.0223, "step": 280060 }, { "epoch": 1.81, "learning_rate": 2.8854308525400647e-05, "loss": 0.0206, "step": 280070 }, { "epoch": 1.81, "learning_rate": 2.884462717104371e-05, "loss": 0.0217, "step": 280080 }, { "epoch": 1.81, "learning_rate": 2.883494581668678e-05, "loss": 0.0278, "step": 280090 }, { "epoch": 1.81, "learning_rate": 2.8825264462329846e-05, "loss": 0.0252, "step": 280100 }, { "epoch": 1.81, "learning_rate": 2.8815583107972915e-05, "loss": 0.0191, "step": 280110 }, { "epoch": 1.81, "learning_rate": 2.8805901753615985e-05, "loss": 0.0217, "step": 280120 }, { "epoch": 1.81, "learning_rate": 2.879622039925905e-05, "loss": 0.026, "step": 280130 }, { "epoch": 1.81, "learning_rate": 2.878653904490212e-05, "loss": 0.0252, "step": 280140 }, { "epoch": 1.81, "learning_rate": 2.8776857690545184e-05, "loss": 0.0188, "step": 280150 }, { "epoch": 1.81, "learning_rate": 2.8767176336188253e-05, "loss": 0.0245, "step": 280160 }, { "epoch": 1.81, "learning_rate": 2.8757494981831323e-05, "loss": 0.0215, "step": 280170 }, { "epoch": 1.81, "learning_rate": 2.874781362747439e-05, "loss": 0.0269, "step": 280180 }, { "epoch": 1.81, "learning_rate": 2.873813227311746e-05, "loss": 0.0181, "step": 280190 }, { "epoch": 1.81, "learning_rate": 2.872845091876053e-05, "loss": 0.0231, "step": 280200 }, { "epoch": 1.81, "learning_rate": 2.871876956440359e-05, "loss": 0.0262, "step": 280210 }, { "epoch": 1.81, "learning_rate": 2.870908821004666e-05, "loss": 0.0231, "step": 280220 }, { "epoch": 1.81, "learning_rate": 2.8699406855689727e-05, "loss": 0.02, "step": 280230 }, { "epoch": 1.81, "learning_rate": 2.8689725501332797e-05, "loss": 0.02, "step": 280240 }, { "epoch": 1.81, "learning_rate": 2.8680044146975866e-05, "loss": 0.025, "step": 280250 }, { "epoch": 1.81, "learning_rate": 2.8670362792618933e-05, "loss": 0.0247, "step": 280260 }, { "epoch": 1.81, "learning_rate": 2.8660681438262002e-05, "loss": 0.0253, "step": 280270 }, { "epoch": 1.81, "learning_rate": 2.8651000083905065e-05, "loss": 0.0233, "step": 280280 }, { "epoch": 1.81, "learning_rate": 2.8641318729548135e-05, "loss": 0.0242, "step": 280290 }, { "epoch": 1.81, "learning_rate": 2.8631637375191204e-05, "loss": 0.0206, "step": 280300 }, { "epoch": 1.81, "learning_rate": 2.862195602083427e-05, "loss": 0.0257, "step": 280310 }, { "epoch": 1.81, "learning_rate": 2.861227466647734e-05, "loss": 0.0238, "step": 280320 }, { "epoch": 1.81, "learning_rate": 2.860259331212041e-05, "loss": 0.0218, "step": 280330 }, { "epoch": 1.81, "learning_rate": 2.8592911957763476e-05, "loss": 0.022, "step": 280340 }, { "epoch": 1.81, "learning_rate": 2.8583230603406542e-05, "loss": 0.0228, "step": 280350 }, { "epoch": 1.81, "learning_rate": 2.857354924904961e-05, "loss": 0.021, "step": 280360 }, { "epoch": 1.81, "learning_rate": 2.8563867894692678e-05, "loss": 0.0231, "step": 280370 }, { "epoch": 1.81, "learning_rate": 2.8554186540335748e-05, "loss": 0.0217, "step": 280380 }, { "epoch": 1.81, "learning_rate": 2.8544505185978814e-05, "loss": 0.0188, "step": 280390 }, { "epoch": 1.81, "learning_rate": 2.8534823831621884e-05, "loss": 0.0272, "step": 280400 }, { "epoch": 1.81, "learning_rate": 2.8525142477264953e-05, "loss": 0.0218, "step": 280410 }, { "epoch": 1.81, "learning_rate": 2.8515461122908016e-05, "loss": 0.0223, "step": 280420 }, { "epoch": 1.81, "learning_rate": 2.8505779768551086e-05, "loss": 0.0235, "step": 280430 }, { "epoch": 1.81, "learning_rate": 2.8496098414194152e-05, "loss": 0.0235, "step": 280440 }, { "epoch": 1.81, "learning_rate": 2.848641705983722e-05, "loss": 0.0226, "step": 280450 }, { "epoch": 1.81, "learning_rate": 2.847673570548029e-05, "loss": 0.0245, "step": 280460 }, { "epoch": 1.81, "learning_rate": 2.8467054351123357e-05, "loss": 0.0223, "step": 280470 }, { "epoch": 1.81, "learning_rate": 2.8457372996766427e-05, "loss": 0.0253, "step": 280480 }, { "epoch": 1.81, "learning_rate": 2.844769164240949e-05, "loss": 0.0242, "step": 280490 }, { "epoch": 1.81, "learning_rate": 2.843801028805256e-05, "loss": 0.0195, "step": 280500 }, { "epoch": 1.81, "learning_rate": 2.842832893369563e-05, "loss": 0.0228, "step": 280510 }, { "epoch": 1.81, "learning_rate": 2.8418647579338695e-05, "loss": 0.0263, "step": 280520 }, { "epoch": 1.81, "learning_rate": 2.8408966224981765e-05, "loss": 0.021, "step": 280530 }, { "epoch": 1.81, "learning_rate": 2.8399284870624835e-05, "loss": 0.0196, "step": 280540 }, { "epoch": 1.81, "learning_rate": 2.83896035162679e-05, "loss": 0.0297, "step": 280550 }, { "epoch": 1.81, "learning_rate": 2.8379922161910967e-05, "loss": 0.0243, "step": 280560 }, { "epoch": 1.81, "learning_rate": 2.8370240807554033e-05, "loss": 0.0249, "step": 280570 }, { "epoch": 1.81, "learning_rate": 2.8360559453197103e-05, "loss": 0.027, "step": 280580 }, { "epoch": 1.81, "learning_rate": 2.8350878098840173e-05, "loss": 0.0265, "step": 280590 }, { "epoch": 1.81, "learning_rate": 2.834119674448324e-05, "loss": 0.0252, "step": 280600 }, { "epoch": 1.81, "learning_rate": 2.833151539012631e-05, "loss": 0.027, "step": 280610 }, { "epoch": 1.81, "learning_rate": 2.8321834035769378e-05, "loss": 0.0222, "step": 280620 }, { "epoch": 1.81, "learning_rate": 2.831215268141244e-05, "loss": 0.021, "step": 280630 }, { "epoch": 1.81, "learning_rate": 2.830247132705551e-05, "loss": 0.0229, "step": 280640 }, { "epoch": 1.81, "learning_rate": 2.8292789972698577e-05, "loss": 0.0247, "step": 280650 }, { "epoch": 1.81, "learning_rate": 2.8283108618341647e-05, "loss": 0.0262, "step": 280660 }, { "epoch": 1.81, "learning_rate": 2.8273427263984716e-05, "loss": 0.0258, "step": 280670 }, { "epoch": 1.81, "learning_rate": 2.8263745909627782e-05, "loss": 0.0217, "step": 280680 }, { "epoch": 1.81, "learning_rate": 2.8254064555270852e-05, "loss": 0.0223, "step": 280690 }, { "epoch": 1.81, "learning_rate": 2.8244383200913915e-05, "loss": 0.0224, "step": 280700 }, { "epoch": 1.81, "learning_rate": 2.8234701846556984e-05, "loss": 0.0209, "step": 280710 }, { "epoch": 1.81, "learning_rate": 2.8225020492200054e-05, "loss": 0.0192, "step": 280720 }, { "epoch": 1.81, "learning_rate": 2.821533913784312e-05, "loss": 0.0278, "step": 280730 }, { "epoch": 1.81, "learning_rate": 2.820565778348619e-05, "loss": 0.0214, "step": 280740 }, { "epoch": 1.81, "learning_rate": 2.8195976429129256e-05, "loss": 0.0247, "step": 280750 }, { "epoch": 1.81, "learning_rate": 2.8186295074772326e-05, "loss": 0.0188, "step": 280760 }, { "epoch": 1.81, "learning_rate": 2.8176613720415392e-05, "loss": 0.0223, "step": 280770 }, { "epoch": 1.81, "learning_rate": 2.816693236605846e-05, "loss": 0.0217, "step": 280780 }, { "epoch": 1.81, "learning_rate": 2.8157251011701528e-05, "loss": 0.0203, "step": 280790 }, { "epoch": 1.81, "learning_rate": 2.8147569657344594e-05, "loss": 0.0231, "step": 280800 }, { "epoch": 1.81, "learning_rate": 2.8137888302987664e-05, "loss": 0.0235, "step": 280810 }, { "epoch": 1.81, "learning_rate": 2.8128206948630733e-05, "loss": 0.0225, "step": 280820 }, { "epoch": 1.81, "learning_rate": 2.81185255942738e-05, "loss": 0.026, "step": 280830 }, { "epoch": 1.81, "learning_rate": 2.8108844239916866e-05, "loss": 0.0224, "step": 280840 }, { "epoch": 1.81, "learning_rate": 2.8099162885559932e-05, "loss": 0.0259, "step": 280850 }, { "epoch": 1.81, "learning_rate": 2.8089481531203002e-05, "loss": 0.0224, "step": 280860 }, { "epoch": 1.81, "learning_rate": 2.807980017684607e-05, "loss": 0.028, "step": 280870 }, { "epoch": 1.81, "learning_rate": 2.8070118822489138e-05, "loss": 0.0256, "step": 280880 }, { "epoch": 1.81, "learning_rate": 2.8060437468132207e-05, "loss": 0.0284, "step": 280890 }, { "epoch": 1.81, "learning_rate": 2.8050756113775277e-05, "loss": 0.0204, "step": 280900 }, { "epoch": 1.81, "learning_rate": 2.804107475941834e-05, "loss": 0.0225, "step": 280910 }, { "epoch": 1.81, "learning_rate": 2.803139340506141e-05, "loss": 0.0251, "step": 280920 }, { "epoch": 1.81, "learning_rate": 2.8021712050704476e-05, "loss": 0.0224, "step": 280930 }, { "epoch": 1.81, "learning_rate": 2.8012030696347545e-05, "loss": 0.0282, "step": 280940 }, { "epoch": 1.81, "learning_rate": 2.8002349341990615e-05, "loss": 0.0259, "step": 280950 }, { "epoch": 1.81, "learning_rate": 2.799266798763368e-05, "loss": 0.0223, "step": 280960 }, { "epoch": 1.81, "learning_rate": 2.798298663327675e-05, "loss": 0.0223, "step": 280970 }, { "epoch": 1.81, "learning_rate": 2.7973305278919814e-05, "loss": 0.0232, "step": 280980 }, { "epoch": 1.81, "learning_rate": 2.7963623924562883e-05, "loss": 0.0224, "step": 280990 }, { "epoch": 1.81, "learning_rate": 2.7953942570205953e-05, "loss": 0.0268, "step": 281000 }, { "epoch": 1.81, "eval_cer": 0.9198617105411818, "eval_loss": 0.017409605905413628, "eval_runtime": 119.8225, "eval_samples_per_second": 16.691, "eval_steps_per_second": 4.173, "step": 281000 }, { "epoch": 1.81, "learning_rate": 2.794426121584902e-05, "loss": 0.0201, "step": 281010 }, { "epoch": 1.81, "learning_rate": 2.793457986149209e-05, "loss": 0.0216, "step": 281020 }, { "epoch": 1.81, "learning_rate": 2.792489850713516e-05, "loss": 0.0205, "step": 281030 }, { "epoch": 1.81, "learning_rate": 2.791521715277822e-05, "loss": 0.0269, "step": 281040 }, { "epoch": 1.81, "learning_rate": 2.790553579842129e-05, "loss": 0.0194, "step": 281050 }, { "epoch": 1.81, "learning_rate": 2.7895854444064357e-05, "loss": 0.0205, "step": 281060 }, { "epoch": 1.81, "learning_rate": 2.7886173089707427e-05, "loss": 0.0236, "step": 281070 }, { "epoch": 1.81, "learning_rate": 2.7876491735350496e-05, "loss": 0.0217, "step": 281080 }, { "epoch": 1.81, "learning_rate": 2.7866810380993563e-05, "loss": 0.0265, "step": 281090 }, { "epoch": 1.81, "learning_rate": 2.7857129026636632e-05, "loss": 0.0225, "step": 281100 }, { "epoch": 1.81, "learning_rate": 2.7847447672279695e-05, "loss": 0.0246, "step": 281110 }, { "epoch": 1.81, "learning_rate": 2.7837766317922765e-05, "loss": 0.0209, "step": 281120 }, { "epoch": 1.81, "learning_rate": 2.7828084963565834e-05, "loss": 0.0189, "step": 281130 }, { "epoch": 1.81, "learning_rate": 2.78184036092089e-05, "loss": 0.0222, "step": 281140 }, { "epoch": 1.81, "learning_rate": 2.780872225485197e-05, "loss": 0.0252, "step": 281150 }, { "epoch": 1.81, "learning_rate": 2.779904090049504e-05, "loss": 0.0287, "step": 281160 }, { "epoch": 1.81, "learning_rate": 2.7789359546138106e-05, "loss": 0.0212, "step": 281170 }, { "epoch": 1.81, "learning_rate": 2.7779678191781172e-05, "loss": 0.0233, "step": 281180 }, { "epoch": 1.81, "learning_rate": 2.776999683742424e-05, "loss": 0.0238, "step": 281190 }, { "epoch": 1.81, "learning_rate": 2.7760315483067308e-05, "loss": 0.0228, "step": 281200 }, { "epoch": 1.81, "learning_rate": 2.7750634128710378e-05, "loss": 0.0215, "step": 281210 }, { "epoch": 1.82, "learning_rate": 2.7740952774353444e-05, "loss": 0.0227, "step": 281220 }, { "epoch": 1.82, "learning_rate": 2.7731271419996514e-05, "loss": 0.0236, "step": 281230 }, { "epoch": 1.82, "learning_rate": 2.7721590065639583e-05, "loss": 0.0221, "step": 281240 }, { "epoch": 1.82, "learning_rate": 2.7711908711282646e-05, "loss": 0.0234, "step": 281250 }, { "epoch": 1.82, "learning_rate": 2.7702227356925716e-05, "loss": 0.0256, "step": 281260 }, { "epoch": 1.82, "learning_rate": 2.7692546002568782e-05, "loss": 0.0194, "step": 281270 }, { "epoch": 1.82, "learning_rate": 2.768286464821185e-05, "loss": 0.0226, "step": 281280 }, { "epoch": 1.82, "learning_rate": 2.767318329385492e-05, "loss": 0.0227, "step": 281290 }, { "epoch": 1.82, "learning_rate": 2.7663501939497987e-05, "loss": 0.0232, "step": 281300 }, { "epoch": 1.82, "learning_rate": 2.7653820585141057e-05, "loss": 0.0224, "step": 281310 }, { "epoch": 1.82, "learning_rate": 2.764413923078412e-05, "loss": 0.0266, "step": 281320 }, { "epoch": 1.82, "learning_rate": 2.763445787642719e-05, "loss": 0.0206, "step": 281330 }, { "epoch": 1.82, "learning_rate": 2.762477652207026e-05, "loss": 0.023, "step": 281340 }, { "epoch": 1.82, "learning_rate": 2.7615095167713325e-05, "loss": 0.0211, "step": 281350 }, { "epoch": 1.82, "learning_rate": 2.7605413813356395e-05, "loss": 0.0223, "step": 281360 }, { "epoch": 1.82, "learning_rate": 2.759573245899946e-05, "loss": 0.0217, "step": 281370 }, { "epoch": 1.82, "learning_rate": 2.758605110464253e-05, "loss": 0.0198, "step": 281380 }, { "epoch": 1.82, "learning_rate": 2.7576369750285597e-05, "loss": 0.0265, "step": 281390 }, { "epoch": 1.82, "learning_rate": 2.7566688395928663e-05, "loss": 0.0279, "step": 281400 }, { "epoch": 1.82, "learning_rate": 2.7557007041571733e-05, "loss": 0.0221, "step": 281410 }, { "epoch": 1.82, "learning_rate": 2.7547325687214803e-05, "loss": 0.0226, "step": 281420 }, { "epoch": 1.82, "learning_rate": 2.753764433285787e-05, "loss": 0.0286, "step": 281430 }, { "epoch": 1.82, "learning_rate": 2.752796297850094e-05, "loss": 0.0243, "step": 281440 }, { "epoch": 1.82, "learning_rate": 2.7518281624144005e-05, "loss": 0.0255, "step": 281450 }, { "epoch": 1.82, "learning_rate": 2.750860026978707e-05, "loss": 0.0224, "step": 281460 }, { "epoch": 1.82, "learning_rate": 2.749891891543014e-05, "loss": 0.0188, "step": 281470 }, { "epoch": 1.82, "learning_rate": 2.7489237561073207e-05, "loss": 0.0211, "step": 281480 }, { "epoch": 1.82, "learning_rate": 2.7479556206716277e-05, "loss": 0.023, "step": 281490 }, { "epoch": 1.82, "learning_rate": 2.7469874852359343e-05, "loss": 0.0219, "step": 281500 }, { "epoch": 1.82, "learning_rate": 2.7460193498002412e-05, "loss": 0.023, "step": 281510 }, { "epoch": 1.82, "learning_rate": 2.7450512143645482e-05, "loss": 0.0272, "step": 281520 }, { "epoch": 1.82, "learning_rate": 2.7440830789288545e-05, "loss": 0.0234, "step": 281530 }, { "epoch": 1.82, "learning_rate": 2.7431149434931614e-05, "loss": 0.0221, "step": 281540 }, { "epoch": 1.82, "learning_rate": 2.742146808057468e-05, "loss": 0.0219, "step": 281550 }, { "epoch": 1.82, "learning_rate": 2.741178672621775e-05, "loss": 0.0195, "step": 281560 }, { "epoch": 1.82, "learning_rate": 2.740210537186082e-05, "loss": 0.0195, "step": 281570 }, { "epoch": 1.82, "learning_rate": 2.7392424017503886e-05, "loss": 0.0186, "step": 281580 }, { "epoch": 1.82, "learning_rate": 2.7382742663146956e-05, "loss": 0.0218, "step": 281590 }, { "epoch": 1.82, "learning_rate": 2.737306130879002e-05, "loss": 0.0218, "step": 281600 }, { "epoch": 1.82, "learning_rate": 2.736337995443309e-05, "loss": 0.0206, "step": 281610 }, { "epoch": 1.82, "learning_rate": 2.7353698600076158e-05, "loss": 0.017, "step": 281620 }, { "epoch": 1.82, "learning_rate": 2.7344017245719224e-05, "loss": 0.0207, "step": 281630 }, { "epoch": 1.82, "learning_rate": 2.7334335891362294e-05, "loss": 0.0191, "step": 281640 }, { "epoch": 1.82, "learning_rate": 2.7324654537005363e-05, "loss": 0.0218, "step": 281650 }, { "epoch": 1.82, "learning_rate": 2.731497318264843e-05, "loss": 0.0326, "step": 281660 }, { "epoch": 1.82, "learning_rate": 2.7305291828291496e-05, "loss": 0.0253, "step": 281670 }, { "epoch": 1.82, "learning_rate": 2.7295610473934562e-05, "loss": 0.0255, "step": 281680 }, { "epoch": 1.82, "learning_rate": 2.7285929119577632e-05, "loss": 0.028, "step": 281690 }, { "epoch": 1.82, "learning_rate": 2.72762477652207e-05, "loss": 0.0194, "step": 281700 }, { "epoch": 1.82, "learning_rate": 2.7266566410863768e-05, "loss": 0.0231, "step": 281710 }, { "epoch": 1.82, "learning_rate": 2.7256885056506837e-05, "loss": 0.0233, "step": 281720 }, { "epoch": 1.82, "learning_rate": 2.7247203702149907e-05, "loss": 0.0202, "step": 281730 }, { "epoch": 1.82, "learning_rate": 2.723752234779297e-05, "loss": 0.0222, "step": 281740 }, { "epoch": 1.82, "learning_rate": 2.722784099343604e-05, "loss": 0.0244, "step": 281750 }, { "epoch": 1.82, "learning_rate": 2.7218159639079106e-05, "loss": 0.0202, "step": 281760 }, { "epoch": 1.82, "learning_rate": 2.7208478284722175e-05, "loss": 0.0233, "step": 281770 }, { "epoch": 1.82, "learning_rate": 2.7198796930365245e-05, "loss": 0.0234, "step": 281780 }, { "epoch": 1.82, "learning_rate": 2.718911557600831e-05, "loss": 0.0211, "step": 281790 }, { "epoch": 1.82, "learning_rate": 2.717943422165138e-05, "loss": 0.0229, "step": 281800 }, { "epoch": 1.82, "learning_rate": 2.7169752867294444e-05, "loss": 0.029, "step": 281810 }, { "epoch": 1.82, "learning_rate": 2.7160071512937513e-05, "loss": 0.0206, "step": 281820 }, { "epoch": 1.82, "learning_rate": 2.7150390158580583e-05, "loss": 0.0257, "step": 281830 }, { "epoch": 1.82, "learning_rate": 2.714070880422365e-05, "loss": 0.0251, "step": 281840 }, { "epoch": 1.82, "learning_rate": 2.713102744986672e-05, "loss": 0.0218, "step": 281850 }, { "epoch": 1.82, "learning_rate": 2.712134609550979e-05, "loss": 0.0252, "step": 281860 }, { "epoch": 1.82, "learning_rate": 2.7111664741152855e-05, "loss": 0.0187, "step": 281870 }, { "epoch": 1.82, "learning_rate": 2.710198338679592e-05, "loss": 0.0217, "step": 281880 }, { "epoch": 1.82, "learning_rate": 2.7092302032438987e-05, "loss": 0.0233, "step": 281890 }, { "epoch": 1.82, "learning_rate": 2.7082620678082057e-05, "loss": 0.0203, "step": 281900 }, { "epoch": 1.82, "learning_rate": 2.7072939323725126e-05, "loss": 0.0251, "step": 281910 }, { "epoch": 1.82, "learning_rate": 2.7063257969368193e-05, "loss": 0.0266, "step": 281920 }, { "epoch": 1.82, "learning_rate": 2.7053576615011262e-05, "loss": 0.0241, "step": 281930 }, { "epoch": 1.82, "learning_rate": 2.7043895260654325e-05, "loss": 0.0267, "step": 281940 }, { "epoch": 1.82, "learning_rate": 2.7034213906297395e-05, "loss": 0.0224, "step": 281950 }, { "epoch": 1.82, "learning_rate": 2.7024532551940464e-05, "loss": 0.0207, "step": 281960 }, { "epoch": 1.82, "learning_rate": 2.701485119758353e-05, "loss": 0.0219, "step": 281970 }, { "epoch": 1.82, "learning_rate": 2.70051698432266e-05, "loss": 0.0209, "step": 281980 }, { "epoch": 1.82, "learning_rate": 2.699548848886967e-05, "loss": 0.0236, "step": 281990 }, { "epoch": 1.82, "learning_rate": 2.6985807134512736e-05, "loss": 0.0209, "step": 282000 }, { "epoch": 1.82, "eval_cer": 0.9198553835724776, "eval_loss": 0.017225535586476326, "eval_runtime": 119.8192, "eval_samples_per_second": 16.692, "eval_steps_per_second": 4.173, "step": 282000 }, { "epoch": 1.82, "learning_rate": 2.6976125780155802e-05, "loss": 0.0249, "step": 282010 }, { "epoch": 1.82, "learning_rate": 2.696644442579887e-05, "loss": 0.0264, "step": 282020 }, { "epoch": 1.82, "learning_rate": 2.6956763071441938e-05, "loss": 0.0206, "step": 282030 }, { "epoch": 1.82, "learning_rate": 2.6947081717085008e-05, "loss": 0.0203, "step": 282040 }, { "epoch": 1.82, "learning_rate": 2.6937400362728074e-05, "loss": 0.0226, "step": 282050 }, { "epoch": 1.82, "learning_rate": 2.6927719008371144e-05, "loss": 0.0262, "step": 282060 }, { "epoch": 1.82, "learning_rate": 2.691803765401421e-05, "loss": 0.0241, "step": 282070 }, { "epoch": 1.82, "learning_rate": 2.6908356299657276e-05, "loss": 0.0209, "step": 282080 }, { "epoch": 1.82, "learning_rate": 2.6898674945300346e-05, "loss": 0.0208, "step": 282090 }, { "epoch": 1.82, "learning_rate": 2.6888993590943412e-05, "loss": 0.0225, "step": 282100 }, { "epoch": 1.82, "learning_rate": 2.687931223658648e-05, "loss": 0.0228, "step": 282110 }, { "epoch": 1.82, "learning_rate": 2.6869630882229548e-05, "loss": 0.0242, "step": 282120 }, { "epoch": 1.82, "learning_rate": 2.6859949527872617e-05, "loss": 0.0204, "step": 282130 }, { "epoch": 1.82, "learning_rate": 2.6850268173515687e-05, "loss": 0.0234, "step": 282140 }, { "epoch": 1.82, "learning_rate": 2.684058681915875e-05, "loss": 0.03, "step": 282150 }, { "epoch": 1.82, "learning_rate": 2.683090546480182e-05, "loss": 0.0253, "step": 282160 }, { "epoch": 1.82, "learning_rate": 2.6821224110444886e-05, "loss": 0.022, "step": 282170 }, { "epoch": 1.82, "learning_rate": 2.6811542756087955e-05, "loss": 0.0195, "step": 282180 }, { "epoch": 1.82, "learning_rate": 2.6801861401731025e-05, "loss": 0.0262, "step": 282190 }, { "epoch": 1.82, "learning_rate": 2.679218004737409e-05, "loss": 0.0258, "step": 282200 }, { "epoch": 1.82, "learning_rate": 2.678249869301716e-05, "loss": 0.0225, "step": 282210 }, { "epoch": 1.82, "learning_rate": 2.6772817338660224e-05, "loss": 0.021, "step": 282220 }, { "epoch": 1.82, "learning_rate": 2.6763135984303293e-05, "loss": 0.0205, "step": 282230 }, { "epoch": 1.82, "learning_rate": 2.6753454629946363e-05, "loss": 0.019, "step": 282240 }, { "epoch": 1.82, "learning_rate": 2.674377327558943e-05, "loss": 0.0261, "step": 282250 }, { "epoch": 1.82, "learning_rate": 2.67340919212325e-05, "loss": 0.0203, "step": 282260 }, { "epoch": 1.82, "learning_rate": 2.672441056687557e-05, "loss": 0.0235, "step": 282270 }, { "epoch": 1.82, "learning_rate": 2.6714729212518635e-05, "loss": 0.0226, "step": 282280 }, { "epoch": 1.82, "learning_rate": 2.67050478581617e-05, "loss": 0.0189, "step": 282290 }, { "epoch": 1.82, "learning_rate": 2.6695366503804767e-05, "loss": 0.0186, "step": 282300 }, { "epoch": 1.82, "learning_rate": 2.6685685149447837e-05, "loss": 0.0224, "step": 282310 }, { "epoch": 1.82, "learning_rate": 2.6676003795090906e-05, "loss": 0.0191, "step": 282320 }, { "epoch": 1.82, "learning_rate": 2.6666322440733973e-05, "loss": 0.0235, "step": 282330 }, { "epoch": 1.82, "learning_rate": 2.6656641086377042e-05, "loss": 0.0264, "step": 282340 }, { "epoch": 1.82, "learning_rate": 2.6646959732020112e-05, "loss": 0.0219, "step": 282350 }, { "epoch": 1.82, "learning_rate": 2.6637278377663175e-05, "loss": 0.0216, "step": 282360 }, { "epoch": 1.82, "learning_rate": 2.6627597023306244e-05, "loss": 0.0212, "step": 282370 }, { "epoch": 1.82, "learning_rate": 2.661791566894931e-05, "loss": 0.0213, "step": 282380 }, { "epoch": 1.82, "learning_rate": 2.660823431459238e-05, "loss": 0.021, "step": 282390 }, { "epoch": 1.82, "learning_rate": 2.659855296023545e-05, "loss": 0.0247, "step": 282400 }, { "epoch": 1.82, "learning_rate": 2.6588871605878516e-05, "loss": 0.0222, "step": 282410 }, { "epoch": 1.82, "learning_rate": 2.6579190251521586e-05, "loss": 0.0244, "step": 282420 }, { "epoch": 1.82, "learning_rate": 2.656950889716465e-05, "loss": 0.0222, "step": 282430 }, { "epoch": 1.82, "learning_rate": 2.655982754280772e-05, "loss": 0.0226, "step": 282440 }, { "epoch": 1.82, "learning_rate": 2.6550146188450788e-05, "loss": 0.0255, "step": 282450 }, { "epoch": 1.82, "learning_rate": 2.6540464834093854e-05, "loss": 0.0268, "step": 282460 }, { "epoch": 1.82, "learning_rate": 2.6530783479736924e-05, "loss": 0.0226, "step": 282470 }, { "epoch": 1.82, "learning_rate": 2.6521102125379993e-05, "loss": 0.0301, "step": 282480 }, { "epoch": 1.82, "learning_rate": 2.651142077102306e-05, "loss": 0.021, "step": 282490 }, { "epoch": 1.82, "learning_rate": 2.6501739416666126e-05, "loss": 0.0268, "step": 282500 }, { "epoch": 1.82, "learning_rate": 2.6492058062309192e-05, "loss": 0.022, "step": 282510 }, { "epoch": 1.82, "learning_rate": 2.6482376707952262e-05, "loss": 0.0235, "step": 282520 }, { "epoch": 1.82, "learning_rate": 2.647269535359533e-05, "loss": 0.0223, "step": 282530 }, { "epoch": 1.82, "learning_rate": 2.6463013999238398e-05, "loss": 0.0223, "step": 282540 }, { "epoch": 1.82, "learning_rate": 2.6453332644881467e-05, "loss": 0.0227, "step": 282550 }, { "epoch": 1.82, "learning_rate": 2.6443651290524537e-05, "loss": 0.0188, "step": 282560 }, { "epoch": 1.82, "learning_rate": 2.64339699361676e-05, "loss": 0.0208, "step": 282570 }, { "epoch": 1.82, "learning_rate": 2.642428858181067e-05, "loss": 0.0258, "step": 282580 }, { "epoch": 1.82, "learning_rate": 2.6414607227453736e-05, "loss": 0.0215, "step": 282590 }, { "epoch": 1.82, "learning_rate": 2.6404925873096805e-05, "loss": 0.0274, "step": 282600 }, { "epoch": 1.82, "learning_rate": 2.6395244518739875e-05, "loss": 0.0229, "step": 282610 }, { "epoch": 1.82, "learning_rate": 2.638556316438294e-05, "loss": 0.0232, "step": 282620 }, { "epoch": 1.82, "learning_rate": 2.637588181002601e-05, "loss": 0.0276, "step": 282630 }, { "epoch": 1.82, "learning_rate": 2.6366200455669074e-05, "loss": 0.0215, "step": 282640 }, { "epoch": 1.82, "learning_rate": 2.6356519101312143e-05, "loss": 0.0227, "step": 282650 }, { "epoch": 1.82, "learning_rate": 2.6346837746955213e-05, "loss": 0.0224, "step": 282660 }, { "epoch": 1.82, "learning_rate": 2.633715639259828e-05, "loss": 0.0258, "step": 282670 }, { "epoch": 1.82, "learning_rate": 2.632747503824135e-05, "loss": 0.0234, "step": 282680 }, { "epoch": 1.82, "learning_rate": 2.631779368388442e-05, "loss": 0.0285, "step": 282690 }, { "epoch": 1.82, "learning_rate": 2.6308112329527485e-05, "loss": 0.0202, "step": 282700 }, { "epoch": 1.82, "learning_rate": 2.629843097517055e-05, "loss": 0.0201, "step": 282710 }, { "epoch": 1.82, "learning_rate": 2.6288749620813617e-05, "loss": 0.0222, "step": 282720 }, { "epoch": 1.82, "learning_rate": 2.6279068266456687e-05, "loss": 0.0231, "step": 282730 }, { "epoch": 1.82, "learning_rate": 2.6269386912099756e-05, "loss": 0.0249, "step": 282740 }, { "epoch": 1.82, "learning_rate": 2.6259705557742823e-05, "loss": 0.0209, "step": 282750 }, { "epoch": 1.82, "learning_rate": 2.6250024203385892e-05, "loss": 0.0248, "step": 282760 }, { "epoch": 1.83, "learning_rate": 2.6240342849028955e-05, "loss": 0.0212, "step": 282770 }, { "epoch": 1.83, "learning_rate": 2.6230661494672025e-05, "loss": 0.0192, "step": 282780 }, { "epoch": 1.83, "learning_rate": 2.6220980140315094e-05, "loss": 0.0221, "step": 282790 }, { "epoch": 1.83, "learning_rate": 2.621129878595816e-05, "loss": 0.0252, "step": 282800 }, { "epoch": 1.83, "learning_rate": 2.620161743160123e-05, "loss": 0.0214, "step": 282810 }, { "epoch": 1.83, "learning_rate": 2.6191936077244296e-05, "loss": 0.0255, "step": 282820 }, { "epoch": 1.83, "learning_rate": 2.6182254722887366e-05, "loss": 0.0199, "step": 282830 }, { "epoch": 1.83, "learning_rate": 2.6172573368530432e-05, "loss": 0.0227, "step": 282840 }, { "epoch": 1.83, "learning_rate": 2.61628920141735e-05, "loss": 0.0322, "step": 282850 }, { "epoch": 1.83, "learning_rate": 2.6153210659816568e-05, "loss": 0.0236, "step": 282860 }, { "epoch": 1.83, "learning_rate": 2.6143529305459634e-05, "loss": 0.0194, "step": 282870 }, { "epoch": 1.83, "learning_rate": 2.6133847951102704e-05, "loss": 0.0207, "step": 282880 }, { "epoch": 1.83, "learning_rate": 2.6124166596745774e-05, "loss": 0.0229, "step": 282890 }, { "epoch": 1.83, "learning_rate": 2.611448524238884e-05, "loss": 0.0244, "step": 282900 }, { "epoch": 1.83, "learning_rate": 2.6104803888031906e-05, "loss": 0.0218, "step": 282910 }, { "epoch": 1.83, "learning_rate": 2.6095122533674972e-05, "loss": 0.0271, "step": 282920 }, { "epoch": 1.83, "learning_rate": 2.6085441179318042e-05, "loss": 0.0209, "step": 282930 }, { "epoch": 1.83, "learning_rate": 2.607575982496111e-05, "loss": 0.0266, "step": 282940 }, { "epoch": 1.83, "learning_rate": 2.6066078470604178e-05, "loss": 0.0286, "step": 282950 }, { "epoch": 1.83, "learning_rate": 2.6056397116247247e-05, "loss": 0.0234, "step": 282960 }, { "epoch": 1.83, "learning_rate": 2.6046715761890317e-05, "loss": 0.0267, "step": 282970 }, { "epoch": 1.83, "learning_rate": 2.603703440753338e-05, "loss": 0.0196, "step": 282980 }, { "epoch": 1.83, "learning_rate": 2.602735305317645e-05, "loss": 0.0252, "step": 282990 }, { "epoch": 1.83, "learning_rate": 2.6017671698819516e-05, "loss": 0.0248, "step": 283000 }, { "epoch": 1.83, "eval_cer": 0.9198300756976613, "eval_loss": 0.0171258095651865, "eval_runtime": 119.8965, "eval_samples_per_second": 16.681, "eval_steps_per_second": 4.17, "step": 283000 }, { "epoch": 1.83, "learning_rate": 2.6007990344462585e-05, "loss": 0.0225, "step": 283010 }, { "epoch": 1.83, "learning_rate": 2.5998308990105655e-05, "loss": 0.0224, "step": 283020 }, { "epoch": 1.83, "learning_rate": 2.598862763574872e-05, "loss": 0.0191, "step": 283030 }, { "epoch": 1.83, "learning_rate": 2.597894628139179e-05, "loss": 0.0192, "step": 283040 }, { "epoch": 1.83, "learning_rate": 2.5969264927034854e-05, "loss": 0.0231, "step": 283050 }, { "epoch": 1.83, "learning_rate": 2.5959583572677923e-05, "loss": 0.0194, "step": 283060 }, { "epoch": 1.83, "learning_rate": 2.5949902218320993e-05, "loss": 0.029, "step": 283070 }, { "epoch": 1.83, "learning_rate": 2.594022086396406e-05, "loss": 0.0293, "step": 283080 }, { "epoch": 1.83, "learning_rate": 2.593053950960713e-05, "loss": 0.0197, "step": 283090 }, { "epoch": 1.83, "learning_rate": 2.59208581552502e-05, "loss": 0.0222, "step": 283100 }, { "epoch": 1.83, "learning_rate": 2.5911176800893265e-05, "loss": 0.023, "step": 283110 }, { "epoch": 1.83, "learning_rate": 2.590149544653633e-05, "loss": 0.027, "step": 283120 }, { "epoch": 1.83, "learning_rate": 2.5891814092179397e-05, "loss": 0.0266, "step": 283130 }, { "epoch": 1.83, "learning_rate": 2.5882132737822467e-05, "loss": 0.028, "step": 283140 }, { "epoch": 1.83, "learning_rate": 2.5872451383465536e-05, "loss": 0.023, "step": 283150 }, { "epoch": 1.83, "learning_rate": 2.5862770029108603e-05, "loss": 0.0231, "step": 283160 }, { "epoch": 1.83, "learning_rate": 2.5853088674751672e-05, "loss": 0.0249, "step": 283170 }, { "epoch": 1.83, "learning_rate": 2.5843407320394742e-05, "loss": 0.0281, "step": 283180 }, { "epoch": 1.83, "learning_rate": 2.5833725966037805e-05, "loss": 0.0224, "step": 283190 }, { "epoch": 1.83, "learning_rate": 2.5824044611680874e-05, "loss": 0.0258, "step": 283200 }, { "epoch": 1.83, "learning_rate": 2.581436325732394e-05, "loss": 0.0304, "step": 283210 }, { "epoch": 1.83, "learning_rate": 2.580468190296701e-05, "loss": 0.0235, "step": 283220 }, { "epoch": 1.83, "learning_rate": 2.579500054861008e-05, "loss": 0.0215, "step": 283230 }, { "epoch": 1.83, "learning_rate": 2.5785319194253146e-05, "loss": 0.0251, "step": 283240 }, { "epoch": 1.83, "learning_rate": 2.5775637839896216e-05, "loss": 0.0268, "step": 283250 }, { "epoch": 1.83, "learning_rate": 2.576595648553928e-05, "loss": 0.0244, "step": 283260 }, { "epoch": 1.83, "learning_rate": 2.5756275131182348e-05, "loss": 0.019, "step": 283270 }, { "epoch": 1.83, "learning_rate": 2.5746593776825418e-05, "loss": 0.0188, "step": 283280 }, { "epoch": 1.83, "learning_rate": 2.5736912422468484e-05, "loss": 0.0272, "step": 283290 }, { "epoch": 1.83, "learning_rate": 2.5727231068111554e-05, "loss": 0.0232, "step": 283300 }, { "epoch": 1.83, "learning_rate": 2.5717549713754623e-05, "loss": 0.025, "step": 283310 }, { "epoch": 1.83, "learning_rate": 2.570786835939769e-05, "loss": 0.0297, "step": 283320 }, { "epoch": 1.83, "learning_rate": 2.5698187005040756e-05, "loss": 0.0209, "step": 283330 }, { "epoch": 1.83, "learning_rate": 2.5688505650683822e-05, "loss": 0.0234, "step": 283340 }, { "epoch": 1.83, "learning_rate": 2.5678824296326892e-05, "loss": 0.0234, "step": 283350 }, { "epoch": 1.83, "learning_rate": 2.566914294196996e-05, "loss": 0.0192, "step": 283360 }, { "epoch": 1.83, "learning_rate": 2.5659461587613028e-05, "loss": 0.0233, "step": 283370 }, { "epoch": 1.83, "learning_rate": 2.5649780233256097e-05, "loss": 0.0232, "step": 283380 }, { "epoch": 1.83, "learning_rate": 2.5640098878899163e-05, "loss": 0.0227, "step": 283390 }, { "epoch": 1.83, "learning_rate": 2.563041752454223e-05, "loss": 0.019, "step": 283400 }, { "epoch": 1.83, "learning_rate": 2.56207361701853e-05, "loss": 0.0247, "step": 283410 }, { "epoch": 1.83, "learning_rate": 2.5611054815828366e-05, "loss": 0.0212, "step": 283420 }, { "epoch": 1.83, "learning_rate": 2.5601373461471435e-05, "loss": 0.0259, "step": 283430 }, { "epoch": 1.83, "learning_rate": 2.55916921071145e-05, "loss": 0.0223, "step": 283440 }, { "epoch": 1.83, "learning_rate": 2.558201075275757e-05, "loss": 0.0219, "step": 283450 }, { "epoch": 1.83, "learning_rate": 2.557232939840064e-05, "loss": 0.022, "step": 283460 }, { "epoch": 1.83, "learning_rate": 2.5562648044043704e-05, "loss": 0.0174, "step": 283470 }, { "epoch": 1.83, "learning_rate": 2.5552966689686773e-05, "loss": 0.0196, "step": 283480 }, { "epoch": 1.83, "learning_rate": 2.554328533532984e-05, "loss": 0.0218, "step": 283490 }, { "epoch": 1.83, "learning_rate": 2.553360398097291e-05, "loss": 0.023, "step": 283500 }, { "epoch": 1.83, "learning_rate": 2.552392262661598e-05, "loss": 0.0219, "step": 283510 }, { "epoch": 1.83, "learning_rate": 2.5514241272259045e-05, "loss": 0.0244, "step": 283520 }, { "epoch": 1.83, "learning_rate": 2.5504559917902115e-05, "loss": 0.0213, "step": 283530 }, { "epoch": 1.83, "learning_rate": 2.549487856354518e-05, "loss": 0.0284, "step": 283540 }, { "epoch": 1.83, "learning_rate": 2.5485197209188247e-05, "loss": 0.0247, "step": 283550 }, { "epoch": 1.83, "learning_rate": 2.5475515854831317e-05, "loss": 0.0269, "step": 283560 }, { "epoch": 1.83, "learning_rate": 2.5465834500474383e-05, "loss": 0.0223, "step": 283570 }, { "epoch": 1.83, "learning_rate": 2.5456153146117453e-05, "loss": 0.0328, "step": 283580 }, { "epoch": 1.83, "learning_rate": 2.5446471791760522e-05, "loss": 0.0224, "step": 283590 }, { "epoch": 1.83, "learning_rate": 2.543679043740359e-05, "loss": 0.0231, "step": 283600 }, { "epoch": 1.83, "learning_rate": 2.5427109083046655e-05, "loss": 0.0204, "step": 283610 }, { "epoch": 1.83, "learning_rate": 2.541742772868972e-05, "loss": 0.0202, "step": 283620 }, { "epoch": 1.83, "learning_rate": 2.540774637433279e-05, "loss": 0.0219, "step": 283630 }, { "epoch": 1.83, "learning_rate": 2.539806501997586e-05, "loss": 0.0224, "step": 283640 }, { "epoch": 1.83, "learning_rate": 2.5388383665618926e-05, "loss": 0.0196, "step": 283650 }, { "epoch": 1.83, "learning_rate": 2.5378702311261996e-05, "loss": 0.024, "step": 283660 }, { "epoch": 1.83, "learning_rate": 2.536902095690506e-05, "loss": 0.0232, "step": 283670 }, { "epoch": 1.83, "learning_rate": 2.535933960254813e-05, "loss": 0.0261, "step": 283680 }, { "epoch": 1.83, "learning_rate": 2.5349658248191198e-05, "loss": 0.0191, "step": 283690 }, { "epoch": 1.83, "learning_rate": 2.5339976893834264e-05, "loss": 0.0197, "step": 283700 }, { "epoch": 1.83, "learning_rate": 2.5330295539477334e-05, "loss": 0.0247, "step": 283710 }, { "epoch": 1.83, "learning_rate": 2.5320614185120404e-05, "loss": 0.0262, "step": 283720 }, { "epoch": 1.83, "learning_rate": 2.531093283076347e-05, "loss": 0.0212, "step": 283730 }, { "epoch": 1.83, "learning_rate": 2.5301251476406536e-05, "loss": 0.0268, "step": 283740 }, { "epoch": 1.83, "learning_rate": 2.5291570122049602e-05, "loss": 0.0209, "step": 283750 }, { "epoch": 1.83, "learning_rate": 2.5281888767692672e-05, "loss": 0.0201, "step": 283760 }, { "epoch": 1.83, "learning_rate": 2.527220741333574e-05, "loss": 0.0222, "step": 283770 }, { "epoch": 1.83, "learning_rate": 2.5262526058978808e-05, "loss": 0.024, "step": 283780 }, { "epoch": 1.83, "learning_rate": 2.5252844704621877e-05, "loss": 0.0216, "step": 283790 }, { "epoch": 1.83, "learning_rate": 2.5243163350264947e-05, "loss": 0.0315, "step": 283800 }, { "epoch": 1.83, "learning_rate": 2.523348199590801e-05, "loss": 0.0222, "step": 283810 }, { "epoch": 1.83, "learning_rate": 2.522380064155108e-05, "loss": 0.0206, "step": 283820 }, { "epoch": 1.83, "learning_rate": 2.5214119287194146e-05, "loss": 0.0235, "step": 283830 }, { "epoch": 1.83, "learning_rate": 2.5204437932837215e-05, "loss": 0.0251, "step": 283840 }, { "epoch": 1.83, "learning_rate": 2.5194756578480285e-05, "loss": 0.0261, "step": 283850 }, { "epoch": 1.83, "learning_rate": 2.518507522412335e-05, "loss": 0.0281, "step": 283860 }, { "epoch": 1.83, "learning_rate": 2.517539386976642e-05, "loss": 0.0244, "step": 283870 }, { "epoch": 1.83, "learning_rate": 2.5165712515409484e-05, "loss": 0.0219, "step": 283880 }, { "epoch": 1.83, "learning_rate": 2.5156031161052553e-05, "loss": 0.0232, "step": 283890 }, { "epoch": 1.83, "learning_rate": 2.5146349806695623e-05, "loss": 0.0266, "step": 283900 }, { "epoch": 1.83, "learning_rate": 2.513666845233869e-05, "loss": 0.024, "step": 283910 }, { "epoch": 1.83, "learning_rate": 2.512698709798176e-05, "loss": 0.0243, "step": 283920 }, { "epoch": 1.83, "learning_rate": 2.511730574362483e-05, "loss": 0.0222, "step": 283930 }, { "epoch": 1.83, "learning_rate": 2.5107624389267895e-05, "loss": 0.0232, "step": 283940 }, { "epoch": 1.83, "learning_rate": 2.509794303491096e-05, "loss": 0.0271, "step": 283950 }, { "epoch": 1.83, "learning_rate": 2.5088261680554027e-05, "loss": 0.0207, "step": 283960 }, { "epoch": 1.83, "learning_rate": 2.5078580326197097e-05, "loss": 0.0238, "step": 283970 }, { "epoch": 1.83, "learning_rate": 2.5068898971840166e-05, "loss": 0.0185, "step": 283980 }, { "epoch": 1.83, "learning_rate": 2.5059217617483233e-05, "loss": 0.0257, "step": 283990 }, { "epoch": 1.83, "learning_rate": 2.5049536263126302e-05, "loss": 0.0205, "step": 284000 }, { "epoch": 1.83, "eval_cer": 0.919813806349565, "eval_loss": 0.01731204241514206, "eval_runtime": 119.8623, "eval_samples_per_second": 16.686, "eval_steps_per_second": 4.171, "step": 284000 }, { "epoch": 1.83, "learning_rate": 2.5039854908769372e-05, "loss": 0.0279, "step": 284010 }, { "epoch": 1.83, "learning_rate": 2.5030173554412435e-05, "loss": 0.024, "step": 284020 }, { "epoch": 1.83, "learning_rate": 2.5020492200055504e-05, "loss": 0.0262, "step": 284030 }, { "epoch": 1.83, "learning_rate": 2.501081084569857e-05, "loss": 0.021, "step": 284040 }, { "epoch": 1.83, "learning_rate": 2.500112949134164e-05, "loss": 0.0226, "step": 284050 }, { "epoch": 1.83, "learning_rate": 2.499144813698471e-05, "loss": 0.0215, "step": 284060 }, { "epoch": 1.83, "learning_rate": 2.4981766782627776e-05, "loss": 0.0256, "step": 284070 }, { "epoch": 1.83, "learning_rate": 2.4972085428270846e-05, "loss": 0.0201, "step": 284080 }, { "epoch": 1.83, "learning_rate": 2.496240407391391e-05, "loss": 0.0221, "step": 284090 }, { "epoch": 1.83, "learning_rate": 2.4952722719556978e-05, "loss": 0.0228, "step": 284100 }, { "epoch": 1.83, "learning_rate": 2.4943041365200048e-05, "loss": 0.0243, "step": 284110 }, { "epoch": 1.83, "learning_rate": 2.4933360010843114e-05, "loss": 0.0218, "step": 284120 }, { "epoch": 1.83, "learning_rate": 2.4923678656486184e-05, "loss": 0.0214, "step": 284130 }, { "epoch": 1.83, "learning_rate": 2.491399730212925e-05, "loss": 0.023, "step": 284140 }, { "epoch": 1.83, "learning_rate": 2.490431594777232e-05, "loss": 0.0267, "step": 284150 }, { "epoch": 1.83, "learning_rate": 2.4894634593415386e-05, "loss": 0.0212, "step": 284160 }, { "epoch": 1.83, "learning_rate": 2.4884953239058452e-05, "loss": 0.0182, "step": 284170 }, { "epoch": 1.83, "learning_rate": 2.4875271884701522e-05, "loss": 0.0231, "step": 284180 }, { "epoch": 1.83, "learning_rate": 2.4865590530344588e-05, "loss": 0.022, "step": 284190 }, { "epoch": 1.83, "learning_rate": 2.4855909175987658e-05, "loss": 0.0217, "step": 284200 }, { "epoch": 1.83, "learning_rate": 2.4846227821630727e-05, "loss": 0.0257, "step": 284210 }, { "epoch": 1.83, "learning_rate": 2.4836546467273793e-05, "loss": 0.0212, "step": 284220 }, { "epoch": 1.83, "learning_rate": 2.482686511291686e-05, "loss": 0.0251, "step": 284230 }, { "epoch": 1.83, "learning_rate": 2.4817183758559926e-05, "loss": 0.021, "step": 284240 }, { "epoch": 1.83, "learning_rate": 2.4807502404202996e-05, "loss": 0.0212, "step": 284250 }, { "epoch": 1.83, "learning_rate": 2.4797821049846065e-05, "loss": 0.023, "step": 284260 }, { "epoch": 1.83, "learning_rate": 2.478813969548913e-05, "loss": 0.0272, "step": 284270 }, { "epoch": 1.83, "learning_rate": 2.47784583411322e-05, "loss": 0.0256, "step": 284280 }, { "epoch": 1.83, "learning_rate": 2.476877698677527e-05, "loss": 0.0234, "step": 284290 }, { "epoch": 1.83, "learning_rate": 2.4759095632418334e-05, "loss": 0.0224, "step": 284300 }, { "epoch": 1.83, "learning_rate": 2.4749414278061403e-05, "loss": 0.0241, "step": 284310 }, { "epoch": 1.84, "learning_rate": 2.473973292370447e-05, "loss": 0.0197, "step": 284320 }, { "epoch": 1.84, "learning_rate": 2.473005156934754e-05, "loss": 0.0187, "step": 284330 }, { "epoch": 1.84, "learning_rate": 2.472037021499061e-05, "loss": 0.0233, "step": 284340 }, { "epoch": 1.84, "learning_rate": 2.4710688860633675e-05, "loss": 0.0205, "step": 284350 }, { "epoch": 1.84, "learning_rate": 2.4701007506276745e-05, "loss": 0.0241, "step": 284360 }, { "epoch": 1.84, "learning_rate": 2.4691326151919807e-05, "loss": 0.02, "step": 284370 }, { "epoch": 1.84, "learning_rate": 2.4681644797562877e-05, "loss": 0.0231, "step": 284380 }, { "epoch": 1.84, "learning_rate": 2.4671963443205947e-05, "loss": 0.0209, "step": 284390 }, { "epoch": 1.84, "learning_rate": 2.4662282088849013e-05, "loss": 0.0245, "step": 284400 }, { "epoch": 1.84, "learning_rate": 2.4652600734492083e-05, "loss": 0.0183, "step": 284410 }, { "epoch": 1.84, "learning_rate": 2.4642919380135152e-05, "loss": 0.029, "step": 284420 }, { "epoch": 1.84, "learning_rate": 2.463323802577822e-05, "loss": 0.0267, "step": 284430 }, { "epoch": 1.84, "learning_rate": 2.4623556671421285e-05, "loss": 0.0241, "step": 284440 }, { "epoch": 1.84, "learning_rate": 2.461387531706435e-05, "loss": 0.0226, "step": 284450 }, { "epoch": 1.84, "learning_rate": 2.460419396270742e-05, "loss": 0.023, "step": 284460 }, { "epoch": 1.84, "learning_rate": 2.459451260835049e-05, "loss": 0.0266, "step": 284470 }, { "epoch": 1.84, "learning_rate": 2.4584831253993556e-05, "loss": 0.0241, "step": 284480 }, { "epoch": 1.84, "learning_rate": 2.4575149899636626e-05, "loss": 0.0242, "step": 284490 }, { "epoch": 1.84, "learning_rate": 2.456546854527969e-05, "loss": 0.0181, "step": 284500 }, { "epoch": 1.84, "learning_rate": 2.455578719092276e-05, "loss": 0.0229, "step": 284510 }, { "epoch": 1.84, "learning_rate": 2.4546105836565828e-05, "loss": 0.0208, "step": 284520 }, { "epoch": 1.84, "learning_rate": 2.4536424482208894e-05, "loss": 0.0217, "step": 284530 }, { "epoch": 1.84, "learning_rate": 2.4526743127851964e-05, "loss": 0.0309, "step": 284540 }, { "epoch": 1.84, "learning_rate": 2.4517061773495034e-05, "loss": 0.023, "step": 284550 }, { "epoch": 1.84, "learning_rate": 2.45073804191381e-05, "loss": 0.0225, "step": 284560 }, { "epoch": 1.84, "learning_rate": 2.4497699064781166e-05, "loss": 0.0211, "step": 284570 }, { "epoch": 1.84, "learning_rate": 2.4488017710424232e-05, "loss": 0.0216, "step": 284580 }, { "epoch": 1.84, "learning_rate": 2.4478336356067302e-05, "loss": 0.0187, "step": 284590 }, { "epoch": 1.84, "learning_rate": 2.446865500171037e-05, "loss": 0.022, "step": 284600 }, { "epoch": 1.84, "learning_rate": 2.4458973647353438e-05, "loss": 0.0212, "step": 284610 }, { "epoch": 1.84, "learning_rate": 2.4449292292996507e-05, "loss": 0.0192, "step": 284620 }, { "epoch": 1.84, "learning_rate": 2.4439610938639577e-05, "loss": 0.0273, "step": 284630 }, { "epoch": 1.84, "learning_rate": 2.442992958428264e-05, "loss": 0.0267, "step": 284640 }, { "epoch": 1.84, "learning_rate": 2.442024822992571e-05, "loss": 0.0247, "step": 284650 }, { "epoch": 1.84, "learning_rate": 2.4410566875568776e-05, "loss": 0.0249, "step": 284660 }, { "epoch": 1.84, "learning_rate": 2.4400885521211845e-05, "loss": 0.0189, "step": 284670 }, { "epoch": 1.84, "learning_rate": 2.4391204166854915e-05, "loss": 0.0226, "step": 284680 }, { "epoch": 1.84, "learning_rate": 2.438152281249798e-05, "loss": 0.0198, "step": 284690 }, { "epoch": 1.84, "learning_rate": 2.437184145814105e-05, "loss": 0.0213, "step": 284700 }, { "epoch": 1.84, "learning_rate": 2.4362160103784114e-05, "loss": 0.0244, "step": 284710 }, { "epoch": 1.84, "learning_rate": 2.4352478749427183e-05, "loss": 0.0239, "step": 284720 }, { "epoch": 1.84, "learning_rate": 2.4342797395070253e-05, "loss": 0.025, "step": 284730 }, { "epoch": 1.84, "learning_rate": 2.433311604071332e-05, "loss": 0.0235, "step": 284740 }, { "epoch": 1.84, "learning_rate": 2.432343468635639e-05, "loss": 0.0213, "step": 284750 }, { "epoch": 1.84, "learning_rate": 2.431375333199946e-05, "loss": 0.0235, "step": 284760 }, { "epoch": 1.84, "learning_rate": 2.4304071977642525e-05, "loss": 0.0217, "step": 284770 }, { "epoch": 1.84, "learning_rate": 2.429439062328559e-05, "loss": 0.0232, "step": 284780 }, { "epoch": 1.84, "learning_rate": 2.4284709268928657e-05, "loss": 0.019, "step": 284790 }, { "epoch": 1.84, "learning_rate": 2.4275027914571727e-05, "loss": 0.0267, "step": 284800 }, { "epoch": 1.84, "learning_rate": 2.4265346560214796e-05, "loss": 0.0208, "step": 284810 }, { "epoch": 1.84, "learning_rate": 2.4255665205857863e-05, "loss": 0.0203, "step": 284820 }, { "epoch": 1.84, "learning_rate": 2.4245983851500932e-05, "loss": 0.0278, "step": 284830 }, { "epoch": 1.84, "learning_rate": 2.4236302497144e-05, "loss": 0.021, "step": 284840 }, { "epoch": 1.84, "learning_rate": 2.4226621142787065e-05, "loss": 0.0266, "step": 284850 }, { "epoch": 1.84, "learning_rate": 2.4216939788430134e-05, "loss": 0.0203, "step": 284860 }, { "epoch": 1.84, "learning_rate": 2.42072584340732e-05, "loss": 0.0269, "step": 284870 }, { "epoch": 1.84, "learning_rate": 2.419757707971627e-05, "loss": 0.0234, "step": 284880 }, { "epoch": 1.84, "learning_rate": 2.4187895725359337e-05, "loss": 0.0251, "step": 284890 }, { "epoch": 1.84, "learning_rate": 2.4178214371002406e-05, "loss": 0.0258, "step": 284900 }, { "epoch": 1.84, "learning_rate": 2.4168533016645476e-05, "loss": 0.0289, "step": 284910 }, { "epoch": 1.84, "learning_rate": 2.415885166228854e-05, "loss": 0.0223, "step": 284920 }, { "epoch": 1.84, "learning_rate": 2.4149170307931608e-05, "loss": 0.0209, "step": 284930 }, { "epoch": 1.84, "learning_rate": 2.4139488953574675e-05, "loss": 0.0217, "step": 284940 }, { "epoch": 1.84, "learning_rate": 2.4129807599217744e-05, "loss": 0.0192, "step": 284950 }, { "epoch": 1.84, "learning_rate": 2.4120126244860814e-05, "loss": 0.0227, "step": 284960 }, { "epoch": 1.84, "learning_rate": 2.411044489050388e-05, "loss": 0.0213, "step": 284970 }, { "epoch": 1.84, "learning_rate": 2.410076353614695e-05, "loss": 0.0219, "step": 284980 }, { "epoch": 1.84, "learning_rate": 2.4091082181790012e-05, "loss": 0.0234, "step": 284990 }, { "epoch": 1.84, "learning_rate": 2.4081400827433082e-05, "loss": 0.0231, "step": 285000 }, { "epoch": 1.84, "eval_cer": 0.9198599028358377, "eval_loss": 0.01720038801431656, "eval_runtime": 120.0459, "eval_samples_per_second": 16.66, "eval_steps_per_second": 4.165, "step": 285000 }, { "epoch": 1.84, "learning_rate": 2.4071719473076152e-05, "loss": 0.0181, "step": 285010 }, { "epoch": 1.84, "learning_rate": 2.4062038118719218e-05, "loss": 0.0266, "step": 285020 }, { "epoch": 1.84, "learning_rate": 2.4052356764362288e-05, "loss": 0.0198, "step": 285030 }, { "epoch": 1.84, "learning_rate": 2.4042675410005357e-05, "loss": 0.0249, "step": 285040 }, { "epoch": 1.84, "learning_rate": 2.4032994055648423e-05, "loss": 0.0213, "step": 285050 }, { "epoch": 1.84, "learning_rate": 2.402331270129149e-05, "loss": 0.0286, "step": 285060 }, { "epoch": 1.84, "learning_rate": 2.4013631346934556e-05, "loss": 0.0241, "step": 285070 }, { "epoch": 1.84, "learning_rate": 2.4003949992577626e-05, "loss": 0.0222, "step": 285080 }, { "epoch": 1.84, "learning_rate": 2.3994268638220695e-05, "loss": 0.0228, "step": 285090 }, { "epoch": 1.84, "learning_rate": 2.398458728386376e-05, "loss": 0.0257, "step": 285100 }, { "epoch": 1.84, "learning_rate": 2.397490592950683e-05, "loss": 0.0248, "step": 285110 }, { "epoch": 1.84, "learning_rate": 2.39652245751499e-05, "loss": 0.0248, "step": 285120 }, { "epoch": 1.84, "learning_rate": 2.3955543220792964e-05, "loss": 0.0262, "step": 285130 }, { "epoch": 1.84, "learning_rate": 2.3945861866436033e-05, "loss": 0.0238, "step": 285140 }, { "epoch": 1.84, "learning_rate": 2.39361805120791e-05, "loss": 0.0173, "step": 285150 }, { "epoch": 1.84, "learning_rate": 2.392649915772217e-05, "loss": 0.028, "step": 285160 }, { "epoch": 1.84, "learning_rate": 2.391681780336524e-05, "loss": 0.0259, "step": 285170 }, { "epoch": 1.84, "learning_rate": 2.3907136449008305e-05, "loss": 0.0202, "step": 285180 }, { "epoch": 1.84, "learning_rate": 2.3897455094651375e-05, "loss": 0.0212, "step": 285190 }, { "epoch": 1.84, "learning_rate": 2.3887773740294437e-05, "loss": 0.018, "step": 285200 }, { "epoch": 1.84, "learning_rate": 2.3878092385937507e-05, "loss": 0.02, "step": 285210 }, { "epoch": 1.84, "learning_rate": 2.3868411031580577e-05, "loss": 0.0225, "step": 285220 }, { "epoch": 1.84, "learning_rate": 2.3858729677223643e-05, "loss": 0.0286, "step": 285230 }, { "epoch": 1.84, "learning_rate": 2.3849048322866713e-05, "loss": 0.0209, "step": 285240 }, { "epoch": 1.84, "learning_rate": 2.3839366968509782e-05, "loss": 0.0192, "step": 285250 }, { "epoch": 1.84, "learning_rate": 2.382968561415285e-05, "loss": 0.0258, "step": 285260 }, { "epoch": 1.84, "learning_rate": 2.3820004259795915e-05, "loss": 0.0237, "step": 285270 }, { "epoch": 1.84, "learning_rate": 2.381032290543898e-05, "loss": 0.0244, "step": 285280 }, { "epoch": 1.84, "learning_rate": 2.380064155108205e-05, "loss": 0.0239, "step": 285290 }, { "epoch": 1.84, "learning_rate": 2.379096019672512e-05, "loss": 0.0178, "step": 285300 }, { "epoch": 1.84, "learning_rate": 2.3781278842368186e-05, "loss": 0.0237, "step": 285310 }, { "epoch": 1.84, "learning_rate": 2.3771597488011256e-05, "loss": 0.0208, "step": 285320 }, { "epoch": 1.84, "learning_rate": 2.3761916133654326e-05, "loss": 0.0243, "step": 285330 }, { "epoch": 1.84, "learning_rate": 2.375223477929739e-05, "loss": 0.0253, "step": 285340 }, { "epoch": 1.84, "learning_rate": 2.3742553424940458e-05, "loss": 0.0238, "step": 285350 }, { "epoch": 1.84, "learning_rate": 2.3732872070583524e-05, "loss": 0.0246, "step": 285360 }, { "epoch": 1.84, "learning_rate": 2.3723190716226594e-05, "loss": 0.0231, "step": 285370 }, { "epoch": 1.84, "learning_rate": 2.3713509361869664e-05, "loss": 0.0183, "step": 285380 }, { "epoch": 1.84, "learning_rate": 2.370382800751273e-05, "loss": 0.0239, "step": 285390 }, { "epoch": 1.84, "learning_rate": 2.3694146653155796e-05, "loss": 0.0206, "step": 285400 }, { "epoch": 1.84, "learning_rate": 2.3684465298798862e-05, "loss": 0.0226, "step": 285410 }, { "epoch": 1.84, "learning_rate": 2.3674783944441932e-05, "loss": 0.0256, "step": 285420 }, { "epoch": 1.84, "learning_rate": 2.3665102590085e-05, "loss": 0.0219, "step": 285430 }, { "epoch": 1.84, "learning_rate": 2.3655421235728068e-05, "loss": 0.0223, "step": 285440 }, { "epoch": 1.84, "learning_rate": 2.3645739881371137e-05, "loss": 0.022, "step": 285450 }, { "epoch": 1.84, "learning_rate": 2.3636058527014204e-05, "loss": 0.0198, "step": 285460 }, { "epoch": 1.84, "learning_rate": 2.362637717265727e-05, "loss": 0.0206, "step": 285470 }, { "epoch": 1.84, "learning_rate": 2.361669581830034e-05, "loss": 0.0232, "step": 285480 }, { "epoch": 1.84, "learning_rate": 2.3607014463943406e-05, "loss": 0.0235, "step": 285490 }, { "epoch": 1.84, "learning_rate": 2.3597333109586475e-05, "loss": 0.0221, "step": 285500 }, { "epoch": 1.84, "learning_rate": 2.358765175522954e-05, "loss": 0.0212, "step": 285510 }, { "epoch": 1.84, "learning_rate": 2.357797040087261e-05, "loss": 0.0275, "step": 285520 }, { "epoch": 1.84, "learning_rate": 2.356828904651568e-05, "loss": 0.0235, "step": 285530 }, { "epoch": 1.84, "learning_rate": 2.3558607692158744e-05, "loss": 0.0191, "step": 285540 }, { "epoch": 1.84, "learning_rate": 2.3548926337801813e-05, "loss": 0.0261, "step": 285550 }, { "epoch": 1.84, "learning_rate": 2.353924498344488e-05, "loss": 0.0216, "step": 285560 }, { "epoch": 1.84, "learning_rate": 2.352956362908795e-05, "loss": 0.0216, "step": 285570 }, { "epoch": 1.84, "learning_rate": 2.351988227473102e-05, "loss": 0.0235, "step": 285580 }, { "epoch": 1.84, "learning_rate": 2.3510200920374085e-05, "loss": 0.0275, "step": 285590 }, { "epoch": 1.84, "learning_rate": 2.3500519566017155e-05, "loss": 0.0261, "step": 285600 }, { "epoch": 1.84, "learning_rate": 2.3490838211660218e-05, "loss": 0.0257, "step": 285610 }, { "epoch": 1.84, "learning_rate": 2.3481156857303287e-05, "loss": 0.0277, "step": 285620 }, { "epoch": 1.84, "learning_rate": 2.3471475502946357e-05, "loss": 0.0217, "step": 285630 }, { "epoch": 1.84, "learning_rate": 2.3461794148589423e-05, "loss": 0.0244, "step": 285640 }, { "epoch": 1.84, "learning_rate": 2.3452112794232493e-05, "loss": 0.0255, "step": 285650 }, { "epoch": 1.84, "learning_rate": 2.3442431439875562e-05, "loss": 0.0211, "step": 285660 }, { "epoch": 1.84, "learning_rate": 2.343275008551863e-05, "loss": 0.0285, "step": 285670 }, { "epoch": 1.84, "learning_rate": 2.3423068731161695e-05, "loss": 0.0213, "step": 285680 }, { "epoch": 1.84, "learning_rate": 2.341338737680476e-05, "loss": 0.0233, "step": 285690 }, { "epoch": 1.84, "learning_rate": 2.340370602244783e-05, "loss": 0.0228, "step": 285700 }, { "epoch": 1.84, "learning_rate": 2.33940246680909e-05, "loss": 0.0206, "step": 285710 }, { "epoch": 1.84, "learning_rate": 2.3384343313733967e-05, "loss": 0.0231, "step": 285720 }, { "epoch": 1.84, "learning_rate": 2.3374661959377036e-05, "loss": 0.0346, "step": 285730 }, { "epoch": 1.84, "learning_rate": 2.3364980605020106e-05, "loss": 0.0195, "step": 285740 }, { "epoch": 1.84, "learning_rate": 2.335529925066317e-05, "loss": 0.026, "step": 285750 }, { "epoch": 1.84, "learning_rate": 2.3345617896306238e-05, "loss": 0.0221, "step": 285760 }, { "epoch": 1.84, "learning_rate": 2.3335936541949304e-05, "loss": 0.0265, "step": 285770 }, { "epoch": 1.84, "learning_rate": 2.3326255187592374e-05, "loss": 0.0222, "step": 285780 }, { "epoch": 1.84, "learning_rate": 2.3316573833235444e-05, "loss": 0.0226, "step": 285790 }, { "epoch": 1.84, "learning_rate": 2.330689247887851e-05, "loss": 0.0226, "step": 285800 }, { "epoch": 1.84, "learning_rate": 2.329721112452158e-05, "loss": 0.022, "step": 285810 }, { "epoch": 1.84, "learning_rate": 2.3287529770164642e-05, "loss": 0.024, "step": 285820 }, { "epoch": 1.84, "learning_rate": 2.3277848415807712e-05, "loss": 0.0228, "step": 285830 }, { "epoch": 1.84, "learning_rate": 2.3268167061450782e-05, "loss": 0.0246, "step": 285840 }, { "epoch": 1.84, "learning_rate": 2.3258485707093848e-05, "loss": 0.0247, "step": 285850 }, { "epoch": 1.85, "learning_rate": 2.3248804352736918e-05, "loss": 0.0224, "step": 285860 }, { "epoch": 1.85, "learning_rate": 2.3239122998379987e-05, "loss": 0.026, "step": 285870 }, { "epoch": 1.85, "learning_rate": 2.3229441644023053e-05, "loss": 0.0238, "step": 285880 }, { "epoch": 1.85, "learning_rate": 2.321976028966612e-05, "loss": 0.0265, "step": 285890 }, { "epoch": 1.85, "learning_rate": 2.3210078935309186e-05, "loss": 0.0216, "step": 285900 }, { "epoch": 1.85, "learning_rate": 2.3200397580952256e-05, "loss": 0.029, "step": 285910 }, { "epoch": 1.85, "learning_rate": 2.3190716226595325e-05, "loss": 0.0242, "step": 285920 }, { "epoch": 1.85, "learning_rate": 2.318103487223839e-05, "loss": 0.0222, "step": 285930 }, { "epoch": 1.85, "learning_rate": 2.317135351788146e-05, "loss": 0.0192, "step": 285940 }, { "epoch": 1.85, "learning_rate": 2.316167216352453e-05, "loss": 0.0223, "step": 285950 }, { "epoch": 1.85, "learning_rate": 2.3151990809167594e-05, "loss": 0.021, "step": 285960 }, { "epoch": 1.85, "learning_rate": 2.3142309454810663e-05, "loss": 0.0256, "step": 285970 }, { "epoch": 1.85, "learning_rate": 2.313262810045373e-05, "loss": 0.0212, "step": 285980 }, { "epoch": 1.85, "learning_rate": 2.31229467460968e-05, "loss": 0.0251, "step": 285990 }, { "epoch": 1.85, "learning_rate": 2.311326539173987e-05, "loss": 0.0278, "step": 286000 }, { "epoch": 1.85, "eval_cer": 0.9198391142243815, "eval_loss": 0.017069820314645767, "eval_runtime": 120.131, "eval_samples_per_second": 16.648, "eval_steps_per_second": 4.162, "step": 286000 }, { "epoch": 1.85, "learning_rate": 2.3103584037382935e-05, "loss": 0.0253, "step": 286010 }, { "epoch": 1.85, "learning_rate": 2.3093902683026005e-05, "loss": 0.0194, "step": 286020 }, { "epoch": 1.85, "learning_rate": 2.3084221328669067e-05, "loss": 0.0229, "step": 286030 }, { "epoch": 1.85, "learning_rate": 2.3074539974312137e-05, "loss": 0.0207, "step": 286040 }, { "epoch": 1.85, "learning_rate": 2.3064858619955207e-05, "loss": 0.0254, "step": 286050 }, { "epoch": 1.85, "learning_rate": 2.3055177265598273e-05, "loss": 0.0226, "step": 286060 }, { "epoch": 1.85, "learning_rate": 2.3045495911241342e-05, "loss": 0.0318, "step": 286070 }, { "epoch": 1.85, "learning_rate": 2.3035814556884412e-05, "loss": 0.0185, "step": 286080 }, { "epoch": 1.85, "learning_rate": 2.302613320252748e-05, "loss": 0.0243, "step": 286090 }, { "epoch": 1.85, "learning_rate": 2.3016451848170545e-05, "loss": 0.0232, "step": 286100 }, { "epoch": 1.85, "learning_rate": 2.300677049381361e-05, "loss": 0.0262, "step": 286110 }, { "epoch": 1.85, "learning_rate": 2.299708913945668e-05, "loss": 0.0173, "step": 286120 }, { "epoch": 1.85, "learning_rate": 2.298740778509975e-05, "loss": 0.0198, "step": 286130 }, { "epoch": 1.85, "learning_rate": 2.2977726430742816e-05, "loss": 0.021, "step": 286140 }, { "epoch": 1.85, "learning_rate": 2.2968045076385886e-05, "loss": 0.0229, "step": 286150 }, { "epoch": 1.85, "learning_rate": 2.2958363722028952e-05, "loss": 0.0216, "step": 286160 }, { "epoch": 1.85, "learning_rate": 2.294868236767202e-05, "loss": 0.0224, "step": 286170 }, { "epoch": 1.85, "learning_rate": 2.2939001013315088e-05, "loss": 0.0228, "step": 286180 }, { "epoch": 1.85, "learning_rate": 2.2929319658958154e-05, "loss": 0.0205, "step": 286190 }, { "epoch": 1.85, "learning_rate": 2.2919638304601224e-05, "loss": 0.027, "step": 286200 }, { "epoch": 1.85, "learning_rate": 2.290995695024429e-05, "loss": 0.0244, "step": 286210 }, { "epoch": 1.85, "learning_rate": 2.290027559588736e-05, "loss": 0.03, "step": 286220 }, { "epoch": 1.85, "learning_rate": 2.2890594241530426e-05, "loss": 0.0197, "step": 286230 }, { "epoch": 1.85, "learning_rate": 2.2880912887173492e-05, "loss": 0.0194, "step": 286240 }, { "epoch": 1.85, "learning_rate": 2.2871231532816562e-05, "loss": 0.0268, "step": 286250 }, { "epoch": 1.85, "learning_rate": 2.2861550178459628e-05, "loss": 0.0195, "step": 286260 }, { "epoch": 1.85, "learning_rate": 2.2851868824102698e-05, "loss": 0.0228, "step": 286270 }, { "epoch": 1.85, "learning_rate": 2.2842187469745767e-05, "loss": 0.0223, "step": 286280 }, { "epoch": 1.85, "learning_rate": 2.2832506115388834e-05, "loss": 0.0197, "step": 286290 }, { "epoch": 1.85, "learning_rate": 2.28228247610319e-05, "loss": 0.0212, "step": 286300 }, { "epoch": 1.85, "learning_rate": 2.2813143406674966e-05, "loss": 0.0259, "step": 286310 }, { "epoch": 1.85, "learning_rate": 2.2803462052318036e-05, "loss": 0.0243, "step": 286320 }, { "epoch": 1.85, "learning_rate": 2.2793780697961105e-05, "loss": 0.0278, "step": 286330 }, { "epoch": 1.85, "learning_rate": 2.278409934360417e-05, "loss": 0.0226, "step": 286340 }, { "epoch": 1.85, "learning_rate": 2.277441798924724e-05, "loss": 0.0206, "step": 286350 }, { "epoch": 1.85, "learning_rate": 2.276473663489031e-05, "loss": 0.022, "step": 286360 }, { "epoch": 1.85, "learning_rate": 2.2755055280533374e-05, "loss": 0.0227, "step": 286370 }, { "epoch": 1.85, "learning_rate": 2.2745373926176443e-05, "loss": 0.0235, "step": 286380 }, { "epoch": 1.85, "learning_rate": 2.273569257181951e-05, "loss": 0.0279, "step": 286390 }, { "epoch": 1.85, "learning_rate": 2.272601121746258e-05, "loss": 0.0195, "step": 286400 }, { "epoch": 1.85, "learning_rate": 2.271632986310565e-05, "loss": 0.0237, "step": 286410 }, { "epoch": 1.85, "learning_rate": 2.2706648508748715e-05, "loss": 0.0205, "step": 286420 }, { "epoch": 1.85, "learning_rate": 2.2696967154391785e-05, "loss": 0.0188, "step": 286430 }, { "epoch": 1.85, "learning_rate": 2.2687285800034848e-05, "loss": 0.0192, "step": 286440 }, { "epoch": 1.85, "learning_rate": 2.2677604445677917e-05, "loss": 0.0208, "step": 286450 }, { "epoch": 1.85, "learning_rate": 2.2667923091320987e-05, "loss": 0.0185, "step": 286460 }, { "epoch": 1.85, "learning_rate": 2.2658241736964053e-05, "loss": 0.0181, "step": 286470 }, { "epoch": 1.85, "learning_rate": 2.2648560382607123e-05, "loss": 0.0227, "step": 286480 }, { "epoch": 1.85, "learning_rate": 2.2638879028250192e-05, "loss": 0.0262, "step": 286490 }, { "epoch": 1.85, "learning_rate": 2.262919767389326e-05, "loss": 0.0224, "step": 286500 }, { "epoch": 1.85, "learning_rate": 2.2619516319536325e-05, "loss": 0.0187, "step": 286510 }, { "epoch": 1.85, "learning_rate": 2.260983496517939e-05, "loss": 0.0241, "step": 286520 }, { "epoch": 1.85, "learning_rate": 2.260015361082246e-05, "loss": 0.0178, "step": 286530 }, { "epoch": 1.85, "learning_rate": 2.259047225646553e-05, "loss": 0.0294, "step": 286540 }, { "epoch": 1.85, "learning_rate": 2.2580790902108597e-05, "loss": 0.0198, "step": 286550 }, { "epoch": 1.85, "learning_rate": 2.2571109547751666e-05, "loss": 0.0277, "step": 286560 }, { "epoch": 1.85, "learning_rate": 2.2561428193394736e-05, "loss": 0.0197, "step": 286570 }, { "epoch": 1.85, "learning_rate": 2.25517468390378e-05, "loss": 0.0304, "step": 286580 }, { "epoch": 1.85, "learning_rate": 2.2542065484680868e-05, "loss": 0.0245, "step": 286590 }, { "epoch": 1.85, "learning_rate": 2.2532384130323934e-05, "loss": 0.0269, "step": 286600 }, { "epoch": 1.85, "learning_rate": 2.2522702775967004e-05, "loss": 0.0233, "step": 286610 }, { "epoch": 1.85, "learning_rate": 2.2513021421610074e-05, "loss": 0.0243, "step": 286620 }, { "epoch": 1.85, "learning_rate": 2.250334006725314e-05, "loss": 0.0189, "step": 286630 }, { "epoch": 1.85, "learning_rate": 2.249365871289621e-05, "loss": 0.022, "step": 286640 }, { "epoch": 1.85, "learning_rate": 2.2483977358539272e-05, "loss": 0.0189, "step": 286650 }, { "epoch": 1.85, "learning_rate": 2.2474296004182342e-05, "loss": 0.0226, "step": 286660 }, { "epoch": 1.85, "learning_rate": 2.2464614649825412e-05, "loss": 0.0258, "step": 286670 }, { "epoch": 1.85, "learning_rate": 2.2454933295468478e-05, "loss": 0.0248, "step": 286680 }, { "epoch": 1.85, "learning_rate": 2.2445251941111548e-05, "loss": 0.0238, "step": 286690 }, { "epoch": 1.85, "learning_rate": 2.2435570586754617e-05, "loss": 0.0222, "step": 286700 }, { "epoch": 1.85, "learning_rate": 2.2425889232397683e-05, "loss": 0.0272, "step": 286710 }, { "epoch": 1.85, "learning_rate": 2.241620787804075e-05, "loss": 0.0222, "step": 286720 }, { "epoch": 1.85, "learning_rate": 2.2406526523683816e-05, "loss": 0.0197, "step": 286730 }, { "epoch": 1.85, "learning_rate": 2.2396845169326886e-05, "loss": 0.0239, "step": 286740 }, { "epoch": 1.85, "learning_rate": 2.2387163814969955e-05, "loss": 0.0207, "step": 286750 }, { "epoch": 1.85, "learning_rate": 2.237748246061302e-05, "loss": 0.0204, "step": 286760 }, { "epoch": 1.85, "learning_rate": 2.236780110625609e-05, "loss": 0.0221, "step": 286770 }, { "epoch": 1.85, "learning_rate": 2.2358119751899157e-05, "loss": 0.0208, "step": 286780 }, { "epoch": 1.85, "learning_rate": 2.2348438397542224e-05, "loss": 0.0306, "step": 286790 }, { "epoch": 1.85, "learning_rate": 2.2338757043185293e-05, "loss": 0.0256, "step": 286800 }, { "epoch": 1.85, "learning_rate": 2.232907568882836e-05, "loss": 0.021, "step": 286810 }, { "epoch": 1.85, "learning_rate": 2.231939433447143e-05, "loss": 0.0223, "step": 286820 }, { "epoch": 1.85, "learning_rate": 2.2309712980114495e-05, "loss": 0.0205, "step": 286830 }, { "epoch": 1.85, "learning_rate": 2.2300031625757565e-05, "loss": 0.0213, "step": 286840 }, { "epoch": 1.85, "learning_rate": 2.2290350271400635e-05, "loss": 0.0217, "step": 286850 }, { "epoch": 1.85, "learning_rate": 2.2280668917043697e-05, "loss": 0.0254, "step": 286860 }, { "epoch": 1.85, "learning_rate": 2.2270987562686767e-05, "loss": 0.0222, "step": 286870 }, { "epoch": 1.85, "learning_rate": 2.2261306208329833e-05, "loss": 0.0222, "step": 286880 }, { "epoch": 1.85, "learning_rate": 2.2251624853972903e-05, "loss": 0.023, "step": 286890 }, { "epoch": 1.85, "learning_rate": 2.2241943499615972e-05, "loss": 0.0213, "step": 286900 }, { "epoch": 1.85, "learning_rate": 2.223226214525904e-05, "loss": 0.0228, "step": 286910 }, { "epoch": 1.85, "learning_rate": 2.222258079090211e-05, "loss": 0.0245, "step": 286920 }, { "epoch": 1.85, "learning_rate": 2.2212899436545175e-05, "loss": 0.0227, "step": 286930 }, { "epoch": 1.85, "learning_rate": 2.220321808218824e-05, "loss": 0.0232, "step": 286940 }, { "epoch": 1.85, "learning_rate": 2.219353672783131e-05, "loss": 0.0256, "step": 286950 }, { "epoch": 1.85, "learning_rate": 2.2183855373474377e-05, "loss": 0.0223, "step": 286960 }, { "epoch": 1.85, "learning_rate": 2.2174174019117446e-05, "loss": 0.0259, "step": 286970 }, { "epoch": 1.85, "learning_rate": 2.2164492664760516e-05, "loss": 0.0225, "step": 286980 }, { "epoch": 1.85, "learning_rate": 2.2154811310403582e-05, "loss": 0.0199, "step": 286990 }, { "epoch": 1.85, "learning_rate": 2.214512995604665e-05, "loss": 0.0244, "step": 287000 }, { "epoch": 1.85, "eval_cer": 0.9198436334877415, "eval_loss": 0.017086287960410118, "eval_runtime": 119.8872, "eval_samples_per_second": 16.682, "eval_steps_per_second": 4.171, "step": 287000 }, { "epoch": 1.85, "learning_rate": 2.2135448601689715e-05, "loss": 0.0207, "step": 287010 }, { "epoch": 1.85, "learning_rate": 2.2125767247332784e-05, "loss": 0.0265, "step": 287020 }, { "epoch": 1.85, "learning_rate": 2.2116085892975854e-05, "loss": 0.0233, "step": 287030 }, { "epoch": 1.85, "learning_rate": 2.210640453861892e-05, "loss": 0.023, "step": 287040 }, { "epoch": 1.85, "learning_rate": 2.209672318426199e-05, "loss": 0.0213, "step": 287050 }, { "epoch": 1.85, "learning_rate": 2.208704182990506e-05, "loss": 0.0221, "step": 287060 }, { "epoch": 1.85, "learning_rate": 2.2077360475548122e-05, "loss": 0.0221, "step": 287070 }, { "epoch": 1.85, "learning_rate": 2.2067679121191192e-05, "loss": 0.0203, "step": 287080 }, { "epoch": 1.85, "learning_rate": 2.2057997766834258e-05, "loss": 0.018, "step": 287090 }, { "epoch": 1.85, "learning_rate": 2.2048316412477328e-05, "loss": 0.0229, "step": 287100 }, { "epoch": 1.85, "learning_rate": 2.2038635058120397e-05, "loss": 0.0192, "step": 287110 }, { "epoch": 1.85, "learning_rate": 2.2028953703763464e-05, "loss": 0.0214, "step": 287120 }, { "epoch": 1.85, "learning_rate": 2.201927234940653e-05, "loss": 0.0192, "step": 287130 }, { "epoch": 1.85, "learning_rate": 2.2009590995049596e-05, "loss": 0.0237, "step": 287140 }, { "epoch": 1.85, "learning_rate": 2.1999909640692666e-05, "loss": 0.0257, "step": 287150 }, { "epoch": 1.85, "learning_rate": 2.1990228286335735e-05, "loss": 0.0214, "step": 287160 }, { "epoch": 1.85, "learning_rate": 2.19805469319788e-05, "loss": 0.0225, "step": 287170 }, { "epoch": 1.85, "learning_rate": 2.197086557762187e-05, "loss": 0.0265, "step": 287180 }, { "epoch": 1.85, "learning_rate": 2.196118422326494e-05, "loss": 0.0183, "step": 287190 }, { "epoch": 1.85, "learning_rate": 2.1951502868908004e-05, "loss": 0.0209, "step": 287200 }, { "epoch": 1.85, "learning_rate": 2.1941821514551073e-05, "loss": 0.0182, "step": 287210 }, { "epoch": 1.85, "learning_rate": 2.193214016019414e-05, "loss": 0.0234, "step": 287220 }, { "epoch": 1.85, "learning_rate": 2.192245880583721e-05, "loss": 0.0237, "step": 287230 }, { "epoch": 1.85, "learning_rate": 2.191277745148028e-05, "loss": 0.0217, "step": 287240 }, { "epoch": 1.85, "learning_rate": 2.1903096097123345e-05, "loss": 0.0223, "step": 287250 }, { "epoch": 1.85, "learning_rate": 2.1893414742766415e-05, "loss": 0.0188, "step": 287260 }, { "epoch": 1.85, "learning_rate": 2.1883733388409478e-05, "loss": 0.0208, "step": 287270 }, { "epoch": 1.85, "learning_rate": 2.1874052034052547e-05, "loss": 0.0191, "step": 287280 }, { "epoch": 1.85, "learning_rate": 2.1864370679695617e-05, "loss": 0.0209, "step": 287290 }, { "epoch": 1.85, "learning_rate": 2.1854689325338683e-05, "loss": 0.0185, "step": 287300 }, { "epoch": 1.85, "learning_rate": 2.1845007970981753e-05, "loss": 0.0255, "step": 287310 }, { "epoch": 1.85, "learning_rate": 2.1835326616624822e-05, "loss": 0.021, "step": 287320 }, { "epoch": 1.85, "learning_rate": 2.182564526226789e-05, "loss": 0.0232, "step": 287330 }, { "epoch": 1.85, "learning_rate": 2.1815963907910955e-05, "loss": 0.029, "step": 287340 }, { "epoch": 1.85, "learning_rate": 2.180628255355402e-05, "loss": 0.0194, "step": 287350 }, { "epoch": 1.85, "learning_rate": 2.179660119919709e-05, "loss": 0.022, "step": 287360 }, { "epoch": 1.85, "learning_rate": 2.178691984484016e-05, "loss": 0.0242, "step": 287370 }, { "epoch": 1.85, "learning_rate": 2.1777238490483226e-05, "loss": 0.0208, "step": 287380 }, { "epoch": 1.85, "learning_rate": 2.1767557136126296e-05, "loss": 0.0263, "step": 287390 }, { "epoch": 1.85, "learning_rate": 2.1757875781769366e-05, "loss": 0.0207, "step": 287400 }, { "epoch": 1.86, "learning_rate": 2.174819442741243e-05, "loss": 0.0241, "step": 287410 }, { "epoch": 1.86, "learning_rate": 2.1738513073055498e-05, "loss": 0.0259, "step": 287420 }, { "epoch": 1.86, "learning_rate": 2.1728831718698564e-05, "loss": 0.0247, "step": 287430 }, { "epoch": 1.86, "learning_rate": 2.1719150364341634e-05, "loss": 0.0222, "step": 287440 }, { "epoch": 1.86, "learning_rate": 2.1709469009984704e-05, "loss": 0.0344, "step": 287450 }, { "epoch": 1.86, "learning_rate": 2.169978765562777e-05, "loss": 0.0215, "step": 287460 }, { "epoch": 1.86, "learning_rate": 2.169010630127084e-05, "loss": 0.0187, "step": 287470 }, { "epoch": 1.86, "learning_rate": 2.1680424946913902e-05, "loss": 0.0217, "step": 287480 }, { "epoch": 1.86, "learning_rate": 2.1670743592556972e-05, "loss": 0.0225, "step": 287490 }, { "epoch": 1.86, "learning_rate": 2.166106223820004e-05, "loss": 0.0189, "step": 287500 }, { "epoch": 1.86, "learning_rate": 2.1651380883843108e-05, "loss": 0.0209, "step": 287510 }, { "epoch": 1.86, "learning_rate": 2.1641699529486178e-05, "loss": 0.0255, "step": 287520 }, { "epoch": 1.86, "learning_rate": 2.1632018175129244e-05, "loss": 0.0215, "step": 287530 }, { "epoch": 1.86, "learning_rate": 2.1622336820772313e-05, "loss": 0.0225, "step": 287540 }, { "epoch": 1.86, "learning_rate": 2.161265546641538e-05, "loss": 0.0241, "step": 287550 }, { "epoch": 1.86, "learning_rate": 2.1602974112058446e-05, "loss": 0.0262, "step": 287560 }, { "epoch": 1.86, "learning_rate": 2.1593292757701516e-05, "loss": 0.0231, "step": 287570 }, { "epoch": 1.86, "learning_rate": 2.1583611403344582e-05, "loss": 0.019, "step": 287580 }, { "epoch": 1.86, "learning_rate": 2.157393004898765e-05, "loss": 0.019, "step": 287590 }, { "epoch": 1.86, "learning_rate": 2.156424869463072e-05, "loss": 0.0241, "step": 287600 }, { "epoch": 1.86, "learning_rate": 2.1554567340273787e-05, "loss": 0.0202, "step": 287610 }, { "epoch": 1.86, "learning_rate": 2.1544885985916854e-05, "loss": 0.0285, "step": 287620 }, { "epoch": 1.86, "learning_rate": 2.153520463155992e-05, "loss": 0.0207, "step": 287630 }, { "epoch": 1.86, "learning_rate": 2.152552327720299e-05, "loss": 0.0204, "step": 287640 }, { "epoch": 1.86, "learning_rate": 2.151584192284606e-05, "loss": 0.0251, "step": 287650 }, { "epoch": 1.86, "learning_rate": 2.1506160568489125e-05, "loss": 0.0212, "step": 287660 }, { "epoch": 1.86, "learning_rate": 2.1496479214132195e-05, "loss": 0.0196, "step": 287670 }, { "epoch": 1.86, "learning_rate": 2.1486797859775264e-05, "loss": 0.0184, "step": 287680 }, { "epoch": 1.86, "learning_rate": 2.1477116505418327e-05, "loss": 0.0205, "step": 287690 }, { "epoch": 1.86, "learning_rate": 2.1467435151061397e-05, "loss": 0.0217, "step": 287700 }, { "epoch": 1.86, "learning_rate": 2.1457753796704463e-05, "loss": 0.0225, "step": 287710 }, { "epoch": 1.86, "learning_rate": 2.1448072442347533e-05, "loss": 0.0229, "step": 287720 }, { "epoch": 1.86, "learning_rate": 2.1438391087990602e-05, "loss": 0.0215, "step": 287730 }, { "epoch": 1.86, "learning_rate": 2.142870973363367e-05, "loss": 0.0237, "step": 287740 }, { "epoch": 1.86, "learning_rate": 2.141902837927674e-05, "loss": 0.0273, "step": 287750 }, { "epoch": 1.86, "learning_rate": 2.14093470249198e-05, "loss": 0.0264, "step": 287760 }, { "epoch": 1.86, "learning_rate": 2.139966567056287e-05, "loss": 0.0275, "step": 287770 }, { "epoch": 1.86, "learning_rate": 2.138998431620594e-05, "loss": 0.0215, "step": 287780 }, { "epoch": 1.86, "learning_rate": 2.1380302961849007e-05, "loss": 0.0211, "step": 287790 }, { "epoch": 1.86, "learning_rate": 2.1370621607492076e-05, "loss": 0.0228, "step": 287800 }, { "epoch": 1.86, "learning_rate": 2.1360940253135146e-05, "loss": 0.0276, "step": 287810 }, { "epoch": 1.86, "learning_rate": 2.1351258898778212e-05, "loss": 0.0221, "step": 287820 }, { "epoch": 1.86, "learning_rate": 2.134157754442128e-05, "loss": 0.0227, "step": 287830 }, { "epoch": 1.86, "learning_rate": 2.1331896190064345e-05, "loss": 0.0244, "step": 287840 }, { "epoch": 1.86, "learning_rate": 2.1322214835707414e-05, "loss": 0.0268, "step": 287850 }, { "epoch": 1.86, "learning_rate": 2.1312533481350484e-05, "loss": 0.0249, "step": 287860 }, { "epoch": 1.86, "learning_rate": 2.130285212699355e-05, "loss": 0.0271, "step": 287870 }, { "epoch": 1.86, "learning_rate": 2.129317077263662e-05, "loss": 0.0221, "step": 287880 }, { "epoch": 1.86, "learning_rate": 2.128348941827969e-05, "loss": 0.0217, "step": 287890 }, { "epoch": 1.86, "learning_rate": 2.1273808063922752e-05, "loss": 0.0246, "step": 287900 }, { "epoch": 1.86, "learning_rate": 2.1264126709565822e-05, "loss": 0.026, "step": 287910 }, { "epoch": 1.86, "learning_rate": 2.1254445355208888e-05, "loss": 0.0267, "step": 287920 }, { "epoch": 1.86, "learning_rate": 2.1244764000851958e-05, "loss": 0.0246, "step": 287930 }, { "epoch": 1.86, "learning_rate": 2.1235082646495027e-05, "loss": 0.0205, "step": 287940 }, { "epoch": 1.86, "learning_rate": 2.1225401292138094e-05, "loss": 0.0197, "step": 287950 }, { "epoch": 1.86, "learning_rate": 2.121571993778116e-05, "loss": 0.022, "step": 287960 }, { "epoch": 1.86, "learning_rate": 2.1206038583424226e-05, "loss": 0.0237, "step": 287970 }, { "epoch": 1.86, "learning_rate": 2.1196357229067296e-05, "loss": 0.022, "step": 287980 }, { "epoch": 1.86, "learning_rate": 2.1186675874710365e-05, "loss": 0.0299, "step": 287990 }, { "epoch": 1.86, "learning_rate": 2.117699452035343e-05, "loss": 0.0223, "step": 288000 }, { "epoch": 1.86, "eval_cer": 0.9198327872556773, "eval_loss": 0.016944361850619316, "eval_runtime": 120.4246, "eval_samples_per_second": 16.608, "eval_steps_per_second": 4.152, "step": 288000 }, { "epoch": 1.86, "learning_rate": 2.11673131659965e-05, "loss": 0.025, "step": 288010 }, { "epoch": 1.86, "learning_rate": 2.115763181163957e-05, "loss": 0.0272, "step": 288020 }, { "epoch": 1.86, "learning_rate": 2.1147950457282634e-05, "loss": 0.028, "step": 288030 }, { "epoch": 1.86, "learning_rate": 2.1138269102925703e-05, "loss": 0.0282, "step": 288040 }, { "epoch": 1.86, "learning_rate": 2.112858774856877e-05, "loss": 0.0293, "step": 288050 }, { "epoch": 1.86, "learning_rate": 2.111890639421184e-05, "loss": 0.0233, "step": 288060 }, { "epoch": 1.86, "learning_rate": 2.110922503985491e-05, "loss": 0.0248, "step": 288070 }, { "epoch": 1.86, "learning_rate": 2.1099543685497975e-05, "loss": 0.0184, "step": 288080 }, { "epoch": 1.86, "learning_rate": 2.1089862331141045e-05, "loss": 0.0227, "step": 288090 }, { "epoch": 1.86, "learning_rate": 2.1080180976784108e-05, "loss": 0.0218, "step": 288100 }, { "epoch": 1.86, "learning_rate": 2.1070499622427177e-05, "loss": 0.02, "step": 288110 }, { "epoch": 1.86, "learning_rate": 2.1060818268070247e-05, "loss": 0.0231, "step": 288120 }, { "epoch": 1.86, "learning_rate": 2.1051136913713313e-05, "loss": 0.0227, "step": 288130 }, { "epoch": 1.86, "learning_rate": 2.1041455559356383e-05, "loss": 0.0224, "step": 288140 }, { "epoch": 1.86, "learning_rate": 2.1031774204999452e-05, "loss": 0.0211, "step": 288150 }, { "epoch": 1.86, "learning_rate": 2.102209285064252e-05, "loss": 0.0257, "step": 288160 }, { "epoch": 1.86, "learning_rate": 2.1012411496285585e-05, "loss": 0.0225, "step": 288170 }, { "epoch": 1.86, "learning_rate": 2.100273014192865e-05, "loss": 0.0189, "step": 288180 }, { "epoch": 1.86, "learning_rate": 2.099304878757172e-05, "loss": 0.0247, "step": 288190 }, { "epoch": 1.86, "learning_rate": 2.098336743321479e-05, "loss": 0.0207, "step": 288200 }, { "epoch": 1.86, "learning_rate": 2.0973686078857856e-05, "loss": 0.0244, "step": 288210 }, { "epoch": 1.86, "learning_rate": 2.0964004724500926e-05, "loss": 0.0244, "step": 288220 }, { "epoch": 1.86, "learning_rate": 2.0954323370143992e-05, "loss": 0.0222, "step": 288230 }, { "epoch": 1.86, "learning_rate": 2.094464201578706e-05, "loss": 0.0219, "step": 288240 }, { "epoch": 1.86, "learning_rate": 2.0934960661430128e-05, "loss": 0.0243, "step": 288250 }, { "epoch": 1.86, "learning_rate": 2.0925279307073194e-05, "loss": 0.0197, "step": 288260 }, { "epoch": 1.86, "learning_rate": 2.0915597952716264e-05, "loss": 0.025, "step": 288270 }, { "epoch": 1.86, "learning_rate": 2.090591659835933e-05, "loss": 0.0246, "step": 288280 }, { "epoch": 1.86, "learning_rate": 2.08962352440024e-05, "loss": 0.022, "step": 288290 }, { "epoch": 1.86, "learning_rate": 2.088655388964547e-05, "loss": 0.0222, "step": 288300 }, { "epoch": 1.86, "learning_rate": 2.0876872535288532e-05, "loss": 0.0271, "step": 288310 }, { "epoch": 1.86, "learning_rate": 2.0867191180931602e-05, "loss": 0.0207, "step": 288320 }, { "epoch": 1.86, "learning_rate": 2.0857509826574668e-05, "loss": 0.0178, "step": 288330 }, { "epoch": 1.86, "learning_rate": 2.0847828472217738e-05, "loss": 0.023, "step": 288340 }, { "epoch": 1.86, "learning_rate": 2.0838147117860808e-05, "loss": 0.0235, "step": 288350 }, { "epoch": 1.86, "learning_rate": 2.0828465763503874e-05, "loss": 0.0177, "step": 288360 }, { "epoch": 1.86, "learning_rate": 2.0818784409146943e-05, "loss": 0.0243, "step": 288370 }, { "epoch": 1.86, "learning_rate": 2.0809103054790006e-05, "loss": 0.0214, "step": 288380 }, { "epoch": 1.86, "learning_rate": 2.0799421700433076e-05, "loss": 0.0221, "step": 288390 }, { "epoch": 1.86, "learning_rate": 2.0789740346076146e-05, "loss": 0.0203, "step": 288400 }, { "epoch": 1.86, "learning_rate": 2.0780058991719212e-05, "loss": 0.0175, "step": 288410 }, { "epoch": 1.86, "learning_rate": 2.077037763736228e-05, "loss": 0.0201, "step": 288420 }, { "epoch": 1.86, "learning_rate": 2.076069628300535e-05, "loss": 0.025, "step": 288430 }, { "epoch": 1.86, "learning_rate": 2.0751014928648417e-05, "loss": 0.0187, "step": 288440 }, { "epoch": 1.86, "learning_rate": 2.0741333574291483e-05, "loss": 0.0225, "step": 288450 }, { "epoch": 1.86, "learning_rate": 2.073165221993455e-05, "loss": 0.0215, "step": 288460 }, { "epoch": 1.86, "learning_rate": 2.072197086557762e-05, "loss": 0.0233, "step": 288470 }, { "epoch": 1.86, "learning_rate": 2.071228951122069e-05, "loss": 0.0212, "step": 288480 }, { "epoch": 1.86, "learning_rate": 2.0702608156863755e-05, "loss": 0.0264, "step": 288490 }, { "epoch": 1.86, "learning_rate": 2.0692926802506825e-05, "loss": 0.0206, "step": 288500 }, { "epoch": 1.86, "learning_rate": 2.0683245448149894e-05, "loss": 0.0208, "step": 288510 }, { "epoch": 1.86, "learning_rate": 2.0673564093792957e-05, "loss": 0.0295, "step": 288520 }, { "epoch": 1.86, "learning_rate": 2.0663882739436027e-05, "loss": 0.0207, "step": 288530 }, { "epoch": 1.86, "learning_rate": 2.0654201385079093e-05, "loss": 0.0213, "step": 288540 }, { "epoch": 1.86, "learning_rate": 2.0644520030722163e-05, "loss": 0.0183, "step": 288550 }, { "epoch": 1.86, "learning_rate": 2.0634838676365232e-05, "loss": 0.0213, "step": 288560 }, { "epoch": 1.86, "learning_rate": 2.06251573220083e-05, "loss": 0.0219, "step": 288570 }, { "epoch": 1.86, "learning_rate": 2.061547596765137e-05, "loss": 0.024, "step": 288580 }, { "epoch": 1.86, "learning_rate": 2.060579461329443e-05, "loss": 0.0185, "step": 288590 }, { "epoch": 1.86, "learning_rate": 2.05961132589375e-05, "loss": 0.0271, "step": 288600 }, { "epoch": 1.86, "learning_rate": 2.058643190458057e-05, "loss": 0.0255, "step": 288610 }, { "epoch": 1.86, "learning_rate": 2.0576750550223637e-05, "loss": 0.0278, "step": 288620 }, { "epoch": 1.86, "learning_rate": 2.0567069195866706e-05, "loss": 0.0206, "step": 288630 }, { "epoch": 1.86, "learning_rate": 2.0557387841509776e-05, "loss": 0.024, "step": 288640 }, { "epoch": 1.86, "learning_rate": 2.0547706487152842e-05, "loss": 0.021, "step": 288650 }, { "epoch": 1.86, "learning_rate": 2.053802513279591e-05, "loss": 0.0278, "step": 288660 }, { "epoch": 1.86, "learning_rate": 2.0528343778438975e-05, "loss": 0.0231, "step": 288670 }, { "epoch": 1.86, "learning_rate": 2.0518662424082044e-05, "loss": 0.0242, "step": 288680 }, { "epoch": 1.86, "learning_rate": 2.0508981069725114e-05, "loss": 0.019, "step": 288690 }, { "epoch": 1.86, "learning_rate": 2.049929971536818e-05, "loss": 0.0216, "step": 288700 }, { "epoch": 1.86, "learning_rate": 2.048961836101125e-05, "loss": 0.0221, "step": 288710 }, { "epoch": 1.86, "learning_rate": 2.047993700665432e-05, "loss": 0.0245, "step": 288720 }, { "epoch": 1.86, "learning_rate": 2.0470255652297382e-05, "loss": 0.0231, "step": 288730 }, { "epoch": 1.86, "learning_rate": 2.0460574297940452e-05, "loss": 0.0216, "step": 288740 }, { "epoch": 1.86, "learning_rate": 2.0450892943583518e-05, "loss": 0.0234, "step": 288750 }, { "epoch": 1.86, "learning_rate": 2.0441211589226588e-05, "loss": 0.0217, "step": 288760 }, { "epoch": 1.86, "learning_rate": 2.0431530234869657e-05, "loss": 0.0238, "step": 288770 }, { "epoch": 1.86, "learning_rate": 2.0421848880512724e-05, "loss": 0.0208, "step": 288780 }, { "epoch": 1.86, "learning_rate": 2.041216752615579e-05, "loss": 0.0252, "step": 288790 }, { "epoch": 1.86, "learning_rate": 2.0402486171798856e-05, "loss": 0.0195, "step": 288800 }, { "epoch": 1.86, "learning_rate": 2.0392804817441926e-05, "loss": 0.0242, "step": 288810 }, { "epoch": 1.86, "learning_rate": 2.0383123463084995e-05, "loss": 0.0252, "step": 288820 }, { "epoch": 1.86, "learning_rate": 2.037344210872806e-05, "loss": 0.025, "step": 288830 }, { "epoch": 1.86, "learning_rate": 2.036376075437113e-05, "loss": 0.0286, "step": 288840 }, { "epoch": 1.86, "learning_rate": 2.0354079400014197e-05, "loss": 0.0181, "step": 288850 }, { "epoch": 1.86, "learning_rate": 2.0344398045657264e-05, "loss": 0.0233, "step": 288860 }, { "epoch": 1.86, "learning_rate": 2.0334716691300333e-05, "loss": 0.0216, "step": 288870 }, { "epoch": 1.86, "learning_rate": 2.03250353369434e-05, "loss": 0.0275, "step": 288880 }, { "epoch": 1.86, "learning_rate": 2.031535398258647e-05, "loss": 0.0263, "step": 288890 }, { "epoch": 1.86, "learning_rate": 2.0305672628229535e-05, "loss": 0.0256, "step": 288900 }, { "epoch": 1.86, "learning_rate": 2.0295991273872605e-05, "loss": 0.0202, "step": 288910 }, { "epoch": 1.86, "learning_rate": 2.0286309919515675e-05, "loss": 0.0258, "step": 288920 }, { "epoch": 1.86, "learning_rate": 2.0276628565158738e-05, "loss": 0.0202, "step": 288930 }, { "epoch": 1.86, "learning_rate": 2.0266947210801807e-05, "loss": 0.0221, "step": 288940 }, { "epoch": 1.86, "learning_rate": 2.0257265856444873e-05, "loss": 0.0227, "step": 288950 }, { "epoch": 1.87, "learning_rate": 2.0247584502087943e-05, "loss": 0.0245, "step": 288960 }, { "epoch": 1.87, "learning_rate": 2.0237903147731013e-05, "loss": 0.0208, "step": 288970 }, { "epoch": 1.87, "learning_rate": 2.022822179337408e-05, "loss": 0.0341, "step": 288980 }, { "epoch": 1.87, "learning_rate": 2.021854043901715e-05, "loss": 0.0197, "step": 288990 }, { "epoch": 1.87, "learning_rate": 2.020885908466021e-05, "loss": 0.0285, "step": 289000 }, { "epoch": 1.87, "eval_cer": 0.9198481527511015, "eval_loss": 0.016835737973451614, "eval_runtime": 119.8731, "eval_samples_per_second": 16.684, "eval_steps_per_second": 4.171, "step": 289000 }, { "epoch": 1.87, "learning_rate": 2.019917773030328e-05, "loss": 0.0222, "step": 289010 }, { "epoch": 1.87, "learning_rate": 2.018949637594635e-05, "loss": 0.0217, "step": 289020 }, { "epoch": 1.87, "learning_rate": 2.0179815021589417e-05, "loss": 0.0216, "step": 289030 }, { "epoch": 1.87, "learning_rate": 2.0170133667232486e-05, "loss": 0.0236, "step": 289040 }, { "epoch": 1.87, "learning_rate": 2.0160452312875556e-05, "loss": 0.0253, "step": 289050 }, { "epoch": 1.87, "learning_rate": 2.0150770958518622e-05, "loss": 0.021, "step": 289060 }, { "epoch": 1.87, "learning_rate": 2.014108960416169e-05, "loss": 0.0255, "step": 289070 }, { "epoch": 1.87, "learning_rate": 2.0131408249804755e-05, "loss": 0.0206, "step": 289080 }, { "epoch": 1.87, "learning_rate": 2.0121726895447824e-05, "loss": 0.0239, "step": 289090 }, { "epoch": 1.87, "learning_rate": 2.0112045541090894e-05, "loss": 0.0224, "step": 289100 }, { "epoch": 1.87, "learning_rate": 2.010236418673396e-05, "loss": 0.0174, "step": 289110 }, { "epoch": 1.87, "learning_rate": 2.009268283237703e-05, "loss": 0.0199, "step": 289120 }, { "epoch": 1.87, "learning_rate": 2.00830014780201e-05, "loss": 0.0259, "step": 289130 }, { "epoch": 1.87, "learning_rate": 2.0073320123663162e-05, "loss": 0.0218, "step": 289140 }, { "epoch": 1.87, "learning_rate": 2.0063638769306232e-05, "loss": 0.0208, "step": 289150 }, { "epoch": 1.87, "learning_rate": 2.0053957414949298e-05, "loss": 0.0254, "step": 289160 }, { "epoch": 1.87, "learning_rate": 2.0044276060592368e-05, "loss": 0.0212, "step": 289170 }, { "epoch": 1.87, "learning_rate": 2.0034594706235438e-05, "loss": 0.0288, "step": 289180 }, { "epoch": 1.87, "learning_rate": 2.0024913351878504e-05, "loss": 0.0245, "step": 289190 }, { "epoch": 1.87, "learning_rate": 2.0015231997521573e-05, "loss": 0.0237, "step": 289200 }, { "epoch": 1.87, "learning_rate": 2.0005550643164636e-05, "loss": 0.0228, "step": 289210 }, { "epoch": 1.87, "learning_rate": 1.9995869288807706e-05, "loss": 0.0226, "step": 289220 }, { "epoch": 1.87, "learning_rate": 1.9986187934450776e-05, "loss": 0.0171, "step": 289230 }, { "epoch": 1.87, "learning_rate": 1.9976506580093842e-05, "loss": 0.0223, "step": 289240 }, { "epoch": 1.87, "learning_rate": 1.996682522573691e-05, "loss": 0.0219, "step": 289250 }, { "epoch": 1.87, "learning_rate": 1.995714387137998e-05, "loss": 0.0206, "step": 289260 }, { "epoch": 1.87, "learning_rate": 1.9947462517023047e-05, "loss": 0.0234, "step": 289270 }, { "epoch": 1.87, "learning_rate": 1.9937781162666113e-05, "loss": 0.0208, "step": 289280 }, { "epoch": 1.87, "learning_rate": 1.992809980830918e-05, "loss": 0.0258, "step": 289290 }, { "epoch": 1.87, "learning_rate": 1.991841845395225e-05, "loss": 0.0287, "step": 289300 }, { "epoch": 1.87, "learning_rate": 1.990873709959532e-05, "loss": 0.0187, "step": 289310 }, { "epoch": 1.87, "learning_rate": 1.9899055745238385e-05, "loss": 0.0211, "step": 289320 }, { "epoch": 1.87, "learning_rate": 1.9889374390881455e-05, "loss": 0.019, "step": 289330 }, { "epoch": 1.87, "learning_rate": 1.9879693036524524e-05, "loss": 0.0247, "step": 289340 }, { "epoch": 1.87, "learning_rate": 1.9870011682167587e-05, "loss": 0.0205, "step": 289350 }, { "epoch": 1.87, "learning_rate": 1.9860330327810657e-05, "loss": 0.0213, "step": 289360 }, { "epoch": 1.87, "learning_rate": 1.9850648973453723e-05, "loss": 0.0196, "step": 289370 }, { "epoch": 1.87, "learning_rate": 1.9840967619096793e-05, "loss": 0.0182, "step": 289380 }, { "epoch": 1.87, "learning_rate": 1.9831286264739862e-05, "loss": 0.0208, "step": 289390 }, { "epoch": 1.87, "learning_rate": 1.982160491038293e-05, "loss": 0.0209, "step": 289400 }, { "epoch": 1.87, "learning_rate": 1.9811923556025998e-05, "loss": 0.024, "step": 289410 }, { "epoch": 1.87, "learning_rate": 1.980224220166906e-05, "loss": 0.0249, "step": 289420 }, { "epoch": 1.87, "learning_rate": 1.979256084731213e-05, "loss": 0.0209, "step": 289430 }, { "epoch": 1.87, "learning_rate": 1.97828794929552e-05, "loss": 0.021, "step": 289440 }, { "epoch": 1.87, "learning_rate": 1.9773198138598267e-05, "loss": 0.0209, "step": 289450 }, { "epoch": 1.87, "learning_rate": 1.9763516784241336e-05, "loss": 0.0207, "step": 289460 }, { "epoch": 1.87, "learning_rate": 1.9753835429884406e-05, "loss": 0.0233, "step": 289470 }, { "epoch": 1.87, "learning_rate": 1.9744154075527472e-05, "loss": 0.0332, "step": 289480 }, { "epoch": 1.87, "learning_rate": 1.973447272117054e-05, "loss": 0.0299, "step": 289490 }, { "epoch": 1.87, "learning_rate": 1.9724791366813605e-05, "loss": 0.0267, "step": 289500 }, { "epoch": 1.87, "learning_rate": 1.9715110012456674e-05, "loss": 0.0223, "step": 289510 }, { "epoch": 1.87, "learning_rate": 1.9705428658099744e-05, "loss": 0.0207, "step": 289520 }, { "epoch": 1.87, "learning_rate": 1.969574730374281e-05, "loss": 0.0207, "step": 289530 }, { "epoch": 1.87, "learning_rate": 1.968606594938588e-05, "loss": 0.0228, "step": 289540 }, { "epoch": 1.87, "learning_rate": 1.9676384595028946e-05, "loss": 0.0289, "step": 289550 }, { "epoch": 1.87, "learning_rate": 1.9666703240672012e-05, "loss": 0.0223, "step": 289560 }, { "epoch": 1.87, "learning_rate": 1.9657021886315082e-05, "loss": 0.0189, "step": 289570 }, { "epoch": 1.87, "learning_rate": 1.9647340531958148e-05, "loss": 0.0232, "step": 289580 }, { "epoch": 1.87, "learning_rate": 1.9637659177601218e-05, "loss": 0.0189, "step": 289590 }, { "epoch": 1.87, "learning_rate": 1.9627977823244284e-05, "loss": 0.023, "step": 289600 }, { "epoch": 1.87, "learning_rate": 1.9618296468887354e-05, "loss": 0.0194, "step": 289610 }, { "epoch": 1.87, "learning_rate": 1.9608615114530423e-05, "loss": 0.0218, "step": 289620 }, { "epoch": 1.87, "learning_rate": 1.9598933760173486e-05, "loss": 0.0251, "step": 289630 }, { "epoch": 1.87, "learning_rate": 1.9589252405816556e-05, "loss": 0.0193, "step": 289640 }, { "epoch": 1.87, "learning_rate": 1.9579571051459622e-05, "loss": 0.0186, "step": 289650 }, { "epoch": 1.87, "learning_rate": 1.956988969710269e-05, "loss": 0.0246, "step": 289660 }, { "epoch": 1.87, "learning_rate": 1.956020834274576e-05, "loss": 0.0194, "step": 289670 }, { "epoch": 1.87, "learning_rate": 1.9550526988388827e-05, "loss": 0.022, "step": 289680 }, { "epoch": 1.87, "learning_rate": 1.9540845634031894e-05, "loss": 0.031, "step": 289690 }, { "epoch": 1.87, "learning_rate": 1.953116427967496e-05, "loss": 0.0227, "step": 289700 }, { "epoch": 1.87, "learning_rate": 1.952148292531803e-05, "loss": 0.0257, "step": 289710 }, { "epoch": 1.87, "learning_rate": 1.95118015709611e-05, "loss": 0.0233, "step": 289720 }, { "epoch": 1.87, "learning_rate": 1.9502120216604165e-05, "loss": 0.0199, "step": 289730 }, { "epoch": 1.87, "learning_rate": 1.9492438862247235e-05, "loss": 0.0231, "step": 289740 }, { "epoch": 1.87, "learning_rate": 1.9482757507890305e-05, "loss": 0.022, "step": 289750 }, { "epoch": 1.87, "learning_rate": 1.9473076153533367e-05, "loss": 0.0244, "step": 289760 }, { "epoch": 1.87, "learning_rate": 1.9463394799176437e-05, "loss": 0.0311, "step": 289770 }, { "epoch": 1.87, "learning_rate": 1.9453713444819503e-05, "loss": 0.0241, "step": 289780 }, { "epoch": 1.87, "learning_rate": 1.9444032090462573e-05, "loss": 0.018, "step": 289790 }, { "epoch": 1.87, "learning_rate": 1.9434350736105643e-05, "loss": 0.0263, "step": 289800 }, { "epoch": 1.87, "learning_rate": 1.942466938174871e-05, "loss": 0.0224, "step": 289810 }, { "epoch": 1.87, "learning_rate": 1.941498802739178e-05, "loss": 0.0223, "step": 289820 }, { "epoch": 1.87, "learning_rate": 1.940530667303484e-05, "loss": 0.0227, "step": 289830 }, { "epoch": 1.87, "learning_rate": 1.939562531867791e-05, "loss": 0.0225, "step": 289840 }, { "epoch": 1.87, "learning_rate": 1.938594396432098e-05, "loss": 0.0198, "step": 289850 }, { "epoch": 1.87, "learning_rate": 1.9376262609964047e-05, "loss": 0.0203, "step": 289860 }, { "epoch": 1.87, "learning_rate": 1.9366581255607116e-05, "loss": 0.0211, "step": 289870 }, { "epoch": 1.87, "learning_rate": 1.9356899901250186e-05, "loss": 0.0211, "step": 289880 }, { "epoch": 1.87, "learning_rate": 1.9347218546893252e-05, "loss": 0.0212, "step": 289890 }, { "epoch": 1.87, "learning_rate": 1.933753719253632e-05, "loss": 0.0213, "step": 289900 }, { "epoch": 1.87, "learning_rate": 1.9327855838179385e-05, "loss": 0.02, "step": 289910 }, { "epoch": 1.87, "learning_rate": 1.9318174483822454e-05, "loss": 0.0233, "step": 289920 }, { "epoch": 1.87, "learning_rate": 1.9308493129465524e-05, "loss": 0.0196, "step": 289930 }, { "epoch": 1.87, "learning_rate": 1.929881177510859e-05, "loss": 0.0188, "step": 289940 }, { "epoch": 1.87, "learning_rate": 1.928913042075166e-05, "loss": 0.0233, "step": 289950 }, { "epoch": 1.87, "learning_rate": 1.927944906639473e-05, "loss": 0.0251, "step": 289960 }, { "epoch": 1.87, "learning_rate": 1.9269767712037792e-05, "loss": 0.0217, "step": 289970 }, { "epoch": 1.87, "learning_rate": 1.9260086357680862e-05, "loss": 0.0216, "step": 289980 }, { "epoch": 1.87, "learning_rate": 1.9250405003323928e-05, "loss": 0.0218, "step": 289990 }, { "epoch": 1.87, "learning_rate": 1.9240723648966998e-05, "loss": 0.0223, "step": 290000 }, { "epoch": 1.87, "eval_cer": 0.9198074793808609, "eval_loss": 0.016939295455813408, "eval_runtime": 120.1344, "eval_samples_per_second": 16.648, "eval_steps_per_second": 4.162, "step": 290000 }, { "epoch": 1.87, "learning_rate": 1.9231042294610068e-05, "loss": 0.0252, "step": 290010 }, { "epoch": 1.87, "learning_rate": 1.9221360940253134e-05, "loss": 0.024, "step": 290020 }, { "epoch": 1.87, "learning_rate": 1.9211679585896203e-05, "loss": 0.0221, "step": 290030 }, { "epoch": 1.87, "learning_rate": 1.9201998231539266e-05, "loss": 0.0208, "step": 290040 }, { "epoch": 1.87, "learning_rate": 1.9192316877182336e-05, "loss": 0.0196, "step": 290050 }, { "epoch": 1.87, "learning_rate": 1.9182635522825405e-05, "loss": 0.0239, "step": 290060 }, { "epoch": 1.87, "learning_rate": 1.9172954168468472e-05, "loss": 0.0235, "step": 290070 }, { "epoch": 1.87, "learning_rate": 1.916327281411154e-05, "loss": 0.0207, "step": 290080 }, { "epoch": 1.87, "learning_rate": 1.915359145975461e-05, "loss": 0.0335, "step": 290090 }, { "epoch": 1.87, "learning_rate": 1.9143910105397677e-05, "loss": 0.0246, "step": 290100 }, { "epoch": 1.87, "learning_rate": 1.9134228751040743e-05, "loss": 0.02, "step": 290110 }, { "epoch": 1.87, "learning_rate": 1.912454739668381e-05, "loss": 0.0226, "step": 290120 }, { "epoch": 1.87, "learning_rate": 1.911486604232688e-05, "loss": 0.0214, "step": 290130 }, { "epoch": 1.87, "learning_rate": 1.910518468796995e-05, "loss": 0.0305, "step": 290140 }, { "epoch": 1.87, "learning_rate": 1.9095503333613015e-05, "loss": 0.0202, "step": 290150 }, { "epoch": 1.87, "learning_rate": 1.9085821979256085e-05, "loss": 0.0238, "step": 290160 }, { "epoch": 1.87, "learning_rate": 1.907614062489915e-05, "loss": 0.0206, "step": 290170 }, { "epoch": 1.87, "learning_rate": 1.9066459270542217e-05, "loss": 0.0218, "step": 290180 }, { "epoch": 1.87, "learning_rate": 1.9056777916185287e-05, "loss": 0.0204, "step": 290190 }, { "epoch": 1.87, "learning_rate": 1.9047096561828353e-05, "loss": 0.0218, "step": 290200 }, { "epoch": 1.87, "learning_rate": 1.9037415207471423e-05, "loss": 0.0287, "step": 290210 }, { "epoch": 1.87, "learning_rate": 1.902773385311449e-05, "loss": 0.0244, "step": 290220 }, { "epoch": 1.87, "learning_rate": 1.901805249875756e-05, "loss": 0.0221, "step": 290230 }, { "epoch": 1.87, "learning_rate": 1.9008371144400628e-05, "loss": 0.0212, "step": 290240 }, { "epoch": 1.87, "learning_rate": 1.899868979004369e-05, "loss": 0.0191, "step": 290250 }, { "epoch": 1.87, "learning_rate": 1.898900843568676e-05, "loss": 0.0241, "step": 290260 }, { "epoch": 1.87, "learning_rate": 1.897932708132983e-05, "loss": 0.0223, "step": 290270 }, { "epoch": 1.87, "learning_rate": 1.8969645726972897e-05, "loss": 0.0229, "step": 290280 }, { "epoch": 1.87, "learning_rate": 1.8959964372615966e-05, "loss": 0.0231, "step": 290290 }, { "epoch": 1.87, "learning_rate": 1.8950283018259033e-05, "loss": 0.0277, "step": 290300 }, { "epoch": 1.87, "learning_rate": 1.8940601663902102e-05, "loss": 0.0234, "step": 290310 }, { "epoch": 1.87, "learning_rate": 1.893092030954517e-05, "loss": 0.0236, "step": 290320 }, { "epoch": 1.87, "learning_rate": 1.8921238955188235e-05, "loss": 0.0228, "step": 290330 }, { "epoch": 1.87, "learning_rate": 1.8911557600831304e-05, "loss": 0.0208, "step": 290340 }, { "epoch": 1.87, "learning_rate": 1.890187624647437e-05, "loss": 0.0192, "step": 290350 }, { "epoch": 1.87, "learning_rate": 1.889219489211744e-05, "loss": 0.0226, "step": 290360 }, { "epoch": 1.87, "learning_rate": 1.888251353776051e-05, "loss": 0.0238, "step": 290370 }, { "epoch": 1.87, "learning_rate": 1.8872832183403576e-05, "loss": 0.0235, "step": 290380 }, { "epoch": 1.87, "learning_rate": 1.8863150829046642e-05, "loss": 0.0231, "step": 290390 }, { "epoch": 1.87, "learning_rate": 1.885346947468971e-05, "loss": 0.0202, "step": 290400 }, { "epoch": 1.87, "learning_rate": 1.8843788120332778e-05, "loss": 0.0176, "step": 290410 }, { "epoch": 1.87, "learning_rate": 1.8834106765975848e-05, "loss": 0.0234, "step": 290420 }, { "epoch": 1.87, "learning_rate": 1.8824425411618914e-05, "loss": 0.0215, "step": 290430 }, { "epoch": 1.87, "learning_rate": 1.8814744057261984e-05, "loss": 0.022, "step": 290440 }, { "epoch": 1.87, "learning_rate": 1.8805062702905053e-05, "loss": 0.0198, "step": 290450 }, { "epoch": 1.87, "learning_rate": 1.8795381348548116e-05, "loss": 0.0241, "step": 290460 }, { "epoch": 1.87, "learning_rate": 1.8785699994191186e-05, "loss": 0.0208, "step": 290470 }, { "epoch": 1.87, "learning_rate": 1.8776018639834252e-05, "loss": 0.0211, "step": 290480 }, { "epoch": 1.87, "learning_rate": 1.876633728547732e-05, "loss": 0.0229, "step": 290490 }, { "epoch": 1.87, "learning_rate": 1.875665593112039e-05, "loss": 0.019, "step": 290500 }, { "epoch": 1.88, "learning_rate": 1.8746974576763457e-05, "loss": 0.0204, "step": 290510 }, { "epoch": 1.88, "learning_rate": 1.8737293222406524e-05, "loss": 0.0239, "step": 290520 }, { "epoch": 1.88, "learning_rate": 1.8727611868049593e-05, "loss": 0.0236, "step": 290530 }, { "epoch": 1.88, "learning_rate": 1.871793051369266e-05, "loss": 0.0248, "step": 290540 }, { "epoch": 1.88, "learning_rate": 1.870824915933573e-05, "loss": 0.0235, "step": 290550 }, { "epoch": 1.88, "learning_rate": 1.8698567804978795e-05, "loss": 0.0177, "step": 290560 }, { "epoch": 1.88, "learning_rate": 1.8688886450621865e-05, "loss": 0.02, "step": 290570 }, { "epoch": 1.88, "learning_rate": 1.867920509626493e-05, "loss": 0.0182, "step": 290580 }, { "epoch": 1.88, "learning_rate": 1.8669523741908e-05, "loss": 0.0205, "step": 290590 }, { "epoch": 1.88, "learning_rate": 1.8659842387551067e-05, "loss": 0.0241, "step": 290600 }, { "epoch": 1.88, "learning_rate": 1.8650161033194133e-05, "loss": 0.0256, "step": 290610 }, { "epoch": 1.88, "learning_rate": 1.8640479678837203e-05, "loss": 0.022, "step": 290620 }, { "epoch": 1.88, "learning_rate": 1.8630798324480273e-05, "loss": 0.0277, "step": 290630 }, { "epoch": 1.88, "learning_rate": 1.862111697012334e-05, "loss": 0.0281, "step": 290640 }, { "epoch": 1.88, "learning_rate": 1.8611435615766405e-05, "loss": 0.0182, "step": 290650 }, { "epoch": 1.88, "learning_rate": 1.8601754261409475e-05, "loss": 0.0224, "step": 290660 }, { "epoch": 1.88, "learning_rate": 1.8592072907052544e-05, "loss": 0.0209, "step": 290670 }, { "epoch": 1.88, "learning_rate": 1.858239155269561e-05, "loss": 0.0231, "step": 290680 }, { "epoch": 1.88, "learning_rate": 1.8572710198338677e-05, "loss": 0.0255, "step": 290690 }, { "epoch": 1.88, "learning_rate": 1.8563028843981746e-05, "loss": 0.0228, "step": 290700 }, { "epoch": 1.88, "learning_rate": 1.8553347489624816e-05, "loss": 0.0197, "step": 290710 }, { "epoch": 1.88, "learning_rate": 1.8543666135267882e-05, "loss": 0.0217, "step": 290720 }, { "epoch": 1.88, "learning_rate": 1.853398478091095e-05, "loss": 0.0223, "step": 290730 }, { "epoch": 1.88, "learning_rate": 1.8524303426554018e-05, "loss": 0.0221, "step": 290740 }, { "epoch": 1.88, "learning_rate": 1.8514622072197084e-05, "loss": 0.02, "step": 290750 }, { "epoch": 1.88, "learning_rate": 1.8504940717840154e-05, "loss": 0.0182, "step": 290760 }, { "epoch": 1.88, "learning_rate": 1.849525936348322e-05, "loss": 0.0221, "step": 290770 }, { "epoch": 1.88, "learning_rate": 1.8485578009126287e-05, "loss": 0.0244, "step": 290780 }, { "epoch": 1.88, "learning_rate": 1.8475896654769356e-05, "loss": 0.022, "step": 290790 }, { "epoch": 1.88, "learning_rate": 1.8466215300412426e-05, "loss": 0.023, "step": 290800 }, { "epoch": 1.88, "learning_rate": 1.8456533946055492e-05, "loss": 0.0209, "step": 290810 }, { "epoch": 1.88, "learning_rate": 1.8446852591698558e-05, "loss": 0.0258, "step": 290820 }, { "epoch": 1.88, "learning_rate": 1.8437171237341628e-05, "loss": 0.0182, "step": 290830 }, { "epoch": 1.88, "learning_rate": 1.8427489882984698e-05, "loss": 0.0242, "step": 290840 }, { "epoch": 1.88, "learning_rate": 1.8417808528627764e-05, "loss": 0.0195, "step": 290850 }, { "epoch": 1.88, "learning_rate": 1.840812717427083e-05, "loss": 0.0216, "step": 290860 }, { "epoch": 1.88, "learning_rate": 1.83984458199139e-05, "loss": 0.0207, "step": 290870 }, { "epoch": 1.88, "learning_rate": 1.838876446555697e-05, "loss": 0.0204, "step": 290880 }, { "epoch": 1.88, "learning_rate": 1.8379083111200035e-05, "loss": 0.027, "step": 290890 }, { "epoch": 1.88, "learning_rate": 1.8369401756843102e-05, "loss": 0.0213, "step": 290900 }, { "epoch": 1.88, "learning_rate": 1.835972040248617e-05, "loss": 0.0235, "step": 290910 }, { "epoch": 1.88, "learning_rate": 1.8350039048129238e-05, "loss": 0.0258, "step": 290920 }, { "epoch": 1.88, "learning_rate": 1.8340357693772307e-05, "loss": 0.0177, "step": 290930 }, { "epoch": 1.88, "learning_rate": 1.8330676339415373e-05, "loss": 0.021, "step": 290940 }, { "epoch": 1.88, "learning_rate": 1.8320994985058443e-05, "loss": 0.0202, "step": 290950 }, { "epoch": 1.88, "learning_rate": 1.831131363070151e-05, "loss": 0.0232, "step": 290960 }, { "epoch": 1.88, "learning_rate": 1.8301632276344576e-05, "loss": 0.0236, "step": 290970 }, { "epoch": 1.88, "learning_rate": 1.8291950921987645e-05, "loss": 0.0258, "step": 290980 }, { "epoch": 1.88, "learning_rate": 1.828226956763071e-05, "loss": 0.021, "step": 290990 }, { "epoch": 1.88, "learning_rate": 1.827258821327378e-05, "loss": 0.0231, "step": 291000 }, { "epoch": 1.88, "eval_cer": 0.9198291718449892, "eval_loss": 0.016914011910557747, "eval_runtime": 120.5766, "eval_samples_per_second": 16.587, "eval_steps_per_second": 4.147, "step": 291000 }, { "epoch": 1.88, "learning_rate": 1.8262906858916847e-05, "loss": 0.0221, "step": 291010 }, { "epoch": 1.88, "learning_rate": 1.8253225504559917e-05, "loss": 0.0218, "step": 291020 }, { "epoch": 1.88, "learning_rate": 1.8243544150202983e-05, "loss": 0.0275, "step": 291030 }, { "epoch": 1.88, "learning_rate": 1.8233862795846053e-05, "loss": 0.0208, "step": 291040 }, { "epoch": 1.88, "learning_rate": 1.822418144148912e-05, "loss": 0.0234, "step": 291050 }, { "epoch": 1.88, "learning_rate": 1.8214500087132185e-05, "loss": 0.0262, "step": 291060 }, { "epoch": 1.88, "learning_rate": 1.8204818732775255e-05, "loss": 0.0214, "step": 291070 }, { "epoch": 1.88, "learning_rate": 1.8195137378418325e-05, "loss": 0.0214, "step": 291080 }, { "epoch": 1.88, "learning_rate": 1.818545602406139e-05, "loss": 0.0212, "step": 291090 }, { "epoch": 1.88, "learning_rate": 1.8175774669704457e-05, "loss": 0.0226, "step": 291100 }, { "epoch": 1.88, "learning_rate": 1.8166093315347527e-05, "loss": 0.0231, "step": 291110 }, { "epoch": 1.88, "learning_rate": 1.8156411960990596e-05, "loss": 0.0205, "step": 291120 }, { "epoch": 1.88, "learning_rate": 1.8146730606633662e-05, "loss": 0.0175, "step": 291130 }, { "epoch": 1.88, "learning_rate": 1.813704925227673e-05, "loss": 0.0187, "step": 291140 }, { "epoch": 1.88, "learning_rate": 1.81273678979198e-05, "loss": 0.0214, "step": 291150 }, { "epoch": 1.88, "learning_rate": 1.8117686543562865e-05, "loss": 0.0301, "step": 291160 }, { "epoch": 1.88, "learning_rate": 1.8108005189205934e-05, "loss": 0.0205, "step": 291170 }, { "epoch": 1.88, "learning_rate": 1.8098323834849e-05, "loss": 0.0218, "step": 291180 }, { "epoch": 1.88, "learning_rate": 1.808864248049207e-05, "loss": 0.0232, "step": 291190 }, { "epoch": 1.88, "learning_rate": 1.8078961126135136e-05, "loss": 0.0231, "step": 291200 }, { "epoch": 1.88, "learning_rate": 1.8069279771778206e-05, "loss": 0.0223, "step": 291210 }, { "epoch": 1.88, "learning_rate": 1.8059598417421272e-05, "loss": 0.0192, "step": 291220 }, { "epoch": 1.88, "learning_rate": 1.804991706306434e-05, "loss": 0.0222, "step": 291230 }, { "epoch": 1.88, "learning_rate": 1.8040235708707408e-05, "loss": 0.0244, "step": 291240 }, { "epoch": 1.88, "learning_rate": 1.8030554354350478e-05, "loss": 0.0249, "step": 291250 }, { "epoch": 1.88, "learning_rate": 1.8020872999993544e-05, "loss": 0.025, "step": 291260 }, { "epoch": 1.88, "learning_rate": 1.801119164563661e-05, "loss": 0.0236, "step": 291270 }, { "epoch": 1.88, "learning_rate": 1.800151029127968e-05, "loss": 0.0252, "step": 291280 }, { "epoch": 1.88, "learning_rate": 1.799182893692275e-05, "loss": 0.0231, "step": 291290 }, { "epoch": 1.88, "learning_rate": 1.7982147582565816e-05, "loss": 0.0224, "step": 291300 }, { "epoch": 1.88, "learning_rate": 1.7972466228208882e-05, "loss": 0.02, "step": 291310 }, { "epoch": 1.88, "learning_rate": 1.796278487385195e-05, "loss": 0.0217, "step": 291320 }, { "epoch": 1.88, "learning_rate": 1.795310351949502e-05, "loss": 0.023, "step": 291330 }, { "epoch": 1.88, "learning_rate": 1.7943422165138087e-05, "loss": 0.0226, "step": 291340 }, { "epoch": 1.88, "learning_rate": 1.7933740810781154e-05, "loss": 0.0245, "step": 291350 }, { "epoch": 1.88, "learning_rate": 1.7924059456424223e-05, "loss": 0.0219, "step": 291360 }, { "epoch": 1.88, "learning_rate": 1.791437810206729e-05, "loss": 0.02, "step": 291370 }, { "epoch": 1.88, "learning_rate": 1.790469674771036e-05, "loss": 0.0229, "step": 291380 }, { "epoch": 1.88, "learning_rate": 1.7895015393353425e-05, "loss": 0.0232, "step": 291390 }, { "epoch": 1.88, "learning_rate": 1.7885334038996495e-05, "loss": 0.0195, "step": 291400 }, { "epoch": 1.88, "learning_rate": 1.787565268463956e-05, "loss": 0.0195, "step": 291410 }, { "epoch": 1.88, "learning_rate": 1.786597133028263e-05, "loss": 0.0249, "step": 291420 }, { "epoch": 1.88, "learning_rate": 1.7856289975925697e-05, "loss": 0.0205, "step": 291430 }, { "epoch": 1.88, "learning_rate": 1.7846608621568763e-05, "loss": 0.0301, "step": 291440 }, { "epoch": 1.88, "learning_rate": 1.7836927267211833e-05, "loss": 0.0204, "step": 291450 }, { "epoch": 1.88, "learning_rate": 1.7827245912854903e-05, "loss": 0.022, "step": 291460 }, { "epoch": 1.88, "learning_rate": 1.781756455849797e-05, "loss": 0.0185, "step": 291470 }, { "epoch": 1.88, "learning_rate": 1.7807883204141035e-05, "loss": 0.0218, "step": 291480 }, { "epoch": 1.88, "learning_rate": 1.7798201849784105e-05, "loss": 0.0242, "step": 291490 }, { "epoch": 1.88, "learning_rate": 1.7788520495427174e-05, "loss": 0.0188, "step": 291500 }, { "epoch": 1.88, "learning_rate": 1.777883914107024e-05, "loss": 0.0219, "step": 291510 }, { "epoch": 1.88, "learning_rate": 1.7769157786713307e-05, "loss": 0.0258, "step": 291520 }, { "epoch": 1.88, "learning_rate": 1.7759476432356376e-05, "loss": 0.0245, "step": 291530 }, { "epoch": 1.88, "learning_rate": 1.7749795077999446e-05, "loss": 0.0197, "step": 291540 }, { "epoch": 1.88, "learning_rate": 1.7740113723642512e-05, "loss": 0.0312, "step": 291550 }, { "epoch": 1.88, "learning_rate": 1.773043236928558e-05, "loss": 0.025, "step": 291560 }, { "epoch": 1.88, "learning_rate": 1.7720751014928648e-05, "loss": 0.0228, "step": 291570 }, { "epoch": 1.88, "learning_rate": 1.7711069660571714e-05, "loss": 0.0267, "step": 291580 }, { "epoch": 1.88, "learning_rate": 1.7701388306214784e-05, "loss": 0.0192, "step": 291590 }, { "epoch": 1.88, "learning_rate": 1.769170695185785e-05, "loss": 0.02, "step": 291600 }, { "epoch": 1.88, "learning_rate": 1.7682025597500917e-05, "loss": 0.0262, "step": 291610 }, { "epoch": 1.88, "learning_rate": 1.7672344243143986e-05, "loss": 0.0211, "step": 291620 }, { "epoch": 1.88, "learning_rate": 1.7662662888787052e-05, "loss": 0.0233, "step": 291630 }, { "epoch": 1.88, "learning_rate": 1.7652981534430122e-05, "loss": 0.022, "step": 291640 }, { "epoch": 1.88, "learning_rate": 1.7643300180073188e-05, "loss": 0.0266, "step": 291650 }, { "epoch": 1.88, "learning_rate": 1.7633618825716258e-05, "loss": 0.0226, "step": 291660 }, { "epoch": 1.88, "learning_rate": 1.7623937471359324e-05, "loss": 0.0204, "step": 291670 }, { "epoch": 1.88, "learning_rate": 1.761425611700239e-05, "loss": 0.0186, "step": 291680 }, { "epoch": 1.88, "learning_rate": 1.760457476264546e-05, "loss": 0.0196, "step": 291690 }, { "epoch": 1.88, "learning_rate": 1.759489340828853e-05, "loss": 0.0207, "step": 291700 }, { "epoch": 1.88, "learning_rate": 1.7585212053931596e-05, "loss": 0.0231, "step": 291710 }, { "epoch": 1.88, "learning_rate": 1.7575530699574662e-05, "loss": 0.0234, "step": 291720 }, { "epoch": 1.88, "learning_rate": 1.7565849345217732e-05, "loss": 0.0224, "step": 291730 }, { "epoch": 1.88, "learning_rate": 1.75561679908608e-05, "loss": 0.0222, "step": 291740 }, { "epoch": 1.88, "learning_rate": 1.7546486636503868e-05, "loss": 0.0217, "step": 291750 }, { "epoch": 1.88, "learning_rate": 1.7536805282146934e-05, "loss": 0.0236, "step": 291760 }, { "epoch": 1.88, "learning_rate": 1.7527123927790003e-05, "loss": 0.0234, "step": 291770 }, { "epoch": 1.88, "learning_rate": 1.7517442573433073e-05, "loss": 0.0246, "step": 291780 }, { "epoch": 1.88, "learning_rate": 1.750776121907614e-05, "loss": 0.0211, "step": 291790 }, { "epoch": 1.88, "learning_rate": 1.7498079864719206e-05, "loss": 0.0225, "step": 291800 }, { "epoch": 1.88, "learning_rate": 1.7488398510362275e-05, "loss": 0.0218, "step": 291810 }, { "epoch": 1.88, "learning_rate": 1.747871715600534e-05, "loss": 0.0218, "step": 291820 }, { "epoch": 1.88, "learning_rate": 1.746903580164841e-05, "loss": 0.0263, "step": 291830 }, { "epoch": 1.88, "learning_rate": 1.7459354447291477e-05, "loss": 0.0238, "step": 291840 }, { "epoch": 1.88, "learning_rate": 1.7449673092934547e-05, "loss": 0.0208, "step": 291850 }, { "epoch": 1.88, "learning_rate": 1.7439991738577613e-05, "loss": 0.0227, "step": 291860 }, { "epoch": 1.88, "learning_rate": 1.7430310384220683e-05, "loss": 0.0197, "step": 291870 }, { "epoch": 1.88, "learning_rate": 1.742062902986375e-05, "loss": 0.0226, "step": 291880 }, { "epoch": 1.88, "learning_rate": 1.7410947675506815e-05, "loss": 0.0227, "step": 291890 }, { "epoch": 1.88, "learning_rate": 1.7401266321149885e-05, "loss": 0.02, "step": 291900 }, { "epoch": 1.88, "learning_rate": 1.7391584966792955e-05, "loss": 0.0197, "step": 291910 }, { "epoch": 1.88, "learning_rate": 1.738190361243602e-05, "loss": 0.0228, "step": 291920 }, { "epoch": 1.88, "learning_rate": 1.7372222258079087e-05, "loss": 0.0196, "step": 291930 }, { "epoch": 1.88, "learning_rate": 1.7362540903722157e-05, "loss": 0.0305, "step": 291940 }, { "epoch": 1.88, "learning_rate": 1.7352859549365226e-05, "loss": 0.0226, "step": 291950 }, { "epoch": 1.88, "learning_rate": 1.7343178195008292e-05, "loss": 0.0262, "step": 291960 }, { "epoch": 1.88, "learning_rate": 1.733349684065136e-05, "loss": 0.0228, "step": 291970 }, { "epoch": 1.88, "learning_rate": 1.732381548629443e-05, "loss": 0.019, "step": 291980 }, { "epoch": 1.88, "learning_rate": 1.7314134131937498e-05, "loss": 0.0169, "step": 291990 }, { "epoch": 1.88, "learning_rate": 1.7304452777580564e-05, "loss": 0.0192, "step": 292000 }, { "epoch": 1.88, "eval_cer": 0.9198345949610214, "eval_loss": 0.01690409518778324, "eval_runtime": 120.2396, "eval_samples_per_second": 16.633, "eval_steps_per_second": 4.158, "step": 292000 }, { "epoch": 1.88, "learning_rate": 1.729477142322363e-05, "loss": 0.0219, "step": 292010 }, { "epoch": 1.88, "learning_rate": 1.72850900688667e-05, "loss": 0.0224, "step": 292020 }, { "epoch": 1.88, "learning_rate": 1.7275408714509766e-05, "loss": 0.0229, "step": 292030 }, { "epoch": 1.88, "learning_rate": 1.7265727360152836e-05, "loss": 0.0231, "step": 292040 }, { "epoch": 1.88, "learning_rate": 1.7256046005795902e-05, "loss": 0.0235, "step": 292050 }, { "epoch": 1.89, "learning_rate": 1.724636465143897e-05, "loss": 0.0221, "step": 292060 }, { "epoch": 1.89, "learning_rate": 1.7236683297082038e-05, "loss": 0.0217, "step": 292070 }, { "epoch": 1.89, "learning_rate": 1.7227001942725108e-05, "loss": 0.0217, "step": 292080 }, { "epoch": 1.89, "learning_rate": 1.7217320588368174e-05, "loss": 0.0216, "step": 292090 }, { "epoch": 1.89, "learning_rate": 1.720763923401124e-05, "loss": 0.0216, "step": 292100 }, { "epoch": 1.89, "learning_rate": 1.719795787965431e-05, "loss": 0.0228, "step": 292110 }, { "epoch": 1.89, "learning_rate": 1.718827652529738e-05, "loss": 0.0252, "step": 292120 }, { "epoch": 1.89, "learning_rate": 1.7178595170940446e-05, "loss": 0.0258, "step": 292130 }, { "epoch": 1.89, "learning_rate": 1.7168913816583512e-05, "loss": 0.0255, "step": 292140 }, { "epoch": 1.89, "learning_rate": 1.715923246222658e-05, "loss": 0.0225, "step": 292150 }, { "epoch": 1.89, "learning_rate": 1.714955110786965e-05, "loss": 0.0255, "step": 292160 }, { "epoch": 1.89, "learning_rate": 1.7139869753512717e-05, "loss": 0.0241, "step": 292170 }, { "epoch": 1.89, "learning_rate": 1.7130188399155784e-05, "loss": 0.0283, "step": 292180 }, { "epoch": 1.89, "learning_rate": 1.7120507044798853e-05, "loss": 0.0222, "step": 292190 }, { "epoch": 1.89, "learning_rate": 1.711082569044192e-05, "loss": 0.0243, "step": 292200 }, { "epoch": 1.89, "learning_rate": 1.710114433608499e-05, "loss": 0.0226, "step": 292210 }, { "epoch": 1.89, "learning_rate": 1.7091462981728055e-05, "loss": 0.0197, "step": 292220 }, { "epoch": 1.89, "learning_rate": 1.7081781627371125e-05, "loss": 0.022, "step": 292230 }, { "epoch": 1.89, "learning_rate": 1.707210027301419e-05, "loss": 0.0167, "step": 292240 }, { "epoch": 1.89, "learning_rate": 1.706241891865726e-05, "loss": 0.0205, "step": 292250 }, { "epoch": 1.89, "learning_rate": 1.7052737564300327e-05, "loss": 0.0208, "step": 292260 }, { "epoch": 1.89, "learning_rate": 1.7043056209943393e-05, "loss": 0.019, "step": 292270 }, { "epoch": 1.89, "learning_rate": 1.7033374855586463e-05, "loss": 0.0225, "step": 292280 }, { "epoch": 1.89, "learning_rate": 1.702369350122953e-05, "loss": 0.0237, "step": 292290 }, { "epoch": 1.89, "learning_rate": 1.70140121468726e-05, "loss": 0.0204, "step": 292300 }, { "epoch": 1.89, "learning_rate": 1.7004330792515665e-05, "loss": 0.0222, "step": 292310 }, { "epoch": 1.89, "learning_rate": 1.6994649438158735e-05, "loss": 0.0252, "step": 292320 }, { "epoch": 1.89, "learning_rate": 1.69849680838018e-05, "loss": 0.0239, "step": 292330 }, { "epoch": 1.89, "learning_rate": 1.6975286729444867e-05, "loss": 0.0229, "step": 292340 }, { "epoch": 1.89, "learning_rate": 1.6965605375087937e-05, "loss": 0.021, "step": 292350 }, { "epoch": 1.89, "learning_rate": 1.6955924020731006e-05, "loss": 0.0234, "step": 292360 }, { "epoch": 1.89, "learning_rate": 1.6946242666374073e-05, "loss": 0.0185, "step": 292370 }, { "epoch": 1.89, "learning_rate": 1.693656131201714e-05, "loss": 0.023, "step": 292380 }, { "epoch": 1.89, "learning_rate": 1.692687995766021e-05, "loss": 0.0236, "step": 292390 }, { "epoch": 1.89, "learning_rate": 1.6917198603303278e-05, "loss": 0.0242, "step": 292400 }, { "epoch": 1.89, "learning_rate": 1.6907517248946344e-05, "loss": 0.0273, "step": 292410 }, { "epoch": 1.89, "learning_rate": 1.689783589458941e-05, "loss": 0.0243, "step": 292420 }, { "epoch": 1.89, "learning_rate": 1.688815454023248e-05, "loss": 0.0195, "step": 292430 }, { "epoch": 1.89, "learning_rate": 1.687847318587555e-05, "loss": 0.0225, "step": 292440 }, { "epoch": 1.89, "learning_rate": 1.6868791831518616e-05, "loss": 0.0189, "step": 292450 }, { "epoch": 1.89, "learning_rate": 1.6859110477161682e-05, "loss": 0.0217, "step": 292460 }, { "epoch": 1.89, "learning_rate": 1.6849429122804752e-05, "loss": 0.0281, "step": 292470 }, { "epoch": 1.89, "learning_rate": 1.6839747768447818e-05, "loss": 0.0225, "step": 292480 }, { "epoch": 1.89, "learning_rate": 1.6830066414090888e-05, "loss": 0.0193, "step": 292490 }, { "epoch": 1.89, "learning_rate": 1.6820385059733954e-05, "loss": 0.0259, "step": 292500 }, { "epoch": 1.89, "learning_rate": 1.681070370537702e-05, "loss": 0.0189, "step": 292510 }, { "epoch": 1.89, "learning_rate": 1.680102235102009e-05, "loss": 0.0206, "step": 292520 }, { "epoch": 1.89, "learning_rate": 1.679134099666316e-05, "loss": 0.0258, "step": 292530 }, { "epoch": 1.89, "learning_rate": 1.6781659642306226e-05, "loss": 0.0309, "step": 292540 }, { "epoch": 1.89, "learning_rate": 1.6771978287949292e-05, "loss": 0.0184, "step": 292550 }, { "epoch": 1.89, "learning_rate": 1.676229693359236e-05, "loss": 0.0247, "step": 292560 }, { "epoch": 1.89, "learning_rate": 1.675261557923543e-05, "loss": 0.0216, "step": 292570 }, { "epoch": 1.89, "learning_rate": 1.6742934224878498e-05, "loss": 0.0179, "step": 292580 }, { "epoch": 1.89, "learning_rate": 1.6733252870521564e-05, "loss": 0.0235, "step": 292590 }, { "epoch": 1.89, "learning_rate": 1.6723571516164633e-05, "loss": 0.0218, "step": 292600 }, { "epoch": 1.89, "learning_rate": 1.6713890161807703e-05, "loss": 0.0275, "step": 292610 }, { "epoch": 1.89, "learning_rate": 1.670420880745077e-05, "loss": 0.0226, "step": 292620 }, { "epoch": 1.89, "learning_rate": 1.6694527453093836e-05, "loss": 0.0291, "step": 292630 }, { "epoch": 1.89, "learning_rate": 1.6684846098736905e-05, "loss": 0.0243, "step": 292640 }, { "epoch": 1.89, "learning_rate": 1.667516474437997e-05, "loss": 0.0203, "step": 292650 }, { "epoch": 1.89, "learning_rate": 1.666548339002304e-05, "loss": 0.0216, "step": 292660 }, { "epoch": 1.89, "learning_rate": 1.6655802035666107e-05, "loss": 0.0224, "step": 292670 }, { "epoch": 1.89, "learning_rate": 1.6646120681309177e-05, "loss": 0.0223, "step": 292680 }, { "epoch": 1.89, "learning_rate": 1.6636439326952243e-05, "loss": 0.0197, "step": 292690 }, { "epoch": 1.89, "learning_rate": 1.6626757972595313e-05, "loss": 0.0218, "step": 292700 }, { "epoch": 1.89, "learning_rate": 1.661707661823838e-05, "loss": 0.0226, "step": 292710 }, { "epoch": 1.89, "learning_rate": 1.6607395263881445e-05, "loss": 0.0236, "step": 292720 }, { "epoch": 1.89, "learning_rate": 1.6597713909524515e-05, "loss": 0.0232, "step": 292730 }, { "epoch": 1.89, "learning_rate": 1.6588032555167584e-05, "loss": 0.0233, "step": 292740 }, { "epoch": 1.89, "learning_rate": 1.657835120081065e-05, "loss": 0.0216, "step": 292750 }, { "epoch": 1.89, "learning_rate": 1.6568669846453717e-05, "loss": 0.0201, "step": 292760 }, { "epoch": 1.89, "learning_rate": 1.6558988492096787e-05, "loss": 0.0237, "step": 292770 }, { "epoch": 1.89, "learning_rate": 1.6549307137739856e-05, "loss": 0.0207, "step": 292780 }, { "epoch": 1.89, "learning_rate": 1.6539625783382922e-05, "loss": 0.0222, "step": 292790 }, { "epoch": 1.89, "learning_rate": 1.652994442902599e-05, "loss": 0.0226, "step": 292800 }, { "epoch": 1.89, "learning_rate": 1.652026307466906e-05, "loss": 0.0219, "step": 292810 }, { "epoch": 1.89, "learning_rate": 1.6510581720312128e-05, "loss": 0.0214, "step": 292820 }, { "epoch": 1.89, "learning_rate": 1.6500900365955194e-05, "loss": 0.0205, "step": 292830 }, { "epoch": 1.89, "learning_rate": 1.649121901159826e-05, "loss": 0.0238, "step": 292840 }, { "epoch": 1.89, "learning_rate": 1.648153765724133e-05, "loss": 0.0241, "step": 292850 }, { "epoch": 1.89, "learning_rate": 1.6471856302884396e-05, "loss": 0.0263, "step": 292860 }, { "epoch": 1.89, "learning_rate": 1.6462174948527466e-05, "loss": 0.0307, "step": 292870 }, { "epoch": 1.89, "learning_rate": 1.6452493594170532e-05, "loss": 0.0255, "step": 292880 }, { "epoch": 1.89, "learning_rate": 1.64428122398136e-05, "loss": 0.0218, "step": 292890 }, { "epoch": 1.89, "learning_rate": 1.6433130885456668e-05, "loss": 0.0259, "step": 292900 }, { "epoch": 1.89, "learning_rate": 1.6423449531099738e-05, "loss": 0.025, "step": 292910 }, { "epoch": 1.89, "learning_rate": 1.6413768176742804e-05, "loss": 0.0252, "step": 292920 }, { "epoch": 1.89, "learning_rate": 1.640408682238587e-05, "loss": 0.0252, "step": 292930 }, { "epoch": 1.89, "learning_rate": 1.639440546802894e-05, "loss": 0.0204, "step": 292940 }, { "epoch": 1.89, "learning_rate": 1.6384724113672006e-05, "loss": 0.0245, "step": 292950 }, { "epoch": 1.89, "learning_rate": 1.6375042759315076e-05, "loss": 0.02, "step": 292960 }, { "epoch": 1.89, "learning_rate": 1.6365361404958142e-05, "loss": 0.0262, "step": 292970 }, { "epoch": 1.89, "learning_rate": 1.635568005060121e-05, "loss": 0.0235, "step": 292980 }, { "epoch": 1.89, "learning_rate": 1.6345998696244278e-05, "loss": 0.0216, "step": 292990 }, { "epoch": 1.89, "learning_rate": 1.6336317341887347e-05, "loss": 0.0234, "step": 293000 }, { "epoch": 1.89, "eval_cer": 0.9198382103717094, "eval_loss": 0.016830649226903915, "eval_runtime": 120.2142, "eval_samples_per_second": 16.637, "eval_steps_per_second": 4.159, "step": 293000 }, { "epoch": 1.89, "learning_rate": 1.6326635987530414e-05, "loss": 0.0237, "step": 293010 }, { "epoch": 1.89, "learning_rate": 1.6316954633173483e-05, "loss": 0.0241, "step": 293020 }, { "epoch": 1.89, "learning_rate": 1.630727327881655e-05, "loss": 0.0203, "step": 293030 }, { "epoch": 1.89, "learning_rate": 1.6297591924459616e-05, "loss": 0.0252, "step": 293040 }, { "epoch": 1.89, "learning_rate": 1.6287910570102685e-05, "loss": 0.0223, "step": 293050 }, { "epoch": 1.89, "learning_rate": 1.6278229215745755e-05, "loss": 0.026, "step": 293060 }, { "epoch": 1.89, "learning_rate": 1.626854786138882e-05, "loss": 0.0253, "step": 293070 }, { "epoch": 1.89, "learning_rate": 1.6258866507031887e-05, "loss": 0.0222, "step": 293080 }, { "epoch": 1.89, "learning_rate": 1.6249185152674957e-05, "loss": 0.0234, "step": 293090 }, { "epoch": 1.89, "learning_rate": 1.6239503798318023e-05, "loss": 0.0179, "step": 293100 }, { "epoch": 1.89, "learning_rate": 1.6229822443961093e-05, "loss": 0.0227, "step": 293110 }, { "epoch": 1.89, "learning_rate": 1.622014108960416e-05, "loss": 0.0272, "step": 293120 }, { "epoch": 1.89, "learning_rate": 1.621045973524723e-05, "loss": 0.024, "step": 293130 }, { "epoch": 1.89, "learning_rate": 1.6200778380890295e-05, "loss": 0.0248, "step": 293140 }, { "epoch": 1.89, "learning_rate": 1.6191097026533365e-05, "loss": 0.0212, "step": 293150 }, { "epoch": 1.89, "learning_rate": 1.618141567217643e-05, "loss": 0.0258, "step": 293160 }, { "epoch": 1.89, "learning_rate": 1.6171734317819497e-05, "loss": 0.0189, "step": 293170 }, { "epoch": 1.89, "learning_rate": 1.6162052963462567e-05, "loss": 0.0211, "step": 293180 }, { "epoch": 1.89, "learning_rate": 1.6152371609105636e-05, "loss": 0.0191, "step": 293190 }, { "epoch": 1.89, "learning_rate": 1.6142690254748703e-05, "loss": 0.0212, "step": 293200 }, { "epoch": 1.89, "learning_rate": 1.613300890039177e-05, "loss": 0.0229, "step": 293210 }, { "epoch": 1.89, "learning_rate": 1.612332754603484e-05, "loss": 0.0219, "step": 293220 }, { "epoch": 1.89, "learning_rate": 1.6113646191677908e-05, "loss": 0.0245, "step": 293230 }, { "epoch": 1.89, "learning_rate": 1.6103964837320974e-05, "loss": 0.0209, "step": 293240 }, { "epoch": 1.89, "learning_rate": 1.609428348296404e-05, "loss": 0.0208, "step": 293250 }, { "epoch": 1.89, "learning_rate": 1.608460212860711e-05, "loss": 0.0193, "step": 293260 }, { "epoch": 1.89, "learning_rate": 1.607492077425018e-05, "loss": 0.0222, "step": 293270 }, { "epoch": 1.89, "learning_rate": 1.6065239419893246e-05, "loss": 0.0241, "step": 293280 }, { "epoch": 1.89, "learning_rate": 1.6055558065536312e-05, "loss": 0.0228, "step": 293290 }, { "epoch": 1.89, "learning_rate": 1.6045876711179382e-05, "loss": 0.0193, "step": 293300 }, { "epoch": 1.89, "learning_rate": 1.6036195356822448e-05, "loss": 0.0253, "step": 293310 }, { "epoch": 1.89, "learning_rate": 1.6026514002465518e-05, "loss": 0.0223, "step": 293320 }, { "epoch": 1.89, "learning_rate": 1.6016832648108584e-05, "loss": 0.0215, "step": 293330 }, { "epoch": 1.89, "learning_rate": 1.600715129375165e-05, "loss": 0.0196, "step": 293340 }, { "epoch": 1.89, "learning_rate": 1.599746993939472e-05, "loss": 0.0208, "step": 293350 }, { "epoch": 1.89, "learning_rate": 1.598778858503779e-05, "loss": 0.0238, "step": 293360 }, { "epoch": 1.89, "learning_rate": 1.5978107230680856e-05, "loss": 0.0196, "step": 293370 }, { "epoch": 1.89, "learning_rate": 1.5968425876323922e-05, "loss": 0.0238, "step": 293380 }, { "epoch": 1.89, "learning_rate": 1.595874452196699e-05, "loss": 0.0254, "step": 293390 }, { "epoch": 1.89, "learning_rate": 1.594906316761006e-05, "loss": 0.0292, "step": 293400 }, { "epoch": 1.89, "learning_rate": 1.5939381813253128e-05, "loss": 0.0249, "step": 293410 }, { "epoch": 1.89, "learning_rate": 1.5929700458896194e-05, "loss": 0.0204, "step": 293420 }, { "epoch": 1.89, "learning_rate": 1.5920019104539263e-05, "loss": 0.0236, "step": 293430 }, { "epoch": 1.89, "learning_rate": 1.5910337750182333e-05, "loss": 0.0198, "step": 293440 }, { "epoch": 1.89, "learning_rate": 1.59006563958254e-05, "loss": 0.0239, "step": 293450 }, { "epoch": 1.89, "learning_rate": 1.5890975041468466e-05, "loss": 0.0229, "step": 293460 }, { "epoch": 1.89, "learning_rate": 1.5881293687111535e-05, "loss": 0.0193, "step": 293470 }, { "epoch": 1.89, "learning_rate": 1.58716123327546e-05, "loss": 0.0259, "step": 293480 }, { "epoch": 1.89, "learning_rate": 1.586193097839767e-05, "loss": 0.0209, "step": 293490 }, { "epoch": 1.89, "learning_rate": 1.5852249624040737e-05, "loss": 0.0298, "step": 293500 }, { "epoch": 1.89, "learning_rate": 1.5842568269683807e-05, "loss": 0.0224, "step": 293510 }, { "epoch": 1.89, "learning_rate": 1.5832886915326873e-05, "loss": 0.0244, "step": 293520 }, { "epoch": 1.89, "learning_rate": 1.5823205560969943e-05, "loss": 0.0243, "step": 293530 }, { "epoch": 1.89, "learning_rate": 1.581352420661301e-05, "loss": 0.0213, "step": 293540 }, { "epoch": 1.89, "learning_rate": 1.5803842852256075e-05, "loss": 0.023, "step": 293550 }, { "epoch": 1.89, "learning_rate": 1.5794161497899145e-05, "loss": 0.0209, "step": 293560 }, { "epoch": 1.89, "learning_rate": 1.5784480143542214e-05, "loss": 0.0246, "step": 293570 }, { "epoch": 1.89, "learning_rate": 1.577479878918528e-05, "loss": 0.0198, "step": 293580 }, { "epoch": 1.89, "learning_rate": 1.5765117434828347e-05, "loss": 0.0204, "step": 293590 }, { "epoch": 1.89, "learning_rate": 1.5755436080471417e-05, "loss": 0.0205, "step": 293600 }, { "epoch": 1.9, "learning_rate": 1.5745754726114486e-05, "loss": 0.0215, "step": 293610 }, { "epoch": 1.9, "learning_rate": 1.5736073371757552e-05, "loss": 0.025, "step": 293620 }, { "epoch": 1.9, "learning_rate": 1.572639201740062e-05, "loss": 0.024, "step": 293630 }, { "epoch": 1.9, "learning_rate": 1.571671066304369e-05, "loss": 0.0229, "step": 293640 }, { "epoch": 1.9, "learning_rate": 1.5707029308686755e-05, "loss": 0.0253, "step": 293650 }, { "epoch": 1.9, "learning_rate": 1.5697347954329824e-05, "loss": 0.0234, "step": 293660 }, { "epoch": 1.9, "learning_rate": 1.568766659997289e-05, "loss": 0.0248, "step": 293670 }, { "epoch": 1.9, "learning_rate": 1.567798524561596e-05, "loss": 0.0159, "step": 293680 }, { "epoch": 1.9, "learning_rate": 1.5668303891259026e-05, "loss": 0.0213, "step": 293690 }, { "epoch": 1.9, "learning_rate": 1.5658622536902093e-05, "loss": 0.0265, "step": 293700 }, { "epoch": 1.9, "learning_rate": 1.5648941182545162e-05, "loss": 0.0239, "step": 293710 }, { "epoch": 1.9, "learning_rate": 1.5639259828188232e-05, "loss": 0.0218, "step": 293720 }, { "epoch": 1.9, "learning_rate": 1.5629578473831298e-05, "loss": 0.0185, "step": 293730 }, { "epoch": 1.9, "learning_rate": 1.5619897119474364e-05, "loss": 0.0259, "step": 293740 }, { "epoch": 1.9, "learning_rate": 1.5610215765117434e-05, "loss": 0.0274, "step": 293750 }, { "epoch": 1.9, "learning_rate": 1.56005344107605e-05, "loss": 0.0227, "step": 293760 }, { "epoch": 1.9, "learning_rate": 1.559085305640357e-05, "loss": 0.0248, "step": 293770 }, { "epoch": 1.9, "learning_rate": 1.5581171702046636e-05, "loss": 0.0241, "step": 293780 }, { "epoch": 1.9, "learning_rate": 1.5571490347689702e-05, "loss": 0.0255, "step": 293790 }, { "epoch": 1.9, "learning_rate": 1.5561808993332772e-05, "loss": 0.0191, "step": 293800 }, { "epoch": 1.9, "learning_rate": 1.555212763897584e-05, "loss": 0.0205, "step": 293810 }, { "epoch": 1.9, "learning_rate": 1.5542446284618908e-05, "loss": 0.0229, "step": 293820 }, { "epoch": 1.9, "learning_rate": 1.5532764930261974e-05, "loss": 0.0263, "step": 293830 }, { "epoch": 1.9, "learning_rate": 1.5523083575905044e-05, "loss": 0.0233, "step": 293840 }, { "epoch": 1.9, "learning_rate": 1.5513402221548113e-05, "loss": 0.0235, "step": 293850 }, { "epoch": 1.9, "learning_rate": 1.550372086719118e-05, "loss": 0.0222, "step": 293860 }, { "epoch": 1.9, "learning_rate": 1.5494039512834246e-05, "loss": 0.0243, "step": 293870 }, { "epoch": 1.9, "learning_rate": 1.5484358158477315e-05, "loss": 0.0223, "step": 293880 }, { "epoch": 1.9, "learning_rate": 1.5474676804120385e-05, "loss": 0.0273, "step": 293890 }, { "epoch": 1.9, "learning_rate": 1.546499544976345e-05, "loss": 0.0209, "step": 293900 }, { "epoch": 1.9, "learning_rate": 1.5455314095406517e-05, "loss": 0.0234, "step": 293910 }, { "epoch": 1.9, "learning_rate": 1.5445632741049587e-05, "loss": 0.0201, "step": 293920 }, { "epoch": 1.9, "learning_rate": 1.5435951386692653e-05, "loss": 0.0188, "step": 293930 }, { "epoch": 1.9, "learning_rate": 1.5426270032335723e-05, "loss": 0.0215, "step": 293940 }, { "epoch": 1.9, "learning_rate": 1.541658867797879e-05, "loss": 0.0254, "step": 293950 }, { "epoch": 1.9, "learning_rate": 1.540690732362186e-05, "loss": 0.0228, "step": 293960 }, { "epoch": 1.9, "learning_rate": 1.5397225969264925e-05, "loss": 0.0195, "step": 293970 }, { "epoch": 1.9, "learning_rate": 1.5387544614907995e-05, "loss": 0.0181, "step": 293980 }, { "epoch": 1.9, "learning_rate": 1.537786326055106e-05, "loss": 0.0216, "step": 293990 }, { "epoch": 1.9, "learning_rate": 1.5368181906194127e-05, "loss": 0.0223, "step": 294000 }, { "epoch": 1.9, "eval_cer": 0.9198427296350695, "eval_loss": 0.016799306496977806, "eval_runtime": 120.1061, "eval_samples_per_second": 16.652, "eval_steps_per_second": 4.163, "step": 294000 }, { "epoch": 1.9, "learning_rate": 1.5358500551837197e-05, "loss": 0.0189, "step": 294010 }, { "epoch": 1.9, "learning_rate": 1.5348819197480266e-05, "loss": 0.0198, "step": 294020 }, { "epoch": 1.9, "learning_rate": 1.5339137843123333e-05, "loss": 0.0212, "step": 294030 }, { "epoch": 1.9, "learning_rate": 1.53294564887664e-05, "loss": 0.0218, "step": 294040 }, { "epoch": 1.9, "learning_rate": 1.531977513440947e-05, "loss": 0.0271, "step": 294050 }, { "epoch": 1.9, "learning_rate": 1.5310093780052538e-05, "loss": 0.0209, "step": 294060 }, { "epoch": 1.9, "learning_rate": 1.5300412425695604e-05, "loss": 0.0185, "step": 294070 }, { "epoch": 1.9, "learning_rate": 1.529073107133867e-05, "loss": 0.0206, "step": 294080 }, { "epoch": 1.9, "learning_rate": 1.528104971698174e-05, "loss": 0.0236, "step": 294090 }, { "epoch": 1.9, "learning_rate": 1.527136836262481e-05, "loss": 0.0239, "step": 294100 }, { "epoch": 1.9, "learning_rate": 1.5261687008267876e-05, "loss": 0.0236, "step": 294110 }, { "epoch": 1.9, "learning_rate": 1.5252005653910944e-05, "loss": 0.0239, "step": 294120 }, { "epoch": 1.9, "learning_rate": 1.5242324299554012e-05, "loss": 0.0235, "step": 294130 }, { "epoch": 1.9, "learning_rate": 1.5232642945197078e-05, "loss": 0.0193, "step": 294140 }, { "epoch": 1.9, "learning_rate": 1.5222961590840146e-05, "loss": 0.0219, "step": 294150 }, { "epoch": 1.9, "learning_rate": 1.5213280236483214e-05, "loss": 0.0251, "step": 294160 }, { "epoch": 1.9, "learning_rate": 1.5203598882126282e-05, "loss": 0.0234, "step": 294170 }, { "epoch": 1.9, "learning_rate": 1.519391752776935e-05, "loss": 0.0215, "step": 294180 }, { "epoch": 1.9, "learning_rate": 1.5184236173412418e-05, "loss": 0.023, "step": 294190 }, { "epoch": 1.9, "learning_rate": 1.5174554819055486e-05, "loss": 0.0259, "step": 294200 }, { "epoch": 1.9, "learning_rate": 1.5164873464698552e-05, "loss": 0.0252, "step": 294210 }, { "epoch": 1.9, "learning_rate": 1.5155192110341622e-05, "loss": 0.0205, "step": 294220 }, { "epoch": 1.9, "learning_rate": 1.514551075598469e-05, "loss": 0.022, "step": 294230 }, { "epoch": 1.9, "learning_rate": 1.5135829401627756e-05, "loss": 0.0242, "step": 294240 }, { "epoch": 1.9, "learning_rate": 1.5126148047270824e-05, "loss": 0.0217, "step": 294250 }, { "epoch": 1.9, "learning_rate": 1.5116466692913893e-05, "loss": 0.0223, "step": 294260 }, { "epoch": 1.9, "learning_rate": 1.5106785338556961e-05, "loss": 0.0193, "step": 294270 }, { "epoch": 1.9, "learning_rate": 1.5097103984200028e-05, "loss": 0.0217, "step": 294280 }, { "epoch": 1.9, "learning_rate": 1.5087422629843096e-05, "loss": 0.0219, "step": 294290 }, { "epoch": 1.9, "learning_rate": 1.5077741275486165e-05, "loss": 0.0219, "step": 294300 }, { "epoch": 1.9, "learning_rate": 1.5068059921129231e-05, "loss": 0.0244, "step": 294310 }, { "epoch": 1.9, "learning_rate": 1.50583785667723e-05, "loss": 0.0259, "step": 294320 }, { "epoch": 1.9, "learning_rate": 1.5048697212415367e-05, "loss": 0.0258, "step": 294330 }, { "epoch": 1.9, "learning_rate": 1.5039015858058437e-05, "loss": 0.0204, "step": 294340 }, { "epoch": 1.9, "learning_rate": 1.5029334503701503e-05, "loss": 0.0239, "step": 294350 }, { "epoch": 1.9, "learning_rate": 1.5019653149344571e-05, "loss": 0.0234, "step": 294360 }, { "epoch": 1.9, "learning_rate": 1.5009971794987639e-05, "loss": 0.0226, "step": 294370 }, { "epoch": 1.9, "learning_rate": 1.5000290440630705e-05, "loss": 0.0237, "step": 294380 }, { "epoch": 1.9, "learning_rate": 1.4990609086273775e-05, "loss": 0.0248, "step": 294390 }, { "epoch": 1.9, "learning_rate": 1.4980927731916843e-05, "loss": 0.0215, "step": 294400 }, { "epoch": 1.9, "learning_rate": 1.497124637755991e-05, "loss": 0.0266, "step": 294410 }, { "epoch": 1.9, "learning_rate": 1.4961565023202977e-05, "loss": 0.0231, "step": 294420 }, { "epoch": 1.9, "learning_rate": 1.4951883668846047e-05, "loss": 0.0203, "step": 294430 }, { "epoch": 1.9, "learning_rate": 1.4942202314489115e-05, "loss": 0.0192, "step": 294440 }, { "epoch": 1.9, "learning_rate": 1.493252096013218e-05, "loss": 0.02, "step": 294450 }, { "epoch": 1.9, "learning_rate": 1.4922839605775249e-05, "loss": 0.0191, "step": 294460 }, { "epoch": 1.9, "learning_rate": 1.4913158251418318e-05, "loss": 0.0229, "step": 294470 }, { "epoch": 1.9, "learning_rate": 1.4903476897061386e-05, "loss": 0.0265, "step": 294480 }, { "epoch": 1.9, "learning_rate": 1.4893795542704452e-05, "loss": 0.0199, "step": 294490 }, { "epoch": 1.9, "learning_rate": 1.488411418834752e-05, "loss": 0.0245, "step": 294500 }, { "epoch": 1.9, "learning_rate": 1.4874432833990588e-05, "loss": 0.0206, "step": 294510 }, { "epoch": 1.9, "learning_rate": 1.4864751479633656e-05, "loss": 0.025, "step": 294520 }, { "epoch": 1.9, "learning_rate": 1.4855070125276724e-05, "loss": 0.0252, "step": 294530 }, { "epoch": 1.9, "learning_rate": 1.4845388770919792e-05, "loss": 0.0242, "step": 294540 }, { "epoch": 1.9, "learning_rate": 1.483570741656286e-05, "loss": 0.0219, "step": 294550 }, { "epoch": 1.9, "learning_rate": 1.4826026062205926e-05, "loss": 0.0205, "step": 294560 }, { "epoch": 1.9, "learning_rate": 1.4816344707848996e-05, "loss": 0.0214, "step": 294570 }, { "epoch": 1.9, "learning_rate": 1.4806663353492064e-05, "loss": 0.0242, "step": 294580 }, { "epoch": 1.9, "learning_rate": 1.479698199913513e-05, "loss": 0.0186, "step": 294590 }, { "epoch": 1.9, "learning_rate": 1.4787300644778198e-05, "loss": 0.0216, "step": 294600 }, { "epoch": 1.9, "learning_rate": 1.4777619290421268e-05, "loss": 0.0236, "step": 294610 }, { "epoch": 1.9, "learning_rate": 1.4767937936064334e-05, "loss": 0.0214, "step": 294620 }, { "epoch": 1.9, "learning_rate": 1.4758256581707402e-05, "loss": 0.022, "step": 294630 }, { "epoch": 1.9, "learning_rate": 1.474857522735047e-05, "loss": 0.0226, "step": 294640 }, { "epoch": 1.9, "learning_rate": 1.473889387299354e-05, "loss": 0.0231, "step": 294650 }, { "epoch": 1.9, "learning_rate": 1.4729212518636606e-05, "loss": 0.0217, "step": 294660 }, { "epoch": 1.9, "learning_rate": 1.4719531164279674e-05, "loss": 0.023, "step": 294670 }, { "epoch": 1.9, "learning_rate": 1.4709849809922742e-05, "loss": 0.0267, "step": 294680 }, { "epoch": 1.9, "learning_rate": 1.4700168455565808e-05, "loss": 0.0244, "step": 294690 }, { "epoch": 1.9, "learning_rate": 1.4690487101208877e-05, "loss": 0.0223, "step": 294700 }, { "epoch": 1.9, "learning_rate": 1.4680805746851945e-05, "loss": 0.017, "step": 294710 }, { "epoch": 1.9, "learning_rate": 1.4671124392495013e-05, "loss": 0.0246, "step": 294720 }, { "epoch": 1.9, "learning_rate": 1.466144303813808e-05, "loss": 0.0259, "step": 294730 }, { "epoch": 1.9, "learning_rate": 1.4651761683781149e-05, "loss": 0.0227, "step": 294740 }, { "epoch": 1.9, "learning_rate": 1.4642080329424217e-05, "loss": 0.0205, "step": 294750 }, { "epoch": 1.9, "learning_rate": 1.4632398975067283e-05, "loss": 0.0237, "step": 294760 }, { "epoch": 1.9, "learning_rate": 1.4622717620710351e-05, "loss": 0.0226, "step": 294770 }, { "epoch": 1.9, "learning_rate": 1.461303626635342e-05, "loss": 0.0194, "step": 294780 }, { "epoch": 1.9, "learning_rate": 1.4603354911996489e-05, "loss": 0.0226, "step": 294790 }, { "epoch": 1.9, "learning_rate": 1.4593673557639555e-05, "loss": 0.021, "step": 294800 }, { "epoch": 1.9, "learning_rate": 1.4583992203282623e-05, "loss": 0.0214, "step": 294810 }, { "epoch": 1.9, "learning_rate": 1.4574310848925691e-05, "loss": 0.0273, "step": 294820 }, { "epoch": 1.9, "learning_rate": 1.4564629494568759e-05, "loss": 0.0273, "step": 294830 }, { "epoch": 1.9, "learning_rate": 1.4554948140211827e-05, "loss": 0.019, "step": 294840 }, { "epoch": 1.9, "learning_rate": 1.4545266785854895e-05, "loss": 0.0231, "step": 294850 }, { "epoch": 1.9, "learning_rate": 1.4535585431497963e-05, "loss": 0.0226, "step": 294860 }, { "epoch": 1.9, "learning_rate": 1.4525904077141029e-05, "loss": 0.0174, "step": 294870 }, { "epoch": 1.9, "learning_rate": 1.4516222722784098e-05, "loss": 0.0191, "step": 294880 }, { "epoch": 1.9, "learning_rate": 1.4506541368427166e-05, "loss": 0.0197, "step": 294890 }, { "epoch": 1.9, "learning_rate": 1.4496860014070233e-05, "loss": 0.0235, "step": 294900 }, { "epoch": 1.9, "learning_rate": 1.44871786597133e-05, "loss": 0.0209, "step": 294910 }, { "epoch": 1.9, "learning_rate": 1.447749730535637e-05, "loss": 0.0242, "step": 294920 }, { "epoch": 1.9, "learning_rate": 1.4467815950999438e-05, "loss": 0.0241, "step": 294930 }, { "epoch": 1.9, "learning_rate": 1.4458134596642504e-05, "loss": 0.0216, "step": 294940 }, { "epoch": 1.9, "learning_rate": 1.4448453242285572e-05, "loss": 0.0205, "step": 294950 }, { "epoch": 1.9, "learning_rate": 1.4438771887928642e-05, "loss": 0.0194, "step": 294960 }, { "epoch": 1.9, "learning_rate": 1.4429090533571708e-05, "loss": 0.0201, "step": 294970 }, { "epoch": 1.9, "learning_rate": 1.4419409179214776e-05, "loss": 0.0347, "step": 294980 }, { "epoch": 1.9, "learning_rate": 1.4409727824857844e-05, "loss": 0.0224, "step": 294990 }, { "epoch": 1.9, "learning_rate": 1.4400046470500914e-05, "loss": 0.0255, "step": 295000 }, { "epoch": 1.9, "eval_cer": 0.9198345949610214, "eval_loss": 0.01676587574183941, "eval_runtime": 120.4368, "eval_samples_per_second": 16.606, "eval_steps_per_second": 4.152, "step": 295000 }, { "epoch": 1.9, "learning_rate": 1.439036511614398e-05, "loss": 0.0216, "step": 295010 }, { "epoch": 1.9, "learning_rate": 1.4380683761787048e-05, "loss": 0.0258, "step": 295020 }, { "epoch": 1.9, "learning_rate": 1.4371002407430116e-05, "loss": 0.0238, "step": 295030 }, { "epoch": 1.9, "learning_rate": 1.4361321053073182e-05, "loss": 0.0207, "step": 295040 }, { "epoch": 1.9, "learning_rate": 1.4351639698716252e-05, "loss": 0.0224, "step": 295050 }, { "epoch": 1.9, "learning_rate": 1.434195834435932e-05, "loss": 0.0238, "step": 295060 }, { "epoch": 1.9, "learning_rate": 1.4332276990002386e-05, "loss": 0.022, "step": 295070 }, { "epoch": 1.9, "learning_rate": 1.4322595635645454e-05, "loss": 0.0232, "step": 295080 }, { "epoch": 1.9, "learning_rate": 1.4312914281288523e-05, "loss": 0.0234, "step": 295090 }, { "epoch": 1.9, "learning_rate": 1.4303232926931591e-05, "loss": 0.0184, "step": 295100 }, { "epoch": 1.9, "learning_rate": 1.4293551572574658e-05, "loss": 0.0217, "step": 295110 }, { "epoch": 1.9, "learning_rate": 1.4283870218217725e-05, "loss": 0.0216, "step": 295120 }, { "epoch": 1.9, "learning_rate": 1.4274188863860795e-05, "loss": 0.0229, "step": 295130 }, { "epoch": 1.9, "learning_rate": 1.4264507509503861e-05, "loss": 0.0217, "step": 295140 }, { "epoch": 1.9, "learning_rate": 1.425482615514693e-05, "loss": 0.0242, "step": 295150 }, { "epoch": 1.91, "learning_rate": 1.4245144800789997e-05, "loss": 0.0233, "step": 295160 }, { "epoch": 1.91, "learning_rate": 1.4235463446433065e-05, "loss": 0.0173, "step": 295170 }, { "epoch": 1.91, "learning_rate": 1.4225782092076133e-05, "loss": 0.0195, "step": 295180 }, { "epoch": 1.91, "learning_rate": 1.4216100737719201e-05, "loss": 0.0249, "step": 295190 }, { "epoch": 1.91, "learning_rate": 1.4206419383362269e-05, "loss": 0.0236, "step": 295200 }, { "epoch": 1.91, "learning_rate": 1.4196738029005335e-05, "loss": 0.0262, "step": 295210 }, { "epoch": 1.91, "learning_rate": 1.4187056674648403e-05, "loss": 0.0204, "step": 295220 }, { "epoch": 1.91, "learning_rate": 1.4177375320291473e-05, "loss": 0.0212, "step": 295230 }, { "epoch": 1.91, "learning_rate": 1.416769396593454e-05, "loss": 0.0172, "step": 295240 }, { "epoch": 1.91, "learning_rate": 1.4158012611577607e-05, "loss": 0.022, "step": 295250 }, { "epoch": 1.91, "learning_rate": 1.4148331257220675e-05, "loss": 0.0229, "step": 295260 }, { "epoch": 1.91, "learning_rate": 1.4138649902863744e-05, "loss": 0.0218, "step": 295270 }, { "epoch": 1.91, "learning_rate": 1.412896854850681e-05, "loss": 0.0215, "step": 295280 }, { "epoch": 1.91, "learning_rate": 1.4119287194149879e-05, "loss": 0.0217, "step": 295290 }, { "epoch": 1.91, "learning_rate": 1.4109605839792947e-05, "loss": 0.024, "step": 295300 }, { "epoch": 1.91, "learning_rate": 1.4099924485436016e-05, "loss": 0.0238, "step": 295310 }, { "epoch": 1.91, "learning_rate": 1.4090243131079082e-05, "loss": 0.0222, "step": 295320 }, { "epoch": 1.91, "learning_rate": 1.408056177672215e-05, "loss": 0.0244, "step": 295330 }, { "epoch": 1.91, "learning_rate": 1.4070880422365218e-05, "loss": 0.026, "step": 295340 }, { "epoch": 1.91, "learning_rate": 1.4061199068008285e-05, "loss": 0.0169, "step": 295350 }, { "epoch": 1.91, "learning_rate": 1.4051517713651354e-05, "loss": 0.0232, "step": 295360 }, { "epoch": 1.91, "learning_rate": 1.4041836359294422e-05, "loss": 0.0263, "step": 295370 }, { "epoch": 1.91, "learning_rate": 1.403215500493749e-05, "loss": 0.021, "step": 295380 }, { "epoch": 1.91, "learning_rate": 1.4022473650580556e-05, "loss": 0.0195, "step": 295390 }, { "epoch": 1.91, "learning_rate": 1.4012792296223626e-05, "loss": 0.0211, "step": 295400 }, { "epoch": 1.91, "learning_rate": 1.4003110941866694e-05, "loss": 0.0251, "step": 295410 }, { "epoch": 1.91, "learning_rate": 1.399342958750976e-05, "loss": 0.0182, "step": 295420 }, { "epoch": 1.91, "learning_rate": 1.3983748233152828e-05, "loss": 0.0245, "step": 295430 }, { "epoch": 1.91, "learning_rate": 1.3974066878795898e-05, "loss": 0.0169, "step": 295440 }, { "epoch": 1.91, "learning_rate": 1.3964385524438966e-05, "loss": 0.0232, "step": 295450 }, { "epoch": 1.91, "learning_rate": 1.3954704170082032e-05, "loss": 0.0275, "step": 295460 }, { "epoch": 1.91, "learning_rate": 1.39450228157251e-05, "loss": 0.021, "step": 295470 }, { "epoch": 1.91, "learning_rate": 1.3935341461368168e-05, "loss": 0.0209, "step": 295480 }, { "epoch": 1.91, "learning_rate": 1.3925660107011236e-05, "loss": 0.0231, "step": 295490 }, { "epoch": 1.91, "learning_rate": 1.3915978752654304e-05, "loss": 0.0224, "step": 295500 }, { "epoch": 1.91, "learning_rate": 1.3906297398297371e-05, "loss": 0.0223, "step": 295510 }, { "epoch": 1.91, "learning_rate": 1.3896616043940438e-05, "loss": 0.0236, "step": 295520 }, { "epoch": 1.91, "learning_rate": 1.3886934689583507e-05, "loss": 0.0213, "step": 295530 }, { "epoch": 1.91, "learning_rate": 1.3877253335226575e-05, "loss": 0.0248, "step": 295540 }, { "epoch": 1.91, "learning_rate": 1.3867571980869643e-05, "loss": 0.0185, "step": 295550 }, { "epoch": 1.91, "learning_rate": 1.385789062651271e-05, "loss": 0.0218, "step": 295560 }, { "epoch": 1.91, "learning_rate": 1.3848209272155777e-05, "loss": 0.0201, "step": 295570 }, { "epoch": 1.91, "learning_rate": 1.3838527917798847e-05, "loss": 0.025, "step": 295580 }, { "epoch": 1.91, "learning_rate": 1.3828846563441913e-05, "loss": 0.0227, "step": 295590 }, { "epoch": 1.91, "learning_rate": 1.3819165209084981e-05, "loss": 0.0216, "step": 295600 }, { "epoch": 1.91, "learning_rate": 1.3809483854728049e-05, "loss": 0.0252, "step": 295610 }, { "epoch": 1.91, "learning_rate": 1.3799802500371119e-05, "loss": 0.0195, "step": 295620 }, { "epoch": 1.91, "learning_rate": 1.3790121146014185e-05, "loss": 0.0214, "step": 295630 }, { "epoch": 1.91, "learning_rate": 1.3780439791657253e-05, "loss": 0.0253, "step": 295640 }, { "epoch": 1.91, "learning_rate": 1.3770758437300321e-05, "loss": 0.0209, "step": 295650 }, { "epoch": 1.91, "learning_rate": 1.3761077082943387e-05, "loss": 0.0204, "step": 295660 }, { "epoch": 1.91, "learning_rate": 1.3751395728586457e-05, "loss": 0.0229, "step": 295670 }, { "epoch": 1.91, "learning_rate": 1.3741714374229525e-05, "loss": 0.0265, "step": 295680 }, { "epoch": 1.91, "learning_rate": 1.3732033019872593e-05, "loss": 0.02, "step": 295690 }, { "epoch": 1.91, "learning_rate": 1.3722351665515659e-05, "loss": 0.0211, "step": 295700 }, { "epoch": 1.91, "learning_rate": 1.3712670311158728e-05, "loss": 0.0232, "step": 295710 }, { "epoch": 1.91, "learning_rate": 1.3702988956801796e-05, "loss": 0.0233, "step": 295720 }, { "epoch": 1.91, "learning_rate": 1.3693307602444863e-05, "loss": 0.028, "step": 295730 }, { "epoch": 1.91, "learning_rate": 1.368362624808793e-05, "loss": 0.0224, "step": 295740 }, { "epoch": 1.91, "learning_rate": 1.3673944893731e-05, "loss": 0.0186, "step": 295750 }, { "epoch": 1.91, "learning_rate": 1.3664263539374068e-05, "loss": 0.0215, "step": 295760 }, { "epoch": 1.91, "learning_rate": 1.3654582185017134e-05, "loss": 0.0232, "step": 295770 }, { "epoch": 1.91, "learning_rate": 1.3644900830660202e-05, "loss": 0.0194, "step": 295780 }, { "epoch": 1.91, "learning_rate": 1.3635219476303272e-05, "loss": 0.026, "step": 295790 }, { "epoch": 1.91, "learning_rate": 1.3625538121946338e-05, "loss": 0.0231, "step": 295800 }, { "epoch": 1.91, "learning_rate": 1.3615856767589406e-05, "loss": 0.0199, "step": 295810 }, { "epoch": 1.91, "learning_rate": 1.3606175413232474e-05, "loss": 0.0206, "step": 295820 }, { "epoch": 1.91, "learning_rate": 1.3596494058875542e-05, "loss": 0.0272, "step": 295830 }, { "epoch": 1.91, "learning_rate": 1.358681270451861e-05, "loss": 0.0242, "step": 295840 }, { "epoch": 1.91, "learning_rate": 1.3577131350161678e-05, "loss": 0.0236, "step": 295850 }, { "epoch": 1.91, "learning_rate": 1.3567449995804746e-05, "loss": 0.0206, "step": 295860 }, { "epoch": 1.91, "learning_rate": 1.3557768641447812e-05, "loss": 0.0184, "step": 295870 }, { "epoch": 1.91, "learning_rate": 1.354808728709088e-05, "loss": 0.0213, "step": 295880 }, { "epoch": 1.91, "learning_rate": 1.353840593273395e-05, "loss": 0.0209, "step": 295890 }, { "epoch": 1.91, "learning_rate": 1.3528724578377016e-05, "loss": 0.0225, "step": 295900 }, { "epoch": 1.91, "learning_rate": 1.3519043224020084e-05, "loss": 0.0203, "step": 295910 }, { "epoch": 1.91, "learning_rate": 1.3509361869663152e-05, "loss": 0.0206, "step": 295920 }, { "epoch": 1.91, "learning_rate": 1.3499680515306221e-05, "loss": 0.0246, "step": 295930 }, { "epoch": 1.91, "learning_rate": 1.3489999160949288e-05, "loss": 0.0189, "step": 295940 }, { "epoch": 1.91, "learning_rate": 1.3480317806592355e-05, "loss": 0.0229, "step": 295950 }, { "epoch": 1.91, "learning_rate": 1.3470636452235423e-05, "loss": 0.023, "step": 295960 }, { "epoch": 1.91, "learning_rate": 1.346095509787849e-05, "loss": 0.0237, "step": 295970 }, { "epoch": 1.91, "learning_rate": 1.345127374352156e-05, "loss": 0.0212, "step": 295980 }, { "epoch": 1.91, "learning_rate": 1.3441592389164627e-05, "loss": 0.0192, "step": 295990 }, { "epoch": 1.91, "learning_rate": 1.3431911034807695e-05, "loss": 0.0248, "step": 296000 }, { "epoch": 1.91, "eval_cer": 0.9198454411930855, "eval_loss": 0.0166392233222723, "eval_runtime": 120.6295, "eval_samples_per_second": 16.58, "eval_steps_per_second": 4.145, "step": 296000 }, { "epoch": 1.91, "learning_rate": 1.3422229680450761e-05, "loss": 0.0237, "step": 296010 }, { "epoch": 1.91, "learning_rate": 1.3412548326093831e-05, "loss": 0.0253, "step": 296020 }, { "epoch": 1.91, "learning_rate": 1.3402866971736899e-05, "loss": 0.0262, "step": 296030 }, { "epoch": 1.91, "learning_rate": 1.3393185617379965e-05, "loss": 0.0233, "step": 296040 }, { "epoch": 1.91, "learning_rate": 1.3383504263023033e-05, "loss": 0.0249, "step": 296050 }, { "epoch": 1.91, "learning_rate": 1.3373822908666103e-05, "loss": 0.0229, "step": 296060 }, { "epoch": 1.91, "learning_rate": 1.336414155430917e-05, "loss": 0.0212, "step": 296070 }, { "epoch": 1.91, "learning_rate": 1.3354460199952237e-05, "loss": 0.0217, "step": 296080 }, { "epoch": 1.91, "learning_rate": 1.3344778845595305e-05, "loss": 0.0225, "step": 296090 }, { "epoch": 1.91, "learning_rate": 1.3335097491238374e-05, "loss": 0.0216, "step": 296100 }, { "epoch": 1.91, "learning_rate": 1.332541613688144e-05, "loss": 0.0338, "step": 296110 }, { "epoch": 1.91, "learning_rate": 1.3315734782524509e-05, "loss": 0.0252, "step": 296120 }, { "epoch": 1.91, "learning_rate": 1.3306053428167577e-05, "loss": 0.026, "step": 296130 }, { "epoch": 1.91, "learning_rate": 1.3296372073810646e-05, "loss": 0.0255, "step": 296140 }, { "epoch": 1.91, "learning_rate": 1.3286690719453712e-05, "loss": 0.02, "step": 296150 }, { "epoch": 1.91, "learning_rate": 1.327700936509678e-05, "loss": 0.0219, "step": 296160 }, { "epoch": 1.91, "learning_rate": 1.3267328010739848e-05, "loss": 0.029, "step": 296170 }, { "epoch": 1.91, "learning_rate": 1.3257646656382915e-05, "loss": 0.0295, "step": 296180 }, { "epoch": 1.91, "learning_rate": 1.3247965302025984e-05, "loss": 0.019, "step": 296190 }, { "epoch": 1.91, "learning_rate": 1.3238283947669052e-05, "loss": 0.023, "step": 296200 }, { "epoch": 1.91, "learning_rate": 1.322860259331212e-05, "loss": 0.0252, "step": 296210 }, { "epoch": 1.91, "learning_rate": 1.3218921238955186e-05, "loss": 0.023, "step": 296220 }, { "epoch": 1.91, "learning_rate": 1.3209239884598254e-05, "loss": 0.0218, "step": 296230 }, { "epoch": 1.91, "learning_rate": 1.3199558530241324e-05, "loss": 0.0235, "step": 296240 }, { "epoch": 1.91, "learning_rate": 1.318987717588439e-05, "loss": 0.0208, "step": 296250 }, { "epoch": 1.91, "learning_rate": 1.3180195821527458e-05, "loss": 0.0291, "step": 296260 }, { "epoch": 1.91, "learning_rate": 1.3170514467170526e-05, "loss": 0.0206, "step": 296270 }, { "epoch": 1.91, "learning_rate": 1.3160833112813596e-05, "loss": 0.02, "step": 296280 }, { "epoch": 1.91, "learning_rate": 1.3151151758456662e-05, "loss": 0.0203, "step": 296290 }, { "epoch": 1.91, "learning_rate": 1.314147040409973e-05, "loss": 0.0185, "step": 296300 }, { "epoch": 1.91, "learning_rate": 1.3131789049742798e-05, "loss": 0.0194, "step": 296310 }, { "epoch": 1.91, "learning_rate": 1.3122107695385864e-05, "loss": 0.02, "step": 296320 }, { "epoch": 1.91, "learning_rate": 1.3112426341028934e-05, "loss": 0.0204, "step": 296330 }, { "epoch": 1.91, "learning_rate": 1.3102744986672001e-05, "loss": 0.0233, "step": 296340 }, { "epoch": 1.91, "learning_rate": 1.3093063632315068e-05, "loss": 0.0207, "step": 296350 }, { "epoch": 1.91, "learning_rate": 1.3083382277958136e-05, "loss": 0.0237, "step": 296360 }, { "epoch": 1.91, "learning_rate": 1.3073700923601205e-05, "loss": 0.0223, "step": 296370 }, { "epoch": 1.91, "learning_rate": 1.3064019569244273e-05, "loss": 0.0239, "step": 296380 }, { "epoch": 1.91, "learning_rate": 1.305433821488734e-05, "loss": 0.0223, "step": 296390 }, { "epoch": 1.91, "learning_rate": 1.3044656860530407e-05, "loss": 0.0195, "step": 296400 }, { "epoch": 1.91, "learning_rate": 1.3034975506173477e-05, "loss": 0.0217, "step": 296410 }, { "epoch": 1.91, "learning_rate": 1.3025294151816543e-05, "loss": 0.0233, "step": 296420 }, { "epoch": 1.91, "learning_rate": 1.3015612797459611e-05, "loss": 0.0239, "step": 296430 }, { "epoch": 1.91, "learning_rate": 1.3005931443102679e-05, "loss": 0.0224, "step": 296440 }, { "epoch": 1.91, "learning_rate": 1.2996250088745749e-05, "loss": 0.0272, "step": 296450 }, { "epoch": 1.91, "learning_rate": 1.2986568734388815e-05, "loss": 0.0196, "step": 296460 }, { "epoch": 1.91, "learning_rate": 1.2976887380031883e-05, "loss": 0.0212, "step": 296470 }, { "epoch": 1.91, "learning_rate": 1.2967206025674951e-05, "loss": 0.0231, "step": 296480 }, { "epoch": 1.91, "learning_rate": 1.2957524671318017e-05, "loss": 0.0241, "step": 296490 }, { "epoch": 1.91, "learning_rate": 1.2947843316961087e-05, "loss": 0.0253, "step": 296500 }, { "epoch": 1.91, "learning_rate": 1.2938161962604155e-05, "loss": 0.0226, "step": 296510 }, { "epoch": 1.91, "learning_rate": 1.2928480608247223e-05, "loss": 0.0209, "step": 296520 }, { "epoch": 1.91, "learning_rate": 1.2918799253890289e-05, "loss": 0.022, "step": 296530 }, { "epoch": 1.91, "learning_rate": 1.2909117899533357e-05, "loss": 0.0267, "step": 296540 }, { "epoch": 1.91, "learning_rate": 1.2899436545176426e-05, "loss": 0.0271, "step": 296550 }, { "epoch": 1.91, "learning_rate": 1.2889755190819493e-05, "loss": 0.0235, "step": 296560 }, { "epoch": 1.91, "learning_rate": 1.288007383646256e-05, "loss": 0.0216, "step": 296570 }, { "epoch": 1.91, "learning_rate": 1.2870392482105628e-05, "loss": 0.0209, "step": 296580 }, { "epoch": 1.91, "learning_rate": 1.2860711127748698e-05, "loss": 0.0203, "step": 296590 }, { "epoch": 1.91, "learning_rate": 1.2851029773391764e-05, "loss": 0.0266, "step": 296600 }, { "epoch": 1.91, "learning_rate": 1.2841348419034832e-05, "loss": 0.0207, "step": 296610 }, { "epoch": 1.91, "learning_rate": 1.28316670646779e-05, "loss": 0.0193, "step": 296620 }, { "epoch": 1.91, "learning_rate": 1.2821985710320966e-05, "loss": 0.0222, "step": 296630 }, { "epoch": 1.91, "learning_rate": 1.2812304355964036e-05, "loss": 0.0186, "step": 296640 }, { "epoch": 1.91, "learning_rate": 1.2802623001607104e-05, "loss": 0.0234, "step": 296650 }, { "epoch": 1.91, "learning_rate": 1.2792941647250172e-05, "loss": 0.0251, "step": 296660 }, { "epoch": 1.91, "learning_rate": 1.2783260292893238e-05, "loss": 0.0232, "step": 296670 }, { "epoch": 1.91, "learning_rate": 1.2773578938536308e-05, "loss": 0.0194, "step": 296680 }, { "epoch": 1.91, "learning_rate": 1.2763897584179376e-05, "loss": 0.0199, "step": 296690 }, { "epoch": 1.91, "learning_rate": 1.2754216229822442e-05, "loss": 0.0249, "step": 296700 }, { "epoch": 1.92, "learning_rate": 1.274453487546551e-05, "loss": 0.0237, "step": 296710 }, { "epoch": 1.92, "learning_rate": 1.273485352110858e-05, "loss": 0.0235, "step": 296720 }, { "epoch": 1.92, "learning_rate": 1.2725172166751647e-05, "loss": 0.0201, "step": 296730 }, { "epoch": 1.92, "learning_rate": 1.2715490812394714e-05, "loss": 0.0235, "step": 296740 }, { "epoch": 1.92, "learning_rate": 1.2705809458037782e-05, "loss": 0.0195, "step": 296750 }, { "epoch": 1.92, "learning_rate": 1.2696128103680851e-05, "loss": 0.0235, "step": 296760 }, { "epoch": 1.92, "learning_rate": 1.2686446749323918e-05, "loss": 0.0216, "step": 296770 }, { "epoch": 1.92, "learning_rate": 1.2676765394966985e-05, "loss": 0.0268, "step": 296780 }, { "epoch": 1.92, "learning_rate": 1.2667084040610053e-05, "loss": 0.0176, "step": 296790 }, { "epoch": 1.92, "learning_rate": 1.265740268625312e-05, "loss": 0.024, "step": 296800 }, { "epoch": 1.92, "learning_rate": 1.264772133189619e-05, "loss": 0.0251, "step": 296810 }, { "epoch": 1.92, "learning_rate": 1.2638039977539257e-05, "loss": 0.0245, "step": 296820 }, { "epoch": 1.92, "learning_rate": 1.2628358623182325e-05, "loss": 0.0282, "step": 296830 }, { "epoch": 1.92, "learning_rate": 1.2618677268825391e-05, "loss": 0.0229, "step": 296840 }, { "epoch": 1.92, "learning_rate": 1.2608995914468461e-05, "loss": 0.0189, "step": 296850 }, { "epoch": 1.92, "learning_rate": 1.2599314560111529e-05, "loss": 0.0247, "step": 296860 }, { "epoch": 1.92, "learning_rate": 1.2589633205754595e-05, "loss": 0.0258, "step": 296870 }, { "epoch": 1.92, "learning_rate": 1.2579951851397663e-05, "loss": 0.0289, "step": 296880 }, { "epoch": 1.92, "learning_rate": 1.2570270497040731e-05, "loss": 0.0298, "step": 296890 }, { "epoch": 1.92, "learning_rate": 1.25605891426838e-05, "loss": 0.0228, "step": 296900 }, { "epoch": 1.92, "learning_rate": 1.2550907788326867e-05, "loss": 0.0247, "step": 296910 }, { "epoch": 1.92, "learning_rate": 1.2541226433969935e-05, "loss": 0.0251, "step": 296920 }, { "epoch": 1.92, "learning_rate": 1.2531545079613003e-05, "loss": 0.0191, "step": 296930 }, { "epoch": 1.92, "learning_rate": 1.2521863725256069e-05, "loss": 0.0229, "step": 296940 }, { "epoch": 1.92, "learning_rate": 1.2512182370899139e-05, "loss": 0.0236, "step": 296950 }, { "epoch": 1.92, "learning_rate": 1.2502501016542207e-05, "loss": 0.0159, "step": 296960 }, { "epoch": 1.92, "learning_rate": 1.2492819662185275e-05, "loss": 0.0254, "step": 296970 }, { "epoch": 1.92, "learning_rate": 1.248313830782834e-05, "loss": 0.0226, "step": 296980 }, { "epoch": 1.92, "learning_rate": 1.247345695347141e-05, "loss": 0.0248, "step": 296990 }, { "epoch": 1.92, "learning_rate": 1.2463775599114478e-05, "loss": 0.0216, "step": 297000 }, { "epoch": 1.92, "eval_cer": 0.9198427296350695, "eval_loss": 0.016580868512392044, "eval_runtime": 120.5977, "eval_samples_per_second": 16.584, "eval_steps_per_second": 4.146, "step": 297000 }, { "epoch": 1.92, "learning_rate": 1.2454094244757545e-05, "loss": 0.0207, "step": 297010 }, { "epoch": 1.92, "learning_rate": 1.2444412890400612e-05, "loss": 0.0212, "step": 297020 }, { "epoch": 1.92, "learning_rate": 1.2434731536043682e-05, "loss": 0.0192, "step": 297030 }, { "epoch": 1.92, "learning_rate": 1.242505018168675e-05, "loss": 0.0201, "step": 297040 }, { "epoch": 1.92, "learning_rate": 1.2415368827329816e-05, "loss": 0.0199, "step": 297050 }, { "epoch": 1.92, "learning_rate": 1.2405687472972884e-05, "loss": 0.024, "step": 297060 }, { "epoch": 1.92, "learning_rate": 1.2396006118615954e-05, "loss": 0.0193, "step": 297070 }, { "epoch": 1.92, "learning_rate": 1.238632476425902e-05, "loss": 0.0257, "step": 297080 }, { "epoch": 1.92, "learning_rate": 1.2376643409902088e-05, "loss": 0.0252, "step": 297090 }, { "epoch": 1.92, "learning_rate": 1.2366962055545156e-05, "loss": 0.0248, "step": 297100 }, { "epoch": 1.92, "learning_rate": 1.2357280701188226e-05, "loss": 0.026, "step": 297110 }, { "epoch": 1.92, "learning_rate": 1.2347599346831292e-05, "loss": 0.0227, "step": 297120 }, { "epoch": 1.92, "learning_rate": 1.233791799247436e-05, "loss": 0.0298, "step": 297130 }, { "epoch": 1.92, "learning_rate": 1.2328236638117428e-05, "loss": 0.0227, "step": 297140 }, { "epoch": 1.92, "learning_rate": 1.2318555283760494e-05, "loss": 0.019, "step": 297150 }, { "epoch": 1.92, "learning_rate": 1.2308873929403564e-05, "loss": 0.0174, "step": 297160 }, { "epoch": 1.92, "learning_rate": 1.2299192575046631e-05, "loss": 0.021, "step": 297170 }, { "epoch": 1.92, "learning_rate": 1.2289511220689698e-05, "loss": 0.0208, "step": 297180 }, { "epoch": 1.92, "learning_rate": 1.2279829866332766e-05, "loss": 0.0207, "step": 297190 }, { "epoch": 1.92, "learning_rate": 1.2270148511975835e-05, "loss": 0.0237, "step": 297200 }, { "epoch": 1.92, "learning_rate": 1.2260467157618903e-05, "loss": 0.0219, "step": 297210 }, { "epoch": 1.92, "learning_rate": 1.225078580326197e-05, "loss": 0.0228, "step": 297220 }, { "epoch": 1.92, "learning_rate": 1.2241104448905037e-05, "loss": 0.0237, "step": 297230 }, { "epoch": 1.92, "learning_rate": 1.2231423094548105e-05, "loss": 0.0242, "step": 297240 }, { "epoch": 1.92, "learning_rate": 1.2221741740191173e-05, "loss": 0.0247, "step": 297250 }, { "epoch": 1.92, "learning_rate": 1.2212060385834241e-05, "loss": 0.0206, "step": 297260 }, { "epoch": 1.92, "learning_rate": 1.2202379031477309e-05, "loss": 0.0212, "step": 297270 }, { "epoch": 1.92, "learning_rate": 1.2192697677120377e-05, "loss": 0.0199, "step": 297280 }, { "epoch": 1.92, "learning_rate": 1.2183016322763443e-05, "loss": 0.0243, "step": 297290 }, { "epoch": 1.92, "learning_rate": 1.2173334968406513e-05, "loss": 0.0228, "step": 297300 }, { "epoch": 1.92, "learning_rate": 1.216365361404958e-05, "loss": 0.0194, "step": 297310 }, { "epoch": 1.92, "learning_rate": 1.2153972259692647e-05, "loss": 0.0244, "step": 297320 }, { "epoch": 1.92, "learning_rate": 1.2144290905335715e-05, "loss": 0.018, "step": 297330 }, { "epoch": 1.92, "learning_rate": 1.2134609550978785e-05, "loss": 0.0212, "step": 297340 }, { "epoch": 1.92, "learning_rate": 1.2124928196621853e-05, "loss": 0.0193, "step": 297350 }, { "epoch": 1.92, "learning_rate": 1.2115246842264919e-05, "loss": 0.0216, "step": 297360 }, { "epoch": 1.92, "learning_rate": 1.2105565487907987e-05, "loss": 0.0212, "step": 297370 }, { "epoch": 1.92, "learning_rate": 1.2095884133551056e-05, "loss": 0.02, "step": 297380 }, { "epoch": 1.92, "learning_rate": 1.2086202779194123e-05, "loss": 0.0264, "step": 297390 }, { "epoch": 1.92, "learning_rate": 1.207652142483719e-05, "loss": 0.0254, "step": 297400 }, { "epoch": 1.92, "learning_rate": 1.2066840070480258e-05, "loss": 0.0188, "step": 297410 }, { "epoch": 1.92, "learning_rate": 1.2057158716123328e-05, "loss": 0.021, "step": 297420 }, { "epoch": 1.92, "learning_rate": 1.2047477361766394e-05, "loss": 0.0204, "step": 297430 }, { "epoch": 1.92, "learning_rate": 1.2037796007409462e-05, "loss": 0.0217, "step": 297440 }, { "epoch": 1.92, "learning_rate": 1.202811465305253e-05, "loss": 0.0248, "step": 297450 }, { "epoch": 1.92, "learning_rate": 1.2018433298695596e-05, "loss": 0.0178, "step": 297460 }, { "epoch": 1.92, "learning_rate": 1.2008751944338666e-05, "loss": 0.0229, "step": 297470 }, { "epoch": 1.92, "learning_rate": 1.1999070589981734e-05, "loss": 0.0255, "step": 297480 }, { "epoch": 1.92, "learning_rate": 1.1989389235624802e-05, "loss": 0.0208, "step": 297490 }, { "epoch": 1.92, "learning_rate": 1.1979707881267868e-05, "loss": 0.0227, "step": 297500 }, { "epoch": 1.92, "learning_rate": 1.1970026526910938e-05, "loss": 0.0264, "step": 297510 }, { "epoch": 1.92, "learning_rate": 1.1960345172554006e-05, "loss": 0.0219, "step": 297520 }, { "epoch": 1.92, "learning_rate": 1.1950663818197072e-05, "loss": 0.0216, "step": 297530 }, { "epoch": 1.92, "learning_rate": 1.194098246384014e-05, "loss": 0.0235, "step": 297540 }, { "epoch": 1.92, "learning_rate": 1.1931301109483208e-05, "loss": 0.0202, "step": 297550 }, { "epoch": 1.92, "learning_rate": 1.1921619755126277e-05, "loss": 0.021, "step": 297560 }, { "epoch": 1.92, "learning_rate": 1.1911938400769344e-05, "loss": 0.0188, "step": 297570 }, { "epoch": 1.92, "learning_rate": 1.1902257046412412e-05, "loss": 0.02, "step": 297580 }, { "epoch": 1.92, "learning_rate": 1.189257569205548e-05, "loss": 0.0232, "step": 297590 }, { "epoch": 1.92, "learning_rate": 1.1882894337698546e-05, "loss": 0.0186, "step": 297600 }, { "epoch": 1.92, "learning_rate": 1.1873212983341615e-05, "loss": 0.0199, "step": 297610 }, { "epoch": 1.92, "learning_rate": 1.1863531628984683e-05, "loss": 0.0213, "step": 297620 }, { "epoch": 1.92, "learning_rate": 1.185385027462775e-05, "loss": 0.0192, "step": 297630 }, { "epoch": 1.92, "learning_rate": 1.1844168920270818e-05, "loss": 0.0224, "step": 297640 }, { "epoch": 1.92, "learning_rate": 1.1834487565913887e-05, "loss": 0.0207, "step": 297650 }, { "epoch": 1.92, "learning_rate": 1.1824806211556955e-05, "loss": 0.0227, "step": 297660 }, { "epoch": 1.92, "learning_rate": 1.1815124857200021e-05, "loss": 0.0211, "step": 297670 }, { "epoch": 1.92, "learning_rate": 1.180544350284309e-05, "loss": 0.0216, "step": 297680 }, { "epoch": 1.92, "learning_rate": 1.1795762148486159e-05, "loss": 0.0202, "step": 297690 }, { "epoch": 1.92, "learning_rate": 1.1786080794129225e-05, "loss": 0.022, "step": 297700 }, { "epoch": 1.92, "learning_rate": 1.1776399439772293e-05, "loss": 0.0207, "step": 297710 }, { "epoch": 1.92, "learning_rate": 1.1766718085415361e-05, "loss": 0.022, "step": 297720 }, { "epoch": 1.92, "learning_rate": 1.175703673105843e-05, "loss": 0.0235, "step": 297730 }, { "epoch": 1.92, "learning_rate": 1.1747355376701497e-05, "loss": 0.0213, "step": 297740 }, { "epoch": 1.92, "learning_rate": 1.1737674022344565e-05, "loss": 0.0201, "step": 297750 }, { "epoch": 1.92, "learning_rate": 1.1727992667987633e-05, "loss": 0.0202, "step": 297760 }, { "epoch": 1.92, "learning_rate": 1.1718311313630699e-05, "loss": 0.0219, "step": 297770 }, { "epoch": 1.92, "learning_rate": 1.1708629959273769e-05, "loss": 0.023, "step": 297780 }, { "epoch": 1.92, "learning_rate": 1.1698948604916837e-05, "loss": 0.0198, "step": 297790 }, { "epoch": 1.92, "learning_rate": 1.1689267250559904e-05, "loss": 0.0198, "step": 297800 }, { "epoch": 1.92, "learning_rate": 1.167958589620297e-05, "loss": 0.0183, "step": 297810 }, { "epoch": 1.92, "learning_rate": 1.166990454184604e-05, "loss": 0.0251, "step": 297820 }, { "epoch": 1.92, "learning_rate": 1.1660223187489108e-05, "loss": 0.0203, "step": 297830 }, { "epoch": 1.92, "learning_rate": 1.1650541833132175e-05, "loss": 0.0233, "step": 297840 }, { "epoch": 1.92, "learning_rate": 1.1640860478775242e-05, "loss": 0.0203, "step": 297850 }, { "epoch": 1.92, "learning_rate": 1.1631179124418312e-05, "loss": 0.0225, "step": 297860 }, { "epoch": 1.92, "learning_rate": 1.162149777006138e-05, "loss": 0.0213, "step": 297870 }, { "epoch": 1.92, "learning_rate": 1.1611816415704446e-05, "loss": 0.0226, "step": 297880 }, { "epoch": 1.92, "learning_rate": 1.1602135061347514e-05, "loss": 0.0193, "step": 297890 }, { "epoch": 1.92, "learning_rate": 1.1592453706990582e-05, "loss": 0.0256, "step": 297900 }, { "epoch": 1.92, "learning_rate": 1.158277235263365e-05, "loss": 0.0239, "step": 297910 }, { "epoch": 1.92, "learning_rate": 1.1573090998276718e-05, "loss": 0.0244, "step": 297920 }, { "epoch": 1.92, "learning_rate": 1.1563409643919786e-05, "loss": 0.0176, "step": 297930 }, { "epoch": 1.92, "learning_rate": 1.1553728289562854e-05, "loss": 0.0206, "step": 297940 }, { "epoch": 1.92, "learning_rate": 1.154404693520592e-05, "loss": 0.0201, "step": 297950 }, { "epoch": 1.92, "learning_rate": 1.153436558084899e-05, "loss": 0.0205, "step": 297960 }, { "epoch": 1.92, "learning_rate": 1.1524684226492058e-05, "loss": 0.0181, "step": 297970 }, { "epoch": 1.92, "learning_rate": 1.1515002872135124e-05, "loss": 0.0254, "step": 297980 }, { "epoch": 1.92, "learning_rate": 1.1505321517778192e-05, "loss": 0.0255, "step": 297990 }, { "epoch": 1.92, "learning_rate": 1.1495640163421261e-05, "loss": 0.0219, "step": 298000 }, { "epoch": 1.92, "eval_cer": 0.9198427296350695, "eval_loss": 0.016680259257555008, "eval_runtime": 120.6259, "eval_samples_per_second": 16.58, "eval_steps_per_second": 4.145, "step": 298000 }, { "epoch": 1.92, "learning_rate": 1.148595880906433e-05, "loss": 0.0187, "step": 298010 }, { "epoch": 1.92, "learning_rate": 1.1476277454707396e-05, "loss": 0.03, "step": 298020 }, { "epoch": 1.92, "learning_rate": 1.1466596100350464e-05, "loss": 0.0263, "step": 298030 }, { "epoch": 1.92, "learning_rate": 1.1456914745993533e-05, "loss": 0.0191, "step": 298040 }, { "epoch": 1.92, "learning_rate": 1.14472333916366e-05, "loss": 0.0175, "step": 298050 }, { "epoch": 1.92, "learning_rate": 1.1437552037279667e-05, "loss": 0.0223, "step": 298060 }, { "epoch": 1.92, "learning_rate": 1.1427870682922735e-05, "loss": 0.0195, "step": 298070 }, { "epoch": 1.92, "learning_rate": 1.1418189328565802e-05, "loss": 0.0282, "step": 298080 }, { "epoch": 1.92, "learning_rate": 1.1408507974208871e-05, "loss": 0.0231, "step": 298090 }, { "epoch": 1.92, "learning_rate": 1.1398826619851939e-05, "loss": 0.0211, "step": 298100 }, { "epoch": 1.92, "learning_rate": 1.1389145265495007e-05, "loss": 0.0215, "step": 298110 }, { "epoch": 1.92, "learning_rate": 1.1379463911138073e-05, "loss": 0.0199, "step": 298120 }, { "epoch": 1.92, "learning_rate": 1.1369782556781143e-05, "loss": 0.0235, "step": 298130 }, { "epoch": 1.92, "learning_rate": 1.136010120242421e-05, "loss": 0.0212, "step": 298140 }, { "epoch": 1.92, "learning_rate": 1.1350419848067277e-05, "loss": 0.0223, "step": 298150 }, { "epoch": 1.92, "learning_rate": 1.1340738493710345e-05, "loss": 0.0227, "step": 298160 }, { "epoch": 1.92, "learning_rate": 1.1331057139353415e-05, "loss": 0.0268, "step": 298170 }, { "epoch": 1.92, "learning_rate": 1.1321375784996483e-05, "loss": 0.0245, "step": 298180 }, { "epoch": 1.92, "learning_rate": 1.1311694430639549e-05, "loss": 0.0241, "step": 298190 }, { "epoch": 1.92, "learning_rate": 1.1302013076282617e-05, "loss": 0.0235, "step": 298200 }, { "epoch": 1.92, "learning_rate": 1.1292331721925685e-05, "loss": 0.0226, "step": 298210 }, { "epoch": 1.92, "learning_rate": 1.1282650367568753e-05, "loss": 0.0226, "step": 298220 }, { "epoch": 1.92, "learning_rate": 1.127296901321182e-05, "loss": 0.0215, "step": 298230 }, { "epoch": 1.92, "learning_rate": 1.1263287658854888e-05, "loss": 0.0207, "step": 298240 }, { "epoch": 1.92, "learning_rate": 1.1253606304497956e-05, "loss": 0.0263, "step": 298250 }, { "epoch": 1.93, "learning_rate": 1.1243924950141024e-05, "loss": 0.017, "step": 298260 }, { "epoch": 1.93, "learning_rate": 1.1234243595784092e-05, "loss": 0.0208, "step": 298270 }, { "epoch": 1.93, "learning_rate": 1.122456224142716e-05, "loss": 0.0195, "step": 298280 }, { "epoch": 1.93, "learning_rate": 1.1214880887070226e-05, "loss": 0.0226, "step": 298290 }, { "epoch": 1.93, "learning_rate": 1.1205199532713294e-05, "loss": 0.0227, "step": 298300 }, { "epoch": 1.93, "learning_rate": 1.1195518178356364e-05, "loss": 0.0214, "step": 298310 }, { "epoch": 1.93, "learning_rate": 1.1185836823999432e-05, "loss": 0.0223, "step": 298320 }, { "epoch": 1.93, "learning_rate": 1.1176155469642498e-05, "loss": 0.0196, "step": 298330 }, { "epoch": 1.93, "learning_rate": 1.1166474115285566e-05, "loss": 0.0201, "step": 298340 }, { "epoch": 1.93, "learning_rate": 1.1156792760928636e-05, "loss": 0.0247, "step": 298350 }, { "epoch": 1.93, "learning_rate": 1.1147111406571702e-05, "loss": 0.0213, "step": 298360 }, { "epoch": 1.93, "learning_rate": 1.113743005221477e-05, "loss": 0.0186, "step": 298370 }, { "epoch": 1.93, "learning_rate": 1.1127748697857838e-05, "loss": 0.0248, "step": 298380 }, { "epoch": 1.93, "learning_rate": 1.1118067343500907e-05, "loss": 0.0233, "step": 298390 }, { "epoch": 1.93, "learning_rate": 1.1108385989143974e-05, "loss": 0.0223, "step": 298400 }, { "epoch": 1.93, "learning_rate": 1.1098704634787042e-05, "loss": 0.0181, "step": 298410 }, { "epoch": 1.93, "learning_rate": 1.108902328043011e-05, "loss": 0.028, "step": 298420 }, { "epoch": 1.93, "learning_rate": 1.1079341926073176e-05, "loss": 0.0232, "step": 298430 }, { "epoch": 1.93, "learning_rate": 1.1069660571716245e-05, "loss": 0.0208, "step": 298440 }, { "epoch": 1.93, "learning_rate": 1.1059979217359313e-05, "loss": 0.0208, "step": 298450 }, { "epoch": 1.93, "learning_rate": 1.1050297863002381e-05, "loss": 0.0261, "step": 298460 }, { "epoch": 1.93, "learning_rate": 1.1040616508645448e-05, "loss": 0.0188, "step": 298470 }, { "epoch": 1.93, "learning_rate": 1.1030935154288517e-05, "loss": 0.0239, "step": 298480 }, { "epoch": 1.93, "learning_rate": 1.1021253799931585e-05, "loss": 0.0229, "step": 298490 }, { "epoch": 1.93, "learning_rate": 1.1011572445574651e-05, "loss": 0.0221, "step": 298500 }, { "epoch": 1.93, "learning_rate": 1.100189109121772e-05, "loss": 0.0272, "step": 298510 }, { "epoch": 1.93, "learning_rate": 1.0992209736860789e-05, "loss": 0.0209, "step": 298520 }, { "epoch": 1.93, "learning_rate": 1.0982528382503855e-05, "loss": 0.0198, "step": 298530 }, { "epoch": 1.93, "learning_rate": 1.0972847028146923e-05, "loss": 0.0294, "step": 298540 }, { "epoch": 1.93, "learning_rate": 1.0963165673789991e-05, "loss": 0.0203, "step": 298550 }, { "epoch": 1.93, "learning_rate": 1.0953484319433059e-05, "loss": 0.0201, "step": 298560 }, { "epoch": 1.93, "learning_rate": 1.0943802965076127e-05, "loss": 0.0175, "step": 298570 }, { "epoch": 1.93, "learning_rate": 1.0934121610719195e-05, "loss": 0.0222, "step": 298580 }, { "epoch": 1.93, "learning_rate": 1.0924440256362263e-05, "loss": 0.0197, "step": 298590 }, { "epoch": 1.93, "learning_rate": 1.0914758902005329e-05, "loss": 0.0225, "step": 298600 }, { "epoch": 1.93, "learning_rate": 1.0905077547648397e-05, "loss": 0.0239, "step": 298610 }, { "epoch": 1.93, "learning_rate": 1.0895396193291467e-05, "loss": 0.0198, "step": 298620 }, { "epoch": 1.93, "learning_rate": 1.0885714838934534e-05, "loss": 0.0211, "step": 298630 }, { "epoch": 1.93, "learning_rate": 1.08760334845776e-05, "loss": 0.0175, "step": 298640 }, { "epoch": 1.93, "learning_rate": 1.0866352130220669e-05, "loss": 0.0241, "step": 298650 }, { "epoch": 1.93, "learning_rate": 1.0856670775863738e-05, "loss": 0.0235, "step": 298660 }, { "epoch": 1.93, "learning_rate": 1.0846989421506805e-05, "loss": 0.0159, "step": 298670 }, { "epoch": 1.93, "learning_rate": 1.0837308067149872e-05, "loss": 0.0202, "step": 298680 }, { "epoch": 1.93, "learning_rate": 1.082762671279294e-05, "loss": 0.0204, "step": 298690 }, { "epoch": 1.93, "learning_rate": 1.081794535843601e-05, "loss": 0.0171, "step": 298700 }, { "epoch": 1.93, "learning_rate": 1.0808264004079076e-05, "loss": 0.0228, "step": 298710 }, { "epoch": 1.93, "learning_rate": 1.0798582649722144e-05, "loss": 0.0224, "step": 298720 }, { "epoch": 1.93, "learning_rate": 1.0788901295365212e-05, "loss": 0.0227, "step": 298730 }, { "epoch": 1.93, "learning_rate": 1.0779219941008278e-05, "loss": 0.0221, "step": 298740 }, { "epoch": 1.93, "learning_rate": 1.0769538586651348e-05, "loss": 0.0221, "step": 298750 }, { "epoch": 1.93, "learning_rate": 1.0759857232294416e-05, "loss": 0.0202, "step": 298760 }, { "epoch": 1.93, "learning_rate": 1.0750175877937484e-05, "loss": 0.0215, "step": 298770 }, { "epoch": 1.93, "learning_rate": 1.074049452358055e-05, "loss": 0.0203, "step": 298780 }, { "epoch": 1.93, "learning_rate": 1.073081316922362e-05, "loss": 0.0256, "step": 298790 }, { "epoch": 1.93, "learning_rate": 1.0721131814866688e-05, "loss": 0.0236, "step": 298800 }, { "epoch": 1.93, "learning_rate": 1.0711450460509754e-05, "loss": 0.0193, "step": 298810 }, { "epoch": 1.93, "learning_rate": 1.0701769106152822e-05, "loss": 0.0202, "step": 298820 }, { "epoch": 1.93, "learning_rate": 1.0692087751795891e-05, "loss": 0.0255, "step": 298830 }, { "epoch": 1.93, "learning_rate": 1.068240639743896e-05, "loss": 0.0237, "step": 298840 }, { "epoch": 1.93, "learning_rate": 1.0672725043082026e-05, "loss": 0.025, "step": 298850 }, { "epoch": 1.93, "learning_rate": 1.0663043688725094e-05, "loss": 0.022, "step": 298860 }, { "epoch": 1.93, "learning_rate": 1.0653362334368163e-05, "loss": 0.0226, "step": 298870 }, { "epoch": 1.93, "learning_rate": 1.064368098001123e-05, "loss": 0.0225, "step": 298880 }, { "epoch": 1.93, "learning_rate": 1.0633999625654297e-05, "loss": 0.02, "step": 298890 }, { "epoch": 1.93, "learning_rate": 1.0624318271297365e-05, "loss": 0.0225, "step": 298900 }, { "epoch": 1.93, "learning_rate": 1.0614636916940432e-05, "loss": 0.0183, "step": 298910 }, { "epoch": 1.93, "learning_rate": 1.0604955562583501e-05, "loss": 0.0266, "step": 298920 }, { "epoch": 1.93, "learning_rate": 1.0595274208226569e-05, "loss": 0.0196, "step": 298930 }, { "epoch": 1.93, "learning_rate": 1.0585592853869637e-05, "loss": 0.0203, "step": 298940 }, { "epoch": 1.93, "learning_rate": 1.0575911499512703e-05, "loss": 0.0192, "step": 298950 }, { "epoch": 1.93, "learning_rate": 1.0566230145155771e-05, "loss": 0.0213, "step": 298960 }, { "epoch": 1.93, "learning_rate": 1.055654879079884e-05, "loss": 0.0228, "step": 298970 }, { "epoch": 1.93, "learning_rate": 1.0546867436441907e-05, "loss": 0.0177, "step": 298980 }, { "epoch": 1.93, "learning_rate": 1.0537186082084975e-05, "loss": 0.023, "step": 298990 }, { "epoch": 1.93, "learning_rate": 1.0527504727728043e-05, "loss": 0.0196, "step": 299000 }, { "epoch": 1.93, "eval_cer": 0.919811998644221, "eval_loss": 0.016669558361172676, "eval_runtime": 120.4327, "eval_samples_per_second": 16.607, "eval_steps_per_second": 4.152, "step": 299000 }, { "epoch": 1.93, "learning_rate": 1.0517823373371113e-05, "loss": 0.0249, "step": 299010 }, { "epoch": 1.93, "learning_rate": 1.0508142019014179e-05, "loss": 0.0218, "step": 299020 }, { "epoch": 1.93, "learning_rate": 1.0498460664657247e-05, "loss": 0.0258, "step": 299030 }, { "epoch": 1.93, "learning_rate": 1.0488779310300315e-05, "loss": 0.0226, "step": 299040 }, { "epoch": 1.93, "learning_rate": 1.0479097955943381e-05, "loss": 0.021, "step": 299050 }, { "epoch": 1.93, "learning_rate": 1.046941660158645e-05, "loss": 0.0235, "step": 299060 }, { "epoch": 1.93, "learning_rate": 1.0459735247229518e-05, "loss": 0.0238, "step": 299070 }, { "epoch": 1.93, "learning_rate": 1.0450053892872586e-05, "loss": 0.0196, "step": 299080 }, { "epoch": 1.93, "learning_rate": 1.0440372538515653e-05, "loss": 0.0235, "step": 299090 }, { "epoch": 1.93, "learning_rate": 1.0430691184158722e-05, "loss": 0.0226, "step": 299100 }, { "epoch": 1.93, "learning_rate": 1.042100982980179e-05, "loss": 0.0227, "step": 299110 }, { "epoch": 1.93, "learning_rate": 1.0411328475444856e-05, "loss": 0.0225, "step": 299120 }, { "epoch": 1.93, "learning_rate": 1.0401647121087924e-05, "loss": 0.0226, "step": 299130 }, { "epoch": 1.93, "learning_rate": 1.0391965766730994e-05, "loss": 0.0221, "step": 299140 }, { "epoch": 1.93, "learning_rate": 1.0382284412374062e-05, "loss": 0.0198, "step": 299150 }, { "epoch": 1.93, "learning_rate": 1.0372603058017128e-05, "loss": 0.029, "step": 299160 }, { "epoch": 1.93, "learning_rate": 1.0362921703660196e-05, "loss": 0.0228, "step": 299170 }, { "epoch": 1.93, "learning_rate": 1.0353240349303266e-05, "loss": 0.0252, "step": 299180 }, { "epoch": 1.93, "learning_rate": 1.0343558994946332e-05, "loss": 0.0205, "step": 299190 }, { "epoch": 1.93, "learning_rate": 1.03338776405894e-05, "loss": 0.0195, "step": 299200 }, { "epoch": 1.93, "learning_rate": 1.0324196286232468e-05, "loss": 0.0276, "step": 299210 }, { "epoch": 1.93, "learning_rate": 1.0314514931875536e-05, "loss": 0.0237, "step": 299220 }, { "epoch": 1.93, "learning_rate": 1.0304833577518604e-05, "loss": 0.0195, "step": 299230 }, { "epoch": 1.93, "learning_rate": 1.0295152223161672e-05, "loss": 0.0185, "step": 299240 }, { "epoch": 1.93, "learning_rate": 1.028547086880474e-05, "loss": 0.0194, "step": 299250 }, { "epoch": 1.93, "learning_rate": 1.0275789514447806e-05, "loss": 0.0213, "step": 299260 }, { "epoch": 1.93, "learning_rate": 1.0266108160090874e-05, "loss": 0.0206, "step": 299270 }, { "epoch": 1.93, "learning_rate": 1.0256426805733943e-05, "loss": 0.0218, "step": 299280 }, { "epoch": 1.93, "learning_rate": 1.0246745451377011e-05, "loss": 0.0202, "step": 299290 }, { "epoch": 1.93, "learning_rate": 1.0237064097020078e-05, "loss": 0.0252, "step": 299300 }, { "epoch": 1.93, "learning_rate": 1.0227382742663145e-05, "loss": 0.0254, "step": 299310 }, { "epoch": 1.93, "learning_rate": 1.0217701388306215e-05, "loss": 0.019, "step": 299320 }, { "epoch": 1.93, "learning_rate": 1.0208020033949281e-05, "loss": 0.0212, "step": 299330 }, { "epoch": 1.93, "learning_rate": 1.019833867959235e-05, "loss": 0.0197, "step": 299340 }, { "epoch": 1.93, "learning_rate": 1.0188657325235417e-05, "loss": 0.0245, "step": 299350 }, { "epoch": 1.93, "learning_rate": 1.0178975970878483e-05, "loss": 0.0308, "step": 299360 }, { "epoch": 1.93, "learning_rate": 1.0169294616521553e-05, "loss": 0.0203, "step": 299370 }, { "epoch": 1.93, "learning_rate": 1.0159613262164621e-05, "loss": 0.0215, "step": 299380 }, { "epoch": 1.93, "learning_rate": 1.0149931907807689e-05, "loss": 0.0187, "step": 299390 }, { "epoch": 1.93, "learning_rate": 1.0140250553450755e-05, "loss": 0.0223, "step": 299400 }, { "epoch": 1.93, "learning_rate": 1.0130569199093825e-05, "loss": 0.0214, "step": 299410 }, { "epoch": 1.93, "learning_rate": 1.0120887844736893e-05, "loss": 0.0221, "step": 299420 }, { "epoch": 1.93, "learning_rate": 1.0111206490379959e-05, "loss": 0.0227, "step": 299430 }, { "epoch": 1.93, "learning_rate": 1.0101525136023027e-05, "loss": 0.0228, "step": 299440 }, { "epoch": 1.93, "learning_rate": 1.0091843781666097e-05, "loss": 0.0213, "step": 299450 }, { "epoch": 1.93, "learning_rate": 1.0082162427309164e-05, "loss": 0.0255, "step": 299460 }, { "epoch": 1.93, "learning_rate": 1.007248107295223e-05, "loss": 0.0215, "step": 299470 }, { "epoch": 1.93, "learning_rate": 1.0062799718595299e-05, "loss": 0.0209, "step": 299480 }, { "epoch": 1.93, "learning_rate": 1.0053118364238368e-05, "loss": 0.0244, "step": 299490 }, { "epoch": 1.93, "learning_rate": 1.0043437009881434e-05, "loss": 0.0229, "step": 299500 }, { "epoch": 1.93, "learning_rate": 1.0033755655524502e-05, "loss": 0.0275, "step": 299510 }, { "epoch": 1.93, "learning_rate": 1.002407430116757e-05, "loss": 0.02, "step": 299520 }, { "epoch": 1.93, "learning_rate": 1.001439294681064e-05, "loss": 0.025, "step": 299530 }, { "epoch": 1.93, "learning_rate": 1.0004711592453706e-05, "loss": 0.0264, "step": 299540 }, { "epoch": 1.93, "learning_rate": 9.995030238096774e-06, "loss": 0.0209, "step": 299550 }, { "epoch": 1.93, "learning_rate": 9.985348883739842e-06, "loss": 0.0187, "step": 299560 }, { "epoch": 1.93, "learning_rate": 9.975667529382908e-06, "loss": 0.019, "step": 299570 }, { "epoch": 1.93, "learning_rate": 9.965986175025978e-06, "loss": 0.0196, "step": 299580 }, { "epoch": 1.93, "learning_rate": 9.956304820669046e-06, "loss": 0.0232, "step": 299590 }, { "epoch": 1.93, "learning_rate": 9.946623466312114e-06, "loss": 0.0209, "step": 299600 }, { "epoch": 1.93, "learning_rate": 9.93694211195518e-06, "loss": 0.0211, "step": 299610 }, { "epoch": 1.93, "learning_rate": 9.927260757598248e-06, "loss": 0.0172, "step": 299620 }, { "epoch": 1.93, "learning_rate": 9.917579403241318e-06, "loss": 0.021, "step": 299630 }, { "epoch": 1.93, "learning_rate": 9.907898048884384e-06, "loss": 0.0214, "step": 299640 }, { "epoch": 1.93, "learning_rate": 9.898216694527452e-06, "loss": 0.0213, "step": 299650 }, { "epoch": 1.93, "learning_rate": 9.88853534017052e-06, "loss": 0.0216, "step": 299660 }, { "epoch": 1.93, "learning_rate": 9.87885398581359e-06, "loss": 0.0284, "step": 299670 }, { "epoch": 1.93, "learning_rate": 9.869172631456656e-06, "loss": 0.0238, "step": 299680 }, { "epoch": 1.93, "learning_rate": 9.859491277099724e-06, "loss": 0.0211, "step": 299690 }, { "epoch": 1.93, "learning_rate": 9.849809922742791e-06, "loss": 0.0198, "step": 299700 }, { "epoch": 1.93, "learning_rate": 9.840128568385858e-06, "loss": 0.0171, "step": 299710 }, { "epoch": 1.93, "learning_rate": 9.830447214028927e-06, "loss": 0.0264, "step": 299720 }, { "epoch": 1.93, "learning_rate": 9.820765859671995e-06, "loss": 0.0279, "step": 299730 }, { "epoch": 1.93, "learning_rate": 9.811084505315063e-06, "loss": 0.0213, "step": 299740 }, { "epoch": 1.93, "learning_rate": 9.80140315095813e-06, "loss": 0.0204, "step": 299750 }, { "epoch": 1.93, "learning_rate": 9.791721796601199e-06, "loss": 0.0217, "step": 299760 }, { "epoch": 1.93, "learning_rate": 9.782040442244267e-06, "loss": 0.022, "step": 299770 }, { "epoch": 1.93, "learning_rate": 9.772359087887333e-06, "loss": 0.0297, "step": 299780 }, { "epoch": 1.93, "learning_rate": 9.762677733530401e-06, "loss": 0.0209, "step": 299790 }, { "epoch": 1.93, "learning_rate": 9.75299637917347e-06, "loss": 0.0226, "step": 299800 }, { "epoch": 1.94, "learning_rate": 9.743315024816537e-06, "loss": 0.021, "step": 299810 }, { "epoch": 1.94, "learning_rate": 9.733633670459605e-06, "loss": 0.0204, "step": 299820 }, { "epoch": 1.94, "learning_rate": 9.723952316102673e-06, "loss": 0.0222, "step": 299830 }, { "epoch": 1.94, "learning_rate": 9.714270961745743e-06, "loss": 0.0261, "step": 299840 }, { "epoch": 1.94, "learning_rate": 9.704589607388809e-06, "loss": 0.0181, "step": 299850 }, { "epoch": 1.94, "learning_rate": 9.694908253031877e-06, "loss": 0.0233, "step": 299860 }, { "epoch": 1.94, "learning_rate": 9.685226898674945e-06, "loss": 0.0263, "step": 299870 }, { "epoch": 1.94, "learning_rate": 9.675545544318011e-06, "loss": 0.0203, "step": 299880 }, { "epoch": 1.94, "learning_rate": 9.66586418996108e-06, "loss": 0.0187, "step": 299890 }, { "epoch": 1.94, "learning_rate": 9.656182835604148e-06, "loss": 0.0226, "step": 299900 }, { "epoch": 1.94, "learning_rate": 9.646501481247216e-06, "loss": 0.0194, "step": 299910 }, { "epoch": 1.94, "learning_rate": 9.636820126890283e-06, "loss": 0.0197, "step": 299920 }, { "epoch": 1.94, "learning_rate": 9.62713877253335e-06, "loss": 0.0212, "step": 299930 }, { "epoch": 1.94, "learning_rate": 9.61745741817642e-06, "loss": 0.0205, "step": 299940 }, { "epoch": 1.94, "learning_rate": 9.607776063819486e-06, "loss": 0.0221, "step": 299950 }, { "epoch": 1.94, "learning_rate": 9.598094709462554e-06, "loss": 0.0207, "step": 299960 }, { "epoch": 1.94, "learning_rate": 9.588413355105622e-06, "loss": 0.0157, "step": 299970 }, { "epoch": 1.94, "learning_rate": 9.578732000748692e-06, "loss": 0.0219, "step": 299980 }, { "epoch": 1.94, "learning_rate": 9.569050646391758e-06, "loss": 0.0325, "step": 299990 }, { "epoch": 1.94, "learning_rate": 9.559369292034826e-06, "loss": 0.0175, "step": 300000 }, { "epoch": 1.94, "eval_cer": 0.9198219410236131, "eval_loss": 0.0166050735861063, "eval_runtime": 120.2268, "eval_samples_per_second": 16.635, "eval_steps_per_second": 4.159, "step": 300000 }, { "epoch": 1.94, "learning_rate": 9.549687937677894e-06, "loss": 0.0235, "step": 300010 }, { "epoch": 1.94, "learning_rate": 9.54000658332096e-06, "loss": 0.0249, "step": 300020 }, { "epoch": 1.94, "learning_rate": 9.53032522896403e-06, "loss": 0.022, "step": 300030 }, { "epoch": 1.94, "learning_rate": 9.520643874607098e-06, "loss": 0.0221, "step": 300040 }, { "epoch": 1.94, "learning_rate": 9.510962520250166e-06, "loss": 0.0196, "step": 300050 }, { "epoch": 1.94, "learning_rate": 9.501281165893232e-06, "loss": 0.0206, "step": 300060 }, { "epoch": 1.94, "learning_rate": 9.491599811536302e-06, "loss": 0.0238, "step": 300070 }, { "epoch": 1.94, "learning_rate": 9.48191845717937e-06, "loss": 0.021, "step": 300080 }, { "epoch": 1.94, "learning_rate": 9.472237102822436e-06, "loss": 0.0202, "step": 300090 }, { "epoch": 1.94, "learning_rate": 9.462555748465504e-06, "loss": 0.0199, "step": 300100 }, { "epoch": 1.94, "learning_rate": 9.452874394108573e-06, "loss": 0.0233, "step": 300110 }, { "epoch": 1.94, "learning_rate": 9.443193039751641e-06, "loss": 0.019, "step": 300120 }, { "epoch": 1.94, "learning_rate": 9.433511685394708e-06, "loss": 0.0239, "step": 300130 }, { "epoch": 1.94, "learning_rate": 9.423830331037775e-06, "loss": 0.0219, "step": 300140 }, { "epoch": 1.94, "learning_rate": 9.414148976680845e-06, "loss": 0.0188, "step": 300150 }, { "epoch": 1.94, "learning_rate": 9.404467622323911e-06, "loss": 0.0245, "step": 300160 }, { "epoch": 1.94, "learning_rate": 9.39478626796698e-06, "loss": 0.0241, "step": 300170 }, { "epoch": 1.94, "learning_rate": 9.385104913610047e-06, "loss": 0.0225, "step": 300180 }, { "epoch": 1.94, "learning_rate": 9.375423559253117e-06, "loss": 0.0221, "step": 300190 }, { "epoch": 1.94, "learning_rate": 9.365742204896183e-06, "loss": 0.0216, "step": 300200 }, { "epoch": 1.94, "learning_rate": 9.356060850539251e-06, "loss": 0.0229, "step": 300210 }, { "epoch": 1.94, "learning_rate": 9.346379496182319e-06, "loss": 0.0218, "step": 300220 }, { "epoch": 1.94, "learning_rate": 9.336698141825387e-06, "loss": 0.0259, "step": 300230 }, { "epoch": 1.94, "learning_rate": 9.327016787468455e-06, "loss": 0.0233, "step": 300240 }, { "epoch": 1.94, "learning_rate": 9.317335433111523e-06, "loss": 0.0209, "step": 300250 }, { "epoch": 1.94, "learning_rate": 9.30765407875459e-06, "loss": 0.0232, "step": 300260 }, { "epoch": 1.94, "learning_rate": 9.297972724397657e-06, "loss": 0.0207, "step": 300270 }, { "epoch": 1.94, "learning_rate": 9.288291370040725e-06, "loss": 0.0225, "step": 300280 }, { "epoch": 1.94, "learning_rate": 9.278610015683793e-06, "loss": 0.0227, "step": 300290 }, { "epoch": 1.94, "learning_rate": 9.26892866132686e-06, "loss": 0.0223, "step": 300300 }, { "epoch": 1.94, "learning_rate": 9.259247306969929e-06, "loss": 0.0194, "step": 300310 }, { "epoch": 1.94, "learning_rate": 9.249565952612997e-06, "loss": 0.0244, "step": 300320 }, { "epoch": 1.94, "learning_rate": 9.239884598256064e-06, "loss": 0.02, "step": 300330 }, { "epoch": 1.94, "learning_rate": 9.230203243899132e-06, "loss": 0.0211, "step": 300340 }, { "epoch": 1.94, "learning_rate": 9.2205218895422e-06, "loss": 0.0286, "step": 300350 }, { "epoch": 1.94, "learning_rate": 9.210840535185268e-06, "loss": 0.0202, "step": 300360 }, { "epoch": 1.94, "learning_rate": 9.201159180828336e-06, "loss": 0.0267, "step": 300370 }, { "epoch": 1.94, "learning_rate": 9.191477826471404e-06, "loss": 0.0251, "step": 300380 }, { "epoch": 1.94, "learning_rate": 9.18179647211447e-06, "loss": 0.0234, "step": 300390 }, { "epoch": 1.94, "learning_rate": 9.17211511775754e-06, "loss": 0.0164, "step": 300400 }, { "epoch": 1.94, "learning_rate": 9.162433763400606e-06, "loss": 0.0235, "step": 300410 }, { "epoch": 1.94, "learning_rate": 9.152752409043676e-06, "loss": 0.022, "step": 300420 }, { "epoch": 1.94, "learning_rate": 9.143071054686742e-06, "loss": 0.0216, "step": 300430 }, { "epoch": 1.94, "learning_rate": 9.133389700329812e-06, "loss": 0.0224, "step": 300440 }, { "epoch": 1.94, "learning_rate": 9.123708345972878e-06, "loss": 0.0252, "step": 300450 }, { "epoch": 1.94, "learning_rate": 9.114026991615946e-06, "loss": 0.0243, "step": 300460 }, { "epoch": 1.94, "learning_rate": 9.104345637259014e-06, "loss": 0.0189, "step": 300470 }, { "epoch": 1.94, "learning_rate": 9.094664282902082e-06, "loss": 0.0218, "step": 300480 }, { "epoch": 1.94, "learning_rate": 9.08498292854515e-06, "loss": 0.0277, "step": 300490 }, { "epoch": 1.94, "learning_rate": 9.075301574188218e-06, "loss": 0.0231, "step": 300500 }, { "epoch": 1.94, "learning_rate": 9.065620219831286e-06, "loss": 0.0197, "step": 300510 }, { "epoch": 1.94, "learning_rate": 9.055938865474354e-06, "loss": 0.019, "step": 300520 }, { "epoch": 1.94, "learning_rate": 9.046257511117421e-06, "loss": 0.018, "step": 300530 }, { "epoch": 1.94, "learning_rate": 9.03657615676049e-06, "loss": 0.0211, "step": 300540 }, { "epoch": 1.94, "learning_rate": 9.026894802403557e-06, "loss": 0.0223, "step": 300550 }, { "epoch": 1.94, "learning_rate": 9.017213448046625e-06, "loss": 0.0226, "step": 300560 }, { "epoch": 1.94, "learning_rate": 9.007532093689693e-06, "loss": 0.0251, "step": 300570 }, { "epoch": 1.94, "learning_rate": 8.99785073933276e-06, "loss": 0.021, "step": 300580 }, { "epoch": 1.94, "learning_rate": 8.988169384975829e-06, "loss": 0.0199, "step": 300590 }, { "epoch": 1.94, "learning_rate": 8.978488030618895e-06, "loss": 0.0205, "step": 300600 }, { "epoch": 1.94, "learning_rate": 8.968806676261963e-06, "loss": 0.0211, "step": 300610 }, { "epoch": 1.94, "learning_rate": 8.959125321905031e-06, "loss": 0.0235, "step": 300620 }, { "epoch": 1.94, "learning_rate": 8.949443967548099e-06, "loss": 0.0243, "step": 300630 }, { "epoch": 1.94, "learning_rate": 8.939762613191167e-06, "loss": 0.0227, "step": 300640 }, { "epoch": 1.94, "learning_rate": 8.930081258834235e-06, "loss": 0.02, "step": 300650 }, { "epoch": 1.94, "learning_rate": 8.920399904477303e-06, "loss": 0.0282, "step": 300660 }, { "epoch": 1.94, "learning_rate": 8.91071855012037e-06, "loss": 0.0227, "step": 300670 }, { "epoch": 1.94, "learning_rate": 8.901037195763439e-06, "loss": 0.0221, "step": 300680 }, { "epoch": 1.94, "learning_rate": 8.891355841406507e-06, "loss": 0.018, "step": 300690 }, { "epoch": 1.94, "learning_rate": 8.881674487049575e-06, "loss": 0.0226, "step": 300700 }, { "epoch": 1.94, "learning_rate": 8.871993132692643e-06, "loss": 0.0224, "step": 300710 }, { "epoch": 1.94, "learning_rate": 8.862311778335709e-06, "loss": 0.0217, "step": 300720 }, { "epoch": 1.94, "learning_rate": 8.852630423978778e-06, "loss": 0.0228, "step": 300730 }, { "epoch": 1.94, "learning_rate": 8.842949069621845e-06, "loss": 0.0198, "step": 300740 }, { "epoch": 1.94, "learning_rate": 8.833267715264914e-06, "loss": 0.0189, "step": 300750 }, { "epoch": 1.94, "learning_rate": 8.82358636090798e-06, "loss": 0.0208, "step": 300760 }, { "epoch": 1.94, "learning_rate": 8.813905006551048e-06, "loss": 0.0215, "step": 300770 }, { "epoch": 1.94, "learning_rate": 8.804223652194116e-06, "loss": 0.0198, "step": 300780 }, { "epoch": 1.94, "learning_rate": 8.794542297837184e-06, "loss": 0.026, "step": 300790 }, { "epoch": 1.94, "learning_rate": 8.784860943480252e-06, "loss": 0.0216, "step": 300800 }, { "epoch": 1.94, "learning_rate": 8.77517958912332e-06, "loss": 0.0183, "step": 300810 }, { "epoch": 1.94, "learning_rate": 8.765498234766388e-06, "loss": 0.0227, "step": 300820 }, { "epoch": 1.94, "learning_rate": 8.755816880409456e-06, "loss": 0.0188, "step": 300830 }, { "epoch": 1.94, "learning_rate": 8.746135526052524e-06, "loss": 0.0172, "step": 300840 }, { "epoch": 1.94, "learning_rate": 8.736454171695592e-06, "loss": 0.0198, "step": 300850 }, { "epoch": 1.94, "learning_rate": 8.72677281733866e-06, "loss": 0.0239, "step": 300860 }, { "epoch": 1.94, "learning_rate": 8.717091462981728e-06, "loss": 0.0201, "step": 300870 }, { "epoch": 1.94, "learning_rate": 8.707410108624796e-06, "loss": 0.0209, "step": 300880 }, { "epoch": 1.94, "learning_rate": 8.697728754267864e-06, "loss": 0.0226, "step": 300890 }, { "epoch": 1.94, "learning_rate": 8.688047399910932e-06, "loss": 0.0259, "step": 300900 }, { "epoch": 1.94, "learning_rate": 8.678366045553998e-06, "loss": 0.0199, "step": 300910 }, { "epoch": 1.94, "learning_rate": 8.668684691197067e-06, "loss": 0.02, "step": 300920 }, { "epoch": 1.94, "learning_rate": 8.659003336840134e-06, "loss": 0.0237, "step": 300930 }, { "epoch": 1.94, "learning_rate": 8.649321982483202e-06, "loss": 0.0182, "step": 300940 }, { "epoch": 1.94, "learning_rate": 8.63964062812627e-06, "loss": 0.0203, "step": 300950 }, { "epoch": 1.94, "learning_rate": 8.629959273769338e-06, "loss": 0.0232, "step": 300960 }, { "epoch": 1.94, "learning_rate": 8.620277919412405e-06, "loss": 0.0219, "step": 300970 }, { "epoch": 1.94, "learning_rate": 8.610596565055473e-06, "loss": 0.0239, "step": 300980 }, { "epoch": 1.94, "learning_rate": 8.600915210698541e-06, "loss": 0.0189, "step": 300990 }, { "epoch": 1.94, "learning_rate": 8.59123385634161e-06, "loss": 0.0228, "step": 301000 }, { "epoch": 1.94, "eval_cer": 0.9198273641396453, "eval_loss": 0.016501974314451218, "eval_runtime": 120.1039, "eval_samples_per_second": 16.652, "eval_steps_per_second": 4.163, "step": 301000 }, { "epoch": 1.94, "learning_rate": 8.581552501984677e-06, "loss": 0.0258, "step": 301010 }, { "epoch": 1.94, "learning_rate": 8.571871147627745e-06, "loss": 0.0265, "step": 301020 }, { "epoch": 1.94, "learning_rate": 8.562189793270811e-06, "loss": 0.0176, "step": 301030 }, { "epoch": 1.94, "learning_rate": 8.552508438913881e-06, "loss": 0.0223, "step": 301040 }, { "epoch": 1.94, "learning_rate": 8.542827084556947e-06, "loss": 0.0191, "step": 301050 }, { "epoch": 1.94, "learning_rate": 8.533145730200017e-06, "loss": 0.0207, "step": 301060 }, { "epoch": 1.94, "learning_rate": 8.523464375843083e-06, "loss": 0.0229, "step": 301070 }, { "epoch": 1.94, "learning_rate": 8.513783021486153e-06, "loss": 0.0203, "step": 301080 }, { "epoch": 1.94, "learning_rate": 8.504101667129219e-06, "loss": 0.0241, "step": 301090 }, { "epoch": 1.94, "learning_rate": 8.494420312772287e-06, "loss": 0.0182, "step": 301100 }, { "epoch": 1.94, "learning_rate": 8.484738958415355e-06, "loss": 0.023, "step": 301110 }, { "epoch": 1.94, "learning_rate": 8.475057604058423e-06, "loss": 0.0234, "step": 301120 }, { "epoch": 1.94, "learning_rate": 8.46537624970149e-06, "loss": 0.0217, "step": 301130 }, { "epoch": 1.94, "learning_rate": 8.455694895344559e-06, "loss": 0.0247, "step": 301140 }, { "epoch": 1.94, "learning_rate": 8.446013540987627e-06, "loss": 0.0193, "step": 301150 }, { "epoch": 1.94, "learning_rate": 8.436332186630694e-06, "loss": 0.0227, "step": 301160 }, { "epoch": 1.94, "learning_rate": 8.426650832273762e-06, "loss": 0.0252, "step": 301170 }, { "epoch": 1.94, "learning_rate": 8.41696947791683e-06, "loss": 0.0224, "step": 301180 }, { "epoch": 1.94, "learning_rate": 8.407288123559898e-06, "loss": 0.0198, "step": 301190 }, { "epoch": 1.94, "learning_rate": 8.397606769202966e-06, "loss": 0.02, "step": 301200 }, { "epoch": 1.94, "learning_rate": 8.387925414846034e-06, "loss": 0.0231, "step": 301210 }, { "epoch": 1.94, "learning_rate": 8.3782440604891e-06, "loss": 0.0193, "step": 301220 }, { "epoch": 1.94, "learning_rate": 8.36856270613217e-06, "loss": 0.0238, "step": 301230 }, { "epoch": 1.94, "learning_rate": 8.358881351775236e-06, "loss": 0.0221, "step": 301240 }, { "epoch": 1.94, "learning_rate": 8.349199997418306e-06, "loss": 0.0231, "step": 301250 }, { "epoch": 1.94, "learning_rate": 8.339518643061372e-06, "loss": 0.0173, "step": 301260 }, { "epoch": 1.94, "learning_rate": 8.32983728870444e-06, "loss": 0.0232, "step": 301270 }, { "epoch": 1.94, "learning_rate": 8.320155934347508e-06, "loss": 0.0226, "step": 301280 }, { "epoch": 1.94, "learning_rate": 8.310474579990576e-06, "loss": 0.0244, "step": 301290 }, { "epoch": 1.94, "learning_rate": 8.300793225633644e-06, "loss": 0.0197, "step": 301300 }, { "epoch": 1.94, "learning_rate": 8.291111871276712e-06, "loss": 0.0222, "step": 301310 }, { "epoch": 1.94, "learning_rate": 8.28143051691978e-06, "loss": 0.0229, "step": 301320 }, { "epoch": 1.94, "learning_rate": 8.271749162562848e-06, "loss": 0.0195, "step": 301330 }, { "epoch": 1.94, "learning_rate": 8.262067808205916e-06, "loss": 0.0209, "step": 301340 }, { "epoch": 1.94, "learning_rate": 8.252386453848984e-06, "loss": 0.0215, "step": 301350 }, { "epoch": 1.95, "learning_rate": 8.24270509949205e-06, "loss": 0.0286, "step": 301360 }, { "epoch": 1.95, "learning_rate": 8.23302374513512e-06, "loss": 0.0278, "step": 301370 }, { "epoch": 1.95, "learning_rate": 8.223342390778186e-06, "loss": 0.026, "step": 301380 }, { "epoch": 1.95, "learning_rate": 8.213661036421255e-06, "loss": 0.0212, "step": 301390 }, { "epoch": 1.95, "learning_rate": 8.203979682064321e-06, "loss": 0.0235, "step": 301400 }, { "epoch": 1.95, "learning_rate": 8.19429832770739e-06, "loss": 0.0252, "step": 301410 }, { "epoch": 1.95, "learning_rate": 8.184616973350457e-06, "loss": 0.022, "step": 301420 }, { "epoch": 1.95, "learning_rate": 8.174935618993525e-06, "loss": 0.02, "step": 301430 }, { "epoch": 1.95, "learning_rate": 8.165254264636593e-06, "loss": 0.0219, "step": 301440 }, { "epoch": 1.95, "learning_rate": 8.155572910279661e-06, "loss": 0.0277, "step": 301450 }, { "epoch": 1.95, "learning_rate": 8.145891555922729e-06, "loss": 0.0205, "step": 301460 }, { "epoch": 1.95, "learning_rate": 8.136210201565797e-06, "loss": 0.0184, "step": 301470 }, { "epoch": 1.95, "learning_rate": 8.126528847208865e-06, "loss": 0.02, "step": 301480 }, { "epoch": 1.95, "learning_rate": 8.116847492851933e-06, "loss": 0.0276, "step": 301490 }, { "epoch": 1.95, "learning_rate": 8.107166138495e-06, "loss": 0.0236, "step": 301500 }, { "epoch": 1.95, "learning_rate": 8.097484784138069e-06, "loss": 0.0206, "step": 301510 }, { "epoch": 1.95, "learning_rate": 8.087803429781137e-06, "loss": 0.024, "step": 301520 }, { "epoch": 1.95, "learning_rate": 8.078122075424205e-06, "loss": 0.0234, "step": 301530 }, { "epoch": 1.95, "learning_rate": 8.068440721067273e-06, "loss": 0.0227, "step": 301540 }, { "epoch": 1.95, "learning_rate": 8.058759366710339e-06, "loss": 0.0225, "step": 301550 }, { "epoch": 1.95, "learning_rate": 8.049078012353408e-06, "loss": 0.023, "step": 301560 }, { "epoch": 1.95, "learning_rate": 8.039396657996475e-06, "loss": 0.0216, "step": 301570 }, { "epoch": 1.95, "learning_rate": 8.029715303639544e-06, "loss": 0.0222, "step": 301580 }, { "epoch": 1.95, "learning_rate": 8.02003394928261e-06, "loss": 0.0238, "step": 301590 }, { "epoch": 1.95, "learning_rate": 8.010352594925678e-06, "loss": 0.0198, "step": 301600 }, { "epoch": 1.95, "learning_rate": 8.000671240568746e-06, "loss": 0.0249, "step": 301610 }, { "epoch": 1.95, "learning_rate": 7.990989886211814e-06, "loss": 0.023, "step": 301620 }, { "epoch": 1.95, "learning_rate": 7.981308531854882e-06, "loss": 0.0211, "step": 301630 }, { "epoch": 1.95, "learning_rate": 7.97162717749795e-06, "loss": 0.0187, "step": 301640 }, { "epoch": 1.95, "learning_rate": 7.961945823141018e-06, "loss": 0.0206, "step": 301650 }, { "epoch": 1.95, "learning_rate": 7.952264468784086e-06, "loss": 0.02, "step": 301660 }, { "epoch": 1.95, "learning_rate": 7.942583114427152e-06, "loss": 0.0293, "step": 301670 }, { "epoch": 1.95, "learning_rate": 7.932901760070222e-06, "loss": 0.0278, "step": 301680 }, { "epoch": 1.95, "learning_rate": 7.923220405713288e-06, "loss": 0.021, "step": 301690 }, { "epoch": 1.95, "learning_rate": 7.913539051356358e-06, "loss": 0.0225, "step": 301700 }, { "epoch": 1.95, "learning_rate": 7.903857696999424e-06, "loss": 0.0301, "step": 301710 }, { "epoch": 1.95, "learning_rate": 7.894176342642494e-06, "loss": 0.0218, "step": 301720 }, { "epoch": 1.95, "learning_rate": 7.88449498828556e-06, "loss": 0.0186, "step": 301730 }, { "epoch": 1.95, "learning_rate": 7.874813633928628e-06, "loss": 0.0204, "step": 301740 }, { "epoch": 1.95, "learning_rate": 7.865132279571696e-06, "loss": 0.0202, "step": 301750 }, { "epoch": 1.95, "learning_rate": 7.855450925214764e-06, "loss": 0.0221, "step": 301760 }, { "epoch": 1.95, "learning_rate": 7.845769570857832e-06, "loss": 0.0236, "step": 301770 }, { "epoch": 1.95, "learning_rate": 7.8360882165009e-06, "loss": 0.0242, "step": 301780 }, { "epoch": 1.95, "learning_rate": 7.826406862143967e-06, "loss": 0.02, "step": 301790 }, { "epoch": 1.95, "learning_rate": 7.816725507787035e-06, "loss": 0.0223, "step": 301800 }, { "epoch": 1.95, "learning_rate": 7.807044153430103e-06, "loss": 0.0202, "step": 301810 }, { "epoch": 1.95, "learning_rate": 7.797362799073171e-06, "loss": 0.0218, "step": 301820 }, { "epoch": 1.95, "learning_rate": 7.78768144471624e-06, "loss": 0.0189, "step": 301830 }, { "epoch": 1.95, "learning_rate": 7.778000090359307e-06, "loss": 0.0213, "step": 301840 }, { "epoch": 1.95, "learning_rate": 7.768318736002375e-06, "loss": 0.0206, "step": 301850 }, { "epoch": 1.95, "learning_rate": 7.758637381645441e-06, "loss": 0.021, "step": 301860 }, { "epoch": 1.95, "learning_rate": 7.748956027288511e-06, "loss": 0.0247, "step": 301870 }, { "epoch": 1.95, "learning_rate": 7.739274672931577e-06, "loss": 0.0215, "step": 301880 }, { "epoch": 1.95, "learning_rate": 7.729593318574647e-06, "loss": 0.0201, "step": 301890 }, { "epoch": 1.95, "learning_rate": 7.719911964217713e-06, "loss": 0.02, "step": 301900 }, { "epoch": 1.95, "learning_rate": 7.710230609860783e-06, "loss": 0.0268, "step": 301910 }, { "epoch": 1.95, "learning_rate": 7.700549255503849e-06, "loss": 0.0201, "step": 301920 }, { "epoch": 1.95, "learning_rate": 7.690867901146917e-06, "loss": 0.0227, "step": 301930 }, { "epoch": 1.95, "learning_rate": 7.681186546789985e-06, "loss": 0.0288, "step": 301940 }, { "epoch": 1.95, "learning_rate": 7.671505192433053e-06, "loss": 0.0219, "step": 301950 }, { "epoch": 1.95, "learning_rate": 7.66182383807612e-06, "loss": 0.0248, "step": 301960 }, { "epoch": 1.95, "learning_rate": 7.652142483719189e-06, "loss": 0.0197, "step": 301970 }, { "epoch": 1.95, "learning_rate": 7.642461129362257e-06, "loss": 0.02, "step": 301980 }, { "epoch": 1.95, "learning_rate": 7.632779775005324e-06, "loss": 0.0198, "step": 301990 }, { "epoch": 1.95, "learning_rate": 7.6230984206483915e-06, "loss": 0.019, "step": 302000 }, { "epoch": 1.95, "eval_cer": 0.9198327872556773, "eval_loss": 0.016491882503032684, "eval_runtime": 120.5919, "eval_samples_per_second": 16.585, "eval_steps_per_second": 4.146, "step": 302000 }, { "epoch": 1.95, "learning_rate": 7.61341706629146e-06, "loss": 0.0247, "step": 302010 }, { "epoch": 1.95, "learning_rate": 7.603735711934527e-06, "loss": 0.0204, "step": 302020 }, { "epoch": 1.95, "learning_rate": 7.594054357577595e-06, "loss": 0.0265, "step": 302030 }, { "epoch": 1.95, "learning_rate": 7.584373003220663e-06, "loss": 0.0241, "step": 302040 }, { "epoch": 1.95, "learning_rate": 7.57469164886373e-06, "loss": 0.0178, "step": 302050 }, { "epoch": 1.95, "learning_rate": 7.565010294506799e-06, "loss": 0.0224, "step": 302060 }, { "epoch": 1.95, "learning_rate": 7.555328940149866e-06, "loss": 0.0218, "step": 302070 }, { "epoch": 1.95, "learning_rate": 7.545647585792935e-06, "loss": 0.0254, "step": 302080 }, { "epoch": 1.95, "learning_rate": 7.535966231436002e-06, "loss": 0.0221, "step": 302090 }, { "epoch": 1.95, "learning_rate": 7.526284877079071e-06, "loss": 0.0216, "step": 302100 }, { "epoch": 1.95, "learning_rate": 7.516603522722138e-06, "loss": 0.0237, "step": 302110 }, { "epoch": 1.95, "learning_rate": 7.506922168365205e-06, "loss": 0.0195, "step": 302120 }, { "epoch": 1.95, "learning_rate": 7.497240814008274e-06, "loss": 0.0225, "step": 302130 }, { "epoch": 1.95, "learning_rate": 7.487559459651341e-06, "loss": 0.024, "step": 302140 }, { "epoch": 1.95, "learning_rate": 7.47787810529441e-06, "loss": 0.0201, "step": 302150 }, { "epoch": 1.95, "learning_rate": 7.468196750937477e-06, "loss": 0.0201, "step": 302160 }, { "epoch": 1.95, "learning_rate": 7.4585153965805456e-06, "loss": 0.0238, "step": 302170 }, { "epoch": 1.95, "learning_rate": 7.448834042223613e-06, "loss": 0.0229, "step": 302180 }, { "epoch": 1.95, "learning_rate": 7.439152687866681e-06, "loss": 0.0205, "step": 302190 }, { "epoch": 1.95, "learning_rate": 7.4294713335097485e-06, "loss": 0.024, "step": 302200 }, { "epoch": 1.95, "learning_rate": 7.4197899791528164e-06, "loss": 0.0164, "step": 302210 }, { "epoch": 1.95, "learning_rate": 7.410108624795884e-06, "loss": 0.0188, "step": 302220 }, { "epoch": 1.95, "learning_rate": 7.4004272704389515e-06, "loss": 0.0207, "step": 302230 }, { "epoch": 1.95, "learning_rate": 7.390745916082019e-06, "loss": 0.0199, "step": 302240 }, { "epoch": 1.95, "learning_rate": 7.381064561725087e-06, "loss": 0.0204, "step": 302250 }, { "epoch": 1.95, "learning_rate": 7.371383207368155e-06, "loss": 0.0192, "step": 302260 }, { "epoch": 1.95, "learning_rate": 7.361701853011223e-06, "loss": 0.0264, "step": 302270 }, { "epoch": 1.95, "learning_rate": 7.352020498654291e-06, "loss": 0.022, "step": 302280 }, { "epoch": 1.95, "learning_rate": 7.342339144297359e-06, "loss": 0.0201, "step": 302290 }, { "epoch": 1.95, "learning_rate": 7.332657789940427e-06, "loss": 0.0184, "step": 302300 }, { "epoch": 1.95, "learning_rate": 7.322976435583494e-06, "loss": 0.0199, "step": 302310 }, { "epoch": 1.95, "learning_rate": 7.313295081226563e-06, "loss": 0.0244, "step": 302320 }, { "epoch": 1.95, "learning_rate": 7.30361372686963e-06, "loss": 0.0236, "step": 302330 }, { "epoch": 1.95, "learning_rate": 7.293932372512699e-06, "loss": 0.0209, "step": 302340 }, { "epoch": 1.95, "learning_rate": 7.284251018155766e-06, "loss": 0.0242, "step": 302350 }, { "epoch": 1.95, "learning_rate": 7.274569663798835e-06, "loss": 0.0245, "step": 302360 }, { "epoch": 1.95, "learning_rate": 7.264888309441902e-06, "loss": 0.0243, "step": 302370 }, { "epoch": 1.95, "learning_rate": 7.255206955084969e-06, "loss": 0.0235, "step": 302380 }, { "epoch": 1.95, "learning_rate": 7.2455256007280376e-06, "loss": 0.0237, "step": 302390 }, { "epoch": 1.95, "learning_rate": 7.235844246371105e-06, "loss": 0.0198, "step": 302400 }, { "epoch": 1.95, "learning_rate": 7.226162892014173e-06, "loss": 0.0282, "step": 302410 }, { "epoch": 1.95, "learning_rate": 7.2164815376572405e-06, "loss": 0.0246, "step": 302420 }, { "epoch": 1.95, "learning_rate": 7.206800183300309e-06, "loss": 0.0172, "step": 302430 }, { "epoch": 1.95, "learning_rate": 7.197118828943376e-06, "loss": 0.0215, "step": 302440 }, { "epoch": 1.95, "learning_rate": 7.1874374745864435e-06, "loss": 0.0207, "step": 302450 }, { "epoch": 1.95, "learning_rate": 7.177756120229512e-06, "loss": 0.0261, "step": 302460 }, { "epoch": 1.95, "learning_rate": 7.168074765872579e-06, "loss": 0.0179, "step": 302470 }, { "epoch": 1.95, "learning_rate": 7.158393411515648e-06, "loss": 0.0204, "step": 302480 }, { "epoch": 1.95, "learning_rate": 7.148712057158715e-06, "loss": 0.0267, "step": 302490 }, { "epoch": 1.95, "learning_rate": 7.139030702801783e-06, "loss": 0.0243, "step": 302500 }, { "epoch": 1.95, "learning_rate": 7.129349348444851e-06, "loss": 0.0241, "step": 302510 }, { "epoch": 1.95, "learning_rate": 7.119667994087919e-06, "loss": 0.022, "step": 302520 }, { "epoch": 1.95, "learning_rate": 7.109986639730987e-06, "loss": 0.0191, "step": 302530 }, { "epoch": 1.95, "learning_rate": 7.100305285374055e-06, "loss": 0.0237, "step": 302540 }, { "epoch": 1.95, "learning_rate": 7.090623931017123e-06, "loss": 0.0198, "step": 302550 }, { "epoch": 1.95, "learning_rate": 7.08094257666019e-06, "loss": 0.0222, "step": 302560 }, { "epoch": 1.95, "learning_rate": 7.071261222303258e-06, "loss": 0.0221, "step": 302570 }, { "epoch": 1.95, "learning_rate": 7.061579867946326e-06, "loss": 0.0268, "step": 302580 }, { "epoch": 1.95, "learning_rate": 7.051898513589394e-06, "loss": 0.0268, "step": 302590 }, { "epoch": 1.95, "learning_rate": 7.042217159232462e-06, "loss": 0.0207, "step": 302600 }, { "epoch": 1.95, "learning_rate": 7.0325358048755295e-06, "loss": 0.0163, "step": 302610 }, { "epoch": 1.95, "learning_rate": 7.0228544505185975e-06, "loss": 0.021, "step": 302620 }, { "epoch": 1.95, "learning_rate": 7.013173096161665e-06, "loss": 0.0189, "step": 302630 }, { "epoch": 1.95, "learning_rate": 7.0034917418047325e-06, "loss": 0.0187, "step": 302640 }, { "epoch": 1.95, "learning_rate": 6.993810387447801e-06, "loss": 0.0184, "step": 302650 }, { "epoch": 1.95, "learning_rate": 6.984129033090868e-06, "loss": 0.0207, "step": 302660 }, { "epoch": 1.95, "learning_rate": 6.974447678733937e-06, "loss": 0.0177, "step": 302670 }, { "epoch": 1.95, "learning_rate": 6.964766324377004e-06, "loss": 0.0195, "step": 302680 }, { "epoch": 1.95, "learning_rate": 6.955084970020071e-06, "loss": 0.0225, "step": 302690 }, { "epoch": 1.95, "learning_rate": 6.94540361566314e-06, "loss": 0.0173, "step": 302700 }, { "epoch": 1.95, "learning_rate": 6.935722261306207e-06, "loss": 0.0202, "step": 302710 }, { "epoch": 1.95, "learning_rate": 6.926040906949276e-06, "loss": 0.0231, "step": 302720 }, { "epoch": 1.95, "learning_rate": 6.916359552592343e-06, "loss": 0.0256, "step": 302730 }, { "epoch": 1.95, "learning_rate": 6.906678198235412e-06, "loss": 0.0205, "step": 302740 }, { "epoch": 1.95, "learning_rate": 6.896996843878479e-06, "loss": 0.0243, "step": 302750 }, { "epoch": 1.95, "learning_rate": 6.887315489521546e-06, "loss": 0.02, "step": 302760 }, { "epoch": 1.95, "learning_rate": 6.877634135164615e-06, "loss": 0.0161, "step": 302770 }, { "epoch": 1.95, "learning_rate": 6.867952780807682e-06, "loss": 0.0255, "step": 302780 }, { "epoch": 1.95, "learning_rate": 6.858271426450751e-06, "loss": 0.0215, "step": 302790 }, { "epoch": 1.95, "learning_rate": 6.848590072093818e-06, "loss": 0.0246, "step": 302800 }, { "epoch": 1.95, "learning_rate": 6.8389087177368865e-06, "loss": 0.0211, "step": 302810 }, { "epoch": 1.95, "learning_rate": 6.829227363379954e-06, "loss": 0.0218, "step": 302820 }, { "epoch": 1.95, "learning_rate": 6.8195460090230215e-06, "loss": 0.0247, "step": 302830 }, { "epoch": 1.95, "learning_rate": 6.8098646546660895e-06, "loss": 0.0232, "step": 302840 }, { "epoch": 1.95, "learning_rate": 6.800183300309157e-06, "loss": 0.0195, "step": 302850 }, { "epoch": 1.95, "learning_rate": 6.790501945952225e-06, "loss": 0.0236, "step": 302860 }, { "epoch": 1.95, "learning_rate": 6.780820591595293e-06, "loss": 0.021, "step": 302870 }, { "epoch": 1.95, "learning_rate": 6.771139237238361e-06, "loss": 0.0208, "step": 302880 }, { "epoch": 1.95, "learning_rate": 6.761457882881429e-06, "loss": 0.0209, "step": 302890 }, { "epoch": 1.95, "learning_rate": 6.751776528524496e-06, "loss": 0.0222, "step": 302900 }, { "epoch": 1.96, "learning_rate": 6.742095174167564e-06, "loss": 0.0233, "step": 302910 }, { "epoch": 1.96, "learning_rate": 6.732413819810632e-06, "loss": 0.023, "step": 302920 }, { "epoch": 1.96, "learning_rate": 6.7227324654537e-06, "loss": 0.0239, "step": 302930 }, { "epoch": 1.96, "learning_rate": 6.713051111096768e-06, "loss": 0.0314, "step": 302940 }, { "epoch": 1.96, "learning_rate": 6.703369756739835e-06, "loss": 0.0205, "step": 302950 }, { "epoch": 1.96, "learning_rate": 6.693688402382904e-06, "loss": 0.023, "step": 302960 }, { "epoch": 1.96, "learning_rate": 6.684007048025971e-06, "loss": 0.0217, "step": 302970 }, { "epoch": 1.96, "learning_rate": 6.67432569366904e-06, "loss": 0.025, "step": 302980 }, { "epoch": 1.96, "learning_rate": 6.664644339312107e-06, "loss": 0.02, "step": 302990 }, { "epoch": 1.96, "learning_rate": 6.6549629849551756e-06, "loss": 0.0191, "step": 303000 }, { "epoch": 1.96, "eval_cer": 0.9198228448762852, "eval_loss": 0.016516968607902527, "eval_runtime": 120.4114, "eval_samples_per_second": 16.61, "eval_steps_per_second": 4.152, "step": 303000 }, { "epoch": 1.96, "learning_rate": 6.645281630598243e-06, "loss": 0.0222, "step": 303010 }, { "epoch": 1.96, "learning_rate": 6.63560027624131e-06, "loss": 0.025, "step": 303020 }, { "epoch": 1.96, "learning_rate": 6.6259189218843785e-06, "loss": 0.034, "step": 303030 }, { "epoch": 1.96, "learning_rate": 6.616237567527446e-06, "loss": 0.0218, "step": 303040 }, { "epoch": 1.96, "learning_rate": 6.606556213170514e-06, "loss": 0.0288, "step": 303050 }, { "epoch": 1.96, "learning_rate": 6.5968748588135815e-06, "loss": 0.0241, "step": 303060 }, { "epoch": 1.96, "learning_rate": 6.58719350445665e-06, "loss": 0.0191, "step": 303070 }, { "epoch": 1.96, "learning_rate": 6.577512150099717e-06, "loss": 0.0217, "step": 303080 }, { "epoch": 1.96, "learning_rate": 6.567830795742784e-06, "loss": 0.0176, "step": 303090 }, { "epoch": 1.96, "learning_rate": 6.558149441385853e-06, "loss": 0.027, "step": 303100 }, { "epoch": 1.96, "learning_rate": 6.54846808702892e-06, "loss": 0.0202, "step": 303110 }, { "epoch": 1.96, "learning_rate": 6.538786732671989e-06, "loss": 0.0166, "step": 303120 }, { "epoch": 1.96, "learning_rate": 6.529105378315056e-06, "loss": 0.0187, "step": 303130 }, { "epoch": 1.96, "learning_rate": 6.519424023958124e-06, "loss": 0.0176, "step": 303140 }, { "epoch": 1.96, "learning_rate": 6.509742669601192e-06, "loss": 0.0235, "step": 303150 }, { "epoch": 1.96, "learning_rate": 6.50006131524426e-06, "loss": 0.0218, "step": 303160 }, { "epoch": 1.96, "learning_rate": 6.490379960887328e-06, "loss": 0.0236, "step": 303170 }, { "epoch": 1.96, "learning_rate": 6.480698606530396e-06, "loss": 0.0216, "step": 303180 }, { "epoch": 1.96, "learning_rate": 6.471017252173464e-06, "loss": 0.0253, "step": 303190 }, { "epoch": 1.96, "learning_rate": 6.461335897816532e-06, "loss": 0.0214, "step": 303200 }, { "epoch": 1.96, "learning_rate": 6.451654543459599e-06, "loss": 0.024, "step": 303210 }, { "epoch": 1.96, "learning_rate": 6.4419731891026675e-06, "loss": 0.0214, "step": 303220 }, { "epoch": 1.96, "learning_rate": 6.432291834745735e-06, "loss": 0.024, "step": 303230 }, { "epoch": 1.96, "learning_rate": 6.4226104803888026e-06, "loss": 0.0227, "step": 303240 }, { "epoch": 1.96, "learning_rate": 6.4129291260318705e-06, "loss": 0.0268, "step": 303250 }, { "epoch": 1.96, "learning_rate": 6.4032477716749384e-06, "loss": 0.0191, "step": 303260 }, { "epoch": 1.96, "learning_rate": 6.393566417318006e-06, "loss": 0.0225, "step": 303270 }, { "epoch": 1.96, "learning_rate": 6.3838850629610734e-06, "loss": 0.0178, "step": 303280 }, { "epoch": 1.96, "learning_rate": 6.374203708604142e-06, "loss": 0.0193, "step": 303290 }, { "epoch": 1.96, "learning_rate": 6.364522354247209e-06, "loss": 0.023, "step": 303300 }, { "epoch": 1.96, "learning_rate": 6.354840999890278e-06, "loss": 0.0214, "step": 303310 }, { "epoch": 1.96, "learning_rate": 6.345159645533345e-06, "loss": 0.0218, "step": 303320 }, { "epoch": 1.96, "learning_rate": 6.335478291176412e-06, "loss": 0.0203, "step": 303330 }, { "epoch": 1.96, "learning_rate": 6.325796936819481e-06, "loss": 0.0205, "step": 303340 }, { "epoch": 1.96, "learning_rate": 6.316115582462548e-06, "loss": 0.0198, "step": 303350 }, { "epoch": 1.96, "learning_rate": 6.306434228105617e-06, "loss": 0.0274, "step": 303360 }, { "epoch": 1.96, "learning_rate": 6.296752873748684e-06, "loss": 0.0236, "step": 303370 }, { "epoch": 1.96, "learning_rate": 6.287071519391753e-06, "loss": 0.0258, "step": 303380 }, { "epoch": 1.96, "learning_rate": 6.27739016503482e-06, "loss": 0.0202, "step": 303390 }, { "epoch": 1.96, "learning_rate": 6.267708810677888e-06, "loss": 0.0242, "step": 303400 }, { "epoch": 1.96, "learning_rate": 6.258027456320956e-06, "loss": 0.0212, "step": 303410 }, { "epoch": 1.96, "learning_rate": 6.248346101964024e-06, "loss": 0.0197, "step": 303420 }, { "epoch": 1.96, "learning_rate": 6.238664747607092e-06, "loss": 0.021, "step": 303430 }, { "epoch": 1.96, "learning_rate": 6.228983393250159e-06, "loss": 0.0248, "step": 303440 }, { "epoch": 1.96, "learning_rate": 6.2193020388932275e-06, "loss": 0.0218, "step": 303450 }, { "epoch": 1.96, "learning_rate": 6.2096206845362945e-06, "loss": 0.0252, "step": 303460 }, { "epoch": 1.96, "learning_rate": 6.1999393301793625e-06, "loss": 0.022, "step": 303470 }, { "epoch": 1.96, "learning_rate": 6.19025797582243e-06, "loss": 0.0276, "step": 303480 }, { "epoch": 1.96, "learning_rate": 6.180576621465498e-06, "loss": 0.0211, "step": 303490 }, { "epoch": 1.96, "learning_rate": 6.170895267108566e-06, "loss": 0.0256, "step": 303500 }, { "epoch": 1.96, "learning_rate": 6.161213912751634e-06, "loss": 0.0204, "step": 303510 }, { "epoch": 1.96, "learning_rate": 6.151532558394702e-06, "loss": 0.021, "step": 303520 }, { "epoch": 1.96, "learning_rate": 6.14185120403777e-06, "loss": 0.0205, "step": 303530 }, { "epoch": 1.96, "learning_rate": 6.132169849680837e-06, "loss": 0.0233, "step": 303540 }, { "epoch": 1.96, "learning_rate": 6.122488495323906e-06, "loss": 0.0206, "step": 303550 }, { "epoch": 1.96, "learning_rate": 6.112807140966973e-06, "loss": 0.0201, "step": 303560 }, { "epoch": 1.96, "learning_rate": 6.103125786610041e-06, "loss": 0.0208, "step": 303570 }, { "epoch": 1.96, "learning_rate": 6.093444432253109e-06, "loss": 0.0183, "step": 303580 }, { "epoch": 1.96, "learning_rate": 6.083763077896176e-06, "loss": 0.0182, "step": 303590 }, { "epoch": 1.96, "learning_rate": 6.074081723539245e-06, "loss": 0.0176, "step": 303600 }, { "epoch": 1.96, "learning_rate": 6.064400369182312e-06, "loss": 0.0217, "step": 303610 }, { "epoch": 1.96, "learning_rate": 6.054719014825381e-06, "loss": 0.0189, "step": 303620 }, { "epoch": 1.96, "learning_rate": 6.045037660468448e-06, "loss": 0.0229, "step": 303630 }, { "epoch": 1.96, "learning_rate": 6.0353563061115165e-06, "loss": 0.0174, "step": 303640 }, { "epoch": 1.96, "learning_rate": 6.025674951754584e-06, "loss": 0.0206, "step": 303650 }, { "epoch": 1.96, "learning_rate": 6.015993597397651e-06, "loss": 0.0273, "step": 303660 }, { "epoch": 1.96, "learning_rate": 6.0063122430407195e-06, "loss": 0.0256, "step": 303670 }, { "epoch": 1.96, "learning_rate": 5.9966308886837865e-06, "loss": 0.0212, "step": 303680 }, { "epoch": 1.96, "learning_rate": 5.986949534326855e-06, "loss": 0.0185, "step": 303690 }, { "epoch": 1.96, "learning_rate": 5.977268179969922e-06, "loss": 0.0193, "step": 303700 }, { "epoch": 1.96, "learning_rate": 5.967586825612991e-06, "loss": 0.0241, "step": 303710 }, { "epoch": 1.96, "learning_rate": 5.957905471256058e-06, "loss": 0.0212, "step": 303720 }, { "epoch": 1.96, "learning_rate": 5.948224116899126e-06, "loss": 0.0203, "step": 303730 }, { "epoch": 1.96, "learning_rate": 5.938542762542194e-06, "loss": 0.0233, "step": 303740 }, { "epoch": 1.96, "learning_rate": 5.928861408185262e-06, "loss": 0.0252, "step": 303750 }, { "epoch": 1.96, "learning_rate": 5.91918005382833e-06, "loss": 0.0242, "step": 303760 }, { "epoch": 1.96, "learning_rate": 5.909498699471397e-06, "loss": 0.0236, "step": 303770 }, { "epoch": 1.96, "learning_rate": 5.899817345114465e-06, "loss": 0.0233, "step": 303780 }, { "epoch": 1.96, "learning_rate": 5.890135990757533e-06, "loss": 0.0187, "step": 303790 }, { "epoch": 1.96, "learning_rate": 5.880454636400601e-06, "loss": 0.0211, "step": 303800 }, { "epoch": 1.96, "learning_rate": 5.870773282043669e-06, "loss": 0.0237, "step": 303810 }, { "epoch": 1.96, "learning_rate": 5.861091927686737e-06, "loss": 0.0189, "step": 303820 }, { "epoch": 1.96, "learning_rate": 5.851410573329805e-06, "loss": 0.026, "step": 303830 }, { "epoch": 1.96, "learning_rate": 5.841729218972873e-06, "loss": 0.0194, "step": 303840 }, { "epoch": 1.96, "learning_rate": 5.83204786461594e-06, "loss": 0.0207, "step": 303850 }, { "epoch": 1.96, "learning_rate": 5.8223665102590085e-06, "loss": 0.0189, "step": 303860 }, { "epoch": 1.96, "learning_rate": 5.8126851559020756e-06, "loss": 0.0202, "step": 303870 }, { "epoch": 1.96, "learning_rate": 5.803003801545144e-06, "loss": 0.0174, "step": 303880 }, { "epoch": 1.96, "learning_rate": 5.7933224471882114e-06, "loss": 0.0226, "step": 303890 }, { "epoch": 1.96, "learning_rate": 5.783641092831279e-06, "loss": 0.0239, "step": 303900 }, { "epoch": 1.96, "learning_rate": 5.773959738474347e-06, "loss": 0.0195, "step": 303910 }, { "epoch": 1.96, "learning_rate": 5.764278384117414e-06, "loss": 0.0191, "step": 303920 }, { "epoch": 1.96, "learning_rate": 5.754597029760483e-06, "loss": 0.0192, "step": 303930 }, { "epoch": 1.96, "learning_rate": 5.74491567540355e-06, "loss": 0.0177, "step": 303940 }, { "epoch": 1.96, "learning_rate": 5.735234321046619e-06, "loss": 0.0204, "step": 303950 }, { "epoch": 1.96, "learning_rate": 5.725552966689686e-06, "loss": 0.0253, "step": 303960 }, { "epoch": 1.96, "learning_rate": 5.715871612332753e-06, "loss": 0.0227, "step": 303970 }, { "epoch": 1.96, "learning_rate": 5.706190257975822e-06, "loss": 0.0195, "step": 303980 }, { "epoch": 1.96, "learning_rate": 5.696508903618889e-06, "loss": 0.0247, "step": 303990 }, { "epoch": 1.96, "learning_rate": 5.686827549261958e-06, "loss": 0.0249, "step": 304000 }, { "epoch": 1.96, "eval_cer": 0.9197939215907807, "eval_loss": 0.016484426334500313, "eval_runtime": 120.4979, "eval_samples_per_second": 16.598, "eval_steps_per_second": 4.149, "step": 304000 }, { "epoch": 1.96, "learning_rate": 5.677146194905025e-06, "loss": 0.0266, "step": 304010 }, { "epoch": 1.96, "learning_rate": 5.667464840548094e-06, "loss": 0.026, "step": 304020 }, { "epoch": 1.96, "learning_rate": 5.657783486191161e-06, "loss": 0.0257, "step": 304030 }, { "epoch": 1.96, "learning_rate": 5.648102131834229e-06, "loss": 0.0213, "step": 304040 }, { "epoch": 1.96, "learning_rate": 5.638420777477297e-06, "loss": 0.0222, "step": 304050 }, { "epoch": 1.96, "learning_rate": 5.628739423120365e-06, "loss": 0.0196, "step": 304060 }, { "epoch": 1.96, "learning_rate": 5.6190580687634325e-06, "loss": 0.0224, "step": 304070 }, { "epoch": 1.96, "learning_rate": 5.6093767144065005e-06, "loss": 0.0203, "step": 304080 }, { "epoch": 1.96, "learning_rate": 5.599695360049568e-06, "loss": 0.0242, "step": 304090 }, { "epoch": 1.96, "learning_rate": 5.5900140056926355e-06, "loss": 0.02, "step": 304100 }, { "epoch": 1.96, "learning_rate": 5.5803326513357034e-06, "loss": 0.0226, "step": 304110 }, { "epoch": 1.96, "learning_rate": 5.570651296978771e-06, "loss": 0.0185, "step": 304120 }, { "epoch": 1.96, "learning_rate": 5.560969942621839e-06, "loss": 0.0209, "step": 304130 }, { "epoch": 1.96, "learning_rate": 5.551288588264907e-06, "loss": 0.0199, "step": 304140 }, { "epoch": 1.96, "learning_rate": 5.541607233907975e-06, "loss": 0.0214, "step": 304150 }, { "epoch": 1.96, "learning_rate": 5.531925879551043e-06, "loss": 0.021, "step": 304160 }, { "epoch": 1.96, "learning_rate": 5.522244525194111e-06, "loss": 0.0191, "step": 304170 }, { "epoch": 1.96, "learning_rate": 5.512563170837178e-06, "loss": 0.0191, "step": 304180 }, { "epoch": 1.96, "learning_rate": 5.502881816480247e-06, "loss": 0.021, "step": 304190 }, { "epoch": 1.96, "learning_rate": 5.493200462123314e-06, "loss": 0.024, "step": 304200 }, { "epoch": 1.96, "learning_rate": 5.483519107766383e-06, "loss": 0.0205, "step": 304210 }, { "epoch": 1.96, "learning_rate": 5.47383775340945e-06, "loss": 0.0234, "step": 304220 }, { "epoch": 1.96, "learning_rate": 5.464156399052517e-06, "loss": 0.0206, "step": 304230 }, { "epoch": 1.96, "learning_rate": 5.454475044695586e-06, "loss": 0.028, "step": 304240 }, { "epoch": 1.96, "learning_rate": 5.444793690338653e-06, "loss": 0.0237, "step": 304250 }, { "epoch": 1.96, "learning_rate": 5.435112335981722e-06, "loss": 0.0238, "step": 304260 }, { "epoch": 1.96, "learning_rate": 5.425430981624789e-06, "loss": 0.0217, "step": 304270 }, { "epoch": 1.96, "learning_rate": 5.4157496272678575e-06, "loss": 0.0231, "step": 304280 }, { "epoch": 1.96, "learning_rate": 5.4060682729109245e-06, "loss": 0.0204, "step": 304290 }, { "epoch": 1.96, "learning_rate": 5.396386918553992e-06, "loss": 0.0223, "step": 304300 }, { "epoch": 1.96, "learning_rate": 5.38670556419706e-06, "loss": 0.0246, "step": 304310 }, { "epoch": 1.96, "learning_rate": 5.3770242098401275e-06, "loss": 0.0219, "step": 304320 }, { "epoch": 1.96, "learning_rate": 5.367342855483196e-06, "loss": 0.021, "step": 304330 }, { "epoch": 1.96, "learning_rate": 5.357661501126263e-06, "loss": 0.0193, "step": 304340 }, { "epoch": 1.96, "learning_rate": 5.347980146769332e-06, "loss": 0.0175, "step": 304350 }, { "epoch": 1.96, "learning_rate": 5.338298792412399e-06, "loss": 0.0216, "step": 304360 }, { "epoch": 1.96, "learning_rate": 5.328617438055467e-06, "loss": 0.021, "step": 304370 }, { "epoch": 1.96, "learning_rate": 5.318936083698535e-06, "loss": 0.0263, "step": 304380 }, { "epoch": 1.96, "learning_rate": 5.309254729341603e-06, "loss": 0.0212, "step": 304390 }, { "epoch": 1.96, "learning_rate": 5.299573374984671e-06, "loss": 0.023, "step": 304400 }, { "epoch": 1.96, "learning_rate": 5.289892020627739e-06, "loss": 0.0205, "step": 304410 }, { "epoch": 1.96, "learning_rate": 5.280210666270806e-06, "loss": 0.0215, "step": 304420 }, { "epoch": 1.96, "learning_rate": 5.270529311913874e-06, "loss": 0.0191, "step": 304430 }, { "epoch": 1.96, "learning_rate": 5.260847957556942e-06, "loss": 0.0206, "step": 304440 }, { "epoch": 1.96, "learning_rate": 5.25116660320001e-06, "loss": 0.0226, "step": 304450 }, { "epoch": 1.97, "learning_rate": 5.241485248843078e-06, "loss": 0.0258, "step": 304460 }, { "epoch": 1.97, "learning_rate": 5.231803894486146e-06, "loss": 0.0248, "step": 304470 }, { "epoch": 1.97, "learning_rate": 5.2221225401292136e-06, "loss": 0.018, "step": 304480 }, { "epoch": 1.97, "learning_rate": 5.212441185772281e-06, "loss": 0.0215, "step": 304490 }, { "epoch": 1.97, "learning_rate": 5.2027598314153494e-06, "loss": 0.0269, "step": 304500 }, { "epoch": 1.97, "learning_rate": 5.1930784770584165e-06, "loss": 0.0205, "step": 304510 }, { "epoch": 1.97, "learning_rate": 5.183397122701485e-06, "loss": 0.0201, "step": 304520 }, { "epoch": 1.97, "learning_rate": 5.173715768344552e-06, "loss": 0.0201, "step": 304530 }, { "epoch": 1.97, "learning_rate": 5.164034413987621e-06, "loss": 0.0184, "step": 304540 }, { "epoch": 1.97, "learning_rate": 5.154353059630688e-06, "loss": 0.0212, "step": 304550 }, { "epoch": 1.97, "learning_rate": 5.144671705273755e-06, "loss": 0.0215, "step": 304560 }, { "epoch": 1.97, "learning_rate": 5.134990350916824e-06, "loss": 0.0197, "step": 304570 }, { "epoch": 1.97, "learning_rate": 5.125308996559891e-06, "loss": 0.0199, "step": 304580 }, { "epoch": 1.97, "learning_rate": 5.11562764220296e-06, "loss": 0.0264, "step": 304590 }, { "epoch": 1.97, "learning_rate": 5.105946287846027e-06, "loss": 0.0186, "step": 304600 }, { "epoch": 1.97, "learning_rate": 5.096264933489095e-06, "loss": 0.0241, "step": 304610 }, { "epoch": 1.97, "learning_rate": 5.086583579132163e-06, "loss": 0.0219, "step": 304620 }, { "epoch": 1.97, "learning_rate": 5.07690222477523e-06, "loss": 0.0217, "step": 304630 }, { "epoch": 1.97, "learning_rate": 5.067220870418299e-06, "loss": 0.0203, "step": 304640 }, { "epoch": 1.97, "learning_rate": 5.057539516061366e-06, "loss": 0.0224, "step": 304650 }, { "epoch": 1.97, "learning_rate": 5.047858161704435e-06, "loss": 0.0243, "step": 304660 }, { "epoch": 1.97, "learning_rate": 5.038176807347502e-06, "loss": 0.0187, "step": 304670 }, { "epoch": 1.97, "learning_rate": 5.02849545299057e-06, "loss": 0.0217, "step": 304680 }, { "epoch": 1.97, "learning_rate": 5.018814098633638e-06, "loss": 0.0177, "step": 304690 }, { "epoch": 1.97, "learning_rate": 5.0091327442767056e-06, "loss": 0.0219, "step": 304700 }, { "epoch": 1.97, "learning_rate": 4.9994513899197735e-06, "loss": 0.0223, "step": 304710 }, { "epoch": 1.97, "learning_rate": 4.9897700355628414e-06, "loss": 0.0198, "step": 304720 }, { "epoch": 1.97, "learning_rate": 4.980088681205909e-06, "loss": 0.0262, "step": 304730 }, { "epoch": 1.97, "learning_rate": 4.970407326848977e-06, "loss": 0.0233, "step": 304740 }, { "epoch": 1.97, "learning_rate": 4.960725972492044e-06, "loss": 0.0198, "step": 304750 }, { "epoch": 1.97, "learning_rate": 4.951044618135112e-06, "loss": 0.0214, "step": 304760 }, { "epoch": 1.97, "learning_rate": 4.94136326377818e-06, "loss": 0.0252, "step": 304770 }, { "epoch": 1.97, "learning_rate": 4.931681909421248e-06, "loss": 0.0221, "step": 304780 }, { "epoch": 1.97, "learning_rate": 4.922000555064316e-06, "loss": 0.0255, "step": 304790 }, { "epoch": 1.97, "learning_rate": 4.912319200707384e-06, "loss": 0.0262, "step": 304800 }, { "epoch": 1.97, "learning_rate": 4.902637846350452e-06, "loss": 0.0242, "step": 304810 }, { "epoch": 1.97, "learning_rate": 4.892956491993519e-06, "loss": 0.0252, "step": 304820 }, { "epoch": 1.97, "learning_rate": 4.883275137636588e-06, "loss": 0.022, "step": 304830 }, { "epoch": 1.97, "learning_rate": 4.873593783279655e-06, "loss": 0.023, "step": 304840 }, { "epoch": 1.97, "learning_rate": 4.863912428922724e-06, "loss": 0.022, "step": 304850 }, { "epoch": 1.97, "learning_rate": 4.854231074565791e-06, "loss": 0.0195, "step": 304860 }, { "epoch": 1.97, "learning_rate": 4.844549720208858e-06, "loss": 0.0236, "step": 304870 }, { "epoch": 1.97, "learning_rate": 4.834868365851927e-06, "loss": 0.0259, "step": 304880 }, { "epoch": 1.97, "learning_rate": 4.825187011494994e-06, "loss": 0.02, "step": 304890 }, { "epoch": 1.97, "learning_rate": 4.8155056571380625e-06, "loss": 0.0194, "step": 304900 }, { "epoch": 1.97, "learning_rate": 4.80582430278113e-06, "loss": 0.0256, "step": 304910 }, { "epoch": 1.97, "learning_rate": 4.796142948424198e-06, "loss": 0.024, "step": 304920 }, { "epoch": 1.97, "learning_rate": 4.7864615940672655e-06, "loss": 0.0261, "step": 304930 }, { "epoch": 1.97, "learning_rate": 4.776780239710333e-06, "loss": 0.0206, "step": 304940 }, { "epoch": 1.97, "learning_rate": 4.767098885353401e-06, "loss": 0.0223, "step": 304950 }, { "epoch": 1.97, "learning_rate": 4.7574175309964684e-06, "loss": 0.0175, "step": 304960 }, { "epoch": 1.97, "learning_rate": 4.747736176639537e-06, "loss": 0.0189, "step": 304970 }, { "epoch": 1.97, "learning_rate": 4.738054822282604e-06, "loss": 0.0245, "step": 304980 }, { "epoch": 1.97, "learning_rate": 4.728373467925673e-06, "loss": 0.0249, "step": 304990 }, { "epoch": 1.97, "learning_rate": 4.71869211356874e-06, "loss": 0.0233, "step": 305000 }, { "epoch": 1.97, "eval_cer": 0.9198092870862049, "eval_loss": 0.016421254724264145, "eval_runtime": 120.2527, "eval_samples_per_second": 16.632, "eval_steps_per_second": 4.158, "step": 305000 }, { "epoch": 1.97, "learning_rate": 4.709010759211808e-06, "loss": 0.0207, "step": 305010 }, { "epoch": 1.97, "learning_rate": 4.699329404854876e-06, "loss": 0.0231, "step": 305020 }, { "epoch": 1.97, "learning_rate": 4.689648050497944e-06, "loss": 0.0218, "step": 305030 }, { "epoch": 1.97, "learning_rate": 4.679966696141012e-06, "loss": 0.0242, "step": 305040 }, { "epoch": 1.97, "learning_rate": 4.67028534178408e-06, "loss": 0.021, "step": 305050 }, { "epoch": 1.97, "learning_rate": 4.660603987427148e-06, "loss": 0.024, "step": 305060 }, { "epoch": 1.97, "learning_rate": 4.650922633070216e-06, "loss": 0.0197, "step": 305070 }, { "epoch": 1.97, "learning_rate": 4.641241278713284e-06, "loss": 0.0237, "step": 305080 }, { "epoch": 1.97, "learning_rate": 4.631559924356351e-06, "loss": 0.022, "step": 305090 }, { "epoch": 1.97, "learning_rate": 4.621878569999419e-06, "loss": 0.0203, "step": 305100 }, { "epoch": 1.97, "learning_rate": 4.612197215642487e-06, "loss": 0.0221, "step": 305110 }, { "epoch": 1.97, "learning_rate": 4.6025158612855545e-06, "loss": 0.0183, "step": 305120 }, { "epoch": 1.97, "learning_rate": 4.5928345069286225e-06, "loss": 0.0192, "step": 305130 }, { "epoch": 1.97, "learning_rate": 4.58315315257169e-06, "loss": 0.0199, "step": 305140 }, { "epoch": 1.97, "learning_rate": 4.573471798214758e-06, "loss": 0.0198, "step": 305150 }, { "epoch": 1.97, "learning_rate": 4.563790443857825e-06, "loss": 0.0196, "step": 305160 }, { "epoch": 1.97, "learning_rate": 4.554109089500893e-06, "loss": 0.0188, "step": 305170 }, { "epoch": 1.97, "learning_rate": 4.544427735143961e-06, "loss": 0.0219, "step": 305180 }, { "epoch": 1.97, "learning_rate": 4.534746380787029e-06, "loss": 0.0215, "step": 305190 }, { "epoch": 1.97, "learning_rate": 4.525065026430097e-06, "loss": 0.0199, "step": 305200 }, { "epoch": 1.97, "learning_rate": 4.515383672073165e-06, "loss": 0.0207, "step": 305210 }, { "epoch": 1.97, "learning_rate": 4.505702317716232e-06, "loss": 0.0194, "step": 305220 }, { "epoch": 1.97, "learning_rate": 4.4960209633593e-06, "loss": 0.0184, "step": 305230 }, { "epoch": 1.97, "learning_rate": 4.486339609002368e-06, "loss": 0.0194, "step": 305240 }, { "epoch": 1.97, "learning_rate": 4.476658254645436e-06, "loss": 0.0232, "step": 305250 }, { "epoch": 1.97, "learning_rate": 4.466976900288504e-06, "loss": 0.0205, "step": 305260 }, { "epoch": 1.97, "learning_rate": 4.457295545931572e-06, "loss": 0.0234, "step": 305270 }, { "epoch": 1.97, "learning_rate": 4.44761419157464e-06, "loss": 0.021, "step": 305280 }, { "epoch": 1.97, "learning_rate": 4.437932837217707e-06, "loss": 0.0198, "step": 305290 }, { "epoch": 1.97, "learning_rate": 4.428251482860775e-06, "loss": 0.0227, "step": 305300 }, { "epoch": 1.97, "learning_rate": 4.418570128503843e-06, "loss": 0.0213, "step": 305310 }, { "epoch": 1.97, "learning_rate": 4.408888774146911e-06, "loss": 0.0226, "step": 305320 }, { "epoch": 1.97, "learning_rate": 4.399207419789979e-06, "loss": 0.0206, "step": 305330 }, { "epoch": 1.97, "learning_rate": 4.3895260654330465e-06, "loss": 0.0185, "step": 305340 }, { "epoch": 1.97, "learning_rate": 4.3798447110761144e-06, "loss": 0.0236, "step": 305350 }, { "epoch": 1.97, "learning_rate": 4.370163356719182e-06, "loss": 0.019, "step": 305360 }, { "epoch": 1.97, "learning_rate": 4.36048200236225e-06, "loss": 0.0223, "step": 305370 }, { "epoch": 1.97, "learning_rate": 4.350800648005318e-06, "loss": 0.0217, "step": 305380 }, { "epoch": 1.97, "learning_rate": 4.341119293648386e-06, "loss": 0.0244, "step": 305390 }, { "epoch": 1.97, "learning_rate": 4.331437939291454e-06, "loss": 0.0212, "step": 305400 }, { "epoch": 1.97, "learning_rate": 4.321756584934521e-06, "loss": 0.0231, "step": 305410 }, { "epoch": 1.97, "learning_rate": 4.312075230577589e-06, "loss": 0.0204, "step": 305420 }, { "epoch": 1.97, "learning_rate": 4.302393876220657e-06, "loss": 0.0221, "step": 305430 }, { "epoch": 1.97, "learning_rate": 4.292712521863725e-06, "loss": 0.0214, "step": 305440 }, { "epoch": 1.97, "learning_rate": 4.283031167506793e-06, "loss": 0.0174, "step": 305450 }, { "epoch": 1.97, "learning_rate": 4.273349813149861e-06, "loss": 0.0223, "step": 305460 }, { "epoch": 1.97, "learning_rate": 4.263668458792929e-06, "loss": 0.0198, "step": 305470 }, { "epoch": 1.97, "learning_rate": 4.253987104435996e-06, "loss": 0.0189, "step": 305480 }, { "epoch": 1.97, "learning_rate": 4.244305750079064e-06, "loss": 0.0188, "step": 305490 }, { "epoch": 1.97, "learning_rate": 4.234624395722132e-06, "loss": 0.0225, "step": 305500 }, { "epoch": 1.97, "learning_rate": 4.2249430413652e-06, "loss": 0.0249, "step": 305510 }, { "epoch": 1.97, "learning_rate": 4.215261687008268e-06, "loss": 0.024, "step": 305520 }, { "epoch": 1.97, "learning_rate": 4.2055803326513355e-06, "loss": 0.0232, "step": 305530 }, { "epoch": 1.97, "learning_rate": 4.195898978294403e-06, "loss": 0.021, "step": 305540 }, { "epoch": 1.97, "learning_rate": 4.1862176239374706e-06, "loss": 0.0287, "step": 305550 }, { "epoch": 1.97, "learning_rate": 4.1765362695805385e-06, "loss": 0.0214, "step": 305560 }, { "epoch": 1.97, "learning_rate": 4.1668549152236064e-06, "loss": 0.0226, "step": 305570 }, { "epoch": 1.97, "learning_rate": 4.157173560866674e-06, "loss": 0.0225, "step": 305580 }, { "epoch": 1.97, "learning_rate": 4.147492206509742e-06, "loss": 0.0216, "step": 305590 }, { "epoch": 1.97, "learning_rate": 4.13781085215281e-06, "loss": 0.0194, "step": 305600 }, { "epoch": 1.97, "learning_rate": 4.128129497795878e-06, "loss": 0.0238, "step": 305610 }, { "epoch": 1.97, "learning_rate": 4.118448143438945e-06, "loss": 0.0225, "step": 305620 }, { "epoch": 1.97, "learning_rate": 4.108766789082013e-06, "loss": 0.0186, "step": 305630 }, { "epoch": 1.97, "learning_rate": 4.099085434725081e-06, "loss": 0.0222, "step": 305640 }, { "epoch": 1.97, "learning_rate": 4.089404080368149e-06, "loss": 0.0197, "step": 305650 }, { "epoch": 1.97, "learning_rate": 4.079722726011217e-06, "loss": 0.033, "step": 305660 }, { "epoch": 1.97, "learning_rate": 4.070041371654285e-06, "loss": 0.0229, "step": 305670 }, { "epoch": 1.97, "learning_rate": 4.060360017297353e-06, "loss": 0.0186, "step": 305680 }, { "epoch": 1.97, "learning_rate": 4.050678662940421e-06, "loss": 0.0266, "step": 305690 }, { "epoch": 1.97, "learning_rate": 4.040997308583489e-06, "loss": 0.0243, "step": 305700 }, { "epoch": 1.97, "learning_rate": 4.031315954226557e-06, "loss": 0.0238, "step": 305710 }, { "epoch": 1.97, "learning_rate": 4.021634599869625e-06, "loss": 0.0239, "step": 305720 }, { "epoch": 1.97, "learning_rate": 4.0119532455126925e-06, "loss": 0.0202, "step": 305730 }, { "epoch": 1.97, "learning_rate": 4.00227189115576e-06, "loss": 0.0238, "step": 305740 }, { "epoch": 1.97, "learning_rate": 3.9925905367988275e-06, "loss": 0.0162, "step": 305750 }, { "epoch": 1.97, "learning_rate": 3.9829091824418955e-06, "loss": 0.0218, "step": 305760 }, { "epoch": 1.97, "learning_rate": 3.973227828084963e-06, "loss": 0.0195, "step": 305770 }, { "epoch": 1.97, "learning_rate": 3.963546473728031e-06, "loss": 0.0203, "step": 305780 }, { "epoch": 1.97, "learning_rate": 3.953865119371099e-06, "loss": 0.0214, "step": 305790 }, { "epoch": 1.97, "learning_rate": 3.944183765014166e-06, "loss": 0.021, "step": 305800 }, { "epoch": 1.97, "learning_rate": 3.934502410657234e-06, "loss": 0.0216, "step": 305810 }, { "epoch": 1.97, "learning_rate": 3.924821056300302e-06, "loss": 0.0274, "step": 305820 }, { "epoch": 1.97, "learning_rate": 3.91513970194337e-06, "loss": 0.0205, "step": 305830 }, { "epoch": 1.97, "learning_rate": 3.905458347586438e-06, "loss": 0.0159, "step": 305840 }, { "epoch": 1.97, "learning_rate": 3.895776993229506e-06, "loss": 0.0267, "step": 305850 }, { "epoch": 1.97, "learning_rate": 3.886095638872573e-06, "loss": 0.0217, "step": 305860 }, { "epoch": 1.97, "learning_rate": 3.876414284515641e-06, "loss": 0.0197, "step": 305870 }, { "epoch": 1.97, "learning_rate": 3.866732930158709e-06, "loss": 0.0238, "step": 305880 }, { "epoch": 1.97, "learning_rate": 3.857051575801777e-06, "loss": 0.0221, "step": 305890 }, { "epoch": 1.97, "learning_rate": 3.847370221444845e-06, "loss": 0.0273, "step": 305900 }, { "epoch": 1.97, "learning_rate": 3.837688867087913e-06, "loss": 0.0239, "step": 305910 }, { "epoch": 1.97, "learning_rate": 3.828007512730981e-06, "loss": 0.0252, "step": 305920 }, { "epoch": 1.97, "learning_rate": 3.818326158374049e-06, "loss": 0.0186, "step": 305930 }, { "epoch": 1.97, "learning_rate": 3.808644804017116e-06, "loss": 0.0226, "step": 305940 }, { "epoch": 1.97, "learning_rate": 3.798963449660184e-06, "loss": 0.0198, "step": 305950 }, { "epoch": 1.97, "learning_rate": 3.789282095303252e-06, "loss": 0.0268, "step": 305960 }, { "epoch": 1.97, "learning_rate": 3.77960074094632e-06, "loss": 0.025, "step": 305970 }, { "epoch": 1.97, "learning_rate": 3.769919386589388e-06, "loss": 0.0217, "step": 305980 }, { "epoch": 1.97, "learning_rate": 3.7602380322324554e-06, "loss": 0.0207, "step": 305990 }, { "epoch": 1.97, "learning_rate": 3.7505566778755233e-06, "loss": 0.0211, "step": 306000 }, { "epoch": 1.97, "eval_cer": 0.919808383233533, "eval_loss": 0.01641755923628807, "eval_runtime": 120.3007, "eval_samples_per_second": 16.625, "eval_steps_per_second": 4.156, "step": 306000 }, { "epoch": 1.98, "learning_rate": 3.740875323518591e-06, "loss": 0.0277, "step": 306010 }, { "epoch": 1.98, "learning_rate": 3.7311939691616588e-06, "loss": 0.0268, "step": 306020 }, { "epoch": 1.98, "learning_rate": 3.7215126148047267e-06, "loss": 0.023, "step": 306030 }, { "epoch": 1.98, "learning_rate": 3.7118312604477946e-06, "loss": 0.0248, "step": 306040 }, { "epoch": 1.98, "learning_rate": 3.7021499060908626e-06, "loss": 0.0182, "step": 306050 }, { "epoch": 1.98, "learning_rate": 3.69246855173393e-06, "loss": 0.0163, "step": 306060 }, { "epoch": 1.98, "learning_rate": 3.682787197376998e-06, "loss": 0.021, "step": 306070 }, { "epoch": 1.98, "learning_rate": 3.673105843020066e-06, "loss": 0.023, "step": 306080 }, { "epoch": 1.98, "learning_rate": 3.663424488663134e-06, "loss": 0.0205, "step": 306090 }, { "epoch": 1.98, "learning_rate": 3.653743134306202e-06, "loss": 0.0184, "step": 306100 }, { "epoch": 1.98, "learning_rate": 3.6440617799492697e-06, "loss": 0.0239, "step": 306110 }, { "epoch": 1.98, "learning_rate": 3.634380425592337e-06, "loss": 0.0217, "step": 306120 }, { "epoch": 1.98, "learning_rate": 3.6246990712354048e-06, "loss": 0.0224, "step": 306130 }, { "epoch": 1.98, "learning_rate": 3.6150177168784727e-06, "loss": 0.0256, "step": 306140 }, { "epoch": 1.98, "learning_rate": 3.6053363625215406e-06, "loss": 0.0191, "step": 306150 }, { "epoch": 1.98, "learning_rate": 3.5956550081646086e-06, "loss": 0.0208, "step": 306160 }, { "epoch": 1.98, "learning_rate": 3.5859736538076765e-06, "loss": 0.0193, "step": 306170 }, { "epoch": 1.98, "learning_rate": 3.576292299450744e-06, "loss": 0.0213, "step": 306180 }, { "epoch": 1.98, "learning_rate": 3.566610945093812e-06, "loss": 0.0213, "step": 306190 }, { "epoch": 1.98, "learning_rate": 3.55692959073688e-06, "loss": 0.0223, "step": 306200 }, { "epoch": 1.98, "learning_rate": 3.547248236379948e-06, "loss": 0.0171, "step": 306210 }, { "epoch": 1.98, "learning_rate": 3.5375668820230157e-06, "loss": 0.0223, "step": 306220 }, { "epoch": 1.98, "learning_rate": 3.5278855276660837e-06, "loss": 0.0204, "step": 306230 }, { "epoch": 1.98, "learning_rate": 3.518204173309151e-06, "loss": 0.0236, "step": 306240 }, { "epoch": 1.98, "learning_rate": 3.5085228189522187e-06, "loss": 0.0223, "step": 306250 }, { "epoch": 1.98, "learning_rate": 3.4988414645952866e-06, "loss": 0.0224, "step": 306260 }, { "epoch": 1.98, "learning_rate": 3.4891601102383546e-06, "loss": 0.024, "step": 306270 }, { "epoch": 1.98, "learning_rate": 3.4794787558814225e-06, "loss": 0.0245, "step": 306280 }, { "epoch": 1.98, "learning_rate": 3.4697974015244904e-06, "loss": 0.0195, "step": 306290 }, { "epoch": 1.98, "learning_rate": 3.4601160471675584e-06, "loss": 0.0284, "step": 306300 }, { "epoch": 1.98, "learning_rate": 3.450434692810626e-06, "loss": 0.0191, "step": 306310 }, { "epoch": 1.98, "learning_rate": 3.440753338453694e-06, "loss": 0.0194, "step": 306320 }, { "epoch": 1.98, "learning_rate": 3.4310719840967617e-06, "loss": 0.0212, "step": 306330 }, { "epoch": 1.98, "learning_rate": 3.4213906297398292e-06, "loss": 0.02, "step": 306340 }, { "epoch": 1.98, "learning_rate": 3.411709275382897e-06, "loss": 0.0256, "step": 306350 }, { "epoch": 1.98, "learning_rate": 3.402027921025965e-06, "loss": 0.0208, "step": 306360 }, { "epoch": 1.98, "learning_rate": 3.392346566669033e-06, "loss": 0.0183, "step": 306370 }, { "epoch": 1.98, "learning_rate": 3.3826652123121006e-06, "loss": 0.025, "step": 306380 }, { "epoch": 1.98, "learning_rate": 3.3729838579551685e-06, "loss": 0.0246, "step": 306390 }, { "epoch": 1.98, "learning_rate": 3.3633025035982364e-06, "loss": 0.0194, "step": 306400 }, { "epoch": 1.98, "learning_rate": 3.3536211492413044e-06, "loss": 0.0214, "step": 306410 }, { "epoch": 1.98, "learning_rate": 3.3439397948843723e-06, "loss": 0.0199, "step": 306420 }, { "epoch": 1.98, "learning_rate": 3.3342584405274402e-06, "loss": 0.0201, "step": 306430 }, { "epoch": 1.98, "learning_rate": 3.3245770861705073e-06, "loss": 0.0208, "step": 306440 }, { "epoch": 1.98, "learning_rate": 3.3148957318135752e-06, "loss": 0.0197, "step": 306450 }, { "epoch": 1.98, "learning_rate": 3.305214377456643e-06, "loss": 0.0263, "step": 306460 }, { "epoch": 1.98, "learning_rate": 3.295533023099711e-06, "loss": 0.029, "step": 306470 }, { "epoch": 1.98, "learning_rate": 3.285851668742779e-06, "loss": 0.0262, "step": 306480 }, { "epoch": 1.98, "learning_rate": 3.276170314385847e-06, "loss": 0.0186, "step": 306490 }, { "epoch": 1.98, "learning_rate": 3.2664889600289145e-06, "loss": 0.0271, "step": 306500 }, { "epoch": 1.98, "learning_rate": 3.2568076056719824e-06, "loss": 0.0225, "step": 306510 }, { "epoch": 1.98, "learning_rate": 3.2471262513150504e-06, "loss": 0.0255, "step": 306520 }, { "epoch": 1.98, "learning_rate": 3.2374448969581183e-06, "loss": 0.0212, "step": 306530 }, { "epoch": 1.98, "learning_rate": 3.2277635426011862e-06, "loss": 0.0204, "step": 306540 }, { "epoch": 1.98, "learning_rate": 3.218082188244254e-06, "loss": 0.0208, "step": 306550 }, { "epoch": 1.98, "learning_rate": 3.208400833887322e-06, "loss": 0.0259, "step": 306560 }, { "epoch": 1.98, "learning_rate": 3.198719479530389e-06, "loss": 0.023, "step": 306570 }, { "epoch": 1.98, "learning_rate": 3.189038125173457e-06, "loss": 0.0219, "step": 306580 }, { "epoch": 1.98, "learning_rate": 3.179356770816525e-06, "loss": 0.0238, "step": 306590 }, { "epoch": 1.98, "learning_rate": 3.169675416459593e-06, "loss": 0.021, "step": 306600 }, { "epoch": 1.98, "learning_rate": 3.159994062102661e-06, "loss": 0.024, "step": 306610 }, { "epoch": 1.98, "learning_rate": 3.150312707745729e-06, "loss": 0.02, "step": 306620 }, { "epoch": 1.98, "learning_rate": 3.1406313533887963e-06, "loss": 0.0239, "step": 306630 }, { "epoch": 1.98, "learning_rate": 3.1309499990318643e-06, "loss": 0.0211, "step": 306640 }, { "epoch": 1.98, "learning_rate": 3.1212686446749322e-06, "loss": 0.0256, "step": 306650 }, { "epoch": 1.98, "learning_rate": 3.111587290318e-06, "loss": 0.0259, "step": 306660 }, { "epoch": 1.98, "learning_rate": 3.1019059359610677e-06, "loss": 0.0184, "step": 306670 }, { "epoch": 1.98, "learning_rate": 3.0922245816041356e-06, "loss": 0.0199, "step": 306680 }, { "epoch": 1.98, "learning_rate": 3.0825432272472035e-06, "loss": 0.0294, "step": 306690 }, { "epoch": 1.98, "learning_rate": 3.072861872890271e-06, "loss": 0.0211, "step": 306700 }, { "epoch": 1.98, "learning_rate": 3.063180518533339e-06, "loss": 0.0236, "step": 306710 }, { "epoch": 1.98, "learning_rate": 3.053499164176407e-06, "loss": 0.0247, "step": 306720 }, { "epoch": 1.98, "learning_rate": 3.043817809819475e-06, "loss": 0.029, "step": 306730 }, { "epoch": 1.98, "learning_rate": 3.0341364554625428e-06, "loss": 0.0216, "step": 306740 }, { "epoch": 1.98, "learning_rate": 3.0244551011056107e-06, "loss": 0.0204, "step": 306750 }, { "epoch": 1.98, "learning_rate": 3.014773746748678e-06, "loss": 0.0322, "step": 306760 }, { "epoch": 1.98, "learning_rate": 3.0050923923917457e-06, "loss": 0.0234, "step": 306770 }, { "epoch": 1.98, "learning_rate": 2.9954110380348136e-06, "loss": 0.0216, "step": 306780 }, { "epoch": 1.98, "learning_rate": 2.9857296836778816e-06, "loss": 0.0215, "step": 306790 }, { "epoch": 1.98, "learning_rate": 2.9760483293209495e-06, "loss": 0.0241, "step": 306800 }, { "epoch": 1.98, "learning_rate": 2.9663669749640174e-06, "loss": 0.0231, "step": 306810 }, { "epoch": 1.98, "learning_rate": 2.956685620607085e-06, "loss": 0.0328, "step": 306820 }, { "epoch": 1.98, "learning_rate": 2.947004266250153e-06, "loss": 0.024, "step": 306830 }, { "epoch": 1.98, "learning_rate": 2.937322911893221e-06, "loss": 0.0216, "step": 306840 }, { "epoch": 1.98, "learning_rate": 2.9276415575362888e-06, "loss": 0.0194, "step": 306850 }, { "epoch": 1.98, "learning_rate": 2.9179602031793567e-06, "loss": 0.0242, "step": 306860 }, { "epoch": 1.98, "learning_rate": 2.9082788488224246e-06, "loss": 0.0194, "step": 306870 }, { "epoch": 1.98, "learning_rate": 2.8985974944654926e-06, "loss": 0.0215, "step": 306880 }, { "epoch": 1.98, "learning_rate": 2.8889161401085596e-06, "loss": 0.027, "step": 306890 }, { "epoch": 1.98, "learning_rate": 2.8792347857516276e-06, "loss": 0.0241, "step": 306900 }, { "epoch": 1.98, "learning_rate": 2.8695534313946955e-06, "loss": 0.0198, "step": 306910 }, { "epoch": 1.98, "learning_rate": 2.8598720770377634e-06, "loss": 0.018, "step": 306920 }, { "epoch": 1.98, "learning_rate": 2.8501907226808314e-06, "loss": 0.0218, "step": 306930 }, { "epoch": 1.98, "learning_rate": 2.8405093683238993e-06, "loss": 0.0239, "step": 306940 }, { "epoch": 1.98, "learning_rate": 2.830828013966967e-06, "loss": 0.0226, "step": 306950 }, { "epoch": 1.98, "learning_rate": 2.8211466596100348e-06, "loss": 0.0225, "step": 306960 }, { "epoch": 1.98, "learning_rate": 2.8114653052531027e-06, "loss": 0.0217, "step": 306970 }, { "epoch": 1.98, "learning_rate": 2.8017839508961706e-06, "loss": 0.0192, "step": 306980 }, { "epoch": 1.98, "learning_rate": 2.7921025965392386e-06, "loss": 0.0219, "step": 306990 }, { "epoch": 1.98, "learning_rate": 2.7824212421823065e-06, "loss": 0.02, "step": 307000 }, { "epoch": 1.98, "eval_cer": 0.9198192294655971, "eval_loss": 0.016391895711421967, "eval_runtime": 120.1873, "eval_samples_per_second": 16.641, "eval_steps_per_second": 4.16, "step": 307000 }, { "epoch": 1.98, "learning_rate": 2.772739887825374e-06, "loss": 0.0237, "step": 307010 }, { "epoch": 1.98, "learning_rate": 2.7630585334684415e-06, "loss": 0.0232, "step": 307020 }, { "epoch": 1.98, "learning_rate": 2.7533771791115094e-06, "loss": 0.0225, "step": 307030 }, { "epoch": 1.98, "learning_rate": 2.7436958247545774e-06, "loss": 0.0165, "step": 307040 }, { "epoch": 1.98, "learning_rate": 2.7340144703976453e-06, "loss": 0.0203, "step": 307050 }, { "epoch": 1.98, "learning_rate": 2.7243331160407132e-06, "loss": 0.0196, "step": 307060 }, { "epoch": 1.98, "learning_rate": 2.714651761683781e-06, "loss": 0.022, "step": 307070 }, { "epoch": 1.98, "learning_rate": 2.7049704073268487e-06, "loss": 0.0179, "step": 307080 }, { "epoch": 1.98, "learning_rate": 2.6952890529699166e-06, "loss": 0.0221, "step": 307090 }, { "epoch": 1.98, "learning_rate": 2.6856076986129845e-06, "loss": 0.022, "step": 307100 }, { "epoch": 1.98, "learning_rate": 2.675926344256052e-06, "loss": 0.0234, "step": 307110 }, { "epoch": 1.98, "learning_rate": 2.66624498989912e-06, "loss": 0.0239, "step": 307120 }, { "epoch": 1.98, "learning_rate": 2.656563635542188e-06, "loss": 0.0224, "step": 307130 }, { "epoch": 1.98, "learning_rate": 2.6468822811852554e-06, "loss": 0.0225, "step": 307140 }, { "epoch": 1.98, "learning_rate": 2.6372009268283234e-06, "loss": 0.0196, "step": 307150 }, { "epoch": 1.98, "learning_rate": 2.6275195724713913e-06, "loss": 0.0194, "step": 307160 }, { "epoch": 1.98, "learning_rate": 2.6178382181144592e-06, "loss": 0.0168, "step": 307170 }, { "epoch": 1.98, "learning_rate": 2.608156863757527e-06, "loss": 0.0236, "step": 307180 }, { "epoch": 1.98, "learning_rate": 2.598475509400595e-06, "loss": 0.0165, "step": 307190 }, { "epoch": 1.98, "learning_rate": 2.588794155043663e-06, "loss": 0.0216, "step": 307200 }, { "epoch": 1.98, "learning_rate": 2.57911280068673e-06, "loss": 0.0235, "step": 307210 }, { "epoch": 1.98, "learning_rate": 2.569431446329798e-06, "loss": 0.0205, "step": 307220 }, { "epoch": 1.98, "learning_rate": 2.559750091972866e-06, "loss": 0.0214, "step": 307230 }, { "epoch": 1.98, "learning_rate": 2.550068737615934e-06, "loss": 0.0201, "step": 307240 }, { "epoch": 1.98, "learning_rate": 2.540387383259002e-06, "loss": 0.022, "step": 307250 }, { "epoch": 1.98, "learning_rate": 2.5307060289020698e-06, "loss": 0.0254, "step": 307260 }, { "epoch": 1.98, "learning_rate": 2.5210246745451373e-06, "loss": 0.0237, "step": 307270 }, { "epoch": 1.98, "learning_rate": 2.5113433201882052e-06, "loss": 0.0289, "step": 307280 }, { "epoch": 1.98, "learning_rate": 2.501661965831273e-06, "loss": 0.0205, "step": 307290 }, { "epoch": 1.98, "learning_rate": 2.491980611474341e-06, "loss": 0.0266, "step": 307300 }, { "epoch": 1.98, "learning_rate": 2.482299257117409e-06, "loss": 0.022, "step": 307310 }, { "epoch": 1.98, "learning_rate": 2.472617902760477e-06, "loss": 0.031, "step": 307320 }, { "epoch": 1.98, "learning_rate": 2.462936548403545e-06, "loss": 0.0198, "step": 307330 }, { "epoch": 1.98, "learning_rate": 2.453255194046612e-06, "loss": 0.0244, "step": 307340 }, { "epoch": 1.98, "learning_rate": 2.44357383968968e-06, "loss": 0.0232, "step": 307350 }, { "epoch": 1.98, "learning_rate": 2.433892485332748e-06, "loss": 0.0248, "step": 307360 }, { "epoch": 1.98, "learning_rate": 2.4242111309758158e-06, "loss": 0.0275, "step": 307370 }, { "epoch": 1.98, "learning_rate": 2.4145297766188837e-06, "loss": 0.0207, "step": 307380 }, { "epoch": 1.98, "learning_rate": 2.4048484222619516e-06, "loss": 0.0201, "step": 307390 }, { "epoch": 1.98, "learning_rate": 2.395167067905019e-06, "loss": 0.0244, "step": 307400 }, { "epoch": 1.98, "learning_rate": 2.385485713548087e-06, "loss": 0.0229, "step": 307410 }, { "epoch": 1.98, "learning_rate": 2.375804359191155e-06, "loss": 0.0194, "step": 307420 }, { "epoch": 1.98, "learning_rate": 2.366123004834223e-06, "loss": 0.0232, "step": 307430 }, { "epoch": 1.98, "learning_rate": 2.3564416504772905e-06, "loss": 0.019, "step": 307440 }, { "epoch": 1.98, "learning_rate": 2.3467602961203584e-06, "loss": 0.0234, "step": 307450 }, { "epoch": 1.98, "learning_rate": 2.3370789417634263e-06, "loss": 0.0244, "step": 307460 }, { "epoch": 1.98, "learning_rate": 2.3273975874064943e-06, "loss": 0.0217, "step": 307470 }, { "epoch": 1.98, "learning_rate": 2.3177162330495618e-06, "loss": 0.0207, "step": 307480 }, { "epoch": 1.98, "learning_rate": 2.3080348786926297e-06, "loss": 0.0169, "step": 307490 }, { "epoch": 1.98, "learning_rate": 2.2983535243356976e-06, "loss": 0.0218, "step": 307500 }, { "epoch": 1.98, "learning_rate": 2.288672169978765e-06, "loss": 0.0197, "step": 307510 }, { "epoch": 1.98, "learning_rate": 2.278990815621833e-06, "loss": 0.0186, "step": 307520 }, { "epoch": 1.98, "learning_rate": 2.269309461264901e-06, "loss": 0.0226, "step": 307530 }, { "epoch": 1.98, "learning_rate": 2.2596281069079685e-06, "loss": 0.027, "step": 307540 }, { "epoch": 1.98, "learning_rate": 2.2499467525510365e-06, "loss": 0.0291, "step": 307550 }, { "epoch": 1.99, "learning_rate": 2.2402653981941044e-06, "loss": 0.0182, "step": 307560 }, { "epoch": 1.99, "learning_rate": 2.2305840438371723e-06, "loss": 0.0224, "step": 307570 }, { "epoch": 1.99, "learning_rate": 2.2209026894802403e-06, "loss": 0.0224, "step": 307580 }, { "epoch": 1.99, "learning_rate": 2.211221335123308e-06, "loss": 0.02, "step": 307590 }, { "epoch": 1.99, "learning_rate": 2.201539980766376e-06, "loss": 0.0218, "step": 307600 }, { "epoch": 1.99, "learning_rate": 2.1918586264094436e-06, "loss": 0.022, "step": 307610 }, { "epoch": 1.99, "learning_rate": 2.1821772720525116e-06, "loss": 0.0229, "step": 307620 }, { "epoch": 1.99, "learning_rate": 2.1724959176955795e-06, "loss": 0.03, "step": 307630 }, { "epoch": 1.99, "learning_rate": 2.162814563338647e-06, "loss": 0.0274, "step": 307640 }, { "epoch": 1.99, "learning_rate": 2.153133208981715e-06, "loss": 0.0185, "step": 307650 }, { "epoch": 1.99, "learning_rate": 2.143451854624783e-06, "loss": 0.0198, "step": 307660 }, { "epoch": 1.99, "learning_rate": 2.1337705002678504e-06, "loss": 0.0229, "step": 307670 }, { "epoch": 1.99, "learning_rate": 2.1240891459109183e-06, "loss": 0.0179, "step": 307680 }, { "epoch": 1.99, "learning_rate": 2.1144077915539863e-06, "loss": 0.0231, "step": 307690 }, { "epoch": 1.99, "learning_rate": 2.1047264371970538e-06, "loss": 0.0207, "step": 307700 }, { "epoch": 1.99, "learning_rate": 2.0950450828401217e-06, "loss": 0.0213, "step": 307710 }, { "epoch": 1.99, "learning_rate": 2.0853637284831896e-06, "loss": 0.022, "step": 307720 }, { "epoch": 1.99, "learning_rate": 2.0756823741262576e-06, "loss": 0.0191, "step": 307730 }, { "epoch": 1.99, "learning_rate": 2.0660010197693255e-06, "loss": 0.0195, "step": 307740 }, { "epoch": 1.99, "learning_rate": 2.0563196654123934e-06, "loss": 0.0229, "step": 307750 }, { "epoch": 1.99, "learning_rate": 2.0466383110554614e-06, "loss": 0.0205, "step": 307760 }, { "epoch": 1.99, "learning_rate": 2.036956956698529e-06, "loss": 0.0214, "step": 307770 }, { "epoch": 1.99, "learning_rate": 2.027275602341597e-06, "loss": 0.0193, "step": 307780 }, { "epoch": 1.99, "learning_rate": 2.0175942479846647e-06, "loss": 0.0196, "step": 307790 }, { "epoch": 1.99, "learning_rate": 2.0079128936277322e-06, "loss": 0.0221, "step": 307800 }, { "epoch": 1.99, "learning_rate": 1.9982315392708e-06, "loss": 0.0232, "step": 307810 }, { "epoch": 1.99, "learning_rate": 1.988550184913868e-06, "loss": 0.0241, "step": 307820 }, { "epoch": 1.99, "learning_rate": 1.9788688305569356e-06, "loss": 0.0244, "step": 307830 }, { "epoch": 1.99, "learning_rate": 1.9691874762000036e-06, "loss": 0.0232, "step": 307840 }, { "epoch": 1.99, "learning_rate": 1.9595061218430715e-06, "loss": 0.0206, "step": 307850 }, { "epoch": 1.99, "learning_rate": 1.9498247674861394e-06, "loss": 0.0219, "step": 307860 }, { "epoch": 1.99, "learning_rate": 1.940143413129207e-06, "loss": 0.0202, "step": 307870 }, { "epoch": 1.99, "learning_rate": 1.930462058772275e-06, "loss": 0.0223, "step": 307880 }, { "epoch": 1.99, "learning_rate": 1.920780704415343e-06, "loss": 0.0241, "step": 307890 }, { "epoch": 1.99, "learning_rate": 1.9110993500584107e-06, "loss": 0.0186, "step": 307900 }, { "epoch": 1.99, "learning_rate": 1.9014179957014785e-06, "loss": 0.0193, "step": 307910 }, { "epoch": 1.99, "learning_rate": 1.8917366413445464e-06, "loss": 0.0212, "step": 307920 }, { "epoch": 1.99, "learning_rate": 1.8820552869876141e-06, "loss": 0.0203, "step": 307930 }, { "epoch": 1.99, "learning_rate": 1.872373932630682e-06, "loss": 0.0236, "step": 307940 }, { "epoch": 1.99, "learning_rate": 1.86269257827375e-06, "loss": 0.0195, "step": 307950 }, { "epoch": 1.99, "learning_rate": 1.8530112239168175e-06, "loss": 0.0214, "step": 307960 }, { "epoch": 1.99, "learning_rate": 1.8433298695598854e-06, "loss": 0.0229, "step": 307970 }, { "epoch": 1.99, "learning_rate": 1.8336485152029534e-06, "loss": 0.0215, "step": 307980 }, { "epoch": 1.99, "learning_rate": 1.823967160846021e-06, "loss": 0.023, "step": 307990 }, { "epoch": 1.99, "learning_rate": 1.814285806489089e-06, "loss": 0.0191, "step": 308000 }, { "epoch": 1.99, "eval_cer": 0.9198192294655971, "eval_loss": 0.01642085798084736, "eval_runtime": 120.209, "eval_samples_per_second": 16.638, "eval_steps_per_second": 4.159, "step": 308000 }, { "epoch": 1.99, "learning_rate": 1.8046044521321567e-06, "loss": 0.018, "step": 308010 }, { "epoch": 1.99, "learning_rate": 1.7949230977752245e-06, "loss": 0.0222, "step": 308020 }, { "epoch": 1.99, "learning_rate": 1.7852417434182924e-06, "loss": 0.0233, "step": 308030 }, { "epoch": 1.99, "learning_rate": 1.7755603890613603e-06, "loss": 0.0199, "step": 308040 }, { "epoch": 1.99, "learning_rate": 1.7658790347044283e-06, "loss": 0.0227, "step": 308050 }, { "epoch": 1.99, "learning_rate": 1.7561976803474958e-06, "loss": 0.0196, "step": 308060 }, { "epoch": 1.99, "learning_rate": 1.7465163259905637e-06, "loss": 0.0246, "step": 308070 }, { "epoch": 1.99, "learning_rate": 1.7368349716336316e-06, "loss": 0.0237, "step": 308080 }, { "epoch": 1.99, "learning_rate": 1.7271536172766993e-06, "loss": 0.0187, "step": 308090 }, { "epoch": 1.99, "learning_rate": 1.7174722629197673e-06, "loss": 0.0234, "step": 308100 }, { "epoch": 1.99, "learning_rate": 1.7077909085628352e-06, "loss": 0.0291, "step": 308110 }, { "epoch": 1.99, "learning_rate": 1.6981095542059027e-06, "loss": 0.0203, "step": 308120 }, { "epoch": 1.99, "learning_rate": 1.6884281998489707e-06, "loss": 0.0216, "step": 308130 }, { "epoch": 1.99, "learning_rate": 1.6787468454920386e-06, "loss": 0.0252, "step": 308140 }, { "epoch": 1.99, "learning_rate": 1.6690654911351063e-06, "loss": 0.0244, "step": 308150 }, { "epoch": 1.99, "learning_rate": 1.6593841367781742e-06, "loss": 0.0222, "step": 308160 }, { "epoch": 1.99, "learning_rate": 1.6497027824212422e-06, "loss": 0.0238, "step": 308170 }, { "epoch": 1.99, "learning_rate": 1.6400214280643097e-06, "loss": 0.0221, "step": 308180 }, { "epoch": 1.99, "learning_rate": 1.6303400737073776e-06, "loss": 0.0215, "step": 308190 }, { "epoch": 1.99, "learning_rate": 1.6206587193504456e-06, "loss": 0.0267, "step": 308200 }, { "epoch": 1.99, "learning_rate": 1.6109773649935135e-06, "loss": 0.023, "step": 308210 }, { "epoch": 1.99, "learning_rate": 1.6012960106365812e-06, "loss": 0.0217, "step": 308220 }, { "epoch": 1.99, "learning_rate": 1.591614656279649e-06, "loss": 0.0244, "step": 308230 }, { "epoch": 1.99, "learning_rate": 1.5819333019227169e-06, "loss": 0.0263, "step": 308240 }, { "epoch": 1.99, "learning_rate": 1.5722519475657846e-06, "loss": 0.0201, "step": 308250 }, { "epoch": 1.99, "learning_rate": 1.5625705932088525e-06, "loss": 0.0188, "step": 308260 }, { "epoch": 1.99, "learning_rate": 1.5528892388519205e-06, "loss": 0.0218, "step": 308270 }, { "epoch": 1.99, "learning_rate": 1.543207884494988e-06, "loss": 0.0226, "step": 308280 }, { "epoch": 1.99, "learning_rate": 1.533526530138056e-06, "loss": 0.0189, "step": 308290 }, { "epoch": 1.99, "learning_rate": 1.5238451757811238e-06, "loss": 0.0217, "step": 308300 }, { "epoch": 1.99, "learning_rate": 1.5141638214241916e-06, "loss": 0.0302, "step": 308310 }, { "epoch": 1.99, "learning_rate": 1.5044824670672595e-06, "loss": 0.0224, "step": 308320 }, { "epoch": 1.99, "learning_rate": 1.4948011127103274e-06, "loss": 0.0195, "step": 308330 }, { "epoch": 1.99, "learning_rate": 1.4851197583533953e-06, "loss": 0.0195, "step": 308340 }, { "epoch": 1.99, "learning_rate": 1.4754384039964629e-06, "loss": 0.0183, "step": 308350 }, { "epoch": 1.99, "learning_rate": 1.4657570496395308e-06, "loss": 0.0216, "step": 308360 }, { "epoch": 1.99, "learning_rate": 1.4560756952825987e-06, "loss": 0.0282, "step": 308370 }, { "epoch": 1.99, "learning_rate": 1.4463943409256664e-06, "loss": 0.0182, "step": 308380 }, { "epoch": 1.99, "learning_rate": 1.4367129865687344e-06, "loss": 0.0198, "step": 308390 }, { "epoch": 1.99, "learning_rate": 1.427031632211802e-06, "loss": 0.0212, "step": 308400 }, { "epoch": 1.99, "learning_rate": 1.4173502778548698e-06, "loss": 0.0228, "step": 308410 }, { "epoch": 1.99, "learning_rate": 1.4076689234979378e-06, "loss": 0.0213, "step": 308420 }, { "epoch": 1.99, "learning_rate": 1.3979875691410057e-06, "loss": 0.0239, "step": 308430 }, { "epoch": 1.99, "learning_rate": 1.3883062147840734e-06, "loss": 0.0251, "step": 308440 }, { "epoch": 1.99, "learning_rate": 1.3786248604271411e-06, "loss": 0.0245, "step": 308450 }, { "epoch": 1.99, "learning_rate": 1.368943506070209e-06, "loss": 0.024, "step": 308460 }, { "epoch": 1.99, "learning_rate": 1.3592621517132768e-06, "loss": 0.0225, "step": 308470 }, { "epoch": 1.99, "learning_rate": 1.3495807973563447e-06, "loss": 0.0216, "step": 308480 }, { "epoch": 1.99, "learning_rate": 1.3398994429994127e-06, "loss": 0.0208, "step": 308490 }, { "epoch": 1.99, "learning_rate": 1.3302180886424806e-06, "loss": 0.0197, "step": 308500 }, { "epoch": 1.99, "learning_rate": 1.320536734285548e-06, "loss": 0.0211, "step": 308510 }, { "epoch": 1.99, "learning_rate": 1.310855379928616e-06, "loss": 0.0237, "step": 308520 }, { "epoch": 1.99, "learning_rate": 1.301174025571684e-06, "loss": 0.0256, "step": 308530 }, { "epoch": 1.99, "learning_rate": 1.2914926712147517e-06, "loss": 0.0215, "step": 308540 }, { "epoch": 1.99, "learning_rate": 1.2818113168578196e-06, "loss": 0.0227, "step": 308550 }, { "epoch": 1.99, "learning_rate": 1.2721299625008873e-06, "loss": 0.0238, "step": 308560 }, { "epoch": 1.99, "learning_rate": 1.262448608143955e-06, "loss": 0.0237, "step": 308570 }, { "epoch": 1.99, "learning_rate": 1.252767253787023e-06, "loss": 0.024, "step": 308580 }, { "epoch": 1.99, "learning_rate": 1.243085899430091e-06, "loss": 0.0259, "step": 308590 }, { "epoch": 1.99, "learning_rate": 1.2334045450731586e-06, "loss": 0.0283, "step": 308600 }, { "epoch": 1.99, "learning_rate": 1.2237231907162264e-06, "loss": 0.0272, "step": 308610 }, { "epoch": 1.99, "learning_rate": 1.2140418363592943e-06, "loss": 0.0203, "step": 308620 }, { "epoch": 1.99, "learning_rate": 1.204360482002362e-06, "loss": 0.0279, "step": 308630 }, { "epoch": 1.99, "learning_rate": 1.19467912764543e-06, "loss": 0.0195, "step": 308640 }, { "epoch": 1.99, "learning_rate": 1.1849977732884979e-06, "loss": 0.0172, "step": 308650 }, { "epoch": 1.99, "learning_rate": 1.1753164189315658e-06, "loss": 0.0217, "step": 308660 }, { "epoch": 1.99, "learning_rate": 1.1656350645746333e-06, "loss": 0.021, "step": 308670 }, { "epoch": 1.99, "learning_rate": 1.1559537102177013e-06, "loss": 0.0214, "step": 308680 }, { "epoch": 1.99, "learning_rate": 1.1462723558607692e-06, "loss": 0.0228, "step": 308690 }, { "epoch": 1.99, "learning_rate": 1.136591001503837e-06, "loss": 0.0208, "step": 308700 }, { "epoch": 1.99, "learning_rate": 1.1269096471469049e-06, "loss": 0.0196, "step": 308710 }, { "epoch": 1.99, "learning_rate": 1.1172282927899726e-06, "loss": 0.0195, "step": 308720 }, { "epoch": 1.99, "learning_rate": 1.1075469384330405e-06, "loss": 0.0187, "step": 308730 }, { "epoch": 1.99, "learning_rate": 1.0978655840761082e-06, "loss": 0.0224, "step": 308740 }, { "epoch": 1.99, "learning_rate": 1.088184229719176e-06, "loss": 0.0282, "step": 308750 }, { "epoch": 1.99, "learning_rate": 1.0785028753622439e-06, "loss": 0.0201, "step": 308760 }, { "epoch": 1.99, "learning_rate": 1.0688215210053118e-06, "loss": 0.0205, "step": 308770 }, { "epoch": 1.99, "learning_rate": 1.0591401666483795e-06, "loss": 0.023, "step": 308780 }, { "epoch": 1.99, "learning_rate": 1.0494588122914475e-06, "loss": 0.0209, "step": 308790 }, { "epoch": 1.99, "learning_rate": 1.0397774579345152e-06, "loss": 0.0205, "step": 308800 }, { "epoch": 1.99, "learning_rate": 1.0300961035775831e-06, "loss": 0.0243, "step": 308810 }, { "epoch": 1.99, "learning_rate": 1.0204147492206509e-06, "loss": 0.017, "step": 308820 }, { "epoch": 1.99, "learning_rate": 1.0107333948637186e-06, "loss": 0.0207, "step": 308830 }, { "epoch": 1.99, "learning_rate": 1.0010520405067865e-06, "loss": 0.0254, "step": 308840 }, { "epoch": 1.99, "learning_rate": 9.913706861498544e-07, "loss": 0.0208, "step": 308850 }, { "epoch": 1.99, "learning_rate": 9.816893317929222e-07, "loss": 0.0217, "step": 308860 }, { "epoch": 1.99, "learning_rate": 9.7200797743599e-07, "loss": 0.0231, "step": 308870 }, { "epoch": 1.99, "learning_rate": 9.623266230790578e-07, "loss": 0.0256, "step": 308880 }, { "epoch": 1.99, "learning_rate": 9.526452687221257e-07, "loss": 0.0196, "step": 308890 }, { "epoch": 1.99, "learning_rate": 9.429639143651935e-07, "loss": 0.022, "step": 308900 }, { "epoch": 1.99, "learning_rate": 9.332825600082613e-07, "loss": 0.0212, "step": 308910 }, { "epoch": 1.99, "learning_rate": 9.236012056513292e-07, "loss": 0.0233, "step": 308920 }, { "epoch": 1.99, "learning_rate": 9.13919851294397e-07, "loss": 0.0182, "step": 308930 }, { "epoch": 1.99, "learning_rate": 9.042384969374649e-07, "loss": 0.0243, "step": 308940 }, { "epoch": 1.99, "learning_rate": 8.945571425805327e-07, "loss": 0.0216, "step": 308950 }, { "epoch": 1.99, "learning_rate": 8.848757882236004e-07, "loss": 0.0222, "step": 308960 }, { "epoch": 1.99, "learning_rate": 8.751944338666684e-07, "loss": 0.0233, "step": 308970 }, { "epoch": 1.99, "learning_rate": 8.655130795097361e-07, "loss": 0.0198, "step": 308980 }, { "epoch": 1.99, "learning_rate": 8.558317251528039e-07, "loss": 0.0205, "step": 308990 }, { "epoch": 1.99, "learning_rate": 8.461503707958718e-07, "loss": 0.0214, "step": 309000 }, { "epoch": 1.99, "eval_cer": 0.919811094791549, "eval_loss": 0.016410965472459793, "eval_runtime": 120.1413, "eval_samples_per_second": 16.647, "eval_steps_per_second": 4.162, "step": 309000 }, { "epoch": 1.99, "learning_rate": 8.364690164389396e-07, "loss": 0.022, "step": 309010 }, { "epoch": 1.99, "learning_rate": 8.267876620820075e-07, "loss": 0.0201, "step": 309020 }, { "epoch": 1.99, "learning_rate": 8.171063077250753e-07, "loss": 0.0271, "step": 309030 }, { "epoch": 1.99, "learning_rate": 8.07424953368143e-07, "loss": 0.0189, "step": 309040 }, { "epoch": 1.99, "learning_rate": 7.97743599011211e-07, "loss": 0.0204, "step": 309050 }, { "epoch": 1.99, "learning_rate": 7.880622446542788e-07, "loss": 0.0211, "step": 309060 }, { "epoch": 1.99, "learning_rate": 7.783808902973465e-07, "loss": 0.0202, "step": 309070 }, { "epoch": 1.99, "learning_rate": 7.686995359404145e-07, "loss": 0.0188, "step": 309080 }, { "epoch": 1.99, "learning_rate": 7.590181815834822e-07, "loss": 0.0189, "step": 309090 }, { "epoch": 1.99, "learning_rate": 7.493368272265501e-07, "loss": 0.0161, "step": 309100 }, { "epoch": 2.0, "learning_rate": 7.39655472869618e-07, "loss": 0.0226, "step": 309110 }, { "epoch": 2.0, "learning_rate": 7.299741185126857e-07, "loss": 0.0187, "step": 309120 }, { "epoch": 2.0, "learning_rate": 7.202927641557536e-07, "loss": 0.02, "step": 309130 }, { "epoch": 2.0, "learning_rate": 7.106114097988214e-07, "loss": 0.0207, "step": 309140 }, { "epoch": 2.0, "learning_rate": 7.009300554418892e-07, "loss": 0.0258, "step": 309150 }, { "epoch": 2.0, "learning_rate": 6.912487010849571e-07, "loss": 0.0249, "step": 309160 }, { "epoch": 2.0, "learning_rate": 6.815673467280248e-07, "loss": 0.0228, "step": 309170 }, { "epoch": 2.0, "learning_rate": 6.718859923710927e-07, "loss": 0.0217, "step": 309180 }, { "epoch": 2.0, "learning_rate": 6.622046380141606e-07, "loss": 0.0216, "step": 309190 }, { "epoch": 2.0, "learning_rate": 6.525232836572283e-07, "loss": 0.0192, "step": 309200 }, { "epoch": 2.0, "learning_rate": 6.428419293002962e-07, "loss": 0.0241, "step": 309210 }, { "epoch": 2.0, "learning_rate": 6.33160574943364e-07, "loss": 0.0195, "step": 309220 }, { "epoch": 2.0, "learning_rate": 6.234792205864318e-07, "loss": 0.0193, "step": 309230 }, { "epoch": 2.0, "learning_rate": 6.137978662294997e-07, "loss": 0.021, "step": 309240 }, { "epoch": 2.0, "learning_rate": 6.041165118725675e-07, "loss": 0.0211, "step": 309250 }, { "epoch": 2.0, "learning_rate": 5.944351575156354e-07, "loss": 0.0178, "step": 309260 }, { "epoch": 2.0, "learning_rate": 5.847538031587032e-07, "loss": 0.0253, "step": 309270 }, { "epoch": 2.0, "learning_rate": 5.75072448801771e-07, "loss": 0.0181, "step": 309280 }, { "epoch": 2.0, "learning_rate": 5.653910944448388e-07, "loss": 0.0175, "step": 309290 }, { "epoch": 2.0, "learning_rate": 5.557097400879067e-07, "loss": 0.0185, "step": 309300 }, { "epoch": 2.0, "learning_rate": 5.460283857309745e-07, "loss": 0.0199, "step": 309310 }, { "epoch": 2.0, "learning_rate": 5.363470313740423e-07, "loss": 0.02, "step": 309320 }, { "epoch": 2.0, "learning_rate": 5.266656770171102e-07, "loss": 0.0195, "step": 309330 }, { "epoch": 2.0, "learning_rate": 5.16984322660178e-07, "loss": 0.0241, "step": 309340 }, { "epoch": 2.0, "learning_rate": 5.073029683032458e-07, "loss": 0.0263, "step": 309350 }, { "epoch": 2.0, "learning_rate": 4.976216139463136e-07, "loss": 0.0194, "step": 309360 }, { "epoch": 2.0, "learning_rate": 4.879402595893815e-07, "loss": 0.018, "step": 309370 }, { "epoch": 2.0, "learning_rate": 4.782589052324493e-07, "loss": 0.0213, "step": 309380 }, { "epoch": 2.0, "learning_rate": 4.685775508755171e-07, "loss": 0.0267, "step": 309390 }, { "epoch": 2.0, "learning_rate": 4.5889619651858494e-07, "loss": 0.0219, "step": 309400 }, { "epoch": 2.0, "learning_rate": 4.492148421616527e-07, "loss": 0.0181, "step": 309410 }, { "epoch": 2.0, "learning_rate": 4.395334878047206e-07, "loss": 0.0169, "step": 309420 }, { "epoch": 2.0, "learning_rate": 4.298521334477884e-07, "loss": 0.02, "step": 309430 }, { "epoch": 2.0, "learning_rate": 4.2017077909085625e-07, "loss": 0.0221, "step": 309440 }, { "epoch": 2.0, "learning_rate": 4.10489424733924e-07, "loss": 0.0243, "step": 309450 }, { "epoch": 2.0, "learning_rate": 4.008080703769919e-07, "loss": 0.0244, "step": 309460 }, { "epoch": 2.0, "learning_rate": 3.9112671602005973e-07, "loss": 0.0197, "step": 309470 }, { "epoch": 2.0, "learning_rate": 3.8144536166312756e-07, "loss": 0.0207, "step": 309480 }, { "epoch": 2.0, "learning_rate": 3.717640073061954e-07, "loss": 0.0229, "step": 309490 }, { "epoch": 2.0, "learning_rate": 3.620826529492632e-07, "loss": 0.0178, "step": 309500 }, { "epoch": 2.0, "learning_rate": 3.5240129859233104e-07, "loss": 0.0212, "step": 309510 }, { "epoch": 2.0, "learning_rate": 3.427199442353989e-07, "loss": 0.026, "step": 309520 }, { "epoch": 2.0, "learning_rate": 3.330385898784667e-07, "loss": 0.0204, "step": 309530 }, { "epoch": 2.0, "learning_rate": 3.233572355215345e-07, "loss": 0.0204, "step": 309540 }, { "epoch": 2.0, "learning_rate": 3.1367588116460235e-07, "loss": 0.024, "step": 309550 }, { "epoch": 2.0, "learning_rate": 3.0399452680767023e-07, "loss": 0.0198, "step": 309560 }, { "epoch": 2.0, "learning_rate": 2.94313172450738e-07, "loss": 0.0202, "step": 309570 }, { "epoch": 2.0, "learning_rate": 2.8463181809380583e-07, "loss": 0.023, "step": 309580 }, { "epoch": 2.0, "learning_rate": 2.7495046373687366e-07, "loss": 0.0253, "step": 309590 }, { "epoch": 2.0, "learning_rate": 2.652691093799415e-07, "loss": 0.0201, "step": 309600 }, { "epoch": 2.0, "learning_rate": 2.555877550230093e-07, "loss": 0.0198, "step": 309610 }, { "epoch": 2.0, "learning_rate": 2.4590640066607714e-07, "loss": 0.0246, "step": 309620 }, { "epoch": 2.0, "learning_rate": 2.36225046309145e-07, "loss": 0.021, "step": 309630 }, { "epoch": 2.0, "learning_rate": 2.265436919522128e-07, "loss": 0.0251, "step": 309640 }, { "epoch": 2.0, "learning_rate": 2.1686233759528065e-07, "loss": 0.0274, "step": 309650 }, { "epoch": 2.0, "learning_rate": 2.0718098323834845e-07, "loss": 0.0197, "step": 309660 }, { "epoch": 2.0, "learning_rate": 1.974996288814163e-07, "loss": 0.0201, "step": 309670 }, { "epoch": 2.0, "learning_rate": 1.878182745244841e-07, "loss": 0.0232, "step": 309680 }, { "epoch": 2.0, "learning_rate": 1.7813692016755196e-07, "loss": 0.0234, "step": 309690 }, { "epoch": 2.0, "learning_rate": 1.684555658106198e-07, "loss": 0.0169, "step": 309700 }, { "epoch": 2.0, "learning_rate": 1.5877421145368762e-07, "loss": 0.024, "step": 309710 }, { "epoch": 2.0, "learning_rate": 1.4909285709675544e-07, "loss": 0.02, "step": 309720 }, { "epoch": 2.0, "learning_rate": 1.3941150273982327e-07, "loss": 0.0213, "step": 309730 }, { "epoch": 2.0, "learning_rate": 1.297301483828911e-07, "loss": 0.0179, "step": 309740 }, { "epoch": 2.0, "learning_rate": 1.2004879402595893e-07, "loss": 0.0265, "step": 309750 }, { "epoch": 2.0, "learning_rate": 1.1036743966902677e-07, "loss": 0.0202, "step": 309760 }, { "epoch": 2.0, "learning_rate": 1.0068608531209459e-07, "loss": 0.0183, "step": 309770 }, { "epoch": 2.0, "learning_rate": 9.100473095516242e-08, "loss": 0.0225, "step": 309780 }, { "epoch": 2.0, "learning_rate": 8.132337659823025e-08, "loss": 0.0196, "step": 309790 }, { "epoch": 2.0, "learning_rate": 7.164202224129808e-08, "loss": 0.0184, "step": 309800 }, { "epoch": 2.0, "learning_rate": 6.19606678843659e-08, "loss": 0.0256, "step": 309810 }, { "epoch": 2.0, "learning_rate": 5.227931352743372e-08, "loss": 0.0201, "step": 309820 }, { "epoch": 2.0, "learning_rate": 4.259795917050155e-08, "loss": 0.0249, "step": 309830 }, { "epoch": 2.0, "learning_rate": 3.2916604813569384e-08, "loss": 0.0227, "step": 309840 }, { "epoch": 2.0, "learning_rate": 2.3235250456637212e-08, "loss": 0.0218, "step": 309850 }, { "epoch": 2.0, "learning_rate": 1.355389609970504e-08, "loss": 0.0212, "step": 309860 }, { "epoch": 2.0, "learning_rate": 3.872541742772869e-09, "loss": 0.0204, "step": 309870 }, { "epoch": 2.0, "step": 309874, "total_flos": 1.6340823463826534e+18, "train_loss": 0.047053869794253175, "train_runtime": 343177.6492, "train_samples_per_second": 28.895, "train_steps_per_second": 0.903 } ], "max_steps": 309874, "num_train_epochs": 2, "total_flos": 1.6340823463826534e+18, "trial_name": null, "trial_params": null }